%PDF-1.3 1 0 obj << /Kids [ 3 0 R 4 0 R 5 0 R 6 0 R 7 0 R 8 0 R 9 0 R 10 0 R 11 0 R 12 0 R ] /Type /Pages /Count 10 >> endobj 2 0 obj << /Title (Semantic Video Segmentation by Gated Recurrent Flow Propagation) /Producer (PyPDF2) /Author (David Nilsson\054 Cristian Sminchisescu) /Subject (2018 IEEE Conference on Computer Vision and Pattern Recognition) >> endobj 3 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 14 0 R /Resources << /XObject << /x8 15 0 R /x6 18 0 R /x12 21 0 R /x10 24 0 R >> /ExtGState << /s9 27 0 R /s11 30 0 R /a0 << /CA 1 /ca 1 >> /R21 33 0 R /s5 34 0 R /s7 37 0 R >> /Font << /F2 40 0 R /R28 41 0 R /F1 45 0 R /R34 46 0 R /R22 50 0 R /R32 54 0 R /R24 57 0 R /R30 61 0 R /R26 65 0 R >> /ProcSet [ /ImageC /Text /PDF /ImageI /ImageB ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 68 0 R 69 0 R 70 0 R 71 0 R 72 0 R 73 0 R 74 0 R 75 0 R 76 0 R 77 0 R 78 0 R 79 0 R ] >> endobj 4 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 80 0 R /Resources << /XObject << /R83 81 0 R /R82 82 0 R /R81 83 0 R /R87 84 0 R /R86 85 0 R /R85 86 0 R /R84 87 0 R >> /ExtGState << /R21 33 0 R >> /Font << /F2 88 0 R /R79 89 0 R /R100 93 0 R /F1 97 0 R /R102 98 0 R /R76 101 0 R /R104 108 0 R /R98 112 0 R /R88 116 0 R /R96 120 0 R /R90 124 0 R /R92 127 0 R /R22 50 0 R /R94 131 0 R /R24 57 0 R /R30 61 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 134 0 R 135 0 R 136 0 R 137 0 R 138 0 R 139 0 R 140 0 R 141 0 R 142 0 R 143 0 R 144 0 R 145 0 R 146 0 R 147 0 R 148 0 R 149 0 R 150 0 R 151 0 R 152 0 R 153 0 R 154 0 R 155 0 R 156 0 R 157 0 R 158 0 R 159 0 R 160 0 R 161 0 R 162 0 R 163 0 R 164 0 R 165 0 R 166 0 R ] >> endobj 5 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 167 0 R /Resources << /XObject << /R130 168 0 R /R131 169 0 R /R132 170 0 R /R133 171 0 R /R129 172 0 R >> /ExtGState << /R21 33 0 R >> /Font << /R79 89 0 R /R76 101 0 R /R98 112 0 R /R126 173 0 R /R88 116 0 R /R134 180 0 R /R121 183 0 R /R90 124 0 R /R96 120 0 R /F2 187 0 R /R100 93 0 R /R102 98 0 R /R104 108 0 R /F1 188 0 R /R123 189 0 R /R34 46 0 R /R22 50 0 R /R24 57 0 R /R30 61 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 194 0 R 195 0 R 196 0 R 197 0 R 198 0 R 199 0 R 200 0 R 201 0 R 202 0 R 203 0 R ] >> endobj 6 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 204 0 R /Resources << /ExtGState << /R21 33 0 R >> /Font << /F2 205 0 R /R100 93 0 R /R102 98 0 R /R104 108 0 R /R98 112 0 R /F1 206 0 R /R123 189 0 R /R121 183 0 R /R22 50 0 R /R24 57 0 R /R96 120 0 R >> /ProcSet [ /ImageC /Text /PDF /ImageI /ImageB ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 207 0 R 208 0 R 209 0 R 210 0 R 211 0 R 212 0 R 213 0 R 214 0 R 215 0 R 216 0 R 217 0 R 218 0 R 219 0 R 220 0 R 221 0 R 222 0 R 223 0 R 224 0 R 225 0 R 226 0 R 227 0 R ] >> endobj 7 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 228 0 R /Resources << /XObject << /R175 229 0 R /R176 230 0 R /R177 231 0 R >> /ExtGState << /R21 33 0 R >> /Font << /F2 232 0 R /F1 233 0 R /R104 108 0 R /R98 112 0 R /R88 116 0 R /R123 189 0 R /R90 124 0 R /R134 180 0 R /R34 46 0 R /R24 57 0 R /R96 120 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 234 0 R 235 0 R 236 0 R 237 0 R 238 0 R 239 0 R 240 0 R ] >> endobj 8 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 241 0 R /Resources << /XObject << /R192 242 0 R /R190 243 0 R /R191 244 0 R >> /ExtGState << /R21 33 0 R >> /Font << /F2 245 0 R /F1 246 0 R /R104 108 0 R /R98 112 0 R /R88 116 0 R /R134 180 0 R /R90 124 0 R /R22 50 0 R /R24 57 0 R /R96 120 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 247 0 R 248 0 R 249 0 R 250 0 R 251 0 R 252 0 R ] >> endobj 9 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 253 0 R /Resources << /XObject << /R211 254 0 R /R213 255 0 R /R212 256 0 R /R214 257 0 R >> /ExtGState << /R21 33 0 R >> /Font << /F2 258 0 R /R100 93 0 R /R102 98 0 R /R104 108 0 R /R98 112 0 R /F1 259 0 R /R123 189 0 R /R22 50 0 R /R24 57 0 R /R96 120 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 260 0 R 261 0 R 262 0 R 263 0 R 264 0 R 265 0 R 266 0 R 267 0 R 268 0 R 269 0 R 270 0 R 271 0 R ] >> endobj 10 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 272 0 R /Resources << /ExtGState << /R21 33 0 R >> /Font << /R104 108 0 R /F2 273 0 R /F1 274 0 R /R123 189 0 R /R22 50 0 R /R24 57 0 R >> /ProcSet [ /ImageC /Text /PDF /ImageI /ImageB ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 275 0 R 276 0 R 277 0 R 278 0 R 279 0 R 280 0 R 281 0 R 282 0 R 283 0 R 284 0 R 285 0 R 286 0 R 287 0 R ] >> endobj 11 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 288 0 R /Resources << /ExtGState << /R21 33 0 R >> /Font << /F2 289 0 R /R34 46 0 R /R22 50 0 R /R24 57 0 R /F1 290 0 R >> /ProcSet [ /ImageC /Text /PDF /ImageI /ImageB ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 291 0 R 292 0 R 293 0 R 294 0 R 295 0 R 296 0 R 297 0 R 298 0 R 299 0 R 300 0 R 301 0 R 302 0 R 303 0 R 304 0 R 305 0 R 306 0 R 307 0 R 308 0 R 309 0 R 310 0 R 311 0 R 312 0 R 313 0 R 314 0 R 315 0 R 316 0 R 317 0 R 318 0 R 319 0 R 320 0 R 321 0 R 322 0 R 323 0 R 324 0 R 325 0 R 326 0 R 327 0 R 328 0 R 329 0 R 330 0 R 331 0 R 332 0 R 333 0 R 334 0 R 335 0 R 336 0 R 337 0 R 338 0 R 339 0 R 340 0 R 341 0 R 342 0 R 343 0 R 344 0 R 345 0 R 346 0 R 347 0 R ] >> endobj 12 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 348 0 R /Resources << /ExtGState << /R21 33 0 R >> /Font << /F2 349 0 R /R34 46 0 R /F1 350 0 R /R24 57 0 R >> /ProcSet [ /ImageC /Text /PDF /ImageI /ImageB ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 351 0 R 352 0 R 353 0 R 354 0 R 355 0 R 356 0 R 357 0 R 358 0 R 359 0 R 360 0 R 361 0 R 362 0 R ] >> endobj 13 0 obj << /Type /Catalog /Pages 1 0 R >> endobj 14 0 obj << /Length 17483 >> stream q q q 0.1 0 0 0.1 0 0 cm /R21 gs 0 g q 10 0 0 10 0 0 cm BT /R22 14.3462 Tf 1 0 0 1 86.818 675.067 Tm [ (Semantic) -250 (V) 37.0137 (ideo) -250.003 (Segmentation) -250.002 (by) -250.013 (Gated) -250.003 (Recurr) 18 (ent) -250.008 (Flo) 9.98604 (w) -250.002 (Pr) 18.0048 (opagation) ] TJ /R24 11.9552 Tf 103.595 -37.8582 Td [ (Da) 19.9894 (vid) -250.004 (Nilsson) ] TJ /R26 7.9701 Tf 68.5031 4.33906 Td [ (1) -0.30019 ] TJ /R24 11.9552 Tf 7.72109 -4.33906 Td [ (and) -249.987 (Cristian) -249.989 (Sminchisescu) ] TJ /R26 7.9701 Tf 126.855 4.33906 Td [ (1) -0.30019 ] TJ /R28 7.9701 Tf 4.23398 0 Td [ (\073) -0.10109 ] TJ /R26 7.9701 Tf 2.35195 0 Td [ (2) -0.30019 ] TJ -272.018 -13.948 Td [ (1) -0.29866 ] TJ /R24 11.9552 Tf 4.73281 -4.33789 Td [ (Department) -250 (of) -250.015 (Mathematics\054) -250.01 (F) 15.0158 (aculty) -250.01 (of) -250.014 (Engineering\054) -249.985 (Lund) -249.993 (Uni) 24.9957 (v) 14.9851 (ersity) ] TJ /R26 7.9701 Tf 38.2699 -9.61016 Td [ (2) -0.29866 ] TJ /R24 11.9552 Tf 4.73203 -4.33789 Td [ (Institute) -250.016 (of) -250.014 (Mathematics) -249.987 (of) -250.014 (the) -250 (Romanian) -250.008 (Academy) ] TJ /R30 8.9664 Tf -11.9059 -13.948 Td [ (f) -0.8999 ] TJ /R32 8.9664 Tf 4.60703 0 Td [ (david\056nilsson\054) -600.005 (cristian\056sminchisescu) ] TJ /R30 8.9664 Tf 193.674 0 Td [ (g) -0.90126 ] TJ /R32 8.9664 Tf 4.6082 0 Td (\100math\056lth\056se) Tj /R22 11.9552 Tf -220.783 -41.0461 Td (Abstract) Tj /R34 9.9626 Tf -83.9281 -23.9289 Td [ (Semantic) -367.014 (video) -366.989 (se) 39.9946 (gmentation) -368.011 (is) -366.984 (c) 15.0122 (hallenging) -366.99 (due) -366.993 (to) -368.005 (the) ] TJ -11.9547 -11.9551 Td [ (sheer) -386.986 (amount) -387.003 (of) -388.001 (dat) 0.99738 (a) -388.009 (that) -387.009 (needs) -386.987 (to) -386.982 (be) -386.994 (pr) 44.9851 (ocessed) -388.004 (and) -387.019 (la\055) ] TJ 11.9559 TL T* [ (beled) -394.984 (in) -394.981 (or) 36.9852 (der) -394.986 (to) -396 (construct) -395 (accur) 14.9852 (ate) -394.986 (models\056) -744.988 (In) -396.01 (this) -395.008 (pa\055) ] TJ 11.9551 TL T* [ (per) -364.991 (we) -364.989 (pr) 36.9852 (esent) -364.988 (a) -366.012 (deep\054) -392.99 (end\055to\055end) -366 (tr) 14.9914 (ainable) -365.008 (methodolo) 9.99588 (gy) ] TJ T* [ (for) -260.997 (video) -261.007 (se) 39.9952 (gmentation) -261.989 (that) -260.991 (is) -261.002 (capable) -260.997 (of) -261.003 (le) 14.9803 (ver) 15.0147 (a) 10.0032 (ging) -262.013 (t) 0.98758 (h) -1.01454 (e) -261.02 (in\055) ] TJ T* [ (formation) -386.003 (pr) 36.9852 (esent) -384.985 (in) -386.002 (unlabeled) -385.983 (data\054) -419.004 (besides) -385.994 (spar) 9.98118 (sely) -386.009 (la\055) ] TJ T* [ (beled) -291.982 (fr) 14.9914 (ames\054) -302.016 (in) -292.017 (or) 36.9852 (der) -291.983 (to) -292.017 (impr) 44.9937 (o) 10.0032 (ve) -292 (semantic) -292.005 (estimates\056) -436.011 (Our) ] TJ T* [ (model) -278.996 (combines) -280.01 (a) -279.007 (con) 40 (volutional) -279.983 (ar) 36.9852 (c) 15.0122 (hitectur) 37.0036 (e) -279.017 (and) -278.998 (a) -279.988 (spatio\055) ] TJ 11.9563 TL T* [ (tempor) 15 (al) -261.983 (tr) 14.9914 (ansformer) -261.995 (r) 37.0196 (ecurr) 36.9828 (ent) -261.988 (layer) -261.986 (that) -262.01 (is) -261.983 (a) -1.01454 (bl) 0.99248 (e) -263.02 (to) -261.983 (tempo\055) ] TJ 11.9547 TL T* [ (r) 14.984 (ally) -389.998 (pr) 44.9839 (opa) 10.0136 (gate) -388.982 (labeling) -390.016 (information) -389.99 (by) -388.994 (means) -389.999 (of) -390.001 (optical) ] TJ T* [ <036f77> 74.0109 (\054) -450 (adaptive) 1.00596 (ly) -410.008 (gated) -409.992 (based) -409.013 (on) -410 (its) -409.989 (locally) -409.008 (estimated) -410.017 (un\055) ] TJ T* [ (certainty) 54.9957 (\056) -618.012 (The) -352.985 <036f77> 74.0109 (\054) -378.993 (the) -352.993 (r) 38 (eco) 9.99466 (gnition) -352.997 (and) -352.985 (the) -352.993 (gated) -352.983 (tempo\055) ] TJ T* [ (r) 14.984 (al) -249.005 (pr) 44.9839 (opa) 10.0136 (gation) -248.983 (modules) -248.99 (can) -249.011 (be) -249.016 (tr) 14.9914 (ained) -249 (jointly) 55.0055 (\054) -249.995 (end\055to\055end\056) ] TJ 11.9559 TL T* [ (The) -249.982 (tempor) 15 (al\054) -249.003 (gated) -250.018 (r) 37.0196 (ecurr) 36.9828 (ent) -249.01 <036f77> -250.013 (pr) 44.9839 (opa) 10.013 (gation) -250.002 (component) ] TJ 11.9551 TL T* [ (of) -316.013 (our) -316.99 (model) -316.01 (can) -317 (be) -315.985 (plug) 9.98118 (g) 10.0032 (ed) -317.005 (into) -316.001 (any) -317 (static) -315.996 (semantic) -316.981 (se) 39.9958 (g\055) ] TJ T* [ (mentation) -259.995 (ar) 36.9852 (c) 15.0122 (hitectur) 37.0036 (e) -260 (and) -261 (turn) -260.012 (it) -259.981 (into) -260.011 (a) -261.01 (weakly) -259.984 (supervised) ] TJ T* [ (video) -320.997 (pr) 44.9839 (ocessing) -321.019 (one) 14.984 (\056) -523.989 (Our) -320.992 (e) 19.9918 (xperiments) -321.018 (in) -322.012 (the) -320.998 (c) 15.0122 (hallenging) ] TJ T* [ (CityScapes) -262 (and) -261 (Camvid) -262.005 (datasets\054) -263.995 (and) -261.981 (for) -262.018 (mul) 0.99493 (tiple) -262.013 (deep) -261.993 (ar) 20.0089 (\055) ] TJ T* [ (c) 15.0128 (hitectur) 37.003 (es\054) -350.016 (indicate) -329.015 (that) -329.999 (the) -330.016 (r) 37.0196 (esulting) -329.005 (model) -330.009 (can) -330.018 (le) 14.9803 (ver) 15.0147 (a) 10.0032 (g) 10.0032 (e) ] TJ 11.9559 TL T* [ (unlabeled) -297.998 (tempor) 15 (al) -296.997 (fr) 14.9914 (ames\054) -310.014 (ne) 19.9979 (xt) -297.007 (to) -298.016 (a) -297.004 (labeled) -298.009 (one) 10.0032 (\054) -309.005 (in) -298.016 (or) 36.9865 (der) ] TJ 11.9551 TL T* [ (to) -360.006 (impr) 44.9937 (o) 10.0032 (ve) -361.007 (both) -359.996 (the) -360.011 (video) -360.99 (se) 39.9946 (gmentation) -360.013 (accur) 14.9852 (acy) -359.982 (and) -360.984 (the) ] TJ T* [ (consistency) -254.992 (of) -255.984 (its) -254.995 (tempor) 15 (al) -255.004 (labeling) 9.99588 (\054) -257.013 (at) -255.004 (no) -255.006 (additional) -256.016 (anno\055) ] TJ T* [ (tation) -250 (cost) -249.983 (and) -249.983 (with) -250.004 (little) -250.005 (e) 19.9918 (xtr) 14.9865 (a) -249.993 (computation\056) ] TJ /R22 11.9552 Tf 35.9223 TL T* [ (1\056) -249.99 (Intr) 18.0146 (oduction) ] TJ /R24 9.9626 Tf 11.9547 -18.948 Td [ (Systems) -568.016 (capable) -567.984 (of) -567.002 (computing) -568.014 (accurate) -567.996 (and) -568.018 (tempo\055) ] TJ -11.9547 -11.9547 Td [ (rally) -382.003 (consistent) -382.994 (semantic) -381.99 (se) 15.0183 (gmentations) -382.002 (in) -382.983 (video) -381.998 (are) -383.007 (cen\055) ] TJ 11.9563 TL T* [ (tral) -299.982 (to) -300.016 (scene) -299.011 (understanding\054) -313 (being) -298.991 (useful) -300.014 (in) -300.016 (applications) -299.987 (in) ] TJ 11.9551 TL T* [ (robotics\054) -284 (for) -277.014 (instance) -278.015 (grasping\054) -284.003 (or) -277.011 (for) -277.014 (autonomous) -277.981 (v) 14.9828 (ehicles) ] TJ T* [ (where) -375.981 (one) -374.991 (naturally) -375.991 (w) 10 (orks) -376.003 (with) -375.994 (videos) -375.011 (rather) -376.018 (than) -376.003 (single) ] TJ T* [ (images\054) -312.002 (and) -299.984 (high) -300.006 (le) 25.0179 (v) 14.9828 (els) -299 (of) -299.988 (precision) -300.005 (are) -300.001 (needed\056) -459.017 (Since) -300.011 (the) ] TJ T* [ (emer) 17.997 (gence) -343.985 (of) -343 (deep) -343.981 (learning) -342.984 (methods) -343.985 (for) -343.004 (image) -344.006 <636c617373690263612d> ] TJ T* [ (tion\054) -365.01 (the) -342.013 (problem) -341.994 (of) -342.02 (semantic) -341.997 (image) -342.986 (se) 15.0196 (gmentation) -342.016 (has) -342.014 (re\055) ] TJ 11.9559 TL T* [ (cei) 25.0142 (v) 14.9828 (ed) -257.996 (increasing) -256.996 (attention\054) -259.997 (with) -256.994 (some) -258.017 (of) -257.994 (the) -257.009 (most) -258.006 (success\055) ] TJ 11.9551 TL T* [ (ful) -229.992 (methods) -230.004 (based) -229.993 (on) -229.991 (fully) -231 (trainable) -229.986 (con) 39.9982 (v) 20.0016 (olutional) -229.996 (architec\055) ] TJ T* [ (tures) -380.985 (\050CNN\051\056) -382 (Data) -380.994 (for) -382.016 (training) -381.005 (and) -382.009 <7265026e696e67> -381.005 (single) -381.988 (frame\054) ] TJ T* [ (static) -260.996 (models) -260.985 (is) -261.982 (no) 24.986 (w) -261.013 (quite) -260.996 (di) 24.9885 (v) 14.9828 (erse) -260.982 (\133) ] TJ ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 190.704 81 Tm (7) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 195.686 81 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 200.786 81 Tm (29) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 210.749 81 Tm [ (\135\056) -343.002 (In) -261.993 (contrast\054) -264.012 (fully) ] TJ 98.1133 473.32 Td [ (trainable) -364.983 (approaches) -364.993 (to) -364.005 (semantic) -365.013 (video) -365.018 (se) 15.0171 (gmentation) -364.993 (f) 9.99343 (ace) ] TJ 11.9551 TL T* [ (the) -308.02 (dif) 24.986 <0263756c7479> -307.012 (of) -307.985 (obtaining) -307.983 (detailed) -306.988 (annotations) -307.983 (for) -307.988 (indi) 25 (vid\055) ] TJ 11.9559 TL T* [ (ual) -402.984 (video) -403.994 (frames\054) -441.02 (although) -404.016 (datas) 0.99003 (ets) -404.001 (are) -403.001 (emer) 17.997 (ging) -403.006 (for) -404.011 (the) ] TJ 11.9551 TL T* [ (\050unsupervised\051) -414.017 (video) -413.012 (se) 15.0196 (gmentation) -414.004 (problem) -413.005 (\133) ] TJ ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 496.189 518.454 Tm (11) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 506.152 518.454 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 512.767 518.454 Tm (36) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 522.729 518.454 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 529.345 518.454 Tm (27) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 539.307 518.454 Tm (\135\056) Tj -230.445 -11.9551 Td [ (Therefore) -518.002 (some) -516.992 (of) -517.99 (the) -517.004 (e) 15.0122 (xisting) -517.987 (approaches) -517.007 (to) -518.021 (semantic) ] TJ 11.9551 TL T* [ (video) -290.993 (se) 15.0196 (gmentation) -291.005 (\133) ] TJ ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 393.096 494.544 Tm (42) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 403.058 494.544 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 408.458 494.544 Tm (43) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 418.42 494.544 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 423.81 494.544 Tm (25) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 433.773 494.544 Tm [ (\135) -291.015 (rely) -291.005 (on) -291 (single) -292.005 (fram) 0.98023 (e) -291.995 (mod\055) ] TJ -124.911 -11.9551 Td [ (els) -392.003 (with) -391.011 (corresponding) -392.018 (v) 24.9811 (ariables) -392.003 (connected) -390.984 (in) -392.003 (time) -391.988 (using) ] TJ 11.9547 TL T* [ (random) -260.015 <02656c6473> -258.986 (with) -260.013 (higher) 20.0114 (\055order) -258.981 (potentials\054) -261.991 (and) -259.991 (mostly) -259.991 (pre\055) ] TJ 11.9563 TL T* [ <7370656369026564> -357.014 (parameters\056) -628.983 (Fully) -357 (trainable) -356.985 (approaches) -356.014 (to) -356.989 (video) ] TJ 11.9547 TL T* [ (are) -331.016 (rare\056) -553.018 (The) -330.999 (computational) -330.989 (comple) 14.9975 (xity) -331.999 (of) -331.004 (video) -330.984 (process\055) ] TJ T* [ (ing) -250.02 (further) -249.995 (complicated) -250.005 (matters\056) ] TJ 11.9547 -11.9711 Td [ (One) -259.013 (possible) -257.999 (approach) -259.011 (to) -257.986 (designing) -259.016 (semantic) -258.011 (video) -258.996 (se) 15.0171 (g\055) ] TJ -11.9547 -11.9551 Td [ (mentation) -577.002 (models) -577.009 (in) -576.99 (the) -576.992 (long) -577.016 (run) -576.997 (can) -577.007 (be) -577.982 (to) -576.992 (only) -577.016 (la\055) ] TJ T* [ (bel) -449.996 (frames\054) -501.01 (sparsely) 64.9867 (\054) -499.993 (in) -451.011 (video\054) -500.015 (as) -450.003 (it) -451.008 (w) 10.0032 (as) -450.003 (done) -449.994 (for) -450.984 (static) ] TJ (datasets\133) ' ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 343.721 386.932 Tm (7) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 348.702 386.932 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 353.484 386.932 Tm (29) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 363.447 386.932 Tm [ (\135\056) -303.988 (Then) -231.01 (one) -229.996 (should) -230.986 (be) -230 (able) -231.015 (to) -229.991 (le) 25.0203 (v) 14.9828 (erage) -230.991 (tempo\055) ] TJ -54.5848 -11.9563 Td [ (ral) -261.995 (dependencies) -262.998 (in) -261.983 (order) -263.015 (to) -261.986 (propag) 4.99426 (ate) -263.015 (and) -261.991 (aggre) 15.0171 (g) 4.98446 (ate) -263.015 (infor) 20.0065 (\055) ] TJ 11.9547 TL T* [ (mation) -208.012 (in) -207.992 (order) -208.005 (to) -207.012 (decrease) -208.019 (uncertainty) -208.019 (during) ] TJ /R34 9.9626 Tf 183.819 0 Td (both) Tj /R24 9.9626 Tf 19.784 0 Td (learning) Tj -203.603 -11.9551 Td [ (and) -198.982 (inference\056) -293.015 (This) -199.004 (w) 10 (ould) -197.982 (require) -198.986 (a) -198.991 (model) -199.001 (that) -199.011 (can) -198.991 (inte) 14.9926 (grate) ] TJ T* [ (spatio\055temporal) -249.99 (dependencies) -249.983 (across) -249.993 (video) -250.017 (frames\056) ] TJ 11.9547 -11.9711 Td [ (While) -257.981 (approaches) -257.011 (based) -257.986 (on) -257.006 (CNNs) -258.011 (appear) -258.001 (right\054) -258.991 (the) 14.9877 (y) -257.991 (are) ] TJ -11.9547 -11.9551 Td [ (non\055tri) 24.9983 (vial) -201.011 (to) -201.013 (adapt) -201.998 (to) -201.013 (video) -201.006 (se) 15.0171 (gmentation) -201.02 (due) -201.02 (to) -201.996 (the) -201.015 (amount) ] TJ T* [ (of) -283.989 (data) -283.989 (that) -284.016 (needs) -285.004 (to) -284.019 (be) -283.992 (processed) -283.982 (for) -283.992 (dense) -283.982 (predictions\056) -412.99 (If) ] TJ 11.9563 TL T* [ (video) -235.983 (processing) -234.993 (and) -235.995 (temporal) -236.015 (matching) -236.005 (were) -234.99 (to) -235.99 (be) -236 (learned) ] TJ 11.9547 TL T* [ (without) -311.987 (e) 15.0122 (xplicit) -311.012 (components) -311.982 (such) -312.017 (as) -311.007 (optical) -312.002 <036f> 24.9958 (w) -311.982 (w) 10.0032 (arping\054) ] TJ T* [ (one) -350.015 (possibility) -351.01 (w) 10 (oul) 0.99738 (d) -350.995 (be) -350.02 (to) -350.01 (design) -351.015 (a) -349.986 (model) -349.996 (based) -350.01 (on) -350.99 (3D\055) ] TJ T* [ (con) 39.9982 (v) 20.0016 (olutions\054) -277.003 (as) -271.991 (used) -271.001 (e\056g\056) -374.991 (for) -271.994 (action) -270.999 (recognition\133) ] TJ ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 505.155 255.409 Tm (20) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 515.118 255.409 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 520.318 255.409 Tm (3) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R24 9.9626 Tf 1 0 0 1 525.299 255.409 Tm [ (\135\056) -374.996 (T) 79.9916 (o) ] TJ -216.437 -11.9551 Td [ (our) -311 (kno) 24.9909 (wledge) -310.995 (no) -312.017 (such) -310.995 (approach) -311.002 (has) -311.002 (been) -311.007 (pursued) -312.007 (for) -311.007 (se\055) ] TJ 11.9551 TL T* [ (mantic) -207.002 (video) -207.987 (se) 15.0196 (gmentation\056) -295.98 (Instead\054) -215.988 (we) -206.985 (will) -208.019 (tak) 10.0081 (e) -206.99 (an) -208.005 (e) 15.0122 (xplicit) ] TJ 11.9559 TL T* [ (modeling) -289.008 (approach) -287.986 (relying) -288.991 (on) -289 (e) 15.0122 (xis) 1 (ting) -288.986 (single\055frame) -288.991 (CNNs) ] TJ 11.9551 TL T* [ (augmented) -379.008 (with) -379.013 (spatial) -377.991 (transformer) -378.981 (structures) -379.015 (that) -378.981 (imple\055) ] TJ T* [ (ment) -256.996 (w) 10 (arping) -257.001 (along) -258.018 (optical) -256.991 <036f> 24.9958 (w) -257.011 <02656c64732e> -331.994 (These) -257.011 (will) -256.991 (be) -257.996 (com\055) ] TJ T* [ (bined) -270.016 (with) -270.992 (adapti) 24.9909 (v) 14.9828 (e) -270 (recurrent) -270 (units) -270.004 (in) -271.004 (order) -269.994 (to) -269.984 (learn) -269.994 (to) -271.004 (fuse) ] TJ T* [ (the) -235.992 (estimates) -234.988 (from) -235.99 (single) -234.993 (\050unlabeled\051) -235.985 (frames) -235.995 (with) -234.995 (the) -235.99 (label\055) ] TJ T* [ (ing) -366 (information) -366.012 (temporally) -364.998 (propag) 4.99426 (ated) -366.012 (from) -366.008 (nearby) -366.012 (ones\054) ] TJ 11.9559 TL T* [ (properly) -399.014 (g) 4.98446 (ated) -398.99 (based) -398.985 (on) -398.002 (their) -398.982 (uncertainty) 64.9941 (\056) -757.006 (The) -398.987 (proposed) ] TJ 11.9551 TL T* [ (model) -250.012 (is) -249.985 (dif) 24.986 (ferentiable) -249.99 (and) -249.993 (end\055to\055end) -249.983 (trainable\056) ] TJ /R22 11.9552 Tf 23.957 TL T* [ (2\056) -249.989 (Related) -250.002 (W) 74.9972 (ork) ] TJ /R24 9.9626 Tf 11.9547 -18.9449 Td [ (Our) -221.017 (semantic) -220.017 (video) -221.005 (se) 15.0196 (gmentation) -219.998 (w) 10.0032 (ork) -221.017 (relates) -221.017 (to) -219.993 (the) -221.012 (dif\055) ] TJ -11.9547 -11.9551 Td [ (ferent) -392.996 <02656c6473> -391.984 (of) -392.991 (semantic) -393.008 (image) -391.998 (se) 15.0171 (gmentation\054) -427.997 (as) -392.993 (well) -393.018 (as\054) ] TJ -13.741 -29.8879 Td (1) Tj ET Q Q Q q q 1 1 1 rg /a0 gs 48.406 786.422 515.188 -52.699 re f q /s5 gs /x6 Do Q q /s7 gs /x8 Do Q q /s9 gs /x10 Do Q q /s11 gs /x12 Do Q Q Q Q q 1 0 0 1 0 0 cm BT /F1 12 Tf 14.4 TL ET 1 1 1 rg n 270 47 72 14 re f* 0.5 0.5 0.5 rg BT /F2 9 Tf 10.8 TL ET BT 1 0 0 1 297 50 Tm (6819) Tj T* ET Q endstream endobj 15 0 obj << /Filter /FlateDecode /Resources << /ExtGState << /a0 << /CA 1 /ca 1 >> >> /XObject << /x18 16 0 R >> >> /Length 28 /Group << /Type /Group /S /Transparency /CS /DeviceRGB /I true >> /BBox [ 78 746 96 765 ] /Type /XObject /Subtype /Form >> stream x+O4PH/VЯ0Pp 0 endstream endobj 16 0 obj << /Filter /FlateDecode /Resources 17 0 R /Length 107 /Type /XObject /BBox [ 78 746 96 765 ] /Subtype /Form >> stream xe AC̬wʠ =p,?]%+H-
Jc "82w8VSnGW;"
endstream
endobj
17 0 obj
<<
/ExtGState <<
/a0 <<
/CA 1
/ca 1
>>
>>
>>
endobj
18 0 obj
<<
/Filter /FlateDecode
/Resources <<
/ExtGState <<
/a0 <<
/CA 1
/ca 1
>>
>>
/XObject <<
/x15 19 0 R
>>
>>
/Length 28
/Group <<
/Type /Group
/S /Transparency
/CS /DeviceRGB
/I true
>>
/BBox [ 67 752 84 775 ]
/Type /XObject
/Subtype /Form
>>
stream
x+O4PH/VЯ04Up
0
endstream
endobj
19 0 obj
<<
/Filter /FlateDecode
/Resources 20 0 R
/Length 228
/Type /XObject
/BBox [ 67 752 84 775 ]
/Subtype /Form
>>
stream
xeQKn!s ?FPav6R٪TS.
b];15YyR
{7QL.\:Rv/x9l+L7h%1!}i/AI(kz"U&,YO![R hg{3}4/GyYF:!w}Gn+'xJcO9i뽼_-:`
endstream
endobj
20 0 obj
<<
/ExtGState <<
/a0 <<
/CA 1
/ca 1
>>
>>
>>
endobj
21 0 obj
<<
/Filter /FlateDecode
/Resources <<
/ExtGState <<
/a0 <<
/CA 1
/ca 1
>>
>>
/XObject <<
/x24 22 0 R
>>
>>
/Length 28
/Group <<
/Type /Group
/S /Transparency
/CS /DeviceRGB
/I true
>>
/BBox [ 132 751 480 772 ]
/Type /XObject
/Subtype /Form
>>
stream
x+O4PH/VЯ02Qp
0
endstream
endobj
22 0 obj
<<
/Filter /FlateDecode
/Resources 23 0 R
/Length 53223
/Type /XObject
/BBox [ 132 751 480 772 ]
/Subtype /Form
>>
stream
xtI:6%Q㨈?7rA= u%6 ?Y(WbWo{B>9
x`Znϳ|8{3?0x*z ǃ|,@:w>`c|*ϻⳅKO3`g
:_|}}><.6`Z{{3]#<_o"~:ͺgk7/Ұ@|K yp ]03ʷCmş8˽Y?>(3!Bwqs.Z8,~~=rMT̩y+/*w: uBZ_`ߵp`%M?ɝ1ɳw=vDۉy&xb4Q>d@ sg~lA