%PDF-1.3 1 0 obj << /Kids [ 3 0 R 4 0 R 5 0 R 6 0 R 7 0 R 8 0 R 9 0 R 10 0 R 11 0 R ] /Type /Pages /Count 9 >> endobj 2 0 obj << /Title (Flexible Spatio\055Temporal Networks for Video Prediction) /Producer (PyPDF2) /Author (Chaochao Lu\054 Michael Hirsch\054 Bernhard Scholkopf) /Subject (2017 IEEE Conference on Computer Vision and Pattern Recognition) >> endobj 3 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 13 0 R /Resources << /XObject << /x8 14 0 R /x6 17 0 R /x12 20 0 R /x10 23 0 R >> /ExtGState << /s9 26 0 R /R29 29 0 R /s11 30 0 R /a0 << /CA 1 /ca 1 >> /s5 33 0 R /s7 36 0 R >> /Font << /F2 39 0 R /F1 40 0 R /R38 41 0 R /R36 45 0 R /R34 49 0 R /R32 52 0 R /R42 56 0 R /R30 59 0 R /R40 63 0 R >> /ProcSet [ /ImageC /Text /PDF /ImageI /ImageB ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 66 0 R 67 0 R 68 0 R 69 0 R 70 0 R 71 0 R 72 0 R 73 0 R 74 0 R 75 0 R 76 0 R 77 0 R 78 0 R 79 0 R 80 0 R 81 0 R 82 0 R 83 0 R 84 0 R 85 0 R 86 0 R ] >> endobj 4 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 87 0 R /Resources << /ExtGState << /R29 29 0 R >> /Font << /F2 88 0 R /F1 89 0 R /R79 90 0 R /R32 52 0 R /R30 59 0 R >> /ProcSet [ /ImageC /Text /PDF /ImageI /ImageB ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 95 0 R 96 0 R 97 0 R 98 0 R 99 0 R 100 0 R 101 0 R 102 0 R 103 0 R 104 0 R 105 0 R 106 0 R 107 0 R 108 0 R 109 0 R 110 0 R 111 0 R 112 0 R 113 0 R 114 0 R 115 0 R 116 0 R 117 0 R 118 0 R 119 0 R 120 0 R 121 0 R 122 0 R 123 0 R ] >> endobj 5 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 124 0 R /Resources << /XObject << /R121 125 0 R /R120 127 0 R /R109 128 0 R /R108 129 0 R /R141 130 0 R /R140 132 0 R /R142 133 0 R /R101 135 0 R /R100 136 0 R /R103 137 0 R /R102 138 0 R /R105 139 0 R /R104 140 0 R /R107 141 0 R /R106 142 0 R /R98 143 0 R /R99 144 0 R /R135 131 0 R /R136 145 0 R /R137 146 0 R /R138 134 0 R /R139 147 0 R /R97 126 0 R /R118 148 0 R /R119 149 0 R /R112 150 0 R /R113 151 0 R /R110 152 0 R /R111 153 0 R /R116 154 0 R /R117 155 0 R /R114 156 0 R /R115 157 0 R >> /ExtGState << /R29 29 0 R /R94 158 0 R /R93 159 0 R /R134 160 0 R /R95 161 0 R >> /Font << /F2 162 0 R /R79 90 0 R /R143 163 0 R /F1 167 0 R /R42 56 0 R /R130 168 0 R /R126 171 0 R /R132 174 0 R /R124 178 0 R /R122 182 0 R /R32 52 0 R /R30 59 0 R /R128 187 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 190 0 R 191 0 R 192 0 R 193 0 R 194 0 R 195 0 R 196 0 R 197 0 R ] >> endobj 6 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 198 0 R /Resources << /XObject << /R181 199 0 R /R180 201 0 R /R168 202 0 R /R178 203 0 R /R179 204 0 R /R167 205 0 R /R166 200 0 R /R174 206 0 R /R175 207 0 R /R176 208 0 R /R177 209 0 R /R170 210 0 R /R171 211 0 R /R172 212 0 R /R173 213 0 R /R169 214 0 R >> /ExtGState << /R29 29 0 R /R93 159 0 R >> /Font << /F2 215 0 R /R79 90 0 R /R143 163 0 R /F1 216 0 R /R130 168 0 R /R126 171 0 R /R124 178 0 R /R122 182 0 R /R32 52 0 R /R30 59 0 R /R128 187 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 217 0 R 218 0 R 219 0 R 220 0 R 221 0 R 222 0 R 223 0 R 224 0 R 225 0 R 226 0 R 227 0 R 228 0 R 229 0 R 230 0 R ] >> endobj 7 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 231 0 R /Resources << /ExtGState << /R29 29 0 R >> /Font << /R210 232 0 R /R79 90 0 R /R206 235 0 R /R204 238 0 R /R143 163 0 R /R208 241 0 R /R42 56 0 R /F1 245 0 R /R130 168 0 R /R132 174 0 R /R212 246 0 R /R122 182 0 R /R124 178 0 R /F2 249 0 R /R32 52 0 R /R30 59 0 R >> /ProcSet [ /ImageC /Text /PDF /ImageI /ImageB ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 250 0 R 251 0 R 252 0 R 253 0 R 254 0 R 255 0 R 256 0 R 257 0 R 258 0 R 259 0 R 260 0 R 261 0 R 262 0 R 263 0 R 264 0 R ] >> endobj 8 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 265 0 R /Resources << /XObject << /R264 266 0 R /R265 267 0 R /R266 268 0 R /R267 269 0 R /R260 270 0 R /R261 271 0 R /R262 272 0 R /R263 273 0 R /R268 274 0 R /R269 275 0 R /R255 276 0 R /R249 277 0 R /R257 278 0 R /R288 279 0 R /R289 280 0 R /R282 281 0 R /R283 282 0 R /R280 283 0 R /R281 284 0 R /R286 285 0 R /R287 286 0 R /R284 287 0 R /R285 288 0 R /R253 289 0 R /R252 290 0 R /R279 291 0 R /R278 292 0 R /R259 293 0 R /R258 294 0 R /R273 295 0 R /R272 296 0 R /R271 297 0 R /R256 298 0 R /R251 299 0 R /R276 300 0 R /R275 301 0 R /R274 302 0 R /R291 303 0 R /R290 304 0 R /R250 305 0 R /R292 306 0 R /R295 307 0 R /R294 308 0 R /R297 309 0 R /R296 310 0 R /R277 311 0 R /R254 312 0 R /R270 313 0 R /R293 314 0 R >> /ExtGState << /R29 29 0 R /R298 315 0 R /R93 159 0 R >> /Font << /R79 90 0 R /F1 316 0 R /R40 63 0 R /F2 317 0 R /R124 178 0 R /R247 318 0 R /R245 321 0 R /R32 52 0 R /R30 59 0 R /R128 187 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 324 0 R 325 0 R 326 0 R 327 0 R 328 0 R 329 0 R 330 0 R 331 0 R 332 0 R 333 0 R 334 0 R 335 0 R 336 0 R 337 0 R 338 0 R 339 0 R 340 0 R 341 0 R 342 0 R 343 0 R 344 0 R 345 0 R 346 0 R 347 0 R 348 0 R 349 0 R ] >> endobj 9 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 350 0 R /Resources << /XObject << /R361 351 0 R /R360 352 0 R /R363 353 0 R /R362 354 0 R /R365 355 0 R /R364 356 0 R /R367 357 0 R /R366 358 0 R /R347 359 0 R /R346 360 0 R /R345 361 0 R /R344 362 0 R /R343 363 0 R /R342 364 0 R /R341 365 0 R /R340 366 0 R /R329 367 0 R /R328 368 0 R /R325 369 0 R /R324 370 0 R /R327 371 0 R /R326 372 0 R /R321 373 0 R /R320 374 0 R /R323 375 0 R /R322 376 0 R /R349 377 0 R /R348 378 0 R /R358 379 0 R /R359 380 0 R /R350 381 0 R /R351 382 0 R /R352 383 0 R /R353 384 0 R /R354 385 0 R /R319 386 0 R /R356 387 0 R /R355 388 0 R /R338 389 0 R /R339 390 0 R /R336 391 0 R /R337 392 0 R /R334 393 0 R /R335 394 0 R /R332 395 0 R /R333 396 0 R /R330 397 0 R /R331 398 0 R /R318 399 0 R /R357 400 0 R >> /ExtGState << /R29 29 0 R /R93 159 0 R >> /Font << /F2 401 0 R /F1 402 0 R /R122 182 0 R /R124 178 0 R /R32 52 0 R /R30 59 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 403 0 R 404 0 R 405 0 R 406 0 R 407 0 R 408 0 R 409 0 R 410 0 R 411 0 R 412 0 R 413 0 R 414 0 R 415 0 R 416 0 R ] >> endobj 10 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 417 0 R /Resources << /XObject << /R388 418 0 R /R400 419 0 R /R398 420 0 R /R399 421 0 R /R383 422 0 R /R382 423 0 R /R387 424 0 R /R386 425 0 R /R385 426 0 R /R384 427 0 R /R394 428 0 R /R395 429 0 R /R396 430 0 R /R397 431 0 R /R390 432 0 R /R391 433 0 R /R392 434 0 R /R393 435 0 R /R389 436 0 R >> /ExtGState << /R29 29 0 R >> /Font << /F2 437 0 R /F1 438 0 R /R32 52 0 R /R30 59 0 R /R40 63 0 R >> /ProcSet [ /Text /ImageC /ImageB /PDF /ImageI ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 439 0 R 440 0 R 441 0 R 442 0 R 443 0 R 444 0 R 445 0 R 446 0 R 447 0 R ] >> endobj 11 0 obj << /Parent 1 0 R /Rotate 0 /Type /Page /Contents 448 0 R /Resources << /ExtGState << /R29 29 0 R >> /Font << /F2 449 0 R /F1 450 0 R /R32 52 0 R /R42 56 0 R /R30 59 0 R >> /ProcSet [ /ImageC /Text /PDF /ImageI /ImageB ] >> /MediaBox [ 0 0 612 792 ] /Annots [ 451 0 R 452 0 R 453 0 R 454 0 R 455 0 R 456 0 R 457 0 R 458 0 R 459 0 R 460 0 R 461 0 R 462 0 R 463 0 R 464 0 R 465 0 R 466 0 R 467 0 R 468 0 R 469 0 R 470 0 R 471 0 R 472 0 R 473 0 R 474 0 R 475 0 R 476 0 R 477 0 R 478 0 R 479 0 R 480 0 R 481 0 R 482 0 R 483 0 R 484 0 R 485 0 R 486 0 R 487 0 R 488 0 R 489 0 R 490 0 R 491 0 R 492 0 R 493 0 R 494 0 R 495 0 R 496 0 R 497 0 R 498 0 R 499 0 R 500 0 R 501 0 R 502 0 R 503 0 R ] >> endobj 12 0 obj << /Type /Catalog /Pages 1 0 R >> endobj 13 0 obj << /Length 20717 >> stream q q q 0.10000 0 0 0.10000 0 0 cm /R29 gs 0 g q 10 0 0 10 0 0 cm BT /R30 14.34620 Tf 1 0 0 1 124.98600 675.06700 Tm [ (Flexible) -250.00200 (Spatio\055T) 92.00330 (emporal) -249.98800 (Netw) 9.99455 (orks) -250.01300 (f) 24.99230 (or) -249.99500 (V) 37.01370 (ideo) -250.00300 (Pr) 18.00480 (ediction) ] TJ /R32 11.95520 Tf 13.54300 -37.85820 Td [ (Chaochao) -250 (Lu) ] TJ /R34 7.97010 Tf 67.06800 4.33906 Td [ (1) -0.30019 ] TJ /R36 7.97010 Tf 4.23398 0 Td [ (\073) -0.10109 ] TJ /R34 7.97010 Tf 2.35234 0 Td [ (2) -0.30019 ] TJ /R32 11.95520 Tf 31.63160 -4.33906 Td [ (Michael) -250.00200 (Hirsch) ] TJ /R34 7.97010 Tf 77.02620 4.33906 Td [ (2) -0.30019 ] TJ /R32 11.95520 Tf 31.63200 -4.33906 Td [ (Bernhard) -250.01000 (Sch) ] TJ 66.40390 0.06016 Td (\250) Tj -0.99805 -0.06016 Td [ (olk) 9.98601 (opf) ] TJ /R34 7.97010 Tf 34.08400 4.33906 Td [ (2) -0.30019 ] TJ -340.81800 -13.94800 Td [ (1) -0.29866 ] TJ /R32 11.95520 Tf 7.72109 -4.33789 Td [ (Uni) 24.99460 (v) 14.98620 (ersity) -249.98900 (of) -250.01500 (Cambridge) ] TJ /R34 7.97010 Tf 145.96000 4.33789 Td [ (2) -0.30019 ] TJ /R32 11.95520 Tf 7.72070 -4.33789 Td [ (Max) -250.00400 (Planck) -250 (Institute) -250.01600 (for) -249.99500 (Intelligent) -250.00600 (Systems) ] TJ /R38 8.96640 Tf -52.16990 -13.94800 Td [ (f) -0.90126 ] TJ /R40 8.96640 Tf 4.60703 0 Td [ (clu\054) -600.00200 (mhirsch\054) -600.02100 (bs) ] TJ /R38 8.96640 Tf 86.07810 0 Td [ (g) -0.90126 ] TJ /R40 8.96640 Tf 4.60703 0 Td (\100tue\056mpg\056de) Tj /R30 11.95520 Tf -169.67400 -41.04610 Td (Abstract) Tj /R42 9.96260 Tf -83.92770 -24.25780 Td [ (W) 91.98650 (e) -309.01200 (describe) -308.01100 (a) -309.00200 (modular) -307.99100 (fr) 14.99140 (ame) 14.98160 (work) -308.98800 (for) -308.99000 (video) -308.02000 (fr) 14.99010 (ame) -309.00500 (pr) 36.98650 (e\055) ] TJ -11.95510 -11.95630 Td [ (diction\056) -557.99000 (W) 91.98650 (e) -333.00800 (r) 37.01960 (efer) -332.99800 (to) -332.99100 (it) -332.98900 (as) -332.01200 (a) -332.99800 (Fle) 20.00400 (xible) -332.99200 (Spatio\055T) 91.99200 (empor) 14.99260 (al) -332.99100 (Net\055) ] TJ 11.95510 TL T* [ (work) -346.98100 (\050FSTN\051) -347.00900 (as) -346.99000 (it) -346.98600 (allows) -346.99600 (the) -346.99400 (e) 19.99180 (xtr) 14.98650 (apolation) -346.98900 (of) -348.00800 (a) -346.99600 (video) -346.99400 (se\055) ] TJ T* [ (quence) -438.98400 (as) -439.01400 (well) -439.98200 (as) -439.01400 (the) -439.01700 (estimation) -439.01600 (of) -439.01300 (synthetic) -440.02000 (fr) 14.99010 (ames) -439.01500 (ly\055) ] TJ T* [ (ing) -421.01100 (in) -421.01600 (between) -421.01100 (observ) 0.99371 (ed) -420.98700 (fr) 14.99140 (ames) -421.01800 (and) -421.01300 (thus) -421.00600 (the) -420.98100 (g) 10.00320 (ener) 15.01960 (ation) ] TJ T* [ (of) -423.01500 (slow\055motion) -423.98700 (videos\056) -830.00100 (By) -422.98800 (de) 15.01830 (vising) -423.00200 (a) -422.98300 (customized) -424.01000 (objec\055) ] TJ 11.95590 TL T* [ (tive) -217.99700 (function) -218.00500 (comprising) -217.99700 (decoding) 9.98240 (\054) -225.01900 (encoding) 9.98363 (\054) -225.01900 (and) -217.98800 (adver) 10.00570 (sar) 20.01380 (\055) ] TJ 11.95510 TL T* [ (ial) -314.00600 (losses\054) -329.99500 (we) -314.99800 (ar) 36.98520 (e) -313.99200 (able) -314.01400 (to) -314.01400 (mitigate) -313.98900 (the) -314.01900 (common) -314.98900 (pr) 44.98510 (oblem) -314.01100 (of) ] TJ T* [ (blurry) -365.01200 (pr) 36.98520 (edictions\054) -394.01500 (mana) 10.01670 (ging) -365.99500 (to) -364.98600 (r) 37.01960 (etain) -365.01800 (high) -365.01500 (fr) 36.98650 (equency) -365.98100 (in\055) ] TJ T* [ (formation) -279.00100 (e) 15.01280 (ven) -279.01600 (for) -278.99400 (r) 37.01960 (elatively) -278.99600 (distant) -279.00900 (futur) 37.00360 (e) -279.01700 (pr) 36.98650 (edictions\056) -398.01400 (W) 91.98710 (e) ] TJ T* [ (pr) 44.98390 (opose) -205.98800 (and) -205.00900 (analyse) -205.98500 (dif) 18.01660 (fer) 36.98280 (ent) -205.01700 (tr) 14.99140 (aining) -206.01000 (str) 14.99750 (ate) 40 (gies) -205.01000 (to) -205.99300 (optimize) ] TJ T* [ (our) -358.00300 (model\056) -633.01300 (Extensive) -358.00600 (e) 19.99180 (xperiments) -357.01200 (on) -358.00900 (se) 15.01960 (ver) 15.01470 (al) -358.00600 (c) 15.01220 (hallenging) ] TJ 11.95590 TL T* [ (public) -312.00100 (datasets) -311.99000 (demonstr) 15.01100 (ate) -312.01900 (both) -312.00400 (the) -312.01900 (ver) 9.99588 (satility) -311.98500 (and) -312.01200 (valid\055) ] TJ 11.95510 TL T* [ (ity) -249.98800 (of) -249.98500 (our) -249.98200 (model\056) ] TJ /R30 11.95520 Tf 36.90900 TL T* [ (1\056) -249.99000 (Intr) 18.01460 (oduction) ] TJ /R32 9.96260 Tf 11.95510 -19.27700 Td [ (V) 59.99310 (ideos) -383.99500 (contain) -383.99400 (rich) -384.00900 (spatial) -383.99000 (and) -384.98800 (temporal) -383.99000 (structure) -384 (and) ] TJ -11.95510 -11.95510 Td [ (capture) -299.98800 (non\055tri) 25 (vial) -300.01400 (dependencies) -300.01100 (between) -299.98200 (objects) -300.98700 (and) -299.98400 (con\055) ] TJ 11.95510 TL T* [ (te) 14.98100 (xtual) -476.01800 (information) -475.01500 (along) -475.98100 (with) -476.01600 (scene) -474.98200 (characteristics) -475.98700 (lik) 10.01790 (e) ] TJ T* [ (depth\054) -516.99200 (occlusion\054) -515.99700 (and) -463.99500 (illuminati) 1.00228 (on\056) -949.98600 (Accurate) -464.00600 (modelling) ] TJ T* [ (of) -412.98800 (videos) -413.00500 (ultimately) -413.01900 (requires) -412.98100 (high\055le) 24.99830 (v) 14.98280 (el) -414.00700 (understanding) -412.98500 (of) ] TJ 11.95630 TL T* [ (3D) -269.98600 (spatio\055temporal) -269.98600 (information\054) -275.00700 (which) -270.99900 (resembles) -270.01400 (humans\047) ] TJ 11.95510 TL T* [ (ability) -242.00400 (to) -241.98700 (understand) -242.01100 (their) -241.98700 (surrounding) -241.99600 (ph) 4.98936 (ysi) 0.99738 (cal) -242.00100 (w) 10 (orld\056) -308.01000 (One) ] TJ T* [ (fundamental) -214.01300 (problem) -214.99600 (in) -213.99100 (video) -215.00500 (modelling) -213.99400 (is) -215.01100 (to) -213.99100 (predict) -215.01100 (future) ] TJ T* [ (frames) -253.99400 (in) 40.00560 (v) 20.00160 (olving) -254.00200 (the) -253.98900 (construction) -253.99600 (of) -255.01500 (an) -253.99700 (internal) -254.01600 (representa\055) ] TJ T* [ (tion) -365.01300 (that) -364.98300 (models\054) -393 (to) -364.98600 (some) -365.01900 (de) 15.01830 (gree\054) -394.01800 (both) -365.01500 (video) -365.02000 (content) -365.01800 (and) ] TJ T* [ (dynamics\056) -718.00300 (Ev) 14.98650 (en) -386.01300 (for) -386.01500 (short\055term) -385.98600 (future) -386.00700 (frames\054) -420.00300 (video) -385.99700 (pre\055) ] TJ 11.95590 TL T* [ (diction) -272.98100 (has) -273.98700 (remained) -273 (a) -273.01800 (challenging) -274 (problem) -272.98600 (until) -272.98100 (no) 24.98600 (w) 65.01120 (\054) -279.99000 (o) 24.98110 (w\055) ] TJ 11.95510 TL T* [ (ing) -251 (to) -251.00500 (the) -251.00900 (comple) 14.99870 (xity) -250.01200 (and) -251.01100 (ambiguity) -251.00700 (inherent) -251 (in) -251.00500 (video) -251 (data\056) ] TJ T* [ (V) 59.99310 (ideo) -271.98100 (prediction) -272.00400 (is) -271.98000 (thus) -272.01000 (still) -271.99900 (in) -271.98200 (its) -272.01200 (inf) 10.00690 (anc) 15.01470 (y) 65.01370 (\054) -277.99000 (in) -271.98200 (particular) -271.98200 (the) ] TJ T* [ (long\055term) -250.00600 (prediction) -250.00700 (of) -249.99600 (video) -250.01800 (sequences\056) ] TJ 11.95510 -12.30270 Td [ (There) -299.99200 (are) -300 (a) -299.01400 (number) -300.00900 (of) -299.98800 (recent) -299.99300 (w) 10 (orks) -298.99700 (that) -300.01400 (predict) -300.01600 (unseen) ] TJ -11.95510 -11.95510 Td [ (future) -297.00300 (video) -296.99100 (frames) -297.00600 (\133) ] TJ ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 135.34200 140.77600 Tm (20) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 145.30500 140.77600 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 150.76400 140.77600 Tm (19) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 160.72700 140.77600 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 166.17600 140.77600 Tm (25) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 176.13900 140.77600 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 181.58800 140.77600 Tm (16) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 191.55100 140.77600 Tm [ (\135\056) -450.98500 (Predicting) -297.99000 (future) -297.00200 (im\055) ] TJ -141.43900 -11.95590 Td [ (ages) -202.00300 (from) -201.99500 (a) -202.01000 (video) -201.00700 (sequence) -202.00200 (requires) -201.99700 (the) -201.99800 (learning) -201.98800 (of) -202.00300 (an) -202.00600 (inter) 20.00890 (\055) ] TJ 11.95510 TL T* [ (nal) -199.01800 (representation) -199.98300 (that) -199.01100 (captures) -199.01800 (spatio\055temporal) -199.99800 (correlations) ] TJ T* [ (and) -289.98500 (models) -291.01800 (the) -289.98300 (image) -290.99400 (e) 25.01050 (v) 20.00160 (olution) -289.98800 (accurately) 65.00880 (\056) -432.00400 (This) -290.00800 (might) -291.01300 (in\055) ] TJ T* [ (clude) -326.99600 (information) -327 (about) -326.00600 (ho) 24.98600 (w) -327.00200 (objects) -326.98200 (mo) 14.99500 (v) 14.98280 (e\054) -345.98400 (deform) -326.99200 (or) -327.00200 (be\055) ] TJ T* [ (ha) 19.99730 (v) 14.98280 (e\054) -388.99600 (about) -362 (occlusion) -361.98600 (and) -360.99200 (object) -362.00200 (boundaries\054) -389.00400 (scene) -361.98100 (depth) ] TJ 258.75000 487.26700 Td [ (and) -410.98500 (so) -411.01700 (on\056) -794.01200 (V) 59.99240 (ideo) -411.01700 (prediction) -411 (is) -411.01500 (a) -410.99500 (promising) -412 (research) -411.00500 (di\055) ] TJ T* [ (rection) -257.98400 (that) -257.98100 (will) -258.01100 (spa) 14.98520 (wn) -257.98900 (a) -258.00100 (wealth) -257.98100 (of) -257.99600 (stimulating) -258.01100 (applications) ] TJ (\133) ' ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 312.18000 544.35700 Tm (1) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 317.16100 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 322.14200 544.35700 Tm (14) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 332.10500 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 337.08600 544.35700 Tm (17) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 347.04800 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 352.03000 544.35700 Tm (13) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 361.99200 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 366.97300 544.35700 Tm (30) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 376.93600 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 381.91700 544.35700 Tm (29) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 391.88000 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 396.86100 544.35700 Tm (27) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 406.82300 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 411.80500 544.35700 Tm (5) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 416.78600 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 421.76700 544.35700 Tm (7) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 426.74800 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 431.73000 544.35700 Tm (28) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 441.69200 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 446.67300 544.35700 Tm (10) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 456.63600 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 461.61700 544.35700 Tm (23) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 471.58000 544.35700 Tm (\054) Tj ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 476.56100 544.35700 Tm (18) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 486.52300 544.35700 Tm (\135\056) Tj -165.70600 -14.21990 Td [ (K) 25.01790 (e) 15.01220 (y) -418.98400 (to) -419.99600 (the) -418.98200 (success) -419.01800 (of) -418.98900 (pre) 25.01050 (vious) -420.01800 (methods) -418.99400 (is) -419.01300 (the) -418.97900 (use) -420.00300 (of) ] TJ -11.95510 -11.95510 Td [ (Long) -336.98300 (Short\055T) 70.01770 (erm) -338.01700 (Memory) -337.01700 (\050LSTM\051) -337.01700 (autoencoder) -338.01200 (netw) 10.00810 (orks) ] TJ 11.95590 TL T* [ (which) -397.01700 (are) -395.98500 (able) -396.99000 (to) -396 (capture) -396.99300 (spatio\055temporal) -396.00300 (long\055range) -397.01700 (de\055) ] TJ 11.95510 TL T* [ (pendencies\056) -298.00900 (Although) -214.98100 (these) -215.01300 (w) 10.00320 (orks) -213.98900 (ha) 19.99670 (v) 14.98280 (e) -214.98900 (sho) 24.99090 (wn) -215.01300 (encouraging) ] TJ T* [ (results) -272.00900 (for) -271.99600 (short\055time) -271.99400 (prediction\054) -277.99800 (a) -271.99900 (common) -271.99900 (shortcoming) -271.98400 (is) ] TJ T* [ (the) -344.99400 (increasing) -344.98200 (amount) -345.99100 (of) -345.00100 (blur) -344.98700 (for) -345.00100 (predictions) -345.00600 (more) -344.99100 (than) -346.00600 (a) ] TJ T* [ (single) -250.01000 (frame) -250 (ahead\056) ] TJ 11.95510 -14.22110 Td [ (In) -422.98600 (the) -424 (present) -423.01500 (w) 10 (ork) -422.98100 (we) -424.00800 (propose) -423.00800 (a) -422.99300 (ne) 25.01540 (w) -424.00300 (computational) ] TJ -11.95510 -11.95510 Td [ (model) -385.00900 (for) -384.99700 (video) -385.01700 (prediction) -383.98500 (that) -385.01900 (does) -384.98500 (not) -385.01400 (suf) 24.98600 (fer) -385.00400 (from) -384.98500 (this) ] TJ T* [ (nuisance\056) -488.01900 (It) -309.00200 (also) -308.99300 (allo) 24.99090 (ws) -308.99700 (for) -309.98700 (the) -308.99700 (prediction) -309.01700 (of) -309.00700 (an) -309.98700 (e) 1.01454 (n) -1.01454 (t) 0.98513 (ire) -309.98700 (im\055) ] TJ T* [ (age) -378.01800 (sequence) -376.99100 (rather) -378.01800 (than) -376.98100 (just) -377.99100 (a) -377 (single) -377.99100 (frame) -377 (ahead\056) -692.98200 (Fur) 20.01140 (\055) ] TJ T* [ (thermore\054) -413.99200 (it) -380 (is) -380.98300 (not) -381.01700 (only) -381.01200 (able) -380.99000 (to) -380.00500 (e) 15.01220 (xtrapolate) -381.01500 (in) -380.98500 (time) -381.01000 (b) 20.00160 (ut) -380.98500 (is) ] TJ 11.95590 TL T* [ (equally) -443.98500 (suited) -442.99700 (for) -444.00700 (temporal) -443 (interpolation) -443.99500 (between) -444 (subse\055) ] TJ 11.95510 TL T* [ (quent) -370 (frames\056) -668.98200 (Our) -370.01200 (netw) 10.00810 (ork) -370.01200 (can) -369.00200 (be) -370.01700 (trained) -370.00200 (end\055to\055end) -370.00200 (on) ] TJ T* [ (full) -296.01200 (frame) -295.01200 (images\056) -446.99900 (Once) -295.01000 (trained\054) -306.99300 (it) -296.01400 (is) -294.99500 (able) -295.98500 (to) -295 (mak) 10.01300 (e) -295.99500 (predic\055) ] TJ T* [ (tions) -250.00700 (in) -249.98500 (almost) -250.00200 (real\055time\056) ] TJ 11.95510 -14.22070 Td [ (In) -241.99600 (particular) 40.00560 (\054) -243.01600 (we) -242.00100 (describe) -241.99400 (tw) 10.00810 (o) -241.99400 (ne) 25.01540 (w) -241.01400 (netw) 10.00810 (ork) -241.99400 (modules\054) -243.99900 (for) ] TJ -11.95510 -11.95510 Td [ (e) 15.01220 (xtrapolation) -412.00700 (and) -412.98500 (interpolation\054) -453.00800 (each) -412.01900 (of) -412.99000 (which) -411.99500 (predicts) -413.01000 (a) ] TJ T* [ (single) -284.98400 (video) -286.01400 (frame\056) -416.00900 (These) -285.00600 (modules) -285.99600 (can) -285.01600 (be) -285.01100 (concatenated) -285.98200 (to) ] TJ T* [ (enable) -247.01300 (the) -245.99100 (prediction) -246.98800 (of) -247.01500 (an) -245.99800 (entire) -247.00800 (video) -246.01800 (sequence) -247.01300 (with) -246.99300 (arbi\055) ] TJ T* [ (trary) -198.00400 (man) 14.99010 (y) -196.98200 (frames\056) -293.00500 (Since) -197.00900 (each) -198.01600 (module) -198.01600 (is) -197.01100 (fully) -197.98700 (dif) 24.98600 (ferentiable) ] TJ T* [ (the) 14.98520 (y) -217.99800 (allo) 24.99090 (w) -218 (for) -218.98600 (end\055to\055end) -217.98600 (training) -218.01300 (e) 25.01050 (v) 14.98280 (en) -218.00300 (when) -217.99300 (combined\056) -299.99400 (In\055) ] TJ 11.95630 TL T* [ (spired) -423.99300 (by) -425.01700 (recent) -424.01300 (w) 10 (ork) -424 (of) -424.98800 (P) ] TJ 114.55100 0.05000 Td <0b> Tj -0.55273 -0.05000 Td (atr) Tj 11.06290 0.05000 Td <0b> Tj -0.55312 -0.05000 Td [ (aucean) -424.01300 (et) -424.98300 (al\056) -424.00300 (\133) ] TJ ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 493.90300 262.59200 Tm (19) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 503.86500 262.59200 Tm [ (\135\054) -468 (each) -424.01700 (of) ] TJ -195.00300 -11.95470 Td [ (the) -203.01800 (modules) -202.98800 (comprises) -202.99600 (a) -202.99100 (spatio\055temporal) -203.01500 (video) -203.00500 (autoencoder) ] TJ 11.95510 TL T* [ (consisting) -233.01000 (of) -233.01700 (a) -232.98600 (con) 39.99820 (v) 20.00160 (olutional) -233.01500 (image) -233.00500 (encoder) 19.99670 (\055decoder) -234.00500 (with) -232.99500 (a) ] TJ T* [ (nested) -304.99300 (memory) -304.98100 (module) -305.01800 (composed) -305.01800 (of) -305.98800 (con) 39.99820 (v) 20.00160 (olutional) -305.00300 (LSTM) ] TJ T* [ (\050Con) 40.01290 (vLSTM\051) -387 (cells\056) -721.00200 (The) -386.98900 (Con) 40.01780 (vLSTM) -386.99400 (features) -388.01400 (a) -387 <6d6f6469026564> ] TJ 11.95590 TL T* [ (Spatial) -434.99400 (T) 35.01870 (ransformer) -433.99900 (Netw) 10.00810 (ork) -435.02100 (\050STN\051) -435.01100 (layer) -434.00600 (\133) ] TJ ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 491.07800 202.81600 Tm (9) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 496.05900 202.81600 Tm [ (\135) -434.99100 (to) -435.01600 (capture) ] TJ -187.19700 -11.95510 Td [ (temporal) -363.01300 (changes) -364.01000 (and) -362.99300 (motion) -364.01800 (across) -362.99300 (time) -363.99300 (by) -362.98800 (optical) -363.99300 <036f> 24.99580 (w) ] TJ 11.95510 TL T* [ (estimation) -249.98800 (and) -249.99300 (prediction\056) ] TJ 11.95470 -14.21990 Td [ (Our) -394.00800 (approach) -394.00800 (also) -393.01800 (inte) 14.99260 (grates) -394.00800 (a) -394.01800 (recently) -394.00300 (proposed) -393.98800 (type) ] TJ -11.95470 -11.95510 Td [ (of) -356.01700 (loss) -357.01400 (functions) -355.98700 (named) -356.98500 (deep) -356.01900 (perceptual) -356.00900 (similarity) -356.98500 (metric) ] TJ 11.95590 TL T* [ (\050DeePSiM\051) -434.01100 (\133) ] TJ ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 361.88300 140.77500 Tm (4) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 366.86400 140.77500 Tm [ (\135) -434.98900 (that) -433.99100 (has) -435.01800 (been) -434.00600 (sho) 24.99090 (wn) -433.99600 (to) -435.01600 (better) -433.99600 <726503656374> -434.98100 (the) ] TJ -58.00230 -11.95510 Td [ (perceptual) -328.99400 (similarity) -330.01100 (of) -329.00100 (images\056) -548.00200 (It) -329 (measures) -328.98900 (distances) -329.99900 (be\055) ] TJ 11.95510 TL T* [ (tween) -197.01900 (image) -197.99100 (features) -196.98900 (e) 15.01220 (xtracted) -197.99600 (by) -197.01600 (deep) -198.00600 (neural) -196.98200 (netw) 10.00810 (orks) -197.99100 (and) ] TJ T* [ (emplo) 9.98363 (ys) -346.98900 (the) -348.01300 (adv) 14.98280 (ersarial) -347 (netw) 10.00810 (ork) -346.99600 (of) -348.02000 (Goodfello) 25.00560 (w) -346.99600 (et) -346.99600 (al\056) -348.01500 (\133) ] TJ ET Q 0 1 0 rg q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 534.32600 104.91000 Tm (6) Tj ET Q 0 g q 10 0 0 10 0 0 cm BT /R32 9.96260 Tf 1 0 0 1 539.30700 104.91000 Tm (\135\056) Tj -230.44500 -11.95470 Td [ (In) -275.99100 (our) -277.00500 (conte) 14.98520 (xt\054) -282.99700 (the) -275.98600 (e) 15.01220 (xtrapolation) -275.98800 (and) -275.98800 (interpolation) -277.00300 (modules) ] TJ 11.95630 TL T* [ (tak) 10.00570 (e) -262 (the) -261.98800 (role) -263.01000 (of) -261.99300 (the) -261.98800 (generati) 24.98600 (v) 14.98280 (e) -262 (netw) 10.00810 (ork\054) -265.00500 (while) -262.99500 (a) -262 (discrimina\055) ] TJ -13.74100 -29.88670 Td (1) Tj ET Q Q Q q q 1 1 1 rg /a0 gs 48.40600 786.42200 515.18800 -52.69900 re f q /s5 gs /x6 Do Q q /s7 gs /x8 Do Q q /s9 gs /x10 Do Q q /s11 gs /x12 Do Q Q Q Q q 1 0 0 1 0 0 cm BT /F1 12 Tf 14.40000 TL ET 1 1 1 rg n 270 47 72 14 re f* 0.50000 0.50000 0.50000 rg BT /F2 9 Tf 10.80000 TL ET BT 1 0 0 1 297 50 Tm (6523) Tj T* ET Q endstream endobj 14 0 obj << /Filter /FlateDecode /Resources << /ExtGState << /a0 << /CA 1 /ca 1 >> >> /XObject << /x18 15 0 R >> >> /Length 28 /Group << /Type /Group /S /Transparency /CS /DeviceRGB /I true >> /BBox [ 78 746 96 765 ] /Type /XObject /Subtype /Form >> stream x+O4PH/VЯ0Pp 0 endstream endobj 15 0 obj << /Filter /FlateDecode /Resources 16 0 R /Length 107 /Type /XObject /BBox [ 78 746 96 765 ] /Subtype /Form >> stream xe AC̬wʠ =p,?]%+H-
Jc "82w8VSnGW;"
endstream
endobj
16 0 obj
<<
/ExtGState <<
/a0 <<
/CA 1
/ca 1
>>
>>
>>
endobj
17 0 obj
<<
/Filter /FlateDecode
/Resources <<
/ExtGState <<
/a0 <<
/CA 1
/ca 1
>>
>>
/XObject <<
/x15 18 0 R
>>
>>
/Length 28
/Group <<
/Type /Group
/S /Transparency
/CS /DeviceRGB
/I true
>>
/BBox [ 67 752 84 775 ]
/Type /XObject
/Subtype /Form
>>
stream
x+O4PH/VЯ04Up
0
endstream
endobj
18 0 obj
<<
/Filter /FlateDecode
/Resources 19 0 R
/Length 228
/Type /XObject
/BBox [ 67 752 84 775 ]
/Subtype /Form
>>
stream
xeQKn!s ?FPav6R٪TS.
b];15YyR
{7QL.\:Rv/x9l+L7h%1!}i/AI(kz"U&,YO![R hg{3}4/GyYF:!w}Gn+'xJcO9i뽼_-:`
endstream
endobj
19 0 obj
<<
/ExtGState <<
/a0 <<
/CA 1
/ca 1
>>
>>
>>
endobj
20 0 obj
<<
/Filter /FlateDecode
/Resources <<
/ExtGState <<
/a0 <<
/CA 1
/ca 1
>>
>>
/XObject <<
/x24 21 0 R
>>
>>
/Length 28
/Group <<
/Type /Group
/S /Transparency
/CS /DeviceRGB
/I true
>>
/BBox [ 132 751 480 772 ]
/Type /XObject
/Subtype /Form
>>
stream
x+O4PH/VЯ02Qp
0
endstream
endobj
21 0 obj
<<
/Filter /FlateDecode
/Resources 22 0 R
/Length 53223
/Type /XObject
/BBox [ 132 751 480 772 ]
/Subtype /Form
>>
stream
xtI:6%Q㨈?7rA= u%6 ?Y(WbWo{B>9
x`Znϳ|8{3?0x*z ǃ|,@:w>`c|*ϻⳅKO3`g
:_|}}><.6`Z{{3]#<_o"~:ͺgk7/Ұ@|K yp ]03ʷCmş8˽Y?>(3!Bwqs.Z8,~~=rMT̩y+/*w: uBZ_`ߵp`%M?ɝ1ɳw=vDۉy&xb4Q>d@ sg~lA