Curvature-Driven Deformable Convolutional Networks for End-To-End Object Detection

<table class="table-group" id="tab1"><tr><td><table class="table"><tr><td class="thead-hr" colspan="8"><hr/></td></tr><tr class="thead"><td class="align_left" rowspan="2">Method</td><td class="align_center" rowspan="2">Shorter side (600)</td><td class="align_center" colspan="3">Faster R-CNN</td><td class="align_center" colspan="3">YOLOv4</td></tr><tr class="thead"><td class="align_center"><span style="width: 35.9806ptpx;"><svg height="12.308pt" id="M102" style="vertical-align:-0.04979992pt" version="1.1" viewbox="-0.0498162 -12.2582 35.9806 12.308" width="35.9806pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M686 28C612 35 607 44 591 112C563 234 541 360 519 489L489 666L457 658L147 121C100 40 89 36 24 28L17 0H240L250 28C168 34 159 41 190 101L262 237H482C495 180 503 137 510 91C517 47 514 35 441 28L433 0H677L686 28ZM475 280H285L429 541H431L475 280Z"></path></g><g transform="matrix(.013,0,0,-0.013,9.135,0)"><path d="M600 480C600 590 528 650 384 650H143L137 622C222 614 225 607 210 531L130 127C113 41 106 36 23 28L17 0H294L300 28C204 36 195 42 212 127L243 284L314 263C327 263 339 263 352 264C465 271 600 337 600 480ZM508 481C508 351 402 304 329 304C289 304 265 311 250 317L295 559C302 594 310 606 323 611C335 616 350 619 367 619C455 619 508 573 508 481Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,17.161,-5.741)"><path d="M460 334C460 396 434 451 378 451C330 451 241 408 148 300H146L237 679C241 697 241 710 232 710C213 710 153 684 67 675L66 646H95C141 646 145 642 134 595L39 170C23 97 31 54 46 33C64 8 100 -12 137 -12C178 -12 234 3 298 43C391 101 460 222 460 334ZM371 320C371 204 316 89 248 51C230 41 208 37 192 37C143 37 102 72 119 166C124 194 129 215 135 235C202 323 298 392 335 392C353 392 371 372 371 320Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,21.514,-5.741)"><path d="M460 334C460 396 434 451 378 451C330 451 241 408 148 300H146L237 679C241 697 241 710 232 710C213 710 153 684 
67 675L66 646H95C141 646 145 642 134 595L39 170C23 97 31 54 46 33C64 8 100 -12 137 -12C178 -12 234 3 298 43C391 101 460 222 460 334ZM371 320C371 204 316 89 248 51C230 41 208 37 192 37C143 37 102 72 119 166C124 194 129 215 135 235C202 323 298 392 335 392C353 392 371 372 371 320Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,25.866,-5.741)"><path d="M452 282C452 397 389 451 302 451C268 451 227 441 188 422C95 377 24 281 24 154C24 65 70 -12 173 -12C240 -12 297 16 342 52C418 113 452 201 452 282ZM359 282C359 163 308 66 247 39C237 35 225 32 212 32C151 32 114 79 114 157C114 301 180 380 223 398C240 405 250 408 265 408C315 408 359 369 359 282Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,30.079,-5.741)"><path d="M545 403C545 425 527 451 498 451C448 451 400 404 312 286L290 341C262 412 246 451 219 451C182 451 138 404 92 345L112 323C152 368 169 378 181 378C192 378 201 359 216 321L257 214C184 115 142 69 113 69C102 69 93 73 88 79S78 89 68 89C47 89 24 61 24 40C24 8 49 -12 75 -12C125 -12 175 31 271 175L312 64C330 15 357 -12 382 -12C421 -12 475 35 515 98L496 121C466 88 439 62 420 62C402 62 384 92 363 147L325 247C349 280 374 309 397 333C422 361 446 381 462 381C471 381 481 374 488 366C493 360 499 357 505 357C521 357 545 380 545 403Z"></path></g></svg></span></td><td class="align_center"><span style="width: 25.3486ptpx;"><svg height="11.927pt" id="M103" style="vertical-align:-3.291101pt" version="1.1" viewbox="-0.0498162 -8.6359 25.3486 11.927" width="25.3486pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M686 28C612 35 607 44 591 112C563 234 541 360 519 489L489 666L457 658L147 121C100 40 89 36 24 28L17 0H240L250 28C168 34 159 41 190 101L262 237H482C495 180 503 137 510 91C517 47 514 35 441 28L433 0H677L686 28ZM475 280H285L429 541H431L475 280Z"></path></g><g transform="matrix(.013,0,0,-0.013,9.135,0)"><path d="M600 480C600 590 528 650 384 650H143L137 622C222 614 225 607 210 531L130 127C113 
41 106 36 23 28L17 0H294L300 28C204 36 195 42 212 127L243 284L314 263C327 263 339 263 352 264C465 271 600 337 600 480ZM508 481C508 351 402 304 329 304C289 304 265 311 250 317L295 559C302 594 310 606 323 611C335 616 350 619 367 619C455 619 508 573 508 481Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,15.791,3.132)"><path d="M158 548H390L417 615L410 623H122L83 318C105 326 143 337 185 337C296 337 350 275 350 188C350 116 308 42 225 42C164 42 122 74 100 93C90 101 82 99 72 92C60 82 51 68 50 59C48 46 52 38 66 24C82 9 125 -12 172 -12C225 -11 292 15 346 59C408 108 437 166 437 226C437 309 371 397 242 397C214 397 170 382 133 369L158 548Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,20.223,3.132)"><path d="M245 635C92 635 37 457 37 312C37 149 91 -12 244 -12C395 -12 449 166 449 312C449 469 395 635 245 635ZM243 598C332 598 358 454 358 312C358 173 334 26 245 26C158 26 128 174 128 313S152 598 243 598Z"></path></g></svg></span></td><td class="align_center"><span style="width: 25.3486ptpx;"><svg height="11.927pt" id="M104" style="vertical-align:-3.291101pt" version="1.1" viewbox="-0.0498162 -8.6359 25.3486 11.927" width="25.3486pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M686 28C612 35 607 44 591 112C563 234 541 360 519 489L489 666L457 658L147 121C100 40 89 36 24 28L17 0H240L250 28C168 34 159 41 190 101L262 237H482C495 180 503 137 510 91C517 47 514 35 441 28L433 0H677L686 28ZM475 280H285L429 541H431L475 280Z"></path></g><g transform="matrix(.013,0,0,-0.013,9.135,0)"><path d="M600 480C600 590 528 650 384 650H143L137 622C222 614 225 607 210 531L130 127C113 41 106 36 23 28L17 0H294L300 28C204 36 195 42 212 127L243 284L314 263C327 263 339 263 352 264C465 271 600 337 600 480ZM508 481C508 351 402 304 329 304C289 304 265 311 250 317L295 559C302 594 310 606 323 611C335 616 350 619 367 619C455 619 508 573 508 481Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,15.791,3.132)"><path 
d="M453 623H65C60 580 56 530 46 472H80C103 538 110 548 175 548H389C310 380 195 168 90 0L98 -12L175 -2C273 206 366 408 462 610L453 623Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,20.224,3.132)"><path d="M158 548H390L417 615L410 623H122L83 318C105 326 143 337 185 337C296 337 350 275 350 188C350 116 308 42 225 42C164 42 122 74 100 93C90 101 82 99 72 92C60 82 51 68 50 59C48 46 52 38 66 24C82 9 125 -12 172 -12C225 -11 292 15 346 59C408 108 437 166 437 226C437 309 371 397 242 397C214 397 170 382 133 369L158 548Z"></path></g></svg></span></td><td class="align_center"><span style="width: 35.9806ptpx;"><svg height="12.308pt" id="M105" style="vertical-align:-0.04979992pt" version="1.1" viewbox="-0.0498162 -12.2582 35.9806 12.308" width="35.9806pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M686 28C612 35 607 44 591 112C563 234 541 360 519 489L489 666L457 658L147 121C100 40 89 36 24 28L17 0H240L250 28C168 34 159 41 190 101L262 237H482C495 180 503 137 510 91C517 47 514 35 441 28L433 0H677L686 28ZM475 280H285L429 541H431L475 280Z"></path></g><g transform="matrix(.013,0,0,-0.013,9.135,0)"><path d="M600 480C600 590 528 650 384 650H143L137 622C222 614 225 607 210 531L130 127C113 41 106 36 23 28L17 0H294L300 28C204 36 195 42 212 127L243 284L314 263C327 263 339 263 352 264C465 271 600 337 600 480ZM508 481C508 351 402 304 329 304C289 304 265 311 250 317L295 559C302 594 310 606 323 611C335 616 350 619 367 619C455 619 508 573 508 481Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,17.161,-5.741)"><path d="M460 334C460 396 434 451 378 451C330 451 241 408 148 300H146L237 679C241 697 241 710 232 710C213 710 153 684 67 675L66 646H95C141 646 145 642 134 595L39 170C23 97 31 54 46 33C64 8 100 -12 137 -12C178 -12 234 3 298 43C391 101 460 222 460 334ZM371 320C371 204 316 89 248 51C230 41 208 37 192 37C143 37 102 72 119 166C124 194 129 215 135 235C202 323 298 392 335 392C353 392 371 372 371 
320Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,21.514,-5.741)"><path d="M460 334C460 396 434 451 378 451C330 451 241 408 148 300H146L237 679C241 697 241 710 232 710C213 710 153 684 67 675L66 646H95C141 646 145 642 134 595L39 170C23 97 31 54 46 33C64 8 100 -12 137 -12C178 -12 234 3 298 43C391 101 460 222 460 334ZM371 320C371 204 316 89 248 51C230 41 208 37 192 37C143 37 102 72 119 166C124 194 129 215 135 235C202 323 298 392 335 392C353 392 371 372 371 320Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,25.866,-5.741)"><path d="M452 282C452 397 389 451 302 451C268 451 227 441 188 422C95 377 24 281 24 154C24 65 70 -12 173 -12C240 -12 297 16 342 52C418 113 452 201 452 282ZM359 282C359 163 308 66 247 39C237 35 225 32 212 32C151 32 114 79 114 157C114 301 180 380 223 398C240 405 250 408 265 408C315 408 359 369 359 282Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,30.079,-5.741)"><path d="M545 403C545 425 527 451 498 451C448 451 400 404 312 286L290 341C262 412 246 451 219 451C182 451 138 404 92 345L112 323C152 368 169 378 181 378C192 378 201 359 216 321L257 214C184 115 142 69 113 69C102 69 93 73 88 79S78 89 68 89C47 89 24 61 24 40C24 8 49 -12 75 -12C125 -12 175 31 271 175L312 64C330 15 357 -12 382 -12C421 -12 475 35 515 98L496 121C466 88 439 62 420 62C402 62 384 92 363 147L325 247C349 280 374 309 397 333C422 361 446 381 462 381C471 381 481 374 488 366C493 360 499 357 505 357C521 357 545 380 545 403Z"></path></g></svg></span></td><td class="align_center"><span style="width: 25.3486ptpx;"><svg height="11.927pt" id="M106" style="vertical-align:-3.291101pt" version="1.1" viewbox="-0.0498162 -8.6359 25.3486 11.927" width="25.3486pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M686 28C612 35 607 44 591 112C563 234 541 360 519 489L489 666L457 658L147 121C100 40 89 36 24 28L17 0H240L250 28C168 34 159 41 190 101L262 237H482C495 180 503 137 510 91C517 47 514 35 441 28L433 
0H677L686 28ZM475 280H285L429 541H431L475 280Z"></path></g><g transform="matrix(.013,0,0,-0.013,9.135,0)"><path d="M600 480C600 590 528 650 384 650H143L137 622C222 614 225 607 210 531L130 127C113 41 106 36 23 28L17 0H294L300 28C204 36 195 42 212 127L243 284L314 263C327 263 339 263 352 264C465 271 600 337 600 480ZM508 481C508 351 402 304 329 304C289 304 265 311 250 317L295 559C302 594 310 606 323 611C335 616 350 619 367 619C455 619 508 573 508 481Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,15.791,3.132)"><path d="M158 548H390L417 615L410 623H122L83 318C105 326 143 337 185 337C296 337 350 275 350 188C350 116 308 42 225 42C164 42 122 74 100 93C90 101 82 99 72 92C60 82 51 68 50 59C48 46 52 38 66 24C82 9 125 -12 172 -12C225 -11 292 15 346 59C408 108 437 166 437 226C437 309 371 397 242 397C214 397 170 382 133 369L158 548Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,20.223,3.132)"><path d="M245 635C92 635 37 457 37 312C37 149 91 -12 244 -12C395 -12 449 166 449 312C449 469 395 635 245 635ZM243 598C332 598 358 454 358 312C358 173 334 26 245 26C158 26 128 174 128 313S152 598 243 598Z"></path></g></svg></span></td><td class="align_center"><span style="width: 25.3486ptpx;"><svg height="11.927pt" id="M107" style="vertical-align:-3.291101pt" version="1.1" viewbox="-0.0498162 -8.6359 25.3486 11.927" width="25.3486pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M686 28C612 35 607 44 591 112C563 234 541 360 519 489L489 666L457 658L147 121C100 40 89 36 24 28L17 0H240L250 28C168 34 159 41 190 101L262 237H482C495 180 503 137 510 91C517 47 514 35 441 28L433 0H677L686 28ZM475 280H285L429 541H431L475 280Z"></path></g><g transform="matrix(.013,0,0,-0.013,9.135,0)"><path d="M600 480C600 590 528 650 384 650H143L137 622C222 614 225 607 210 531L130 127C113 41 106 36 23 28L17 0H294L300 28C204 36 195 42 212 127L243 284L314 263C327 263 339 263 352 264C465 271 600 337 600 480ZM508 481C508 351 402 
304 329 304C289 304 265 311 250 317L295 559C302 594 310 606 323 611C335 616 350 619 367 619C455 619 508 573 508 481Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,15.791,3.132)"><path d="M453 623H65C60 580 56 530 46 472H80C103 538 110 548 175 548H389C310 380 195 168 90 0L98 -12L175 -2C273 206 366 408 462 610L453 623Z"></path></g><g transform="matrix(.0091,0,0,-0.0091,20.224,3.132)"><path d="M158 548H390L417 615L410 623H122L83 318C105 326 143 337 185 337C296 337 350 275 350 188C350 116 308 42 225 42C164 42 122 74 100 93C90 101 82 99 72 92C60 82 51 68 50 59C48 46 52 38 66 24C82 9 125 -12 172 -12C225 -11 292 15 346 59C408 108 437 166 437 226C437 309 371 397 242 397C214 397 170 382 133 369L158 548Z"></path></g></svg></span></td></tr><tr><td class="thead-hr" colspan="8"><hr/></td></tr><tr><td class="align_left">Baseline</td><td class="align_center">Regular</td><td class="align_center">69.7</td><td class="align_center">78.6</td><td class="align_center">62.5</td><td class="align_center">70.5</td><td class="align_center">79.8</td><td class="align_center">63.4</td></tr><tr><td class="align_left" rowspan="2">Deformation</td><td class="align_center">dconv@c3<svg height="5.65839pt" id="M108" style="vertical-align:-0.04980993pt" version="1.1" viewbox="-0.0498162 -5.60858 7.75925 5.65839" width="7.75925pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M548 311L516 323C497 274 452 240 400 240C372 240 342 260 316 278C277 305 235 330 188 330C116 330 66 268 40 199L72 187C91 236 136 270 188 270C216 270 246 250 272 232C311 205 353 180 400 180C472 180 522 242 548 311Z"></path></g></svg>c5+</td><td class="align_center" rowspan="2">71.8</td><td class="align_center" rowspan="2">81.4</td><td class="align_center" rowspan="2">65.3</td><td class="align_center" rowspan="2">73.0</td><td class="align_center" rowspan="2">82.5</td><td class="align_center" rowspan="2">65.9</td></tr><tr><td 
class="align_center">dpool(DCNv1) [<a href="/journals/misy/2022/7556022/#B6" target="_blank">6</a>]</td></tr><tr><td class="align_left" rowspan="2">Modulated deformation</td><td class="align_center">mdconv@c3<svg height="5.65839pt" id="M109" style="vertical-align:-0.04980993pt" version="1.1" viewbox="-0.0498162 -5.60858 7.75925 5.65839" width="7.75925pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M548 311L516 323C497 274 452 240 400 240C372 240 342 260 316 278C277 305 235 330 188 330C116 330 66 268 40 199L72 187C91 236 136 270 188 270C216 270 246 250 272 232C311 205 353 180 400 180C472 180 522 242 548 311Z"></path></g></svg>c5+</td><td class="align_center" rowspan="2">73.7</td><td class="align_center" rowspan="2">83.8</td><td class="align_center" rowspan="2">68.5</td><td class="align_center" rowspan="2">74.9</td><td class="align_center" rowspan="2">84.3</td><td class="align_center" rowspan="2">69.6</td></tr><tr><td class="align_center">Mdpool [<a href="/journals/misy/2022/7556022/#B7" target="_blank">7</a>]</td></tr><tr><td class="align_left"><b>Curvature-driven</b></td><td class="align_center"><span width=""><b>C-dconv@c3</b><svg height="5.65839pt" id="M110" style="vertical-align:-0.04980993pt" version="1.1" viewbox="-0.0498162 -5.60858 7.75925 5.65839" width="7.75925pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M548 311L516 323C497 274 452 240 400 240C372 240 342 260 316 278C277 305 235 330 188 330C116 330 66 268 40 199L72 187C91 236 136 270 188 270C216 270 246 250 272 232C311 205 353 180 400 180C472 180 522 242 548 311Z"></path></g></svg><b>c5+</b></span></td><td class="align_center" rowspan="2"><b>75.2</b></td><td class="align_center" rowspan="2"><b>85.4</b></td><td class="align_center" rowspan="2"><b>71.6</b></td><td class="align_center" rowspan="2"><b>76.5</b></td><td 
class="align_center" rowspan="2"><b>86.2</b></td><td class="align_center" rowspan="2"><b>73.5</b></td></tr><tr><td class="align_left"><b>Deformation</b></td><td class="align_center"><b>C-dpool</b></td></tr><tr class="table-tr"><td colspan="8"><hr class="tbody-hr"/></td></tr></table></td></tr><tr class="table-fn"><td><div>The input images have a shorter side of 600 pixels. In the setting column, “(m)dconv” and “(m)dpool” stand for (modulated) deformable convolution and (modulated) deformable RoIpooling, respectively. “C-dconv” and “C-dpool” stand for curvature-driven deformable convolution and curvature-driven deformable RoIpooling, respectively. “dconv@c3<svg height="5.65839pt" id="M111" style="vertical-align:-0.04980993pt" version="1.1" viewbox="-0.0498162 -5.60858 7.75925 5.65839" width="7.75925pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M548 311L516 323C497 274 452 240 400 240C372 240 342 260 316 278C277 305 235 330 188 330C116 330 66 268 40 199L72 187C91 236 136 270 188 270C216 270 246 250 272 232C311 205 353 180 400 180C472 180 522 242 548 311Z"></path></g></svg>c5” stands for applying deformable conv layers at stages conv3<svg height="5.65839pt" id="M112" style="vertical-align:-0.04980993pt" version="1.1" viewbox="-0.0498162 -5.60858 7.75925 5.65839" width="7.75925pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M548 311L516 323C497 274 452 240 400 240C372 240 342 260 316 278C277 305 235 330 188 330C116 330 66 268 40 199L72 187C91 236 136 270 188 270C216 270 246 250 272 232C311 205 353 180 400 180C472 180 522 242 548 311Z"></path></g></svg>conv5, and “C-dconv@c3<svg height="5.65839pt" id="M113" style="vertical-align:-0.04980993pt" version="1.1" viewbox="-0.0498162 -5.60858 7.75925 5.65839" width="7.75925pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g
transform="matrix(.013,0,0,-0.013,0,0)"><path d="M548 311L516 323C497 274 452 240 400 240C372 240 342 260 316 278C277 305 235 330 188 330C116 330 66 268 40 199L72 187C91 236 136 270 188 270C216 270 246 250 272 232C311 205 353 180 400 180C472 180 522 242 548 311Z"></path></g></svg>c5” stands for applying curvature-driven deformable conv layers at stages conv3<svg height="5.65839pt" id="M114" style="vertical-align:-0.04980993pt" version="1.1" viewbox="-0.0498162 -5.60858 7.75925 5.65839" width="7.75925pt" xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink"><g transform="matrix(.013,0,0,-0.013,0,0)"><path d="M548 311L516 323C497 274 452 240 400 240C372 240 342 260 316 278C277 305 235 330 188 330C116 330 66 268 40 199L72 187C91 236 136 270 188 270C216 270 246 250 272 232C311 205 353 180 400 180C472 180 522 242 548 311Z"></path></g></svg>conv5. Bold values indicate the best result for each metric.<br/></div></td></tr></table>

<div>Detection results on the PASCAL VOC 2007 test set. The detectors are Faster R-CNN and YOLOv4.</div>

Mobile Information Systems

tab1

Table 1

Table 1: Curvature-Driven Deformable Convolutional Networks for End-To-End Object Detection