-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathreferences-2b.bib
2074 lines (1862 loc) · 152 KB
/
references-2b.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
@inproceedings{cai_efficient_2017,
title = {Efficient {Architecture} {Search} by {Network} {Transformation}},
booktitle = {{AAAI}},
author = {Cai, Han and Chen, Tianyao and Zhang, Weinan and Yu, Yong and Wang, Jun},
year = {2017}
}
@article{brock_smash_2017,
title = {{SMASH}: {One}-{Shot} {Model} {Architecture} {Search} through {HyperNetworks}},
volume = {abs/1708.05344},
journal = {ArXiv},
author = {Brock, Andrew and Lim, Theodore and Ritchie, James M. and Weston, Nick},
year = {2017}
}
@article{zoph_neural_2016,
title = {Neural {Architecture} {Search} with {Reinforcement} {Learning}},
volume = {abs/1611.01578},
journal = {ArXiv},
author = {Zoph, Barret and Le, Quoc V.},
year = {2016}
}
@article{pham_efficient_2018,
title = {Efficient {Neural} {Architecture} {Search} via {Parameter} {Sharing}},
volume = {abs/1802.03268},
journal = {ArXiv},
author = {Pham, Hieu and Guan, Melody Y. and Zoph, Barret and Le, Quoc V. and Dean, Jeff},
year = {2018}
}
@article{liu_progressive_2017,
title = {Progressive {Neural} {Architecture} {Search}},
volume = {abs/1712.00559},
journal = {ArXiv},
author = {Liu, Chenxi and Zoph, Barret and Neumann, Maxim and Shlens, Jonathon and Hua, Wei and Li, Li-Jia and Fei-Fei, Li and Yuille, Alan and Huang, Jonathan and Murphy, Kevin L.},
year = {2017}
}
@article{liu_darts_2018,
title = {{DARTS}: {Differentiable} {Architecture} {Search}},
volume = {abs/1806.09055},
journal = {ArXiv},
author = {Liu, Hanxiao and Simonyan, Karen and Yang, Yiming},
year = {2018}
}
@article{zhong_practical_2017,
title = {Practical {Block}-{Wise} {Neural} {Network} {Architecture} {Generation}},
journal = {2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition},
author = {Zhong, Zhao and Yan, Junjie and Wu, Wei and Shao, Jing and Liu, Cheng-Lin},
year = {2017},
pages = {2423--2432}
}
@article{zoph_learning_2017,
title = {Learning {Transferable} {Architectures} for {Scalable} {Image} {Recognition}},
journal = {2018 IEEE/CVF Conference on Computer Vision and Pattern Recognition},
author = {Zoph, Barret and Vasudevan, Vijay and Shlens, Jonathon and Le, Quoc V.},
year = {2017},
pages = {8697--8710}
}
@article{liu_hierarchical_2017,
title = {Hierarchical {Representations} for {Efficient} {Architecture} {Search}},
volume = {abs/1711.00436},
journal = {ArXiv},
author = {Liu, Hanxiao and Simonyan, Karen and Vinyals, Oriol and Fernando, Chrisantha and Kavukcuoglu, Koray},
year = {2017}
}
@inproceedings{jin_auto-keras_2018,
title = {Auto-{Keras}: {An} {Efficient} {Neural} {Architecture} {Search} {System}},
booktitle = {{KDD}},
author = {Jin, Haifeng and Song, Qingquan and Hu, Xia},
year = {2018}
}
@inproceedings{wei_network_2016,
title = {Network {Morphism}},
booktitle = {{ICML}},
author = {Wei, Tao and Wang, Changhu and Rui, Yong and Chen, Chang Wen},
year = {2016}
}
@article{chen_net2net_2015,
title = {{Net2Net}: {Accelerating} {Learning} via {Knowledge} {Transfer}},
volume = {abs/1511.05641},
journal = {CoRR},
author = {Chen, Tianqi and Goodfellow, Ian J. and Shlens, Jonathon},
year = {2015}
}
@article{baker_designing_2016,
title = {Designing {Neural} {Network} {Architectures} using {Reinforcement} {Learning}},
volume = {abs/1611.02167},
journal = {ArXiv},
author = {Baker, Bowen and Gupta, Otkrist and Naik, Nikhil and Raskar, Ramesh},
year = {2016}
}
@inproceedings{real_regularized_2018,
title = {Regularized {Evolution} for {Image} {Classifier} {Architecture} {Search}},
booktitle = {{AAAI}},
author = {Real, Esteban and Aggarwal, Alok and Huang, Yanping and Le, Quoc V.},
year = {2018}
}
@inproceedings{real_large-scale_2017,
title = {Large-{Scale} {Evolution} of {Image} {Classifiers}},
booktitle = {{ICML}},
author = {Real, Esteban and Moore, Sherry and Selle, Andrew and Saxena, Saurabh and Suematsu, Yutaka Leon and Tan, Jie and Le, Quoc V. and Kurakin, Alexey},
year = {2017}
}
@article{stanley_evolving_2001,
title = {Evolving {Neural} {Networks} through {Augmenting} {Topologies}},
volume = {10},
journal = {Evolutionary Computation},
author = {Stanley, Kenneth O. and Miikkulainen, Risto},
year = {2001},
pages = {99--127}
}
@article{klein_fast_2016,
title = {Fast {Bayesian} {Optimization} of {Machine} {Learning} {Hyperparameters} on {Large} {Datasets}},
volume = {abs/1605.07079},
journal = {ArXiv},
author = {Klein, Aaron and Falkner, Stefan and Bartels, Simon and Hennig, Philipp and Hutter, Frank},
year = {2016}
}
@article{zela_towards_2018,
title = {Towards {Automated} {Deep} {Learning}: {Efficient} {Joint} {Neural} {Architecture} and {Hyperparameter} {Search}},
volume = {abs/1807.06906},
journal = {ArXiv},
author = {Zela, Arber and Klein, Aaron and Falkner, Stefan and Hutter, Frank},
year = {2018}
}
@inproceedings{mendoza_towards_2016,
title = {Towards {Automatically}-{Tuned} {Neural} {Networks}},
booktitle = {{AutoML}@{ICML}},
author = {Mendoza, Hector and Klein, Aaron and Feurer, Matthias and Springenberg, Jost Tobias and Hutter, Frank},
year = {2016}
}
@article{bergstra_random_2012,
title = {Random search for hyper-parameter optimization},
volume = {13},
number = {1},
journal = {Journal of Machine Learning Research},
author = {Bergstra, James and Bengio, Yoshua},
year = {2012},
pages = {281--305}
}
@article{snoek_practical_2012,
title = {Practical {Bayesian} {Optimization} of {Machine} {Learning} {Algorithms}},
author = {Snoek, Jasper and Larochelle, Hugo and Adams, Ryan P},
year = {2012},
pages = {2951--2959}
}
@article{hutter_sequential_2011,
title = {Sequential model-based optimization for general algorithm configuration},
author = {Hutter, Frank and Hoos, Holger H and Leytonbrown, Kevin},
year = {2011},
pages = {507--523}
}
@article{flynn_deepstereo_2015,
title = {{DeepStereo}: {Learning} to {Predict} {New} {Views} from the {World}'s {Imagery}},
volume = {abs/1506.06825},
url = {http://arxiv.org/abs/1506.06825},
journal = {CoRR},
author = {Flynn, John and Neulander, Ivan and Philbin, James and Snavely, Noah},
year = {2015},
note = {\_eprint: 1506.06825}
}
@article{he_deep_2015,
title = {Deep {Residual} {Learning} for {Image} {Recognition}},
volume = {abs/1512.03385},
url = {http://arxiv.org/abs/1512.03385},
journal = {CoRR},
author = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
year = {2015},
note = {\_eprint: 1512.03385}
}
@article{ren_faster_2015,
title = {Faster {R}-{CNN}: {Towards} {Real}-{Time} {Object} {Detection} with {Region} {Proposal} {Networks}},
volume = {abs/1506.01497},
url = {http://arxiv.org/abs/1506.01497},
journal = {CoRR},
author = {Ren, Shaoqing and He, Kaiming and Girshick, Ross B. and Sun, Jian},
year = {2015},
note = {\_eprint: 1506.01497}
}
@article{su_multi-view_2015,
title = {Multi-view {Convolutional} {Neural} {Networks} for {3D} {Shape} {Recognition}},
volume = {abs/1505.00880},
url = {http://arxiv.org/abs/1505.00880},
journal = {CoRR},
author = {Su, Hang and Maji, Subhransu and Kalogerakis, Evangelos and Learned-Miller, Erik G.},
year = {2015},
note = {\_eprint: 1505.00880}
}
@article{tatarchenko_single-view_2015,
title = {Single-view to {Multi}-view: {Reconstructing} {Unseen} {Views} with a {Convolutional} {Network}},
volume = {abs/1511.06702},
url = {http://arxiv.org/abs/1511.06702},
journal = {CoRR},
author = {Tatarchenko, Maxim and Dosovitskiy, Alexey and Brox, Thomas},
year = {2015},
note = {\_eprint: 1511.06702}
}
@article{wu_single_2016,
title = {Single {Image} {3D} {Interpreter} {Network}},
volume = {abs/1604.08685},
url = {http://arxiv.org/abs/1604.08685},
journal = {CoRR},
author = {Wu, Jiajun and Xue, Tianfan and Lim, Joseph J. and Tian, Yuandong and Tenenbaum, Joshua B. and Torralba, Antonio and Freeman, William T.},
year = {2016},
note = {\_eprint: 1604.08685}
}
@article{xie_deep3d_2016,
title = {{Deep3D}: {Fully} {Automatic} {2D}-to-{3D} {Video} {Conversion} with {Deep} {Convolutional} {Neural} {Networks}},
volume = {abs/1604.03650},
url = {http://arxiv.org/abs/1604.03650},
journal = {CoRR},
author = {Xie, Junyuan and Girshick, Ross B. and Farhadi, Ali},
year = {2016},
note = {\_eprint: 1604.03650}
}
@article{zamir_generic_2017,
title = {Generic {3D} {Representation} via {Pose} {Estimation} and {Matching}},
volume = {abs/1710.08247},
url = {http://arxiv.org/abs/1710.08247},
journal = {CoRR},
author = {Zamir, Amir Roshan and Wekel, Tilman and Agrawal, Pulkit and Wei, Colin and Malik, Jitendra and Savarese, Silvio},
year = {2017},
note = {\_eprint: 1710.08247}
}
@incollection{lecun_generalization_1989,
title = {Generalization and network design strategies},
booktitle = {Connectionism in perspective},
publisher = {Elsevier},
author = {Lecun, Yann},
editor = {Pfeifer, R. and Schreter, Z. and Fogelman, F. and Steels, L.},
year = {1989}
}
@article{ghiasi_laplacian_2016,
title = {Laplacian {Reconstruction} and {Refinement} for {Semantic} {Segmentation}},
volume = {abs/1605.02264},
url = {http://arxiv.org/abs/1605.02264},
journal = {CoRR},
author = {Ghiasi, Golnaz and Fowlkes, Charless C.},
year = {2016},
note = {\_eprint: 1605.02264}
}
@article{wang_o-cnn_2017,
title = {O-{CNN}: octree-based convolutional neural networks for {3D} shape analysis},
volume = {36},
url = {http://doi.acm.org/10.1145/3072959.3073608},
doi = {10.1145/3072959.3073608},
number = {4},
journal = {ACM Trans. Graph.},
author = {Wang, Peng-Shuai and Liu, Yang and Guo, Yu-Xiao and Sun, Chun-Yu and Tong, Xin},
year = {2017},
pages = {72:1--72:11}
}
@article{riegler_octnet_2016,
title = {{OctNet}: {Learning} {Deep} {3D} {Representations} at {High} {Resolutions}},
volume = {abs/1611.05009},
url = {http://arxiv.org/abs/1611.05009},
journal = {CoRR},
author = {Riegler, Gernot and Ulusoy, Ali Osman and Geiger, Andreas},
year = {2016},
note = {\_eprint: 1611.05009}
}
@inproceedings{huang_point_2016,
title = {Point cloud labeling using {3D} {Convolutional} {Neural} {Network}},
doi = {10.1109/ICPR.2016.7900038},
booktitle = {2016 23rd {International} {Conference} on {Pattern} {Recognition} ({ICPR})},
author = {Huang, Jing and You, Suya},
year = {2016},
keywords = {3D convolutional neural network, 3D point cloud labeling scheme, computer vision, data handling, Labeling, neural nets, Neural networks, object recognition, Testing, testing process, Three-dimensional displays, Training, Training data, training process, Two dimensional displays, urban point cloud dataset},
pages = {2670--2675}
}
@inproceedings{pratikakis_unstructured_2017,
title = {Unstructured {Point} {Cloud} {Semantic} {Labeling} {Using} {Deep} {Segmentation} {Networks}},
isbn = {978-3-03868-030-7},
doi = {10.2312/3dor.20171047},
booktitle = {Eurographics {Workshop} on {3D} {Object} {Retrieval}},
publisher = {The Eurographics Association},
author = {Boulch, Alexandre and Saux, Bertrand Le and Audebert, Nicolas},
editor = {Pratikakis, Ioannis and Dupont, Florent and Ovsjanikov, Maks},
year = {2017},
note = {ISSN: 1997-0471}
}
@article{kamnitsas_efficient_2016,
title = {Efficient {Multi}-{Scale} {3D} {CNN} with {Fully} {Connected} {CRF} for {Accurate} {Brain} {Lesion} {Segmentation}},
volume = {abs/1603.05959},
url = {http://arxiv.org/abs/1603.05959},
journal = {CoRR},
author = {Kamnitsas, Konstantinos and Ledig, Christian and Newcombe, Virginia F. J. and Simpson, Joanna P. and Kane, Andrew D. and Menon, David K. and Rueckert, Daniel and Glocker, Ben},
year = {2016},
note = {\_eprint: 1603.05959}
}
@article{klokov_escape_2017,
title = {Escape from {Cells}: {Deep} {Kd}-{Networks} for {The} {Recognition} of {3D} {Point} {Cloud} {Models}},
volume = {abs/1704.01222},
url = {http://arxiv.org/abs/1704.01222},
journal = {CoRR},
author = {Klokov, Roman and Lempitsky, Victor S.},
year = {2017},
note = {\_eprint: 1704.01222}
}
@inproceedings{kim_3d_2013,
title = {{3D} {Scene} {Understanding} by {Voxel}-{CRF}},
url = {https://doi.org/10.1109/ICCV.2013.180},
doi = {10.1109/ICCV.2013.180},
booktitle = {{IEEE} {International} {Conference} on {Computer} {Vision}, {ICCV} 2013, {Sydney}, {Australia}, {December} 1-8, 2013},
author = {Kim, Byung-soo and Kohli, Pushmeet and Savarese, Silvio},
year = {2013},
pages = {1425--1432}
}
@book{noauthor_ieee_2013,
title = {{IEEE} {International} {Conference} on {Computer} {Vision}, {ICCV} 2013, {Sydney}, {Australia}, {December} 1-8, 2013},
isbn = {978-1-4799-2839-2},
url = {http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=6750807},
publisher = {IEEE Computer Society},
year = {2013}
}
@inproceedings{maturana_voxnet_2015,
title = {{VoxNet}: {A} {3D} {Convolutional} {Neural} {Network} for real-time object recognition},
url = {https://doi.org/10.1109/IROS.2015.7353481},
doi = {10.1109/IROS.2015.7353481},
booktitle = {2015 {IEEE}/{RSJ} {International} {Conference} on {Intelligent} {Robots} and {Systems}, {IROS} 2015, {Hamburg}, {Germany}, {September} 28 - {October} 2, 2015},
author = {Maturana, Daniel and Scherer, Sebastian},
year = {2015},
pages = {922--928}
}
@incollection{tran_deep_2016,
address = {United States},
title = {Deep {End2End} {Voxel2Voxel} {Prediction}},
abstract = {Over the last few years deep learning methods have emerged as one of the most prominent approaches for video analysis. However, so far their most successful applications have been in the area of video classification and detection, i.e., problems involving the prediction of a single class label or a handful of output variables per video. Furthermore, while deep networks are commonly recognized as the best models to use in these domains, there is a widespread perception that in order to yield successful results they often require time-consuming architecture search, manual tweaking of parameters and computationally intensive preprocessing or post-processing methods. In this paper we challenge these views by presenting a deep 3D convolutional architecture trained end to end to perform voxel-level prediction, i.e., to output a variable at every voxel of the video. Most importantly, we show that the same exact architecture can be used to achieve competitive results on three widely different voxel-prediction tasks: video semantic segmentation, optical flow estimation, and video coloring. The three networks learned on these problems are trained from raw video without any form of preprocessing and their outputs do not require post-processing to achieve outstanding performance. Thus, they offer an efficient alternative to traditional and much more computationally expensive methods in these video domains.},
booktitle = {Proceedings - 29th {IEEE} {Conference} on {Computer} {Vision} and {Pattern} {Recognition} {Workshops}, {CVPRW} 2016},
publisher = {IEEE Computer Society},
author = {Tran, Du and Bourdev, Lubomir and Fergus, Rob and Torresani, Lorenzo and Paluri, Manohar},
year = {2016},
doi = {10.1109/CVPRW.2016.57},
pages = {402--409}
}
@article{brock_generative_2016,
title = {Generative and {Discriminative} {Voxel} {Modeling} with {Convolutional} {Neural} {Networks}},
volume = {abs/1608.04236},
url = {http://arxiv.org/abs/1608.04236},
journal = {CoRR},
author = {Brock, André and Lim, Theodore and Ritchie, James M. and Weston, Nick},
year = {2016},
note = {\_eprint: 1608.04236}
}
@inproceedings{silberman_indoor_2012,
address = {Berlin, Heidelberg},
series = {{ECCV}'12},
title = {Indoor {Segmentation} and {Support} {Inference} from {RGBD} {Images}},
isbn = {978-3-642-33714-7},
url = {http://dx.doi.org/10.1007/978-3-642-33715-4_54},
doi = {10.1007/978-3-642-33715-4_54},
booktitle = {Proceedings of the 12th {European} {Conference} on {Computer} {Vision} - {Volume} {Part} {V}},
publisher = {Springer-Verlag},
author = {Silberman, Nathan and Hoiem, Derek and Kohli, Pushmeet and Fergus, Rob},
year = {2012},
note = {event-place: Florence, Italy},
pages = {746--760}
}
@article{meagher_geometric_1982,
title = {Geometric {Modeling} {Using} {Octree}-{Encoding}},
volume = {19},
journal = {Computer Graphics and Image Processing},
author = {Meagher, Donald},
year = {1982},
pages = {129--147}
}
@article{wilhelms_octrees_1992,
title = {Octrees for {Faster} {Isosurface} {Generation}},
volume = {11},
issn = {0730-0301},
url = {http://doi.acm.org/10.1145/130881.130882},
doi = {10.1145/130881.130882},
number = {3},
journal = {ACM Trans. Graph.},
author = {Wilhelms, Jane and Van Gelder, Allen},
year = {1992},
note = {Place: New York, NY, USA
Publisher: ACM},
keywords = {hierarchical spatial enumeration, isosurface extraction, octree, scientific visualization},
pages = {201--227}
}
@article{wu_3d_2014,
title = {{3D} for 2.{5D} {Object} {Recognition} and {Next}-{Best}-{View} {Prediction}},
volume = {abs/1406.5670},
url = {http://arxiv.org/abs/1406.5670},
journal = {CoRR},
author = {Wu, Zhirong and Song, Shuran and Khosla, Aditya and Tang, Xiaoou and Xiao, Jianxiong},
year = {2014},
note = {\_eprint: 1406.5670},
file = {全文:C\:\\Users\\qinka\\Zotero\\storage\\NSJWSBK8\\Wu 等。 - 2014 - 3D for 2.5D Object Recognition and Next-Best-View .pdf:application/pdf}
}
@article{sharma_vconv-dae_2016,
title = {{VConv}-{DAE}: {Deep} {Volumetric} {Shape} {Learning} {Without} {Object} {Labels}},
volume = {abs/1604.03755},
url = {http://arxiv.org/abs/1604.03755},
journal = {CoRR},
author = {Sharma, Abhishek and Grau, Oliver and Fritz, Mario},
year = {2016},
note = {\_eprint: 1604.03755}
}
@article{esteves_3d_2017,
title = {{3D} object classification and retrieval with {Spherical} {CNNs}},
volume = {abs/1711.06721},
url = {http://arxiv.org/abs/1711.06721},
journal = {CoRR},
author = {Esteves, Carlos and Allen-Blanchette, Christine and Makadia, Ameesh and Daniilidis, Kostas},
year = {2017},
note = {\_eprint: 1711.06721}
}
@article{sedaghat_orientation-boosted_2016,
title = {Orientation-boosted {Voxel} {Nets} for {3D} {Object} {Recognition}},
volume = {abs/1604.03351},
url = {http://arxiv.org/abs/1604.03351},
journal = {CoRR},
author = {Sedaghat, Nima and Zolfaghari, Mohammadreza and Brox, Thomas},
year = {2016},
note = {\_eprint: 1604.03351}
}
@article{song_semantic_2017,
title = {Semantic {Scene} {Completion} from a {Single} {Depth} {Image}},
journal = {IEEE Conference on Computer Vision and Pattern Recognition},
author = {Song, Shuran and Yu, Fisher and Zeng, Andy and Chang, Angel X and Savva, Manolis and Funkhouser, Thomas},
year = {2017}
}
@article{tchapmi_segcloud_2017,
title = {{SEGCloud}: {Semantic} {Segmentation} of {3D} {Point} {Clouds}},
volume = {abs/1710.07563},
url = {http://arxiv.org/abs/1710.07563},
journal = {CoRR},
author = {Tchapmi, Lyne P. and Choy, Christopher B. and Armeni, Iro and Gwak, JunYoung and Savarese, Silvio},
year = {2017},
note = {\_eprint: 1710.07563}
}
@article{xu_spidercnn_2018,
title = {{SpiderCNN}: {Deep} {Learning} on {Point} {Sets} with {Parameterized} {Convolutional} {Filters}},
journal = {ArXiv e-prints},
author = {Xu, Y. and Fan, T. a@articleDBLP:journals/tog/WangLGST17, author = Peng-Shuai Wang {and} Yang Liu {and} Yu-Xiao Guo {and} Chun-Yu Sun {and} Xin Tong, title = O-CNN: octree-based convolutional neural networks for 3D shape analysis, journal = ACM Trans. Graph., volume = 36, number = 4, pages = 72:1–72:11, year = 2017, url = http://doi.acm.org/10.1145/3072959.3073608, doi = 10.1145/3072959.3073608, timestamp = Sun, 06 Aug 2017 17:40:31 +0200, biburl = http://dblp.org/rec/bib/journals/tog/WangLGST17, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/RieglerUG16, author = Gernot Riegler {and} Ali Osman Ulusoy {and} Andreas Geiger, title = OctNet: Learning Deep 3D Representations at High Resolutions, journal = CoRR, volume = abs/1611.05009, year = 2016, url = http://arxiv.org/abs/1611.05009, archivePrefix = arXiv, eprint = 1611.05009, timestamp = Wed, 07 Jun 2017 14:40:54 +0200, biburl = http://dblp.org/rec/bib/journals/corr/RieglerUG16, bibsource = dblp computer science bibliography, http://dblp.org @INPROCEEDINGS7900038, author=Jing Huang {and} Suya You, booktitle=2016 23rd International Conference on Pattern Recognition (ICPR), title=Point cloud labeling using 3D Convolutional Neural Network, year=2016, volume=, number=, pages=2670-2675, keywords=computer vision;data handling;neural nets;object recognition;3D convolutional neural network;3D point cloud labeling scheme;computer vision;data handling;object recognition;testing process;training process;urban point cloud dataset;Labeling;Neural networks;Testing;Three-dimensional displays;Training;Training data;Two dimensional displays, doi=10.1109/ICPR.2016.7900038, ISSN=, month=Dec, @inproceedings 3dor.20171047, booktitle = Eurographics Workshop on 3D Object Retrieval, editor = Ioannis Pratikakis {and} Florent Dupont {and} Maks Ovsjanikov, title = Unstructured Point Cloud Semantic Labeling Using Deep Segmentation Networks, author = Boulch, Alexandre {and} Saux, Bertrand Le {and} Audebert, Nicolas, year = 2017, publisher = The Eurographics Association, ISSN = 1997-0471, ISBN = 978-3-03868-030-7, DOI = 10.2312/3dor.20171047 @articleDBLP:journals/corr/EngelckeRWTP16, author = Martin Engelcke {and} Dushyant Rao {and} Dominic Zeng Wang {and} Chi Hay Tong {and} Ingmar Posner, title = Vote3Deep: Fast Object Detection in 3D Point Clouds Using Efficient Convolutional Neural Networks, journal = CoRR, volume = abs/1609.06666, year = 2016, url = http://arxiv.org/abs/1609.06666, archivePrefix = arXiv, eprint = 1609.06666, timestamp = Wed, 07 Jun 2017 14:41:41 +0200, biburl = http://dblp.org/rec/bib/journals/corr/EngelckeRWTP16, bibsource = dblp computer science bibliography, http://dblp.org @proceedingsDBLP:conf/icra/2017, title = 2017 IEEE International Conference on Robotics {and} Automation, ICRA 2017, Singapore, Singapore, May 29 - June 3, 2017, publisher = IEEE, year = 2017, url = http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=7960754, isbn = 978-1-5090-4633-1, timestamp = Wed, 26 Jul 2017 15:16:56 +0200, biburl = http://dblp.org/rec/bib/conf/icra/2017, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/KamnitsasLNSKMR16, author = Konstantinos Kamnitsas {and} Christian Ledig {and} Virginia F. J. Newcombe {and} Joanna P. Simpson {and} Andrew D. Kane {and} David K. Menon {and} Daniel Rueckert {and} Ben Glocker, title = Efficient Multi-Scale 3D CNN with Fully Connected CRF for Accurate Brain Lesion Segmentation, journal = CoRR, volume = abs/1603.05959, year = 2016, url = http://arxiv.org/abs/1603.05959, archivePrefix = arXiv, eprint = 1603.05959, timestamp = Wed, 07 Jun 2017 14:42:35 +0200, biburl = http://dblp.org/rec/bib/journals/corr/KamnitsasLNSKMR16, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/KlokovL17, author = Roman Klokov {and} Victor S. Lempitsky, title = Escape from Cells: Deep Kd-Networks for The Recognition of 3D Point Cloud Models, journal = CoRR, volume = abs/1704.01222, year = 2017, url = http://arxiv.org/abs/1704.01222, archivePrefix = arXiv, eprint = 1704.01222, timestamp = Wed, 07 Jun 2017 14:40:16 +0200, biburl = http://dblp.org/rec/bib/journals/corr/KlokovL17, bibsource = dblp computer science bibliography, http://dblp.org @inproceedingsDBLP:conf/iccv/KimKS13, author = Byung-soo Kim {and} Pushmeet Kohli {and} Silvio Savarese, title = 3D Scene Understanding by Voxel-CRF, booktitle = IEEE International Conference on Computer Vision, ICCV 2013, Sydney, Australia, December 1-8, 2013, pages = 1425–1432, year = 2013, crossref = DBLP:conf/iccv/2013, url = https://doi.org/10.1109/ICCV.2013.180, doi = 10.1109/ICCV.2013.180, timestamp = Wed, 24 May 2017 08:31:04 +0200, biburl = http://dblp.org/rec/bib/conf/iccv/KimKS13, bibsource = dblp computer science bibliography, http://dblp.org @proceedingsDBLP:conf/iccv/2013, title = IEEE International Conference on Computer Vision, ICCV 2013, Sydney, Australia, December 1-8, 2013, publisher = IEEE Computer Society, year = 2013, url = http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=6750807, isbn = 978-1-4799-2839-2, timestamp = Fri, 19 Feb 2016 11:45:57 +0100, biburl = http://dblp.org/rec/bib/conf/iccv/2013, bibsource = dblp computer science bibliography, http://dblp.org @inproceedingsDBLP:conf/iros/MaturanaS15, author = Daniel Maturana {and} Sebastian Scherer, title = VoxNet: A 3D Convolutional Neural Network for real-time object recognition, booktitle = 2015 IEEE/RSJ International Conference on Intelligent Robots {and} Systems, IROS 2015, Hamburg, Germany, September 28 - October 2, 2015, pages = 922–928, year = 2015, crossref = DBLP:conf/iros/2015, url = https://doi.org/10.1109/IROS.2015.7353481, doi = 10.1109/IROS.2015.7353481, timestamp = Mon, 22 May 2017 17:11:27 +0200, biburl = http://dblp.org/rec/bib/conf/iros/MaturanaS15, bibsource = dblp computer science bibliography, http://dblp.org @proceedingsDBLP:conf/iros/2015, title = 2015 IEEE/RSJ International Conference on Intelligent Robots {and} Systems, IROS 2015, Hamburg, Germany, September 28 - October 2, 2015, publisher = IEEE, year = 2015, url = http://ieeexplore.ieee.org/xpl/mostRecentIssue.jsp?punumber=7347169, isbn = 978-1-4799-9994-1, timestamp = Mon, 04 Jan 2016 12:12:56 +0100, biburl = http://dblp.org/rec/bib/conf/iros/2015, bibsource = dblp computer science bibliography, http://dblp.org @inbook765ece793c4e4a05ac7b7cd9f4d4da66, title = "Deep End2End Voxel2Voxel Prediction", abstract = "Over the last few years deep learning methods have emerged as one of the most prominent approaches for video analysis. However, so far their most successful applications have been in the area of video classification {and} detection, i.e., problems involving the prediction of a single class label or a handful of output variables per video. Furthermore, while deep networks are commonly recognized as the best models to use in these domains, there is a widespread perception that in order to yield successful results they often require time-consuming architecture search, manual tweaking of parameters {and} computationally intensive preprocessing or post-processing methods. In this paper we challenge these views by presenting a deep 3D convolutional architecture trained end to end to perform voxel-level prediction, i.e., to output a variable at every voxel of the video. Most importantly, we show that the same exact architecture can be used to achieve competitive results on three widely different voxel-prediction tasks: video semantic segmentation, optical flow estimation, {and} video coloring. The three networks learned on these problems are trained from raw video without any form of preprocessing {and} their outputs do not require post-processing to achieve outstanding performance. Thus, they offer an efficient alternative to traditional {and} much more computationally expensive methods in these video domains.", author = "Du Tran {and} Lubomir Bourdev {and} Rob Fergus {and} Lorenzo Torresani {and} Manohar Paluri", year = "2016", month = "12", doi = "10.1109/CVPRW.2016.57", pages = "402–409", booktitle = "Proceedings - 29th IEEE Conference on Computer Vision {and} Pattern Recognition Workshops, CVPRW 2016", publisher = "IEEE Computer Society", address = "United States", @articleDBLP:journals/corr/BrockLRW16, author = André Brock {and} Theodore Lim {and} James M. Ritchie {and} Nick Weston, title = Generative {and} Discriminative Voxel Modeling with Convolutional Neural Networks, journal = CoRR, volume = abs/1608.04236, year = 2016, url = http://arxiv.org/abs/1608.04236, archivePrefix = arXiv, eprint = 1608.04236, timestamp = Wed, 07 Jun 2017 14:42:45 +0200, biburl = http://dblp.org/rec/bib/journals/corr/BrockLRW16, bibsource = dblp computer science bibliography, http://dblp.org @inproceedingsSilberman:2012:ISS:2403138.2403195, author = Silberman, Nathan {and} Hoiem, Derek {and} Kohli, Pushmeet {and} Fergus, Rob, title = Indoor Segmentation {and} Support Inference from RGBD Images, booktitle = Proceedings of the 12th European Conference on Computer Vision - Volume Part V, series = ECCV'12, year = 2012, isbn = 978-3-642-33714-7, location = Florence, Italy, pages = 746–760, numpages = 15, url = http://dx.doi.org/10.1007/978-3-642-33715-4\_54, doi = 10.1007/978-3-642-33715-4\_54, acmid = 2403195, publisher = Springer-Verlag, address = Berlin, Heidelberg, @articleMeagherOctree, author = Meagher, Donald, year = 1982, month = 06, pages = 129-147, title = Geometric Modeling Using Octree-Encoding, volume = 19, booktitle = Computer Graphics {and} Image Processing @articleWilhelms:1992:OFI:130881.130882, author = Wilhelms, Jane {and} Van Gelder, Allen, title = Octrees for Faster Isosurface Generation, journal = ACM Trans. Graph., issue\_date = July 1992, volume = 11, number = 3, month = jul, year = 1992, issn = 0730-0301, pages = 201–227, numpages = 27, url = http://doi.acm.org/10.1145/130881.130882, doi = 10.1145/130881.130882, acmid = 130882, publisher = ACM, address = New York, NY, USA, keywords = hierarchical spatial enumeration, isosurface extraction, octree, scientific visualization, @articleDBLP:journals/corr/WuSKTX14, author = Zhirong Wu {and} Shuran Song {and} Aditya Khosla {and} Xiaoou Tang {and} Jianxiong Xiao, title = 3D for 2.5D Object Recognition {and} Next-Best-View Prediction, journal = CoRR, volume = abs/1406.5670, year = 2014, url = http://arxiv.org/abs/1406.5670, archivePrefix = arXiv, eprint = 1406.5670, timestamp = Wed, 07 Jun 2017 14:42:52 +0200, biburl = http://dblp.org/rec/bib/journals/corr/WuSKTX14, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/SharmaGF16, author = Abhishek Sharma {and} Oliver Grau {and} Mario Fritz, title = VConv-DAE: Deep Volumetric Shape Learning Without Object Labels, journal = CoRR, volume = abs/1604.03755, year = 2016, url = http://arxiv.org/abs/1604.03755, archivePrefix = arXiv, eprint = 1604.03755, timestamp = Wed, 07 Jun 2017 14:43:02 +0200, biburl = http://dblp.org/rec/bib/journals/corr/SharmaGF16, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/GirdharFRG16, author = Rohit Girdhar {and} David F. Fouhey {and} Mikel Rodriguez {and} Abhinav Gupta, title = Learning a Predictable {and} Generative Vector Representation for Objects, journal = CoRR, volume = abs/1603.08637, year = 2016, url = http://arxiv.org/abs/1603.08637, archivePrefix = arXiv, eprint = 1603.08637, timestamp = Wed, 07 Jun 2017 14:40:15 +0200, biburl = http://dblp.org/rec/bib/journals/corr/GirdharFRG16, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/ChoyXGCS16, author = Christopher Bongsoo Choy {and} Danfei Xu {and} JunYoung Gwak {and} Kevin Chen {and} Silvio Savarese, title = 3D-R2N2: A Unified Approach for Single {and} Multi-view 3D Object Reconstruction, journal = CoRR, volume = abs/1604.00449, year = 2016, url = http://arxiv.org/abs/1604.00449, archivePrefix = arXiv, eprint = 1604.00449, timestamp = Wed, 07 Jun 2017 14:42:32 +0200, biburl = http://dblp.org/rec/bib/journals/corr/ChoyXGCS16, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/MilletariNA16, author = Fausto Milletari {and} Nassir Navab {and} Seyed-Ahmad Ahmadi, title = V-Net: Fully Convolutional Neural Networks for Volumetric Medical Image Segmentation, journal = CoRR, volume = abs/1606.04797, year = 2016, url = http://arxiv.org/abs/1606.04797, archivePrefix = arXiv, eprint = 1606.04797, timestamp = Wed, 07 Jun 2017 14:40:44 +0200, biburl = http://dblp.org/rec/bib/journals/corr/MilletariNA16, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/SongX15, author = Shuran Song {and} Jianxiong Xiao, title = Deep Sliding Shapes for Amodal 3D Object Detection in RGB-D Images, journal = CoRR, volume = abs/1511.02300, year = 2015, url = http://arxiv.org/abs/1511.02300, archivePrefix = arXiv, eprint = 1511.02300, timestamp = Wed, 07 Jun 2017 14:42:51 +0200, biburl = http://dblp.org/rec/bib/journals/corr/SongX15, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/CicekALBR16, author = Özgün Çiçek {and} Ahmed Abdulkadir {and} Soeren S. Lienkamp {and} Thomas Brox {and} Olaf Ronneberger, title = 3D U-Net: Learning Dense Volumetric Segmentation from Sparse Annotation, journal = CoRR, volume = abs/1606.06650, year = 2016, url = http://arxiv.org/abs/1606.06650, archivePrefix = arXiv, eprint = 1606.06650, timestamp = Wed, 07 Jun 2017 14:41:35 +0200, biburl = http://dblp.org/rec/bib/journals/corr/CicekALBR16, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/Graham14, author = Benjamin Graham, title = Spatially-sparse convolutional neural networks, journal = CoRR, volume = abs/1409.6070, year = 2014, url = http://arxiv.org/abs/1409.6070, archivePrefix = arXiv, eprint = 1409.6070, timestamp = Wed, 07 Jun 2017 14:41:28 +0200, biburl = http://dblp.org/rec/bib/journals/corr/Graham14, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/Graham15, author = Ben Graham, title = Sparse 3D convolutional neural networks, journal = CoRR, volume = abs/1505.02890, year = 2015, url = http://arxiv.org/abs/1505.02890, archivePrefix = arXiv, eprint = 1505.02890, timestamp = Wed, 07 Jun 2017 14:42:35 +0200, biburl = http://dblp.org/rec/bib/journals/corr/Graham15, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/KiefelJG15, author = Martin Kiefel {and} Varun Jampani {and} Peter V. Gehler, title = Sparse Convolutional Networks using the Permutohedral Lattice, journal = CoRR, volume = abs/1503.04949, year = 2015, url = http://arxiv.org/abs/1503.04949, archivePrefix = arXiv, eprint = 1503.04949, timestamp = Wed, 07 Jun 2017 14:41:32 +0200, biburl = http://dblp.org/rec/bib/journals/corr/KiefelJG15, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/LiPSQG16, author = Yangyan Li {and} Sören Pirk {and} Hao Su {and} Charles Ruizhongtai Qi {and} Leonidas J. Guibas, title = FPNN: Field Probing Neural Networks for 3D Data, journal = CoRR, volume = abs/1605.06240, year = 2016, url = http://arxiv.org/abs/1605.06240, archivePrefix = arXiv, eprint = 1605.06240, timestamp = Wed, 07 Jun 2017 14:40:47 +0200, biburl = http://dblp.org/rec/bib/journals/corr/LiPSQG16, bibsource = dblp computer science bibliography, http://dblp.org @articleDBLP:journals/corr/abs-1711-06721, author = Carlos Esteves {and} Christine Allen-Blanchette {and} Ameesh Makadia {and} Kostas Daniilidis, title = 3D object classification {and} retrieval with Spherical CNNs, journal = CoRR, volume = abs/1711.06721, year = 2017, url = http://arxiv.org/abs/1711.06721, archivePrefix = arXiv, eprint = 1711.06721, timestamp = Sun, 03 Dec 2017 12:38:15 +0100, biburl = https://dblp.org/rec/bib/journals/corr/abs-1711-06721, bibsource = dblp computer science bibliography, https://dblp.org @articleDBLP:journals/corr/AlvarZB16, author = Nima Sedaghat {and} Mohammadreza Zolfaghari {and} Thomas Brox, title = Orientation-boosted Voxel Nets for 3D Object Recognition, journal = CoRR, volume = abs/1604.03351, year = 2016, url = http://arxiv.org/abs/1604.03351, archivePrefix = arXiv, eprint = 1604.03351, timestamp = Wed, 07 Jun 2017 14:40:18 +0200, biburl = https://dblp.org/rec/bib/journals/corr/AlvarZB16, bibsource = dblp computer science bibliography, https://dblp.org @articlesong2016ssc, title= Semantic Scene Completion from a Single Depth Image, author= Song, Shuran {and} Yu, Fisher {and} Zeng, Andy {and} Chang, Angel X {and} Savva, Manolis {and} Funkhouser, Thomas, journal=IEEE Conference on Computer Vision {and} Pattern Recognition, year=2017 @articleDBLP:journals/corr/abs-1710-07563, author = Lyne P. Tchapmi {and} Christopher B. Choy {and} Iro Armeni {and} JunYoung Gwak {and} Silvio Savarese, title = SEGCloud: Semantic Segmentation of 3D Point Clouds, journal = CoRR, volume = abs/1710.07563, year = 2017, url = http://arxiv.org/abs/1710.07563, archivePrefix = arXiv, eprint = 1710.07563, timestamp = Wed, 01 Nov 2017 19:05:43 +0100, biburl = http://dblp.org/rec/bib/journals/corr/abs-1710-07563, bibsource = dblp computer science bibliography, http://dblp.org @ARTICLE2018arXiv180311527X, author = Xu, Y. {and} Fan, T. {and} Xu, M. {and} Zeng, L. {and} Qiao, Y., title = "SpiderCNN: Deep Learning on Point Sets with Parameterized Convolutional Filters", journal = ArXiv e-prints, archivePrefix = "arXiv", eprint = 1803.11527, primaryClass = "cs.CV", keywords = Computer Science - Computer Vision {and} Pattern Recognition, year = 2018, month = mar, adsurl = http://adsabs.harvard.edu/abs/2018arXiv180311527X, adsnote = Provided by the SAO/NASA Astrophysics Data System @articleDBLP:journals/corr/abs-1802-08275, author = Hang Su {and} Varun Jampani {and} Deqing Sun {and} Subhransu Maji {and} Evangelos Kalogerakis {and} Ming-Hsuan Yang {and} Jan Kautz, title = SPLATNet: Sparse Lattice Networks for Point Cloud Processing, journal = CoRR, volume = abs/1802.08275, year = 2018, url = http://arxiv.org/abs/1802.08275, archivePrefix = arXiv, eprint = 1802.08275, timestamp = Mon, 26 Mar 2018 12:54:00 +0200, biburl = https://dblp.org/rec/bib/journals/corr/abs-1802-08275, bibsource = dblp computer science bibliography, https://dblp.org @ARTICLE2018arXiv180311385S, author = Shao, T. {and} Yang, Y. {and} Weng, Y. {and} Hou, Q. {and} Zhou, K., title = "H-CNN: Spatial Hashing Based CNN for 3D Shape Analysis", journal = ArXiv e-prints, archivePrefix = "arXiv", eprint = 1803.11385, primaryClass = "cs.GR", keywords = Computer Science - Graphics, year = 2018, month = mar, adsurl = http://adsabs.harvard.edu/abs/2018arXiv180311385S, adsnote = Provided by the SAO/NASA Astrophysics Data System @ARTICLE2018arXiv180311303C, author = Cai, J. {and} Lu, L. {and} Xing, F. {and} Yang, L., title = "Pancreas Segmentation in CT {and} MRI Images via Domain Specific Network Designing {and} Recurrent Neural Contextual Learning", journal = ArXiv e-prints, archivePrefix = "arXiv", eprint = 1803.11303, primaryClass = "cs.CV", keywords = Computer Science - Computer Vision {and} Pattern Recognition, year = 2018, month = mar, adsurl = http://adsabs.harvard.edu/abs/2018arXiv180311303C, adsnote = Provided by the SAO/NASA Astrophysics Data System @articleDBLP:journals/corr/QiSMG16, author = Charles Ruizhongtai Qi {and} Hao Su {and} Kaichun Mo {and} Leonidas J. Guibas, title = PointNet: Deep Learning on Point Sets for 3D Classification {and} Segmentation, journal = CoRR, volume = abs/1612.00593, year = 2016, url = http://arxiv.org/abs/1612.00593, archivePrefix = arXiv, eprint = 1612.00593, timestamp = Wed, 07 Jun 2017 14:43:06 +0200, biburl = https://dblp.org/rec/bib/journals/corr/QiSMG16, bibsource = dblp computer science bibliography, https://dblp.org @articleDBLP:journals/corr/QiYSG17, author = Charles Ruizhongtai Qi {and} Li Yi {and} Hao Su {and} Leonidas J. Guibas, title = PointNet++: Deep Hierarchical Feature Learning on Point Sets in a Metric Space, journal = CoRR, volume = abs/1706.02413, year = 2017, url = http://arxiv.org/abs/1706.02413, archivePrefix = arXiv, eprint = 1706.02413, timestamp = Mon, 03 Jul 2017 13:29:02 +0200, biburl = https://dblp.org/rec/bib/journals/corr/QiYSG17, bibsource = dblp computer science bibliography, https://dblp.org @articleDBLP:journals/corr/abs-1801-07791, author = Yangyan Li {and} Rui Bu {and} Mingchao Sun {and} Baoquan Chen, title = PointCNN, journal = CoRR, volume = abs/1801.07791, year = 2018, url = http://arxiv.org/abs/1801.07791, archivePrefix = arXiv, eprint = 1801.07791, timestamp = Fri, 02 Feb 2018 14:20:25 +0100, biburl = https://dblp.org/rec/bib/journals/corr/abs-1801-07791, bibsource = dblp computer science bibliography, https://dblp.org @articleDBLP:journals/corr/YiSGG16, author = Li Yi {and} Hao Su {and} Xingwen Guo {and} Leonidas J. Guibas, title = SyncSpecCNN: Synchronized Spectral CNN for 3D Shape Segmentation, journal = CoRR, volume = abs/1612.00606, year = 2016, url = http://arxiv.org/abs/1612.00606, archivePrefix = arXiv, eprint = 1612.00606, timestamp = Wed, 07 Jun 2017 14:41:52 +0200, biburl = https://dblp.org/rec/bib/journals/corr/YiSGG16, bibsource = dblp computer science bibliography, https://dblp.org @ARTICLE2015arXiv150603767R, author = Rippel, O. {and} Snoek, J. {and} Adams, R. P., title = "Spectral Representations for Convolutional Neural Networks", journal = ArXiv e-prints, archivePrefix = "arXiv", eprint = 1506.03767, primaryClass = "stat.ML", keywords = Statistics - Machine Learning, Computer Science - Learning, year = 2015, month = jun, adsurl = http://adsabs.harvard.edu/abs/2015arXiv150603767R, adsnote = Provided by the SAO/NASA Astrophysics Data System @articleDBLP:journals/corr/abs-1711-06721, author = Carlos Esteves {and} Christine Allen-Blanchette {and} Ameesh Makadia {and} Kostas Daniilidis, title = 3D object classification {and} retrieval with Spherical CNNs, journal = CoRR, volume = abs/1711.06721, year = 2017, url = http://arxiv.org/abs/1711.06721, archivePrefix = arXiv, eprint = 1711.06721, timestamp = Sun, 03 Dec 2017 12:38:15 +0100, biburl = https://dblp.org/rec/bib/journals/corr/abs-1711-06721, bibsource = dblp computer science bibliography, https://dblp.org @inproceedingsDBLP:conf/icra/EngelckeRWTP17, author = Martin Engelcke {and} Dushyant Rao {and} Dominic Zeng Wang {and} Chi Hay Tong {and} Ingmar Posner, title = Vote3Deep: Fast object detection in 3D point clouds using efficient convolutional neural networks, booktitle = 2017 IEEE International Conference on Robotics {and} Automation, ICRA 2017, Singapore, Singapore, May 29 - June 3, 2017, pages = 1355–1361, year = 2017, crossref = DBLP:conf/icra/2017, url = https://doi.org/10.1109/ICRA.2017.7989161, doi = 10.1109/ICRA.2017.7989161, timestamp = Wed, 26 Jul 2017 15:17:30 +0200, biburl = https://dblp.org/rec/bib/conf/icra/EngelckeRWTP17, bibsource = dblp computer science bibliography, https://dblp.org Xu, M. and Zeng, L. and Qiao, Y.},
year = {2018},
note = {\_eprint: 1803.11527},
keywords = {Computer Science - Computer Vision and Pattern Recognition}
}
@article{su_splatnet_2018,
title = {{SPLATNet}: {Sparse} {Lattice} {Networks} for {Point} {Cloud} {Processing}},
volume = {abs/1802.08275},
url = {http://arxiv.org/abs/1802.08275},
journal = {CoRR},
author = {Su, Hang and Jampani, Varun and Sun, Deqing and Maji, Subhransu and Kalogerakis, Evangelos and Yang, Ming-Hsuan and Kautz, Jan},
year = {2018},
note = {\_eprint: 1802.08275}
}
@article{shao_h-cnn_2018,
title = {H-{CNN}: {Spatial} {Hashing} {Based} {CNN} for {3D} {Shape} {Analysis}},
journal = {ArXiv e-prints},
author = {Shao, T. and Yang, Y. and Weng, Y. and Hou, Q. and Zhou, K.},
year = {2018},
note = {\_eprint: 1803.11385},
keywords = {Computer Science - Graphics}
}
@article{cai_pancreas_2018,
title = {Pancreas {Segmentation} in {CT} and {MRI} {Images} via {Domain} {Specific} {Network} {Designing} and {Recurrent} {Neural} {Contextual} {Learning}},
journal = {ArXiv e-prints},
author = {Cai, J. and Lu, L. and Xing, F. and Yang, L.},
year = {2018},
note = {\_eprint: 1803.11303},
keywords = {Computer Science - Computer Vision and Pattern Recognition}
}
@article{qi_pointnet_2016,
title = {{PointNet}: {Deep} {Learning} on {Point} {Sets} for {3D} {Classification} and {Segmentation}},
volume = {abs/1612.00593},
url = {http://arxiv.org/abs/1612.00593},
journal = {CoRR},
author = {Qi, Charles Ruizhongtai and Su, Hao and Mo, Kaichun and Guibas, Leonidas J.},
year = {2016},
note = {\_eprint: 1612.00593}
}
@article{qi_pointnet_2017,
title = {{PointNet}++: {Deep} {Hierarchical} {Feature} {Learning} on {Point} {Sets} in a {Metric} {Space}},
volume = {abs/1706.02413},
url = {http://arxiv.org/abs/1706.02413},
journal = {CoRR},
author = {Qi, Charles Ruizhongtai and Yi, Li and Su, Hao and Guibas, Leonidas J.},
year = {2017},
note = {\_eprint: 1706.02413}
}
@article{li_pointcnn_2018,
title = {{PointCNN}},
volume = {abs/1801.07791},
url = {http://arxiv.org/abs/1801.07791},
journal = {CoRR},
author = {Li, Yangyan and Bu, Rui and Sun, Mingchao and Chen, Baoquan},
year = {2018},
note = {\_eprint: 1801.07791}
}
@article{yi_syncspeccnn_2016,
title = {{SyncSpecCNN}: {Synchronized} {Spectral} {CNN} for {3D} {Shape} {Segmentation}},
volume = {abs/1612.00606},
url = {http://arxiv.org/abs/1612.00606},
journal = {CoRR},
author = {Yi, Li and Su, Hao and Guo, Xingwen and Guibas, Leonidas J.},
year = {2016},
note = {\_eprint: 1612.00606}
}
@article{rippel_spectral_2015,
title = {Spectral {Representations} for {Convolutional} {Neural} {Networks}},
journal = {ArXiv e-prints},
author = {Rippel, O. and Snoek, J. and Adams, R. P.},
year = {2015},
note = {\_eprint: 1506.03767},
keywords = {Computer Science - Learning, Statistics - Machine Learning}
}
@inproceedings{engelcke_vote3deep_2017,
title = {{Vote3Deep}: {Fast} object detection in {3D} point clouds using efficient convolutional neural networks},
url = {https://doi.org/10.1109/ICRA.2017.7989161},
doi = {10.1109/ICRA.2017.7989161},
booktitle = {2017 {IEEE} {International} {Conference} on {Robotics} and {Automation}, {ICRA} 2017, {Singapore}, {Singapore}, {May} 29 - {June} 3, 2017},
author = {Engelcke, Martin and Rao, Dushyant and Wang, Dominic Zeng and Tong, Chi Hay and Posner, Ingmar},
year = {2017},
pages = {1355--1361}
}
@article{shorten_survey_2019,
title = {A survey on {Image} {Data} {Augmentation} for {Deep} {Learning}},
volume = {6},
issn = {2196-1115},
url = {https://doi.org/10.1186/s40537-019-0197-0},
doi = {10.1186/s40537-019-0197-0},
abstract = {Deep convolutional neural networks have performed remarkably well on many Computer Vision tasks. However, these networks are heavily reliant on big data to avoid overfitting. Overfitting refers to the phenomenon when a network learns a function with very high variance such as to perfectly model the training data. Unfortunately, many application domains do not have access to big data, such as medical image analysis. This survey focuses on Data Augmentation, a data-space solution to the problem of limited data. Data Augmentation encompasses a suite of techniques that enhance the size and quality of training datasets such that better Deep Learning models can be built using them. The image augmentation algorithms discussed in this survey include geometric transformations, color space augmentations, kernel filters, mixing images, random erasing, feature space augmentation, adversarial training, generative adversarial networks, neural style transfer, and meta-learning. The application of augmentation methods based on GANs are heavily covered in this survey. In addition to augmentation techniques, this paper will briefly discuss other characteristics of Data Augmentation such as test-time augmentation, resolution impact, final dataset size, and curriculum learning. This survey will present existing methods for Data Augmentation, promising developments, and meta-level decisions for implementing Data Augmentation. Readers will understand how Data Augmentation can improve the performance of their models and expand limited datasets to take advantage of the capabilities of big data.},
number = {1},
journal = {Journal of Big Data},
author = {Shorten, Connor and Khoshgoftaar, Taghi M.},
year = {2019},
pages = {60}
}
@book{chatfield_return_2014,
title = {Return of the {Devil} in the {Details}: {Delving} {Deep} into {Convolutional} {Nets}},
author = {Chatfield, Ken and Simonyan, Karen and Vedaldi, Andrea and Zisserman, Andrew},
year = {2014},
note = {\_eprint: 1405.3531}
}
@inproceedings{jurio_comparison_2010,
address = {Berlin, Heidelberg},
title = {A {Comparison} {Study} of {Different} {Color} {Spaces} in {Clustering} {Based} {Image} {Segmentation}},
isbn = {978-3-642-14058-7},
abstract = {In this work we carry out a comparison study between different color spaces in clustering-based image segmentation. We use two similar clustering algorithms, one based on the entropy and the other on the ignorance. The study involves four color spaces and, in all cases, each pixel is represented by the values of the color channels in that space. Our purpose is to identify the best color representation, if there is any, when using this kind of clustering algorithms.},
booktitle = {Information {Processing} and {Management} of {Uncertainty} in {Knowledge}-{Based} {Systems}. {Applications}},
publisher = {Springer Berlin Heidelberg},
author = {Jurio, Aranzazu and Pagola, Miguel and Galar, Mikel and Lopez-Molina, Carlos and Paternain, Daniel},
editor = {Hüllermeier, Eyke and Kruse, Rudolf and Hoffmann, Frank},
year = {2010},
pages = {532--541}
}
@book{summers_improved_2018,
title = {Improved {Mixed}-{Example} {Data} {Augmentation}},
author = {Summers, Cecilia and Dinneen, Michael J.},
year = {2018},
note = {\_eprint: 1805.11272}
}
@book{zhong_random_2017,
title = {Random {Erasing} {Data} {Augmentation}},
author = {Zhong, Zhun and Zheng, Liang and Kang, Guoliang and Li, Shaozi and Yang, Yi},
year = {2017},
note = {\_eprint: 1708.04896}
}
@article{takahashi_data_2019,
title = {Data {Augmentation} using {Random} {Image} {Cropping} and {Patching} for {Deep} {CNNs}},
issn = {1558-2205},
url = {http://dx.doi.org/10.1109/TCSVT.2019.2935128},
doi = {10.1109/tcsvt.2019.2935128},
journal = {IEEE Transactions on Circuits and Systems for Video Technology},
author = {Takahashi, Ryo and Matsubara, Takashi and Uehara, Kuniaki},
year = {2019},
note = {Publisher: Institute of Electrical and Electronics Engineers (IEEE)},
pages = {1--1}
}
@inproceedings{madani_chest_2018,
title = {Chest x-ray generation and data augmentation for cardiovascular abnormality classification},
volume = {10574},
url = {https://doi.org/10.1117/12.2293971},
doi = {10.1117/12.2293971},
booktitle = {Medical {Imaging} 2018: {Image} {Processing}},
publisher = {SPIE},
author = {Madani, Ali and Moradi, Mehdi and Karargyris, Alexandros and Syeda-Mahmood, Tanveer},
editor = {Angelini, Elsa D. and Landman, Bennett A.},
year = {2018},
note = {Backup Publisher: International Society for Optics and Photonics},
keywords = {Convolutional networks, data augmentation, Generative adversarial networks},
pages = {415 -- 420}
}
@article{goodfellow_challenges_2015,
title = {Challenges in representation learning: {A} report on three machine learning contests},
volume = {64},
issn = {0893-6080},
url = {http://www.sciencedirect.com/science/article/pii/S0893608014002159},
doi = {https://doi.org/10.1016/j.neunet.2014.09.005},
abstract = {The ICML 2013 Workshop on Challenges in Representation Learning11http://deeplearning.net/icml2013-workshop-competition. focused on three challenges: the black box learning challenge, the facial expression recognition challenge, and the multimodal learning challenge. We describe the datasets created for these challenges and summarize the results of the competitions. We provide suggestions for organizers of future challenges and some comments on what kind of knowledge can be gained from machine learning competitions.},
journal = {Neural Networks},
author = {Goodfellow, Ian J. and Erhan, Dumitru and Carrier, Pierre Luc and Courville, Aaron and Mirza, Mehdi and Hamner, Ben and Cukierski, Will and Tang, Yichuan and Thaler, David and Lee, Dong-Hyun and Zhou, Yingbo and Ramaiah, Chetan and Feng, Fangxiang and Li, Ruifan and Wang, Xiaojie and Athanasakis, Dimitris and Shawe-Taylor, John and Milakov, Maxim and Park, John and Ionescu, Radu and Popescu, Marius and Grozea, Cristian and Bergstra, James and Xie, Jingjing and Romaszko, Lukasz and Xu, Bing and Chuang, Zhang and Bengio, Yoshua},
year = {2015},
keywords = {Competition, Dataset, Representation learning},
pages = {59 -- 63}
}
@article{vallet_terramobilitaiqmulus_2015,
title = {{TerraMobilita}/{iQmulus} {Urban} {Point} {Cloud} {Analysis} {Benchmark}},
volume = {49},
journal = {Computers \& Graphics},
author = {Vallet, Bruno and Brédif, Mathieu and Serna, Andrés and Marcotegui, B and Paparoditis, Nicolas},
year = {2015}
}
@article{geiger_vision_2013,
title = {Vision meets {Robotics}: {The} {KITTI} {Dataset}},
journal = {International Journal of Robotics Research (IJRR)},
author = {Geiger, Andreas and Lenz, Philip and Stiller, Christoph and Urtasun, Raquel},
year = {2013}
}
@article{chang_shapenet_2015,
title = {{ShapeNet}: {An} {Information}-{Rich} {3D} {Model} {Repository}},
volume = {abs/1512.03012},
url = {http://arxiv.org/abs/1512.03012},
journal = {CoRR},
author = {Chang, Angel X. and Funkhouser, Thomas A. and Guibas, Leonidas J. and Hanrahan, Pat and Huang, Qi-Xing and Li, Zimo and Savarese, Silvio and Savva, Manolis and Song, Shuran and Su, Hao and Xiao, Jianxiong and Yi, Li and Yu, Fisher},
year = {2015},
note = {\_eprint: 1512.03012}
}
@article{wu_3d_2014-1,
title = {{3D} {ShapeNets}: {A} {Deep} {Representation} for {Volumetric} {Shapes}},
journal = {ArXiv e-prints},
author = {Wu, Z. and Song, S. and Khosla, A. and Yu, F. and Zhang, L. and Tang, X. and Xiao, J.},
year = {2014},
note = {\_eprint: 1406.5670},
keywords = {Computer Science - Computer Vision and Pattern Recognition}
}
@inproceedings{hackel_semantic3dnet_2017,
title = {{SEMANTIC3D}.{NET}: {A} new large-scale point cloud classification benchmark},
volume = {IV-1-W1},
booktitle = {{ISPRS} {Annals} of the {Photogrammetry}, {Remote} {Sensing} and {Spatial} {Information} {Sciences}},
author = {Hackel, Timo and Savinov, N. and Ladicky, L. and Wegner, Jan D. and Schindler, K. and Pollefeys, M.},
year = {2017},
pages = {91--98}
}
@article{armeni_joint_2017,
title = {Joint {2D}-{3D}-{Semantic} {Data} for {Indoor} {Scene} {Understanding}},
volume = {abs/1702.01105},
url = {http://arxiv.org/abs/1702.01105},
journal = {CoRR},
author = {Armeni, Iro and Sax, Sasha and Zamir, Amir Roshan and Savarese, Silvio},
year = {2017},
note = {\_eprint: 1702.01105},
keywords = {Computer Science - Computer Vision and Pattern Recognition, Computer Science - Robotics}
}
@article{kumar_dataset_2017,
title = {A {Dataset} and a {Technique} for {Generalized} {Nuclear} {Segmentation} for {Computational} {Pathology}},
volume = {36},
doi = {10.1109/TMI.2017.2677499},
number = {7},
journal = {IEEE Transactions on Medical Imaging},
author = {Kumar, N. and Verma, R. and Sharma, S. and Bhargava, S. and Vahadane, A. and Sethi, A.},
month = jul,
year = {2017},
keywords = {object recognition, Training, Algorithms, Annotation, biological organs, biological tissues, biomedical optical imaging, boundaries, Cell Nucleus, cellular biophysics, chromatin-sparse, computational pathology, Computer-Assisted, conventional image processing techniques, crowded nuclei, dataset, deep learning, digital microscopic tissue images, disease states, diseases, Diseases, feature extraction, generalized nuclear segmentation, H\&E-stained images, hematoxylin and eosin-stained tissue images, high-quality feature extraction, Humans, image classification, image classification problems, Image color analysis, Image Processing, image segmentation, Image segmentation, learning (artificial intelligence), Machine learning, Machine Learning, machine learning algorithms, machine learning-based segmentation, Measurement, medical image processing, nuclear appearances, nuclear boundaries, nuclear morphometrics, nuclear segmentation, nuclei, object-level errors, optical microscopy, organs, Otsu thresholding, overlapping nuclei, Pathology, pixel-level errors, right out-of-the-box, segmentation technique, Staining and Labeling, watershed segmentation},
pages = {1550--1560}
}
@inproceedings{vahadane_learning_2016,
title = {Learning based super-resolution of histological images},
doi = {10.1109/ISBI.2016.7493391},
booktitle = {2016 {IEEE} 13th {International} {Symposium} on {Biomedical} {Imaging} ({ISBI})},
author = {Vahadane, A. and Kumar, N. and Sethi, A.},
month = apr,
year = {2016},
keywords = {Testing, Training, Artificial neural networks, histological image, Image edge detection, Image reconstruction, Image resolution, Image super-resolution, neural network},
pages = {816--819}
}
@article{setio_validation_2016,
title = {Validation, comparison, and combination of algorithms for automatic detection of pulmonary nodules in computed tomography images: {The} {LUNA16} challenge},
volume = {42},
doi = {10.1016/j.media.2017.06.015},
journal = {Medical Image Analysis},
author = {Setio, Arnaud and Traverso, Alberto and Bel, Thomas and Berens, Moira and Bogaard, Cas and Cerello, Piergiorgio and Chen, Hao and Dou, Qi and Fantacci, Maria and Geurts, Bram and Gugten, Robbert and Heng, Pheng and Jansen, Bart and Kaste, Michael and Kotov, Valentin and Lin, Jack and Manders, Jeroen and Sónora-Mengana, Alexander and Naranjo, Juan Carlos and Papavasileiou, Evgenia},
year = {2016}
}
@article{mueller_alzheimers_2005,
title = {The {Alzheimer}'s {Disease} {Neuroimaging} {Initiative}},
volume = {15},
number = {4},
journal = {Neuroimaging Clinics of North America},
author = {Mueller, Susanne G and Weiner, Michael W and Thal, Leon J and Petersen, Ronald Carl and Jack, Clifford R Jr and Jagust, William J and Trojanowski, John Q and Toga, Arthur W and Beckett, Laurel A},
year = {2005},
pages = {869--877}
}
@book{armato_iii_samuel_g_data_2015,
title = {Data {From} {LIDC}-{IDRI}},
url = {https://wiki.cancerimagingarchive.net/x/rgAe},
publisher = {The Cancer Imaging Archive},
author = {{Armato III, Samuel G.} and McLennan, Geoffrey and Bidaut, Luc and McNitt-Gray, Michael F. and Meyer, Charles R. and Reeves, Anthony P. and Zhao, Binsheng and Aberle, Denise R. and Henschke, Claudia I. and Hoffman, Eric A. and Kazerooni, Ella A. and MacMahon, Heber and Van Beek, Edwin J.R. and Yankelevitz, David and Biancardi, Alberto M. and Bland, Peyton H. and Brown, Matthew S. and Engelmann, Roger M. and Laderach, Gary E. and Max, Daniel and Pais, Richard C. and Qing, David P.Y. and Roberts, Rachael Y. and Smith, Amanda R. and Starkey, Adam and Batra, Poonam and Caligiuri, Philip and Farooqi, Ali and Gladish, Gregory W. and Jude, C. Matilda and Munden, Reginald F. and Petkovska, Iva and Quint, Leslie E. and Schwartz, Lawrence H. and Sundaram, Baskaran and Dodd, Lori E. and Fenimore, Charles and Gur, David and Petrick, Nicholas and Freymann, John and Kirby, Justin and Hughes, Brian and Casteele, Alessi Vande and Gupte, Sangeeta and Sallam, Maha and Heath, Michael D. and Kuhn, Michael H. and Dharaiya, Ekta and Burns, Richard and Fryd, David S. and Salganicoff, Marcos and Anand, Vikram and Shreter, Uri and Vastagh, Stephen and Croft, Barbara Y. and Clarke, Laurence P.},
year = {2015},
doi = {10.7937/K9/TCIA.2015.LO9QL9SX}
}
@article{clark_cancer_2013,
title = {The {Cancer} {Imaging} {Archive} ({TCIA}): {Maintaining} and {Operating} a {Public} {Information} {Repository}},
volume = {26},
issn = {1618-727X},
url = {https://doi.org/10.1007/s10278-013-9622-7},
doi = {10.1007/s10278-013-9622-7},
abstract = {The National Institutes of Health have placed significant emphasis on sharing of research data to support secondary research. Investigators have been encouraged to publish their clinical and imaging data as part of fulfilling their grant obligations. Realizing it was not sufficient to merely ask investigators to publish their collection of imaging and clinical data, the National Cancer Institute (NCI) created the open source National Biomedical Image Archive software package as a mechanism for centralized hosting of cancer related imaging. NCI has contracted with Washington University in Saint Louis to create The Cancer Imaging Archive (TCIA)–an open-source, open-access information resource to support research, development, and educational initiatives utilizing advanced medical imaging of cancer. In its first year of operation, TCIA accumulated 23 collections (3.3 million images). Operating and maintaining a high-availability image archive is a complex challenge involving varied archive-specific resources and driven by the needs of both image submitters and image consumers. Quality archives of any type (traditional library, PubMed, refereed journals) require management and customer service. This paper describes the management tasks and user support model for TCIA.},
number = {6},
journal = {Journal of Digital Imaging},
author = {Clark, Kenneth and Vendt, Bruce and Smith, Kirk and Freymann, John and Kirby, Justin and Koppel, Paul and Moore, Stephen and Phillips, Stanley and Maffitt, David and Pringle, Michael and Tarbox, Lawrence and Prior, Fred},
year = {2013},
pages = {1045--1057}
}
@article{rister_ct_2018,
title = {{CT} organ segmentation using {GPU} data augmentation, unsupervised labels and {IOU} loss},
volume = {abs/1811.11226},
url = {http://arxiv.org/abs/1811.11226},
journal = {CoRR},
author = {Rister, Blaine and Yi, Darvin and Shivakumar, Kaushik and Nobashi, Tomomi and Rubin, Daniel L.},
year = {2018},
note = {\_eprint: 1811.11226}
}
@article{bilic_liver_2019,
title = {The {Liver} {Tumor} {Segmentation} {Benchmark} ({LiTS})},
volume = {abs/1901.04056},
url = {http://arxiv.org/abs/1901.04056},
journal = {CoRR},
author = {Bilic, Patrick and Christ, Patrick Ferdinand and Vorontsov, Eugene and Chlebus, Grzegorz and Chen, Hao and Dou, Qi and Fu, Chi-Wing and Han, Xiao and Heng, Pheng-Ann and Hesser, Jürgen and Kadoury, Samuel and Konopczynski, Tomasz K. and Le, Miao and Li, Chunming and Li, Xiaomeng and Lipková, Jana and Lowengrub, John S. and Meine, Hans and Moltz, Jan Hendrik and Pal, Chris and Piraud, Marie and Qi, Xiaojuan and Qi, Jin and Rempfler, Markus and Roth, Karsten and Schenk, Andrea and Sekuboyina, Anjany and Zhou, Ping and Hülsemeyer, Christian and Beetz, Marcel and Ettlinger, Florian and Grün, Felix and Kaissis, Georgios and Lohöfer, Fabian and Braren, Rickmer and Holch, Julian and Hofmann, Felix and Sommer, Wieland H. and Heinemann, Volker and Jacobs, Colin and Mamani, Gabriel Efrain Humpire and Ginneken, Bram van and Chartrand, Gabriel and Tang, An and Drozdzal, Michal and Ben-Cohen, Avi and Klang, Eyal and Amitai, Michal Marianne and Konen, Eli and Greenspan, Hayit and Moreau, Johan and Hostettler, Alexandre and Soler, Luc and Vivanti, Refael and Szeskin, Adi and Lev-Cohain, Naama and Sosna, Jacob and Joskowicz, Leo and Menze, Bjoern H.},
year = {2019},
note = {\_eprint: 1901.04056}
}
@book{heller_kits19_2019,
title = {The {KiTS19} {Challenge} {Data}: 300 {Kidney} {Tumor} {Cases} with {Clinical} {Context}, {CT} {Semantic} {Segmentations}, and {Surgical} {Outcomes}},
author = {Heller, Nicholas and Sathianathen, Niranjan and Kalapara, Arveen and Walczak, Edward and Moore, Keenan and Kaluzniak, Heather and Rosenberg, Joel and Blake, Paul and Rengel, Zachary and Oestreich, Makinna and Dean, Joshua and Tradewell, Michael and Shah, Aneri and Tejpaul, Resha and Edgerton, Zachary and Peterson, Matthew and Raza, Shaneabbas and Regmi, Subodh and Papanikolopoulos, Nikolaos and Weight, Christopher},
year = {2019},
note = {\_eprint: 1904.00445}
}
@article{rusu_co-registration_2017,
title = {Co-registration of pre-operative {CT} with ex vivo surgically excised ground glass nodules to define spatial extent of invasive adenocarcinoma on in vivo imaging: a proof-of-concept study},
volume = {27},
issn = {1432-1084},
url = {https://doi.org/10.1007/s00330-017-4813-0},
doi = {10.1007/s00330-017-4813-0},
abstract = {To develop an approach for radiology-pathology fusion of ex vivo histology of surgically excised pulmonary nodules with pre-operative CT, to radiologically map spatial extent of the invasive adenocarcinomatous component of the nodule.},
number = {10},
journal = {European Radiology},
author = {Rusu, Mirabela and Rajiah, Prabhakar and Gilkeson, Robert and Yang, Michael and Donatelli, Christopher and Thawani, Rajat and Jacono, Frank J. and Linden, Philip and Madabhushi, Anant},
year = {2017},
pages = {4209--4217}
}
@article{aerts_decoding_2014,
title = {Decoding tumour phenotype by noninvasive imaging using a quantitative radiomics approach},
volume = {5},
issn = {2041-1723},
url = {https://doi.org/10.1038/ncomms5006},
doi = {10.1038/ncomms5006},
abstract = {Human cancers exhibit strong phenotypic differences that can be visualized noninvasively by medical imaging. Radiomics refers to the comprehensive quantification of tumour phenotypes by applying a large number of quantitative image features. Here we present a radiomic analysis of 440 features quantifying tumour image intensity, shape and texture, which are extracted from computed tomography data of 1,019 patients with lung or head-and-neck cancer. We find that a large number of radiomic features have prognostic power in independent data sets of lung and head-and-neck cancer patients, many of which were not identified as significant before. Radiogenomics analysis reveals that a prognostic radiomic signature, capturing intratumour heterogeneity, is associated with underlying gene-expression patterns. These data suggest that radiomics identifies a general prognostic phenotype existing in both lung and head-and-neck cancer. This may have a clinical impact as imaging is routinely used in clinical practice, providing an unprecedented opportunity to improve decision-support in cancer treatment at low cost.},
number = {1},
journal = {Nature Communications},
author = {Aerts, Hugo J. W. L. and Velazquez, Emmanuel Rios and Leijenaar, Ralph T. H. and Parmar, Chintan and Grossmann, Patrick and Carvalho, Sara and Bussink, Johan and Monshouwer, René and Haibe-Kains, Benjamin and Rietveld, Derek and Hoebers, Frank and Rietbergen, Michelle M. and Leemans, C. René and Dekker, Andre and Quackenbush, John and Gillies, Robert J. and Lambin, Philippe},
year = {2014},
pages = {4006}
}
@article{singanamalli_identifying_2016,
title = {Identifying in vivo {DCE} {MRI} markers associated with microvessel architecture and gleason grades of prostate cancer},
volume = {43},
url = {https://onlinelibrary.wiley.com/doi/abs/10.1002/jmri.24975},
doi = {10.1002/jmri.24975},
abstract = {Background To identify computer extracted in vivo dynamic contrast enhanced (DCE) MRI markers associated with quantitative histomorphometric (QH) characteristics of microvessels and Gleason scores (GS) in prostate cancer. Methods This study considered retrospective data from 23 biopsy confirmed prostate cancer patients who underwent 3 Tesla multiparametric MRI before radical prostatectomy (RP). Representative slices from RP specimens were stained with vascular marker CD31. Tumor extent was mapped from RP sections onto DCE MRI using nonlinear registration methods. Seventy-seven microvessel QH features and 18 DCE MRI kinetic features were extracted and evaluated for their ability to distinguish low from intermediate and high GS. The effect of temporal sampling on kinetic features was assessed and correlations between those robust to temporal resolution and microvessel features discriminative of GS were examined. Results A total of 12 microvessel architectural features were discriminative of low and intermediate/high grade tumors with area under the receiver operating characteristic curve (AUC) {\textgreater} 0.7. These features were most highly correlated with mean washout gradient (WG) (max rho = −0.62). Independent analysis revealed WG to be moderately robust to temporal resolution (intraclass correlation coefficient [ICC] = 0.63) and WG variance, which was poorly correlated with microvessel features, to be predictive of low grade tumors (AUC = 0.77). Enhancement ratio was the most robust (ICC = 0.96) and discriminative (AUC = 0.78) kinetic feature but was moderately correlated with microvessel features (max rho = −0.52). Conclusion Computer extracted features of prostate DCE MRI appear to be correlated with microvessel architecture and may be discriminative of low versus intermediate and high GS. J. MAGN. RESON. IMAGING 2016;43:149–158.},
number = {1},
journal = {Journal of Magnetic Resonance Imaging},
author = {Singanamalli, Asha and Rusu, Mirabela and Sparks, Rachel E. and Shih, Natalie N.C. and Ziober, Amy and Wang, Li-Ping and Tomaszewski, John and Rosen, Mark and Feldman, Michael and Madabhushi, Anant},
year = {2016},
note = {\_eprint: https://onlinelibrary.wiley.com/doi/pdf/10.1002/jmri.24975},
keywords = {DCE MRI, Gleason grades, imaging biomarkers, microvessel architecture, prostate cancer, quantitative histomorphometry},
pages = {149--158}
}
@article{kuo_understanding_2016,
title = {Understanding {Convolutional} {Neural} {Networks} with {A} {Mathematical} {Model}},
volume = {abs/1609.04112},
url = {http://arxiv.org/abs/1609.04112},
journal = {CoRR},
author = {Kuo, C.-C. Jay},
year = {2016},
note = {\_eprint: 1609.04112}
}
@article{huang_densely_2016,
title = {Densely {Connected} {Convolutional} {Networks}},
volume = {abs/1608.06993},
url = {http://arxiv.org/abs/1608.06993},
journal = {CoRR},
author = {Huang, Gao and Liu, Zhuang and Weinberger, Kilian Q.},
year = {2016},
note = {\_eprint: 1608.06993}
}
@article{mou_tbcnn_2014,
title = {{TBCNN}: {A} {Tree}-{Based} {Convolutional} {Neural} {Network} for {Programming} {Language} {Processing}},
volume = {abs/1409.5718},
url = {http://arxiv.org/abs/1409.5718},
journal = {CoRR},
author = {Mou, Lili and Li, Ge and Jin, Zhi and Zhang, Lu and Wang, Tao},
year = {2014},
note = {\_eprint: 1409.5718}
}
@incollection{krizhevsky_imagenet_2012,
title = {{ImageNet} {Classification} with {Deep} {Convolutional} {Neural} {Networks}},
url = {http://papers.nips.cc/paper/4824-imagenet-classification-with-deep-convolutional-neural-networks.pdf},
booktitle = {Advances in {Neural} {Information} {Processing} {Systems} 25},
publisher = {Curran Associates, Inc.},
author = {Krizhevsky, Alex and Sutskever, Ilya and Hinton, Geoffrey E},
editor = {Pereira, F. and Burges, C. J. C. and Bottou, L. and Weinberger, K. Q.},
year = {2012},
pages = {1097--1105}
}
@article{bronstein_geometric_2016,
title = {Geometric deep learning: going beyond {Euclidean} data},
volume = {abs/1611.08097},
url = {http://arxiv.org/abs/1611.08097},
journal = {CoRR},
author = {Bronstein, Michael M. and Bruna, Joan and LeCun, Yann and Szlam, Arthur and Vandergheynst, Pierre},
year = {2016},
note = {\_eprint: 1611.08097}
}
@article{lecun_gradient-based_1998,
title = {Gradient-based learning applied to document recognition},
volume = {86},
number = {11},
journal = {Proceedings of the IEEE},
author = {Lecun, Yann and Bottou, Leon and Bengio, Yoshua and Haffner, Patrick},
year = {1998},
pages = {2278--2324}
}
@book{goodfellow_deep_2016,
title = {Deep {Learning}},
publisher = {MIT Press},
author = {Goodfellow, Ian and Bengio, Yoshua and Courville, Aaron},
year = {2016}
}
@incollection{lecun_handbook_1998,
address = {Cambridge, MA, USA},
title = {The {Handbook} of {Brain} {Theory} and {Neural} {Networks}},
isbn = {0-262-51102-9},
url = {http://dl.acm.org/citation.cfm?id=303568.303704},
publisher = {MIT Press},
author = {LeCun, Yann and Bengio, Yoshua},
editor = {Arbib, Michael A.},
year = {1998},
note = {Section: Convolutional Networks for Images, Speech, and Time Series},
pages = {255--258}
}
@book{szegedy_inception-v4_2016,
title = {Inception-v4, {Inception}-{ResNet} and the {Impact} of {Residual} {Connections} on {Learning}},
author = {Szegedy, Christian and Ioffe, Sergey and Vanhoucke, Vincent and Alemi, Alex},
year = {2016},
note = {\_eprint: 1602.07261}
}
@book{ronneberger_u-net_2015,
title = {U-{Net}: {Convolutional} {Networks} for {Biomedical} {Image} {Segmentation}},
author = {Ronneberger, Olaf and Fischer, Philipp and Brox, Thomas},
year = {2015},
note = {\_eprint: 1505.04597}
}
@article{kipf_semi-supervised_2016,
title = {Semi-{Supervised} {Classification} with {Graph} {Convolutional} {Networks}},
volume = {abs/1609.02907},
url = {http://arxiv.org/abs/1609.02907},
journal = {CoRR},
author = {Kipf, Thomas N. and Welling, Max},
year = {2016},
note = {\_eprint: 1609.02907}
}
@article{simonovsky_dynamic_2017,
title = {Dynamic {Edge}-{Conditioned} {Filters} in {Convolutional} {Neural} {Networks} on {Graphs}},
volume = {abs/1704.02901},
url = {http://arxiv.org/abs/1704.02901},
journal = {CoRR},
author = {Simonovsky, Martin and Komodakis, Nikos},
year = {2017},
note = {\_eprint: 1704.02901}
}
@article{wang_dynamic_2018,
title = {Dynamic {Graph} {CNN} for {Learning} on {Point} {Clouds}},
volume = {abs/1801.07829},
url = {http://arxiv.org/abs/1801.07829},
journal = {CoRR},
author = {Wang, Yue and Sun, Yongbin and Liu, Ziwei and Sarma, Sanjay E. and Bronstein, Michael M. and Solomon, Justin M.},
year = {2018},
note = {\_eprint: 1801.07829}
}
@book{sugiyama_graphic_2013,
title = {Graphic {Machine} {Learning}},
publisher = {Posts Telecom Press and Kodansha LTD.},
author = {Sugiyama, Masashi},
translator = {X, Yongwei},
year = {2013}
}
@book{flach_machine_2012,
title = {Machine {Learning}: {The} {Art} and {Science} of {Algorithms} that {Make} {Sense} of {Data}(first edition)},
publisher = {Posts Telecom Press and Cambridge University Press},
author = {Flach, Peter},
translator = {Duan, Fei},
year = {2012}
}
@phdthesis{hsu_practical_2016,