-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathrefs.bib
4227 lines (3721 loc) · 167 KB
/
refs.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
% SSL methods
% Context Encoder, CPC, SimCLR, MoCo, BYOL, SimSiam, VICReg, Barlow Twins
% Venue abbreviations; entries reference these unquoted (e.g. booktitle = CVPR).
@string{ICCV    = {ICCV}}
@string{CVPR    = {CVPR}}
@string{NIPS    = {NeurIPS}}
@string{WACV    = {WACV}}
@string{ECCV    = {ECCV}}
@string{ICML    = {ICML}}
@string{ICLR    = {ICLR}}
@string{ICASSP  = {ICASSP}}
@string{AISTATS = {AISTATS}}
@string{IJCV    = {IJCV}}
@string{CIVR    = {CIVR}}
@article{chen2020unsupervised,
  author  = {Chen, Weijie and Pu, Shiliang and Xie, Di and Yang, Shicai and Guo, Yilu and Lin, Luojun},
  title   = {Unsupervised Image Classification for Deep Representation Learning},
  journal = {arXiv preprint arXiv:2006.11480},
  year    = {2020},
}
% Title quotes are TeX ``...'' pairs; a bare double-quote character typesets as a closing quote on both sides.
@article{bromley1993signature,
  author  = {Bromley, Jane and Guyon, Isabelle and LeCun, Yann and S{\"a}ckinger, Eduard and Shah, Roopak},
  title   = {Signature verification using a ``{Siamese}'' time delay neural network},
  journal = {Advances in neural information processing systems},
  volume  = {6},
  year    = {1993},
}
% Braces keep the capitalisation of the method name under sentence-casing styles.
@article{shen2021s2,
  author  = {Shen, Zhiqiang and Liu, Zechun and Qin, Jie and Huang, Lei and Cheng, Kwang-Ting and Savvides, Marios},
  title   = {{S2-BNN}: Bridging the Gap Between Self-Supervised Real and 1-bit Neural Networks via Guided Distribution Calibration},
  journal = {arXiv preprint arXiv:2102.08946},
  year    = {2021},
}
@inproceedings{gidaris2020learning,
  author    = {Gidaris, Spyros and Bursuc, Andrei and Komodakis, Nikos and P{\'e}rez, Patrick and Cord, Matthieu},
  title     = {Learning representations by predicting bags of visual words},
  booktitle = CVPR,
  year      = {2020},
}
% Conference paper: the venue goes in booktitle of an inproceedings entry, as for the other ICLR references.
% Authors are in the unambiguous "Last, First" form with spaced initials.
@inproceedings{junnan2021prototypical,
  author    = {Li, Junnan and Zhou, Pan and Xiong, Caiming and Hoi, Steven C. H.},
  title     = {Prototypical Contrastive Learning of Unsupervised Representations},
  booktitle = ICLR,
  year      = {2021},
}
@inproceedings{noroozi2018boosting,
  author    = {Noroozi, Mehdi and Vinjimoor, Ananth and Favaro, Paolo and Pirsiavash, Hamed},
  title     = {Boosting self-supervised learning via knowledge transfer},
  booktitle = CVPR,
  year      = {2018},
}
% The venue must be in booktitle for this entry type; a journal field is ignored and the venue would be lost.
% Braces keep the acronym capitalised under sentence-casing styles.
@inproceedings{fang2021seed,
  author    = {Fang, Zhiyuan and Wang, Jianfeng and Wang, Lijuan and Zhang, Lei and Yang, Yezhou and Liu, Zicheng},
  title     = {{SEED}: Self-supervised Distillation For Visual Representation},
  booktitle = ICLR,
  year      = {2021},
}
@article{xu2021seed,
  author  = {Xu, Haohang and Zhang, Xiaopeng and Li, Hao and Xie, Lingxi and Xiong, Hongkai and Tian, Qi},
  title   = {Seed the Views: Hierarchical Semantic Alignment for Contrastive Representation Learning},
  journal = {arXiv preprint arXiv:2012.02733},
  year    = {2021},
}
% Journal uses the same abbreviated spelling (TPAMI) as the other TPAMI reference in this file.
% Braces keep the acronym capitalised under sentence-casing styles.
@article{radenovic2018fine,
  author  = {Radenovi{\'c}, Filip and Tolias, Giorgos and Chum, Ond{\v{r}}ej},
  title   = {Fine-tuning {CNN} image retrieval with no human annotation},
  journal = {TPAMI},
  year    = {2018},
}
@article{gidaris2020obow,
  author  = {Gidaris, Spyros and Bursuc, Andrei and Puy, Gilles and Komodakis, Nikos and Cord, Matthieu and P{\'e}rez, Patrick},
  title   = {Online Bag-of-Visual-Words Generation for Unsupervised Representation Learning},
  journal = {arXiv preprint arXiv:2012.11552},
  year    = {2020},
}
% Every author is in "Last, First" form; without the comma a name is parsed as First=Vedaldi, Last=Andrea.
% Only the method name is brace-protected, not the whole title.
@article{berman2019multigrain,
  author  = {Berman, Maxim and J{\'e}gou, Herv{\'e} and Vedaldi, Andrea and Kokkinos, Iasonas and Douze, Matthijs},
  title   = {{MultiGrain}: a unified image embedding for classes and instances},
  journal = {arXiv preprint arXiv:1902.05509},
  year    = {2019},
}
% Braces keep the dataset name capitalised under sentence-casing styles.
@article{thomee2015yfcc100m,
  author  = {Thomee, Bart and Shamma, David A and Friedland, Gerald and Elizalde, Benjamin and Ni, Karl and Poland, Douglas and Borth, Damian and Li, Li-Jia},
  title   = {{YFCC100M}: The new data in multimedia research},
  journal = {arXiv preprint arXiv:1503.01817},
  year    = {2015},
}
@inproceedings{douze2009evaluation,
  author    = {Douze, Matthijs and J{\'e}gou, Herv{\'e} and Sandhawalia, Harsimrat and Amsaleg, Laurent and Schmid, Cordelia},
  title     = {Evaluation of gist descriptors for web-scale image search},
  booktitle = CIVR,
  year      = {2009},
}
@article{sariyildiz2020concept,
  author  = {Sariyildiz, Mert Bulent and Kalantidis, Yannis and Larlus, Diane and Alahari, Karteek},
  title   = {Concept generalization in visual representation learning},
  journal = {arXiv preprint arXiv:2012.05649},
  year    = {2020},
}
% Braces keep the acronym capitalised under sentence-casing styles.
@article{tolias2015particular,
  author  = {Tolias, Giorgos and Sicre, Ronan and J{\'e}gou, Herv{\'e}},
  title   = {Particular object retrieval with integral max-pooling of {CNN} activations},
  journal = {arXiv preprint arXiv:1511.05879},
  year    = {2015},
}
@inproceedings{revaud2019learning,
  author    = {Revaud, Jerome and Almaz{\'a}n, Jon and Rezende, Rafael S and Souza, Cesar Roberto de},
  title     = {Learning with average precision: Training image retrieval with a listwise loss},
  booktitle = ICCV,
  year      = {2019},
}
% Conference paper: an article entry ignores booktitle, so the venue would be dropped from the output.
% The dataset name is brace-protected and the title/subtitle separator is a TeX en-dash.
@inproceedings{weyand2020google,
  author    = {Weyand, Tobias and Araujo, Andre and Cao, Bingyi and Sim, Jack},
  title     = {{Google Landmarks Dataset v2} -- A large-scale benchmark for instance-level recognition and retrieval},
  booktitle = CVPR,
  year      = {2020},
}
@inproceedings{philbin2008lost,
  author    = {Philbin, James and Chum, Ondrej and Isard, Michael and Sivic, Josef and Zisserman, Andrew},
  title     = {Lost in quantization: Improving particular object retrieval in large scale image databases},
  booktitle = CVPR,
  year      = {2008},
}
% Conference paper: an article entry ignores booktitle, so the venue would be dropped from the output.
% Place names are brace-protected so sentence-casing styles keep their capitals.
@inproceedings{radenovic2018revisiting,
  author    = {Radenovi{\'c}, Filip and Iscen, Ahmet and Tolias, Giorgos and Avrithis, Yannis and Chum, Ond{\v{r}}ej},
  title     = {Revisiting {Oxford} and {Paris}: Large-scale image retrieval benchmarking},
  booktitle = CVPR,
  year      = {2018},
}
% Conference paper: an article entry ignores booktitle, so the venue would be dropped from the output.
@inproceedings{pinheiro2020unsupervised,
  author    = {Pinheiro, Pedro O and Almahairi, Amjad and Benmaleck, Ryan Y and Golemo, Florian and Courville, Aaron},
  title     = {Unsupervised Learning of Dense Visual Representations},
  booktitle = NIPS,
  year      = {2020},
}
% Conference paper: an article entry ignores booktitle, so the venue would be dropped from the output.
@inproceedings{jabri2020space,
  author    = {Jabri, Allan and Owens, Andrew and Efros, Alexei A},
  title     = {Space-time correspondence as a contrastive random walk},
  booktitle = NIPS,
  year      = {2020},
}
@article{polyak1992acceleration,
  author    = {Polyak, Boris T and Juditsky, Anatoli B},
  title     = {Acceleration of stochastic approximation by averaging},
  journal   = {SIAM journal on control and optimization},
  volume    = {30},
  number    = {4},
  pages     = {838--855},
  publisher = {SIAM},
  year      = {1992},
}
@inproceedings{asano2019self,
  author    = {Asano, Yuki Markus and Rupprecht, Christian and Vedaldi, Andrea},
  title     = {Self-labelling via simultaneous clustering and representation learning},
  booktitle = ICLR,
  year      = {2020},
}
@inproceedings{caron2018deep,
  author    = {Caron, Mathilde and Bojanowski, Piotr and Joulin, Armand and Douze, Matthijs},
  title     = {Deep clustering for unsupervised learning of visual features},
  booktitle = ECCV,
  year      = {2018},
}
% Venue uses the shared ICCV macro so it is spelled the same as in the other ICCV references.
@inproceedings{wang2015unsupervised,
  author    = {Wang, Xiaolong and Gupta, Abhinav},
  title     = {Unsupervised learning of visual representations using videos},
  booktitle = ICCV,
  pages     = {2794--2802},
  year      = {2015},
}
@inproceedings{wu2018unsupervised,
  author    = {Wu, Zhirong and Xiong, Yuanjun and Yu, Stella X and Lin, Dahua},
  title     = {Unsupervised feature learning via non-parametric instance discrimination},
  booktitle = CVPR,
  year      = {2018},
}
@inproceedings{caron2019unsupervised,
  author    = {Caron, Mathilde and Bojanowski, Piotr and Mairal, Julien and Joulin, Armand},
  title     = {Unsupervised pre-training of image features on non-curated data},
  booktitle = ICCV,
  year      = {2019},
}
% Braces keep the company and dataset names capitalised under sentence-casing styles.
@inproceedings{lin2014microsoft,
  author    = {Lin, Tsung-Yi and Maire, Michael and Belongie, Serge and Hays, James and Perona, Pietro and Ramanan, Deva and Doll{\'a}r, Piotr and Zitnick, C Lawrence},
  title     = {{Microsoft} {COCO}: Common objects in context},
  booktitle = ECCV,
  year      = {2014},
}
% Braces keep the model name capitalised under sentence-casing styles.
@inproceedings{he2017mask,
  author    = {He, Kaiming and Gkioxari, Georgia and Doll{\'a}r, Piotr and Girshick, Ross},
  title     = {Mask {R-CNN}},
  booktitle = ICCV,
  year      = {2017},
}
@article{you2017large,
  author  = {Yang You and Igor Gitman and Boris Ginsburg},
  title   = {Large Batch Training of Convolutional Networks},
  journal = {preprint arXiv:1708.03888},
  year    = {2017},
}
% Braces keep the toolbox and language names capitalised under sentence-casing styles.
@article{mairal2019cyanure,
  author  = {Julien Mairal},
  title   = {{Cyanure}: An Open-Source Toolbox for Empirical Risk Minimization for {Python}, {C++}, and soon more},
  journal = {preprint arXiv:1912.08165},
  year    = {2019},
}
@inproceedings{touvron2019fixing,
  author    = {Touvron, Hugo and Vedaldi, Andrea and Douze, Matthijs and J{\'e}gou, Herv{\'e}},
  title     = {Fixing the train-test resolution discrepancy},
  booktitle = NIPS,
  year      = {2019},
}
@inproceedings{he2020momentum,
  author    = {He, Kaiming and Fan, Haoqi and Wu, Yuxin and Xie, Saining and Girshick, Ross},
  title     = {Momentum contrast for unsupervised visual representation learning},
  booktitle = CVPR,
  year      = {2020},
}
% The particle "van der" belongs to the surname ("von Last, First" form), as in the other van der Maaten reference.
@inproceedings{misra2020self,
  author    = {Misra, Ishan and van der Maaten, Laurens},
  title     = {Self-supervised learning of pretext-invariant representations},
  booktitle = CVPR,
  year      = {2020},
}
@inproceedings{miech2020end,
  author    = {Miech, Antoine and Alayrac, Jean-Baptiste and Smaira, Lucas and Laptev, Ivan and Sivic, Josef and Zisserman, Andrew},
  title     = {End-to-end learning of visual representations from uncurated instructional videos},
  booktitle = CVPR,
  year      = {2020},
}
% Braces keep the method name capitalised under sentence-casing styles.
@inproceedings{yan2020clusterfit,
  author    = {Yan, Xueting and Misra, Ishan and Gupta, Abhinav and Ghadiyaram, Deepti and Mahajan, Dhruv},
  title     = {{ClusterFit}: Improving Generalization of Visual Representations},
  booktitle = CVPR,
  year      = {2020},
}
@inproceedings{mahajan2018exploring,
  author    = {Mahajan, Dhruv and Girshick, Ross and Ramanathan, Vignesh and He, Kaiming and Paluri, Manohar and Li, Yixuan and Bharambe, Ashwin and van der Maaten, Laurens},
  title     = {Exploring the limits of weakly supervised pretraining},
  booktitle = ECCV,
  year      = {2018},
}
% Lowercase "van der" is parsed as the name particle and matches the other van der Maaten reference in this file.
@inproceedings{joulin2016learning,
  author    = {Joulin, Armand and van der Maaten, Laurens and Jabri, Allan and Vasilache, Nicolas},
  title     = {Learning visual features from large weakly supervised data},
  booktitle = ECCV,
  year      = {2016},
}
@article{chen2020simple,
  author  = {Chen, Ting and Kornblith, Simon and Norouzi, Mohammad and Hinton, Geoffrey},
  title   = {A simple framework for contrastive learning of visual representations},
  journal = {preprint arXiv:2002.05709},
  year    = {2020},
}
% All accented letters use LaTeX escapes (e.g. R{\'e}mi), matching the rest of the file and staying safe for 8-bit BibTeX.
@inproceedings{grill2020bootstrap,
  author    = {Grill, Jean-Bastien and Strub, Florian and Altch{\'e}, Florent and Tallec, Corentin and Richemond, Pierre H and Buchatskaya, Elena and Doersch, Carl and Pires, Bernardo Avila and Guo, Zhaohan Daniel and Azar, Mohammad Gheshlaghi and Piot, Bilal and Kavukcuoglu, Koray and Munos, R{\'e}mi and Valko, Michal},
  title     = {Bootstrap your own latent: A new approach to self-supervised learning},
  booktitle = NIPS,
  year      = {2020},
}
@inproceedings{caron2020unsupervised,
  author    = {Caron, Mathilde and Misra, Ishan and Mairal, Julien and Goyal, Priya and Bojanowski, Piotr and Joulin, Armand},
  title     = {Unsupervised learning of visual features by contrasting cluster assignments},
  booktitle = NIPS,
  year      = {2020},
}
@inproceedings{oyallon2017scaling,
  author    = {Oyallon, Edouard and Belilovsky, Eugene and Zagoruyko, Sergey},
  title     = {Scaling the scattering transform: Deep hybrid networks},
  booktitle = ICCV,
  year      = {2017},
}
@inproceedings{bojanowski2017unsupervised,
  author    = {Bojanowski, Piotr and Joulin, Armand},
  title     = {Unsupervised learning by predicting Noise},
  booktitle = ICML,
  year      = {2017},
}
% journal and year are required for an article entry; the year matches the citation key.
% NOTE(review): venue is the commonly cited form for this report -- confirm.
@article{radford2019language,
  author  = {Radford, Alec and Wu, Jeffrey and Child, Rewon and Luan, David and Amodei, Dario and Sutskever, Ilya},
  title   = {Language models are unsupervised multitask learners},
  journal = {OpenAI Blog},
  year    = {2019},
}
% Braces keep the model acronym capitalised under sentence-casing styles.
@article{devlin2018bert,
  author  = {Devlin, Jacob and Chang, Ming-Wei and Lee, Kenton and Toutanova, Kristina},
  title   = {{BERT}: Pre-training of deep bidirectional transformers for language understanding},
  journal = {preprint arXiv:1810.04805},
  year    = {2018},
}
@article{schneider2019wav2vec,
  author  = {Schneider, Steffen and Baevski, Alexei and Collobert, Ronan and Auli, Michael},
  title   = {wav2vec: Unsupervised pre-training for speech recognition},
  journal = {preprint arXiv:1904.05862},
  year    = {2019},
}
@inproceedings{riviere2020unsupervised,
  author    = {Rivi{\`e}re, Morgane and Joulin, Armand and Mazar{\'e}, Pierre-Emmanuel and Dupoux, Emmanuel},
  title     = {Unsupervised pretraining transfers well across languages},
  booktitle = ICASSP,
  year      = {2020},
}
@inproceedings{baevski2020wav2vec,
  author    = {Baevski, Alexei and Zhou, Henry and Mohamed, Abdelrahman and Auli, Michael},
  title     = {wav2vec 2.0: A framework for self-supervised learning of speech representations},
  booktitle = NIPS,
  year      = {2020},
}
% Braces keep the benchmark name and the ASR acronym capitalised under sentence-casing styles.
@inproceedings{kahn2020libri,
  author    = {Kahn, Jacob and Rivi{\`e}re, Morgane and Zheng, Weiyi and Kharitonov, Evgeny and Xu, Qiantong and Mazar{\'e}, Pierre-Emmanuel and Karadayi, Julien and Liptchinsky, Vitaliy and Collobert, Ronan and Fuegen, Christian and others},
  title     = {{Libri-Light}: A benchmark for {ASR} with limited or no supervision},
  booktitle = ICASSP,
  year      = {2020},
}
% Venue uses the shared CVPR macro so it is spelled the same as in the other CVPR references.
@inproceedings{pathak2017learning,
  author    = {Pathak, Deepak and Girshick, Ross and Doll{\'a}r, Piotr and Darrell, Trevor and Hariharan, Bharath},
  title     = {Learning features by watching objects move},
  booktitle = CVPR,
  pages     = {2701--2710},
  year      = {2017},
}
% Venue uses the shared ECCV macro so it is spelled the same as in the other ECCV references.
% Springer is recorded as publisher; organization is meant for the sponsoring body.
@inproceedings{noroozi2016unsupervised,
  author    = {Noroozi, Mehdi and Favaro, Paolo},
  title     = {Unsupervised learning of visual representations by solving jigsaw puzzles},
  booktitle = ECCV,
  pages     = {69--84},
  publisher = {Springer},
  year      = {2016},
}
@article{he2021masked,
  author  = {He, Kaiming and Chen, Xinlei and Xie, Saining and Li, Yanghao and Doll{\'a}r, Piotr and Girshick, Ross},
  title   = {Masked autoencoders are scalable vision learners},
  journal = {arXiv preprint arXiv:2111.06377},
  year    = {2021},
}
@article{brown2020language,
  author  = {Brown, Tom B and Mann, Benjamin and Ryder, Nick and Subbiah, Melanie and Kaplan, Jared and Dhariwal, Prafulla and Neelakantan, Arvind and Shyam, Pranav and Sastry, Girish and Askell, Amanda and others},
  title   = {Language models are few-shot learners},
  journal = {preprint arXiv:2005.14165},
  year    = {2020},
}
@article{raffel2019exploring,
  author  = {Raffel, Colin and Shazeer, Noam and Roberts, Adam and Lee, Katherine and Narang, Sharan and Matena, Michael and Zhou, Yanqi and Li, Wei and Liu, Peter J},
  title   = {Exploring the limits of transfer learning with a unified text-to-text transformer},
  journal = {preprint arXiv:1910.10683},
  year    = {2019},
}
% "van den" is the surname particle ("von Last, First" form); initials are separated so styles can abbreviate them.
% NOTE(review): given names of Eslami are written as initials plus "Ali" -- confirm against the paper.
@article{henaff2019data,
  author  = {H{\'e}naff, Olivier J and Srinivas, Aravind and De Fauw, Jeffrey and Razavi, Ali and Doersch, Carl and Eslami, S. M. Ali and van den Oord, Aaron},
  title   = {Data-efficient image recognition with contrastive predictive coding},
  journal = {preprint arXiv:1905.09272},
  year    = {2019},
}
% Braces keep the mixed-case abbreviation intact under sentence-casing styles.
@inproceedings{kolesnikov2019big,
  author    = {Kolesnikov, Alexander and Beyer, Lucas and Zhai, Xiaohua and Puigcerver, Joan and Yung, Jessica and Gelly, Sylvain and Houlsby, Neil},
  title     = {Big transfer ({BiT}): General visual representation learning},
  booktitle = ECCV,
  year      = {2020},
}
@inproceedings{kolesnikov2019revisiting,
  author    = {Kolesnikov, Alexander and Zhai, Xiaohua and Beyer, Lucas},
  title     = {Revisiting self-supervised visual representation learning},
  booktitle = CVPR,
  year      = {2019},
}
@inproceedings{he2016deep,
  author    = {He, Kaiming and Zhang, Xiangyu and Ren, Shaoqing and Sun, Jian},
  title     = {Deep residual learning for image recognition},
  booktitle = CVPR,
  year      = {2016},
}
% Braces keep the model name in its mixed-case spelling under sentence-casing styles.
@article{tan2019efficientnet,
  author  = {Tan, Mingxing and Le, Quoc V},
  title   = {{EfficientNet}: Rethinking model scaling for convolutional neural networks},
  journal = {preprint arXiv:1905.11946},
  year    = {2019},
}
% Braces keep the model name in its mixed-case spelling under sentence-casing styles.
@article{touvron2020fixing,
  author  = {Touvron, Hugo and Vedaldi, Andrea and Douze, Matthijs and J{\'e}gou, Herv{\'e}},
  title   = {Fixing the train-test resolution discrepancy: {FixEfficientNet}},
  journal = {preprint arXiv:2003.08237},
  year    = {2020},
}
@inproceedings{xie2017aggregated,
  author    = {Xie, Saining and Girshick, Ross and Doll{\'a}r, Piotr and Tu, Zhuowen and He, Kaiming},
  title     = {Aggregated residual transformations for deep neural networks},
  booktitle = CVPR,
  year      = {2017},
}
@inproceedings{xie2016unsupervised,
  author    = {Xie, Junyuan and Girshick, Ross and Farhadi, Ali},
  title     = {Unsupervised deep embedding for clustering analysis},
  booktitle = ICML,
  year      = {2016},
}
@inproceedings{yang2016joint,
  author    = {Yang, Jianwei and Parikh, Devi and Batra, Dhruv},
  title     = {Joint unsupervised learning of deep representations and image clusters},
  booktitle = CVPR,
  year      = {2016},
}
@inproceedings{doersch2015unsupervised,
  author    = {Doersch, Carl and Gupta, Abhinav and Efros, Alexei A},
  title     = {Unsupervised visual representation learning by context prediction},
  booktitle = ICCV,
  year      = {2015},
}
@inproceedings{vincent2008extracting,
  title     = {Extracting and composing robust features with denoising autoencoders},
  author    = {P. Vincent and H. Larochelle and Y. Bengio and P.-A. Manzagol},
  year      = {2008},
  booktitle = ICML,
}
% The apostrophe in the first author's name is plain ASCII; a typographic quote is non-ASCII and unsafe for 8-bit BibTeX.
% Authors are in the unambiguous "Last, First" form.
@inproceedings{ranzato2007unsupervised,
  author    = {Ranzato, Marc'Aurelio and Huang, Fu-Jie and Boureau, Y-Lan and LeCun, Yann},
  title     = {Unsupervised Learning of Invariant Feature Hierarchies with Applications to Object Recognition},
  booktitle = CVPR,
  year      = {2007},
}
@inproceedings{hadsell2006dimensionality,
  author    = {Hadsell, Raia and Chopra, Sumit and LeCun, Yann},
  title     = {Dimensionality reduction by learning an invariant mapping},
  booktitle = CVPR,
  year      = {2006},
}
% pages holds the full range rather than only the first page -- NOTE(review): confirm the end page against the journal.
@article{olshausen1996,
  author  = {B. A. Olshausen and D. J. Field},
  title   = {Emergence of simple-cell receptive field properties by learning a sparse code for natural images},
  journal = {Nature},
  volume  = {381},
  number  = {6583},
  pages   = {607--609},
  year    = {1996},
}
@inproceedings{coates2011analysis,
  author    = {Coates, Adam and Ng, Andrew and Lee, Honglak},
  title     = {An analysis of single-layer networks in unsupervised feature learning},
  booktitle = AISTATS,
  year      = {2011},
}
@article{li2020prototypical,
  author  = {Li, Junnan and Zhou, Pan and Xiong, Caiming and Socher, Richard and Hoi, Steven CH},
  title   = {Prototypical Contrastive Learning of Unsupervised Representations},
  journal = {preprint arXiv:2005.04966},
  year    = {2020},
}
@article{dosovitskiy2016discriminative,
  author  = {Dosovitskiy, Alexey and Fischer, Philipp and Springenberg, Jost Tobias and Riedmiller, Martin and Brox, Thomas},
  title   = {Discriminative unsupervised feature learning with exemplar convolutional neural networks},
  journal = {TPAMI},
  year    = {2016},
}
% "van den" is the surname particle, so the first author is written in "von Last, First" form.
@article{oord2018representation,
  author  = {van den Oord, Aaron and Li, Yazhe and Vinyals, Oriol},
  title   = {Representation learning with contrastive predictive coding},
  journal = {preprint arXiv:1807.03748},
  year    = {2018},
}
% Braces keep the SGD acronym and the dataset name capitalised under sentence-casing styles.
@article{goyal2017accurate,
  author  = {Goyal, Priya and Doll{\'a}r, Piotr and Girshick, Ross and Noordhuis, Pieter and Wesolowski, Lukasz and Kyrola, Aapo and Tulloch, Andrew and Jia, Yangqing and He, Kaiming},
  title   = {Accurate, large minibatch {SGD}: Training {ImageNet} in 1 hour},
  journal = {preprint arXiv:1706.02677},
  year    = {2017},
}
% Braces keep the dataset name capitalised under sentence-casing styles; the author list has no trailing whitespace.
@article{russakovsky2015imagenet,
  author  = {Russakovsky, Olga and Deng, Jia and Su, Hao and Krause, Jonathan and Satheesh, Sanjeev and Ma, Sean and Huang, Zhiheng and Karpathy, Andrej and Khosla, Aditya and Bernstein, Michael and Berg, Alexander C and Fei-Fei, Li},
  title   = {{ImageNet} large scale visual recognition challenge},
  journal = IJCV,
  year    = {2015},
}
@inproceedings{goyal2019scaling,
  author    = {Goyal, Priya and Mahajan, Dhruv and Gupta, Abhinav and Misra, Ishan},
  title     = {Scaling and benchmarking self-supervised visual representation learning},
  booktitle = ICCV,
  year      = {2019},
}
% Braces keep the mixed-case method name intact under sentence-casing styles.
@article{rajbhandari2019zero,
  author  = {Rajbhandari, Samyam and Rasley, Jeff and Ruwase, Olatunji and He, Yuxiong},
  title   = {{ZeRO}: Memory Optimizations Toward Training Trillion Parameter Models},
  journal = {preprint arXiv:1910.02054},
  year    = {2019},
}
@article{chen2016grad,
  title   = {Training Deep Nets with Sublinear Memory Cost},
  author  = {Tianqi Chen and Bing Xu and Chiyuan Zhang and Carlos Guestrin},
  year    = {2016},
  journal = {preprint arXiv:1604.06174},
}
% Braces keep the method name in its mixed-case spelling under sentence-casing styles.
@inproceedings{sohn2020fixmatch,
  author    = {Sohn, Kihyuk and Berthelot, David and Li, Chun-Liang and Zhang, Zizhao and Carlini, Nicholas and Cubuk, Ekin D and Kurakin, Alex and Zhang, Han and Raffel, Colin},
  title     = {{FixMatch}: Simplifying semi-supervised learning with consistency and confidence},
  booktitle = NIPS,
  year      = {2020},
}
@inproceedings{chen2020big,
  author    = {Chen, Ting and Kornblith, Simon and Swersky, Kevin and Norouzi, Mohammad and Hinton, Geoffrey},
  title     = {Big self-supervised models are strong semi-supervised learners},
  booktitle = NIPS,
  year      = {2020},
}
@article{xu2020self,
  author  = {Xu, Qiantong and Baevski, Alexei and Likhomanenko, Tatiana and Tomasello, Paden and Conneau, Alexis and Collobert, Ronan and Synnaeve, Gabriel and Auli, Michael},
  title   = {Self-training and Pre-training are Complementary for Speech Recognition},
  journal = {preprint arXiv:2010.11430},
  year    = {2020},
}
@article{xu2020iterative,
  author  = {Xu, Qiantong and Likhomanenko, Tatiana and Kahn, Jacob and Hannun, Awni and Synnaeve, Gabriel and Collobert, Ronan},
  title   = {Iterative pseudo-labeling for speech recognition},
  journal = {preprint arXiv:2005.09267},
  year    = {2020},
}
% Braces keep the method name in its mixed-case spelling under sentence-casing styles.
@article{french2020milking,
  author  = {French, Geoff and Oliver, Avital and Salimans, Tim},
  title   = {Milking {CowMask} for Semi-Supervised Image Classification},
  journal = {preprint arXiv:2003.12022},
  year    = {2020},
}
@article{dosovitskiy2020image,
  author  = {Dosovitskiy, Alexey and Beyer, Lucas and Kolesnikov, Alexander and Weissenborn, Dirk and Zhai, Xiaohua and Unterthiner, Thomas and Dehghani, Mostafa and Minderer, Matthias and Heigold, Georg and Gelly, Sylvain and others},
  title   = {An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale},
  journal = {preprint arXiv:2010.11929},
  year    = {2020},
}
@inproceedings{sun2017revisiting,
  author    = {Sun, Chen and Shrivastava, Abhinav and Singh, Saurabh and Gupta, Abhinav},
  title     = {Revisiting unreasonable effectiveness of data in deep learning era},
  booktitle = ICCV,
  year      = {2017},
}
@inproceedings{hu2018squeeze,
  author    = {Hu, Jie and Shen, Li and Sun, Gang},
  title     = {Squeeze-and-excitation networks},
  booktitle = CVPR,
  year      = {2018},
}
% Braces keep the dataset name in its mixed-case spelling under sentence-casing styles.
@inproceedings{van2018inaturalist,
  author    = {Van Horn, Grant and Mac Aodha, Oisin and Song, Yang and Cui, Yin and Sun, Chen and Shepard, Alex and Adam, Hartwig and Perona, Pietro and Belongie, Serge},
  title     = {The {iNaturalist} species classification and detection dataset},
  booktitle = CVPR,
  year      = {2018},
}
% Braces keep the dataset name capitalised under sentence-casing styles.
@article{kuznetsova2018open,
  author  = {Alina Kuznetsova and Mohamad Hassan Mohamad Rom and Neil Alldrin and Jasper Uijlings and Ivan Krasin and Jordi Pont-Tuset and Shahab Kamali and Stefan Popov and Matteo Malloci and Alexander Kolesnikov and Tom Duerig and Vittorio Ferrari},
  title   = {The {Open Images Dataset V4}: Unified image classification, object detection, and visual relationship detection at scale},
  journal = IJCV,
  year    = {2020},
}
@inproceedings{zhou2014learning,
  author    = {Zhou, Bolei and Lapedriza, Agata and Xiao, Jianxiong and Torralba, Antonio and Oliva, Aude},
  title     = {Learning deep features for scene recognition using places database},
  booktitle = NIPS,
  year      = {2014},
}
% Braces keep the PASCAL and VOC acronyms capitalised; initials are separated so styles can abbreviate them.
@article{everingham2010pascal,
  author  = {Everingham, Mark and Van Gool, Luc and Williams, Christopher K. I. and Winn, John and Zisserman, Andrew},
  title   = {The {PASCAL} visual object classes ({VOC}) challenge},
  journal = IJCV,
  year    = {2010},
}
% Braces keep the method acronym capitalised under sentence-casing styles.
@article{loshchilov2016sgdr,
  author  = {Loshchilov, Ilya and Hutter, Frank},
  title   = {{SGDR}: Stochastic gradient descent with warm restarts},
  journal = {preprint arXiv:1608.03983},
  year    = {2016},
}
@article{du2020self,
  author  = {Du, Jingfei and Grave, Edouard and Gunel, Beliz and Chaudhary, Vishrav and Celebi, Onur and Auli, Michael and Stoyanov, Ves and Conneau, Alexis},
  title   = {Self-training improves pre-training for natural language understanding},
  journal = {preprint arXiv:2010.02194},
  year    = {2020},
}
@article{yalniz2019billion,
  author  = {Yalniz, I Zeki and J{\'e}gou, Herv{\'e} and Chen, Kan and Paluri, Manohar and Mahajan, Dhruv},
  title   = {Billion-scale semi-supervised learning for image classification},
  journal = {preprint arXiv:1905.00546},
  year    = {2019},
}
@article{zoph2020rethinking,
  author  = {Zoph, Barret and Ghiasi, Golnaz and Lin, Tsung-Yi and Cui, Yin and Liu, Hanxiao and Cubuk, Ekin D and Le, Quoc V},
  title   = {Rethinking pre-training and self-training},
  journal = {preprint arXiv:2006.06882},
  year    = {2020},
}
@article{zhang2020pushing,
  author  = {Zhang, Yu and Qin, James and Park, Daniel S and Han, Wei and Chiu, Chung-Cheng and Pang, Ruoming and Le, Quoc V and Wu, Yonghui},
  title   = {Pushing the Limits of Semi-Supervised Learning for Automatic Speech Recognition},
  journal = {preprint arXiv:2010.10504},
  year    = {2020},
}
% Braces keep the method acronym capitalised under sentence-casing styles.
@article{richemond2020byol,
  author  = {Richemond, Pierre H and Grill, Jean-Bastien and Altch{\'e}, Florent and Tallec, Corentin and Strub, Florian and Brock, Andrew and Smith, Samuel and De, Soham and Pascanu, Razvan and Piot, Bilal and others},
  title   = {{BYOL} works even without batch statistics},
  journal = {preprint arXiv:2010.10241},
  year    = {2020},
}
% The accented letter in the first author's surname is a LaTeX escape, matching the rest of the file and safe for 8-bit BibTeX.
% NOTE(review): the escape reproduces the caron used in this file; the name may properly take a breve ({\u{a}}) -- confirm.
@inproceedings{bucilua2006model,
  author    = {Bucilu{\v{a}}, Cristian and Caruana, Rich and Niculescu-Mizil, Alexandru},
  title     = {Model compression},
  booktitle = {SIGKDD},
  year      = {2006},
}
@article{hinton2015distilling,
  author  = {Hinton, Geoffrey and Vinyals, Oriol and Dean, Jeff},
  title   = {Distilling the knowledge in a neural network},
  journal = {preprint arXiv:1503.02531},
  year    = {2015},
}
@article{tarvainen2017mean,
  author  = {Tarvainen, Antti and Valpola, Harri},
  title   = {Mean teachers are better role models: Weight-averaged consistency targets improve semi-supervised deep learning results},
  journal = {preprint arXiv:1703.01780},
  year    = {2017},
}
@article{touvron2020training,
  author  = {Touvron, Hugo and Cord, Matthieu and Douze, Matthijs and Massa, Francisco and Sablayrolles, Alexandre and J{\'e}gou, Herv{\'e}},
  title   = {Training data-efficient image transformers \& distillation through attention},
  journal = {preprint arXiv:2012.12877},
  year    = {2020},
}
@article{chen2020exploring,
  author  = {Chen, Xinlei and He, Kaiming},
  title   = {Exploring Simple Siamese Representation Learning},
  journal = {preprint arXiv:2011.10566},
  year    = {2020},
}
@article{chen2020improved,
  author  = {Chen, Xinlei and Fan, Haoqi and Girshick, Ross and He, Kaiming},
  title   = {Improved baselines with momentum contrastive learning},
  journal = {preprint arXiv:2003.04297},
  year    = {2020},
}
% Braces keep the method name in its mixed-case spelling under sentence-casing styles.
@article{bautista2016cliquecnn,
  author  = {Bautista, Miguel A and Sanakoyeu, Artsiom and Sutter, Ekaterina and Ommer, Bj{\"o}rn},
  title   = {{CliqueCNN}: Deep unsupervised exemplar learning},
  journal = {preprint arXiv:1608.08792},
  year    = {2016},
}
@inproceedings{huang2019unsupervised,
  author    = {Huang, Jiabo and Dong, Qi and Gong, Shaogang and Zhu, Xiatian},
  title     = {Unsupervised deep learning by neighbourhood discovery},
  booktitle = ICML,
  year      = {2019},
}
@inproceedings{zhuang2019local,
  author    = {Zhuang, Chengxu and Zhai, Alex Lin and Yamins, Daniel},
  title     = {Local aggregation for unsupervised learning of visual embeddings},
  booktitle = ICCV,
  year      = {2019},
}
% Venue uses the shared AISTATS macro so it is spelled the same as in the other AISTATS reference.
@inproceedings{gutmann2010noise,
  author    = {Gutmann, Michael and Hyv{\"a}rinen, Aapo},
  title     = {Noise-contrastive estimation: A new estimation principle for unnormalized statistical models},
  booktitle = AISTATS,
  year      = {2010},
}
@article{ermolov2020whitening,
  author  = {Ermolov, Aleksandr and Siarohin, Aliaksandr and Sangineto, Enver and Sebe, Nicu},
  title   = {Whitening for self-supervised representation learning},
  journal = {preprint arXiv:2007.06346},
  year    = {2020},
}
% Braces keep the method name capitalised under sentence-casing styles.
@article{zbontar2021barlow,
  author  = {Zbontar, Jure and Jing, Li and Misra, Ishan and LeCun, Yann and Deny, St{\'e}phane},
  title   = {{Barlow Twins}: Self-Supervised Learning via Redundancy Reduction},
  journal = {arXiv preprint arXiv:2103.03230},
  year    = {2021},
}
% Workshop paper. The trailing "and others" token was dropped from the author list:
% it makes styles print "et al." for what is a single-author paper.
@inproceedings{lee2013pseudo,
  author    = {Lee, Dong-Hyun},
  title     = {Pseudo-label: The simple and efficient semi-supervised learning method for deep neural networks},
  booktitle = {Workshop on challenges in representation learning, ICML},
  year      = {2013},
}
% Conference paper; CVPR is a bare macro name, presumably declared as a string macro elsewhere in this file.
% The method and dataset names are braced so sentence-casing styles keep their capitals.
@inproceedings{xie2020self,
  author    = {Xie, Qizhe and Luong, Minh-Thang and Hovy, Eduard and Le, Quoc V},
  title     = {Self-training with {Noisy Student} improves {ImageNet} classification},
  booktitle = CVPR,
  year      = {2020},
}
% Conference paper; NIPS is a bare macro name, presumably declared as a string macro elsewhere in this file.
@inproceedings{vaswani2017attention,
  author    = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N and Kaiser, {\L}ukasz and Polosukhin, Illia},
  title     = {Attention is all you need},
  booktitle = NIPS,
  year      = {2017},
}
% Conference paper; CVPR is a bare macro name, presumably declared as a string macro elsewhere in this file.
@inproceedings{zhao2020exploring,
  author    = {Zhao, Hengshuang and Jia, Jiaya and Koltun, Vladlen},
  title     = {Exploring self-attention for image recognition},
  booktitle = CVPR,
  year      = {2020},
}
% Conference paper; ICML is a bare macro name, presumably declared as a string macro elsewhere in this file.
% The given name of Kaiser uses the same {\L} spelling as the vaswani2017attention entry,
% so both entries refer to the author with one consistent name.
@inproceedings{parmar2018image,
  author    = {Parmar, Niki and Vaswani, Ashish and Uszkoreit, Jakob and Kaiser, {\L}ukasz and Shazeer, Noam and Ku, Alexander and Tran, Dustin},
  title     = {Image transformer},
  booktitle = ICML,
  year      = {2018},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
@article{child2019generating,
  author  = {Child, Rewon and Gray, Scott and Radford, Alec and Sutskever, Ilya},
  title   = {Generating long sequences with sparse transformers},
  journal = {preprint arXiv:1904.10509},
  year    = {2019},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
% The leading method name is braced so sentence-casing styles do not lowercase "Match".
@article{hoffer2019mix,
  author  = {Hoffer, Elad and Weinstein, Berry and Hubara, Itay and Ben-Nun, Tal and Hoefler, Torsten and Soudry, Daniel},
  title   = {{Mix \& Match}: training convnets with mixed image sizes for improved accuracy, speed and scale resiliency},
  journal = {preprint arXiv:1908.08986},
  year    = {2019},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
@article{bahdanau2014neural,
  author  = {Bahdanau, Dzmitry and Cho, Kyunghyun and Bengio, Yoshua},
  title   = {Neural machine translation by jointly learning to align and translate},
  journal = {preprint arXiv:1409.0473},
  year    = {2014},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
% The toolkit name is braced with its original capitalisation so styles cannot recase it.
@article{klein2017opennmt,
  author  = {Klein, Guillaume and Kim, Yoon and Deng, Yuntian and Senellart, Jean and Rush, Alexander M},
  title   = {{OpenNMT}: Open-source toolkit for neural machine translation},
  journal = {preprint arXiv:1701.02810},
  year    = {2017},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
% The author list ends with the "and others" token, which styles render as et al.
@article{chen2018best,
  author  = {Chen, Mia Xu and Firat, Orhan and Bapna, Ankur and Johnson, Melvin and Macherey, Wolfgang and Foster, George and Jones, Llion and Parmar, Niki and Schuster, Mike and Chen, Zhifeng and others},
  title   = {The best of both worlds: Combining recent advances in neural machine translation},
  journal = {preprint arXiv:1804.09849},
  year    = {2018},
}
% Conference paper; CVPR is a bare macro name, presumably declared as a string macro elsewhere in this file.
@inproceedings{radosavovic2020designing,
  author    = {Radosavovic, Ilija and Kosaraju, Raj Prateek and Girshick, Ross and He, Kaiming and Doll{\'a}r, Piotr},
  title     = {Designing network design spaces},
  booktitle = CVPR,
  year      = {2020},
}
% Preprint reference. The article type requires a journal field, so the arXiv identifier
% is supplied in the "preprint arXiv:<id>" form used by the other preprints in this file.
% NOTE(review): identifier 1711.05101 should be confirmed against the arXiv listing.
% The optimizer name is braced so sentence-casing styles keep its capital letter.
@article{loshchilov2018fixing,
  author  = {Loshchilov, Ilya and Hutter, Frank},
  title   = {Fixing weight decay regularization in {Adam}},
  journal = {preprint arXiv:1711.05101},
  year    = {2018},
}
% Conference paper; ECCV is a bare macro name, presumably declared as a string macro elsewhere in this file.
@inproceedings{zhang2016colorful,
  author    = {Zhang, Richard and Isola, Phillip and Efros, Alexei A},
  title     = {Colorful image colorization},
  booktitle = ECCV,
  year      = {2016},
}
% Conference paper: the NIPS venue macro lives in booktitle of an inproceedings entry,
% matching how the other NIPS references in this file are recorded.
@inproceedings{tian2020makes,
  author    = {Tian, Yonglong and Sun, Chen and Poole, Ben and Krishnan, Dilip and Schmid, Cordelia and Isola, Phillip},
  title     = {What makes for good views for contrastive learning},
  booktitle = NIPS,
  year      = {2020},
}
% Conference paper: the NIPS venue macro lives in booktitle of an inproceedings entry,
% matching how the other NIPS references in this file are recorded.
@inproceedings{salimans2016weight,
  author    = {Salimans, Tim and Kingma, Diederik P},
  title     = {Weight normalization: A simple reparameterization to accelerate training of deep neural networks},
  booktitle = NIPS,
  year      = {2016},
}
% Conference paper; NIPS is a bare macro name, presumably declared as a string macro elsewhere in this file.
@inproceedings{bach2011non,
  author    = {Bach, Francis and Moulines, Eric},
  title     = {Non-asymptotic analysis of stochastic approximation algorithms for machine learning},
  booktitle = NIPS,
  year      = {2011},
}
% Technical report. The techreport type requires an institution field, which is supplied here.
% NOTE(review): institution string should be confirmed against the report's cover page.
% The eponymous process name is braced so sentence-casing styles keep its capitals.
@techreport{ruppert1988efficient,
  author      = {Ruppert, David},
  title       = {Efficient estimations from a slowly convergent {Robbins-Monro} process},
  institution = {Cornell University Operations Research and Industrial Engineering},
  year        = {1988},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
@article{izmailov2018averaging,
  author  = {Izmailov, Pavel and Podoprikhin, Dmitrii and Garipov, Timur and Vetrov, Dmitry and Wilson, Andrew Gordon},
  title   = {Averaging weights leads to wider optima and better generalization},
  journal = {preprint arXiv:1803.05407},
  year    = {2018},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
@article{jean2014using,
  author  = {Jean, S{\'e}bastien and Cho, Kyunghyun and Memisevic, Roland and Bengio, Yoshua},
  title   = {On using very large target vocabulary for neural machine translation},
  journal = {preprint arXiv:1412.2007},
  year    = {2014},
}
% Conference paper; CVPR is a bare macro name, presumably declared as a string macro elsewhere in this file.
% The acronym is braced so sentence-casing styles do not turn it into "Mast".
@inproceedings{lai2020mast,
  author    = {Lai, Zihang and Lu, Erika and Xie, Weidi},
  title     = {{MAST}: A memory-augmented self-supervised tracker},
  booktitle = CVPR,
  year      = {2020},
}
% Conference paper; ICCV is a bare macro name, presumably declared as a string macro elsewhere in this file.
@inproceedings{oh2019video,
  author    = {Oh, Seoung Wug and Lee, Joon-Young and Xu, Ning and Kim, Seon Joo},
  title     = {Video object segmentation using space-time memory networks},
  booktitle = ICCV,
  year      = {2019},
}
% Conference paper; CVPR is a bare macro name, presumably declared as a string macro elsewhere in this file.
@inproceedings{wang2019learning,
  author    = {Wang, Xiaolong and Jabri, Allan and Efros, Alexei A},
  title     = {Learning correspondence from the cycle-consistency of time},
  booktitle = CVPR,
  year      = {2019},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
@article{gur2020visualization,
  author  = {Gur, Shir and Ali, Ameen and Wolf, Lior},
  title   = {Visualization of Supervised and Self-Supervised Neural Networks via Attribution Guided Factorization},
  journal = {preprint arXiv:2012.02166},
  year    = {2020},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
% The author list ends with the "and others" token, which styles render as et al.
@article{goyal2021self,
  author  = {Goyal, Priya and Caron, Mathilde and Lefaudeux, Benjamin and Xu, Min and Wang, Pengchao and Pai, Vivek and Singh, Mannat and Liptchinsky, Vitaliy and Misra, Ishan and Joulin, Armand and others},
  title   = {Self-supervised Pretraining of Visual Features in the Wild},
  journal = {preprint arXiv:2103.01988},
  year    = {2021},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
@article{el2021training,
  author  = {El-Nouby, Alaaeldin and Neverova, Natalia and Laptev, Ivan and J{\'e}gou, Herv{\'e}},
  title   = {Training Vision Transformers for Image Retrieval},
  journal = {preprint arXiv:2102.05644},
  year    = {2021},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
% The dataset acronym is braced in upper case so styles cannot lowercase it.
@article{pont20172017,
  author  = {Pont-Tuset, Jordi and Perazzi, Federico and Caelles, Sergi and Arbel{\'a}ez, Pablo and Sorkine-Hornung, Alex and Van Gool, Luc},
  title   = {The 2017 {DAVIS} challenge on video object segmentation},
  journal = {preprint arXiv:1704.00675},
  year    = {2017},
}
% Conference paper; NIPS is a bare macro name, presumably declared as a string macro elsewhere in this file.
@inproceedings{cuturi2013sinkhorn,
  author    = {Cuturi, Marco},
  title     = {Sinkhorn distances: Lightspeed computation of optimal transport},
  booktitle = NIPS,
  year      = {2013},
}
% Conference paper with the venue spelled out in full rather than through a macro.
@inproceedings{nilsback2008automated,
  author    = {Nilsback, Maria-Elena and Zisserman, Andrew},
  title     = {Automated flower classification over a large number of classes},
  booktitle = {2008 Sixth Indian Conference on Computer Vision, Graphics \& Image Processing},
  year      = {2008},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
@article{pham2020meta,
  author  = {Pham, Hieu and Xie, Qizhe and Dai, Zihang and Le, Quoc V},
  title   = {Meta pseudo labels},
  journal = {preprint arXiv:2003.10580},
  year    = {2020},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
% The second author is "Dai, Zihang": the surname had been repeated inside the given-name
% part, which made styles print the name as "Zihang Dai Dai".
@article{xie2020unsupervised,
  author  = {Xie, Qizhe and Dai, Zihang and Hovy, Eduard and Luong, Minh-Thang and Le, Quoc V.},
  title   = {Unsupervised Data Augmentation for Consistency Training},
  journal = {preprint arXiv:1904.12848},
  year    = {2020},
}
% Preprint reference; the arXiv identifier is carried in the journal field.
@article{assran2020recovering,
  author  = {Assran, Mahmoud and Ballas, Nicolas and Castrejon, Lluis and Rabbat, Michael},
  title   = {Recovering Petaflops in Contrastive Semi-Supervised Learning of Visual Representations},
  journal = {preprint arXiv:2006.10803},
  year    = {2020},
}
@inproceedings{zhang2017split,
title = {Split-brain autoencoders: Unsupervised learning by cross-channel prediction},
author = {Zhang, Richard and Isola, Phillip and Efros, Alexei A},
booktitle = {Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition},
pages = {1058--1067},
year = {2017}