-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathrefs_article.bib
More file actions
225 lines (225 loc) · 9.26 KB
/
Copy pathrefs_article.bib
File metadata and controls
225 lines (225 loc) · 9.26 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
% Agarap 2018, arXiv preprint 1803.08375 (cs.NE).
% The acronym in the title is brace-protected so that sentence-casing
% bibliography styles do not lowercase it to "relu".
@article{agarap2018ReLU,
  author        = {Agarap, Abien Fred},
  title         = {Deep Learning using Rectified Linear Units ({ReLU})},
  year          = {2018},
  eprint        = {1803.08375},
  archiveprefix = {arXiv},
  primaryclass  = {cs.NE},
  url           = {https://arxiv.org/abs/1803.08375},
}
% Bahdanau, Cho and Bengio; arXiv preprint 1409.0473 (cs.CL).
% Cited through the eprint fields and the arXiv abstract URL.
@article{bahdanau2016NeuralMachineTranslation,
  author        = {Bahdanau, Dzmitry and Cho, Kyunghyun and Bengio, Yoshua},
  title         = {Neural Machine Translation by Jointly Learning to Align and Translate},
  year          = {2016},
  eprint        = {1409.0473},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
  url           = {https://arxiv.org/abs/1409.0473},
}
% Dao et al. 2022, arXiv preprint 2205.14135 (cs.LG).
% "FlashAttention" and "IO" are brace-protected against sentence casing.
% The accented surname uses a LaTeX escape in a brace group so the entry
% also works with 8-bit classic BibTeX (sorting and label generation).
@article{dao2022FlashAttentionv1,
  author        = {Dao, Tri and Fu, Daniel Y. and Ermon, Stefano and Rudra, Atri and R{\'e}, Christopher},
  title         = {{FlashAttention}: Fast and Memory-Efficient Exact Attention with {IO}-Awareness},
  year          = {2022},
  eprint        = {2205.14135},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2205.14135},
}
% Detlefsen et al. 2022, Journal of Open Source Software 7(70), article 4101.
% The camel-case product names in the title are brace-protected so that
% sentence-casing styles do not turn them into "torchmetrics" / "pytorch".
@article{detlefsen2022TorchMetrics,
  author    = {Detlefsen, Nicki Skafte and Borovec, Jiri and Schock, Justus and Jha, Ananya Harsh and Koker, Teddy and Di Liello, Luca and Stancl, Daniel and Quan, Changsheng and Grechkin, Maxim and Falcon, William},
  title     = {{TorchMetrics} - Measuring Reproducibility in {PyTorch}},
  journal   = {Journal of Open Source Software},
  volume    = {7},
  number    = {70},
  pages     = {4101},
  year      = {2022},
  publisher = {The Open Journal},
  doi       = {10.21105/joss.04101},
  url       = {https://doi.org/10.21105/joss.04101},
}
% Dosovitskiy et al.; arXiv preprint 2010.11929 (cs.CV).
% Cited through the eprint fields and the arXiv abstract URL.
@article{dosovitskiy2021ViT,
  author        = {Dosovitskiy, Alexey and Beyer, Lucas and Kolesnikov, Alexander and Weissenborn, Dirk and Zhai, Xiaohua and Unterthiner, Thomas and Dehghani, Mostafa and Minderer, Matthias and Heigold, Georg and Gelly, Sylvain and Uszkoreit, Jakob and Houlsby, Neil},
  title         = {An Image is Worth 16x16 Words: Transformers for Image Recognition at Scale},
  year          = {2021},
  eprint        = {2010.11929},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/2010.11929},
}
% Girshick, Donahue, Darrell and Malik; arXiv preprint 1311.2524 (cs.CV).
% Cited through the eprint fields and the arXiv abstract URL.
@article{girshick2014RCNN,
  author        = {Girshick, Ross and Donahue, Jeff and Darrell, Trevor and Malik, Jitendra},
  title         = {Rich Feature Hierarchies for Accurate Object Detection and Semantic Segmentation},
  year          = {2014},
  eprint        = {1311.2524},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/1311.2524},
}
% Girshick 2015, arXiv preprint 1504.08083 (cs.CV).
% "R-CNN" is brace-protected; without it sentence-casing styles print "Fast r-cnn".
@article{girshick2015FastRCNN,
  author        = {Girshick, Ross},
  title         = {Fast {R-CNN}},
  year          = {2015},
  eprint        = {1504.08083},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/1504.08083},
}
% Goh et al. 2021, Distill article (DOI 10.23915/distill.00030).
% The article link lives in the url field, like every other entry in this
% file, instead of being typeset as free text through the note field.
% All author names use the unambiguous "Last, First" form.
@article{goh2021MultimodalNeurons,
  author  = {Goh, Gabriel and Cammarata, Nick and Voss, Chelsea and Carter, Shan and Petrov, Michael and Schubert, Ludwig and Radford, Alec and Olah, Chris},
  title   = {Multimodal Neurons in Artificial Neural Networks},
  journal = {Distill},
  year    = {2021},
  doi     = {10.23915/distill.00030},
  url     = {https://distill.pub/2021/multimodal-neurons},
}
% Goodfellow et al.; arXiv preprint 1406.2661 (stat.ML).
% Cited through the eprint fields and the arXiv abstract URL.
@article{goodfellow2014GAN,
  author        = {Goodfellow, Ian J. and Pouget-Abadie, Jean and Mirza, Mehdi and Xu, Bing and Warde-Farley, David and Ozair, Sherjil and Courville, Aaron and Bengio, Yoshua},
  title         = {Generative Adversarial Networks},
  year          = {2014},
  eprint        = {1406.2661},
  archiveprefix = {arXiv},
  primaryclass  = {stat.ML},
  url           = {https://arxiv.org/abs/1406.2661},
}
% He, Gkioxari, Dollar and Girshick; arXiv preprint 1703.06870 (cs.CV).
% "R-CNN" is brace-protected against sentence casing, and the accented
% surname uses a LaTeX escape in a brace group so the entry also works
% with 8-bit classic BibTeX.
@article{he2018MaskRCNN,
  author        = {He, Kaiming and Gkioxari, Georgia and Doll{\'a}r, Piotr and Girshick, Ross},
  title         = {Mask {R-CNN}},
  year          = {2018},
  eprint        = {1703.06870},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/1703.06870},
}
% Higgins et al. 2017, International Conference on Learning Representations.
% The model name is brace-protected so sentence-casing styles keep "VAE"
% in capitals instead of printing "beta-vae".
@inproceedings{higgins2017BetaVAE,
  author    = {Higgins, Irina and Matthey, Loic and Pal, Arka and Burgess, Christopher and Glorot, Xavier and Botvinick, Matthew and Mohamed, Shakir and Lerchner, Alexander},
  title     = {{beta-VAE}: Learning Basic Visual Concepts with a Constrained Variational Framework},
  booktitle = {International Conference on Learning Representations},
  year      = {2017},
  url       = {https://openreview.net/forum?id=Sy2fzU9gl},
}
% Hinton and Salakhutdinov 2006, Science 313(5786), pp. 504-507.
% Journal names are printed verbatim by standard styles, so the name is
% stored with its proper capital. Middle initials carry periods.
% NOTE(review): the DOI was added from memory -- confirm against the publisher page.
@article{hinton2006AutoEncoder,
  author    = {Hinton, Geoffrey E. and Salakhutdinov, Ruslan R.},
  title     = {Reducing the Dimensionality of Data With Neural Networks},
  journal   = {Science},
  volume    = {313},
  number    = {5786},
  pages     = {504--507},
  year      = {2006},
  publisher = {American Association for the Advancement of Science},
  doi       = {10.1126/science.1127647},
}
% Ho, Jain and Abbeel; arXiv preprint 2006.11239 (cs.LG).
% Cited through the eprint fields and the arXiv abstract URL.
@article{ho2020DDPM,
  author        = {Ho, Jonathan and Jain, Ajay and Abbeel, Pieter},
  title         = {Denoising Diffusion Probabilistic Models},
  year          = {2020},
  eprint        = {2006.11239},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2006.11239},
}
% Kingma and Welling; arXiv preprint 1312.6114 (stat.ML).
% "Bayes" is a proper noun and is brace-protected against sentence casing.
% The middle initial carries a period.
% NOTE(review): year is 2022 while the arXiv identifier 1312.* dates the
% first submission to December 2013; presumably the year tracks the latest
% arXiv revision -- confirm which year should be cited.
@article{kingma2022VAE,
  author        = {Kingma, Diederik P. and Welling, Max},
  title         = {Auto-Encoding Variational {Bayes}},
  year          = {2022},
  eprint        = {1312.6114},
  archiveprefix = {arXiv},
  primaryclass  = {stat.ML},
  url           = {https://arxiv.org/abs/1312.6114},
}
% Li, Li, Xiong and Hoi 2022, arXiv preprint 2201.12086 (cs.CV).
% The acronym "BLIP" is brace-protected against sentence casing.
@article{li2022BLIP,
  author        = {Li, Junnan and Li, Dongxu and Xiong, Caiming and Hoi, Steven},
  title         = {{BLIP}: Bootstrapping Language-Image Pre-training for Unified Vision-Language Understanding and Generation},
  year          = {2022},
  eprint        = {2201.12086},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/2201.12086},
}
% Luo; arXiv preprint 2208.11970 (cs.LG).
% Cited through the eprint fields and the arXiv abstract URL.
@article{luo2022UnderstandingDiffusionModels,
  author        = {Luo, Calvin},
  title         = {Understanding Diffusion Models: A Unified Perspective},
  year          = {2022},
  eprint        = {2208.11970},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2208.11970},
}
% Sohn, Lee and Yan 2015, Advances in Neural Information Processing Systems,
% volume 28. No page range or URL is recorded for this entry.
@inproceedings{NIPS2015ConditionalVAE,
  author    = {Sohn, Kihyuk and Lee, Honglak and Yan, Xinchen},
  title     = {Learning Structured Output Representation using Deep Conditional Generative Models},
  booktitle = {Advances in Neural Information Processing Systems},
  volume    = {28},
  editor    = {Cortes, C. and Lawrence, N. and Lee, D. and Sugiyama, M. and Garnett, R.},
  publisher = {Curran Associates, Inc.},
  year      = {2015},
}
% van den Oord, Vinyals and Kavukcuoglu; arXiv preprint 1711.00937 (cs.LG).
% The first author is written in "von Last, First" form, which parses to the
% same name parts as the "First von Last" spelling.
@article{oord2018VQVAE,
  author        = {van den Oord, Aaron and Vinyals, Oriol and Kavukcuoglu, Koray},
  title         = {Neural Discrete Representation Learning},
  year          = {2018},
  eprint        = {1711.00937},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/1711.00937},
}
% Radford et al.; arXiv preprint 2103.00020 (cs.CV).
% Cited through the eprint fields and the arXiv abstract URL.
@article{radford2021CLIP,
  author        = {Radford, Alec and Kim, Jong Wook and Hallacy, Chris and Ramesh, Aditya and Goh, Gabriel and Agarwal, Sandhini and Sastry, Girish and Askell, Amanda and Mishkin, Pamela and Clark, Jack and Krueger, Gretchen and Sutskever, Ilya},
  title         = {Learning Transferable Visual Models From Natural Language Supervision},
  year          = {2021},
  eprint        = {2103.00020},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/2103.00020},
}
% Ren, He, Girshick and Sun; arXiv preprint 1506.01497 (cs.CV).
% "R-CNN" is brace-protected; without it sentence-casing styles print "Faster r-cnn".
@article{ren2016FasterRCNN,
  author        = {Ren, Shaoqing and He, Kaiming and Girshick, Ross and Sun, Jian},
  title         = {Faster {R-CNN}: Towards Real-Time Object Detection with Region Proposal Networks},
  year          = {2016},
  eprint        = {1506.01497},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/1506.01497},
}
% Ronneberger, Fischer and Brox 2015, arXiv preprint 1505.04597 (cs.CV).
% The model name "U-Net" is brace-protected so sentence-casing styles
% do not print it as "U-net".
@article{ronneberger2015UNet,
  author        = {Ronneberger, Olaf and Fischer, Philipp and Brox, Thomas},
  title         = {{U-Net}: Convolutional Networks for Biomedical Image Segmentation},
  year          = {2015},
  eprint        = {1505.04597},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CV},
  url           = {https://arxiv.org/abs/1505.04597},
}
% Song, Meng and Ermon; arXiv preprint 2010.02502 (cs.LG).
% Cited through the eprint fields and the arXiv abstract URL.
@article{song2022DDIM,
  author        = {Song, Jiaming and Meng, Chenlin and Ermon, Stefano},
  title         = {Denoising Diffusion Implicit Models},
  year          = {2022},
  eprint        = {2010.02502},
  archiveprefix = {arXiv},
  primaryclass  = {cs.LG},
  url           = {https://arxiv.org/abs/2010.02502},
}
% Uijlings et al. 2013, International Journal of Computer Vision 104(2), pp. 154-171.
% Journal names are printed verbatim by standard styles, so the name is
% stored in its properly capitalised form. Glued initials are split and
% given periods, and the surname particle is lowercased so BibTeX parses
% "van de" as the von part of the name.
% NOTE(review): the DOI was added from memory -- confirm against the publisher page.
@article{uijlings2013SelectiveSearch,
  author    = {Uijlings, Jasper R. R. and van de Sande, Koen E. A. and Gevers, Theo and Smeulders, Arnold W. M.},
  title     = {Selective Search for Object Recognition},
  journal   = {International Journal of Computer Vision},
  volume    = {104},
  number    = {2},
  pages     = {154--171},
  year      = {2013},
  publisher = {Springer},
  doi       = {10.1007/s11263-013-0620-5},
}
% Vaswani et al.; arXiv preprint 1706.03762 (cs.CL).
% NOTE(review): year is 2023 while the arXiv identifier 1706.* dates the
% first submission to June 2017; presumably the year tracks the latest
% arXiv revision -- confirm which year should be cited.
@article{vaswani2023Attention,
  author        = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N. and Kaiser, Lukasz and Polosukhin, Illia},
  title         = {Attention is All You Need},
  year          = {2023},
  eprint        = {1706.03762},
  archiveprefix = {arXiv},
  primaryclass  = {cs.CL},
  url           = {https://arxiv.org/abs/1706.03762},
}
% Zhang, Lipton, Li and Smola 2023, book published by Cambridge University
% Press; the url field points at the book's website.
@book{zhang2023d2l,
  author    = {Zhang, Aston and Lipton, Zachary C. and Li, Mu and Smola, Alexander J.},
  title     = {Dive into Deep Learning},
  publisher = {Cambridge University Press},
  year      = {2023},
  url       = {https://D2L.ai},
}