-
Notifications
You must be signed in to change notification settings - Fork 1
/
bi.bib
391 lines (356 loc) · 14.2 KB
/
bi.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
% word2vec paper (arXiv 1301.3781), originally exported from NASA ADS.
% Title is single-braced so the bibliography style controls its casing;
% authors are stored with full given names in "Last, First" form.
@article{v2w,
  author        = {Mikolov, Tomas and Chen, Kai and Corrado, Greg and Dean, Jeffrey},
  title         = {Efficient Estimation of Word Representations in Vector Space},
  journal       = {ArXiv e-prints},
  archivePrefix = {arXiv},
  eprint        = {1301.3781},
  primaryClass  = {cs.CL},
  keywords      = {Computer Science - Computation and Language},
  year          = {2013},
  month         = jan,
  adsurl        = {http://adsabs.harvard.edu/abs/2013arXiv1301.3781M},
  adsnote       = {Provided by the SAO/NASA Astrophysics Data System}
}
% ELMo paper (NAACL-HLT 2018). The venue is spelled out in full instead of
% the ad-hoc "Proc. of NAACL" abbreviation; pages and DOI added.
@inproceedings{elmo,
  author    = {Peters, Matthew E. and Neumann, Mark and Iyyer, Mohit and Gardner, Matt and Clark, Christopher and Lee, Kenton and Zettlemoyer, Luke},
  title     = {Deep Contextualized Word Representations},
  booktitle = {Proceedings of the 2018 Conference of the North {American} Chapter of the Association for Computational Linguistics: Human Language Technologies, Volume 1 (Long Papers)},
  pages     = {2227--2237},
  year      = {2018},
  doi       = {10.18653/v1/N18-1202}
}
% GloVe paper (EMNLP 2014). The booktitle must not start with "In": styles
% add that word themselves, so the old value rendered as "In In EMNLP".
% {GloVe} is braced to keep its mixed case under sentence-casing styles.
@inproceedings{glove,
  author    = {Pennington, Jeffrey and Socher, Richard and Manning, Christopher D.},
  title     = {{GloVe}: Global Vectors for Word Representation},
  booktitle = {Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing ({EMNLP})},
  pages     = {1532--1543},
  year      = {2014},
  doi       = {10.3115/v1/D14-1162}
}
% RNN/LSTM fundamentals tutorial; arXiv record exported from dblp (CoRR).
@article{rnn,
  author        = {Sherstinsky, Alex},
  title         = {Fundamentals of Recurrent Neural Network {(RNN)} and Long Short-Term Memory {(LSTM)} Network},
  journal       = {CoRR},
  volume        = {abs/1808.03314},
  year          = {2018},
  archivePrefix = {arXiv},
  eprint        = {1808.03314},
  url           = {http://arxiv.org/abs/1808.03314},
  timestamp     = {Sun, 02 Sep 2018 15:01:55 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1808-03314},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% "Visualizing and Understanding Recurrent Networks"; arXiv record exported from dblp (CoRR).
@article{rnn2,
  author        = {Karpathy, Andrej and Johnson, Justin and Li, Fei{-}Fei},
  title         = {Visualizing and Understanding Recurrent Networks},
  journal       = {CoRR},
  volume        = {abs/1506.02078},
  year          = {2015},
  archivePrefix = {arXiv},
  eprint        = {1506.02078},
  url           = {http://arxiv.org/abs/1506.02078},
  timestamp     = {Mon, 13 Aug 2018 16:46:44 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/KarpathyJL15},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% Original LSTM paper (ACM Digital Library export).
% The umlaut is written as {\"u} so BibTeX treats it as a single
% "special character" for sorting and labels; the journal name is unabbreviated.
@article{lstm,
  author     = {Hochreiter, Sepp and Schmidhuber, J{\"u}rgen},
  title      = {Long Short-Term Memory},
  journal    = {Neural Computation},
  issue_date = {November 15, 1997},
  volume     = {9},
  number     = {8},
  month      = nov,
  year       = {1997},
  issn       = {0899-7667},
  pages      = {1735--1780},
  numpages   = {46},
  url        = {http://dx.doi.org/10.1162/neco.1997.9.8.1735},
  doi        = {10.1162/neco.1997.9.8.1735},
  acmid      = {1246450},
  publisher  = {MIT Press},
  address    = {Cambridge, MA, USA}
}
% Transformer paper (NIPS 2017 proceedings export).
% {\L}ukasz: the unbraced form "\L ukasz" contains a space, so BibTeX split
% it into two given-name tokens. The editor's surname is "von Luxburg";
% "U. V. Luxburg" was parsed as given names "U. V." plus surname "Luxburg".
@incollection{attention,
  author    = {Vaswani, Ashish and Shazeer, Noam and Parmar, Niki and Uszkoreit, Jakob and Jones, Llion and Gomez, Aidan N. and Kaiser, {\L}ukasz and Polosukhin, Illia},
  title     = {Attention Is All You Need},
  booktitle = {Advances in Neural Information Processing Systems 30},
  editor    = {Guyon, I. and von Luxburg, U. and Bengio, S. and Wallach, H. and Fergus, R. and Vishwanathan, S. and Garnett, R.},
  pages     = {5998--6008},
  year      = {2017},
  publisher = {Curran Associates, Inc.},
  url       = {http://papers.nips.cc/paper/7181-attention-is-all-you-need.pdf}
}
% BERT paper; arXiv record exported from dblp (CoRR).
@article{bert,
  author        = {Devlin, Jacob and Chang, Ming{-}Wei and Lee, Kenton and Toutanova, Kristina},
  title         = {{BERT:} Pre-training of Deep Bidirectional Transformers for Language Understanding},
  journal       = {CoRR},
  volume        = {abs/1810.04805},
  year          = {2018},
  archivePrefix = {arXiv},
  eprint        = {1810.04805},
  url           = {http://arxiv.org/abs/1810.04805},
  timestamp     = {Tue, 30 Oct 2018 20:39:56 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1810-04805},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% Translation-matrix paper (arXiv 1309.4168), originally exported from NASA ADS.
% Title is single-braced so the bibliography style controls its casing;
% authors are stored with full given names in "Last, First" form.
@article{LM,
  author        = {Mikolov, Tomas and Le, Quoc V. and Sutskever, Ilya},
  title         = {Exploiting Similarities among Languages for Machine Translation},
  journal       = {ArXiv e-prints},
  archivePrefix = {arXiv},
  eprint        = {1309.4168},
  primaryClass  = {cs.CL},
  keywords      = {Computer Science - Computation and Language},
  year          = {2013},
  month         = sep,
  adsurl        = {http://adsabs.harvard.edu/abs/2013arXiv1309.4168M},
  adsnote       = {Provided by the SAO/NASA Astrophysics Data System}
}
% Cross-lingual embedding survey (arXiv 1706.04902), originally exported from NASA ADS.
% Surnames are no longer wrapped in an extra brace pair, so {\'c} and {\o}
% sit at brace depth one and count as BibTeX special characters.
@article{ruder,
  author        = {Ruder, Sebastian and Vuli{\'c}, Ivan and S{\o}gaard, Anders},
  title         = {A Survey of Cross-lingual Word Embedding Models},
  journal       = {ArXiv e-prints},
  archivePrefix = {arXiv},
  eprint        = {1706.04902},
  primaryClass  = {cs.CL},
  keywords      = {Computer Science - Computation and Language, Computer Science - Learning},
  year          = {2017},
  month         = jun,
  adsurl        = {http://adsabs.harvard.edu/abs/2017arXiv170604902R},
  adsnote       = {Provided by the SAO/NASA Astrophysics Data System}
}
% Multilingual-CCA word vectors paper (EACL 2014).
% Previously typed as an article with the university as "journal" and the
% download link hidden in "adsurl"; it is a conference paper, and the link
% belongs in "url". NOTE(review): venue, pages and DOI follow the ACL
% Anthology record E14-1049; confirm before publishing.
@inproceedings{cca,
  author    = {Faruqui, Manaal and Dyer, Chris},
  title     = {Improving Vector Space Word Representations Using Multilingual Correlation},
  booktitle = {Proceedings of the 14th Conference of the {European} Chapter of the Association for Computational Linguistics},
  publisher = {Association for Computational Linguistics},
  pages     = {462--471},
  year      = {2014},
  month     = apr,
  doi       = {10.3115/v1/E14-1049},
  url       = {http://repository.cmu.edu/cgi/viewcontent.cgi?article=1031&context=lti}
}
% PyTorch autodiff workshop paper.
% {PyTorch} is braced so sentence-casing styles do not print "pytorch".
@inproceedings{pytorch,
  author    = {Paszke, Adam and Gross, Sam and Chintala, Soumith and Chanan, Gregory and Yang, Edward and DeVito, Zachary and Lin, Zeming and Desmaison, Alban and Antiga, Luca and Lerer, Adam},
  title     = {Automatic Differentiation in {PyTorch}},
  booktitle = {NIPS-W},
  year      = {2017}
}
% OpenNMT system-demonstration paper (ACL 2017).
% {OpenNMT} is braced to survive sentence-casing; the venue is spelled out
% instead of "Proc. ACL"; page range added.
@inproceedings{opennmt,
  author    = {Klein, Guillaume and Kim, Yoon and Deng, Yuntian and Senellart, Jean and Rush, Alexander M.},
  title     = {{OpenNMT}: Open-Source Toolkit for Neural Machine Translation},
  booktitle = {Proceedings of {ACL} 2017, System Demonstrations},
  pages     = {67--72},
  year      = {2017},
  url       = {https://doi.org/10.18653/v1/P17-4012},
  doi       = {10.18653/v1/P17-4012}
}
% fastText subword-embeddings paper (arXiv preprint).
% The arXiv identifier now lives in eprint/archivePrefix rather than inside
% "journal", using the same CoRR + volume layout as the other arXiv entries
% in this file.
@article{fasttext,
  author        = {Bojanowski, Piotr and Grave, Edouard and Joulin, Armand and Mikolov, Tomas},
  title         = {Enriching Word Vectors with Subword Information},
  journal       = {CoRR},
  volume        = {abs/1607.04606},
  year          = {2016},
  url           = {http://arxiv.org/abs/1607.04606},
  archivePrefix = {arXiv},
  eprint        = {1607.04606}
}
% fastText text-classification paper (arXiv preprint).
% The arXiv identifier now lives in eprint/archivePrefix rather than inside
% "journal", using the same CoRR + volume layout as the other arXiv entries
% in this file.
@article{joulin2016bag,
  author        = {Joulin, Armand and Grave, Edouard and Bojanowski, Piotr and Mikolov, Tomas},
  title         = {Bag of Tricks for Efficient Text Classification},
  journal       = {CoRR},
  volume        = {abs/1607.01759},
  year          = {2016},
  url           = {http://arxiv.org/abs/1607.01759},
  archivePrefix = {arXiv},
  eprint        = {1607.01759}
}
% Pre-trained fastText vectors for 157 languages (LREC 2018).
@inproceedings{fasttextRepresentations,
  author    = {Grave, Edouard and Bojanowski, Piotr and Gupta, Prakhar and Joulin, Armand and Mikolov, Tomas},
  title     = {Learning Word Vectors for 157 Languages},
  booktitle = {Proceedings of the International Conference on Language Resources and Evaluation (LREC 2018)},
  year      = {2018}
}
% Snips Voice Platform paper; arXiv record exported from dblp (CoRR).
@article{snipsData,
  author        = {Coucke, Alice and Saade, Alaa and Ball, Adrien and Bluche, Th{\'{e}}odore and Caulier, Alexandre and Leroy, David and Doumouro, Cl{\'{e}}ment and Gisselbrecht, Thibault and Caltagirone, Francesco and Lavril, Thibaut and Primet, Ma{\"{e}}l and Dureau, Joseph},
  title         = {Snips Voice Platform: an embedded Spoken Language Understanding system for private-by-design voice interfaces},
  journal       = {CoRR},
  volume        = {abs/1805.10190},
  year          = {2018},
  archivePrefix = {arXiv},
  eprint        = {1805.10190},
  url           = {http://arxiv.org/abs/1805.10190},
  timestamp     = {Mon, 13 Aug 2018 16:46:59 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1805-10190},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% CNN sentence-classification paper; arXiv record exported from dblp (CoRR).
@article{deepPavlovCNN,
  author        = {Kim, Yoon},
  title         = {Convolutional Neural Networks for Sentence Classification},
  journal       = {CoRR},
  volume        = {abs/1408.5882},
  year          = {2014},
  archivePrefix = {arXiv},
  eprint        = {1408.5882},
  url           = {http://arxiv.org/abs/1408.5882},
  timestamp     = {Mon, 13 Aug 2018 16:46:21 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/Kim14f},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% Paragraph-vector paper; arXiv record exported from dblp (CoRR).
@article{doc2vec,
  author        = {Le, Quoc V. and Mikolov, Tomas},
  title         = {Distributed Representations of Sentences and Documents},
  journal       = {CoRR},
  volume        = {abs/1405.4053},
  year          = {2014},
  archivePrefix = {arXiv},
  eprint        = {1405.4053},
  url           = {http://arxiv.org/abs/1405.4053},
  timestamp     = {Mon, 13 Aug 2018 16:48:49 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/LeM14},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% Yandex company web page on machine-translation technology.
% The note field records the access date (4 April 2019), in Russian.
@misc{ytranslate,
  author  = {Yandex},
  title   = {Технологии - Машинный перевод},
  journal = {Компания Яндекс},
  year    = {2019},
  url     = {https://yandex.ru/company/technologies/translation/},
  note    = {Дата обращения - 4 апреля 2019}
}
% Universal Sentence Encoder paper; arXiv record exported from dblp (CoRR).
% "St. John" is a two-word surname: written as "Rhomni St. John", BibTeX
% took "John" as the surname and "Rhomni St." as given names. The comma
% form makes the split explicit.
@article{USE,
  author        = {Cer, Daniel and Yang, Yinfei and Kong, Sheng{-}yi and Hua, Nan and Limtiaco, Nicole and St. John, Rhomni and Constant, Noah and Guajardo{-}Cespedes, Mario and Yuan, Steve and Tar, Chris and Sung, Yun{-}Hsuan and Strope, Brian and Kurzweil, Ray},
  title         = {Universal Sentence Encoder},
  journal       = {CoRR},
  volume        = {abs/1803.11175},
  year          = {2018},
  url           = {http://arxiv.org/abs/1803.11175},
  archivePrefix = {arXiv},
  eprint        = {1803.11175},
  timestamp     = {Mon, 13 Aug 2018 16:46:40 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1803-11175},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% Skip-Thought Vectors paper; arXiv record exported from dblp (CoRR).
% NOTE(review): the citation key is spelled "SkipThonught"; it is kept
% as-is because documents cite it under that exact key.
@article{SkipThonught,
  author        = {Kiros, Ryan and Zhu, Yukun and Salakhutdinov, Ruslan and Zemel, Richard S. and Torralba, Antonio and Urtasun, Raquel and Fidler, Sanja},
  title         = {Skip-Thought Vectors},
  journal       = {CoRR},
  volume        = {abs/1506.06726},
  year          = {2015},
  archivePrefix = {arXiv},
  eprint        = {1506.06726},
  url           = {http://arxiv.org/abs/1506.06726},
  timestamp     = {Mon, 13 Aug 2018 16:48:27 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/KirosZSZTUF15},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% XLM paper; arXiv record exported from dblp (CoRR).
@article{XLM,
  author        = {Lample, Guillaume and Conneau, Alexis},
  title         = {Cross-lingual Language Model Pretraining},
  journal       = {CoRR},
  volume        = {abs/1901.07291},
  year          = {2019},
  archivePrefix = {arXiv},
  eprint        = {1901.07291},
  url           = {http://arxiv.org/abs/1901.07291},
  timestamp     = {Fri, 01 Feb 2019 13:39:59 +0100},
  biburl        = {https://dblp.org/rec/bib/journals/corr/abs-1901-07291},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% InferSent paper; arXiv record exported from dblp (CoRR).
@article{InferSent,
  author        = {Conneau, Alexis and Kiela, Douwe and Schwenk, Holger and Barrault, Lo{\"{\i}}c and Bordes, Antoine},
  title         = {Supervised Learning of Universal Sentence Representations from Natural Language Inference Data},
  journal       = {CoRR},
  volume        = {abs/1705.02364},
  year          = {2017},
  archivePrefix = {arXiv},
  eprint        = {1705.02364},
  url           = {http://arxiv.org/abs/1705.02364},
  timestamp     = {Mon, 13 Aug 2018 16:48:46 +0200},
  biburl        = {https://dblp.org/rec/bib/journals/corr/ConneauKSBB17},
  bibsource     = {dblp computer science bibliography, https://dblp.org}
}
% CoNLL 2018 shared-task system paper (source of multilingual ELMo models).
% month uses the unquoted macro so styles can abbreviate or localise it.
@inproceedings{elmoRepresentations,
  author    = {Che, Wanxiang and Liu, Yijia and Wang, Yuxuan and Zheng, Bo and Liu, Ting},
  title     = {Towards Better {UD} Parsing: Deep Contextualized Word Embeddings, Ensemble, and Treebank Concatenation},
  booktitle = {Proceedings of the {CoNLL} 2018 Shared Task: Multilingual Parsing from Raw Text to Universal Dependencies},
  month     = oct,
  year      = {2018},
  address   = {Brussels, Belgium},
  publisher = {Association for Computational Linguistics},
  pages     = {55--64},
  url       = {http://www.aclweb.org/anthology/K18-2005}
}
% Word-vector repository paper (21st Nordic Conference on Computational Linguistics).
% month uses the unquoted macro so styles can abbreviate or localise it.
@inproceedings{elmoHost,
  author    = {Fares, Murhaf and Kutuzov, Andrey and Oepen, Stephan and Velldal, Erik},
  title     = {Word vectors, reuse, and replicability: Towards a community repository of large-text resources},
  booktitle = {Proceedings of the 21st Nordic Conference on Computational Linguistics},
  month     = may,
  year      = {2017},
  address   = {Gothenburg, Sweden},
  publisher = {Association for Computational Linguistics},
  pages     = {271--276},
  url       = {http://www.aclweb.org/anthology/W17-0237}
}
% TensorFlow system paper (OSDI 2016).
% {TensorFlow} is braced so sentence-casing styles do not print "Tensorflow".
@inproceedings{tf,
  author    = {Mart{\'\i}n Abadi and Paul Barham and Jianmin Chen and Zhifeng Chen and Andy Davis and Jeffrey Dean and Matthieu Devin and Sanjay Ghemawat and Geoffrey Irving and Michael Isard and Manjunath Kudlur and Josh Levenberg and Rajat Monga and Sherry Moore and Derek G. Murray and Benoit Steiner and Paul Tucker and Vijay Vasudevan and Pete Warden and Martin Wicke and Yuan Yu and Xiaoqiang Zheng},
  title     = {{TensorFlow}: A System for Large-Scale Machine Learning},
  booktitle = {12th {USENIX} Symposium on Operating Systems Design and Implementation ({OSDI} 16)},
  year      = {2016},
  isbn      = {978-1-931971-33-1},
  address   = {Savannah, GA},
  pages     = {265--283},
  url       = {https://www.usenix.org/conference/osdi16/technical-sessions/presentation/abadi},
  publisher = {{USENIX} Association}
}
% Adam optimizer paper (ICLR 2015); record exported from dblp.
% The crossref to DBLP:conf/iclr/2015 was removed: no such parent entry is
% defined in this file, so BibTeX would report a bad cross reference, and
% booktitle and year are already given inline here.
@inproceedings{adam,
  author    = {Kingma, Diederik P. and Ba, Jimmy},
  title     = {Adam: {A} Method for Stochastic Optimization},
  booktitle = {3rd International Conference on Learning Representations, {ICLR} 2015, San Diego, CA, USA, May 7--9, 2015, Conference Track Proceedings},
  year      = {2015},
  url       = {http://arxiv.org/abs/1412.6980},
  timestamp = {Fri, 29 Mar 2019 10:36:36 +0100},
  biburl    = {https://dblp.org/rec/bib/journals/corr/KingmaB14},
  bibsource = {dblp computer science bibliography, https://dblp.org}
}
https://towardsdatascience.com/deep-transfer-learning-for-natural-language-processing-text-classification-with-universal-1a2c69e5baa9
https://openreview.net/forum?id=SyK00v5xx -- про хак для бейслайна
https://code.fb.com/ml-applications/under-the-hood-multilingual-embeddings/ -- про проблему и clwe
https://medium.com/huggingface/universal-word-sentence-embeddings-ce48ddc8fc3a