-
Notifications
You must be signed in to change notification settings - Fork 113
/
thesis.bib
2420 lines (2103 loc) · 76 KB
/
thesis.bib
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
974
975
976
977
978
979
980
981
982
983
984
985
986
987
988
989
990
991
992
993
994
995
996
997
998
999
1000
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%% Neural Machine Translation %%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
@article{systran16,
  author  = {Josep Maria Crego and Jungi Kim and Guillaume Klein and
             Anabel Rebollo and Kathy Yang and Jean Senellart and
             Egor Akhanov and Patrice Brunelle and Aurelien Coquard and
             Yongchao Deng and Satoshi Enoue and Chiyo Geiss and
             Joshua Johanson and Ardas Khalsa and Raoum Khiari and
             Byeongil Ko and Catherine Kobus and Jean Lorieux and
             Leidiana Martins and Dang{-}Chuan Nguyen and Alexandra Priori and
             Thomas Riccardi and Natalia Segal and Christophe Servan and
             Cyril Tiquet and Bo Wang and Jin Yang and Dakun Zhang and
             Jing Zhou and Peter Zoldan},
  title   = {{SYSTRAN}'s Pure Neural Machine Translation Systems},
  journal = {arXiv preprint arXiv:1610.05540},
  year    = {2016},
}
@article{gnmt16,
  author  = {Yonghui Wu and Mike Schuster and Zhifeng Chen and Quoc V. Le and
             Mohammad Norouzi and Wolfgang Macherey and Maxim Krikun and
             Yuan Cao and Qin Gao and Klaus Macherey and Jeff Klingner and
             Apurva Shah and Melvin Johnson and Xiaobing Liu and
             Lukasz Kaiser and Stephan Gouws and Yoshikiyo Kato and
             Taku Kudo and Hideto Kazawa and Keith Stevens and
             George Kurian and Nishant Patil and Wei Wang and Cliff Young and
             Jason Smith and Jason Riesa and Alex Rudnick and Oriol Vinyals and
             Greg Corrado and Macduff Hughes and Jeffrey Dean},
  title   = {{Google}'s Neural Machine Translation System: Bridging the Gap
             between Human and Machine Translation},
  journal = {arXiv preprint arXiv:1609.08144},
  year    = {2016},
}
@inproceedings{cohn16,
  author    = {Cohn, Trevor and Hoang, Cong Duy Vu and Vymolova, Ekaterina and
               Yao, Kaisheng and Dyer, Chris and Haffari, Gholamreza},
  title     = {Incorporating Structural Alignment Biases into an Attentional Neural Translation Model},
  booktitle = {NAACL},
  year      = {2016},
}
@inproceedings{tu16coverage,
  author    = {Tu, Zhaopeng and Lu, Zhengdong and Liu, Yang and
               Liu, Xiaohua and Li, Hang},
  title     = {Modeling Coverage for Neural Machine Translation},
  booktitle = {ACL},
  year      = {2016},
}
@inproceedings{kim16distill,
  author    = {Yoon Kim and Alexander M. Rush},
  title     = {Sequence-Level Knowledge Distillation},
  booktitle = {EMNLP},
  year      = {2016},
}
@inproceedings{cheng16,
  author    = {Cheng, Yong and Xu, Wei and He, Zhongjun and He, Wei and
               Wu, Hua and Sun, Maosong and Liu, Yang},
  title     = {Semi-Supervised Learning for Neural Machine Translation},
  booktitle = {ACL},
  year      = {2016},
}
@article{tu16,
  author  = {Tu, Zhaopeng and Liu, Yang and Shang, Lifeng and
             Liu, Xiaohua and Li, Hang},
  title   = {Neural Machine Translation with Reconstruction},
  journal = {arXiv preprint arXiv:1611.01874},
  year    = {2016},
}
@inproceedings{xia16,
  author    = {Yingce Xia and Di He and Tao Qin and Liwei Wang and
               Nenghai Yu and Tie{-}Yan Liu and Wei{-}Ying Ma},
  title     = {Dual Learning for Machine Translation},
  booktitle = {NIPS},
  year      = {2016},
}
@article{ha16,
  author  = {Thanh-Le Ha and Jan Niehues and Alexander Waibel},
  title   = {Toward Multilingual Neural Machine Translation with Universal Encoder and Decoder},
  journal = {arXiv preprint arXiv:1611.04798},
  year    = {2016},
}
@article{gnmt16multi,
  author  = {Melvin Johnson and Mike Schuster and Quoc V. Le and
             Maxim Krikun and Yonghui Wu and Zhifeng Chen and
             Nikhil Thorat and Fernanda Vi{\'e}gas and Martin Wattenberg and
             Greg Corrado and Macduff Hughes and Jeffrey Dean},
  title   = {{Google}'s Multilingual Neural Machine Translation System: Enabling Zero-Shot Translation},
  journal = {arXiv preprint arXiv:1611.04558},
  year    = {2016},
}
@inproceedings{firat16,
  author    = {Firat, Orhan and Cho, Kyunghyun and Bengio, Yoshua},
  title     = {Multi-Way, Multilingual Neural Machine Translation with a Shared Attention Mechanism},
  booktitle = {NAACL},
  year      = {2016},
}
@inproceedings{zoph16,
  author    = {Zoph, Barret and Knight, Kevin},
  title     = {Multi-Source Neural Translation},
  booktitle = {NAACL},
  year      = {2016},
}
@inproceedings{see16,
  author    = {See, Abigail and Luong, Minh-Thang and Manning, Christopher D.},
  title     = {Compression of Neural Machine Translation Models via Pruning},
  booktitle = {CoNLL},
  year      = {2016},
}
@inproceedings{luong16,
  author    = {Luong, Minh-Thang and Manning, Christopher D.},
  title     = {Achieving Open Vocabulary Neural Machine Translation with Hybrid Word-Character Models},
  booktitle = {ACL},
  year      = {2016},
}
@inproceedings{sennrich16mono,
  author    = {Rico Sennrich and Barry Haddow and Alexandra Birch},
  title     = {Improving neural machine translation models with monolingual data},
  booktitle = {ACL},
  year      = {2016},
}
@inproceedings{sennrich16sub,
  author    = {Rico Sennrich and Barry Haddow and Alexandra Birch},
  title     = {Neural Machine Translation of Rare Words with Subword Units},
  booktitle = {ACL},
  year      = {2016},
}
@inproceedings{luong16iclr,
  author    = {Minh-Thang Luong and Quoc V. Le and Ilya Sutskever and
               Oriol Vinyals and Lukasz Kaiser},
  title     = {Multi-task sequence to sequence learning},
  booktitle = {ICLR},
  year      = {2016},
}
@article{ling15char,
  author  = {Wang Ling and Isabel Trancoso and Chris Dyer and Alan Black},
  title   = {Character-based Neural Machine Translation},
  journal = {arXiv preprint arXiv:1511.04586},
  year    = {2015},
}
@inproceedings{iwslt15,
  author    = {Mauro Cettolo and Jan Niehues and Sebastian St{\"{u}}ker and
               Luisa Bentivogli and Roldano Cattoni and Marcello Federico},
  title     = {The {IWSLT} 2015 Evaluation Campaign},
  booktitle = {IWSLT},
  year      = {2015},
}
@inproceedings{luong15iwslt,
  author    = {Luong, Minh-Thang and Manning, Christopher D.},
  title     = {{Stanford} Neural Machine Translation Systems for Spoken Language Domain},
  booktitle = {IWSLT},
  year      = {2015},
}
@inproceedings{jean15wmt,
  author    = {Jean, S{\'e}bastien and Firat, Orhan and Cho, Kyunghyun and
               Memisevic, Roland and Bengio, Yoshua},
  title     = {{Montreal} Neural Machine Translation Systems for {WMT}'15},
  booktitle = {WMT},
  year      = {2015},
}
@inproceedings{luong15attn,
  author    = {Luong, Minh-Thang and Pham, Hieu and Manning, Christopher D.},
  title     = {Effective Approaches to Attention-based Neural Machine Translation},
  booktitle = {EMNLP},
  year      = {2015},
}
@article{gulcehre2015using,
  author  = {Gulcehre, Caglar and Firat, Orhan and Xu, Kelvin and
             Cho, Kyunghyun and Barrault, Loic and Lin, Huei-Chi and
             Bougares, Fethi and Schwenk, Holger and Bengio, Yoshua},
  title   = {On Using Monolingual Corpora in Neural Machine Translation},
  journal = {arXiv preprint arXiv:1503.03535},
  year    = {2015},
}
@inproceedings{luong15,
  author    = {Minh-Thang Luong and Ilya Sutskever and Quoc V. Le and
               Oriol Vinyals and Wojciech Zaremba},
  title     = {Addressing the Rare Word Problem in Neural Machine Translation},
  booktitle = {ACL},
  year      = {2015},
}
@inproceedings{jean15,
  author    = {S\'{e}bastien Jean and Kyunghyun Cho and Roland Memisevic and
               Yoshua Bengio},
  title     = {On Using Very Large Target Vocabulary for Neural Machine Translation},
  booktitle = {ACL},
  year      = {2015},
}
@inproceedings{bog15,
  author    = {Dzmitry Bahdanau and Kyunghyun Cho and Yoshua Bengio},
  title     = {Neural Machine Translation by Jointly Learning to Align and Translate},
  booktitle = {ICLR},
  year      = {2015},
}
@inproceedings{sutskever14,
  author    = {Ilya Sutskever and Oriol Vinyals and Quoc V. Le},
  title     = {Sequence to Sequence Learning with Neural Networks},
  booktitle = {NIPS},
  year      = {2014},
}
@inproceedings{cho14,
  author    = {Kyunghyun Cho and Bart van Merrienboer and Caglar Gulcehre and
               Fethi Bougares and Holger Schwenk and Yoshua Bengio},
  title     = {Learning Phrase Representations using {RNN} Encoder-Decoder for Statistical Machine Translation},
  booktitle = {EMNLP},
  year      = {2014},
}
@inproceedings{kal13,
  author    = {Nal Kalchbrenner and Phil Blunsom},
  title     = {Recurrent Continuous Translation Models},
  booktitle = {EMNLP},
  year      = {2013},
}
@incollection{forcada97,
  author    = {Mikel L. Forcada and Ram{\'o}n {\~N}eco},
  title     = {Recursive hetero-associative memories for translation},
  booktitle = {Biological and Artificial Computation: From Neuroscience to Technology},
  publisher = {Springer},
  pages     = {453--462},
  year      = {1997},
}
@article{chrisman91,
  author  = {Lonnie Chrisman},
  title   = {Learning Recursive Distributed Representations for Holistic Computation},
  journal = {Connection Science},
  volume  = {3},
  number  = {4},
  pages   = {345--366},
  year    = {1991},
}
@inproceedings{allen87,
  author    = {Robert B. Allen},
  title     = {Several studies on natural language and back-propagation},
  booktitle = {ICNN},
  year      = {1987},
}
%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%% Machine Translation %%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%
@article{winograd_mt16,
  author  = {Ernest Davis},
  title   = {{Winograd} Schemas and Machine Translation},
  journal = {arXiv preprint arXiv:1608.01884},
  year    = {2016},
}
@inproceedings{luong15nlm,
  author    = {Luong, Minh-Thang and Kayser, Michael and Manning, Christopher D.},
  title     = {Deep Neural Language Models for Machine Translation},
  booktitle = {CoNLL},
  year      = {2015},
}
@inproceedings{chrf,
  author    = {Popovi{\'c}, Maja},
  title     = {{chrF}: character n-gram {F-score} for automatic {MT} evaluation},
  booktitle = {WMT},
  year      = {2015},
}
% Winning entry in WMT'15 for English-Czech
@inproceedings{bojar15wmt,
  author    = {Bojar, Ond{\v{r}}ej and Tamchyna, Ale{\v{s}}},
  title     = {{CUNI} in {WMT15}: {Chimera} Strikes Again},
  booktitle = {WMT},
  year      = {2015},
}
@inproceedings{bojar15,
  author    = {Bojar, Ond\v{r}ej and Chatterjee, Rajen and Federmann, Christian and
               Haddow, Barry and Huck, Matthias and Hokamp, Chris and
               Koehn, Philipp and Logacheva, Varvara and Monz, Christof and
               Negri, Matteo and Post, Matt and Scarton, Carolina and
               Specia, Lucia and Turchi, Marco},
  title     = {Findings of the 2015 Workshop on Statistical Machine Translation},
  booktitle = {WMT},
  year      = {2015},
}
% Winning entry in WMT'14 for English-German
@inproceedings{buck14,
  author    = {Christian Buck and Kenneth Heafield and Bas van Ooyen},
  title     = {N-gram Counts and Language Models from the Common Crawl},
  booktitle = {LREC},
  year      = {2014},
}
% Winning entry in WMT'14 for English-French
@inproceedings{durrani-EtAl:2014:W14-33,
  author    = {Durrani, Nadir and Haddow, Barry and Koehn, Philipp and
               Heafield, Kenneth},
  title     = {{Edinburgh}'s Phrase-based Machine Translation Systems for {WMT}-14},
  booktitle = {WMT},
  year      = {2014},
}
@misc{wmt14_en_fr,
  author       = {Holger Schwenk},
  title        = {University Le Mans},
  howpublished = {\url{http://www-lium.univ-lemans.fr/~schwenk/cslm_joint_paper/}},
  year         = {2014},
  note         = {[Online; accessed 03-September-2014]},
}
@misc{statmt,
  author       = {statmt.org},
  title        = {statmt.org},
  howpublished = {\url{http://matrix.statmt.org/matrix/}},
  year         = {2014},
  note         = {[Online; accessed 03-September-2014]},
}
% ACL'14 best paper award, joint neural LM
@inproceedings{devlin14,
  author    = {Jacob Devlin and Rabih Zbib and Zhongqiang Huang and
               Thomas Lamar and Richard Schwartz and John Makhoul},
  title     = {Fast and Robust Neural Network Joint Models for Statistical Machine Translation},
  booktitle = {ACL},
  year      = {2014},
}
@misc{mobiledevices,
  author       = {Zachary Davies Boren},
  title        = {There are officially more mobile devices than people in the world},
  howpublished = {\url{http://www.independent.co.uk/life-style/gadgets-and-tech/news/there-are-officially-more-mobile-devices-than-people-in-the-world-9780518.html}},
  year         = {2014},
  note         = {Accessed: 2016-09-10},
}
@misc{solvemt,
  author       = {Nataly Kelly},
  title        = {Why Machines Alone Cannot Solve the World's Translation Problem},
  howpublished = {\url{http://www.huffingtonpost.com/nataly-kelly/why-machines-alone-cannot-translation_b_4570018.html}},
  year         = {2014},
  note         = {Accessed: 2016-09-10},
}
@inproceedings{Auli13,
  author    = {Auli, Michael and Galley, Michel and Quirk, Chris and
               Zweig, Geoffrey},
  title     = {Joint Language and Translation Modeling with Recurrent Neural Networks},
  booktitle = {ACL},
  year      = {2013},
}
@inproceedings{green-EtAl:2013:ACL2013,
  author    = {Green, Spence and Wang, Sida and Cer, Daniel and
               Manning, Christopher D.},
  title     = {Fast and Adaptive Online Training of Feature-Rich Translation Models},
  booktitle = {ACL},
  year      = {2013},
}
@inproceedings{vaswani13decode,
  author    = {Ashish Vaswani and Yinggong Zhao and Victoria Fossum and
               David Chiang},
  title     = {Decoding with large-scale neural language models improves translation},
  booktitle = {EMNLP},
  year      = {2013},
}
@inproceedings{zou13bilingual,
  author    = {Will Y. Zou and Richard Socher and Daniel Cer and
               Christopher D. Manning},
  title     = {Bilingual Word Embeddings for Phrase-Based Machine Translation},
  booktitle = {EMNLP},
  year      = {2013},
}
@article{mikolov13mt,
  author  = {Tom{\'{a}}{\v{s}} Mikolov and Quoc V. Le and Ilya Sutskever},
  title   = {Exploiting Similarities among Languages for Machine Translation},
  journal = {arXiv preprint arXiv:1309.4168},
  year    = {2013},
  url     = {http://arxiv.org/abs/1309.4168},
}
@inproceedings{heafield13,
  author    = {Kenneth Heafield and Ivan Pouzyrevsky and Jonathan H. Clark and
               Philipp Koehn},
  title     = {Scalable Modified {Kneser-Ney} Language Model Estimation},
  booktitle = {ACL},
  year      = {2013},
}
% NOTE(review): same author/title/booktitle/year as the entry keyed
% green-EtAl:2013:ACL2013; both keys are kept so existing \cite commands resolve.
@inproceedings{green13,
  author    = {Green, Spence and Wang, Sida and Cer, Daniel and
               Manning, Christopher D.},
  title     = {Fast and Adaptive Online Training of Feature-Rich Translation Models},
  booktitle = {ACL},
  year      = {2013},
}
@inproceedings{Schwenk12continuous,
  author    = {Holger Schwenk},
  title     = {Continuous Space Translation Models for Phrase-Based Statistical Machine Translation},
  booktitle = {COLING},
  year      = {2012},
}
@inproceedings{Son:2012:CST,
  author    = {Son, Le Hai and Allauzen, Alexandre and Yvon, Fran{\c{c}}ois},
  title     = {Continuous Space Translation Models with Neural Networks},
  booktitle = {NAACL-HLT},
  year      = {2012},
}
@inproceedings{chiang09,
  author    = {Chiang, David and Knight, Kevin and Wang, Wei},
  title     = {11,001 New Features for Statistical Machine Translation},
  booktitle = {NAACL},
  year      = {2009},
}
@inproceedings{Pauls2011,
  author    = {Pauls, Adam and Klein, Dan},
  title     = {Faster and Smaller N-gram Language Models},
  booktitle = {ACL},
  year      = {2011},
}
% kenlm
@inproceedings{kenlm,
  author    = {Kenneth Heafield},
  title     = {{KenLM:} Faster and Smaller Language Model Queries},
  booktitle = {WMT},
  year      = {2011},
}
% Phrasal
@inproceedings{cer10phrasal,
  author    = {Daniel Cer and Michel Galley and Daniel Jurafsky and
               Christopher D. Manning},
  title     = {Phrasal: A statistical machine translation toolkit for exploring new model features},
  booktitle = {ACL, Demonstration Session},
  year      = {2010},
}
% cdec
@inproceedings{dyer10cdec,
  author    = {Chris Dyer and Jonathan Weese and Hendra Setiawan and
               Adam Lopez and Ferhan Ture and Vladimir Eidelman and
               Juri Ganitkevitch and Phil Blunsom and Philip Resnik},
  title     = {cdec: A decoder, alignment, and learning framework for finite-state and context-free translation models},
  booktitle = {ACL, Demonstration Session},
  year      = {2010},
}
@book{koehn10smt,
  author    = {Koehn, Philipp},
  title     = {Statistical Machine Translation},
  edition   = {First},
  publisher = {Cambridge University Press},
  year      = {2010},
}
@misc{languages,
  author       = {Stephen R. Anderson},
  title        = {How many languages are there in the world?},
  howpublished = {\url{http://www.linguisticsociety.org/content/how-many-languages-are-there-world}},
  year         = {2010},
  note         = {Accessed: 2016-09-10},
}
@inproceedings{irstlm,
  author    = {Federico, Marcello and Bertoldi, Nicola and Cettolo, Mauro},
  title     = {{IRSTLM}: an open source toolkit for handling large scale language models},
  booktitle = {Interspeech},
  year      = {2008},
}
@inproceedings{galley08,
  author    = {Galley, Michel and Manning, Christopher D.},
  title     = {A Simple and Effective Hierarchical Phrase Reordering Model},
  booktitle = {EMNLP},
  year      = {2008},
}
@article{schwenk07,
  author  = {Schwenk, Holger},
  title   = {Continuous Space Language Models},
  journal = {Computer Speech and Language},
  volume  = {21},
  number  = {3},
  pages   = {492--518},
  year    = {2007},
}
@incollection{hutchins07,
  author    = {W. John Hutchins},
  title     = {Machine translation: A concise history},
  booktitle = {Computer Aided Translation: Theory and Practice},
  editor    = {Chan, Sin-wai},
  publisher = {Chinese University of Hong Kong},
  year      = {2007},
  url       = {http://www.hutchinsweb.me.uk/CUHK-2006.pdf},
}
% Moses
@inproceedings{koehn2007moses,
  author    = {Koehn, Philipp and Hoang, Hieu and Birch, Alexandra and
               Callison-Burch, Chris and Federico, Marcello and
               Bertoldi, Nicola and Cowan, Brooke and Shen, Wade and
               Moran, Christine and Zens, Richard and others},
  title     = {Moses: Open source toolkit for statistical machine translation},
  booktitle = {ACL, Demonstration Session},
  year      = {2007},
}
% Hiero
@article{chiang07hiero,
  author  = {David Chiang},
  title   = {Hierarchical phrase-based translation},
  journal = {Computational Linguistics},
  volume  = {33},
  number  = {2},
  pages   = {201--228},
  year    = {2007},
}
@inproceedings{brants07,
  author    = {Thorsten Brants and Ashok C. Popat and Peng Xu and
               Franz J. Och and Jeffrey Dean},
  title     = {Large language models in machine translation},
  booktitle = {EMNLP},
  year      = {2007},
}
@inproceedings{Liang:2006:EDA,
  author    = {Liang, Percy and Bouchard-C{\^o}t{\'e}, Alexandre and
               Klein, Dan and Taskar, Ben},
  title     = {An End-to-end Discriminative Approach to Machine Translation},
  booktitle = {ACL},
  year      = {2006},
}
% Berkeley aligner
@inproceedings{liang06alignment,
  author    = {Percy Liang and Ben Taskar and Dan Klein},
  title     = {Alignment by Agreement},
  booktitle = {NAACL},
  year      = {2006},
}
@inproceedings{chiang05,
  author    = {Chiang, David},
  title     = {A Hierarchical Phrase-based Model for Statistical Machine Translation},
  booktitle = {ACL},
  year      = {2005},
}
@article{och04,
  author  = {Och, Franz Josef and Ney, Hermann},
  title   = {The Alignment Template Approach to Statistical Machine Translation},
  journal = {Computational Linguistics},
  volume  = {30},
  number  = {4},
  pages   = {417--449},
  year    = {2004},
}
@inproceedings{Koehn:2003:SMT,
  author    = {Koehn, Philipp and Och, Franz Josef and Marcu, Daniel},
  title     = {Statistical Phrase-based Translation},
  booktitle = {NAACL},
  year      = {2003},
}
@article{och03,
  author  = {Och, Franz Josef and Ney, Hermann},
  title   = {A Systematic Comparison of Various Statistical Alignment Models},
  journal = {Computational Linguistics},
  volume  = {29},
  number  = {1},
  pages   = {19--51},
  year    = {2003},
}
@inproceedings{och03mert,
  author    = {Och, Franz Josef},
  title     = {Minimum Error Rate Training in Statistical Machine Translation},
  booktitle = {ACL},
  year      = {2003},
}
@inproceedings{och02,
  author    = {Och, Franz Josef and Ney, Hermann},
  title     = {Discriminative Training and Maximum Entropy Models for Statistical Machine Translation},
  booktitle = {ACL},
  year      = {2002},
}
@inproceedings{Marcu:2002,
  author    = {Marcu, Daniel and Wong, William},
  title     = {A Phrase-based, Joint Probability Model for Statistical Machine Translation},
  booktitle = {EMNLP},
  year      = {2002},
}
% SRILM
@inproceedings{srilm,
  author    = {Stolcke, Andreas},
  title     = {{SRILM} -- An Extensible Language Modeling Toolkit},
  booktitle = {ICSLP},
  year      = {2002},
}
@inproceedings{yamada01,
  author    = {Yamada, Kenji and Knight, Kevin},
  title     = {A Syntax-based Statistical Translation Model},
  booktitle = {ACL},
  year      = {2001},
}
% Journal article in the Proceedings of the IEEE (the entry carries volume and pages).
@article{Rosenfeld2000,
  author  = {Rosenfeld, Ronald},
  title   = {Two decades of statistical language modeling: Where do we go from here?},
  journal = {Proceedings of the IEEE},
  volume  = {88},
  number  = {8},
  pages   = {1270--1278},
  year    = {2000},
}
@incollection{hutchins2000early,
  author    = {W. John Hutchins},
  title     = {{Warren Weaver} and the launching of {MT}: brief biographical note},
  booktitle = {Early Years in Machine Translation: Memoirs and Biographies of Pioneers},
  publisher = {John Benjamins},
  pages     = {17--20},
  year      = {2000},
  url       = {http://www.hutchinsweb.me.uk/Weaver-2000.pdf},
}
@article{wu97,
  author  = {Wu, Dekai},
  title   = {Stochastic Inversion Transduction Grammars and Bilingual Parsing of Parallel Corpora},
  journal = {Computational Linguistics},
  volume  = {23},
  number  = {3},
  pages   = {377--403},
  year    = {1997},
}
@article{berger96,
  author  = {Berger, Adam L. and Della Pietra, Vincent J. and
             Della Pietra, Stephen A.},
  title   = {A Maximum Entropy Approach to Natural Language Processing},
  journal = {Computational Linguistics},
  volume  = {22},
  number  = {1},
  pages   = {39--71},
  year    = {1996},
}
% "the" SMT paper
@article{Brown:1993:MSM,
  author  = {Brown, Peter F. and Della Pietra, Vincent J. and
             Della Pietra, Stephen A. and Mercer, Robert L.},
  title   = {The Mathematics of Statistical Machine Translation: Parameter Estimation},
  journal = {Computational Linguistics},
  volume  = {19},
  number  = {2},
  pages   = {263--311},
  month   = jun,
  year    = {1993},
}
@inproceedings{Papineni02bleu,
  author    = {Kishore Papineni and Salim Roukos and Todd Ward and
               Wei-jing Zhu},
  title     = {{BLEU}: a Method for Automatic Evaluation of Machine Translation},
  booktitle = {ACL},
  year      = {2002},
}
% NOTE(review): typed as a numbered report so that no publisher/series is required;
% confirm that IBM is the right issuing institution for this newsletter.
@techreport{ibm701,
  author      = {Peter Sheridan},
  title       = {Research in language translation on the {IBM} type 701},
  type        = {IBM Technical Newsletter},
  number      = {9},
  institution = {IBM},
  year        = {1955},
  url         = {http://mt-archive.info/Sheridan-1955.pdf},
}
@incollection{weaver49,
  author    = {Weaver, Warren},
  title     = {Translation},
  booktitle = {Machine Translation of Languages},
  editor    = {Locke, William N. and Booth, A. Donald},
  publisher = {MIT Press},
  address   = {Cambridge, MA},
  pages     = {15--23},
  year      = {1949},
  note      = {Reprinted from a memorandum written by Weaver in 1949.},
}
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
%%% Sequence to Sequence Models / RNNs %%%
%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%%
@article{dozat16,
  author  = {Dozat, Timothy and Manning, Christopher D.},
  title   = {Deep Biaffine Attention for Neural Dependency Parsing},
  journal = {arXiv preprint arXiv:1611.01734},
  year    = {2016},
}
@inproceedings{chen16,
  author    = {Chen, Danqi and Bolton, Jason and Manning, Christopher D.},
  title     = {A Thorough Examination of the {CNN/Daily Mail} Reading Comprehension Task},
  booktitle = {ACL},
  year      = {2016},
}
@inproceedings{jia16,
  author    = {Robin Jia and Percy Liang},
  title     = {Data Recombination for Neural Semantic Parsing},
  booktitle = {ACL},
  year      = {2016},
}
@inproceedings{gulcehre16,
  author    = {{\c{C}}aglar G{\"{u}}l{\c{c}}ehre and Sungjin Ahn and
               Ramesh Nallapati and Bowen Zhou and Yoshua Bengio},
  title     = {Pointing the Unknown Words},
  booktitle = {ACL},
  year      = {2016},
}
@inproceedings{gu16,
  author    = {Jiatao Gu and Zhengdong Lu and Hang Li and Victor O. K. Li},
  title     = {Incorporating Copying Mechanism in Sequence-to-Sequence Learning},
  booktitle = {ACL},
  year      = {2016},
}
@inproceedings{wiseman16,
  author    = {Sam Wiseman and Alexander M. Rush},
  title     = {Sequence-to-Sequence Learning as Beam-Search Optimization},
  booktitle = {EMNLP},
  year      = {2016},
}
@inproceedings{shen16,
  author    = {Shiqi Shen and Yong Cheng and Zhongjun He and Wei He and
               Hua Wu and Maosong Sun and Yang Liu},
  title     = {Minimum Risk Training for Neural Machine Translation},
  booktitle = {ACL},
  year      = {2016},
}
@article{bahdanau16actor,
  author  = {Dzmitry Bahdanau and Philemon Brakel and Kelvin Xu and
             Anirudh Goyal and Ryan Lowe and Joelle Pineau and
             Aaron C. Courville and Yoshua Bengio},
  title   = {An Actor-Critic Algorithm for Sequence Prediction},
  journal = {arXiv preprint arXiv:1607.07086},
  year    = {2016},
}
@inproceedings{ranzato16,
  author    = {Marc'Aurelio Ranzato and Sumit Chopra and Michael Auli and
               Wojciech Zaremba},
  title     = {Sequence Level Training with Recurrent Neural Networks},
  booktitle = {ICLR},
  year      = {2016},
}
@inproceedings{li16,
  author    = {Li, Jiwei and Galley, Michel and Brockett, Chris and
               Spithourakis, Georgios and Gao, Jianfeng and Dolan, Bill},
  title     = {A Persona-Based Neural Conversation Model},
  booktitle = {ACL},
  year      = {2016},
}
@article{alrfou16,
  author  = {Rami Al{-}Rfou and Marc Pickett and Javier Snaider and
             Yun{-}Hsuan Sung and Brian Strope and Ray Kurzweil},
  title   = {Conversational Contextual Cues: The Case of Personalization and History for Response Ranking},
  journal = {arXiv preprint arXiv:1606.00372},
  year    = {2016},
}
@inproceedings{serban16,
  author    = {Iulian Vlad Serban and Alessandro Sordoni and Yoshua Bengio and
               Aaron C. Courville and Joelle Pineau},
  title     = {Building End-To-End Dialogue Systems Using Generative Hierarchical Neural Network Models},
  booktitle = {AAAI},
  year      = {2016},
}
@inproceedings{bengio15,
  author    = {Samy Bengio and Oriol Vinyals and Navdeep Jaitly and
               Noam M. Shazeer},
  title     = {Scheduled Sampling for Sequence Prediction with Recurrent Neural Networks},
  booktitle = {NIPS},
  year      = {2015},
}
@inproceedings{jozefowicz15,
  author    = {J{\'o}zefowicz, Rafal and Zaremba, Wojciech and Sutskever, Ilya},
  title     = {An Empirical Exploration of Recurrent Network Architectures},
  booktitle = {ICML},
  year      = {2015},
}
@article{greff15,
  author  = {Klaus Greff and Rupesh Kumar Srivastava and
             Jan Koutn{\'{\i}}k and Bas R. Steunebrink and
             J{\"{u}}rgen Schmidhuber},
  title   = {{LSTM:} {A} Search Space Odyssey},
  journal = {arXiv preprint arXiv:1503.04069},
  year    = {2015},
}
@inproceedings{li15,
  author    = {Li, Jiwei and Luong, Minh-Thang and Jurafsky, Dan},
  title     = {A Hierarchical Neural Autoencoder for Paragraphs and Documents},
  booktitle = {ACL},
  year      = {2015},
}
@inproceedings{dai15,
  author    = {Andrew M. Dai and Quoc V. Le},
  title     = {Semi-supervised Sequence Learning},
  booktitle = {NIPS},
  year      = {2015},
}
@inproceedings{kiros15skip,
  author    = {Ryan Kiros and Yukun Zhu and Ruslan Salakhutdinov and
               Richard S. Zemel and Antonio Torralba and Raquel Urtasun and
               Sanja Fidler},
  title     = {Skip-Thought Vectors},
  booktitle = {NIPS},
  year      = {2015},
}
@inproceedings{vinyals15grammar,
  author    = {Vinyals, Oriol and Kaiser, Lukasz and Koo, Terry and
               Petrov, Slav and Sutskever, Ilya and Hinton, Geoffrey},
  title     = {Grammar as a foreign language},
  booktitle = {NIPS},
  year      = {2015},
}
@inproceedings{draw15,
  author    = {Karol Gregor and Ivo Danihelka and Alex Graves and
               Danilo Jimenez Rezende and Daan Wierstra},
  title     = {{DRAW:} {A} Recurrent Neural Network For Image Generation},
  booktitle = {ICML},
  year      = {2015},
}
@inproceedings{xu15,
  author    = {Kelvin Xu and Jimmy Ba and Ryan Kiros and Kyunghyun Cho and
               Aaron C. Courville and Ruslan Salakhutdinov and
               Richard S. Zemel and Yoshua Bengio},
  title     = {Show, Attend and Tell: Neural Image Caption Generation with Visual Attention},
  booktitle = {ICML},
  year      = {2015},
}
@inproceedings{vinyals15caption,
  author    = {Vinyals, Oriol and Toshev, Alexander and Bengio, Samy and
               Erhan, Dumitru},
  title     = {Show and tell: A neural image caption generator},
  booktitle = {CVPR},
  year      = {2015},
}
@inproceedings{mnih14,
  author    = {Mnih, Volodymyr and Heess, Nicolas and Graves, Alex and
               Kavukcuoglu, Koray},
  title     = {Recurrent Models of Visual Attention},
  booktitle = {NIPS},
  year      = {2014},
}
@article{graves14,
  author  = {Alex Graves and Greg Wayne and Ivo Danihelka},
  title   = {Neural {Turing} Machines},
  journal = {arXiv preprint arXiv:1410.5401},
  year    = {2014},
}
@article{zaremba14,
  author  = {Wojciech Zaremba and Ilya Sutskever and Oriol Vinyals},
  title   = {Recurrent Neural Network Regularization},
  journal = {arXiv preprint arXiv:1409.2329},
  year    = {2014},
}
@inproceedings{pham2014dropout,
  author    = {Pham, Vu and Bluche, Th\'{e}odore and Kermorvant, Christopher and
               Louradour, J\'{e}r\^{o}me},
  title     = {Dropout improves recurrent neural networks for handwriting recognition},
  booktitle = {ICFHR},
  year      = {2014},
}
@article{graves13c,
  author  = {Alex Graves},
  title   = {Generating Sequences With Recurrent Neural Networks},
  journal = {arXiv preprint arXiv:1308.0850},
  year    = {2013},
}
@inproceedings{bengio13,
  author    = {Bengio, Yoshua and Boulanger-Lewandowski, Nicolas and
               Pascanu, Razvan},
  title     = {Advances in optimizing recurrent networks},
  booktitle = {ICASSP},
  year      = {2013},
}
@inproceedings{pascanu13,
  author    = {Razvan Pascanu and Tom{\'{a}}{\v{s}} Mikolov and Yoshua Bengio},
  title     = {On the difficulty of training recurrent neural networks},
  booktitle = {ICML},
  year      = {2013},
}