-
Notifications
You must be signed in to change notification settings - Fork 4
Expand file tree
/
Copy pathcc2014.bib
More file actions
242 lines (214 loc) · 12.7 KB
/
Copy pathcc2014.bib
File metadata and controls
242 lines (214 loc) · 12.7 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
% GloVe paper (EMNLP 2014). The cc-snippet quotes the passage naming the Common Crawl training corpora.
@InProceedings{cc:PenningtonSocherManning:2014:GloVe-word-vectors,
  author     = {Pennington, Jeffrey and Socher, Richard and Manning, Christopher D.},
  title      = {{GloVe}: Global Vectors for Word Representation},
  booktitle  = {Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing ({EMNLP})},
  pages      = {1532--1543},
  year       = {2014},
  doi        = {10.3115/v1/D14-1162},
  URL        = {https://aclanthology.org/D14-1162.pdf},
  cc-author-affiliation = {Stanford University, California, USA},
  cc-class   = {nlp/word-embeddings},
  cc-snippet = {We trained our model on five corpora of varying sizes: [...] and on 42 billion tokens of web data,
    from Common Crawl⁵ [⁵ To demonstrate the scalability of the model, we also trained it on a much
    larger sixth corpus, containing 840 billion tokens of web data, but in this case we did not lowercase
    the vocabulary, so the results are not directly comparable.].},
}
% Workshop paper; the URL filename (IWSLT-36.pdf) points to IWSLT.
% NOTE(review): edition number (11th, 2014) is from memory -- confirm against the proceedings.
@InProceedings{cc:MedianiWinebargerWaibel:2014:In-domain-data-selection,
  author    = {Mohammed Mediani and Joshua Winebarger and Alexander Waibel},
  title     = {Improving In-Domain Data Selection For Small In-Domain Sets},
  booktitle = {Proceedings of the 11th International Workshop on Spoken Language Translation ({IWSLT})},
  year      = {2014},
  URL       = {http://www.statmt.org/OSMOSES/IWSLT-36.pdf},
  cc-author-affiliation = {Karlsruhe Institute of Technology, Germany},
}
% Conference paper. Affiliations are separated by semicolons, one per institution.
% NOTE(review): venue (AMTA 2014) is from memory -- confirm against the proceedings.
@InProceedings{cc:GuoLiuHanMaletti:2014:Tunable-language-model-SMT,
  author    = {Junfei Guo and Juan Liu and Qi Han and Andreas Maletti},
  title     = {A Tunable Language Model for Statistical Machine Translation},
  booktitle = {Proceedings of the 11th Conference of the Association for Machine Translation in the Americas ({AMTA})},
  year      = {2014},
  URL       = {http://www.ims.uni-stuttgart.de/institut/mitarbeiter/maletti/pub/guoliuhanmal14.pdf},
  cc-author-affiliation = {School of Computer, Wuhan University, China; Institute for Natural Language Processing,
    University of Stuttgart, Germany; Institute for Visualization and Interactive Systems, University of
    Stuttgart, Germany; Institute of Computer Science, University of Leipzig, Germany},
}
% arXiv preprint; the eprint identifier is taken from the URL.
% NOTE(review): primaryClass cs.CL is from memory -- confirm on the arXiv abstract page.
@Misc{cc:HannunCaseCasperCatanzaroEtAl:2014:Deep-speech,
  author        = {Awni Hannun and Carl Case and Jared Casper and Bryan Catanzaro and Greg Diamos and Erich Elsen and
    Ryan Prenger and Sanjeev Satheesh and Shubho Sengupta and Adam Coates and Andrew Y. Ng},
  title         = {{Deep Speech}: Scaling up end-to-end speech recognition},
  year          = {2014},
  eprint        = {1412.5567},
  archivePrefix = {arXiv},
  primaryClass  = {cs.CL},
  URL           = {http://arxiv.org/pdf/1412.5567v2.pdf},
  cc-author-affiliation = {Baidu Research – Silicon Valley AI Lab},
}
% Conference paper; venue follows from the ACL Anthology ID E14-1035 in the URL (EACL 2014).
% NOTE(review): doi follows the Anthology pattern for 2014 ACL events -- confirm it resolves.
@InProceedings{cc:HaslerKoehnHaddowBlunsom:2014:Dynamic-Topic-Adaptation-phrase-based-MT,
  author    = {Eva Hasler and Philipp Koehn and Barry Haddow and Phil Blunsom},
  title     = {Dynamic Topic Adaptation for Phrase-based {MT}},
  booktitle = {Proceedings of the 14th Conference of the European Chapter of the Association for Computational Linguistics ({EACL})},
  year      = {2014},
  doi       = {10.3115/v1/E14-1035},
  URL       = {http://www.aclweb.org/anthology/E/E14/E14-1035.pdf},
  cc-author-affiliation = {University of Edinburgh; University of Oxford},
}
% Single-author 2014 entry.
% NOTE(review): typed as an article but has no journal field; the venue is not stated here -- confirm and add.
@Article{cc:Tortelli:2014:Bloom-filter-based-routing-in-NDN,
  author = {Michele Tortelli},
  title  = {Bloom filter-based Routing in {NDN}},
  year   = {2014},
  URL    = {http://www.poliba.it/Didattica/docs/scorepoliba2014_submission_179.pdf},
  cc-author-affiliation = {Politecnico di Bari},
}
% Conference abstract; the URL path (SLTC2014) names the venue.
% NOTE(review): the ordinal "Fifth" is from memory -- confirm against the conference site.
@InProceedings{cc:GinterKanerva:2014:Fast-training-of-word2vec,
  author    = {Filip Ginter and Jenna Kanerva},
  title     = {Fast Training of word2vec Representations Using {N}-gram Corpora},
  booktitle = {Proceedings of the Fifth Swedish Language Technology Conference ({SLTC})},
  year      = {2014},
  URL       = {http://www2.lingfil.uu.se/SLTC2014/abstracts/sltc2014_submission_27.pdf},
  cc-author-affiliation = {University of Turku},
}
% Workshop paper; the URL gives the CEUR-WS volume (Vol-1267) and workshop acronym (LD4IE 2014).
% NOTE(review): the expanded workshop name and "2nd" ordinal are from memory -- confirm on the CEUR-WS volume page.
@InProceedings{cc:PetrovskiBrylBizer:2014:Product-attributes-from-e-commerce-microdata,
  author    = {Petar Petrovski and Volha Bryl and Christian Bizer},
  title     = {Learning Regular Expressions for the Extraction of Product Attributes from {E}-commerce Microdata},
  booktitle = {Proceedings of the 2nd International Workshop on Linked Data for Information Extraction ({LD4IE} 2014)},
  series    = {{CEUR} Workshop Proceedings},
  volume    = {1267},
  year      = {2014},
  URL       = {http://ceur-ws.org/Vol-1267/LD4IE2014_Petrovski.pdf},
  cc-author-affiliation = {University of Mannheim, Germany- Research Group Data and Web Science},
}
% Springer book chapter; the doi is the identifier embedded in the URL.
% NOTE(review): booktitle (ISWC 2014 proceedings) and series are from memory -- confirm on the publisher page.
@InProceedings{cc:MeuselPetrovskiBizer:2014:Web-Data-Commons-microdata-RDFa-microformat-dataset-series,
  author    = {Robert Meusel and Petar Petrovski and Christian Bizer},
  title     = {The {Web Data Commons} Microdata, {RDFa} and Microformat Dataset Series},
  booktitle = {The Semantic Web -- {ISWC} 2014},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  year      = {2014},
  doi       = {10.1007/978-3-319-11964-9_18},
  URL       = {http://link.springer.com/chapter/10.1007/978-3-319-11964-9_18#page-1},
  cc-author-affiliation = {University of Mannheim, Germany- Research Group Data and Web Science},
}
% Conference paper (CIKM 2014). The citation key keeps its historical spelling "Blanko" so existing
% citations still resolve; the author field carries the correct surname, Blanco.
% NOTE(review): doi prefix 10.1145/2661829 is from memory; the suffix comes from the URL id -- confirm it resolves.
@InProceedings{cc:MeuselMikaBlanko:2014:Focused-crawling-for-structured-data,
  author    = {Robert Meusel and Peter Mika and Roi Blanco},
  title     = {Focused Crawling for Structured Data},
  booktitle = {Proceedings of the 23rd {ACM} International Conference on Information and Knowledge Management ({CIKM})},
  year      = {2014},
  doi       = {10.1145/2661829.2661902},
  URL       = {http://dl.acm.org/citation.cfm?id=2661902},
  cc-author-affiliation = {University of Mannheim; Yahoo Labs- Barcelona},
}
% Conference paper; the URL filename (AMTA2014.pdf) names the venue.
% NOTE(review): the "11th" ordinal is from memory -- confirm against the proceedings.
@InProceedings{cc:DingUtiyamaSumita:2014:Document-level-re-ranking,
  author    = {Chenchen Ding and Masao Utiyama and Eiichiro Sumita},
  title     = {Document-level Re-ranking with Soft Lexical and Semantic Features for Statistical Machine Translation},
  booktitle = {Proceedings of the 11th Conference of the Association for Machine Translation in the Americas ({AMTA})},
  year      = {2014},
  URL       = {http://www.mibel.cs.tsukuba.ac.jp/~tei/AMTA2014.pdf},
  cc-author-affiliation = {National Institute of Information and Communications Technology Japan},
}
% Five-author 2014 entry; the URL is an ACM Digital Library citation page.
% NOTE(review): typed as an article but has no journal field; the venue is not stated here -- confirm and add.
@Article{cc:ShirakawaNakayamaAramakiHaraEtAl:2014:Conceptualized-relations,
  author = {Masumi Shirakawa and Kotaro Nakayama and Eiji Aramaki and Takahiro Hara and Shojiro Nishio},
  title  = {Collecting Conceptualized Relations from Terabytes of Web Texts for Understanding Unknown Terms},
  year   = {2014},
  URL    = {http://dl.acm.org/citation.cfm?id=2682777},
  cc-author-affiliation = {Osaka University},
}
% Paper in an IOS Press volume (the URL is an ebooks.iospress.nl article page).
% NOTE(review): booktitle (Baltic HLT 2014 proceedings) is from memory -- confirm on the publisher page.
@InProceedings{cc:KanervaLuotolahtiLaippalaGinter:2014:Syntactic-N-gram-collection,
  author    = {Jenna Kanerva and Juhani Luotolahti and Veronika Laippala and Filip Ginter},
  title     = {Syntactic {N}-gram Collection from a Large-Scale Corpus of Internet {Finnish}},
  booktitle = {Human Language Technologies -- The {Baltic} Perspective},
  publisher = {{IOS} Press},
  year      = {2014},
  URL       = {http://ebooks.iospress.nl/volumearticle/38025},
  cc-author-affiliation = {University of Turku},
}
% Conference companion paper. The first author is in "von Last, First" form so the particle "van"
% is parsed unambiguously.
% NOTE(review): venue (WWW '14 Companion) and doi prefix 10.1145/2567948 are from memory; the suffix
% comes from the URL id -- confirm it resolves.
@InProceedings{cc:HagePloegerHoeksema:2014:Number-frequency-on-the-web,
  author    = {van Hage, Willem Robert and Ploeger, Thomas and Hoeksema, Jesper},
  title     = {Number frequency on the web},
  booktitle = {Proceedings of the 23rd International Conference on World Wide Web ({WWW} '14 Companion)},
  year      = {2014},
  doi       = {10.1145/2567948.2576962},
  URL       = {http://dl.acm.org/citation.cfm?id=2576962},
  cc-author-affiliation = {SynerScope B.V., VU University Amsterdam},
}
% Conference paper; the URL filename (LREC2014) names the venue.
% "van Ooyen" is in comma form so the particle stays with the surname.
@InProceedings{cc:BuckHeafieldOoyen:2014:N-gram-counts-and-language-models,
  author    = {Buck, Christian and Heafield, Kenneth and van Ooyen, Bas},
  title     = {{N}-gram Counts and Language Models from the {Common Crawl}},
  booktitle = {Proceedings of the Ninth International Conference on Language Resources and Evaluation ({LREC}'14)},
  year      = {2014},
  URL       = {http://statmt.org/ngrams/BuckEtAl_LREC2014_CommonCrawlLM.pdf},
  cc-author-affiliation = {University of Edinburgh, Stanford University, Owlin BV},
}
% Workshop paper; venue follows from the ACL Anthology ID W14-3312 in the URL (WMT 2014).
% NOTE(review): doi follows the Anthology pattern for 2014 ACL events -- confirm it resolves.
@InProceedings{cc:HardmeierStymneTiedemannSmithEtAl:2014:Anaphora-models,
  author    = {Christian Hardmeier and Sara Stymne and Jörg Tiedemann and Aaron Smith and Joakim Nivre},
  title     = {Anaphora Models and Reordering for Phrase-Based {SMT}},
  booktitle = {Proceedings of the Ninth Workshop on Statistical Machine Translation},
  year      = {2014},
  doi       = {10.3115/v1/W14-3312},
  URL       = {http://acl2014.org/acl2014/W14-33/pdf/W14-3312.pdf},
  cc-author-affiliation = {Uppsala University: Department of Linguistics and Philology},
}
% Workshop system description; venue follows from the ACL Anthology ID W14-3321 in the URL (WMT 2014).
% NOTE(review): doi follows the Anthology pattern for 2014 ACL events -- confirm it resolves.
@InProceedings{cc:SchwartzAndersonGwinnupYoung:2014:MT-and-monolingual-postediting,
  author    = {Lane O. B. Schwartz and Timothy Anderson and Jeremy Gwinnup and Katherine M. Young},
  title     = {Machine Translation and Monolingual Postediting: The {AFRL} {WMT}-14 System},
  booktitle = {Proceedings of the Ninth Workshop on Statistical Machine Translation},
  year      = {2014},
  doi       = {10.3115/v1/W14-3321},
  URL       = {http://www.ling.uni-potsdam.de/~koller/aclpub/W14-33/cdrom/pdf/W14-3321.pdf},
  cc-author-affiliation = {Air Force Research Laboratory, SRA International, N-Space Analysis LLC},
}
% Conference paper; venue follows from the ACL Anthology ID C14-1182 in the URL (COLING 2014).
@InProceedings{cc:CuongSimaan:2014:Latent-domain-translation-models,
  author    = {Hoang Cuong and Khalil Sima’an},
  title     = {Latent Domain Translation Models in Mix-of-Domains Haystack},
  booktitle = {Proceedings of {COLING} 2014, the 25th International Conference on Computational Linguistics: Technical Papers},
  year      = {2014},
  URL       = {http://www.aclweb.org/anthology/C/C14/C14-1182.pdf},
  cc-author-affiliation = {University of Amsterdam - Institute for Logic, Language and Computation},
}
% Workshop paper. The citation key contains a non-ASCII character and is kept unchanged so existing
% citations still resolve.
% NOTE(review): venue (LDOW 2014) is from memory -- confirm.
% NOTE(review): the URL path points into a WWW2013 companion mirror; confirm it resolves to this paper.
@InProceedings{cc:SteinerMühleisenVerborghChampinEtAl:2014:WebVTT,
  author    = {Thomas Steiner and Hannes Mühleisen and Ruben Verborgh and Pierre-Antoine Champin and Benoît Encelle
    and Yannick Prié},
  title     = {Weaving the {Web(VTT)} of Data},
  booktitle = {Proceedings of the 7th Workshop on Linked Data on the Web ({LDOW} 2014)},
  year      = {2014},
  URL       = {http://telemedicina.unifesp.br/pub/Events/2013-05%20-%20WWW2013/www2013/www2013.org/companion/p1399.pdf},
  cc-author-affiliation = {Université de Lyon, Database Architectures Group; Multimedia Lab, Ghent University; iMinds,
    Université de Nantes},
}
% Conference paper. The system name is brace-protected so sentence-casing styles keep its camelCase.
% The citation key contains a non-ASCII character and is kept unchanged so existing citations still resolve.
% NOTE(review): venue (WWW 2014) is from memory -- confirm against the proceedings.
@InProceedings{cc:WylotCudré-MaurouxGroth:2014:TripleProv,
  author    = {Marcin Wylot and Philippe Cudré-Mauroux and Paul Groth},
  title     = {{TripleProv}: Efficient Processing of Lineage Queries in a Native {RDF} Store},
  booktitle = {Proceedings of the 23rd International Conference on World Wide Web ({WWW} '14)},
  year      = {2014},
  URL       = {http://exascale.info/sites/default/files/TipleProv.pdf},
  cc-author-affiliation = {eXascale Infolab, University of Fribourg; VU University Amsterdam},
}
% Conference paper; the doi is the identifier embedded in the URL.
% NOTE(review): the expanded proceedings title is from memory -- confirm on the ACM page.
@InProceedings{cc:LehmbergMeuselBizer:2014:Graph-structure-aggregated-by-pay-level-domain,
  author    = {Oliver Lehmberg and Robert Meusel and Christian Bizer},
  title     = {Graph structure in the web: aggregated by pay-level domain},
  booktitle = {Proceedings of the 2014 {ACM} Conference on Web Science ({WebSci} '14)},
  year      = {2014},
  doi       = {10.1145/2615569.2615674},
  URL       = {https://dl.acm.org/doi/10.1145/2615569.2615674},
  cc-author-affiliation = {University of Mannheim, Germany},
  cc-class  = {web-science/hyperlinkgraph},
}
% Conference companion paper. Affiliations are separated by semicolons, one per institution.
% NOTE(review): venue (WWW '14 Companion) is from memory -- confirm against the proceedings.
@InProceedings{cc:MeuselVignaLehmbergBizer:2014:Graph-structure-in-the-web-revisited,
  author    = {Robert Meusel and Sebastiano Vigna and Oliver Lehmberg and Christian Bizer},
  title     = {Graph Structure in the Web — Revisited},
  booktitle = {Proceedings of the 23rd International Conference on World Wide Web ({WWW} '14 Companion)},
  year      = {2014},
  URL       = {http://vigna.di.unimi.it/ftp/papers/GraphStructureRevisited.pdf},
  cc-author-affiliation = {Data and Web Science Group - University of Mannheim, Germany; Laboratory for Web Algorithmics -
    Università degli Studi di Milano, Italy},
  cc-class  = {web-science/hyperlinkgraph},
}
% Technical report; the institution is taken from the affiliation field.
% NOTE(review): report number is inferred from the URL filename (tr-692.pdf) -- confirm the exact designation.
@TechReport{cc:ArdiHeidemann:2014:Web-scale-content-reuse-detection,
  author      = {Calvin Ardi and John Heidemann},
  title       = {Web-scale Content Reuse Detection},
  institution = {USC/Information Sciences Institute},
  number      = {ISI-TR-692},
  year        = {2014},
  URL         = {ftp://ftp.isi.edu/isi-pubs/tr-692.pdf},
  cc-author-affiliation = {USC/Information Sciences Institute},
}
% Conference paper; the URL filename (emnlp2014) names the venue.
@InProceedings{cc:Tsuboi:2014:Neural-tagger,
  author    = {Yuta Tsuboi},
  title     = {Neural Networks Leverage Corpus-wide Information for Part-of-speech Tagging},
  booktitle = {Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing ({EMNLP})},
  year      = {2014},
  URL       = {http://2boy.org/~yuta/publications/neuraltagger-emnlp2014-tsuboi.pdf},
  cc-author-affiliation = {IBM Research},
}
% Journal article; the doi is the identifier embedded in the URL.
% NOTE(review): journal name and volume are from memory -- confirm on the publisher page.
@Article{cc:CettoloBertoldiFedericoSchwenkEtAl:2014:Translation-project-adaptation,
  author  = {Mauro Cettolo and Nicola Bertoldi and Marcello Federico and Holger Schwenk and Loïc Barrault and
    Christophe Servan},
  title   = {Translation project adaptation for {MT}-enhanced computer assisted translation},
  journal = {Machine Translation},
  volume  = {28},
  year    = {2014},
  doi     = {10.1007/s10590-014-9152-1},
  URL     = {http://link.springer.com/article/10.1007/s10590-014-9152-1},
  cc-author-affiliation = {Fondazione Bruno Kessler, University of Le Mans, Xerox Research Centre Europe},
}
% Conference paper; the URL filename (eamt2014) names the venue.
% The citation key keeps its historical spelling (with a dotless i) so existing citations still
% resolve; the author field carries the correct accented surname.
% NOTE(review): the "17th" ordinal is from memory -- confirm against the proceedings.
@InProceedings{cc:Sanchis-TrillesOrtiz-MartınezCasacuberta:2014:Efficient-wordgraph-pruning,
  author    = {Germán Sanchis-Trilles and Daniel Ortiz-Martínez and Francisco Casacuberta},
  title     = {Efficient Wordgraph Pruning for Interactive Translation Prediction},
  booktitle = {Proceedings of the 17th Annual Conference of the European Association for Machine Translation ({EAMT})},
  year      = {2014},
  URL       = {http://www.casmacat.eu/uploads/Main/2eamt2014.pdf},
  cc-author-affiliation = {PRHLT Centre - Universidad Politécnica de Valencia},
}
% arXiv preprint; the eprint identifier is taken from the URL.
@Misc{cc:KoliasAnagnostopoulosKayafas:2014:Exploratory-analysis-of-TB-scale-web-corpus,
  author        = {Vasilis Kolias and Ioannis Anagnostopoulos and Eleftherios Kayafas},
  title         = {Exploratory Analysis of a Terabyte Scale Web Corpus},
  year          = {2014},
  eprint        = {1409.5443},
  archivePrefix = {arXiv},
  URL           = {http://arxiv.org/abs/1409.5443},
  cc-author-affiliation = {National Technical University of Athens, University of Thessaly},
}
% Conference paper; the URL filename (ma14cocosda) points to the COCOSDA conference.
% NOTE(review): exact proceedings title and "17th" ordinal are from memory -- confirm.
@InProceedings{cc:MizukamiNeubigSaktiTodaEtAl:2014:Domain-paraphrase-database,
  author    = {Masahiro Mizukami and Graham Neubig and Sakriani Sakti and Tomoki Toda and Satoshi Nakamura},
  title     = {Building a Free General-Domain Paraphrase Database for {Japanese}},
  booktitle = {Proceedings of the 17th Oriental {COCOSDA} Conference},
  year      = {2014},
  URL       = {http://isw3.naist.jp/~masahiro-mi/paper/ma14cocosda.pdf},
  cc-author-affiliation = {Nara Institute of Science and Technology},
}