% LREC 2016 conference paper (citation key kept from the original export).
% Changes relative to the raw export:
%   - dropped `series`, which merely repeated `booktitle`;
%   - names normalised to "Last, First" so given names abbreviate correctly;
%   - the export's `note` dump was split up: the acknowledgement text is kept
%     verbatim in the non-printing `funding` field, and the conference dates
%     are recorded in `month` / `eventdate`.
@inproceedings{d340240bb6604de7999182393f833b9c,
  author    = {Nisioi, Sergiu and Rabinovich, Ella and Dinu, Liviu P. and Wintner, Shuly},
  title     = {A corpus of native, non-native and translated texts},
  booktitle = {Proceedings of the 10th International Conference on Language Resources and Evaluation, {LREC} 2016},
  editor    = {Calzolari, Nicoletta and Choukri, Khalid and Mazo, Helene and Moreno, Asuncion and Declerck, Thierry and Goggi, Sara and Grobelnik, Marko and Odijk, Jan and Piperidis, Stelios and Maegaard, Bente and Mariani, Joseph},
  year      = {2016},
  month     = may,
  pages     = {4197--4201},
  eventdate = {2016-05-23/2016-05-28},
  language  = {American English},
  keywords  = {Bilingualism, Corpus linguistics, Second language acquisition, Translation},
  abstract  = {We describe a monolingual English corpus of original and (human) translated texts, with an accurate annotation of speaker properties, including the original language of the utterances and the speaker's country of origin. We thus obtain three sub-corpora of texts reflecting native English, non-native English, and English translated from a variety of European languages. This dataset will facilitate the investigation of similarities and differences between these kinds of sub-languages. Moreover, it will facilitate a unified comparative study of translations and language produced by (highly fluent) non-native speakers, two closely-related phenomena that have only been studied in isolation so far.},
  funding   = {This research was supported by the Israeli Ministry of Science and Technology and partly by UEFISCDI, PNII-IDPCE-2011-3-0959. We are grateful to Noam Ordan for his advices and helpful suggestions.},
}