% Conference paper from the AI 2000 proceedings (Lecture Notes in Computer Science series).
% NOTE(review): `day` is not a standard BibTeX field and is ignored by standard styles;
%   the value 19 lies outside the 14--17 May conference dates given in `note` --
%   presumably a publication date; confirm before relying on it.
% NOTE(review): the LNCS `volume` number is missing -- add it once verified via the DOI.
@inproceedings{5e1688ae24274d19bfcc62d6ef5d8514,
  author    = {McDonald, Scott and Turcato, Davide and McFetridge, Paul and Popowich, Fred and Toole, Janine},
  title     = {Collocation discovery for optimal bilingual lexicon development},
  editor    = {Hamilton, Howard J.},
  booktitle = {Proceedings of 13th Biennial Conference of the Canadian Society for Computational Studies of Intelligence ({AI} 2000)},
  series    = {Lecture Notes in Computer Science},
  pages     = {126--137},
  publisher = {Springer Verlag},
  address   = {Berlin, Heidelberg},
  year      = {2000},
  month     = may,
  day       = {19},
  doi       = {10.1007/3-540-45486-1_11},
  isbn      = {9783540675570},
  language  = {English},
  note      = {13th Biennial Conference of the Canadian Society for Computational Studies of Intelligence: Advances in Artificial Intelligence, AI 2000; Conference date: 14-05-2000 Through 17-05-2000},
  abstract  = {The accurate translation of collocations, or multi-word units, is essential for high quality machine translation. However, many collocations do not translate compositionally, thus requiring individual entries in the bilingual lexicon. We present a technique for collocation extraction from large corpora that takes into account the dispersion of the collocations throughout the corpus. Collocations are ranked to more accurately reflect how likely they are to occur in a wide variety of texts; collocations which are specific to a particular text are less useful for lexicon development. Once the collocations are extracted, appropriate bilingual lexical entries can be developed by lexicographers.},
}