% Conference paper in a Springer proceedings volume.
% Conventions used in this entry:
%   - personal names are written as "Last, First" so name parsing is unambiguous;
%   - the publisher's city lives in "address", not in "publisher";
%   - "series" holds only the series title;
%   - "abstract", "keywords" and "language" are informational fields that
%     standard styles ignore.
% NOTE(review): the series volume number is not recorded here; add a "volume"
% field once it has been confirmed against the publisher's record.
@inproceedings{e2818943aa494f9db973587aea7c57f3,
  author    = {Quan, Xiaojun and Kit, Chunyu and Chen, Wuya},
  title     = {Collaborative matching for sentence alignment},
  editor    = {Sun, Maosong and Liu, Ting and Wang, Xiaojie and Liu, Zhiyuan and Liu, Yang},
  booktitle = {Chinese Computational Linguistics and Natural Language Processing Based on Naturally Annotated Big Data},
  series    = {Lecture Notes in Computer Science},
  publisher = {Springer},
  address   = {Cham},
  year      = {2018},
  month     = oct,
  pages     = {39--52},
  doi       = {10.1007/978-3-030-01716-3_4},
  isbn      = {978-3-030-01715-6},
  language  = {English},
  keywords  = {Machine translation, Sentence alignment},
  abstract  = {Existing sentence alignment methods are founded fundamentally on sentence length and lexical correspondences. Methods based on the former follow in general the length proportionality assumption that the lengths of sentences in one language tend to be proportional to that of their translations, and are known to bear poor adaptivity to new languages and corpora. In this paper, we attempt to interpret this assumption from a new perspective via the notion of collaborative matching, based on the observation that sentences can work collaboratively during alignment rather than separately as in previous studies. Our approach is tended to be independent on any specific language and corpus, so that it can be adaptively applied to a variety of texts without binding to any prior knowledge about the texts. We use one-to-one sentence alignment to illustrate this approach and implement two specific alignment methods, which are evaluated on six bilingual corpora of different languages and domains. Experimental results confirm the effectiveness of this collaborative matching approach.},
  note      = {17th China National Conference on Computational Linguistics, CCL 2018, and 6th International Symposium on Natural Language Processing Based on Naturally Annotated Big Data, NLP-NABD 2018; conference dates: 19--21 October 2018},
}