Multiword Expressions: A Pain in the Neck for NLP. Sag, I. A., Baldwin, T., Bond, F., Copestake, A., & Flickinger, D. In Computational Linguistics and Intelligent Text Processing, volume 2276 of Lecture Notes in Computer Science, pages 1–15, Berlin, Heidelberg, 2002. Springer.
doi  abstract   bibtex   
Multiword expressions are a key problem for the development of large-scale, linguistically sound natural language processing technology. This paper surveys the problem and some currently available analytic techniques. The various kinds of multiword expressions should be analyzed in distinct ways, including listing “words with spaces”, hierarchically organized lexicons, restricted combinatoric rules, lexical selection, “idiomatic constructions” and simple statistical affinity. An adequate comprehensive analysis of multiword expressions must employ both symbolic and statistical techniques.
@comment{
  Sag et al. (2002), conference paper in a Springer LNCS proceedings volume.
  Only the acronym NLP is brace-protected in the title; all other casing is
  left to the bibliography style. The abstract uses TeX quotes so the entry
  stays ASCII-only for classic BibTeX. NOTE(review): the volume number was
  added from the published LNCS record -- confirm against the DOI landing page.
}
@inproceedings{Sag_etal_mwe:2002,
	author = {Sag, Ivan A. and Baldwin, Timothy and Bond, Francis and Copestake, Ann and Flickinger, Dan},
	title = {Multiword Expressions: A Pain in the Neck for {NLP}},
	shorttitle = {Multiword Expressions},
	editor = {Gelbukh, Alexander},
	booktitle = {Computational Linguistics and Intelligent Text Processing},
	series = {Lecture Notes in Computer Science},
	volume = {2276},
	pages = {1--15},
	publisher = {Springer},
	address = {Berlin, Heidelberg},
	year = {2002},
	isbn = {978-3-540-45715-2},
	doi = {10.1007/3-540-45715-1_1},
	language = {en},
	keywords = {Combinatory Categorial Grammar, Compositional Account, Lexical Selection, Light Verb, Mass Noun},
	abstract = {Multiword expressions are a key problem for the development of large-scale, linguistically sound natural language processing technology. This paper surveys the problem and some currently available analytic techniques. The various kinds of multiword expressions should be analyzed in distinct ways, including listing ``words with spaces'', hierarchically organized lexicons, restricted combinatoric rules, lexical selection, ``idiomatic constructions'' and simple statistical affinity. An adequate comprehensive analysis of multiword expressions must employ both symbolic and statistical techniques.},
}

Downloads: 0