% Goldberg, Tsarfaty, Adler, Elhadad (EACL 2009): unlexicalized Hebrew PCFG parsing
% with an external lexicon. Citation key kept unchanged so existing citations resolve.
% Cleanup notes:
%   - the series field was dropped: it was a verbatim copy of booktitle and made
%     standard styles print the venue twice;
%   - month is mar (the conference opened 30-03-2009 per the note field); the former
%     jan / day 1 values were a year-only export placeholder;
%   - NOTE(review): address holds only a country; replace it with the publisher's
%     city once confirmed.
@inproceedings{02c114c3673e4733ba7dba17c2d360d5,
  author    = {Goldberg, Yoav and Tsarfaty, Reut and Adler, Meni and Elhadad, Michael},
  title     = {Enhancing unlexicalized parsing performance using a wide coverage lexicon, fuzzy tag-set mapping, and {EM-HMM}-based lexical probabilities},
  booktitle = {EACL 2009 - 12th Conference of the European Chapter of the Association for Computational Linguistics, Proceedings},
  publisher = {Association for Computational Linguistics (ACL)},
  address   = {United States},
  year      = {2009},
  month     = mar,
  pages     = {327--335},
  doi       = {10.3115/1609067.1609103},
  isbn      = {9781932432169},
  language  = {English},
  note      = {12th Conference of the European Chapter of the Association for Computational Linguistics, EACL 2009 ; Conference date: 30-03-2009 Through 03-04-2009},
  abstract  = {We present a framework for interfacing a PCFG parser with lexical information from an external resource following a different tagging scheme than the treebank. This is achieved by defining a stochastic mapping layer between the two resources. Lexical probabilities for rare events are estimated in a semi-supervised manner from a lexicon and large unannotated corpora. We show that this solution greatly enhances the performance of an unlexicalized Hebrew PCFG parser, resulting in state-of-the-art Hebrew parsing results both when a segmentation oracle is assumed, and in a real-word parsing scenario of parsing unsegmented tokens.},
}