% % GENERATED FROM https://www.coli.uni-saarland.de % by : anonymous % IP : coli2006.lst.uni-saarland.de % at : Mon, 05 Feb 2024 15:43:02 +0100 GMT % % Selection : Reference #677 % @InProceedings{Keller_et_al:2002, AUTHOR = {Keller, Frank and Lapata, Mirella and Ourioupina, Olga}, TITLE = {Using the Web to Overcome Data Sparseness}, YEAR = {2002}, BOOKTITLE = {Proceedings of the Conference on Empirical Methods in Natural Language Processing}, PAGES = {230-237}, EDITOR = {Hajic, Jan and Matsumoto, Yuji}, ADDRESS = {Philadelphia, USA}, URL = {http://www.iccs.informatics.ed.ac.uk/~keller/papers/emnlp02.pdf}, ABSTRACT = {This paper shows that the web can be employed to obtain frequencies for bigrams that are unseen in a given corpus. We describe a method for retrieving counts for adjective-noun, noun-noun, and verb-object bigrams from the web by querying a search engine. We evaluate this method by demonstrating that web frequencies and correlate with frequencies obtained from a carefully edited, balanced corpus. We also perform a task-based evaluation, showing that web frequencies can reliably predict human plausibility judgments.}, ANNOTE = {COLIURL : Keller:2002:UWO.pdf} }