Automatically assigned DDC number: 00635
Manually assigned DDC number: 00635
Number of references: 8
Title: Homonymy and Polysemy in Information Retrieval
Author:
Subject: Robert Krovetz Homonymy and Polysemy in Information Retrieval
Description: This paper discusses research on distinguishing word meanings in the context of information retrieval systems. We conducted experiments with three sources of evidence for making these distinctions: morphology, part-of-speech, and phrases. We have focused on the distinction between homonymy and polysemy (unrelated vs. related meanings). Our results support the need to distinguish homonymy and polysemy. We found: 1) grouping morphological variants makes a significant improvement in retrieval performance, 2) that more than half of all words in a dictionary that differ in part-of-speech are related in meaning, and 3) that it is crucial to assign credit to the component words of a phrase. These experiments provide a better understanding of word-based methods, and suggest where natural language processing can provide further improvements in retrieval performance. 1 Introduction Lexical ambiguity is a fundamental problem in natural language processing, but relatively little quantitative inf...
Contributor: The Pennsylvania State University CiteSeer Archives
Publisher: unknown
Date: 1997-12-05
Pubyear: 1997
Format: ps
Identifier: http://citeseer.ist.psu.edu/167170.html
Source: ftp://ftp.nj.nec.com/pub/krovetz/homonymy-polysemy.ps
Language: en
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Relation:
Rights: unrestricted
<?xml version="1.0" encoding="UTF-8"?>
<references_metadata>
<rec ID="/576559.html" Type="inproceedings" CiteSeer_Book="ACL Proceedings Second Conference on Applied Natural Language Processing" CiteSeer_Volume="" Title="A tool for investigating the synonymy relation in a sense disambiguated thesaurus,">
<identifier Org="ISBN:0805810889" Paper_ID="/576559.html" Extracted="0805810889" DDC="401/.43" Normalized_DDC="40143" Normalized_Weight="0.25" />
<identifier Org="ISBN:0818622059" Paper_ID="/576559.html" Extracted="0818622059" DDC="005.74" Normalized_DDC="00574" Normalized_Weight="0.25" />
<identifier Org="ISBN:0897913213" Paper_ID="/576559.html" Extracted="0897913213" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.25" />
<identifier Org="ISBN:1558601570" Paper_ID="/576559.html" Extracted="1558601570" DDC="621.3804" Normalized_DDC="6213804" Normalized_Weight="0.25" />
</rec>
<rec ID="/192832.html" Type="article" CiteSeer_Book="Computational Linguistics" CiteSeer_Volume="20" Title="Word Sense Disambiguation Using a Second Language Monolingual Corpus,">
<identifier Org="ISBN:0262611228" Paper_ID="/192832.html" Extracted="0262611228" DDC="410.72" Normalized_DDC="41072" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0387947019" Paper_ID="/192832.html" Extracted="0387947019" DDC="006.5/4" Normalized_DDC="00654" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:0818679190" Paper_ID="/192832.html" Extracted="0818679190" />
<identifier Org="ISBN:0824790006" Paper_ID="/192832.html" Extracted="0824790006" DDC="006.3/5" Normalized_DDC="00635" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:1402048092" Paper_ID="/192832.html" Extracted="1402048092" DDC="401/.430285" Normalized_DDC="401430285" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:157735236X" Paper_ID="/192832.html" Extracted="157735236X" />
<identifier Org="ISBN:3110155788" Paper_ID="/192832.html" Extracted="3110155788" DDC="410.1/51" Normalized_DDC="410151" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3110176165" Paper_ID="/192832.html" Extracted="3110176165" DDC="401/.43" Normalized_DDC="40143" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540210067" Paper_ID="/192832.html" Extracted="3540210067" DDC="410/.285" Normalized_DDC="410285" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540240179" Paper_ID="/192832.html" Extracted="3540240179" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540340459" Paper_ID="/192832.html" Extracted="3540340459" DDC="469.0285" Normalized_DDC="4690285" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540411178" Paper_ID="/192832.html" Extracted="3540411178" DDC="418/.02/0285" Normalized_DDC="418020285" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540415971" Paper_ID="/192832.html" Extracted="3540415971" DDC="006.3/1" Normalized_DDC="00631" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540652590" Paper_ID="/192832.html" Extracted="3540652590" DDC="418/.02/0285" Normalized_DDC="418020285" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:3540733442" Paper_ID="/192832.html" Extracted="3540733442" />
<identifier Org="ISBN:9027248079" Paper_ID="/192832.html" Extracted="9027248079" DDC="410.285" Normalized_DDC="410285" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:9042015306" Paper_ID="/192832.html" Extracted="9042015306" DDC="418.02" Normalized_DDC="41802" Normalized_Weight="0.06666666666666667" />
<identifier Org="ISBN:9629961482" Paper_ID="/192832.html" Extracted="9629961482" DDC="418.020285" Normalized_DDC="418020285" Normalized_Weight="0.06666666666666667" />
</rec>
<rec ID="/22021.html" Type="article" CiteSeer_Book="Information Systems" CiteSeer_Volume="10" Title="Lexical Ambiguity and Information Retrieval,">
<identifier Org="ISBN:019927634X" Paper_ID="/22021.html" Extracted="019927634X" DDC="410.285" Normalized_DDC="410285" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:038778702X" Paper_ID="/22021.html" Extracted="038778702X" DDC="610.285 22" Normalized_DDC="61028522" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:0387944540" Paper_ID="/22021.html" Extracted="0387944540" DDC="025.06/61" Normalized_DDC="0250661" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:0788129457" Paper_ID="/22021.html" Extracted="0788129457" />
<identifier Org="ISBN:0789023555" Paper_ID="/22021.html" Extracted="0789023555" DDC="025" Normalized_DDC="025" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:0792356853" Paper_ID="/22021.html" Extracted="0792356853" DDC="410/.285" Normalized_DDC="410285" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:079239710X" Paper_ID="/22021.html" Extracted="079239710X" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:0805811273" Paper_ID="/22021.html" Extracted="0805811273" DDC="413/.028" Normalized_DDC="413028" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:0898715008" Paper_ID="/22021.html" Extracted="0898715008" DDC="005.74" Normalized_DDC="00574" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:1402033435" Paper_ID="/22021.html" Extracted="1402033435" DDC="006.35" Normalized_DDC="00635" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:1581136463" Paper_ID="/22021.html" Extracted="1581136463" />
<identifier Org="ISBN:1588110168" Paper_ID="/22021.html" Extracted="1588110168" DDC="401/.4/0285" Normalized_DDC="40140285" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:1878289519" Paper_ID="/22021.html" Extracted="1878289519" DDC="658.4/038" Normalized_DDC="6584038" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:3540204091" Paper_ID="/22021.html" Extracted="3540204091" DDC="004" Normalized_DDC="004" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:3540213821" Paper_ID="/22021.html" Extracted="3540213821" DDC="005.74" Normalized_DDC="00574" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:3540261788" Paper_ID="/22021.html" Extracted="3540261788" DDC="021.65" Normalized_DDC="02165" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:354040550X" Paper_ID="/22021.html" Extracted="354040550X" DDC="005.74" Normalized_DDC="00574" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:3540413480" Paper_ID="/22021.html" Extracted="3540413480" DDC="004" Normalized_DDC="004" Normalized_Weight="0.058823529411764705" />
<identifier Org="ISBN:3540856536" Paper_ID="/22021.html" Extracted="3540856536" />
<identifier Org="ISBN:3790812994" Paper_ID="/22021.html" Extracted="3790812994" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.058823529411764705" />
</rec>
<rec ID="/50937.html" Type="inproceedings" CiteSeer_Book="Proceedings of the Sixteenth Annual International ACM SIGIR Conference on Research and Development in Information Retrieval" CiteSeer_Volume="" Title="{V}iewing {M}orphology as an {I}nference {P}rocess,," />
<rec ID="/29993.html" Type="inproceedings" CiteSeer_Book="Proceedings of SIGIR94 17th ACM International Conference on Research and Development in Information Retrieval" CiteSeer_Volume="" Title="Word sense disambiguation and information retrieval,">
<identifier Org="ISBN:0130950696" Paper_ID="/29993.html" Extracted="0130950696" DDC="410/.285" Normalized_DDC="410285" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:019927634X" Paper_ID="/29993.html" Extracted="019927634X" DDC="410.285" Normalized_DDC="410285" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:026206197X" Paper_ID="/29993.html" Extracted="026206197X" DDC="423/.1" Normalized_DDC="4231" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:038778702X" Paper_ID="/29993.html" Extracted="038778702X" DDC="610.285 22" Normalized_DDC="61028522" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:0792356853" Paper_ID="/29993.html" Extracted="0792356853" DDC="410/.285" Normalized_DDC="410285" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:1402048092" Paper_ID="/29993.html" Extracted="1402048092" DDC="401/.430285" Normalized_DDC="401430285" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:1402056338" Paper_ID="/29993.html" Extracted="1402056338" DDC="658.4038011" Normalized_DDC="6584038011" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:1558604545" Paper_ID="/29993.html" Extracted="1558604545" DDC="025.5/24" Normalized_DDC="025524" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:1581136463" Paper_ID="/29993.html" Extracted="1581136463" />
<identifier Org="ISBN:1581138814" Paper_ID="/29993.html" Extracted="1581138814" />
<identifier Org="ISBN:1595931406" Paper_ID="/29993.html" Extracted="1595931406" />
<identifier Org="ISBN:3540001972" Paper_ID="/29993.html" Extracted="3540001972" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:354019889X" Paper_ID="/29993.html" Extracted="354019889X" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540204946" Paper_ID="/29993.html" Extracted="3540204946" DDC="005.75/8" Normalized_DDC="005758" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540213821" Paper_ID="/29993.html" Extracted="3540213821" DDC="005.74" Normalized_DDC="00574" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540250700" Paper_ID="/29993.html" Extracted="3540250700" DDC="006.312" Normalized_DDC="006312" Normalized_Weight="0.07142857142857142" />
<identifier Org="ISBN:3540856536" Paper_ID="/29993.html" Extracted="3540856536" />
<identifier Org="ISBN:9051992734" Paper_ID="/29993.html" Extracted="9051992734" DDC="006.3/5" Normalized_DDC="00635" Normalized_Weight="0.07142857142857142" />
</rec>
<rec ID="/350487.html" Type="misc" CiteSeer_Book="" CiteSeer_Volume="" Title="Translation Mismatch in a Hybrid MT System," />
<rec ID="/322454.html" Type="book" CiteSeer_Book="Information Retrieval 2nd edition" CiteSeer_Volume="" Title="Information Retrieval, 2nd edition,">
<identifier Org="ISBN:0070544840" Paper_ID="/322454.html" Extracted="0070544840" DDC="025.5/2" Normalized_DDC="02552" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0789023555" Paper_ID="/322454.html" Extracted="0789023555" DDC="025" Normalized_DDC="025" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0792399269" Paper_ID="/322454.html" Extracted="0792399269" DDC="005.74/068" Normalized_DDC="00574068" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0849318254" Paper_ID="/322454.html" Extracted="0849318254" DDC="006.7" Normalized_DDC="0067" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0849318580" Paper_ID="/322454.html" Extracted="0849318580" DDC="006.7" Normalized_DDC="0067" Normalized_Weight="0.0625" />
<identifier Org="ISBN:0897910524" Paper_ID="/322454.html" Extracted="0897910524" DDC="025/.04 s" Normalized_DDC="02504" Normalized_Weight="0.0625" />
<identifier Org="ISBN:1558604545" Paper_ID="/322454.html" Extracted="1558604545" DDC="025.5/24" Normalized_DDC="025524" Normalized_Weight="0.0625" />
<identifier Org="ISBN:1586030132" Paper_ID="/322454.html" Extracted="1586030132" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540205896" Paper_ID="/322454.html" Extracted="3540205896" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540252959" Paper_ID="/322454.html" Extracted="3540252959" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540408304" Paper_ID="/322454.html" Extracted="3540408304" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540433430" Paper_ID="/322454.html" Extracted="3540433430" DDC="005.74" Normalized_DDC="00574" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540651012" Paper_ID="/322454.html" Extracted="3540651012" DDC="025/.00285" Normalized_DDC="02500285" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3540663320" Paper_ID="/322454.html" Extracted="3540663320" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:3790812994" Paper_ID="/322454.html" Extracted="3790812994" DDC="006.3" Normalized_DDC="0063" Normalized_Weight="0.0625" />
<identifier Org="ISBN:902724989X" Paper_ID="/322454.html" Extracted="902724989X" DDC="006.3/5" Normalized_DDC="00635" Normalized_Weight="0.0625" />
</rec>
<rec ID="/557091.html" Type="inproceedings" CiteSeer_Book="Proceedings of COLING92" CiteSeer_Volume="" Title="Word-Sense Disambiguation using Statistical Models of {Roget}'s Categories Trained on Large Corpora,">
<identifier Org="ISBN:2930344504" Paper_ID="/557091.html" Extracted="2930344504" />
<identifier Org="ISBN:3540725873" Paper_ID="/557091.html" Extracted="3540725873" />
</rec>
<rec ID="SELF" Type="SELF" CiteSeer_Book="SELF" CiteSeer_Volume="SELF" Title="Homonymy and Polysemy in Information Retrieval">
<identifier Org="ISBN:019927634X" Paper_ID="SELF" Extracted="019927634X" DDC="410.285" Normalized_DDC="410285" Normalized_Weight="0.14285714285714285" />
<identifier Org="ISBN:1402048092" Paper_ID="SELF" Extracted="1402048092" DDC="401/.430285" Normalized_DDC="401430285" Normalized_Weight="0.14285714285714285" />
<identifier Org="ISBN:1591404142" Paper_ID="SELF" Extracted="1591404142" DDC="006.3/12" Normalized_DDC="006312" Normalized_Weight="0.14285714285714285" />
<identifier Org="ISBN:2846270996" Paper_ID="SELF" Extracted="2846270996" DDC="400" Normalized_DDC="40" Normalized_Weight="0.14285714285714285" />
<identifier Org="ISBN:3540664947" Paper_ID="SELF" Extracted="3540664947" DDC="006.3/5" Normalized_DDC="00635" Normalized_Weight="0.14285714285714285" />
<identifier Org="ISBN:3540857591" Paper_ID="SELF" Extracted="3540857591" DDC="025.04" Normalized_DDC="02504" Normalized_Weight="0.14285714285714285" />
<identifier Org="ISBN:8484298809" Paper_ID="SELF" Extracted="8484298809" />
<identifier Org="ISBN:9027222797" Paper_ID="SELF" Extracted="9027222797" DDC="410/.285" Normalized_DDC="410285" Normalized_Weight="0.14285714285714285" />
</rec>
</references_metadata>