Automatically assigned DDC number: 00635

Manually assigned DDC number: 00635

Number of references: 8

Title: Homonymy and Polysemy in Information Retrieval

Author:

Subject: Robert Krovetz Homonymy and Polysemy in Information Retrieval

Description: This paper discusses research on distinguishing word meanings in the context of information retrieval systems. We conducted experiments with three sources of evidence for making these distinctions: morphology, part-of-speech, and phrases. We have focused on the distinction between homonymy and polysemy (unrelated vs. related meanings). Our results support the need to distinguish homonymy and polysemy. We found: 1) grouping morphological variants makes a significant improvement in retrieval performance, 2) that more than half of all words in a dictionary that differ in part-of-speech are related in meaning, and 3) that it is crucial to assign credit to the component words of a phrase. These experiments provide a better understanding of word-based methods, and suggest where natural language processing can provide further improvements in retrieval performance. 1 Introduction Lexical ambiguity is a fundamental problem in natural language processing, but relatively little quantitative inf...

Contributor: The Pennsylvania State University CiteSeer Archives

Publisher: unknown

Date: 1997-12-05

Pubyear: 1997

Format: ps

Identifier: http://citeseer.ist.psu.edu/167170.html

Source: ftp://ftp.nj.nec.com/pub/krovetz/homonymy-polysemy.ps

Language: en

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Relation:

Rights: unrestricted

Graph

<?xml   version="1.0"   encoding="UTF-8"?>

<references_metadata>

      <rec   ID="/576559.html"   Type="inproceedings"   CiteSeer_Book="ACL   Proceedings   Second   Conference   on   Applied   Natural   Language   Processing"   CiteSeer_Volume=""   Title="A   tool   for   investigating   the   synonymy   relation   in   a   sense   disambiguated   thesaurus,">

            <identifier   Org="ISBN:0805810889"   Paper_ID="/576559.html"   Extracted="0805810889"   DDC="401/.43"   Normalized_DDC="40143"   Normalized_Weight="0.25"   />

            <identifier   Org="ISBN:0818622059"   Paper_ID="/576559.html"   Extracted="0818622059"   DDC="005.74"   Normalized_DDC="00574"   Normalized_Weight="0.25"   />

            <identifier   Org="ISBN:0897913213"   Paper_ID="/576559.html"   Extracted="0897913213"   DDC="025.04"   Normalized_DDC="02504"   Normalized_Weight="0.25"   />

            <identifier   Org="ISBN:1558601570"   Paper_ID="/576559.html"   Extracted="1558601570"   DDC="621.3804"   Normalized_DDC="6213804"   Normalized_Weight="0.25"   />

      </rec>

      <rec   ID="/192832.html"   Type="article"   CiteSeer_Book="Computational   Linguistics"   CiteSeer_Volume="20"   Title="Word   Sense   Disambiguation   Using   a   Second   Language   Monolingual   Corpus,">

            <identifier   Org="ISBN:0262611228"   Paper_ID="/192832.html"   Extracted="0262611228"   DDC="410.72"   Normalized_DDC="41072"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0387947019"   Paper_ID="/192832.html"   Extracted="0387947019"   DDC="006.5/4"   Normalized_DDC="00654"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:0818679190"   Paper_ID="/192832.html"   Extracted="0818679190"   />

            <identifier   Org="ISBN:0824790006"   Paper_ID="/192832.html"   Extracted="0824790006"   DDC="006.3/5"   Normalized_DDC="00635"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:1402048092"   Paper_ID="/192832.html"   Extracted="1402048092"   DDC="401/.430285"   Normalized_DDC="401430285"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:157735236X"   Paper_ID="/192832.html"   Extracted="157735236X"   />

            <identifier   Org="ISBN:3110155788"   Paper_ID="/192832.html"   Extracted="3110155788"   DDC="410.1/51"   Normalized_DDC="410151"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3110176165"   Paper_ID="/192832.html"   Extracted="3110176165"   DDC="401/.43"   Normalized_DDC="40143"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540210067"   Paper_ID="/192832.html"   Extracted="3540210067"   DDC="410/.285"   Normalized_DDC="410285"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540240179"   Paper_ID="/192832.html"   Extracted="3540240179"   DDC="025.04"   Normalized_DDC="02504"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540340459"   Paper_ID="/192832.html"   Extracted="3540340459"   DDC="469.0285"   Normalized_DDC="4690285"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540411178"   Paper_ID="/192832.html"   Extracted="3540411178"   DDC="418/.02/0285"   Normalized_DDC="418020285"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540415971"   Paper_ID="/192832.html"   Extracted="3540415971"   DDC="006.3/1"   Normalized_DDC="00631"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540652590"   Paper_ID="/192832.html"   Extracted="3540652590"   DDC="418/.02/0285"   Normalized_DDC="418020285"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:3540733442"   Paper_ID="/192832.html"   Extracted="3540733442"   />

            <identifier   Org="ISBN:9027248079"   Paper_ID="/192832.html"   Extracted="9027248079"   DDC="410.285"   Normalized_DDC="410285"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:9042015306"   Paper_ID="/192832.html"   Extracted="9042015306"   DDC="418.02"   Normalized_DDC="41802"   Normalized_Weight="0.06666666666666667"   />

            <identifier   Org="ISBN:9629961482"   Paper_ID="/192832.html"   Extracted="9629961482"   DDC="418.020285"   Normalized_DDC="418020285"   Normalized_Weight="0.06666666666666667"   />

      </rec>

      <rec   ID="/22021.html"   Type="article"   CiteSeer_Book="Information   Systems"   CiteSeer_Volume="10"   Title="Lexical   Ambiguity   and   Information   Retrieval,">

            <identifier   Org="ISBN:019927634X"   Paper_ID="/22021.html"   Extracted="019927634X"   DDC="410.285"   Normalized_DDC="410285"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:038778702X"   Paper_ID="/22021.html"   Extracted="038778702X"   DDC="610.285   22"   Normalized_DDC="61028522"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:0387944540"   Paper_ID="/22021.html"   Extracted="0387944540"   DDC="025.06/61"   Normalized_DDC="0250661"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:0788129457"   Paper_ID="/22021.html"   Extracted="0788129457"   />

            <identifier   Org="ISBN:0789023555"   Paper_ID="/22021.html"   Extracted="0789023555"   DDC="025"   Normalized_DDC="025"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:0792356853"   Paper_ID="/22021.html"   Extracted="0792356853"   DDC="410/.285"   Normalized_DDC="410285"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:079239710X"   Paper_ID="/22021.html"   Extracted="079239710X"   DDC="025.04"   Normalized_DDC="02504"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:0805811273"   Paper_ID="/22021.html"   Extracted="0805811273"   DDC="413/.028"   Normalized_DDC="413028"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:0898715008"   Paper_ID="/22021.html"   Extracted="0898715008"   DDC="005.74"   Normalized_DDC="00574"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:1402033435"   Paper_ID="/22021.html"   Extracted="1402033435"   DDC="006.35"   Normalized_DDC="00635"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:1581136463"   Paper_ID="/22021.html"   Extracted="1581136463"   />

            <identifier   Org="ISBN:1588110168"   Paper_ID="/22021.html"   Extracted="1588110168"   DDC="401/.4/0285"   Normalized_DDC="40140285"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:1878289519"   Paper_ID="/22021.html"   Extracted="1878289519"   DDC="658.4/038"   Normalized_DDC="6584038"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:3540204091"   Paper_ID="/22021.html"   Extracted="3540204091"   DDC="004"   Normalized_DDC="004"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:3540213821"   Paper_ID="/22021.html"   Extracted="3540213821"   DDC="005.74"   Normalized_DDC="00574"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:3540261788"   Paper_ID="/22021.html"   Extracted="3540261788"   DDC="021.65"   Normalized_DDC="02165"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:354040550X"   Paper_ID="/22021.html"   Extracted="354040550X"   DDC="005.74"   Normalized_DDC="00574"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:3540413480"   Paper_ID="/22021.html"   Extracted="3540413480"   DDC="004"   Normalized_DDC="004"   Normalized_Weight="0.058823529411764705"   />

            <identifier   Org="ISBN:3540856536"   Paper_ID="/22021.html"   Extracted="3540856536"   />

            <identifier   Org="ISBN:3790812994"   Paper_ID="/22021.html"   Extracted="3790812994"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.058823529411764705"   />

      </rec>

      <rec   ID="/50937.html"   Type="inproceedings"   CiteSeer_Book="Proceedings   of   the   Sixteenth   Annual   International   ACM   SIGIR   Conference   on   Research   and   Development   in   Information   Retrieval"   CiteSeer_Volume=""   Title="Viewing   Morphology   as   an   Inference   Process,"   />

      <rec   ID="/29993.html"   Type="inproceedings"   CiteSeer_Book="Proceedings   of   SIGIR94   17th   ACM   International   Conference   on   Research   and   Development   in   Information   Retrieval"   CiteSeer_Volume=""   Title="Word   sense   disambiguation   and   information   retrieval,">

            <identifier   Org="ISBN:0130950696"   Paper_ID="/29993.html"   Extracted="0130950696"   DDC="410/.285"   Normalized_DDC="410285"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:019927634X"   Paper_ID="/29993.html"   Extracted="019927634X"   DDC="410.285"   Normalized_DDC="410285"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:026206197X"   Paper_ID="/29993.html"   Extracted="026206197X"   DDC="423/.1"   Normalized_DDC="4231"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:038778702X"   Paper_ID="/29993.html"   Extracted="038778702X"   DDC="610.285   22"   Normalized_DDC="61028522"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:0792356853"   Paper_ID="/29993.html"   Extracted="0792356853"   DDC="410/.285"   Normalized_DDC="410285"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:1402048092"   Paper_ID="/29993.html"   Extracted="1402048092"   DDC="401/.430285"   Normalized_DDC="401430285"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:1402056338"   Paper_ID="/29993.html"   Extracted="1402056338"   DDC="658.4038011"   Normalized_DDC="6584038011"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:1558604545"   Paper_ID="/29993.html"   Extracted="1558604545"   DDC="025.5/24"   Normalized_DDC="025524"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:1581136463"   Paper_ID="/29993.html"   Extracted="1581136463"   />

            <identifier   Org="ISBN:1581138814"   Paper_ID="/29993.html"   Extracted="1581138814"   />

            <identifier   Org="ISBN:1595931406"   Paper_ID="/29993.html"   Extracted="1595931406"   />

            <identifier   Org="ISBN:3540001972"   Paper_ID="/29993.html"   Extracted="3540001972"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:354019889X"   Paper_ID="/29993.html"   Extracted="354019889X"   DDC="025.04"   Normalized_DDC="02504"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540204946"   Paper_ID="/29993.html"   Extracted="3540204946"   DDC="005.75/8"   Normalized_DDC="005758"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540213821"   Paper_ID="/29993.html"   Extracted="3540213821"   DDC="005.74"   Normalized_DDC="00574"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540250700"   Paper_ID="/29993.html"   Extracted="3540250700"   DDC="006.312"   Normalized_DDC="006312"   Normalized_Weight="0.07142857142857142"   />

            <identifier   Org="ISBN:3540856536"   Paper_ID="/29993.html"   Extracted="3540856536"   />

            <identifier   Org="ISBN:9051992734"   Paper_ID="/29993.html"   Extracted="9051992734"   DDC="006.3/5"   Normalized_DDC="00635"   Normalized_Weight="0.07142857142857142"   />

      </rec>

      <rec   ID="/350487.html"   Type="misc"   CiteSeer_Book=""   CiteSeer_Volume=""   Title="Translation   Mismatch   in   a   Hybrid   MT   System,"   />

      <rec   ID="/322454.html"   Type="book"   CiteSeer_Book="Information   Retrieval   2nd   edition"   CiteSeer_Volume=""   Title="Information   Retrieval,   2nd   edition,">

            <identifier   Org="ISBN:0070544840"   Paper_ID="/322454.html"   Extracted="0070544840"   DDC="025.5/2"   Normalized_DDC="02552"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0789023555"   Paper_ID="/322454.html"   Extracted="0789023555"   DDC="025"   Normalized_DDC="025"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0792399269"   Paper_ID="/322454.html"   Extracted="0792399269"   DDC="005.74/068"   Normalized_DDC="00574068"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0849318254"   Paper_ID="/322454.html"   Extracted="0849318254"   DDC="006.7"   Normalized_DDC="0067"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0849318580"   Paper_ID="/322454.html"   Extracted="0849318580"   DDC="006.7"   Normalized_DDC="0067"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:0897910524"   Paper_ID="/322454.html"   Extracted="0897910524"   DDC="025/.04   s"   Normalized_DDC="02504"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:1558604545"   Paper_ID="/322454.html"   Extracted="1558604545"   DDC="025.5/24"   Normalized_DDC="025524"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:1586030132"   Paper_ID="/322454.html"   Extracted="1586030132"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540205896"   Paper_ID="/322454.html"   Extracted="3540205896"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540252959"   Paper_ID="/322454.html"   Extracted="3540252959"   DDC="025.04"   Normalized_DDC="02504"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540408304"   Paper_ID="/322454.html"   Extracted="3540408304"   DDC="025.04"   Normalized_DDC="02504"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540433430"   Paper_ID="/322454.html"   Extracted="3540433430"   DDC="005.74"   Normalized_DDC="00574"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540651012"   Paper_ID="/322454.html"   Extracted="3540651012"   DDC="025/.00285"   Normalized_DDC="02500285"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3540663320"   Paper_ID="/322454.html"   Extracted="3540663320"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:3790812994"   Paper_ID="/322454.html"   Extracted="3790812994"   DDC="006.3"   Normalized_DDC="0063"   Normalized_Weight="0.0625"   />

            <identifier   Org="ISBN:902724989X"   Paper_ID="/322454.html"   Extracted="902724989X"   DDC="006.3/5"   Normalized_DDC="00635"   Normalized_Weight="0.0625"   />

      </rec>

      <rec   ID="/557091.html"   Type="inproceedings"   CiteSeer_Book="Proceedings   of   COLING92"   CiteSeer_Volume=""   Title="Word-Sense   Disambiguation   using   Statistical   Models   of   Roget's   Categories   Trained   on   Large   Corpora,">

            <identifier   Org="ISBN:2930344504"   Paper_ID="/557091.html"   Extracted="2930344504"   />

            <identifier   Org="ISBN:3540725873"   Paper_ID="/557091.html"   Extracted="3540725873"   />

      </rec>

      <rec   ID="SELF"   Type="SELF"   CiteSeer_Book="SELF"   CiteSeer_Volume="SELF"   Title="Homonymy   and   Polysemy   in   Information   Retrieval">

            <identifier   Org="ISBN:019927634X"   Paper_ID="SELF"   Extracted="019927634X"   DDC="410.285"   Normalized_DDC="410285"   Normalized_Weight="0.14285714285714285"   />

            <identifier   Org="ISBN:1402048092"   Paper_ID="SELF"   Extracted="1402048092"   DDC="401/.430285"   Normalized_DDC="401430285"   Normalized_Weight="0.14285714285714285"   />

            <identifier   Org="ISBN:1591404142"   Paper_ID="SELF"   Extracted="1591404142"   DDC="006.3/12"   Normalized_DDC="006312"   Normalized_Weight="0.14285714285714285"   />

            <identifier   Org="ISBN:2846270996"   Paper_ID="SELF"   Extracted="2846270996"   DDC="400"   Normalized_DDC="40"   Normalized_Weight="0.14285714285714285"   />

            <identifier   Org="ISBN:3540664947"   Paper_ID="SELF"   Extracted="3540664947"   DDC="006.3/5"   Normalized_DDC="00635"   Normalized_Weight="0.14285714285714285"   />

            <identifier   Org="ISBN:3540857591"   Paper_ID="SELF"   Extracted="3540857591"   DDC="025.04"   Normalized_DDC="02504"   Normalized_Weight="0.14285714285714285"   />

            <identifier   Org="ISBN:8484298809"   Paper_ID="SELF"   Extracted="8484298809"   />

            <identifier   Org="ISBN:9027222797"   Paper_ID="SELF"   Extracted="9027222797"   DDC="410/.285"   Normalized_DDC="410285"   Normalized_Weight="0.14285714285714285"   />

      </rec>

</references_metadata>

www.000webhost.com