@prefix epid: .
@prefix dc: .
@prefix geo: .
@prefix bibo: .
@prefix epx: .
@prefix owl: .
@prefix void: .
@prefix event: .
@prefix skos: .
@prefix xsd: .
@prefix cc: .
@prefix ep: .
@prefix foaf: .
@prefix rdf: .
@prefix rdfs: .
@prefix eprel: .
@prefix dct: .
<>
foaf:primaryTopic ;
rdfs:comment "The repository administrator has not yet configured an RDF license."^^xsd:string .
rdfs:label "ECML2001.ps"^^xsd:string .
rdfs:label "preview.png"^^xsd:string .
rdfs:label "ECML2001.pdf"^^xsd:string .
rdfs:label "indexcodes.txt"^^xsd:string .
dc:format "text/html";
dc:title "HTML Summary of #1796 \n\nMining the Web for Synonyms: PMI-IR versus LSA on TOEFL\n\n";
foaf:primaryTopic .
dct:hasPart ;
ep:hasFile ;
eprel:hasVersion ;
eprel:hasVolatileVersion ;
eprel:haspreviewThumbnailVersion ;
rdf:type bibo:Document,
ep:Document;
rdfs:label "Mining the Web for Synonyms: PMI-IR versus LSA on TOEFL (Postscript)"^^xsd:string .
dct:hasPart ;
ep:hasFile ;
eprel:isVersionOf ;
eprel:isVolatileVersionOf ;
eprel:ispreviewThumbnailVersionOf ;
rdf:type ep:Document;
rdfs:label "Mining the Web for Synonyms: PMI-IR versus LSA on TOEFL (Image (PNG))"^^xsd:string .
dct:hasPart ;
ep:hasFile ;
eprel:hasIndexCodesVersion ;
eprel:hasVersion ,
;
eprel:hasVolatileVersion ,
;
eprel:haspreviewThumbnailVersion ;
rdf:type bibo:Document,
ep:Document;
rdfs:label "Mining the Web for Synonyms: PMI-IR versus LSA on TOEFL (PDF)"^^xsd:string .
dct:hasPart ;
ep:hasFile ;
eprel:isIndexCodesVersionOf ;
eprel:isVersionOf ;
eprel:isVolatileVersionOf ;
rdf:type ep:Document;
rdfs:label "Mining the Web for Synonyms: PMI-IR versus LSA on TOEFL (Indexer Terms)"^^xsd:string .
rdf:_1 .
rdf:_1 ;
rdf:_2 .
,
;
bibo:abstract "This paper presents a simple unsupervised learning algorithm for recognizing synonyms, based on statistical data acquired by querying a Web search engine. The algorithm, called PMI-IR, uses Pointwise Mutual Information (PMI) and Information Retrieval (IR) to measure the similarity of pairs of words. PMI-IR is empirically evaluated using 80 synonym test questions from the Test of English as a Foreign Language (TOEFL) and 50 synonym test questions from a collection of tests for students of English as a Second Language (ESL). On both tests, the algorithm obtains a score of 74%. PMI-IR is contrasted with Latent Semantic Analysis (LSA), which achieves a score of 64% on the same 80 TOEFL questions. The paper discusses potential applications of the new unsupervised learning algorithm and some implications of the results for LSA and LSI (Latent Semantic Indexing). \n\n"^^xsd:string;
bibo:authorList ;
bibo:editorList ;
bibo:status ,
;
dct:creator ;
dct:date "2001";
dct:isPartOf ;
dct:publisher ;
dct:subject ,
,
;
dct:title "Mining the Web for Synonyms: PMI-IR versus LSA on TOEFL"^^xsd:string;
ep:hasDocument ,
,
,
;
rdf:type bibo:Article,
ep:ConfpaperEPrint,
ep:EPrint;
rdfs:seeAlso .
rdf:type skos:Concept;
skos:prefLabel "Language" .
rdf:type skos:Concept;
skos:prefLabel "Machine Learning" .
rdf:type skos:Concept;
skos:prefLabel "Statistical Models" .
foaf:name "Springer-Verlag"^^xsd:string;
rdf:type foaf:Organization .
foaf:familyName "De Raedt"^^xsd:string;
foaf:givenName "Luc"^^xsd:string;
foaf:name "Luc De Raedt"^^xsd:string;
rdf:type foaf:Person .
foaf:familyName "Flach"^^xsd:string;
foaf:givenName "Peter"^^xsd:string;
foaf:name "Peter Flach"^^xsd:string;
rdf:type foaf:Person .
foaf:familyName "Turney"^^xsd:string;
foaf:givenName "Peter"^^xsd:string;
foaf:name "Peter Turney"^^xsd:string;
rdf:type foaf:Person .