BIS 2008

BIS record '2007/1/449'

@comment{
  Conference paper from the BIS 2007 proceedings.
  Shared proceedings data (editor, booktitle, publisher, isbn) is inherited
  through the crossref field from the BIS:2007/1 entry that follows; classic
  BibTeX requires that parent entry to appear after this one.
  The session, bibsource and abstract fields are not standard BibTeX fields;
  standard styles ignore them.
  NOTE(review): the entry delimiters were missing in the source. The citation
  key below is reconstructed from the record id above and the crossref key
  pattern -- confirm against the BIS database.
  NOTE(review): the abstract reads "it does need the application of a parser";
  the context (only simple tools are used) suggests "does not need" -- confirm
  against the published abstract before changing it.
}
@inproceedings{BIS:2007/1/449,
  author        = {Piasecki, Maciej and
                   Broda, Bartosz},
  title         = {Semantic Similarity Measure of {Polish} Nouns Based on Linguistic Features},
  year          = {2007},
  session       = {Information Retrieval},
  pages         = {384--393},
  crossref      = {BIS:2007/1},
  bibsource     = {BIS,},
  abstract      = {A word-to-word similarity function automatically extracted from a corpus of texts can be a very helpful tool in automatic extraction of lexical semantic relations. There are many approaches for English, but only few for inflective languages with almost free word order. In the paper a method for the construction of a similarity function of Polish nouns is proposed. The method uses only simple tools for language processing (e.g.\ it does need the application of a parser). The core is the construction of a matrix of co-occurrences of nouns and adjectives on the basis of application of morpho-syntactic constraints testing agreement between an adjective and a noun. Several methods of transformation of the matrix and calculation of the similarity function are presented. The achieved accuracy of 81.04\% in WordNet-based Synonymy Test (for 4~611 Polish nouns, using the current version of Polish WordNet) seems to be comparable with the best results reported for English.},
}

@comment{
  Parent proceedings volume referenced by crossref from the paper entry above.
  booktitle duplicates title on purpose: classic BibTeX copies fields to the
  child verbatim and does not map title to booktitle.
}
@proceedings{BIS:2007/1,
  editor        = {Abramowicz, Witold},
  booktitle     = {Business Information Systems, 10th International Conference, {BIS} 2007, {Pozna{\'n}}, {Poland}, {April} 2007},
  title         = {Business Information Systems, 10th International Conference, {BIS} 2007, {Pozna{\'n}}, {Poland}, {April} 2007},
  publisher     = {Springer-Verlag},
  isbn          = {978-3-540-72034-8},
  year          = {2007},
  bibsource     = {BIS,},
}

BIS index BIS 2007
Dept. of Information Systems at Poznan University of Economics, Dominik Flejter