% LREC 2012 conference paper by Iosif and Potamianos on the SemSim resources.
% The proceedings title is stored once, in booktitle: the exported record also
% repeated it in a series field, which standard styles print a second time.
% Only case-sensitive words (SemSim, LREC) are brace-protected.
@inproceedings{531432fa51a04470a3c360465fb1b477,
  author    = {Iosif, Elias and Potamianos, Alexandros},
  title     = {{SemSim}: Resources for normalized semantic similarity computation using lexical networks},
  booktitle = {Proceedings of the 8th International Conference on Language Resources and Evaluation, {LREC} 2012},
  editor    = {Dogan, Mehmet Ugur and Mariani, Joseph and Moreno, Asuncion and Goggi, Sara and Choukri, Khalid and Calzolari, Nicoletta and Odijk, Jan and Declerck, Thierry and Maegaard, Bente and Piperidis, Stelios and Mazo, Helene and Hamon, Olivier},
  publisher = {European Language Resources Association (ELRA)},
  year      = {2012},
  pages     = {3499--3504},
  language  = {English},
  keywords  = {Distributional semantic models, Lexical networks, Semantic similarity},
  abstract  = {We investigate the creation of corpora from web-harvested data following a scalable approach that has linear query complexity. Individual web queries are posed for a lexicon that includes thousands of nouns and the retrieved data are aggregated. A lexical network is constructed, in which the lexicon nouns are linked according to their context-based similarity. We introduce the notion of semantic neighborhoods, which are exploited for the computation of semantic similarity. Two types of normalization are proposed and evaluated on the semantic tasks of: (i) similarity judgement, and (ii) noun categorization and taxonomy creation. The created corpus along with a set of tools and noun similarities are made publicly available.},
  note      = {Conference dates: 21--27 May 2012},
}