Title |
WikiNet: A Very Large Scale Multi-Lingual Concept Network |
Authors |
Vivi Nastase, Michael Strube, Benjamin Boerschinger, Caecilia Zirn and Anas Elghafari |
Abstract |
This paper describes a multi-lingual large-scale concept network obtained automatically by mining for concepts and relations and exploiting a variety of sources of knowledge from Wikipedia. Concepts and their lexicalizations are extracted from Wikipedia pages, in particular from article titles, hyperlinks, disambiguation pages and cross-language links. Relations are extracted from the category and page network, from the category names, from infoboxes and the body of the articles. The resulting network has two main components: (i) a central, language-independent index of concepts, which serves to keep track of the concepts' lexicalizations both within a language and across languages, and to separate linguistic expressions of concepts from the relations in which they are involved (concepts themselves are represented as numeric IDs); (ii) a large network built on the basis of the relations extracted, represented as relations between concepts (more specifically, the numeric IDs). The various stages of obtaining the network were separately evaluated, and the results show a qualitative resource. |
Language |
Multilinguality |
Topics |
Ontologies, Knowledge Discovery/Representation, Multilinguality |
Full paper  |
WikiNet: A Very Large Scale Multi-Lingual Concept Network |
Bibtex |
@comment{Conference paper record. Person names are stored as "Last, First" and joined with " and " so BibTeX can split them; the citation key is unchanged so existing citations keep resolving. The conference-chair role is kept in the ignored internal-note field instead of inside the editor name.}
@inproceedings{NASTASE10.615,
  author        = {Nastase, Vivi and Strube, Michael and Boerschinger, Benjamin and Zirn, Caecilia and Elghafari, Anas},
  title         = {{WikiNet}: A Very Large Scale Multi-Lingual Concept Network},
  booktitle     = {Proceedings of the Seventh International Conference on Language Resources and Evaluation ({LREC}'10)},
  editor        = {Calzolari, Nicoletta and Choukri, Khalid and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios and Rosner, Mike and Tapias, Daniel},
  publisher     = {European Language Resources Association (ELRA)},
  address       = {Valletta, Malta},
  year          = {2010},
  month         = may,
  eventdate     = {2010-05-19/2010-05-21},
  isbn          = {2-9517408-6-7},
  language      = {english},
  internal-note = {Nicoletta Calzolari served as Conference Chair},
} |