Title |
A Framework for Identity Resolution and Merging for Multi-source Information Extraction |
Authors |
Milena Yankova, Horacio Saggion and Hamish Cunningham |
Abstract |
In the context of ontology-based information extraction, identity resolution is the process of deciding whether an instance extracted from text refers to a known entity in the target domain (e.g. the ontology). We present an ontology-based framework for identity resolution which can be customized to different application domains and extraction tasks. Rules for identity resolution, which compute similarities between target and source entities based on class information and instance properties and values, can be defined for each class in the ontology. We present a case study of the application of the framework to the problem of multi-source job vacancy extraction. |
Language |
Multiple languages |
Topics |
Tools, systems, applications, Information Extraction, Information Retrieval, Ontologies |
Full paper |
A Framework for Identity Resolution and Merging for Multi-source Information Extraction |
Slides |
- |
Bibtex |
@comment{LREC 2008 paper entry. Person names use the "Last, First" form and are
joined by the keyword "and" so that each author and editor is parsed as a
separate name. The conference days (28-30 May 2008) are recorded as an ISO
range in eventdate, and the proceedings link is stored in url.}
@InProceedings{YANKOVA08.347,
  author    = {Yankova, Milena and Saggion, Horacio and Cunningham, Hamish},
  title     = {A Framework for Identity Resolution and Merging for Multi-source Information Extraction},
  booktitle = {Proceedings of the Sixth International Conference on Language Resources and Evaluation ({LREC}'08)},
  year      = {2008},
  month     = may,
  eventdate = {2008-05-28/2008-05-30},
  address   = {Marrakech, Morocco},
  editor    = {Calzolari, Nicoletta and Choukri, Khalid and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios and Tapias, Daniel},
  publisher = {European Language Resources Association (ELRA)},
  isbn      = {2-9517408-4-0},
  url       = {http://www.lrec-conf.org/proceedings/lrec2008/},
  language  = {english},
} |