Title |
A Development Environment for Configurable Meta-Annotators in a Pipelined NLP Architecture |
Authors |
Youssef Drissi, Branimir Boguraev, David Ferrucci, Paul Keyser and Anthony Levas |
Abstract |
Information extraction from large data repositories is critical to Information Management solutions. In addition to the prerequisite corpus analysis needed to determine domain-specific characteristics of text resources, developing, refining and evaluating analytics entails a complex and lengthy process, typically requiring more than just domain expertise. Modern architectures for text processing, while facilitating reuse and (re-)composition of analytical pipelines, do place additional constraints upon analytics development, as domain experts need not only to configure individual annotator components, but also to situate these within a fully functional annotator pipeline. We present the design, and current status, of a tool for configuring model-driven annotators, which abstracts away from annotator implementation details, pipeline composition constraints, and data management. Instead, the tool embodies support for all stages of the ontology-centric model development cycle: from corpus analysis and concept definition, to model development and testing, to large-scale evaluation, to easy and rapid composition of text applications deploying these concept models. With our design, we aim to meet the needs of domain experts, who are not necessarily expert NLP practitioners. |
Language |
Language-independent |
Topics |
Tools, systems, applications, Information Extraction, Information Retrieval, Usability, user satisfaction |
Full paper |
A Development Environment for Configurable Meta-Annotators in a Pipelined NLP Architecture |
Slides |
A Development Environment for Configurable Meta-Annotators in a Pipelined NLP Architecture |
Bibtex |
@comment{LREC 2008 conference paper. People in author/editor are listed as
"Last, First" joined by "and" so each name is parsed individually. Nicoletta
Calzolari was Conference Chair; that role is recorded here because text in the
editor field would be parsed as part of a name. The conference days are given
in eventdate, which classic BibTeX styles ignore.}
@InProceedings{DRISSI08.820,
  author    = {Drissi, Youssef and Boguraev, Branimir and Ferrucci, David and Keyser, Paul and Levas, Anthony},
  title     = {A Development Environment for Configurable Meta-Annotators in a Pipelined {NLP} Architecture},
  booktitle = {Proceedings of the Sixth International Conference on Language Resources and Evaluation (LREC'08)},
  year      = {2008},
  month     = may,
  eventdate = {2008-05-28/2008-05-30},
  address   = {Marrakech, Morocco},
  editor    = {Calzolari, Nicoletta and Choukri, Khalid and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios and Tapias, Daniel},
  publisher = {European Language Resources Association (ELRA)},
  isbn      = {2-9517408-4-0},
  url       = {http://www.lrec-conf.org/proceedings/lrec2008/},
  language  = {english}
} |