Title |
Tapping Huge Temporally Indexed Textual Resources with WCTAnalyze |
Authors |
Sebastian Gottwald, Matthias Richter, Gerhard Heyer and Gerik Scheuermann |
Abstract |
WCTAnalyze is a tool for storing, accessing and visually analyzing huge collections of temporally indexed data. It is motivated by applications in media analysis, business intelligence, etc., where higher-level analysis is performed on top of linguistically and statistically processed unstructured textual data. WCTAnalyze combines fast access with economical storage behaviour and provides many built-in visualization options for presenting results in detail as well as in contrast. It thus enables an efficient and effective way to explore chronological text patterns of word forms, their co-occurrence sets and co-occurrence set intersections. Digging deep into the co-occurrences of word forms that share the same semantic or syntactic description, some entities can be recognized as temporally related, whereas others differ significantly. This behaviour motivates approaches to interactively discovering events based on co-occurrence subsets. |
Language |
|
Topics |
Tools, systems, applications, LR Infrastructures and Architectures, Text mining |
Full paper |
Tapping Huge Temporally Indexed Textual Resources with WCTAnalyze |
Slides |
- |
Bibtex |
% LREC 2008 conference paper. Person names are written "Last, First" and joined with " and "
% so BibTeX parses each one separately. Nicoletta Calzolari was Conference Chair; that role
% is recorded here because it cannot be part of a name in the editor field.
@InProceedings{GOTTWALD08.117,
  author    = {Gottwald, Sebastian and Richter, Matthias and Heyer, Gerhard and Scheuermann, Gerik},
  title     = {Tapping Huge Temporally Indexed Textual Resources with {WCTAnalyze}},
  booktitle = {Proceedings of the Sixth International Conference on Language Resources and Evaluation ({LREC}'08)},
  year      = {2008},
  month     = may,
  eventdate = {2008-05-28/2008-05-30},
  address   = {Marrakech, Morocco},
  editor    = {Calzolari, Nicoletta and Choukri, Khalid and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios and Tapias, Daniel},
  publisher = {European Language Resources Association (ELRA)},
  isbn      = {2-9517408-4-0},
  url       = {http://www.lrec-conf.org/proceedings/lrec2008/},
  language  = {english}
} |