Title |
An Examination of Cross-Cultural Similarities and Differences from Social Media Data with respect to Language Use |
Authors |
Mohammad Fazleh Elahi and Paola Monachesi |
Abstract |
We present a methodology for analyzing cross-cultural similarities and differences using language as a medium, love as domain, social media as a data source and 'Terms' and 'Topics' as cultural features. We discuss the techniques necessary for the creation of the social data corpus from which emotion terms have been extracted using NLP techniques. Topics of love discussion were then extracted from the corpus by means of Latent Dirichlet Allocation (LDA). Finally, on the basis of these features, a cross-cultural comparison was carried out. For the purpose of cross-cultural analysis, the experimental focus was on comparing data from a culture from the East (India) with a culture from the West (United States of America). Similarities and differences between these cultures have been analyzed with respect to the usage of emotions, their intensities and the topics used during love discussion in social media. |
Topics |
Corpus (creation, annotation, etc.), Topic detection & tracking, Emotion Recognition/Generation |
Full paper |
An Examination of Cross-Cultural Similarities and Differences from Social Media Data with respect to Language Use |
Bibtex |
@InProceedings{ELAHI12.942,
author = {Mohammad Fazleh Elahi and Paola Monachesi}, title = {An Examination of Cross-Cultural Similarities and Differences from Social Media Data with respect to Language Use}, booktitle = {Proceedings of the Eight International Conference on Language Resources and Evaluation (LREC'12)}, year = {2012}, month = {may}, date = {23-25}, address = {Istanbul, Turkey}, editor = {Nicoletta Calzolari (Conference Chair) and Khalid Choukri and Thierry Declerck and Mehmet Uğur Doğan and Bente Maegaard and Joseph Mariani and Asuncion Moreno and Jan Odijk and Stelios Piperidis}, publisher = {European Language Resources Association (ELRA)}, isbn = {978-2-9517408-7-7}, language = {english} } |