2018
|
Kar, Sudipta; Maharjan, Suraj; López-Monroy, Pastor A; Solorio, Thamar MPST: A Corpus of Movie Plot Synopses with Tags Conference Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018), European Language Resources Association (ELRA), 2018. Abstract | Links | BibTeX | Tags: Information Extraction, Narrative Analysis, Sentiment analysis, Text Classification
% LREC 2018 paper describing the MPST corpus of movie plot synopses and tags.
% - url holds only the link that the original export labelled "Paper"; the
%   link labelled "Slide" is kept in the non-standard slidesurl field, which
%   bibliography styles ignore.
% - Braces around MPST / LREC keep the acronyms upper-case under styles that
%   recase titles.
% - pubstate / tppubtype are carried over unchanged (presumably metadata of
%   the exporting tool; confirm before removing).
@inproceedings{Kar2018,
  author     = {Kar, Sudipta and Maharjan, Suraj and López-Monroy, A. Pastor and Solorio, Thamar},
  title      = {{MPST}: A Corpus of Movie Plot Synopses with Tags},
  booktitle  = {Proceedings of the Eleventh International Conference on Language Resources and Evaluation ({LREC} 2018)},
  publisher  = {European Language Resources Association (ELRA)},
  year       = {2018},
  date       = {2018-05-10},
  url        = {http://sudiptakar.info/wp-content/uploads/2018/02/mpst-corpus-movie-2.pdf},
  slidesurl  = {http://sudiptakar.info/wp-content/uploads/2018/05/322_LREC_2018.pdf},
  abstract   = {Social tagging of movies reveals a wide range of heterogeneous information about movies, like the genre, plot structure, soundtracks, metadata, visual and emotional experiences. Such information can be valuable in building automatic systems to create tags for movies. Automatic tagging systems can help recommendation engines to improve the retrieval of similar movies as well as help viewers to know what to expect from a movie in advance. In this paper, we set out to the task of collecting a corpus of movie plot synopses and tags. We describe a methodology that enabled us to build a fine-grained set of around 70 tags exposing heterogeneous characteristics of movie plots and the multi-label associations of these tags with some 14K movie plot synopses. We investigate how these tags correlate with movies and the flow of emotions throughout different types of movies. Finally, we use this corpus to explore the feasibility of inferring tags from plot synopses. We expect the corpus will be useful in other tasks where analysis of narratives is relevant.},
  keywords   = {Information Extraction, Narrative Analysis, Sentiment analysis, Text Classification},
  pubstate   = {published},
  tppubtype  = {conference}
}
Social tagging of movies reveals a wide range of heterogeneous information about movies, like the genre, plot structure, soundtracks, metadata, visual and emotional experiences. Such information can be valuable in building automatic systems to create tags for movies. Automatic tagging systems can help recommendation engines to improve the retrieval of similar movies as well as help viewers to know what to expect from a movie in advance. In this paper, we set out to the task of collecting a corpus of movie plot synopses and tags. We describe a methodology that enabled us to build a fine-grained set of around 70 tags exposing heterogeneous characteristics of movie plots and the multi-label associations of these tags with some 14K movie plot synopses. We investigate how these tags correlate with movies and the flow of emotions throughout different types of movies. Finally, we use this corpus to explore the feasibility of inferring tags from plot synopses. We expect the corpus will be useful in other tasks where analysis of narratives is relevant. |
2014
|
Osborne, John David; Gyawali, Binod; Solorio, Thamar Evaluation of YTEX and MetaMap for clinical concept recognition Journal Article CoRR, abs/1402.1668 , 2014. Links | BibTeX | Tags: Clinical Applications, Information Extraction
% arXiv preprint (CoRR abs/1402.1668).
% - journal / volume keep the CoRR convention already used by this entry;
%   eprint + archiveprefix are added so arXiv-aware styles can link the
%   preprint directly.
% - date is given to month precision only: the arXiv identifier prefix 1402
%   encodes February 2014, and no exact day is recorded here.
% - Braces around YTEX / MetaMap preserve their capitalisation under styles
%   that recase titles.
% - pubstate / tppubtype are carried over unchanged (presumably metadata of
%   the exporting tool; confirm before removing).
@article{OsborneEtAl:14,
  author        = {Osborne, John David and Gyawali, Binod and Solorio, Thamar},
  title         = {Evaluation of {YTEX} and {MetaMap} for clinical concept recognition},
  journal       = {CoRR},
  volume        = {abs/1402.1668},
  year          = {2014},
  date          = {2014-02},
  eprint        = {1402.1668},
  archiveprefix = {arXiv},
  url           = {http://arxiv.org/abs/1402.1668},
  keywords      = {Clinical Applications, Information Extraction},
  pubstate      = {published},
  tppubtype     = {article}
}
|
2013
|
Gyawali, Binod; Ramirez-de-la-Rosa, Gabriela; Solorio, Thamar Native Language Identification: a Simple n-gram Based Approach Inproceedings Proceedings of the Eighth Workshop on Innovative Use of NLP for Building Educational Applications, pp. 224–231, ACL, Atlanta, Georgia, 2013. Links | BibTeX | Tags: Information Extraction, Profiling
% Workshop paper on native language identification with n-grams.
% Author names use the unambiguous "Last, First" form; field values are
% otherwise the same as in the original export.
@inproceedings{GyawaliEtAl:13,
  author    = {Gyawali, Binod and Ramirez-de-la-Rosa, Gabriela and Solorio, Thamar},
  title     = {Native Language Identification: a Simple n-gram Based Approach},
  booktitle = {Proceedings of the Eighth Workshop on Innovative Use of NLP for Building Educational Applications},
  pages     = {224--231},
  publisher = {ACL},
  address   = {Atlanta, Georgia},
  year      = {2013},
  date      = {2013-06-01},
  url       = {http://www.aclweb.org/anthology/W13-1729},
  keywords  = {Information Extraction, Profiling},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|
Osborne, John David; Gyawali, Binod; Solorio, Thamar Evaluation of freely available open source software for clinical concept recognition Inproceedings Notebook for ShARe/CLEF eHealth Evaluation Lab at CLEF 2013, 2013. BibTeX | Tags: Clinical Applications, Information Extraction
% Notebook paper for the ShARe/CLEF eHealth Evaluation Lab at CLEF 2013.
% Author names use the unambiguous "Last, First" form; field values are
% otherwise the same as in the original export.
@inproceedings{OsborneEtAl:13,
  author    = {Osborne, John David and Gyawali, Binod and Solorio, Thamar},
  title     = {Evaluation of freely available open source software for clinical concept recognition},
  booktitle = {Notebook for ShARe/CLEF eHealth Evaluation Lab at CLEF 2013},
  year      = {2013},
  date      = {2013-01-01},
  keywords  = {Clinical Applications, Information Extraction},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
|