2017
Aguilar, Gustavo; Maharjan, Suraj; López Monroy, A. Pastor; Solorio, Thamar
A Multi-task Approach for Named Entity Recognition on Social Media Data Inproceedings
In: Proceedings of 3rd Workshop on Noisy User-generated Text, WNUT 2017., 2017, (Ranked 1st place in the two evaluation metrics).
Abstract | Links | BibTeX | Tags: CRF, Deeplearning, Multitask, NER
% WNUT 2017 shared-task paper. Authors are joined with " and " (the only
% separator BibTeX recognises); the compound surname is given in
% "Last, First" form so that it is not split.
@inproceedings{aguilar-EtAl:2017:WNUT,
  author    = {Aguilar, Gustavo and Maharjan, Suraj and López Monroy, A. Pastor and Solorio, Thamar},
  title     = {A Multi-task Approach for Named Entity Recognition on Social Media Data},
  booktitle = {Proceedings of 3rd Workshop on Noisy User-generated Text, WNUT 2017},
  year      = {2017},
  date      = {2017-09-07},
  url       = {http://www.aclweb.org/anthology/W17-4419},
  note      = {Ranked 1st place in the two evaluation metrics},
  abstract  = {Named Entity Recognition for social media data is challenging because of its inherent noisiness. In addition to improper grammatical structures, it contains spelling inconsistencies and numerous informal abbreviations. We propose a novel multi-task approach by employing a more general secondary task of Named Entity (NE) segmentation together with the primary task of fine-grained NE categorization. The multi-task neural network architecture learns higher order feature representations from word and character sequences along with basic Part-of-Speech tags and gazetteer information. This neural network acts as a feature extractor to feed a Conditional Random Fields classifier. We were able to obtain the first position in the 3rd Workshop on Noisy User-generated Text (WNUT-2017) with a 41.86% entity F1-score and a 40.24% surface F1-score.},
  keywords  = {CRF, Deeplearning, Multitask, NER},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Samghabadi, Niloofar S.; Maharjan, Suraj; Sprague, Alan; Sprague, Raquel D.; Solorio, Thamar
Detecting Nastiness in Social Media Inproceedings
In: ALW1@ACL2017, 2017.
Links | BibTeX | Tags: Abusive Language detection
% ALW1 workshop paper (ACL 2017). Author names are joined with " and ";
% a comma-separated list is read by BibTeX as one malformed name.
@inproceedings{safisamghabadi-EtAl:2017:ALW1,
  author    = {Samghabadi, Niloofar S. and Maharjan, Suraj and Sprague, Alan and Sprague, Raquel D. and Solorio, Thamar},
  title     = {Detecting Nastiness in Social Media},
  booktitle = {ALW1@ACL2017},
  year      = {2017},
  date      = {2017-08-04},
  url       = {http://aclweb.org/anthology/W17-3010},
  keywords  = {Abusive Language detection},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Kar, Sudipta; Maharjan, Suraj; Solorio, Thamar
RiTUAL-UH at SemEval-2017 Task 5: Sentiment Analysis on Financial Data Using Neural Networks Inproceedings
In: Proceedings of the 11th International Workshop on Semantic Evaluation (SemEval-2017), 2017, (Ranked 2nd for Subtask 2. With alternate scoring, ranked 1st in both subtasks.).
Abstract | Links | BibTeX | Tags: CNN, Neural Networks, Sentiment analysis
% SemEval-2017 Task 5 system description. The proceedings title belongs in
% booktitle (required for inproceedings), not in publisher.
@inproceedings{Kar2017,
  author    = {Sudipta Kar and Suraj Maharjan and Thamar Solorio},
  title     = {RiTUAL-UH at SemEval-2017 Task 5: Sentiment Analysis on Financial Data Using Neural Networks},
  booktitle = {Proceedings of the 11th International Workshop on Semantic Evaluation (SemEval-2017)},
  year      = {2017},
  date      = {2017-08-03},
  url       = {http://www.aclweb.org/anthology/S17-2150},
  note      = {Ranked 2nd for Subtask 2. With alternate scoring, ranked 1st in both subtasks.},
  abstract  = {In this paper, we present our systems for the “SemEval-2017 Task-5 on FineGrained Sentiment Analysis on Financial Microblogs and News”. In our system, we combined hand-engineered lexical, sentiment and metadata features, the representations learned from Convolutional Neural Networks (CNN) and Bidirectional Gated Recurrent Unit (Bi-GRU) with Attention model applied on top. With this architecture, we obtained weighted cosine similarity scores of 72.34% and 74.37% for subtask-1 and subtask-2, respectively. Using the official scoring system, our system ranked the second place for subtask-2 and eighth place for the subtask-1. It ranked first for both of the subtasks by the scores achieved by an alternate scoring system.},
  keywords  = {CNN, Neural Networks, Sentiment analysis},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
.
Maharjan, Suraj; Arevalo, John; Montes, Manuel; Gonzalez, Fabio A.; Solorio, Thamar
A Multi-task Approach to Predict Likability of Books Inproceedings
In: Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics: Volume 1, Long Papers, pp. 1217–1227, Association for Computational Linguistics, Valencia, Spain, 2017.
Links | BibTeX | Tags: Multitask, Neural Networks
% EACL 2017 long paper, pp. 1217--1227.
@inproceedings{Maharjan2017,
  author    = {Suraj Maharjan and John Arevalo and Manuel Montes and Fabio A. Gonzalez and Thamar Solorio},
  title     = {A Multi-task Approach to Predict Likability of Books},
  booktitle = {Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics: Volume 1, Long Papers},
  pages     = {1217--1227},
  publisher = {Association for Computational Linguistics},
  address   = {Valencia, Spain},
  year      = {2017},
  date      = {2017-04-03},
  url       = {https://www.aclweb.org/anthology/E/E17/E17-1114.pdf},
  keywords  = {Multitask, Neural Networks},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Shrestha, Prasha; Sierra, Sebastian; Gonzalez, Fabio; Montes, Manuel; Rosso, Paolo; Solorio, Thamar
Convolutional Neural Networks for Authorship Attribution of Short Texts Inproceedings
In: Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics: Volume 2, Short Papers, pp. 669–674, Association for Computational Linguistics, Valencia, Spain, 2017.
Links | BibTeX | Tags: Authorship Attribution, CNN
% EACL 2017 short paper, pp. 669--674.
@inproceedings{Shrestha2017,
  author    = {Prasha Shrestha and Sebastian Sierra and Fabio Gonzalez and Manuel Montes and Paolo Rosso and Thamar Solorio},
  title     = {Convolutional Neural Networks for Authorship Attribution of Short Texts},
  booktitle = {Proceedings of the 15th Conference of the European Chapter of the Association for Computational Linguistics: Volume 2, Short Papers},
  pages     = {669--674},
  publisher = {Association for Computational Linguistics},
  address   = {Valencia, Spain},
  year      = {2017},
  date      = {2017-04-03},
  url       = {https://www.aclweb.org/anthology/E/E17/E17-2106.pdf},
  keywords  = {Authorship Attribution, CNN},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Arevalo, John; Solorio, Thamar; Montes-y-Gómez, Manuel; González, Fabio A.
Gated Multimodal Units for Information Fusion Conference
5th International Conference on Learning Representations (ICLR) 2017 -Workshop Track, 2017.
Links | BibTeX | Tags: Multimodal
% ICLR 2017 workshop-track paper. Authors are joined with " and ". The
% hyphenated surname is braced because BibTeX splits tokens at hyphens and
% would otherwise read the lowercase "y" as a von particle.
@conference{ArevaloEtAl:17,
  author    = {Arevalo, John and Solorio, Thamar and {Montes-y-Gómez}, Manuel and González, Fabio A.},
  title     = {Gated Multimodal Units for Information Fusion},
  booktitle = {5th International Conference on Learning Representations (ICLR) 2017 -- Workshop Track},
  year      = {2017},
  date      = {2017-02-07},
  url       = {https://arxiv.org/pdf/1702.01992.pdf},
  keywords  = {Multimodal},
  pubstate  = {published},
  tppubtype = {conference}
}
2016
Attia, Mohammed; Maharjan, Suraj; Samih, Younes; Kallmeyer, Laura; Solorio, Thamar
CogALex-V Shared Task: GHHH-Detecting Semantic Relations via Word Embeddings Proceeding
COLING 2016, 2016.
Links | BibTeX | Tags: Multitask CNN, shared task
% Shared-task paper, so typed as inproceedings (proceedings is for a whole
% volume and has no author field); the venue is carried by booktitle.
% NOTE(review): the URL embeds an attachauth token and looks session-bound;
% consider replacing it with a stable link.
@inproceedings{Attia2016,
  author    = {Mohammed Attia and Suraj Maharjan and Younes Samih and Laura Kallmeyer and Thamar Solorio},
  title     = {CogALex-V Shared Task: GHHH-Detecting Semantic Relations via Word Embeddings},
  booktitle = {COLING 2016},
  year      = {2016},
  date      = {2016-12-12},
  url       = {https://0196403f-a-62cb3a1a-s-sites.googlegroups.com/site/cogalex2016/home/accepted-papers/CogALex-V_Proceedings.pdf?attachauth=ANoY7cr0r4e68M8K-_cfjhjFKT3AWjmTqlHE03yzJDAGAPM7UGnGo0fdL-hJDw7OibRB_ez0E_mV52qLK625Y6oxQYQHy9fR_huydrJawgirWO8t-4xYv17CY26yzHq5s99haOCe5HJ5dcVFWaxAmVngOpEH345qsvxTfwAJf4IO3JJte0huRQ29NCosOhzjMGRmFexrTlzQMMl1gSVZQSpCQMxIwUbpsobLJ8NXJc_cX0THghOGZevzcxgg2WuV__z09CI2397T&attredirects=0#page=100},
  keywords  = {Multitask CNN, shared task},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Rey-Villamizar, Nicolas; Shrestha, Prasha; Sadeque, Farig; Bethard, Steven; Pedersen, Ted; Mukherjee, Arjun; Solorio, Thamar
Analysis of Anxious Word Usage on Online Health Forums Proceeding
EMNLP 2016, 2016.
Links | BibTeX | Tags: Clinical Applications, health forum, LIWC
% Individual paper, so typed as inproceedings with the venue in booktitle
% (proceedings describes a whole volume and takes no author).
@inproceedings{Rey-Villamizar2016b,
  author    = {Nicolas Rey-Villamizar and Prasha Shrestha and Farig Sadeque and Steven Bethard and Ted Pedersen and Arjun Mukherjee and Thamar Solorio},
  title     = {Analysis of Anxious Word Usage on Online Health Forums},
  booktitle = {EMNLP 2016},
  year      = {2016},
  date      = {2016-11-05},
  url       = {http://www.aclweb.org/anthology/W/W16/W16-6105.pdf},
  keywords  = {Clinical Applications, health forum, LIWC},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Molina, Giovanni; Rey-Villamizar, Nicolas; Solorio, Thamar; AlGhamdi, Fahad; Ghoneim, Mahmoud; Hawwari, Abdelati; Diab, Mona
Overview for the second shared task on language identification in code-switched data Proceeding
Proceedings of the Second Workshop on Computational Approaches to Code Switching; EMNLP 2016, 2016.
Links | BibTeX | Tags: Code-Switching, shared task
% Shared-task overview paper, so typed as inproceedings with the proceedings
% title in booktitle; the page range uses the BibTeX double hyphen.
@inproceedings{Molina2016,
  author    = {Giovanni Molina and Nicolas Rey-Villamizar and Thamar Solorio and Fahad AlGhamdi and Mahmoud Ghoneim and Abdelati Hawwari and Mona Diab},
  title     = {Overview for the second shared task on language identification in code-switched data},
  booktitle = {Proceedings of the Second Workshop on Computational Approaches to Code Switching; EMNLP 2016},
  pages     = {40--49},
  year      = {2016},
  date      = {2016-11-01},
  url       = {http://www.aclweb.org/anthology/W/W16/W16-5805.pdf},
  keywords  = {Code-Switching, shared task},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Sadeque, Farig; Pedersen, Ted; Solorio, Thamar; Shrestha, Prasha; Rey-Villamizar, Nicolas; Bethard, Steven
Why Do They Leave: Modeling Participation in Online Depression Forums Proceeding
Conference on Empirical Methods in Natural Language Processing, 2016.
Links | BibTeX | Tags: health forum
% Individual paper, so typed as inproceedings with the venue in booktitle
% (proceedings describes a whole volume and takes no author).
@inproceedings{Sadeque2016,
  author    = {Farig Sadeque and Ted Pedersen and Thamar Solorio and Prasha Shrestha and Nicolas Rey-Villamizar and Steven Bethard},
  title     = {Why Do They Leave: Modeling Participation in Online Depression Forums},
  booktitle = {Conference on Empirical Methods in Natural Language Processing},
  year      = {2016},
  date      = {2016-11-01},
  url       = {http://www.aclweb.org/anthology/W/W16/W16-6203.pdf},
  keywords  = {health forum},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
AlGhamdi, Fahad; Molina, Giovanni; Diab, Mona; Solorio, Thamar; Hawwari, Abdelati; Soto, Victor; Hirschberg, Julia
Part of Speech Tagging for Code Switched Data Proceeding
Proceedings of the Second Workshop on Computational Approaches to Code Switching; EMNLP, 2016.
Links | BibTeX | Tags: Code-Switching
% Workshop paper, so typed as inproceedings with the proceedings title in
% booktitle; the page range uses the BibTeX double hyphen.
@inproceedings{AlGhamdi2016,
  author    = {Fahad AlGhamdi and Giovanni Molina and Mona Diab and Thamar Solorio and Abdelati Hawwari and Victor Soto and Julia Hirschberg},
  title     = {Part of Speech Tagging for Code Switched Data},
  booktitle = {Proceedings of the Second Workshop on Computational Approaches to Code Switching; EMNLP},
  pages     = {98--107},
  year      = {2016},
  date      = {2016-11-01},
  url       = {http://www.aclweb.org/anthology/W/W16/W16-5812.pdf},
  keywords  = {Code-Switching},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Samih, Younes; Maharjan, Suraj; Attia, Mohammed; Kallmeyer, Laura; Solorio, Thamar
Multilingual Code-switching Identification via LSTM Recurrent Neural Networks Proceeding
Proceedings of the Second Workshop on Computational Approaches to Code Switching; EMNLP, 2016.
Links | BibTeX | Tags: Code-Switching, CRF, Deeplearning, Neural Networks
% Workshop paper, so typed as inproceedings with the proceedings title in
% booktitle (proceedings describes a whole volume and takes no author).
@inproceedings{Samih2016,
  author    = {Younes Samih and Suraj Maharjan and Mohammed Attia and Laura Kallmeyer and Thamar Solorio},
  title     = {Multilingual Code-switching Identification via LSTM Recurrent Neural Networks},
  booktitle = {Proceedings of the Second Workshop on Computational Approaches to Code Switching; EMNLP},
  year      = {2016},
  date      = {2016-10-31},
  url       = {http://www.aclweb.org/anthology/W/W16/W16-5806.pdf},
  keywords  = {Code-Switching, CRF, Deeplearning, Neural Networks},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Sapkota, Upendra; Solorio, Thamar; Montes y Gomez, Manuel; Bethard, Steven
Domain Adaptation for Authorship Attribution: Improved Structural Correspondence Learning Conference
Association for Computational Linguistics (ACL) , ACL Berlin, Germany, 2016.
Links | BibTeX | Tags: Authorship Attribution
% ACL 2016 paper (Berlin). The compound surname is braced: unbraced, BibTeX
% reads the lowercase "y" as a von particle and files the author under "Gomez".
@conference{SapkotaEtAl:16,
  author       = {Upendra Sapkota and Thamar Solorio and {Montes y Gomez}, Manuel and Steven Bethard},
  title        = {Domain Adaptation for Authorship Attribution: Improved Structural Correspondence Learning},
  booktitle    = {Association for Computational Linguistics (ACL)},
  address      = {Berlin, Germany},
  organization = {ACL},
  year         = {2016},
  date         = {2016-08-08},
  url          = {https://aclweb.org/anthology/P/P16/P16-1210.pdf},
  keywords     = {Authorship Attribution},
  pubstate     = {published},
  tppubtype    = {conference}
}
Franco-Salvador, Marc; Kar, Sudipta; Solorio, Thamar; Rosso, Paolo
UH-PRHLT at SemEval-2016 Task 3: Combining Lexical and Semantic-based Features for Community Question Answering Inproceedings
In: Proceedings of SemEval-2016, pp. 814-821, Association for Computational Linguistics, San Diego, California, 2016.
Links | BibTeX | Tags: Question Answering, Text Classification
% SemEval-2016 Task 3 system description; page range uses the BibTeX double hyphen.
@inproceedings{Franco-Salvador2016,
  author    = {Marc Franco-Salvador and Sudipta Kar and Thamar Solorio and Paolo Rosso},
  title     = {UH-PRHLT at SemEval-2016 Task 3: Combining Lexical and Semantic-based Features for Community Question Answering},
  booktitle = {Proceedings of SemEval-2016},
  pages     = {814--821},
  publisher = {Association for Computational Linguistics},
  address   = {San Diego, California},
  year      = {2016},
  date      = {2016-06-16},
  url       = {https://aclweb.org/anthology/S/S16/S16-1126.pdf},
  keywords  = {Question Answering, Text Classification},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Rey-Villamizar, Nicolas; Shrestha, Prasha; Solorio, Thamar; Sadeque, Farig; Bethard, Steven; Pedersen, Ted
A Semi-supervised Approach for the CLPsych 2016 Shared Task Conference
3rd Workshop on Computational Linguistics and Clinical Psychology: From Linguistic Signal to Clinical Reality, Association for Computational Linguistics, 2016.
Links | BibTeX | Tags: bayesian optimization, health forum, LIWC, shared task
% CLPsych 2016 shared-task paper; the page range is written with "--"
% instead of a literal Unicode en dash so every style can typeset it.
@conference{Rey-Villamizar2016,
  author    = {Nicolas Rey-Villamizar and Prasha Shrestha and Thamar Solorio and Farig Sadeque and Steven Bethard and Ted Pedersen},
  title     = {A Semi-supervised Approach for the CLPsych 2016 Shared Task},
  booktitle = {3rd Workshop on Computational Linguistics and Clinical Psychology: From Linguistic Signal to Clinical Reality},
  pages     = {171--175},
  publisher = {Association for Computational Linguistics},
  year      = {2016},
  date      = {2016-06-16},
  url       = {http://anthology.aclweb.org/W/W16/W16-0322.pdf},
  keywords  = {bayesian optimization, health forum, LIWC, shared task},
  pubstate  = {published},
  tppubtype = {conference}
}
Shrestha, Prasha; Bethard, Steven; Pedersen, Ted; Rey-Villamizar, Nicolas; Sadeque, Farig; Solorio, Thamar
Age and Gender Prediction on Health Forum Data Conference
Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016), European Language Resources Association (ELRA), 2016.
Links | BibTeX | Tags: health applications, Profiling
% LREC 2016 paper. The venue is carried by booktitle only; a journal field
% does not apply to a conference paper.
% NOTE(review): pages = {8} looks like a page count rather than a page
% range -- confirm against the proceedings.
@conference{ShrestaEtAl:16,
  author    = {Prasha Shrestha and Steven Bethard and Ted Pedersen and Nicolas Rey-Villamizar and Farig Sadeque and Thamar Solorio},
  title     = {Age and Gender Prediction on Health Forum Data},
  booktitle = {Proceedings of the Tenth International Conference on Language Resources and Evaluation (LREC 2016)},
  pages     = {8},
  publisher = {European Language Resources Association (ELRA)},
  year      = {2016},
  date      = {2016-05-24},
  url       = {http://www.lrec-conf.org/proceedings/lrec2016/pdf/1117_Paper.pdf},
  keywords  = {health applications, Profiling},
  pubstate  = {published},
  tppubtype = {conference}
}
2015
Sadeque, Farig; Solorio, Thamar; Pedersen, Ted; Shrestha, Prasha; Bethard, Steven
Predicting Continued Participation in Online Health Forums Inproceedings
In: Proceedings of the 6th International Workshop on Health Text Mining and Information Analysis (Louhi), pp. 15-20, Association for Computational Linguistics, Lisboa, Portugal, 2015.
Links | BibTeX | Tags: health applications
% Louhi 2015 workshop paper; page range uses the BibTeX double hyphen.
@inproceedings{Sadeque-EtAl:2015:LOUHI,
  author    = {Farig Sadeque and Thamar Solorio and Ted Pedersen and Prasha Shrestha and Steven Bethard},
  title     = {Predicting Continued Participation in Online Health Forums},
  booktitle = {Proceedings of the 6th International Workshop on Health Text Mining and Information Analysis (Louhi)},
  pages     = {15--20},
  publisher = {Association for Computational Linguistics},
  address   = {Lisboa, Portugal},
  year      = {2015},
  date      = {2015-09-23},
  url       = {https://aclweb.org/anthology/W/W15/W15-2602.pdf},
  keywords  = {health applications},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Maharjan, Suraj; Solorio, Thamar
Using Wide Range of Features for Author profiling Proceeding
CLEF, 2015.
Links | BibTeX | Tags: Profiling, shared task
% CLEF 2015 author-profiling paper, so typed as inproceedings. CLEF is the
% venue rather than a publisher or journal, so the proceedings name is
% carried by booktitle only.
@inproceedings{Maharjan2015,
  author    = {Maharjan, Suraj and Solorio, Thamar},
  title     = {Using Wide Range of Features for Author profiling},
  booktitle = {Proceedings of CLEF},
  year      = {2015},
  date      = {2015-09-08},
  url       = {https://pdfs.semanticscholar.org/f555/c009a623960b60b52f38a39a18fa5cbac273.pdf},
  keywords  = {Profiling, shared task},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Maharjan, Suraj; Blair, Elizabeth; Bethard, Steven; Solorio, Thamar
Developing Language-tagged Corpora for Code-switching Tweets Inproceedings
In: Proceedings of The 9th Linguistic Annotation Workshop, pp. 72–84, Association for Computational Linguistics, Denver, Colorado, USA, 2015.
Links | BibTeX | Tags: Code-Switching
% 9th Linguistic Annotation Workshop paper, pp. 72--84.
@inproceedings{maharjan-EtAl:2015:LAW,
  author    = {Suraj Maharjan and Elizabeth Blair and Steven Bethard and Thamar Solorio},
  title     = {Developing Language-tagged Corpora for Code-switching Tweets},
  booktitle = {Proceedings of The 9th Linguistic Annotation Workshop},
  pages     = {72--84},
  publisher = {Association for Computational Linguistics},
  address   = {Denver, Colorado, USA},
  year      = {2015},
  date      = {2015-06-05},
  url       = {http://www.aclweb.org/anthology/W15-1608},
  keywords  = {Code-Switching},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Sapkota, Upendra; Bethard, Steven; Montes y Gomez, Manuel; Solorio, Thamar
Not All Character N-grams Are Created Equal: A Study in Authorship Attribution Conference
Proceedings of the 2015 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies, ACL Denver, Colorado, 2015.
Links | BibTeX | Tags: Authorship Attribution
% NAACL-HLT 2015 paper. The compound surname is braced: unbraced, BibTeX
% reads the lowercase "y" as a von particle and files the author under "Gomez".
@conference{SapkotaEtAl:15,
  author       = {Upendra Sapkota and Steven Bethard and {Montes y Gomez}, Manuel and Thamar Solorio},
  title        = {Not All Character N-grams Are Created Equal: A Study in Authorship Attribution},
  booktitle    = {Proceedings of the 2015 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies},
  pages        = {93--102},
  address      = {Denver, Colorado},
  organization = {ACL},
  year         = {2015},
  date         = {2015-06-01},
  url          = {http://www.aclweb.org/anthology/N/N15/N15-1010.pdf},
  keywords     = {Authorship Attribution},
  pubstate     = {published},
  tppubtype    = {conference}
}
Shrestha, Prasha; Solorio, Thamar
Identification of Original Document by Using Textual Similarities Incollection
In: Gelbukh, Alexander (Ed.): Computational Linguistics and Intelligent Text Processing, vol. 9042, pp. 643-654, Springer International Publishing, 2015, ISBN: 978-3-319-18116-5.
Links | BibTeX | Tags: plagiarism
% LNCS 9042 chapter. The entry previously had an empty citation key and so
% could not be cited; the key below follows the Name:YY scheme used by
% neighbouring entries.
% NOTE(review): confirm the key does not collide with one elsewhere in the file.
@incollection{ShresthaSolorio:15,
  author    = {Prasha Shrestha and Thamar Solorio},
  title     = {Identification of Original Document by Using Textual Similarities},
  editor    = {Gelbukh, Alexander},
  booktitle = {Computational Linguistics and Intelligent Text Processing},
  series    = {Lecture Notes in Computer Science},
  volume    = {9042},
  pages     = {643--654},
  publisher = {Springer International Publishing},
  year      = {2015},
  date      = {2015-01-01},
  isbn      = {978-3-319-18116-5},
  doi       = {10.1007/978-3-319-18117-2_48},
  url       = {http://dx.doi.org/10.1007/978-3-319-18117-2_48},
  keywords  = {plagiarism},
  pubstate  = {published},
  tppubtype = {incollection}
}
2014
Solorio, Thamar; Blair, Elizabeth; Maharjan, Suraj; Bethard, Steven; Diab, Mona; Ghoneim, Mahmoud; Hawwari, Abdelati; AlGhamdi, Fahad; Hirschberg, Julia; Chang, Alison; Fung, Pascale
Overview for the First Shared Task on Language Identification in Code-Switched Data Conference
Proceedings of The First Workshop on Computational Approaches to Code Switching, held in conjunction with EMNLP 2014., ACL, Doha, Qatar, 2014.
Links | BibTeX | Tags: Code-Switching
% Overview paper of the first code-switching shared task (EMNLP 2014 workshop).
% "Ghoneim" is spelled as in the second shared-task overview entry (Molina2016).
@conference{SolorioEtAl:14,
  author    = {Thamar Solorio and Elizabeth Blair and Suraj Maharjan and Steven Bethard and Mona Diab and Mahmoud Ghoneim and Abdelati Hawwari and Fahad AlGhamdi and Julia Hirschberg and Alison Chang and Pascale Fung},
  title     = {Overview for the First Shared Task on Language Identification in Code-Switched Data},
  booktitle = {Proceedings of The First Workshop on Computational Approaches to Code Switching, held in conjunction with EMNLP 2014},
  pages     = {62--72},
  publisher = {ACL},
  address   = {Doha, Qatar},
  year      = {2014},
  date      = {2014-10-25},
  url       = {http://www.aclweb.org/anthology/W/W14/W14-3907.pdf},
  keywords  = {Code-Switching},
  pubstate  = {published},
  tppubtype = {conference}
}
Maharjan, Suraj; Shrestha, Prasha; Solorio, Thamar
A Simple Approach to Author Profiling in MapReduce Conference
CLEF, 2014.
Links | BibTeX | Tags: Profiling, shared task
% CLEF 2014 (PAN) author-profiling paper. The venue is given in booktitle,
% which conference entries require.
@conference{Maharjan2014,
  author    = {Suraj Maharjan and Prasha Shrestha and Thamar Solorio},
  title     = {A Simple Approach to Author Profiling in MapReduce},
  booktitle = {CLEF},
  year      = {2014},
  date      = {2014-09-15},
  url       = {http://ceur-ws.org/Vol-1180/CLEF2014wn-Pan-MaharjanEt2014.pdf},
  keywords  = {Profiling, shared task},
  pubstate  = {published},
  tppubtype = {conference}
}
Sapkota, Upendra; Solorio, Thamar; Montes, Manuel; Bethard, Steven; Rosso, Paolo
Cross-Topic Authorship Attribution: Will Out-Of-Topic Data Help? Inproceedings
In: Proceedings of COLING 2014, the 25th International Conference on Computational Linguistics: Technical Papers, pp. 1228–1237, Dublin City University and Association for Computational Linguistics, Dublin, Ireland, 2014.
Links | BibTeX | Tags: Authorship Attribution
% COLING 2014 technical paper, pp. 1228--1237.
@inproceedings{SapkotaEtAl:14,
  author    = {Upendra Sapkota and Thamar Solorio and Manuel Montes and Steven Bethard and Paolo Rosso},
  title     = {Cross-Topic Authorship Attribution: Will Out-Of-Topic Data Help?},
  booktitle = {Proceedings of COLING 2014, the 25th International Conference on Computational Linguistics: Technical Papers},
  pages     = {1228--1237},
  publisher = {Dublin City University and Association for Computational Linguistics},
  address   = {Dublin, Ireland},
  year      = {2014},
  date      = {2014-08-01},
  url       = {http://www.aclweb.org/anthology/C14-1116},
  keywords  = {Authorship Attribution},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Solorio, Thamar; Hasan, Ragib; Mizan, Mainul
Sockpuppet Detection in Wikipedia: A Corpus of Real-World Deceptive Writing for Linking Identities Inproceedings
In: The 9th edition of the Language Resources and Evaluation Conference (LREC 2014), pp. 26–31, European Language Resources Association (ELRA), Reykjavik, Iceland, 2014.
Links | BibTeX | Tags: Authorship Attribution
% LREC 2014 paper, pp. 26--31.
@inproceedings{SolorioEtAl:14b,
  author    = {Thamar Solorio and Ragib Hasan and Mainul Mizan},
  title     = {Sockpuppet Detection in Wikipedia: A Corpus of Real-World Deceptive Writing for Linking Identities},
  booktitle = {The 9th edition of the Language Resources and Evaluation Conference (LREC 2014)},
  pages     = {26--31},
  publisher = {European Language Resources Association (ELRA)},
  address   = {Reykjavik, Iceland},
  year      = {2014},
  date      = {2014-05-01},
  url       = {http://www.lrec-conf.org/proceedings/lrec2014/pdf/1007_Paper.pdf},
  keywords  = {Authorship Attribution},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Maharjan, Suraj; Shrestha, Prasha; Solorio, Thamar; Hasan, Ragib
A Straightforward Author Profiling Approach in MapReduce Incollection
In: Bazzan, Ana L. C.; Pichara, Karim (Ed.): Advances in Artificial Intelligence — IBERAMIA 2014, vol. 8864, pp. 95-107, Springer International Publishing, 2014, ISBN: 978-3-319-12026-3.
Links | BibTeX | Tags: Profiling
% IBERAMIA 2014 chapter (LNCS 8864). Page range uses the BibTeX double
% hyphen; editor initials are space-separated so styles can abbreviate them.
@incollection{MaharjanEtAl:14,
  author    = {Suraj Maharjan and Prasha Shrestha and Thamar Solorio and Ragib Hasan},
  title     = {A Straightforward Author Profiling Approach in MapReduce},
  editor    = {Bazzan, Ana L. C. and Pichara, Karim},
  booktitle = {Advances in Artificial Intelligence -- IBERAMIA 2014},
  series    = {Lecture Notes in Computer Science},
  volume    = {8864},
  pages     = {95--107},
  publisher = {Springer International Publishing},
  year      = {2014},
  date      = {2014-01-01},
  isbn      = {978-3-319-12026-3},
  doi       = {10.1007/978-3-319-12027-0_8},
  url       = {http://dx.doi.org/10.1007/978-3-319-12027-0_8},
  keywords  = {Profiling},
  pubstate  = {published},
  tppubtype = {incollection}
}
Shrestha, Prasha; Maharjan, Suraj; Ramírez de la Rosa, Gabriela; Sprague, Alan; Solorio, Thamar; Warner, Gary
Using String Information for Malware Family Identification Incollection
In: Bazzan, Ana L. C.; Pichara, Karim (Ed.): Advances in Artificial Intelligence — IBERAMIA 2014, vol. 8864, pp. 686-697, Springer International Publishing, 2014, ISBN: 978-3-319-12026-3.
Links | BibTeX | Tags: Security
% IBERAMIA 2014 chapter (LNCS 8864). The compound surname is braced:
% unbraced, BibTeX reads "de la" as a von particle and files the author
% under "Rosa" with "Ramírez" as a given name.
@incollection{ShresthaEtAl:14,
  author    = {Prasha Shrestha and Suraj Maharjan and {Ramírez de la Rosa}, Gabriela and Alan Sprague and Thamar Solorio and Gary Warner},
  title     = {Using String Information for Malware Family Identification},
  editor    = {Bazzan, Ana L. C. and Pichara, Karim},
  booktitle = {Advances in Artificial Intelligence -- IBERAMIA 2014},
  series    = {Lecture Notes in Computer Science},
  volume    = {8864},
  pages     = {686--697},
  publisher = {Springer International Publishing},
  year      = {2014},
  date      = {2014-01-01},
  isbn      = {978-3-319-12026-3},
  doi       = {10.1007/978-3-319-12027-0_55},
  url       = {http://dx.doi.org/10.1007/978-3-319-12027-0_55},
  keywords  = {Security},
  pubstate  = {published},
  tppubtype = {incollection}
}
Osborne, John David; Gyawali, Binod; Solorio, Thamar
Evaluation of YTEX and MetaMap for clinical concept recognition Journal Article
In: CoRR, vol. abs/1402.1668, 2014.
Links | BibTeX | Tags: Clinical Applications, Information Extraction
% arXiv preprint, recorded as a CoRR article (volume abs/1402.1668).
@article{OsborneEtAl:14,
  author    = {John David Osborne and Binod Gyawali and Thamar Solorio},
  title     = {Evaluation of YTEX and MetaMap for clinical concept recognition},
  journal   = {CoRR},
  volume    = {abs/1402.1668},
  year      = {2014},
  date      = {2014-01-01},
  url       = {http://arxiv.org/abs/1402.1668},
  keywords  = {Clinical Applications, Information Extraction},
  pubstate  = {published},
  tppubtype = {article}
}
Hassanali, Khairun-nisa; Liu, Yang; Iglesias, Aquiles; Solorio, Thamar; Dollaghan, Christine
Automatic generation of the index of productive syntax for child language transcripts Journal Article
In: Behavior Research Methods, vol. 46, no. 1, pp. 254–262, 2014.
Links | BibTeX | Tags: Clinical Applications
% Behavior Research Methods 46(1). Names are in "Last, First" form because
% BibTeX splits tokens at hyphens: in "First Last" order the lowercase
% "nisa" of "Khairun-nisa" would be taken as a von particle.
@article{HassanaliEtAl:14,
  author    = {Hassanali, Khairun-nisa and Liu, Yang and Iglesias, Aquiles and Solorio, Thamar and Dollaghan, Christine},
  title     = {Automatic generation of the index of productive syntax for child language transcripts},
  journal   = {Behavior Research Methods},
  volume    = {46},
  number    = {1},
  pages     = {254--262},
  publisher = {Springer US},
  year      = {2014},
  date      = {2014-01-01},
  doi       = {10.3758/s13428-013-0354-x},
  url       = {http://dx.doi.org/10.3758/s13428-013-0354-x},
  keywords  = {Clinical Applications},
  pubstate  = {published},
  tppubtype = {article}
}
Bogdanova, Dasha; Rosso, Paolo; Solorio, Thamar
Exploring High-level Features for Detecting Cyberpedophilia Journal Article
In: Comput. Speech Lang., vol. 28, no. 1, pp. 108–120, 2014, ISSN: 0885-2308.
Links | BibTeX | Tags: Cyberpedophilia, Emotion detection, Sentiment analysis
% Computer Speech & Language 28(1). The journal name is stored in full
% (styles may abbreviate it); the address no longer repeats the country.
@article{BogdanovaEtAl:14,
  author    = {Dasha Bogdanova and Paolo Rosso and Thamar Solorio},
  title     = {Exploring High-level Features for Detecting Cyberpedophilia},
  journal   = {Computer Speech \& Language},
  volume    = {28},
  number    = {1},
  pages     = {108--120},
  publisher = {Academic Press Ltd.},
  address   = {London, UK},
  year      = {2014},
  date      = {2014-01-01},
  issn      = {0885-2308},
  doi       = {10.1016/j.csl.2013.04.007},
  url       = {http://dx.doi.org/10.1016/j.csl.2013.04.007},
  keywords  = {Cyberpedophilia, Emotion detection, Sentiment analysis},
  pubstate  = {published},
  tppubtype = {article}
}
2013
Ramírez-de-la-Rosa, Gabriela; Solorio, Thamar; Montes-y-Gómez, Manuel; Liu, Yang; Iglesias, Aquiles; Bedore, Lisa; Peña, Elizabeth
Exploring word class n-grams to measure language development in children Inproceedings
In: Proceedings of the 2013 Workshop on Biomedical Natural Language Processing, pp. 89–97, ACL, Sofia, Bulgaria, 2013.
Links | BibTeX | Tags: Clinical Applications
% BioNLP 2013 workshop paper. Hyphenated surnames containing lowercase
% particles are braced: BibTeX splits tokens at hyphens and would otherwise
% treat "de", "la" and "y" as von particles.
@inproceedings{RamirezEtAl:13,
  author    = {{Ramírez-de-la-Rosa}, Gabriela and Solorio, Thamar and {Montes-y-Gómez}, Manuel and Liu, Yang and Iglesias, Aquiles and Bedore, Lisa and Peña, Elizabeth},
  title     = {Exploring word class n-grams to measure language development in children},
  booktitle = {Proceedings of the 2013 Workshop on Biomedical Natural Language Processing},
  pages     = {89--97},
  publisher = {ACL},
  address   = {Sofia, Bulgaria},
  year      = {2013},
  date      = {2013-08-01},
  url       = {http://www.aclweb.org/anthology/W13-1911},
  keywords  = {Clinical Applications},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Hassanali, Khairun-nisa; Liu, Yang; Solorio, Thamar
Using Latent Dirichlet Allocation for Child Narrative Analysis Inproceedings
In: Proceedings of the 2013 Workshop on Biomedical Natural Language Processing, pp. 111–115, ACL, Sofia, Bulgaria, 2013.
Links | BibTeX | Tags: Clinical Applications
% BioNLP 2013 workshop paper. Names are in "Last, First" form because
% BibTeX splits tokens at hyphens: in "First Last" order the lowercase
% "nisa" of "Khairun-nisa" would be taken as a von particle.
@inproceedings{HassanaliEtAl:13b,
  author    = {Hassanali, Khairun-nisa and Liu, Yang and Solorio, Thamar},
  title     = {Using Latent Dirichlet Allocation for Child Narrative Analysis},
  booktitle = {Proceedings of the 2013 Workshop on Biomedical Natural Language Processing},
  pages     = {111--115},
  publisher = {ACL},
  address   = {Sofia, Bulgaria},
  year      = {2013},
  date      = {2013-08-01},
  url       = {http://www.aclweb.org/anthology/W13-1914},
  keywords  = {Clinical Applications},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Hassanali, Khairun-nisa; Liu, Yang; Iglesias, Aquiles; Solorio, Thamar; Dollaghan, Christine
Automatic Generation of the Index of Productive Syntax for Child Language Transcripts Journal Article
In: Behavior Research Methods, vol. 45, no. 2, 2013.
BibTeX | Tags: Clinical Applications
% Behavior Research Methods 45(2). Author spellings follow the 2014 entry
% for the same title (HassanaliEtAl:14); "Last, First" form keeps the
% lowercase "nisa" from being read as a von particle.
% NOTE(review): same title and journal as HassanaliEtAl:14 -- possibly a
% duplicate record; confirm volume and year.
@article{HassanaliEtAl:13,
  author    = {Hassanali, Khairun-nisa and Liu, Yang and Iglesias, Aquiles and Solorio, Thamar and Dollaghan, Christine},
  title     = {Automatic Generation of the Index of Productive Syntax for Child Language Transcripts},
  journal   = {Behavior Research Methods},
  volume    = {45},
  number    = {2},
  year      = {2013},
  date      = {2013-06-01},
  keywords  = {Clinical Applications},
  pubstate  = {published},
  tppubtype = {article}
}
Gyawali, Binod; Ramirez-de-la-Rosa, Gabriela; Solorio, Thamar
Native Language Identification: a Simple n-gram Based Approach Inproceedings
In: Proceedings of the Eighth Workshop on Innovative Use of NLP for Building Educational Applications, pp. 224–231, ACL, Atlanta, Georgia, 2013.
Links | BibTeX | Tags: Information Extraction, Profiling
% BEA-8 workshop paper (NAACL 2013). The surname is spelled with its accent,
% as in the other entries by the same author, and braced so that BibTeX does
% not read "de"/"la" as von particles after splitting at the hyphens.
@inproceedings{GyawaliEtAl:13,
  author    = {Gyawali, Binod and {Ramírez-de-la-Rosa}, Gabriela and Solorio, Thamar},
  title     = {Native Language Identification: a Simple n-gram Based Approach},
  booktitle = {Proceedings of the Eighth Workshop on Innovative Use of NLP for Building Educational Applications},
  pages     = {224--231},
  publisher = {ACL},
  address   = {Atlanta, Georgia},
  year      = {2013},
  date      = {2013-06-01},
  url       = {http://www.aclweb.org/anthology/W13-1729},
  keywords  = {Information Extraction, Profiling},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Solorio, Thamar; Hasan, Ragib; Mizan, Mainul
A Case Study of Sockpuppet Detection in Wikipedia Inproceedings
In: Workshop on Language Analysis in Social Media (LASM) at NAACL-HLT 2013, pp. 59–68, ACL, Atlanta, Georgia, 2013.
BibTeX | Tags: Authorship Attribution, Security
% Workshop paper (LASM at NAACL-HLT 2013): a case study of sockpuppet detection in Wikipedia.
@inproceedings{SolorioEtAl:13,
  author    = {Thamar Solorio and Ragib Hasan and Mainul Mizan},
  title     = {A Case Study of Sockpuppet Detection in Wikipedia},
  booktitle = {Workshop on Language Analysis in Social Media (LASM) at NAACL-HLT 2013},
  pages     = {59--68},
  publisher = {ACL},
  address   = {Atlanta, Georgia},
  year      = {2013},
  date      = {2013-06-01},
  keywords  = {Authorship Attribution, Security},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Sapkota, Upendra; Solorio, Thamar; Montes-y-Gómez, Manuel; Rosso, Paolo
The use of Orthogonal Similarity Relations in the Prediction of Authorship Inproceedings
In: Proceedings of the 14th International Conference on Intelligent Text Processing and Computational Linguistics, CICLing-2013, pp. 463–475, Samos, Greece, 2013, (acceptance rate 24.6%).
BibTeX | Tags: Authorship Attribution
% Conference paper (CICLing-2013): orthogonal similarity relations for predicting authorship.
% The acceptance rate lives in `note`; the percent sign is escaped so it is typeset rather than read as a TeX comment.
@inproceedings{SapkotaEtAl:13,
  author    = {Upendra Sapkota and Thamar Solorio and Manuel Montes-y-Gómez and Paolo Rosso},
  title     = {The use of Orthogonal Similarity Relations in the Prediction of Authorship},
  booktitle = {Proceedings of the 14th International Conference on Intelligent Text Processing and Computational Linguistics, CICLing-2013},
  pages     = {463--475},
  address   = {Samos, Greece},
  year      = {2013},
  date      = {2013-03-01},
  note      = {acceptance rate 24.6\%},
  keywords  = {Authorship Attribution},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Solorio, Thamar
Survey on Emerging Research on the Use of Natural Language Processing in Clinical Language Assessment of Children Journal Article
In: Language and Linguistics Compass, vol. 7, no. 12, pp. 633–646, 2013.
BibTeX | Tags: Clinical Applications
% Journal article: survey of NLP research applied to clinical language assessment of children.
@article{Solorio:13,
  author    = {Thamar Solorio},
  title     = {Survey on Emerging Research on the Use of Natural Language Processing in Clinical Language Assessment of Children},
  journal   = {Language and Linguistics Compass},
  volume    = {7},
  number    = {12},
  pages     = {633--646},
  year      = {2013},
  date      = {2013-01-01},
  keywords  = {Clinical Applications},
  pubstate  = {published},
  tppubtype = {article}
}
Osborne, John David; Gyawali, Binod; Solorio, Thamar
Evaluation of freely available open source software for clinical concept recognition Inproceedings
In: Notebook for ShARe/CLEF eHealth Evaluation Lab at CLEF 2013, 2013.
BibTeX | Tags: Clinical Applications, Information Extraction
% Lab notebook paper (ShARe/CLEF eHealth 2013): evaluation of open source software for clinical concept recognition.
@inproceedings{OsborneEtAl:13,
  author    = {John David Osborne and Binod Gyawali and Thamar Solorio},
  title     = {Evaluation of freely available open source software for clinical concept recognition},
  booktitle = {Notebook for ShARe/CLEF eHealth Evaluation Lab at CLEF 2013},
  year      = {2013},
  date      = {2013-01-01},
  keywords  = {Clinical Applications, Information Extraction},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Shrestha, Prasha; Solorio, Thamar
Using a Variety of n-Grams for the Detection of Different Kinds of Plagiarism Inproceedings
In: Notebook for PAN at CLEF 2013, 2013.
Links | BibTeX | Tags: plagiarism, shared task
% Notebook paper (PAN at CLEF 2013): n-gram variety for detecting different kinds of plagiarism.
@inproceedings{ShresthaAndSolorio:13,
  author    = {Prasha Shrestha and Thamar Solorio},
  title     = {Using a Variety of n-Grams for the Detection of Different Kinds of Plagiarism},
  booktitle = {Notebook for PAN at CLEF 2013},
  year      = {2013},
  date      = {2013-01-01},
  url       = {http://ceur-ws.org/Vol-1179/CLEF2013wn-PAN-ShresthaEt2013.pdf},
  keywords  = {plagiarism, shared task},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Sapkota, Upendra; Solorio, Thamar; Montes-y-Gómez, Manuel; Ramírez-de-la-Rosa, Gabriela
Automatic Author Profiling for English and Spanish Text Inproceedings
In: Notebook for PAN at CLEF 2013, 2013.
BibTeX | Tags: Profiling, Security
% Notebook paper (PAN at CLEF 2013): automatic author profiling for English and Spanish text.
@inproceedings{SapkotaEtAl:13b,
  author    = {Upendra Sapkota and Thamar Solorio and Manuel Montes-y-Gómez and Gabriela Ramírez-de-la-Rosa},
  title     = {Automatic Author Profiling for English and Spanish Text},
  booktitle = {Notebook for PAN at CLEF 2013},
  year      = {2013},
  date      = {2013-01-01},
  keywords  = {Profiling, Security},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
2012
Sapkota, Upendra; Solorio, Thamar
Sub-profiling by linguistic dimensions to solve the authorship attribution task Inproceedings
In: Notebook for PAN at CLEF 2012, Rome, Italy, 2012.
BibTeX | Tags: Authorship Attribution
% Notebook paper (PAN at CLEF 2012): sub-profiling by linguistic dimensions for authorship attribution.
@inproceedings{SapkotaAndSolorio:12,
  author    = {Upendra Sapkota and Thamar Solorio},
  title     = {Sub-profiling by linguistic dimensions to solve the authorship attribution task},
  booktitle = {Notebook for PAN at CLEF 2012},
  address   = {Rome, Italy},
  year      = {2012},
  date      = {2012-09-01},
  keywords  = {Authorship Attribution},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Bogdanova, Daria; Rosso, Paolo; Solorio, Thamar
On the Impact of Sentiment and Emotion Based Features in Detecting Online Sexual Predators Inproceedings
In: Proceedings of the ACL 2012 3rd Workshop on Computational Approaches to Subjectivity and Sentiment Analysis (WASSA), pp. 110–118, ACL, Jeju, Republic of Korea, 2012.
BibTeX | Tags: Cyberpedophilia, Security
% Workshop paper (WASSA at ACL 2012): sentiment and emotion based features for detecting online sexual predators.
% ACL is recorded as `publisher`, matching the other ACL workshop entries in this file.
@inproceedings{BogdanovaEtAl:12b,
  author    = {Daria Bogdanova and Paolo Rosso and Thamar Solorio},
  title     = {On the Impact of Sentiment and Emotion Based Features in Detecting Online Sexual Predators},
  booktitle = {Proceedings of the ACL 2012 3rd Workshop on Computational Approaches to Subjectivity and Sentiment Analysis (WASSA)},
  pages     = {110--118},
  publisher = {ACL},
  address   = {Jeju, Republic of Korea},
  year      = {2012},
  date      = {2012-07-01},
  keywords  = {Cyberpedophilia, Security},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Gyawali, Binod; Solorio, Thamar; Benajiba, Yassine
Grading the Quality of Medical Evidence Inproceedings
In: 2012 Workshop on Biomedical Natural Language Processing (BIONLP 2012), pp. 176–184, ACL, Montréal, Canada, 2012.
Links | BibTeX | Tags: health applications
% Workshop paper (BIONLP 2012): grading the quality of medical evidence.
% ACL is recorded as `publisher`, matching the other ACL workshop entries in this file.
@inproceedings{GyawaliEtAl:12a,
  author    = {Binod Gyawali and Thamar Solorio and Yassine Benajiba},
  title     = {Grading the Quality of Medical Evidence},
  booktitle = {2012 Workshop on Biomedical Natural Language Processing (BIONLP 2012)},
  pages     = {176--184},
  publisher = {ACL},
  address   = {Montréal, Canada},
  year      = {2012},
  date      = {2012-06-01},
  url       = {http://www.aclweb.org/anthology/W12-2422},
  keywords  = {health applications},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Gyawali, Binod; Solorio, Thamar
UABCoRAL: A Preliminary study for Resolving the Scope of Negation Inproceedings
In: *SEM: 1st Joint Conference on Lexical and Computational Semantics, pp. 275–281, ACL, Montréal, Canada, 2012.
BibTeX | Tags:
% Conference paper (*SEM 2012): preliminary study on resolving the scope of negation (UABCoRAL).
% ACL is recorded as `publisher`, matching the other ACL entries in this file; no keywords are assigned to this entry.
@inproceedings{GyawaliEtAl:12b,
  author    = {Binod Gyawali and Thamar Solorio},
  title     = {UABCoRAL: A Preliminary study for Resolving the Scope of Negation},
  booktitle = {*SEM: 1st Joint Conference on Lexical and Computational Semantics},
  pages     = {275--281},
  publisher = {ACL},
  address   = {Montréal, Canada},
  year      = {2012},
  date      = {2012-06-01},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Bogdanova, Daria; Rosso, Paolo; Solorio, Thamar
Modelling Fixated Discourse in Chats with Cyberpedophiles Inproceedings
In: EACL 2012 Workshop on Computational Approaches to Deception Detection, pp. 86–90, ACL, Avignon, France, 2012.
BibTeX | Tags: Cyberpedophilia, Security
% Workshop paper (EACL 2012, deception detection): modelling fixated discourse in chats with cyberpedophiles.
% ACL is recorded as `publisher`, matching the other ACL workshop entries in this file.
@inproceedings{BogdanovaEtAl:12,
  author    = {Daria Bogdanova and Paolo Rosso and Thamar Solorio},
  title     = {Modelling Fixated Discourse in Chats with Cyberpedophiles},
  booktitle = {EACL 2012 Workshop on Computational Approaches to Deception Detection},
  pages     = {86--90},
  publisher = {ACL},
  address   = {Avignon, France},
  year      = {2012},
  date      = {2012-04-01},
  keywords  = {Cyberpedophilia, Security},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Ramírez-de-la-Rosa, Gabriela; Montes-y-Gómez, Manuel; Solorio, Thamar; Villaseñor-Pineda, Luis
A document is known by the company it keeps: Neighborhood consensus for short text categorization Journal Article
In: Language Resources and Evaluation, vol. 47, pp. 127–149, 2012.
BibTeX | Tags: Text Classification
% Journal article: neighborhood consensus for short text categorization.
% 47 is the journal volume, so it is stored in `volume` rather than `number`.
% NOTE(review): volume 47 appears to be the 2013 print volume; confirm whether `year` should stay 2012 (online-first date).
@article{RamirezEtAl:12,
  author    = {Gabriela Ramírez-de-la-Rosa and Manuel Montes-y-Gómez and Thamar Solorio and Luis Villaseñor-Pineda},
  title     = {A document is known by the company it keeps: Neighborhood consensus for short text categorization},
  journal   = {Language Resources and Evaluation},
  volume    = {47},
  pages     = {127--149},
  year      = {2012},
  date      = {2012-01-01},
  keywords  = {Text Classification},
  pubstate  = {published},
  tppubtype = {article}
}
Hassanali, Khairun-nisa; Liu, Yang; Solorio, Thamar
Coherence in Child Language Narratives: A Case Study of Annotation and Automatic Prediction of Coherence Inproceedings
In: Proceedings of 3rd Workshop on Child, Computer and Interaction (WOCCI 2012), 2012.
BibTeX | Tags: Clinical Applications
% Workshop paper (WOCCI 2012): annotation and automatic prediction of coherence in child language narratives.
@inproceedings{HassanaliEtAl:12,
  author    = {Khairun-nisa Hassanali and Yang Liu and Thamar Solorio},
  title     = {Coherence in Child Language Narratives: A Case Study of Annotation and Automatic Prediction of Coherence},
  booktitle = {Proceedings of 3rd Workshop on Child, Computer and Interaction (WOCCI 2012)},
  year      = {2012},
  date      = {2012-01-01},
  keywords  = {Clinical Applications},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
Hassanali, Khairun-nisa; Liu, Yang; Solorio, Thamar
Evaluating NLP Features for Automatic Prediction of Language Impairment Using Child Speech Transcripts Inproceedings
In: Proceedings of INTERSPEECH 2012, 2012.
BibTeX | Tags: Clinical Applications
% Conference paper (INTERSPEECH 2012): NLP features for predicting language impairment from child speech transcripts.
@inproceedings{HassanaliEtAl:12b,
  author    = {Khairun-nisa Hassanali and Yang Liu and Thamar Solorio},
  title     = {Evaluating NLP Features for Automatic Prediction of Language Impairment Using Child Speech Transcripts},
  booktitle = {Proceedings of INTERSPEECH 2012},
  year      = {2012},
  date      = {2012-01-01},
  keywords  = {Clinical Applications},
  pubstate  = {published},
  tppubtype = {inproceedings}
}
2011
Gabani, Keyur; Solorio, Thamar; Liu, Yang; Dollaghan, Christine
Exploring a corpus-based approach for detecting language impairment in monolingual English-speaking children Journal Article
In: Artificial Intelligence in Medicine, vol. 53, no. 3, pp. 161–170, 2011.
BibTeX | Tags: Clinical Applications
% Journal article: corpus-based detection of language impairment in monolingual English-speaking children.
@article{GabaniEtAl:11,
  author    = {Keyur Gabani and Thamar Solorio and Yang Liu and Christine Dollaghan},
  title     = {Exploring a corpus-based approach for detecting language impairment in monolingual English-speaking children},
  journal   = {Artificial Intelligence in Medicine},
  volume    = {53},
  number    = {3},
  pages     = {161--170},
  year      = {2011},
  date      = {2011-11-01},
  keywords  = {Clinical Applications},
  pubstate  = {published},
  tppubtype = {article}
}
Escalante, Hugo Jair; Montes-y-Gómez, Manuel; Solorio, Thamar
Weighted Profile Intersection Measure for Profile-based Authorship Attribution Inproceedings
In: 10th Mexican International Conference on Artificial Intelligence, pp. 232–243, Puebla, Mexico, 2011, (acceptance rate 27.5%).
BibTeX | Tags: Authorship Attribution, Security
% Conference paper (10th Mexican International Conference on Artificial Intelligence): weighted profile intersection measure for authorship attribution.
% The acceptance rate lives in `note`; the percent sign is escaped so it is typeset rather than read as a TeX comment.
@inproceedings{EscalanteEtAl:11b,
  author    = {Hugo Jair Escalante and Manuel Montes-y-Gómez and Thamar Solorio},
  title     = {Weighted Profile Intersection Measure for Profile-based Authorship Attribution},
  booktitle = {10th Mexican International Conference on Artificial Intelligence},
  pages     = {232--243},
  address   = {Puebla, Mexico},
  year      = {2011},
  date      = {2011-11-01},
  note      = {acceptance rate 27.5\%},
  keywords  = {Authorship Attribution, Security},
  pubstate  = {published},
  tppubtype = {inproceedings}
}