% Workshop paper (IberEval 2018, CEUR Workshop Proceedings vol. 2150).
% Percent signs in the abstract are escaped because BibTeX passes them through to LaTeX verbatim.
@inproceedings{fd687478e9c849fd99aeb44a6a4f6f78,
  author    = {Markov, I. and G{\'o}mez-Adorno, H. and Jasso-Rosales, M. and Sidorov, G.},
  title     = {{CIC-GIL} approach to author profiling in {Spanish} tweets: Location and occupation},
  booktitle = {Proceedings of the 3rd Workshop on Evaluation of Human Language Technologies for Iberian Languages, IberEval 2018 - co-located with 34th Conference of the Spanish Society for Natural Language Processing, SEPLN 2018},
  editor    = {Rosso, P. and {Carrillo-de-Albornoz}, J. and Gonzalo, J. and Martinez, R. and Montalvo, S.},
  series    = {CEUR Workshop Proceedings},
  volume    = {2150},
  pages     = {97--101},
  publisher = {CEUR-WS},
  year      = {2018},
  language  = {English},
  note      = {3rd Workshop on Evaluation of Human Language Technologies for Iberian Languages, IberEval 2018 ; Conference date: 18-09-2018},
  abstract  = {{\textcopyright} 2018 CEUR-WS. All Rights Reserved. We present the CIC-GIL approach to the author profiling (AP) task at MEX-A3T 2018. The task consists of two subtasks: identification of authors{\textquoteright} location (6-way) and occupation (8-way) in a corpus of Mexican Spanish tweets. We used the logistic regression algorithm trained on typed character n-grams, function-word n-grams, and regionalisms for location identification, and typed character n-grams with several modifications for occupation identification. Our best run showed F1-macro score of 73.63\% for location and 48.94\% for occupation identification. The results are competitive with other participating teams; in particular, our best run was ranked fourth in the shared task.},
}