% Conference paper in a Springer proceedings volume (PROPOR 2016, see the note field).
% The machine-generated citation key is kept as-is so existing citations keep resolving.
% In the note field the hash sign is written with a backslash because a bare hash
% is a macro-parameter character in LaTeX and would abort typesetting.
@inproceedings{467723aa363d4743819b9b8e45b66c48,
  author    = {Costa, {\^A}ngela and Coheur, Luisa},
  title     = {Towards a Statistical-Enriched Corpus Containing {Portuguese} Collocations in Use: Reviewing Possible Extraction Tools},
  booktitle = {Computational Processing of the Portuguese Language},
  editor    = {Silva, Jo{\~a}o and Ribeiro, Ricardo and Quaresma, Paulo and Adami, Andr{\'e} and Branco, Ant{\'o}nio},
  series    = {Lecture Notes in Artificial Intelligence},
  volume    = {9727},
  pages     = {319--329},
  publisher = {Springer},
  address   = {Cham},
  year      = {2016},
  doi       = {10.1007/978-3-319-41552-9_32},
  isbn      = {978-3-319-41551-2},
  language  = {English},
  keywords  = {Collocations, Wortschatz, DeepDict, CRPC, Sketch engine},
  abstract  = {Collocations are a main problem for any natural language processing task, from machine translation to summarization. With the goal of building a corpus with collocations, enriched with statistical information about them, we survey, in this paper, four tools for extracting collocations. These tools allow us to collect sentences with collocations, and also to gather statistics on this particular type of co-ocurrences, like Mutual Information and Log likelihood values.},
  note      = {info:eu-repo/grantAgreement/FCT/5876/147316/PT\# UID/LIN/03213/2013; 12th International Conference on Computational Processing of the Portuguese Language, PROPOR 2016 ; Conference date: 13-07-2016 Through 15-07-2016},
}