@inproceedings{32697ea5015c4682acd443ccb034fc30,
title = "A new European Portuguese corpus for the study of Psychosis through speech analysis",
abstract = "Psychosis is a clinical syndrome characterized by the presence of symptoms such as hallucinations, thought disorder and disorganized speech. Several studies have used machine learning, combined with speech and natural language processing methods to aid in the diagnosis process of this disease. This paper describes the creation of the first European Portuguese corpus for the identification of the presence of speech characteristics of psychosis, which contains samples of 92 participants, 56 controls and 36 individuals diagnosed with psychosis and medicated. The corpus was used in a set of experiments that allowed identifying the most promising feature set to perform the classification: the combination of acoustic and speech metric features. Several classifiers were implemented to study which ones entailed the best performance depending on the task and feature set. The most promising results obtained for the entire corpus were achieved when identifying individuals with a Multi-Layer Perceptron classifier and reached an 87.5% accuracy. Focusing on the gender dependent results, the overall best results were 90.9% and 82.9% accuracy, for female and male subjects respectively. Lastly, the experiments performed lead us to conjecture that spontaneous speech presents more identifiable characteristics than read speech to differentiate healthy and patients diagnosed with psychosis.",
keywords = "Machine Learning, Psychosis, Schizophrenia, Speech Analysis",
author = "Maria Forj{\'o} and Daniel Neto and Alberto Abad and Pinto, {H. Sofia} and Joaquim Gago",
note = "Funding Information: We thank Dra. Ana Moreira for her insight and support during the creation of the protocol and the recording process of the patients corpus subset at CHLO. We also thank the staff from Unidade de Sa{\'u}de Mental de Oeiras - Centro Hospi-talar Lisboa Ocidental for their help and support during the patients corpus recording process. This work was supported by national funds through Fundac¸{\~a}o para a Ci{\^e}ncia e a Tec-nologia (FCT) under project UIDB/50021/2020. Publisher Copyright: {\textcopyright} European Language Resources Association (ELRA), licensed under CC-BY-NC-4.0.; 13th International Conference on Language Resources and Evaluation Conference, LREC 2022 ; Conference date: 20-06-2022 Through 25-06-2022",
year = "2022",
language = "English",
series = "2022 Language Resources and Evaluation Conference, LREC 2022",
publisher = "European Language Resources Association (ELRA)",
pages = "7298--7304",
editor = "Nicoletta Calzolari and Frederic Bechet and Philippe Blache and Khalid Choukri and Christopher Cieri and Thierry Declerck and Sara Goggi and Hitoshi Isahara and Bente Maegaard and Joseph Mariani and Helene Mazo and Jan Odijk and Stelios Piperidis",
booktitle = "2022 Language Resources and Evaluation Conference, LREC 2022",
}