@inproceedings{1219524da73149a8823e959a5a67c4df,
title = "Comparing Different Dictionary-Based Classifiers for the Classification of Volatile Compounds Measured with an E-nose",
abstract = "Electronic noses (e-noses) are devices that mimic the biological sense of olfaction to recognize gaseous samples in a very fast and accurate manner, being applicable in a multitude of scenarios. E-noses are composed of an array of gas sensors, a signal acquisition unit and a pattern recognition unit including automatic classifiers based on machine learning. In a previous work, a text-based approach was developed to classify volatile organic compounds (VOCs) using as input signals from an in-house developed e-nose. This text-based algorithm was compared with a 1-nearest neighbor classifier with euclidean distance (1-NN ED). In this work we studied other text-based approaches that relied in the Bag of Words model and compared it with the previous approach that relied in the term frequency-inverse document frequency (TF-IDF) model and other traditional text-mining classifiers, namely the naive bayes and linear Support Vector Machines (SVM). The results show that the TF-IDF model is more robust overall when compared with the Bag of Words (BoW) model. An average F1-score of 0.84 and 0.70 was achieved for the TF-IDF model with a linear SVM for two distinct gas sensor formulations (5CB and 8CB, respectively), while an F1-score of 0.66 and 0.71 was achieved for the BoW model for the same formulations. The text-based approaches appeared to be less reliable than the traditional 1-NN ED method.",
keywords = "Bag of words, Classification, Electronic nose, Euclidean distance, Morphology, TFIDF, Volatile organic compounds",
author = "Rita Alves and Jo{\~a}o Rodrigues and Efthymia Ramou and Palma, {Susana I. C. J.} and Roque, {Ana C. A.} and Hugo Gamboa",
note = "Funding Information: Acknowledgements. This project has received funding from the European Research Council (ERC) under the EU Horizon 2020 research and innovation programme [grant reference SCENT-ERC-2014-STG-639123, (2015-2022)] and by national funds from FCT - Funda{\c c}{\~a}o para a Ci{\^e}ncia e a Tecnologia, I.P., in the scope of the project UIDP/04378/2020 and UIDB/04378/2020 of the Research Unit on Applied Molecular Biosciences - UCIBIO and the project LA/P/0140/2020 of the Associate Laboratory Institute for Health and Bioeconomy - i4HB, which is financed by national funds from financed by FCT/MEC (UID/Multi/04378/2019). This work was also partly supported by Funda{\c c}{\~a}o para a Ci{\^e}ncia e Tecnologia, under PhD grant PD/BDE/142816/2018. Publisher Copyright: {\textcopyright} 2023, The Author(s), under exclusive license to Springer Nature Switzerland AG.; Proceedings of the 15th International Conference on Biomedical Engineering Systems and Technologies, BIOSTEC 2022 ; Conference date: 09-02-2022 Through 11-02-2022",
year = "2023",
doi = "10.1007/978-3-031-38854-5_7",
language = "English",
isbn = "978-3-031-38853-8",
series = "Communications in Computer and Information Science",
publisher = "Springer",
pages = "121--140",
editor = "Roque, {Ana Cec{\'i}lia A.} and Denis Gracanin and Ronny Lorenz and Athanasios Tsanas and Nathalie Bier and Ana Fred and Hugo Gamboa",
booktitle = "Biomedical Engineering Systems and Technologies",
address = "Netherlands",
}