Publications
OUR RESEARCH
Scientific Publications
Here you can find the comprehensive list of publications from the members of the Research Center on Computer Vision and eXtended Reality (xRAI).
Use the tag cloud to filter papers based on specific research topics, or use the menus to filter by year, type of publication, or authors.
For each paper, you have the option to view additional details such as the Abstract, Links, and BibTex record.
Research is formalized curiosity. It is poking and prying with a purpose
Zora Neale Hurston
2025
Krilavičius, Tomas; Paolis, Lucio Tommaso De; Luca, Valerio De; Spjut, Josef
eXtended Reality and Artificial Intelligence in Medicine and Rehabilitation Journal Article
In: Information Systems Frontiers, 2025, ISSN: 13873326.
Abstract | Links | BibTeX | Tags: 3D modeling, Artificial Intelligence, Augmented Reality, Extended reality, Minimally-invasive surgery, Personalized medicine, Pre-operative planning, Surgery
@article{krilavicius_extended_2025,
title = {eXtended Reality and Artificial Intelligence in Medicine and Rehabilitation},
author = {Tomas Krilavičius and Lucio Tommaso De Paolis and Valerio De Luca and Josef Spjut},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85217159420&doi=10.1007%2fs10796-025-10580-8&partnerID=40&md5=3bc0bae0925d3f2f6d1a6e1e659b9aae},
doi = {10.1007/s10796-025-10580-8},
issn = {13873326},
year = {2025},
date = {2025-01-01},
journal = {Information Systems Frontiers},
abstract = {This special issue focuses on the application of eXtended Reality (XR) technologies—comprising Virtual Reality (VR), Augmented Reality (AR), and Mixed Reality (MR)—and Artificial Intelligence (AI) in the fields of medicine and rehabilitation. AR provides support in minimally invasive surgery, where it visualises internal anatomical structures on the patient’s body and provides real-time feedback to improve accuracy, keep the surgeon’s attention and reduce the risk of errors. Furthermore, XR technologies can be used to develop applications for pre-operative planning or for training surgeons through serious games. AI finds applications both in medical image processing, for the recognition of anatomical structures and the reconstruction of 3D models, and in the analysis of biological data for patient monitoring and disease diagnosis. In rehabilitation, XR and AI can enable personalised therapy plans, increase patient engagement through immersive environments and provide real-time feedback to improve recovery outcomes. The papers in this special issue deal with rehabilitation through serious games, AI-enhanced XR applications for healthcare, digital twins and the analysis of bio/neuro-adaptive signals. © The Author(s), under exclusive licence to Springer Science+Business Media, LLC, part of Springer Nature 2025.},
keywords = {3D modeling, Artificial Intelligence, Augmented Reality, Extended reality, Minimally-invasive surgery, Personalized medicine, Pre-operative planning, Surgery},
pubstate = {published},
tppubtype = {article}
}
2024
Agostinelli, Thomas; Generosi, Andrea; Ceccacci, Silvia; Mengoni, Maura
Validation of computer vision-based ergonomic risk assessment tools for real manufacturing environments Journal Article
In: Scientific Reports, vol. 14, no. 1, pp. 27785, 2024, ISSN: 2045-2322.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Computer Vision and Pattern Recognition, Human-Centered Design, Industry 4.0
@article{agostinelli_validation_2024,
title = {Validation of computer vision-based ergonomic risk assessment tools for real manufacturing environments},
author = {Thomas Agostinelli and Andrea Generosi and Silvia Ceccacci and Maura Mengoni},
url = {https://www.nature.com/articles/s41598-024-79373-4},
doi = {10.1038/s41598-024-79373-4},
issn = {2045-2322},
year = {2024},
date = {2024-11-01},
urldate = {2024-12-28},
journal = {Scientific Reports},
volume = {14},
number = {1},
pages = {27785},
abstract = {This study contributes to understanding semi-automated ergonomic risk assessments in industrial manufacturing environments, proposing a practical tool for enhancing worker safety and operational efficiency. In the Industry 5.0 era, the human-centric approach in manufacturing is crucial, especially considering the aging workforce and the dynamic nature of the entire modern industrial sector, today integrating digital technology, automation, and sustainable practices to enhance productivity and environmental responsibility. This approach aims to adapt work conditions to individual capabilities, addressing the high incidence of work-related musculoskeletal disorders (MSDs). The traditional, subjective methods of ergonomic assessment are inadequate for dynamic settings, highlighting the need for affordable, automatic tools for continuous monitoring of workers’ postures to evaluate ergonomic risks effectively during tasks. To enable this perspective, 2D RGB Motion Capture (MoCap) systems based on computer vision currently seem the technologies of choice, given their low intrusiveness, cost, and implementation effort. However, the reliability and applicability of these systems in the dynamic and varied manufacturing environment remain uncertain. This research benchmarks various literature proposed MoCap tools and examines the viability of MoCap systems for ergonomic risk assessments in Industry 5.0 by exploiting one of the benchmarked semi-automated, low-cost and non-intrusive 2D RGB MoCap system, capable of continuously monitoring and analysing workers’ postures. By conducting experiments across varied manufacturing environments, this research evaluates the system’s effectiveness in assessing ergonomic risks and its adaptability to different production lines. Results reveal that the accuracy of risk assessments varies by specific environmental conditions and workstation setups. Although these systems are not yet optimized for expert-level risk certification, they offer significant potential for enhancing workplace safety and efficiency by providing continuous posture monitoring. Future improvements could explore advanced computational techniques like machine learning to refine ergonomic assessments further.},
keywords = {Artificial Intelligence, Computer Vision and Pattern Recognition, Human-Centered Design, Industry 4.0},
pubstate = {published},
tppubtype = {article}
}
Recupito, Gilberto; Pecorelli, Fabiano; Catolino, Gemma; Lenarduzzi, Valentina; Taibi, Davide; Nucci, Dario Di; Palomba, Fabio
Technical debt in AI-enabled systems: On the prevalence, severity, impact, and management strategies for code and architecture Journal Article
In: Journal of Systems and Software, vol. 216, pp. 112151, 2024, ISSN: 0164-1212.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Software Engineering, Technical Debt Management
@article{recupitoTechnicalDebtAIenabled2024,
title = {Technical debt in AI-enabled systems: On the prevalence, severity, impact, and management strategies for code and architecture},
author = {Gilberto Recupito and Fabiano Pecorelli and Gemma Catolino and Valentina Lenarduzzi and Davide Taibi and Dario Di Nucci and Fabio Palomba},
url = {https://linkinghub.elsevier.com/retrieve/pii/S0164121224001961},
doi = {10.1016/j.jss.2024.112151},
issn = {0164-1212},
year = {2024},
date = {2024-10-01},
urldate = {2024-07-07},
journal = {Journal of Systems and Software},
volume = {216},
pages = {112151},
abstract = {Context: Artificial Intelligence (AI) is pervasive in several application domains and promises to be even more diffused in the next decades. Developing high-quality AI-enabled systems — software systems embedding one or multiple AI components, algorithms, and models — could introduce critical challenges for mitigating specific risks related to the systems' quality. Such development alone is insufficient to fully address socio-technical consequences and the need for rapid adaptation to evolutionary changes. Recent work proposed the concept of AI technical debt, a potential liability concerned with developing AI-enabled systems whose impact can affect the overall systems' quality. While the problem of AI technical debt is rapidly gaining the attention of the software engineering research community, scientific knowledge that contributes to understanding and managing the matter is still limited. Objective: In this paper, we leverage the expertise of practitioners to offer useful insights to the research community, aiming to enhance researchers' awareness about the detection and mitigation of AI technical debt. Our ultimate goal is to empower practitioners by providing them with tools and methods. Additionally, our study sheds light on novel aspects that practitioners might not be fully acquainted with, contributing to a deeper understanding of the subject. Method: We develop a survey study featuring 53 AI practitioners, in which we collect information on the practical prevalence, severity, and impact of AI technical debt issues affecting the code and the architecture other than the strategies applied by practitioners to identify and mitigate them. Results: The key findings of the study reveal the multiple impacts that AI technical debt issues may have on the quality of AI-enabled systems (e.g., the high negative impact that Undeclared consumers has on security, whereas Jumbled Model Architecture can induce the code to be hard to maintain) and the little support practitioners have to deal with them, limited to apply manual effort for identification and refactoring. Conclusion: We conclude the article by distilling lessons learned and actionable insights for researchers.},
keywords = {Artificial Intelligence, Software Engineering, Technical Debt Management},
pubstate = {published},
tppubtype = {article}
}
Rausa, Maria; Gaglio, Salvatore; Augello, Agnese; Caggianese, Giuseppe; Franchini, Silvia; Gallo, Luigi; Sabatucci, Luca
Enriching Metaverse with Memories Through Generative AI: A Case Study Proceedings Article
In: 2024 IEEE International Conference on Metrology for eXtended Reality, Artificial Intelligence and Neural Engineering (MetroXRAINE), pp. 371–376, 2024.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Metaverse, Modeling, Virtual Reality
@inproceedings{rausa_enriching_2024,
title = {Enriching Metaverse with Memories Through Generative AI: A Case Study},
author = {Maria Rausa and Salvatore Gaglio and Agnese Augello and Giuseppe Caggianese and Silvia Franchini and Luigi Gallo and Luca Sabatucci},
url = {https://ieeexplore.ieee.org/abstract/document/10796338},
doi = {10.1109/MetroXRAINE62247.2024.10796338},
year = {2024},
date = {2024-10-01},
urldate = {2025-01-08},
booktitle = {2024 IEEE International Conference on Metrology for eXtended Reality, Artificial Intelligence and Neural Engineering (MetroXRAINE)},
pages = {371–376},
abstract = {The paper introduces MetaMemory, an approach to generate 3D models from either textual descriptions or photographs of objects, offering dual input modes for enhanced representation. MetaMemory's architecture is discussed presenting the tools employed in extracting the object from the image, generating the 3D mesh from texts or images, and visualizing the object reconstruction in an immersive scenario. Afterwards, a case study in which we experienced reconstructing memories of ancient crafts is examined together with the achieved results, by highlighting current limitations and potential applications.},
keywords = {Artificial Intelligence, Metaverse, Modeling, Virtual Reality},
pubstate = {published},
tppubtype = {inproceedings}
}
Aversano, Lerina; Bernardi, Mario Luca; Calgano, Vincenzo; Cimitile, Marta; Esposito, Concetta; Iammarino, Martina; Pisco, Marco; Spaziani, Sara; Verdone, Chiara
Using Machine Learning for Classification of Cancer Cells from Raman Spectroscopy Proceedings Article
In: pp. 15–24, 2024, ISBN: 978-989-758-584-5.
Abstract | Links | BibTeX | Tags: Classification, Healthcare, Machine Learning
@inproceedings{aversano_using_2024,
title = {Using Machine Learning for Classification of Cancer Cells from Raman Spectroscopy},
author = {Lerina Aversano and Mario Luca Bernardi and Vincenzo Calgano and Marta Cimitile and Concetta Esposito and Martina Iammarino and Marco Pisco and Sara Spaziani and Chiara Verdone},
url = {https://www.scitepress.org/Link.aspx?doi=10.5220/0011142600003277},
doi = {10.5220/0011142600003277},
isbn = {978-989-758-584-5},
year = {2024},
date = {2024-10-01},
urldate = {2024-10-02},
pages = {15–24},
abstract = {Since cancer represents one of the leading causes of death worldwide, the development of approaches capable of discerning healthy from diseased cells would be of fundamental importance to support diagnostic and screening techniques. Raman spectroscopy is the most effective molecular analysis technique currently available and provides information on the molecular composition, bonds, chemical environment, phase, and crystalline structure of the samples under examination. This work exploits a combination of Raman spectroscopy and machine learning models to discriminate patients’ liver cells between tumor and non-tumor. The research uses real patient data, provided by the Center for Nanophotonics and Optoelectronics for Human Health (CNOS), which analyzed the cells of a patient with liver cancer. Specifically, the dataset has been built through a long data collection process, which first involved the analysis of the cells with Raman spectroscopy and then the training of two classifiers, Decision Tree and Random Forest. The results show good performance for the trained classifiers, especially those relating to the Random Forest, which reaches an accuracy of 90%.},
keywords = {Classification, Healthcare, Machine Learning},
pubstate = {published},
tppubtype = {inproceedings}
}
Mennella, Ciro; Esposito, Massimo; Pietro, Giuseppe De; Maniscalco, Umberto
Promoting fairness in activity recognition algorithms for patient’s monitoring and evaluation systems in healthcare Journal Article
In: Computers in Biology and Medicine, vol. 179, pp. 108826, 2024, ISSN: 00104825.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Bias, Deep Learning, Motion analysis, Rehabilitation, Time-series
@article{mennella_promoting_2024,
title = {Promoting fairness in activity recognition algorithms for patient’s monitoring and evaluation systems in healthcare},
author = {Ciro Mennella and Massimo Esposito and Giuseppe De Pietro and Umberto Maniscalco},
url = {https://linkinghub.elsevier.com/retrieve/pii/S0010482524009119},
doi = {10.1016/j.compbiomed.2024.108826},
issn = {00104825},
year = {2024},
date = {2024-09-01},
urldate = {2024-07-21},
journal = {Computers in Biology and Medicine},
volume = {179},
pages = {108826},
abstract = {Researchers face the challenge of defining subject selection criteria when training algorithms for human activity recognition tasks. The ongoing uncertainty revolves around which characteristics should be considered to ensure algorithmic robustness across diverse populations. This study aims to address this challenge by conducting an analysis of heterogeneity in the training data to assess the impact of physical characteristics and soft-biometric attributes on activity recognition performance.
The performance of various state-of-the-art deep neural network architectures (tCNN, hybrid-LSTM, Transformer model) processing time-series data using the IntelliRehab (IRDS) dataset was evaluated. By intentionally introducing bias into the training data based on human characteristics, the objective is to identify the characteristics that influence algorithms in motion analysis.
Experimental findings reveal that the CNN-LSTM model achieved the highest accuracy, reaching 88%. Moreover, models trained on heterogeneous distributions of disability attributes exhibited notably higher accuracy, reaching 51%, compared to those not considering such factors, which scored an average of 33%. These evaluations underscore the significant influence of subjects’ characteristics on activity recognition performance, providing valuable insights into the algorithm’s robustness across diverse populations.
This study represents a significant step forward in promoting fairness and trustworthiness in artificial intelligence by quantifying representation bias in multi-channel time-series activity recognition data within the healthcare domain.},
keywords = {Artificial Intelligence, Bias, Deep Learning, Motion analysis, Rehabilitation, Time-series},
pubstate = {published},
tppubtype = {article}
}
The performance of various state-of-the-art deep neural network architectures (tCNN, hybrid-LSTM, Transformer model) processing time-series data using the IntelliRehab (IRDS) dataset was evaluated. By intentionally introducing bias into the training data based on human characteristics, the objective is to identify the characteristics that influence algorithms in motion analysis.
Experimental findings reveal that the CNN-LSTM model achieved the highest accuracy, reaching 88%. Moreover, models trained on heterogeneous distributions of disability attributes exhibited notably higher accuracy, reaching 51%, compared to those not considering such factors, which scored an average of 33%. These evaluations underscore the significant influence of subjects’ characteristics on activity recognition performance, providing valuable insights into the algorithm’s robustness across diverse populations.
This study represents a significant step forward in promoting fairness and trustworthiness in artificial intelligence by quantifying representation bias in multi-channel time-series activity recognition data within the healthcare domain.
Melillo, Antonio; Rachedi, Sarah; Caggianese, Giuseppe; Gallo, Luigi; Maiorano, Patrizia; Gimigliano, Francesca; Lucidi, Fabio; Pietro, Giuseppe De; Guida, Maurizio; Giordano, Antonio; Chirico, Andrea
In: Games for Health Journal, pp. g4h.2023.0202, 2024, ISSN: 2161-783X, 2161-7856.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Labor, Pain, User study, Virtual Reality
@article{melillo_synchronization_2024,
title = {Synchronization of a Virtual Reality Scenario to Uterine Contractions for Labor Pain Management: Development Study and Randomized Controlled Trial},
author = {Antonio Melillo and Sarah Rachedi and Giuseppe Caggianese and Luigi Gallo and Patrizia Maiorano and Francesca Gimigliano and Fabio Lucidi and Giuseppe De Pietro and Maurizio Guida and Antonio Giordano and Andrea Chirico},
url = {https://www.liebertpub.com/doi/10.1089/g4h.2023.0202},
doi = {10.1089/g4h.2023.0202},
issn = {2161-783X, 2161-7856},
year = {2024},
date = {2024-06-01},
urldate = {2024-07-21},
journal = {Games for Health Journal},
pages = {g4h.2023.0202},
abstract = {Background: Labor is described as one of the most painful events women can experience through their lives, and labor pain shows unique features and rhythmic fluctuations.
Purpose: The present study aims to evaluate virtual reality (VR) analgesic interventions for active labor with biofeedback-based VR technologies synchronized to uterine activity.
Materials and Methods: We developed a VR system modeled on uterine contractions by connecting it to cardiotocographic equipment. We conducted a randomized controlled trial on a sample of 74 cases and 80 controls during active labor.
Results: Results of the study showed a significant reduction of pain scores compared with both preintervention scores and to control group scores; a significant reduction of anxiety levels both compared with preintervention assessment and to control group and significant reduction in fear of labor experience compared with controls.
Conclusion: VR may be considered as an effective nonpharmacological analgesic technique for the treatment of pain and anxiety and fear of childbirth experience during labor. The developed system could improve personalization of care, modulating the multisensory stimulation tailored to labor progression. Further studies are needed to compare the synchronized VR system to uterine activity and unsynchronized VR interventions.},
keywords = {Artificial Intelligence, Labor, Pain, User study, Virtual Reality},
pubstate = {published},
tppubtype = {article}
}
Purpose: The present study aims to evaluate virtual reality (VR) analgesic interventions for active labor with biofeedback-based VR technologies synchronized to uterine activity.
Materials and Methods: We developed a VR system modeled on uterine contractions by connecting it to cardiotocographic equipment. We conducted a randomized controlled trial on a sample of 74 cases and 80 controls during active labor.
Results: Results of the study showed a significant reduction of pain scores compared with both preintervention scores and to control group scores; a significant reduction of anxiety levels both compared with preintervention assessment and to control group and significant reduction in fear of labor experience compared with controls.
Conclusion: VR may be considered as an effective nonpharmacological analgesic technique for the treatment of pain and anxiety and fear of childbirth experience during labor. The developed system could improve personalization of care, modulating the multisensory stimulation tailored to labor progression. Further studies are needed to compare the synchronized VR system to uterine activity and unsynchronized VR interventions.
Generosi, Andrea; Bruschi, Valeria; Cecchi, Stefania; Dourou, Nefeli Aikaterini; Montanari, Roberto; Mengoni, Maura
An Innovative System for Driver Monitoring and Vehicle Sound Interaction Proceedings Article
In: 2024 IEEE International Workshop on Metrology for Automotive (MetroAutomotive), pp. 159–164, IEEE, Bologna, Italy, 2024, ISBN: 9798350384987.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Deep Learning, Human Computer Interaction
@inproceedings{generosi_innovative_2024,
title = {An Innovative System for Driver Monitoring and Vehicle Sound Interaction},
author = {Andrea Generosi and Valeria Bruschi and Stefania Cecchi and Nefeli Aikaterini Dourou and Roberto Montanari and Maura Mengoni},
url = {https://ieeexplore.ieee.org/document/10615427/},
doi = {10.1109/MetroAutomotive61329.2024.10615427},
isbn = {9798350384987},
year = {2024},
date = {2024-06-01},
urldate = {2024-12-28},
booktitle = {2024 IEEE International Workshop on Metrology for Automotive (MetroAutomotive)},
pages = {159–164},
publisher = {IEEE},
address = {Bologna, Italy},
abstract = {An important aspect of Advanced Driver-Assistance Systems is the real-time monitoring of the driver and the interaction with him/her. In this scenario, the proposed work is focused on the development of an innovative system capable of analyzing the driver’s state and interact with him/her in a innovative way. In particular, the driver monitoring is obtained through the implementation of a multimodal approach that exploits deep learning and data fusion techniques while the interaction is achieved through sound signals elaborated with digital signal processing algorithm for the creation of an immersive scenario.},
keywords = {Artificial Intelligence, Deep Learning, Human Computer Interaction},
pubstate = {published},
tppubtype = {inproceedings}
}
Raikov, Aleksandr; Giretti, Alberto; Pirani, Massimiliano; Spalazzi, Luca; Guo, Meng
Accelerating human–computer interaction through convergent conditions for LLM explanation Journal Article
In: Frontiers in Artificial Intelligence, vol. 7, 2024, ISSN: 2624-8212, (Publisher: Frontiers).
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Causal Loop Dynamics, Cognitive semantics, Eigenform, Explainable AI, Hybrid reality, LLM
@article{raikovAcceleratingHumanComputer2024,
title = {Accelerating human–computer interaction through convergent conditions for LLM explanation},
author = {Aleksandr Raikov and Alberto Giretti and Massimiliano Pirani and Luca Spalazzi and Meng Guo},
url = {https://www.frontiersin.org/journals/artificial-intelligence/articles/10.3389/frai.2024.1406773/full},
doi = {10.3389/frai.2024.1406773},
issn = {2624-8212},
year = {2024},
date = {2024-05-01},
urldate = {2024-10-05},
journal = {Frontiers in Artificial Intelligence},
volume = {7},
abstract = {<p>The article addresses the accelerating human–machine interaction using the large language model (LLM). It goes beyond the traditional logical paradigms of explainable artificial intelligence (XAI) by considering poor-formalizable cognitive semantical interpretations of LLM. XAI is immersed in a hybrid space, where humans and machines have crucial distinctions during the digitisation of the interaction process. The author's convergent methodology ensures the conditions for making XAI purposeful and sustainable. This methodology is based on the inverse problem-solving method, cognitive modeling, genetic algorithm, neural network, causal loop dynamics, and eigenform realization. It has been shown that decision-makers need to create unique structural conditions for information processes, using LLM to accelerate the convergence of collective problem solving. The implementations have been carried out during the collective strategic planning in situational centers. The study is helpful for the advancement of explainable LLM in many branches of economy, science and technology.</p>},
note = {Publisher: Frontiers},
keywords = {Artificial Intelligence, Causal Loop Dynamics, Cognitive semantics, Eigenform, Explainable AI, Hybrid reality, LLM},
pubstate = {published},
tppubtype = {article}
}
Jamali, Reza; Generosi, Andrea; Villafan, Josè Yuri; Mengoni, Maura; Pelagalli, Leonardo; Battista, Gianmarco; Martarelli, Milena; Chiariotti, Paolo; Mansi, Silvia Angela; Arnesano, Marco; Castellini, Paolo
Facial Expression Recognition for Measuring Jurors’ Attention in Acoustic Jury Tests Journal Article
In: Sensors, vol. 24, no. 7, pp. 2298, 2024, ISSN: 1424-8220.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Computer Vision and Pattern Recognition, Deep Learning, Emotion Recognition
@article{jamali_facial_2024,
title = {Facial Expression Recognition for Measuring Jurors’ Attention in Acoustic Jury Tests},
author = {Reza Jamali and Andrea Generosi and Josè Yuri Villafan and Maura Mengoni and Leonardo Pelagalli and Gianmarco Battista and Milena Martarelli and Paolo Chiariotti and Silvia Angela Mansi and Marco Arnesano and Paolo Castellini},
url = {https://www.mdpi.com/1424-8220/24/7/2298},
doi = {10.3390/s24072298},
issn = {1424-8220},
year = {2024},
date = {2024-04-01},
urldate = {2024-12-28},
journal = {Sensors},
volume = {24},
number = {7},
pages = {2298},
abstract = {The perception of sound greatly impacts users’ emotional states, expectations, affective relationships with products, and purchase decisions. Consequently, assessing the perceived quality of sounds through jury testing is crucial in product design. However, the subjective nature of jurors’ responses may limit the accuracy and reliability of jury test outcomes. This research explores the utility of facial expression analysis in jury testing to enhance response reliability and mitigate subjectivity. Some quantitative indicators allow the research hypothesis to be validated, such as the correlation between jurors’ emotional responses and valence values, the accuracy of jury tests, and the disparities between jurors’ questionnaire responses and the emotions measured by FER (facial expression recognition). Specifically, analysis of attention levels during different statuses reveals a discernible decrease in attention levels, with 70 percent of jurors exhibiting reduced attention levels in the ‘distracted’ state and 62 percent in the ‘heavy-eyed’ state. On the other hand, regression analysis shows that the correlation between jurors’ valence and their choices in the jury test increases when considering the data where the jurors are attentive. The correlation highlights the potential of facial expression analysis as a reliable tool for assessing juror engagement. The findings suggest that integrating facial expression recognition can enhance the accuracy of jury testing in product design by providing a more dependable assessment of user responses and deeper insights into participants’ reactions to auditory stimuli.},
keywords = {Artificial Intelligence, Computer Vision and Pattern Recognition, Deep Learning, Emotion Recognition},
pubstate = {published},
tppubtype = {article}
}
Dubbioso, Raffaele; Spisto, Myriam; Verde, Laura; Iuzzolino, Valentina Virginia; Senerchia, Gianmaria; Pietro, Giuseppe De; Falco, Ivanoe De; Sannino, Giovanna
Precision medicine in ALS: Identification of new acoustic markers for dysarthria severity assessment Journal Article
In: Biomedical Signal Processing and Control, vol. 89, pp. 105706, 2024, ISSN: 17468094.
Abstract | Links | BibTeX | Tags: Amyotrophic lateral sclerosis (ALS), Artificial Intelligence, Bulbar functions, Classification, Dysarthria, Precision medicine
@article{dubbioso_precision_2024,
title = {Precision medicine in ALS: Identification of new acoustic markers for dysarthria severity assessment},
author = {Raffaele Dubbioso and Myriam Spisto and Laura Verde and Valentina Virginia Iuzzolino and Gianmaria Senerchia and Giuseppe De Pietro and Ivanoe De Falco and Giovanna Sannino},
url = {https://linkinghub.elsevier.com/retrieve/pii/S1746809423011394},
doi = {10.1016/j.bspc.2023.105706},
issn = {17468094},
year = {2024},
date = {2024-03-01},
urldate = {2024-07-21},
journal = {Biomedical Signal Processing and Control},
volume = {89},
pages = {105706},
abstract = {Amyotrophic lateral sclerosis (ALS) is a fatal neurodegenerative disease affecting motorneurons of the bulbar, cervical, thoracic, or lumbar segments. Bulbar presentation is a devastating characteristic that impairs patients’ ability to communicate and is linked to shorter survival. Early acoustic manifestation of voice symptoms, such as dysarthria, is very variable, making its detection and classification challenging, both by human specialists and automatic systems. In this context, precision medicine, defined as “prevention and treatment strategies that take individual variability into account”, has gained a great interest in the ALS community. Specifically, the use of innovative Artificial Intelligence techniques, such as Machine Learning, plays a pivotal role in finding specific patterns in the data set to help neurologists in clinical decision-making. Therefore, the main objective of this study was to find new markers, and new patterns, to promptly detect the possible presence of dysarthria and to correctly classify its severity. We have performed an acoustic analysis on different voice signals of various degrees of impairment acquired during outpatient visits at the ALS center of the “Federico II” University Hospital. From the collected signals, a new database containing different acoustic parameters was realized, on which several experiments were performed. The study led us to the discovery of markers that helped to develop a decision tree that separated healthy subjects from patients and, among patients, those with different severity of dysarthria. This model achieved good results in terms of dysarthria classification accuracy, 86.6%, which is excellent considering the small number of subjects in the data set.},
keywords = {Amyotrophic lateral sclerosis (ALS), Artificial Intelligence, Bulbar functions, Classification, Dysarthria, Precision medicine},
pubstate = {published},
tppubtype = {article}
}
Pontillo, Valeria; d'Aragona, Dario Amoroso; Pecorelli, Fabiano; Nucci, Dario Di; Ferrucci, Filomena; Palomba, Fabio
Machine learning-based test smell detection Journal Article
In: Empirical Software Engineering, vol. 29, no. 2, pp. 55, 2024, ISSN: 1382-3256, 1573-7616.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Code Smell Detection, Software Engineering, Technical Debt Management
@article{pontilloMachineLearningbasedTest2024,
title = {Machine learning-based test smell detection},
author = {Valeria Pontillo and Dario Amoroso d'Aragona and Fabiano Pecorelli and Dario Di Nucci and Filomena Ferrucci and Fabio Palomba},
url = {https://link.springer.com/10.1007/s10664-023-10436-2},
doi = {10.1007/s10664-023-10436-2},
issn = {1382-3256, 1573-7616},
year = {2024},
date = {2024-03-01},
urldate = {2024-07-07},
journal = {Empirical Software Engineering},
volume = {29},
number = {2},
pages = {55},
abstract = {Test smells are symptoms of sub-optimal design choices adopted when developing test cases. Previous studies have proved their harmfulness for test code maintainability and effectiveness. Therefore, researchers have been proposing automated, heuristic-based techniques to detect them. However, the performance of these detectors is still limited and dependent on tunable thresholds. We design and experiment with a novel test smell detection approach based on machine learning to detect four test smells. First, we develop the largest dataset of manually-validated test smells to enable experimentation. Afterward, we train six machine learners and assess their capabilities in within- and cross-project scenarios. Finally, we compare the ML-based approach with state-of-the-art heuristic-based techniques. The key findings of the study report a negative result. The performance of the machine learning-based detector is significantly better than heuristic-based techniques, but none of the learners able to overcome an average F-Measure of 51%. We further elaborate and discuss the reasons behind this negative result through a qualitative investigation into the current issues and challenges that prevent the appropriate detection of test smells, which allowed us to catalog the next steps that the research community may pursue to improve test smell detection techniques.},
keywords = {Artificial Intelligence, Code Smell Detection, Software Engineering, Technical Debt Management},
pubstate = {published},
tppubtype = {article}
}
Mennella, Ciro; Maniscalco, Umberto; Pietro, Giuseppe De; Esposito, Massimo
Ethical and regulatory challenges of AI technologies in healthcare: A narrative review Journal Article
In: Heliyon, vol. 10, no. 4, pp. e26297, 2024, ISSN: 24058440.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Decision-Making, Ethics, Healthcare, Regulatory guidelines, Technologies
@article{mennella_ethical_2024,
title = {Ethical and regulatory challenges of AI technologies in healthcare: A narrative review},
author = {Ciro Mennella and Umberto Maniscalco and Giuseppe De Pietro and Massimo Esposito},
url = {https://linkinghub.elsevier.com/retrieve/pii/S2405844024023284},
doi = {10.1016/j.heliyon.2024.e26297},
issn = {24058440},
year = {2024},
date = {2024-02-01},
urldate = {2024-07-21},
journal = {Heliyon},
volume = {10},
number = {4},
pages = {e26297},
abstract = {Over the past decade, there has been a notable surge in AI-driven research, specifically geared toward enhancing crucial clinical processes and outcomes. The potential of AI-powered decision support systems to streamline clinical workflows, assist in diagnostics, and enable personalized treatment is increasingly evident. Nevertheless, the introduction of these cutting-edge solutions poses substantial challenges in clinical and care environments, necessitating a thorough exploration of ethical, legal, and regulatory considerations.
A robust governance framework is imperative to foster the acceptance and successful implementation of AI in healthcare. This article delves deep into the critical ethical and regulatory concerns entangled with the deployment of AI systems in clinical practice. It not only provides a comprehensive overview of the role of AI technologies but also offers an insightful perspective on the ethical and regulatory challenges, making a pioneering contribution to the field.
This research aims to address the current challenges in digital healthcare by presenting valuable recommendations for all stakeholders eager to advance the development and implementation of innovative AI systems.},
keywords = {Artificial Intelligence, Decision-Making, Ethics, Healthcare, Regulatory guidelines, Technologies},
pubstate = {published},
tppubtype = {article}
}
A robust governance framework is imperative to foster the acceptance and successful implementation of AI in healthcare. This article delves deep into the critical ethical and regulatory concerns entangled with the deployment of AI systems in clinical practice. It not only provides a comprehensive overview of the role of AI technologies but also offers an insightful perspective on the ethical and regulatory challenges, making a pioneering contribution to the field.
This research aims to address the current challenges in digital healthcare by presenting valuable recommendations for all stakeholders eager to advance the development and implementation of innovative AI systems.
Agnolucci, Lorenzo; Galteri, Leonardo; Bertini, Marco; Bimbo, Alberto Del
Arniqa: Learning distortion manifold for image quality assessment Proceedings Article
In: Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision, pp. 189–198, 2024, (tex.copyright: All rights reserved).
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Computer Vision and Pattern Recognition, Image Representation, No-Reference Image Quality Assessment (NR-IQA), Quality Assessment
@inproceedings{agnolucciArniqaLearningDistortion2024,
title = {Arniqa: Learning distortion manifold for image quality assessment},
author = {Lorenzo Agnolucci and Leonardo Galteri and Marco Bertini and Alberto Del Bimbo},
url = {https://openaccess.thecvf.com/content/WACV2024/papers/Agnolucci_ARNIQA_Learning_Distortion_Manifold_for_Image_Quality_Assessment_WACV_2024_paper.pdf},
doi = {10.1109/WACV57701.2024.00026},
year = {2024},
date = {2024-01-01},
booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision},
pages = {189–198},
abstract = {No-Reference Image Quality Assessment (NR-IQA) aims to develop methods to measure image quality in alignment with human perception without the need for a high-quality reference image. In this work, we propose a self-supervised approach named ARNIQA (leArning distoRtion maNifold for Image Quality Assessment) for modeling the image distortion manifold to obtain quality representations in an intrinsic manner. First, we introduce an image degradation model that randomly composes ordered sequences of consecutively applied distortions. In this way, we can synthetically degrade images with a large variety of degradation patterns. Second, we propose to train our model by maximizing the similarity between the representations of patches of different images distorted equally, despite varying content. Thus, images degraded in the same manner correspond to neighboring positions within the distortion manifold. Finally, we map the image representations to the quality scores with a simple linear regressor, thus without fine-tuning the encoder weights. The experiments show that our approach achieves state-of-the-art performance on several datasets. In addition, ARNIQA demonstrates improved data efficiency, generalization capabilities, and robustness compared to competing methods. The code and the model are publicly available at https://github. com/miccunifi/ARNIQA.},
note = {tex.copyright: All rights reserved},
keywords = {Artificial Intelligence, Computer Vision and Pattern Recognition, Image Representation, No-Reference Image Quality Assessment (NR-IQA), Quality Assessment},
pubstate = {published},
tppubtype = {inproceedings}
}
Agnolucci, Lorenzo; Galteri, Leonardo; Bertini, Marco; Bimbo, Alberto Del
Reference-based restoration of digitized analog videotapes Proceedings Article
In: Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision, pp. 1659–1668, 2024, (tex.copyright: All rights reserved).
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Compression Artifact Removal, Computer Vision and Pattern Recognition, Digital Archiving, Image Processing, Transformer Networks
@inproceedings{agnolucciReferencebasedRestorationDigitized2024,
title = {Reference-based restoration of digitized analog videotapes},
author = {Lorenzo Agnolucci and Leonardo Galteri and Marco Bertini and Alberto Del Bimbo},
url = {https://openaccess.thecvf.com/content/WACV2024/papers/Agnolucci_Reference-Based_Restoration_of_Digitized_Analog_Videotapes_WACV_2024_paper.pdf},
doi = {10.1109/WACV57701.2024.00168},
year = {2024},
date = {2024-01-01},
booktitle = {Proceedings of the IEEE/CVF Winter Conference on Applications of Computer Vision},
pages = {1659–1668},
abstract = {Analog magnetic tapes have been the main video data storage device for several decades. Videos stored on analog videotapes exhibit unique degradation patterns caused by tape aging and reader device malfunctioning that are different from those observed in film and digital video restoration tasks. In this work, we present a reference-based approach for the resToration of digitized Analog videotaPEs (TAPE). We leverage CLIP for zero-shot artifact detection to identify the cleanest frames of each video through textual prompts describing different artifacts. Then, we select the clean frames most similar to the input ones and employ them as references. We design a transformer-based Swin-UNet network that exploits both neighboring and reference frames via our Multi-Reference Spatial Feature Fusion (MRSFF) blocks. MRSFF blocks rely on cross-attention and attention pooling to take advantage of the most useful parts of each reference frame. To address the absence of ground truth in real-world videos, we create a synthetic dataset of videos exhibiting artifacts that closely resemble those commonly found in analog videotapes. Both quantitative and qualitative experiments show the effectiveness of our approach compared to other state-of-the-art methods. The code, the model, and the synthetic dataset are publicly available at https://github.com/miccunifi/TAPE.},
note = {tex.copyright: All rights reserved},
keywords = {Artificial Intelligence, Compression Artifact Removal, Computer Vision and Pattern Recognition, Digital Archiving, Image Processing, Transformer Networks},
pubstate = {published},
tppubtype = {inproceedings}
}
Barbareschi, Mario; Barone, Salvatore
Investigating the Resilience Source of Classification Systems for Approximate Computing Techniques Journal Article
In: IEEE Transactions on Emerging Topics in Computing, pp. 12, 2024, ISSN: 2168-6750.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Classification systems, Neural networks, Tree Ensemble
@article{barbareschi_investigating_2024,
title = {Investigating the Resilience Source of Classification Systems for Approximate Computing Techniques},
author = {Mario Barbareschi and Salvatore Barone},
url = {https://ieeexplore.ieee.org/document/10542568},
doi = {10.1109/TETC.2024.3403757},
issn = {2168-6750},
year = {2024},
date = {2024-01-01},
journal = {IEEE Transactions on Emerging Topics in Computing},
pages = {12},
abstract = {During the last decade, classification systems (CSs) received significant research attention, with new learning algorithms achieving high accuracy in various applications. However, their resource-intensive nature, in terms of hardware and computation time, poses new design challenges.
CSs exhibit inherent error resilience, due to redundancy of training sets, and self-healing properties, making them suitable for Approximate Computing (AxC).
AxC enables efficient computation by using reduced precision or approximate values, leading to energy, time, and silicon area savings.
Exploiting AxC involves estimating the introduced error for each approximate variant found during a Design-Space Exploration (DSE). This estimation has to be both rapid and meaningful, considering a substantial number of test samples, which are utterly conflicting demands.
In this paper, we investigate on sources of error resiliency of CSs, and we propose a technique to haste the DSE that reduces the computational time for error estimation by systematically reducing the test set. In particular, we cherry-pick samples that are likely to be more sensitive to approximation and perform accuracy-loss estimation just by exploiting such a sample subset.
In order to demonstrate its efficacy, we integrate our technique into two different approaches for generating approximate CSs, showing an average speed-up up to approx18.},
keywords = {Artificial Intelligence, Classification systems, Neural networks, Tree Ensemble},
pubstate = {published},
tppubtype = {article}
}
CSs exhibit inherent error resilience, due to redundancy of training sets, and self-healing properties, making them suitable for Approximate Computing (AxC).
AxC enables efficient computation by using reduced precision or approximate values, leading to energy, time, and silicon area savings.
Exploiting AxC involves estimating the introduced error for each approximate variant found during a Design-Space Exploration (DSE). This estimation has to be both rapid and meaningful, considering a substantial number of test samples, which are utterly conflicting demands.
In this paper, we investigate on sources of error resiliency of CSs, and we propose a technique to haste the DSE that reduces the computational time for error estimation by systematically reducing the test set. In particular, we cherry-pick samples that are likely to be more sensitive to approximation and perform accuracy-loss estimation just by exploiting such a sample subset.
In order to demonstrate its efficacy, we integrate our technique into two different approaches for generating approximate CSs, showing an average speed-up up to approx18.
Ferraro, Antonino; Galli, Antonio; Gatta, Valerio La; Minocchi, Mario; Moscato, Vincenzo; Postiglione, Marco
Few Shot NER on Augmented Unstructured Text from Cardiology Records Book Section
In: Barolli, Leonard (Ed.): Advances in Internet, Data & Web Technologies, vol. 193, pp. 1–12, Springer Nature Switzerland, Cham, 2024, ISBN: 978-3-031-53554-3 978-3-031-53555-0, (Series Title: Lecture Notes on Data Engineering and Communications Technologies).
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Data Augmentation, Healthcare, Named-Entity Recognition
@incollection{barolli_few_2024,
title = {Few Shot NER on Augmented Unstructured Text from Cardiology Records},
author = {Antonino Ferraro and Antonio Galli and Valerio La Gatta and Mario Minocchi and Vincenzo Moscato and Marco Postiglione},
editor = {Leonard Barolli},
url = {https://link.springer.com/10.1007/978-3-031-53555-0_1},
doi = {10.1007/978-3-031-53555-0_1},
isbn = {978-3-031-53554-3 978-3-031-53555-0},
year = {2024},
date = {2024-01-01},
urldate = {2024-07-12},
booktitle = {Advances in Internet, Data & Web Technologies},
volume = {193},
pages = {1–12},
publisher = {Springer Nature Switzerland},
address = {Cham},
abstract = {The principal challenge encountered in the realm of Named-Entity Recognition lies in the acquisition of high-caliber annotated data. In certain languages and specialized domains, the availability of substantial datasets suitable for training models via traditional machine learning methodologies can prove to be a formidable obstacle [10]. In an effort to address this issue, we have explored a Policy-based Active Learning approach aimed at meticulously selecting the most advantageous instances generated through a Data Augmentation procedure [3, 6]. This endeavor was undertaken within the context of a few-shot scenario in the biomedical field. Our study has revealed the superiority of this strategy in comparison to active learning techniques relying on fixed metrics or random instance selection, guaranteeing the privacy of patients from whose medical records the source data were obtained and used. However, it is imperative to note that this approach entails heightened computational demands and necessitates a longer execution duration [7].},
note = {Series Title: Lecture Notes on Data Engineering and Communications Technologies},
keywords = {Artificial Intelligence, Data Augmentation, Healthcare, Named-Entity Recognition},
pubstate = {published},
tppubtype = {incollection}
}
Agnolucci, Lorenzo; Galteri, Leonardo; Bertini, Marco
Quality-Aware Image-Text Alignment for Real-World Image Quality Assessment Journal Article
In: arXiv preprint arXiv:2403.11176, 2024, (arXiv: 2403.11176 tex.copyright: All rights reserved).
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Computer Vision and Pattern Recognition, Image Processing, Quality Assessment, Self-Supervised Learning, Vision and Language
@article{agnolucciQualityAwareImageTextAlignment2024,
title = {Quality-Aware Image-Text Alignment for Real-World Image Quality Assessment},
author = {Lorenzo Agnolucci and Leonardo Galteri and Marco Bertini},
url = {https://arxiv.org/abs/2403.11176},
doi = {10.48550/ARXIV.2403.11176},
year = {2024},
date = {2024-01-01},
journal = {arXiv preprint arXiv:2403.11176},
abstract = {No-Reference Image Quality Assessment (NR-IQA) focuses on designing methods to measure image quality in alignment with human perception when a high-quality reference image is unavailable. The reliance on annotated Mean Opinion Scores (MOS) in the majority of state-of-the-art NR-IQA approaches limits their scalability and broader applicability to real-world scenarios. To overcome this limitation, we propose QualiCLIP (Quality-aware CLIP), a CLIP-based self-supervised opinion-unaware method that does not require labeled MOS. In particular, we introduce a quality-aware image-text alignment strategy to make CLIP generate representations that correlate with the inherent quality of the images. Starting from pristine images, we synthetically degrade them with increasing levels of intensity. Then, we train CLIP to rank these degraded images based on their similarity to quality-related antonym text prompts, while guaranteeing consistent representations for images with comparable quality. Our method achieves state-of-the-art performance on several datasets with authentic distortions. Moreover, despite not requiring MOS, QualiCLIP outperforms supervised methods when their training dataset differs from the testing one, thus proving to be more suitable for real-world scenarios. Furthermore, our approach demonstrates greater robustness and improved explainability than competing methods. The code and the model are publicly available at https://github.com/miccunifi/QualiCLIP.},
note = {arXiv: 2403.11176
tex.copyright: All rights reserved},
keywords = {Artificial Intelligence, Computer Vision and Pattern Recognition, Image Processing, Quality Assessment, Self-Supervised Learning, Vision and Language},
pubstate = {published},
tppubtype = {article}
}
Mengoni, Maura; Ceccacci, Silvia; Generosi, Andrea
Emotion Recognition and Affective Computing Book Section
In: Interaction Techniques and Technologies in Human-Computer Interaction, CRC Press, 2024, ISBN: 9781003490678.
Abstract | BibTeX | Tags: Artificial Intelligence, Computer Vision and Pattern Recognition, Deep Learning, Emotion Recognition
@incollection{mengoni_emotion_2024,
title = {Emotion Recognition and Affective Computing},
author = {Maura Mengoni and Silvia Ceccacci and Andrea Generosi},
isbn = {9781003490678},
year = {2024},
date = {2024-01-01},
booktitle = {Interaction Techniques and Technologies in Human-Computer Interaction},
publisher = {CRC Press},
abstract = {This chapter explores the challenging topic of emotion recognition by affective computing. The importance of considering and understanding people’s emotions in interaction design is discussed, focusing on the role of human emotions in the entire life cycle of human–system interaction as a means to innovate products and services. The measurement of emotions is also analyzed, including the classification of human emotions and recognition methods, as well as current techniques for measuring emotional responses. An emotional-based approach and related technologies are considered in managing the entire life cycle of human–system interaction as an innovation driver. This chapter also presents how to use affective computing in cross-transversal applications, concentrating on potential applications and different case studies. This chapter concludes with a look towards a world of emotional intelligence, where affective computing plays a crucial role in collecting and analyzing emotional data to support innovative product and service experiences.},
keywords = {Artificial Intelligence, Computer Vision and Pattern Recognition, Deep Learning, Emotion Recognition},
pubstate = {published},
tppubtype = {incollection}
}
Generosi, Andrea; Villafan, Josè Yuri; Montanari, Roberto; Mengoni, Maura
A Multimodal Approach to Understand Driver’s Distraction for DMS Proceedings Article
In: Antona, Margherita; Stephanidis, Constantine (Ed.): Universal Access in Human-Computer Interaction, pp. 250–270, Springer Nature Switzerland, Cham, 2024, ISBN: 9783031608759.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Computer Vision and Pattern Recognition, Deep Learning, Human Computer Interaction
@inproceedings{generosi_multimodal_2024,
title = {A Multimodal Approach to Understand Driver’s Distraction for DMS},
author = {Andrea Generosi and Josè Yuri Villafan and Roberto Montanari and Maura Mengoni},
editor = {Margherita Antona and Constantine Stephanidis},
doi = {10.1007/978-3-031-60875-9_17},
isbn = {9783031608759},
year = {2024},
date = {2024-01-01},
booktitle = {Universal Access in Human-Computer Interaction},
pages = {250–270},
publisher = {Springer Nature Switzerland},
address = {Cham},
abstract = {This study introduces a multimodal approach for enhancing the accuracy of Driver Monitoring Systems (DMS) in detecting driver distraction. By integrating data from vehicle control units with vision-based information, the research aims to address the limitations of current DMS. The experimental setup involves a driving simulator and advanced computer vision, deep learning technologies for facial expression recognition, and head rotation analysis. The findings suggest that combining various data types—behavioral, physiological, and emotional—can significantly improve DMS’s predictive capability. This research contributes to the development of more sophisticated, adaptive, and real-time systems for improving driver safety and advancing autonomous driving technologies.},
keywords = {Artificial Intelligence, Computer Vision and Pattern Recognition, Deep Learning, Human Computer Interaction},
pubstate = {published},
tppubtype = {inproceedings}
}
Scannapieco, Simone; Tomazzoli, Claudio
Cnosso, a Novel Method for Business Document Automation Based on Open Information Extraction Journal Article
In: Expert Systems with Applications, vol. 245, pp. 123038, 2024, ISSN: 0957-4174.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Document automation, Information Extraction, Natural language analysis, Natural Language Processing, Semantic Role Labeling
@article{scannapieco_cnosso_2024,
title = {Cnosso, a Novel Method for Business Document Automation Based on Open Information Extraction},
author = {Simone Scannapieco and Claudio Tomazzoli},
url = {https://www.sciencedirect.com/science/article/pii/S0957417423035406},
doi = {10.1016/j.eswa.2023.123038},
issn = {0957-4174},
year = {2024},
date = {2024-01-01},
journal = {Expert Systems with Applications},
volume = {245},
pages = {123038},
abstract = {The state-of-the-art in automated processing of unstructured business documents has evolved from manual labor to advanced AI systems in the span of mere decades. Such systems involve learning techniques, rule or clause sets, neural models – either used alone or in combination – for the extraction to work. As an example, rule-based processes operate on a perceived layout or positioning of the information, whereas model-based frameworks adopt a semantic, and often uninspectable, approach. Verb-Based Semantic Role Labeling (VBSRL) is a novel system presented in a former paper that uses a hybrid foundation to inform the extraction phase via a set of rules modeling natural language. We propose a new VBSRL-based document processing method, aided by valuable and innovative architectural choices, which has been implemented for the Italian language and experimented upon with promising results. Even in its infancy, in fact, the first implementation of this system shows better results than comparable IE solutions, obtaining an aggregate, average F-measure of nearly 79%.},
keywords = {Artificial Intelligence, Document automation, Information Extraction, Natural language analysis, Natural Language Processing, Semantic Role Labeling},
pubstate = {published},
tppubtype = {article}
}
Tomazzoli, Claudio; Ponza, Andrea; Cristani, Matteo; Olivieri, Francesco; Scannapieco, Simone
A Cobot in the Vineyard: Computer Vision for Smart Chemicals Spraying Journal Article
In: Applied Sciences, vol. 14, no. 9, 2024, ISSN: 2076-3417.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Collaborative robotic, Computer vision, Cyber-Physical Systems, Deep Learning, Machine Learning, Precision agriculture
@article{tomazzoli_cobot_2024,
title = {A Cobot in the Vineyard: Computer Vision for Smart Chemicals Spraying},
author = {Claudio Tomazzoli and Andrea Ponza and Matteo Cristani and Francesco Olivieri and Simone Scannapieco},
url = {https://www.mdpi.com/2076-3417/14/9/3777},
doi = {10.3390/app14093777},
issn = {2076-3417},
year = {2024},
date = {2024-01-01},
journal = {Applied Sciences},
volume = {14},
number = {9},
abstract = {Precision agriculture (PA) is a management concept that makes use of digital techniques to monitor and optimise agricultural production processes and represents a field of growing economic and social importance. Within this area of knowledge, there is a topic not yet fully explored: outlining a road map towards the definition of an affordable cobot solution (i.e., a low-cost robot able to safely coexist with humans) able to perform automatic chemical treatments. The present study narrows its scope to viticulture technologies, and targets small/medium-sized winemakers and producers, for whom innovative technological advancements in the production chain are often precluded by financial factors. The aim is to detail the realization of such an integrated solution and to discuss the promising results achieved. The results of this study are: (i) The definition of a methodology for integrating a cobot in the process of grape chemicals spraying under the constraints of a low-cost apparatus; (ii) the realization of a proof-of-concept of such a cobotic system; (iii) the experimental analysis of the visual apparatus of this system in an indoor and outdoor controlled environment as well as in the field.},
keywords = {Artificial Intelligence, Collaborative robotic, Computer vision, Cyber-Physical Systems, Deep Learning, Machine Learning, Precision agriculture},
pubstate = {published},
tppubtype = {article}
}
Workneh, Tewabe Chekole; Cristani, Matteo; Tomazzoli, Claudio
Assessing the Impact of Climate Change on Mineral-Associated Organic Carbon (MAOC) Using Machine Learning Models Proceedings Article
In: pp. 35–47, 2024.
Abstract | Links | BibTeX | Tags: Machine Learning, Mineral-associated organic carbon, Predictive Models
@inproceedings{workneh_assessing_2024,
title = {Assessing the Impact of Climate Change on Mineral-Associated Organic Carbon (MAOC) Using Machine Learning Models},
author = {Tewabe Chekole Workneh and Matteo Cristani and Claudio Tomazzoli},
url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-85214791497&partnerID=40&md5=5a2e249e0da0fd4f9571af2bc00696ca},
year = {2024},
date = {2024-01-01},
volume = {3883},
pages = {35–47},
series = {CEUR Workshop Proceedings},
abstract = {This study examines the impact of climate change on Soil Organic Carbon (SOC) stocks, with a particular focus on Mineral-Associated Organic Carbon (MAOC)—a stable fraction of soil organic matter critical for long-term carbon sequestration. This study aims to develop a predictive tool for estimating MAOC at a finer spatial resolution, addressing gaps in current models and enabling cost-effective climate change mitigation strategies. Using an extensive dataset from the Zenodo repository, augmented with detailed meteorological data, machine learning techniques were employed—specifically, the Random Forest (RF) Regressor and Support Vector Machine (SVM) Regressor. The RF model not only outperformed the SVM in predictive accuracy but also identified key factors influencing MAOC content under various climate change scenarios. These findings deepen our understanding of soil carbon sequestration potential in future climate conditions, offering actionable insights for sustainable soil management and cost-effective climate change mitigation strategies. textbackslashcopyright 2024 Copyright for this paper by its authors.},
keywords = {Machine Learning, Mineral-associated organic carbon, Predictive Models},
pubstate = {published},
tppubtype = {inproceedings}
}
2023
Mennella, Ciro; Maniscalco, Umberto; Pietro, Giuseppe De; Esposito, Massimo
In: Computers in Biology and Medicine, vol. 167, pp. 107665, 2023, ISSN: 00104825.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Generative algorithms, Rehabilitation, Synthetic data
@article{mennella_generating_2023,
title = {Generating a novel synthetic dataset for rehabilitation exercises using pose-guided conditioned diffusion models: A quantitative and qualitative evaluation},
author = {Ciro Mennella and Umberto Maniscalco and Giuseppe De Pietro and Massimo Esposito},
url = {https://linkinghub.elsevier.com/retrieve/pii/S0010482523011307},
doi = {10.1016/j.compbiomed.2023.107665},
issn = {00104825},
year = {2023},
date = {2023-12-01},
urldate = {2024-07-21},
journal = {Computers in Biology and Medicine},
volume = {167},
pages = {107665},
abstract = {Machine learning has emerged as a promising approach to enhance rehabilitation therapy monitoring and evaluation, providing personalized insights. However, the scarcity of data remains a significant challenge in developing robust machine learning models for rehabilitation.
This paper introduces a novel synthetic dataset for rehabilitation exercises, leveraging pose-guided person image generation using conditioned diffusion models. By processing a pre-labeled dataset of class movements for 6 rehabilitation exercises, the described method generates realistic human movement images of elderly subjects engaging in home-based exercises.
A total of 22,352 images were generated to accurately capture the spatial consistency of human joint relationships for predefined exercise movements. This novel dataset significantly amplified variability in the physical and demographic attributes of the main subject and the background environment. Quantitative metrics used for image assessment revealed highly favorable results. The generated images successfully maintained intra-class and inter-class consistency in motion data, producing outstanding outcomes with distance correlation values exceeding the 0.90.
This innovative approach empowers researchers to enhance the value of existing limited datasets by generating high-fidelity synthetic images that precisely augment the anthropometric and biomechanical attributes of individuals engaged in rehabilitation exercises.},
keywords = {Artificial Intelligence, Generative algorithms, Rehabilitation, Synthetic data},
pubstate = {published},
tppubtype = {article}
}
This paper introduces a novel synthetic dataset for rehabilitation exercises, leveraging pose-guided person image generation using conditioned diffusion models. By processing a pre-labeled dataset of class movements for 6 rehabilitation exercises, the described method generates realistic human movement images of elderly subjects engaging in home-based exercises.
A total of 22,352 images were generated to accurately capture the spatial consistency of human joint relationships for predefined exercise movements. This novel dataset significantly amplified variability in the physical and demographic attributes of the main subject and the background environment. Quantitative metrics used for image assessment revealed highly favorable results. The generated images successfully maintained intra-class and inter-class consistency in motion data, producing outstanding outcomes with distance correlation values exceeding the 0.90.
This innovative approach empowers researchers to enhance the value of existing limited datasets by generating high-fidelity synthetic images that precisely augment the anthropometric and biomechanical attributes of individuals engaged in rehabilitation exercises.
Russo, Raffaele; Giuseppe, Giuliano Di; Vanacore, Alessandro; Gatta, Valerio La; Ferraro, Antonino; Galli, Antonio; Postiglione, Marco; Moscato, Vincenzo
Graph-Based Approach for European Law Classification Proceedings Article
In: 2023 IEEE International Conference on Big Data (BigData), pp. 1–9, IEEE, Sorrento, Italy, 2023, ISBN: 9798350324457.
Abstract | Links | BibTeX | Tags: Artificial Intelligence, Semantics
@inproceedings{russo_graph-based_2023,
title = {Graph-Based Approach for European Law Classification},
author = {Raffaele Russo and Giuliano Di Giuseppe and Alessandro Vanacore and Valerio La Gatta and Antonino Ferraro and Antonio Galli and Marco Postiglione and Vincenzo Moscato},
url = {https://ieeexplore.ieee.org/document/10386684/},
doi = {10.1109/BigData59044.2023.10386684},
isbn = {9798350324457},
year = {2023},
date = {2023-12-01},
urldate = {2024-07-12},
booktitle = {2023 IEEE International Conference on Big Data (BigData)},
pages = {1–9},
publisher = {IEEE},
address = {Sorrento, Italy},
abstract = {Deep learning, owing to its transformative influence across a myriad of sectors, has recently made its foray into the legal domain, instigated by the surge in digitization. Among the multitude of applications in this space, legal document classification emerges as a pivotal yet complex undertaking. Legal texts, characterized by unique domain-centric semantics and intricate linguistic patterns, necessitate precision-driven classification systems for numerous practical implications. This paper illuminates the challenges and opportunities in automating the classification of European Union (EU) legal documents, emphasizing the interrelationships among statutes and the hierarchical nature of legal references. In this context, we introduce a novel graph data modeling technique that adeptly marries content-centric indicators with the relational dynamics inherent among diverse legal documents. Central to our approach is a framework that melds text embeddings with graph neural networks for the classification of legal documents aligned with their subject-based directories. Empirical evaluations on the EU law dataset underline the efficacy of our model across varying granularities, from general thematic categories to intricate subtopics. This endeavor not only augments the comprehensibility and accessibility of EU jurisprudence but also holds significant implications across regulatory compliance, legal research, and policy formulation, underscoring the potential of deep learning in reshaping legal paradigms.},
keywords = {Artificial Intelligence, Semantics},
pubstate = {published},
tppubtype = {inproceedings}
}