% Conference paper in the ECBS 2023 proceedings (see booktitle and series below).
% The opaque citation key is kept unchanged so existing citations keep resolving.
% The publisher value carries an extra brace pair so that list-aware processors
% do not split it at the literal " and " inside the company name.
@inproceedings{fbf95005a9a04425a4c5139a283f21bc,
  author    = {Singh, Amandeep and Minguett, Olga},
  title     = {{IDPP}: Imbalanced Datasets Pipelines in {Pyrus}},
  booktitle = {Engineering of Computer-Based Systems -- 8th International Conference, {ECBS} 2023, Proceedings},
  editor    = {Kofro{\v{n}}, Jan and Margaria, Tiziana and Seceleanu, Cristina},
  series    = {Lecture Notes in Computer Science},
  publisher = {{Springer Science and Business Media Deutschland GmbH}},
  year      = {2024},
  pages     = {60--69},
  doi       = {10.1007/978-3-031-49252-5_6},
  isbn      = {9783031492518},
  language  = {English},
  keywords  = {AI/ML-systems, data resampling techniques, imbalanced medical datasets, Low-code, Pyrus, Responsible AI},
  abstract  = {We showcase and demonstrate IDPP, a Pyrus-based tool that offers a collection of pipelines for the analysis of imbalanced datasets. Like Pyrus, IDPP is a web-based, low-code/no-code graphical modelling environment for ML and data analytics applications. On a case study from the medical domain, we solve the challenge of re-using AI/ML models that do not address data with imbalanced class by implementing ML algorithms in Python that do the re-balancing. We then use these algorithms and the original ML models in the IDPP pipelines. With IDPP, our low-code development approach to balance datasets for AI/ML applications can be used by non-coders. It simplifies the data-preprocessing stage of any AI/ML project pipeline, which can potentially improve the performance of the models. The tool demo will showcase the low-code implementation and no-code reuse and repurposing of AI-based systems through end-to end Pyrus pipelines.},
  note      = {Publisher Copyright: {\textcopyright} 2024, The Author(s), under exclusive license to Springer Nature Switzerland AG.; 8th International Conference on Engineering of Computer-Based Systems, ECBS 2023 ; Conference date: 16-10-2023 Through 18-10-2023},
}