@inbook{89edffcd752748a98bd08169212902ae,
title = "Towards Trust-Based Data Weighting in Machine Learning",
abstract = "In distributed environments, data for Machine Learning (ML) applications may be generated from numerous sources and devices, and traverse a cloud-edge continuum via a variety of protocols, using multiple security schemes and equipment types. While ML models typically benefit from using large training sets, not all data can be equally trusted. In this work, we examine data trust as a factor in creating ML models, and explore an approach using annotated trust metadata to contribute to data weighting in generating ML models. We assess the feasibility of this approach using well-known datasets for both linear regression and classification problems, demonstrating the benefit of including trust as a factor when using heterogeneous datasets. We discuss the potential benefits of this approach, and the opportunity it presents for improved data utilisation and processing.",
keywords = "clustering, data confidence fabric, data weighting, edge computing, linear regression, machine learning",
author = "Murphy, \{Sean Og\} and Utz Roedig and Sreenan, \{Cormac J.\} and Ahmed Khalid",
note = "Publisher Copyright: {\textcopyright} 2023 IEEE.; 31st IEEE International Conference on Network Protocols, ICNP 2023 ; Conference date: 10-10-2023 Through 13-10-2023",
year = "2023",
doi = "10.1109/ICNP59255.2023.10355606",
language = "English",
series = "Proceedings - International Conference on Network Protocols, ICNP",
publisher = "IEEE Computer Society",
booktitle = "2023 IEEE 31st International Conference on Network Protocols, ICNP 2023",
address = "United States",
}