@Article{Schiavon2026,
author={Schiavon, Jo{\~a}o Paulo and Castro, M{\'a}rcio and Carvalho, J{\^o}nata Tyska},
title={Ensemble-based Anomaly Detection in Brazilian Parliamentary Expenses using Unlabeled Public Data},
journal={International Journal of Data Science and Analytics},
year={2026},
month={Apr},
day={16},
volume={22},
number={1},
pages={139},
abstract={The rapid growth of digital information offers both opportunities and challenges for monitoring public resource usage. In Brazil, members of the National Congress receive monthly allowances for reimbursable expenses, but manual oversight of this spending is inefficient and error-prone. This work introduces an unsupervised methodology that integrates an ensemble of six machine learning techniques to detect anomalies in parliamentary expenses using unlabeled government data. To guide model training, we leverage six datasets from the ADBench framework, a comprehensive anomaly detection benchmark comprising multiple datasets, selected for their similarity to the target domain. To evaluate the proposed approach, we propose four new real-world unlabeled datasets, which are collectively named the Brazilian Parliamentary Expenses Datasets, obtained from official reimbursement records of the Brazilian Quota for Parliamentary Activity. Results demonstrate that combining multiple anomaly detection methods enhances precision and robustness in identifying irregular expenditures, advancing transparency and accountability in public administration. Moreover, the proposed approach helps prioritize oversight efforts by directing investigations toward cases with a higher probability of irregular behavior.},
issn={2364-4168},
doi={10.1007/s41060-026-01079-9},
url={https://doi.org/10.1007/s41060-026-01079-9}
}
