@article{M9826FF40, title = "Anomaly Detection in Mammography Data using Dimensionality Reduction and DBSCAN Clustering for Enhancing Diagnostic Model Performance", journal = "Journal of KIISE, JOK", year = "2025", issn = "2383-630X", doi = "10.5626/JOK.2025.52.9.787", author = "Donghee Kim, Jaeil Kim", keywords = "mammography data, anomaly detection, autoencoder, dimensionality reduction, DBSCAN clustering", abstract = "This study introduces a data cleaning technique for identifying and removing anomalous images from mammography data. An autoencoder extracts low-dimensional latent features, which are then refined through dimensionality reduction (methods such as PCA, t-SNE, and Isomap) to highlight irregular patterns. DBSCAN clustering is subsequently employed to detect anomalies. An ablation study confirmed that dimensionality reduction enhances anomaly detection, and the impact of anomaly removal on model training was assessed. Results indicate that the combination of t-SNE and DBSCAN yields superior performance, with the refined model demonstrating significant improvements in accuracy and sensitivity. These findings enhance the reliability of AI-based breast cancer diagnosis and present a promising pre-processing method for medical imaging." }