@article{article_1672180, title={COUGH SOUND ANALYSIS WITH DEEP LEARNING: THE IMPACT OF DATA AUGMENTATION ON RESPIRATORY DISEASE CLASSIFICATION}, journal={Mühendislik Bilimleri ve Tasarım Dergisi}, volume={13}, pages={896–910}, year={2025}, author={Türkçetin, Ayşen Özün and Koç, Turgay and Cilekar, Sule}, keywords={Cough Sound Analysis, Lung Diseases, Deep Learning Models, Data Augmentation, Convolution Neural Network, Cross Validation, Imbalanced Data}, abstract={Respiratory diseases affect millions globally, necessitating efficient and early diagnostic tools to mitigate complications. This study proposes a robust and systematic approach for classifying asthma, COPD, pneumonia, and healthy conditions using cough sound analysis. Mel-frequency cepstral coefficients (MFCCs) were extracted and used to train both a deep learning model (CNN) and traditional classifiers (Random Forest, SVM) under limited and imbalanced data conditions. A major focus was on evaluating the impact of data augmentation and model choice on classification performance. Initial results showed that traditional models outperformed the CNN due to overfitting. However, with progressive augmentation up to 800 synthetic samples per class and the use of Dice Loss, the CNN model achieved substantial improvements, reaching 84% accuracy and a Macro F1 Score of 69%. These results highlight the critical role of data augmentation and tailored training strategies in enhancing the performance of deep learning models for audio-based biomedical classification tasks.}, number={3}, publisher={Süleyman Demirel University}