<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.4 20241031//EN"
        "https://jats.nlm.nih.gov/publishing/1.4/JATS-journalpublishing1-4.dtd">
<article  article-type="research-article"        dtd-version="1.4">
            <front>

                <journal-meta>
                                    <journal-id></journal-id>
            <journal-title-group>
                                                                                    <journal-title>Balkan Journal of Electrical and Computer Engineering</journal-title>
            </journal-title-group>
                            <issn pub-type="ppub">2147-284X</issn>
                                        <issn pub-type="epub">2147-284X</issn>
                                                                                            <publisher>
                    <publisher-name>MUSA YILMAZ</publisher-name>
                </publisher>
                    </journal-meta>
                <article-meta>
                                        <article-id pub-id-type="doi">10.17694/bajece.1691905</article-id>
                                                                <article-categories>
                                            <subj-group  xml:lang="en">
                                                            <subject>Electrical Engineering (Other)</subject>
                                                    </subj-group>
                                            <subj-group  xml:lang="tr">
                                                            <subject>Elektrik Mühendisliği (Diğer)</subject>
                                                    </subj-group>
                                    </article-categories>
                                                                                                                                                        <title-group>
                                                                                                                        <article-title>Heart Attack Classification with a Machine Learning Approach Based on the Random Forest Algorithm</article-title>
                                                                                                                                                                                                <trans-title-group xml:lang="tr">
                                    <trans-title>Random Forest Algoritmasına Dayalı Makine Öğrenmesi Yaklaşımıyla Kalp Krizi Sınıflandırması</trans-title>
                                </trans-title-group>
                                                                                                    </title-group>
            
                                                    <contrib-group content-type="authors">
                                                                        <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0002-4564-8076</contrib-id>
                                                                <name>
                                    <surname>Dal</surname>
                                    <given-names>Süleyman</given-names>
                                </name>
                                                                    <aff>BATMAN ÜNİVERSİTESİ</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0002-4893-6014</contrib-id>
                                                                <name>
                                    <surname>Sezgin</surname>
                                    <given-names>Necmettin</given-names>
                                </name>
                                                                    <aff>BATMAN ÜNİVERSİTESİ</aff>
                                                            </contrib>
                                                                                </contrib-group>
                        
                                        <pub-date pub-type="pub" iso-8601-date="20250630">
                    <day>06</day>
                    <month>30</month>
                    <year>2025</year>
                </pub-date>
                                        <volume>13</volume>
                                        <issue>2</issue>
                                        <fpage>140</fpage>
                                        <lpage>147</lpage>
                        
                        <history>
                                    <date date-type="received" iso-8601-date="20250505">
                        <day>05</day>
                        <month>05</month>
                        <year>2025</year>
                    </date>
                                                    <date date-type="accepted" iso-8601-date="20250515">
                        <day>05</day>
                        <month>15</month>
                        <year>2025</year>
                    </date>
                            </history>
                                        <permissions>
                    <copyright-statement>Copyright © 2013, Balkan Journal of Electrical and Computer Engineering</copyright-statement>
                    <copyright-year>2013</copyright-year>
                    <copyright-holder>Balkan Journal of Electrical and Computer Engineering</copyright-holder>
                </permissions>
            
                                                                                                <abstract><p>Heart attack diagnosis delays constitute a critical health problem that increases the risk of mortality. Timely and accurate identification of cardiac events is therefore essential to improve patient outcomes and reduce preventable deaths. This study aims to develop a random forest based classification model using the Heart Disease Classification dataset published on the Kaggle platform to support early diagnosis. This dataset consists of 1319 samples and 8 demographic, clinical and biochemical features for the diagnosis of heart disease. To evaluate the model’s reliability and generalizability, a 10-fold cross-validation technique was employed. Through this method, each data instance contributed to both training and testing phases, enabling a more stable and robust performance assessment. This approach also reduced the risk of overfitting and ensured more representative evaluation metrics. The performance of the model was evaluated with ROC curve, training-validation curves, confusion matrix. In the evaluation process, especially in Fold 6, 100% accuracy, precision, recall and F1 score were obtained and it was revealed that the model showed superior performance in the classification task. In addition, as a result of the feature importance analysis, it was determined that troponin, potassium (kcm) and age variables came to the forefront in the decision process. This study aims to fill an important gap in the literature in terms of both strong classification performance and interpretability in the field of machine learning models for heart attack diagnosis.</p></abstract>
                                                                                                                                    <trans-abstract xml:lang="tr">
                            <p>Kalp krizi tanısındaki gecikmeler, mortalite riskini artıran kritik bir sağlık sorunu oluşturmaktadır. Bu nedenle, kardiyak olayların zamanında ve doğru bir şekilde tanımlanması, hasta sonuçlarını iyileştirmek ve önlenebilir ölümleri azaltmak açısından büyük önem taşımaktadır. Bu çalışma, erken tanıyı desteklemek amacıyla Kaggle platformunda yayımlanan Kalp Hastalığı Sınıflandırma veri seti kullanılarak Random Forest tabanlı bir sınıflandırma modeli geliştirmeyi amaçlamaktadır. Bu veri seti, kalp hastalığı tanısı için 1319 örneklem ve 8 demografik, klinik ve biyokimyasal özelliği içermektedir. Modelin güvenilirliğini ve genellenebilirliğini değerlendirmek için 10 katlı çapraz doğrulama yöntemi kullanılmıştır. Bu yöntem sayesinde her bir veri örneği hem eğitim hem de test aşamalarına katkı sağlamış, böylece daha kararlı ve sağlam bir performans değerlendirmesi yapılmıştır. Aynı zamanda bu yaklaşım, aşırı öğrenme riskini azaltmış ve daha temsil edici değerlendirme metrikleri elde edilmesini sağlamıştır. Modelin performansı ROC eğrisi, eğitim-doğrulama eğrileri ve karışıklık matrisi ile değerlendirilmiştir. Değerlendirme sürecinde özellikle 6. katmanda %100 doğruluk, kesinlik, duyarlılık ve F1 skoru elde edilmiş; modelin sınıflandırma görevinde üstün performans sergilediği ortaya konmuştur. Ayrıca, özellik önem düzeyi analizi sonucunda troponin, potasyum (kcm) ve yaş değişkenlerinin karar verme sürecinde öne çıktığı belirlenmiştir. Bu çalışma, kalp krizi tanısına yönelik makine öğrenmesi modelleri alanında hem güçlü sınıflandırma performansı hem de yorumlanabilirlik açısından literatürde önemli bir boşluğu doldurmayı hedeflemektedir.</p></trans-abstract>
                                                            
            
                                                            <kwd-group>
                                                    <kwd>Heart Attack Classification</kwd>
                                                    <kwd>  Machine Learning</kwd>
                                                    <kwd>  Random Forest Algorithm</kwd>
                                                    <kwd>  Clinical Decision Support Systems</kwd>
                                            </kwd-group>
                                                        
                                                                            <kwd-group xml:lang="tr">
                                                    <kwd>Kalp Krizi Sınıflandırması</kwd>
                                                    <kwd>  Makine Öğrenmesi</kwd>
                                                    <kwd>  Random Forest Algoritması</kwd>
                                                    <kwd>  Klinik Karar Destek Sistemleri</kwd>
                                            </kwd-group>
                                                                                                        <funding-group specific-use="FundRef">
                    <award-group>
                                                    <funding-source>
                                <named-content content-type="funder_name">&quot;No funding</named-content>
                            </funding-source>
                                                                    </award-group>
                </funding-group>
                                </article-meta>
    </front>
    <back>
                            <ref-list>
                                    <ref id="ref1">
                        <label>1</label>
                        <mixed-citation publication-type="journal">[1]	H. F. El-Sofany, &quot;Predicting heart diseases using machine learning and different data classification techniques,&quot; IEEE Access, 2024.</mixed-citation>
                    </ref>
                                    <ref id="ref2">
                        <label>2</label>
                        <mixed-citation publication-type="journal">[2]	H. G. Enad and M. A. Mohammed, &quot;Cloud computing-based framework for heart disease classification using quantum machine learning approach,&quot; Journal of Intelligent Systems, vol. 33, no. 1, p. 20230261, 2024.</mixed-citation>
                    </ref>
                                    <ref id="ref3">
                        <label>3</label>
                        <mixed-citation publication-type="journal">[3]	T. A. Gaziano, A. Bitton, S. Anand, S. Abrahams-Gessel, and A. Murphy, &quot;Growing epidemic of coronary heart disease in low-and middle-income countries,&quot; Current problems in cardiology, vol. 35, no. 2, pp. 72-115, 2010.</mixed-citation>
                    </ref>
                                    <ref id="ref4">
                        <label>4</label>
                        <mixed-citation publication-type="journal">[4]	C. Gupta, A. Saha, N. S. Reddy, and U. D. Acharya, &quot;Cardiac Disease Prediction using Supervised Machine Learning Techniques,&quot; in Journal of physics: conference series, 2022, vol. 2161, no. 1: IOP Publishing, p. 012013.</mixed-citation>
                    </ref>
                                    <ref id="ref5">
                        <label>5</label>
                        <mixed-citation publication-type="journal">[5]	A. K. Dubey, A. K. Sinhal, and R. Sharma, &quot;Heart disease classification through crow intelligence optimization-based deep learning approach,&quot; International Journal of Information Technology, vol. 16, no. 3, pp. 1815-1830, 2024.</mixed-citation>
                    </ref>
                                    <ref id="ref6">
                        <label>6</label>
                        <mixed-citation publication-type="journal">[6]	R. Rajkumar, K. Anandakumar, and A. Bharathi, &quot;Coronary artery disease (CAD) prediction and classification-a survey,&quot; Breast Cancer, vol. 90, p. 94.35, 2006.</mixed-citation>
                    </ref>
                                    <ref id="ref7">
                        <label>7</label>
                        <mixed-citation publication-type="journal">[7]	P. Rani et al., &quot;An extensive review of machine learning and deep learning techniques on heart disease classification and prediction,&quot; Archives of Computational Methods in Engineering, vol. 31, no. 6, pp. 3331-3349, 2024.</mixed-citation>
                    </ref>
                                    <ref id="ref8">
                        <label>8</label>
                        <mixed-citation publication-type="journal">[8]	I. H. Sarker, &quot;Machine learning: Algorithms, real-world applications and research directions,&quot; SN computer science, vol. 2, no. 3, p. 160, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref9">
                        <label>9</label>
                        <mixed-citation publication-type="journal">[9]	Ö. F. Ertuğrul, S. Dal, Y. Hazar, and E. Aldemir, &quot;Determining relevant features in activity recognition via wearable sensors on the MYO Armband,&quot; Arabian Journal for Science and Engineering, vol. 45, pp. 10097-10113, 2020.</mixed-citation>
                    </ref>
                                    <ref id="ref10">
                        <label>10</label>
                        <mixed-citation publication-type="journal">[10]	L. Fraiwan, K. Lweesy, N. Khasawneh, H. Wenz, and H. Dickhaus, &quot;Automated sleep stage identification system based on time–frequency analysis of a single EEG channel and random forest classifier,&quot; Computer methods and programs in biomedicine, vol. 108, no. 1, pp. 10-19, 2012.</mixed-citation>
                    </ref>
                                    <ref id="ref11">
                        <label>11</label>
                        <mixed-citation publication-type="journal">[11]	D. R. Edla, K. Mangalorekar, G. Dhavalikar, and S. Dodia, &quot;Classification of EEG data for human mental state analysis using Random Forest Classifier,&quot; Procedia computer science, vol. 132, pp. 1523-1532, 2018.</mixed-citation>
                    </ref>
                                    <ref id="ref12">
                        <label>12</label>
                        <mixed-citation publication-type="journal">[12]	K. Natarajan et al., &quot;Efficient heart disease classification through stacked ensemble with optimized firefly feature selection,&quot; International Journal of Computational Intelligence Systems, vol. 17, no. 1, p. 174, 2024.</mixed-citation>
                    </ref>
                                    <ref id="ref13">
                        <label>13</label>
                        <mixed-citation publication-type="journal">[13]	B. Deekshatulu and P. Chandra, &quot;Classification of heart disease using k-nearest neighbor and genetic algorithm,&quot; Procedia technology, vol. 10, pp. 85-94, 2013.</mixed-citation>
                    </ref>
                                    <ref id="ref14">
                        <label>14</label>
                        <mixed-citation publication-type="journal">[14]	N. Kosaraju, S. R. Sankepally, and K. Mallikharjuna Rao, &quot;Categorical data: Need, encoding, selection of encoding method and its emergence in machine learning models—a practical review study on heart disease prediction dataset using pearson correlation,&quot; in Proceedings of International Conference on Data Science and Applications: ICDSA 2022, Volume 1, 2023: Springer, pp. 369-382.</mixed-citation>
                    </ref>
                                    <ref id="ref15">
                        <label>15</label>
                        <mixed-citation publication-type="journal">[15]	T. Amarbayasgalan, V.-H. Pham, N. Theera-Umpon, Y. Piao, and K. H. Ryu, &quot;An efficient prediction method for coronary heart disease risk based on two deep neural networks trained on well-ordered training datasets,&quot; IEEE Access, vol. 9, pp. 135210-135223, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref16">
                        <label>16</label>
                        <mixed-citation publication-type="journal">[16]	Y. Hazar and Ö. F. Ertuğrul, &quot;Process management in diabetes treatment by blending technique,&quot; Computers in Biology and Medicine, vol. 190, p. 110034, 2025.</mixed-citation>
                    </ref>
                                    <ref id="ref17">
                        <label>17</label>
                        <mixed-citation publication-type="journal">[17]	P. Soltanzadeh and M. Hashemzadeh, &quot;RCSMOTE: Range-Controlled synthetic minority over-sampling technique for handling the class imbalance problem,&quot; Information Sciences, vol. 542, pp. 92-111, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref18">
                        <label>18</label>
                        <mixed-citation publication-type="journal">[18]	N. V. Chawla, K. W. Bowyer, L. O. Hall, and W. P. Kegelmeyer, &quot;SMOTE: synthetic minority over-sampling technique,&quot; Journal of artificial intelligence research, vol. 16, pp. 321-357, 2002.</mixed-citation>
                    </ref>
                                    <ref id="ref19">
                        <label>19</label>
                        <mixed-citation publication-type="journal">[19]	S. Hegelich, &quot;Decision trees and random forests: Machine learning techniques to classify rare events,&quot; European policy analysis, vol. 2, no. 1, pp. 98-120, 2016.</mixed-citation>
                    </ref>
                                    <ref id="ref20">
                        <label>20</label>
                        <mixed-citation publication-type="journal">[20]	G. A. B. Suryanegara and M. D. Purbolaksono, &quot;Peningkatan Hasil Klasifikasi pada Algoritma Random Forest untuk Deteksi Pasien Penderita Diabetes Menggunakan Metode Normalisasi,&quot; Jurnal RESTI (Rekayasa Sistem Dan Teknologi Informasi), vol. 5, no. 1, pp. 114-122, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref21">
                        <label>21</label>
                        <mixed-citation publication-type="journal">[21]	S. Suparyati, E. Utami, and A. H. Muhammad, &quot;Applying different resampling strategies in random forest algorithm to predict lumpy skin disease,&quot; Jurnal RESTI (Rekayasa Sistem dan Teknologi Informasi), vol. 6, no. 4, pp. 555-562, 2022.</mixed-citation>
                    </ref>
                                    <ref id="ref22">
                        <label>22</label>
                        <mixed-citation publication-type="journal">[22]	R. Oktafiani, A. Hermawan, and D. Avianto, &quot;Max Depth Impact on Heart Disease Classification: Decision Tree and Random Forest,&quot; Jurnal RESTI (Rekayasa Sistem dan Teknologi Informasi), vol. 8, no. 1, pp. 160-168, 2024.</mixed-citation>
                    </ref>
                                    <ref id="ref23">
                        <label>23</label>
                        <mixed-citation publication-type="journal">[23]	I. Tougui, A. Jilbab, and J. El Mhamdi, &quot;Impact of the choice of cross-validation techniques on the results of machine learning-based diagnostic applications,&quot; Healthcare informatics research, vol. 27, no. 3, pp. 189-199, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref24">
                        <label>24</label>
                        <mixed-citation publication-type="journal">[24]	A. Géron, Hands-on machine learning with Scikit-Learn, Keras, and TensorFlow: Concepts, tools, and techniques to build intelligent systems. &quot; O&#039;Reilly Media, Inc.&quot;, 2022.</mixed-citation>
                    </ref>
                                    <ref id="ref25">
                        <label>25</label>
                        <mixed-citation publication-type="journal">[25]	M. Yin, J. Wortman Vaughan, and H. Wallach, &quot;Understanding the effect of accuracy on trust in machine learning models,&quot; in Proceedings of the 2019 chi conference on human factors in computing systems, 2019, pp. 1-12.</mixed-citation>
                    </ref>
                                    <ref id="ref26">
                        <label>26</label>
                        <mixed-citation publication-type="journal">[26]	J. Davis and M. Goadrich, &quot;The relationship between Precision-Recall and ROC curves,&quot; in Proceedings of the 23rd international conference on Machine learning, 2006, pp. 233-240.</mixed-citation>
                    </ref>
                                    <ref id="ref27">
                        <label>27</label>
                        <mixed-citation publication-type="journal">[27]	A. Humphrey et al., &quot;Machine-learning classification of astronomical sources: estimating F1-score in the absence of ground truth,&quot; Monthly Notices of the Royal Astronomical Society: Letters, vol. 517, no. 1, pp. L116-L120, 2022.</mixed-citation>
                    </ref>
                                    <ref id="ref28">
                        <label>28</label>
                        <mixed-citation publication-type="journal">[28]	J. Liang, &quot;Confusion matrix: Machine learning,&quot; POGIL Activity Clearinghouse, vol. 3, no. 4, 2022.</mixed-citation>
                    </ref>
                                    <ref id="ref29">
                        <label>29</label>
                        <mixed-citation publication-type="journal">[29]	I. Markoulidakis and G. Markoulidakis, &quot;Probabilistic Confusion Matrix: A Novel Method for Machine Learning Algorithm Generalized Performance Analysis,&quot; Technologies, vol. 12, no. 7, p. 113, 2024.</mixed-citation>
                    </ref>
                                    <ref id="ref30">
                        <label>30</label>
                        <mixed-citation publication-type="journal">[30]	V. A. Huynh-Thu, Y. Saeys, L. Wehenkel, and P. Geurts, &quot;Statistical interpretation of machine learning-based feature importance scores for biomarker discovery,&quot; Bioinformatics, vol. 28, no. 13, pp. 1766-1774, 2012.</mixed-citation>
                    </ref>
                                    <ref id="ref31">
                        <label>31</label>
                        <mixed-citation publication-type="journal">[31]	F. Pan, T. Converse, D. Ahn, F. Salvetti, and G. Donato, &quot;Feature selection for ranking using boosted trees,&quot; in Proceedings of the 18th ACM conference on Information and knowledge management, 2009, pp. 2025-2028.</mixed-citation>
                    </ref>
                                    <ref id="ref32">
                        <label>32</label>
                        <mixed-citation publication-type="journal">[32]	A. A. Megantara and T. Ahmad, &quot;Feature importance ranking for increasing performance of intrusion detection system,&quot; in 2020 3rd International Conference on Computer and Informatics Engineering (IC2IE), 2020: IEEE, pp. 37-42.</mixed-citation>
                    </ref>
                                    <ref id="ref33">
                        <label>33</label>
                        <mixed-citation publication-type="journal">[33]	M. A. Jamil and S. Khanam, &quot;Influence of one-way ANOVA and Kruskal–Wallis based feature ranking on the performance of ML classifiers for bearing fault diagnosis,&quot; Journal of Vibration Engineering &amp; Technologies, vol. 12, no. 3, pp. 3101-3132, 2024.</mixed-citation>
                    </ref>
                                    <ref id="ref34">
                        <label>34</label>
                        <mixed-citation publication-type="journal">[34]	N. Silpa, V. M. Rao, M. V. Subbarao, R. R. Kurada, S. S. Reddy, and P. J. Uppalapati, &quot;An enriched employee retention analysis system with a combination strategy of feature selection and machine learning techniques,&quot; in 2023 7th International Conference on Intelligent Computing and Control Systems (ICICCS), 2023: IEEE, pp. 142-149.</mixed-citation>
                    </ref>
                                    <ref id="ref35">
                        <label>35</label>
                        <mixed-citation publication-type="journal">[35]	C. Strobl, A.-L. Boulesteix, A. Zeileis, and T. Hothorn, &quot;Bias in random forest variable importance measures: Illustrations, sources and a solution,&quot; BMC bioinformatics, vol. 8, pp. 1-21, 2007.</mixed-citation>
                    </ref>
                                    <ref id="ref36">
                        <label>36</label>
                        <mixed-citation publication-type="journal">[36]	B. M. Greenwell, B. C. Boehmke, and A. J. McCarthy, &quot;A simple and effective model-based variable importance measure,&quot; arXiv preprint arXiv:1805.04755, 2018.</mixed-citation>
                    </ref>
                                    <ref id="ref37">
                        <label>37</label>
                        <mixed-citation publication-type="journal">[37]   Bharath011, Heart Disease Classification Dataset, Kaggle, 2022. [Çevrimiçi]. Erişim adresi:https://www.kaggle.com/datasets/bharath011/heart-disease-classification dataset</mixed-citation>
                    </ref>
                            </ref-list>
                    </back>
    </article>
