<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.4 20241031//EN"
        "https://jats.nlm.nih.gov/publishing/1.4/JATS-journalpublishing1-4.dtd">
<article  article-type="research-article"        dtd-version="1.4">
            <front>

                <journal-meta>
                                                                <journal-id>müh.bil.ve araş.dergisi</journal-id>
            <journal-title-group>
                                                                                    <journal-title>Mühendislik Bilimleri ve Araştırmaları Dergisi</journal-title>
            </journal-title-group>
                            <issn pub-type="ppub">2687-4415</issn>
                                                                                                        <publisher>
                    <publisher-name>Bandırma Onyedi Eylül Üniversitesi</publisher-name>
                </publisher>
                    </journal-meta>
                <article-meta>
                                        <article-id pub-id-type="doi">10.46387/bjesr.1419106</article-id>
                                                                <article-categories>
                                            <subj-group  xml:lang="en">
                                                            <subject>Deep Learning</subject>
                                                    </subj-group>
                                            <subj-group  xml:lang="tr">
                                                            <subject>Derin Öğrenme</subject>
                                                    </subj-group>
                                    </article-categories>
                                                                                                                                                        <title-group>
                                                                                                                        <trans-title-group xml:lang="tr">
                                    <trans-title>Evrişimli Sinir Ağlarında Gelişmiş Performans için Hiperparametrelerin Optimize Edilmesi: NASNetMobile ve DenseNet201 Modellerini Kullanan Bir Çalışma</trans-title>
                                </trans-title-group>
                                                                                                                                                                                                <article-title>Optimizing Hyperparameters for Enhanced Performance in Convolutional Neural Networks: A Study Using NASNetMobile and DenseNet201 Models</article-title>
                                                                                                    </title-group>
            
                                                    <contrib-group content-type="authors">
                                                                        <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0001-7708-8731</contrib-id>
                                                                <name>
                                    <surname>Aksoy</surname>
                                    <given-names>İbrahim</given-names>
                                </name>
                                                                    <aff>AKSARAY UNIVERSITY</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0002-3752-7354</contrib-id>
                                                                <name>
                                    <surname>Adem</surname>
                                    <given-names>Kemal</given-names>
                                </name>
                                                                    <aff>SİVAS BİLİM VE TEKNOLOJİ ÜNİVERSİTESİ, MÜHENDİSLİK VE DOĞA BİLİMLERİ FAKÜLTESİ, BİLGİSAYAR MÜHENDİSLİĞİ BÖLÜMÜ</aff>
                                                            </contrib>
                                                                                </contrib-group>
                        
                                        <pub-date pub-type="pub" iso-8601-date="20240430">
                    <day>04</day>
                    <month>30</month>
                    <year>2024</year>
                </pub-date>
                                        <volume>6</volume>
                                        <issue>1</issue>
                                        <fpage>42</fpage>
                                        <lpage>52</lpage>
                        
                        <history>
                                    <date date-type="received" iso-8601-date="20240113">
                        <day>01</day>
                        <month>13</month>
                        <year>2024</year>
                    </date>
                                                    <date date-type="accepted" iso-8601-date="20240216">
                        <day>02</day>
                        <month>16</month>
                        <year>2024</year>
                    </date>
                            </history>
                                        <permissions>
                    <copyright-statement>Copyright © 2019, Mühendislik Bilimleri ve Araştırmaları Dergisi</copyright-statement>
                    <copyright-year>2019</copyright-year>
                    <copyright-holder>Mühendislik Bilimleri ve Araştırmaları Dergisi</copyright-holder>
                </permissions>
            
                                                                                                <trans-abstract xml:lang="tr">
                            <p>Biyolojik sinir ağlarının işleyişinden esinlenen evrişimli sinir ağlarının görüntü verisi tanıma, sınıflandırma ve özellik çıkarma gibi görevlerde oldukça başarılı olduğu kanıtlanmıştır. Yine de, bu ağların tasarlanması ve uygulanması bazı zorluklar ortaya çıkarmaktadır. Bu zorluklardan biri, belirli model, veri kümesi ve donanıma göre uyarlanmış hiperparametrelerin optimize edilmesidir. Bu çalışmada, çeşitli hiperparametrelerin evrişimli sinir ağı modellerinin sınıflandırma performansını nasıl etkilediği araştırılmıştır. Araştırma epok sayısı, nöronlar, yığın boyutu, aktivasyon fonksiyonları, optimizasyon algoritmaları ve öğrenme oranı gibi parametrelere odaklanmıştır. Keras kütüphanesi kullanılarak NASNetMobile ve DenseNet201 modelleri (veri kümesindeki üstün performansları nedeniyle vurgulanmıştır) kullanılarak deneyler yapılmıştır. 65 farklı eğitim oturumu gerçekleştirildikten sonra, doğruluk oranları ilk değerlerine kıyasla NASNetMobile için %6,5 ve DenseNet201 için %11,55 oranında kayda değer bir artış göstermiştir.</p></trans-abstract>
                                                                                                                                    <abstract><p>Convolutional neural networks, inspired by the workings of biological neural networks, have proven highly successful in tasks like image data recognition, classification, and feature extraction. Yet, designing and implementing these networks pose certain challenges. One such challenge involves optimizing hyperparameters tailored to the specific model, dataset, and hardware. This study delved into how various hyperparameters impact the classification performance of convolutional neural network models. The investigation focused on parameters like the number of epochs, neurons, batch size, activation functions, optimization algorithms, and learning rate. Using the Keras library, experiments were conducted using NASNetMobile and DenseNet201 models—highlighted for their superior performance on the dataset. After running 65 different training sessions, accuracy rates saw a notable increase of 6.5% for NASNetMobile and 11.55% for DenseNet201 compared to their initial values.</p></abstract>
                                                            
            
                                                                                        <kwd-group>
                                                    <kwd>Image	Classification</kwd>
                                                    <kwd>  DenseNet</kwd>
                                                    <kwd>  NASNetMobile</kwd>
                                                    <kwd>  Hyperparameters</kwd>
                                                    <kwd>  Activation			Function</kwd>
                                                    <kwd>  Optimization		Algorithm</kwd>
                                                    <kwd>  CNN</kwd>
                                            </kwd-group>
                            
                                                <kwd-group xml:lang="tr">
                                                    <kwd>Görüntü	Sınıflandırma</kwd>
                                                    <kwd>  DenseNet</kwd>
                                                    <kwd>  NASNetMobile</kwd>
                                                    <kwd>  Hiperparametreler</kwd>
                                                    <kwd>  Aktivasyon	Fonksiyonları</kwd>
                                                    <kwd>  Optimizasyon Algoritmaları</kwd>
                                                    <kwd>  Öğrenme Oranı</kwd>
                                                    <kwd>  ESA</kwd>
                                            </kwd-group>
                                                                                                                                        </article-meta>
    </front>
    <back>
                            <ref-list>
                                    <ref id="ref1">
                        <label>1</label>
                        <mixed-citation publication-type="journal">E. Öztemel “Yapay sinir ağları”, Papatya Yayıncılık, İstanbul, 2003.</mixed-citation>
                    </ref>
                                    <ref id="ref2">
                        <label>2</label>
                        <mixed-citation publication-type="journal">S. Aktürk and K. Serbest, “Nesne Tespiti İçin Derin Öğrenme Kütüphanelerinin İncelenmesi”, Journal of Smart Systems Research, vol. 3, no. 2, pp. 97-119, 2022.</mixed-citation>
                    </ref>
                                    <ref id="ref3">
                        <label>3</label>
                        <mixed-citation publication-type="journal">A. Onan, “Evrişimli sinir ağı mimarilerine dayalı Türkçe duygu analizi”, Avrupa Bilim ve Teknoloji Dergisi, pp. 374-380, 2020.</mixed-citation>
                    </ref>
                                    <ref id="ref4">
                        <label>4</label>
                        <mixed-citation publication-type="journal">L.N. Smith, “Cyclical learning rates for training neural networks”, IEEE winter conference on applications of computer vision (WACV), pp. 464-472, 2017.</mixed-citation>
                    </ref>
                                    <ref id="ref5">
                        <label>5</label>
                        <mixed-citation publication-type="journal">C. Bircanoğlu and N. Arıca, “Yapay Sinir Ağlarında Aktivasyon Fonksiyonlarının Karşılaştırılması”, in 2018 26th signal processing and communications applications conference (SIU). IEEE, pp. 1-4, İzmir, 2018.</mixed-citation>
                    </ref>
                                    <ref id="ref6">
                        <label>6</label>
                        <mixed-citation publication-type="journal">A. Gülcü and Z. Kuş, “Konvolüsyonel sinir ağlarında hiper-parametre optimizasyonu yöntemlerinin incelenmesi”, Gazi University Journal of Science Part C: Design and Technology, pp. 503-522, 2019.</mixed-citation>
                    </ref>
                                    <ref id="ref7">
                        <label>7</label>
                        <mixed-citation publication-type="journal">E. Seyyarer, F. Ayata, T. Uçkan and A. Karci, “Derin öğrenmede kullanılan optimizasyon algoritmalarının uygulanması ve kıyaslanması”, Computer Science, vol. 5, no. 2, pp. 90-98, 2020.</mixed-citation>
                    </ref>
                                    <ref id="ref8">
                        <label>8</label>
                        <mixed-citation publication-type="journal">K. Adem, “P+ FELU: Flexible and trainable fast exponential linear unit for deep learning architectures”, Neural Computing and Applications, vol. 34, no. 24, pp. 21729-21740, 2022.</mixed-citation>
                    </ref>
                                    <ref id="ref9">
                        <label>9</label>
                        <mixed-citation publication-type="journal">P. Liashchynskyi and P. Liashchynskyi, “Grid search, random search, genetic algorithm: a big comparison for NAS”, arXiv preprint arXiv:1912.06059, 2019.</mixed-citation>
                    </ref>
                                    <ref id="ref10">
                        <label>10</label>
                        <mixed-citation publication-type="journal">Kaggle, “Dogs &amp; Cats Images”, url: https://www.kaggle.com/datasets/chetankv/dogs-cats-images, (Access Date: 01/01/2024).</mixed-citation>
                    </ref>
                                    <ref id="ref11">
                        <label>11</label>
                        <mixed-citation publication-type="journal">Kaggle, “pizza classification data”, url: https://www.kaggle.com/datasets/projectshs/pizza-classification-data, (Access Date: 01/01/2024).</mixed-citation>
                    </ref>
                                    <ref id="ref12">
                        <label>12</label>
                        <mixed-citation publication-type="journal">A.G. Ivakhnenko and V.G. Lapa, “Cybernetic predicting devices”, 1966.</mixed-citation>
                    </ref>
                                    <ref id="ref13">
                        <label>13</label>
                        <mixed-citation publication-type="journal">[13]	A. Şeker, B. Diri and H. Balık, “Derin öğrenme yöntemleri ve uygulamaları hakkında bir inceleme”, Gazi Mühendislik Bilimleri Dergisi, vol. 3, no. 3, pp. 47-64, 2017.</mixed-citation>
                    </ref>
                                    <ref id="ref14">
                        <label>14</label>
                        <mixed-citation publication-type="journal">Ö. İnik and E. Ülker, “Derin Öğrenmede Kullanılan Veri Setleri ve Yazılım Kütüphaneleri”, International Symposium on Multidisciplinary Studies and Innovative Technologies (ISMSIT) 2017, Tokat, 2017.</mixed-citation>
                    </ref>
                                    <ref id="ref15">
                        <label>15</label>
                        <mixed-citation publication-type="journal">F.D. Adhinata, D.P. Rakhmadani, M. Wibowo and A. Jayadi, “A deep learning using DenseNet201 to detect masked or non-masked face”, JUITA: Jurnal Informatika, vol. 9, no. 1, pp. 115-121, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref16">
                        <label>16</label>
                        <mixed-citation publication-type="journal">S.H. Wang and Y.D. Zhang, “DenseNet-201-based deep neural network with composite learning factor and precomputation for multiple sclerosis classification”, ACM Transactions on Multimedia Computing, Communications, and Applications (TOMM), vol. 16, no. 2, pp. 1-19, 2020.</mixed-citation>
                    </ref>
                                    <ref id="ref17">
                        <label>17</label>
                        <mixed-citation publication-type="journal">A.O. Adedoja, P.A. Owolawi, T. Mapayi and C. Tu, “Intelligent Mobile Plant Disease Diagnostic System Using NASNet-Mobile Deep Learning”, IAENG International Journal of Computer Science, vol. 49, no. 1, pp. 216-231, 2022.</mixed-citation>
                    </ref>
                                    <ref id="ref18">
                        <label>18</label>
                        <mixed-citation publication-type="journal">A. Daşgın, “Covid19 Yayılımını Azaltmak İçin Yüz Maskesinin Evrişimsel Sinir Ağı Modelleri İle Tespiti”, Master’s thesis, Sosyal Bilimler Enstitüsü, Aksaray Üniversitesi, Aksaray, 2023.</mixed-citation>
                    </ref>
                                    <ref id="ref19">
                        <label>19</label>
                        <mixed-citation publication-type="journal">C. Doğan, “İstatistiksel ve Makine Öğrenme ile Derin Sinir Ağlarında Hiper-Parametre Seçimi İçin Melez Yaklaşım”, Master’s thesis, Fen Bilimleri Enstitüsü, Hacettepe Üniversitesi, Ankara, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref20">
                        <label>20</label>
                        <mixed-citation publication-type="journal">F. Kurt, “Evrişimli Sinir Ağlarında Hiper Parametrelerin Etkisinin İncelenmesi”, Master’s thesis, Fen Bilimleri Enstitüsü, Hacettepe Üniversitesi, Ankara, 2018.</mixed-citation>
                    </ref>
                                    <ref id="ref21">
                        <label>21</label>
                        <mixed-citation publication-type="journal">J. Brownlee, “What is the Difference Between a Batch and an Epoch in a Neural Network”, Machine Learning Mastery, vol. 20, 2018.</mixed-citation>
                    </ref>
                                    <ref id="ref22">
                        <label>22</label>
                        <mixed-citation publication-type="journal">W. Hastomo, A.S.B.  Karno, N. Kalbuana, and A. Meiriki, “Characteristic parameters of epoch deep learning to predict Covid-19 data in Indonesia”, Journal of Physics: Conference Series, vol. 1933, no. 1, pp. 1-4, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref23">
                        <label>23</label>
                        <mixed-citation publication-type="journal">M.A. Bülbül and C. Öztürk, “Optimization, modeling and implementation of plant water consumption control using genetic algorithm and artificial neural network in a hybrid structure”, Arabian Journal for Science and Engineering, vol. 47, no. 2, pp. 2329-2343, 2022.</mixed-citation>
                    </ref>
                                    <ref id="ref24">
                        <label>24</label>
                        <mixed-citation publication-type="journal">A. Zhang, Z.C. Lipton, M. Li and A.J. Smola, “Dive into deep learning”, arXiv preprint arXiv:2106.11342, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref25">
                        <label>25</label>
                        <mixed-citation publication-type="journal">T. Ünal, Ü. Çiftçi and N.N. Urgan, “Bir Gizli Katmanlı Yapay Sinir Ağlarında Optimal Nöron Sayısının İncelenmesi”, Süleyman Demirel Üniversitesi Fen Edebiyat Fakültesi Fen Dergisi, vol. 17, no. 2, pp. 303-325, 2022.</mixed-citation>
                    </ref>
                                    <ref id="ref26">
                        <label>26</label>
                        <mixed-citation publication-type="journal">L.N. Smith, “A disciplined approach to neural network hyper-parameters: Part 1-learning rate, batch size, momentum, and weight decay”, arXiv preprint arXiv:1803.09820, 2018.</mixed-citation>
                    </ref>
                                    <ref id="ref27">
                        <label>27</label>
                        <mixed-citation publication-type="journal">G. Ser and C.T. Bati, “Derin sinir ağları ile en iyi modelin belirlenmesi: mantar verileri üzerine Keras uygulaması”, Yuzuncu Yıl University Journal of Agricultural Sciences, vol. 29, no. 3, pp. 406-417, 2019.</mixed-citation>
                    </ref>
                                    <ref id="ref28">
                        <label>28</label>
                        <mixed-citation publication-type="journal">D. Kulshrestha, “Activation Functions in Machine Learning”, url: https://iq.opengenus.org/activation-functions-ml/, (Access Date: 03.12.2023).</mixed-citation>
                    </ref>
                                    <ref id="ref29">
                        <label>29</label>
                        <mixed-citation publication-type="journal">S. Kılıçarslan, C. Közkurt, S. Baş and A. Elen, “Detection and classification of pneumonia using novel Superior Exponential (SupEx) activation function in convolutional neural networks”, Expert Systems with Applications, vol. 217, no. 119503, 2023.</mixed-citation>
                    </ref>
                                    <ref id="ref30">
                        <label>30</label>
                        <mixed-citation publication-type="journal">S. Kılıçarslan and M. Çelik, “RSigELU: A nonlinear activation function for deep neural networks”, Expert Systems with Applications, vol. 174, no. 114805, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref31">
                        <label>31</label>
                        <mixed-citation publication-type="journal">M.A. Bülbül, “Optimization of artificial neural network structure and hyperparameters in hybrid model by genetic algorithm: iOS–android application for breast cancer diagnosis/prediction”, The Journal of Supercomputing, pp. 1-21, 2023.</mixed-citation>
                    </ref>
                                    <ref id="ref32">
                        <label>32</label>
                        <mixed-citation publication-type="journal">R. Sun, “Optimization for deep learning: theory and algorithms”, arXiv preprint arXiv:1912.08957, 2019.</mixed-citation>
                    </ref>
                                    <ref id="ref33">
                        <label>33</label>
                        <mixed-citation publication-type="journal">Y. Bengio, “Practical recommendations for gradient-based training of deep architectures”, Neural Networks: Tricks of the Trade: Second Edition, pp. 437-478, 2012.</mixed-citation>
                    </ref>
                            </ref-list>
                    </back>
    </article>
