<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.4 20241031//EN"
        "https://jats.nlm.nih.gov/publishing/1.4/JATS-journalpublishing1-4.dtd">
<article  article-type="research-article"        dtd-version="1.4">
            <front>

                <journal-meta>
                    <!-- Journal-level metadata: identifier, title, ISSNs and publisher. -->
                    <!-- NOTE(review): journal-id is empty and has no journal-id-type; supply the real identifier. -->
                    <journal-id></journal-id>
                    <journal-title-group>
                        <journal-title>Balkan Journal of Electrical and Computer Engineering</journal-title>
                    </journal-title-group>
                    <!-- NOTE(review): print and electronic ISSN carry the same value; confirm this is intended. -->
                    <issn pub-type="ppub">2147-284X</issn>
                    <issn pub-type="epub">2147-284X</issn>
                    <publisher>
                        <publisher-name>MUSA YILMAZ</publisher-name>
                    </publisher>
                </journal-meta>
                <article-meta>
                                        <article-id pub-id-type="doi">10.17694/bajece.781162</article-id>
                                        <!-- Subject classification, one subj-group per language. -->
                                        <article-categories>
                                            <subj-group xml:lang="en">
                                                <subject>Artificial Intelligence</subject>
                                            </subj-group>
                                            <subj-group xml:lang="tr">
                                                <subject>Yapay Zeka</subject>
                                            </subj-group>
                                        </article-categories>
                                        <title-group>
                                            <article-title>Autonomous Navigation in Search and Rescue Simulated Environment using Deep Reinforcement Learning</article-title>
                                        </title-group>
            
                                                    <contrib-group content-type="authors">
                                                        <!-- Author list. Each ORCID iD sits flush inside contrib-id, because
                                                             whitespace in that element's content is part of the identifier value. -->
                                                        <contrib contrib-type="author">
                                                            <contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-5450-1316</contrib-id>
                                                            <name>
                                                                <surname>Abdeh</surname>
                                                                <given-names>Mohammed</given-names>
                                                            </name>
                                                            <aff>ÇUKUROVA ÜNİVERSİTESİ</aff>
                                                        </contrib>
                                                        <contrib contrib-type="author">
                                                            <contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-5876-4116</contrib-id>
                                                            <name>
                                                                <surname>Abut</surname>
                                                                <given-names>Fatih</given-names>
                                                            </name>
                                                            <aff>ÇUKUROVA ÜNİVERSİTESİ</aff>
                                                        </contrib>
                                                        <contrib contrib-type="author">
                                                            <contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-0780-0679</contrib-id>
                                                            <name>
                                                                <surname>Akay</surname>
                                                                <given-names>Fatih</given-names>
                                                            </name>
                                                            <aff>ÇUKUROVA ÜNİVERSİTESİ</aff>
                                                        </contrib>
                                                    </contrib-group>
                        
                                        <pub-date pub-type="pub" iso-8601-date="20210430">
                                            <!-- Child elements mirror iso-8601-date (YYYYMMDD): 30 April 2021. -->
                                            <day>30</day>
                                            <month>04</month>
                                            <year>2021</year>
                                        </pub-date>
                                        <volume>9</volume>
                                        <issue>2</issue>
                                        <fpage>92</fpage>
                                        <lpage>98</lpage>
                        
                        <history>
                            <!-- Each date's children mirror its iso-8601-date attribute (YYYYMMDD). -->
                            <!-- Received 16 August 2020. -->
                            <date date-type="received" iso-8601-date="20200816">
                                <day>16</day>
                                <month>08</month>
                                <year>2020</year>
                            </date>
                            <!-- Accepted 5 February 2021. -->
                            <date date-type="accepted" iso-8601-date="20210205">
                                <day>05</day>
                                <month>02</month>
                                <year>2021</year>
                            </date>
                        </history>
                                        <permissions>
                                            <!-- Journal-level copyright notice. -->
                                            <!-- NOTE(review): copyright-year is 2013 while this record's pub-date year is 2021; confirm which year applies to the article. -->
                                            <copyright-statement>Copyright © 2013, Balkan Journal of Electrical and Computer Engineering</copyright-statement>
                                            <copyright-year>2013</copyright-year>
                                            <copyright-holder>Balkan Journal of Electrical and Computer Engineering</copyright-holder>
                                        </permissions>
            
                                                                                                                        <abstract><p>Human assisted search and rescue (SAR) robots are increasingly being used in zones of natural disasters, industrial accidents, and civil wars. Due to complex terrains, obstacles, and uncertainties in time availability, there is a need for these robots to have a certain level of autonomy to act independently for approaching certain SAR tasks. One of these tasks is autonomous navigation. Previous approaches to develop autonomous or semi-autonomous SAR navigating robots use heuristics-based methods. These algorithms, however, require environment-related prior knowledge and enough sensing capabilities, which are hard to maintain due to restrictions of size and weight in highly unstructured environments such as collapsed buildings. This study approaches the problem of autonomous navigation using a modified version of the Deep Q-Network algorithm. Unlike the classical usage of the entire game screen images to train the agent, our approach uses only the images captured by the agent's low-resolution camera to train the agent for navigating through an arena avoiding obstacles and to reach a victim. This approach is a much more relevant way of decision making in complex, uncertain contexts; since in real-world SAR scenarios, it is almost impossible to have the area's full information to be used by SAR teams. We simulated a SAR scenario, which consists of an arena full of randomly generated obstacles, a victim, and an autonomous SAR robot. The simulation results show that the agent was able to reach the victim in 56% of the evaluation episodes after 400 episodes of training.</p></abstract>
                                                            
            
                                                                                        <kwd-group>
                                                                                            <!-- Keyword text is written without surrounding whitespace so exact-match indexing works. -->
                                                                                            <kwd>Deep Reinforcement Learning</kwd>
                                                                                            <kwd>Autonomous Navigation</kwd>
                                                                                            <kwd>Autonomous Search and Rescue</kwd>
                                                                                            <kwd>Simulation</kwd>
                                                                                        </kwd-group>
                            
                                                                                                                                                    </article-meta>
    </front>
    <back>
                            <ref-list>
                                <!-- Reference list. The citation number lives only in <label>; it is not repeated
                                     inside mixed-citation. publication-type reflects the kind of work cited, and
                                     DOIs are tagged with pub-id so they can be extracted mechanically. -->
                                <ref id="ref1">
                                    <label>1</label>
                                    <mixed-citation publication-type="book">C. Kenny, Why Do People Die In Earthquakes? The Costs, Benefits, And Institutions Of Disaster Risk Reduction In Developing Countries. The World Bank, 2009.</mixed-citation>
                                </ref>
                                <ref id="ref2">
                                    <label>2</label>
                                    <mixed-citation publication-type="standard">“NFPA 1670, Standard on Operations and Training for Technical Rescue Incidents - National Fire Protection Association - Google Books.” (accessed Aug. 03, 2020).</mixed-citation>
                                </ref>
                                <ref id="ref3">
                                    <label>3</label>
                                    <mixed-citation publication-type="book">“Rescue: Technical Rescue Program Development Manual - Google Books.” https://books.google.com.tr/books/about/Rescue_Technical_Rescue_Program_Developm.html?id=2VNSswEACAAJ&amp;redir_esc=y (accessed Aug. 03, 2020).</mixed-citation>
                                </ref>
                                <ref id="ref4">
                                    <label>4</label>
                                    <mixed-citation publication-type="book">R. R. Murphy et al., “Search and Rescue Robotics,” in Springer Handbook of Robotics, Springer Berlin Heidelberg, 2008, pp. 1151–1173.</mixed-citation>
                                </ref>
                                <ref id="ref5">
                                    <label>5</label>
                                    <mixed-citation publication-type="book">T. Bräunl, “Localization and Navigation,” in Embedded Robotics, Springer Berlin Heidelberg, 2008, pp. 241–269.</mixed-citation>
                                </ref>
                                <ref id="ref6">
                                    <label>6</label>
                                    <mixed-citation publication-type="journal">K. N. McGuire, G. C. H. E. de Croon, and K. Tuyls, “A comparative study of bug algorithms for robot navigation,” Rob. Auton. Syst., vol. 121, p. 103261, Nov. 2019.</mixed-citation>
                                </ref>
                                <ref id="ref7">
                                    <label>7</label>
                                    <mixed-citation publication-type="confproc">S. Waharte and N. Trigoni, “Supporting search and rescue operations with UAVs,” in Proceedings - EST 2010 - 2010 International Conference on Emerging Security Technologies, ROBOSEC 2010 - Robots and Security, LAB-RS 2010 - Learning and Adaptive Behavior in Robotic Systems, 2010, pp. 142–147, DOI: <pub-id pub-id-type="doi">10.1109/EST.2010.31</pub-id>.</mixed-citation>
                                </ref>
                                <ref id="ref8">
                                    <label>8</label>
                                    <mixed-citation publication-type="journal">V. Mnih et al., “Human-level control through deep reinforcement learning,” Nature, vol. 518, no. 7540, pp. 529–533, Feb. 2015, DOI: <pub-id pub-id-type="doi">10.1038/nature14236</pub-id>.</mixed-citation>
                                </ref>
                                <ref id="ref9">
                                    <label>9</label>
                                    <mixed-citation publication-type="journal">D. Silver et al., “Mastering the game of Go with deep neural networks and tree search,” Nature, vol. 529, no. 7587, pp. 484–489, Jan. 2016, DOI: <pub-id pub-id-type="doi">10.1038/nature16961</pub-id>.</mixed-citation>
                                </ref>
                                <ref id="ref10">
                                    <label>10</label>
                                    <mixed-citation publication-type="confproc">J. Xiao, A. Owens, and A. Torralba, “SUN3D: A database of big spaces reconstructed using SfM and object labels,” in Proceedings of the IEEE International Conference on Computer Vision, 2013, pp. 1625–1632, DOI: <pub-id pub-id-type="doi">10.1109/ICCV.2013.458</pub-id>.</mixed-citation>
                                </ref>
                                <ref id="ref11">
                                    <label>11</label>
                                    <mixed-citation publication-type="confproc">I. Toschi, P. Rodríguez-Gonzálvez, F. Remondino, S. Minto, S. Orlandini, and A. Fuller, “Accuracy evaluation of a mobile mapping system with advanced statistical methods,” in International Archives of the Photogrammetry, Remote Sensing and Spatial Information Sciences - ISPRS Archives, 2015, vol. 40, no. 5W4, pp. 245–253.</mixed-citation>
                                </ref>
                                <ref id="ref12">
                                    <label>12</label>
                                    <mixed-citation publication-type="journal">P. Kim, J. Park, Y. K. Cho, and J. Kang, “UAV-assisted autonomous mobile robot navigation for as-is 3D data collection and registration in cluttered environments,” Autom. Constr., vol. 106, p. 102918, Oct. 2019, DOI: <pub-id pub-id-type="doi">10.1016/j.autcon.2019.102918</pub-id>.</mixed-citation>
                                </ref>
                                <ref id="ref13">
                                    <label>13</label>
                                    <mixed-citation publication-type="web">“ICARUS Project.” https://icarus2020.eu/ (accessed Aug. 03, 2020).</mixed-citation>
                                </ref>
                                <ref id="ref14">
                                    <label>14</label>
                                    <!-- NOTE(review): typed as a conference paper on the strength of the IEEE SSRR DOI; the citation text names no venue. -->
                                    <mixed-citation publication-type="confproc">L. Marconi et al., “The SHERPA project: smart collaboration between humans and ground-aerial robots for improving rescuing activities in alpine environments,” 2012, DOI: <pub-id pub-id-type="doi">10.1109/SSRR.2012.6523905</pub-id>.</mixed-citation>
                                </ref>
                                <ref id="ref15">
                                    <label>15</label>
                                    <mixed-citation publication-type="confproc">J. G. C. Zuluaga, J. P. Leidig, C. Trefftz, and G. Wolffe, “Deep Reinforcement Learning for Autonomous Search and Rescue,” in Proceedings of the IEEE National Aerospace Electronics Conference, NAECON, Dec. 2018, vol. 2018-July, pp. 521–524.</mixed-citation>
                                </ref>
                                <ref id="ref16">
                                    <label>16</label>
                                    <mixed-citation publication-type="web">O. Michel, “Cyberbotics Ltd. Webots TM : Professional Mobile Robot Simulation,” 2004. Accessed: Aug. 03, 2020. [Online]. Available: http://www.cyberbotics.com.</mixed-citation>
                                </ref>
                            </ref-list>
                    </back>
    </article>
