<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.4 20241031//EN"
        "https://jats.nlm.nih.gov/publishing/1.4/JATS-journalpublishing1-4.dtd">
<article  article-type="research-article"        dtd-version="1.4">
            <front>

                <journal-meta>
                                    <journal-id></journal-id>
            <journal-title-group>
                                                                                    <journal-title>Çukurova Üniversitesi Mühendislik Fakültesi Dergisi</journal-title>
            </journal-title-group>
                            <issn pub-type="ppub">2757-9255</issn>
                                                                                                        <publisher>
                    <publisher-name>Çukurova Üniversitesi</publisher-name>
                </publisher>
                    </journal-meta>
                <article-meta>
                                        <article-id pub-id-type="doi">10.21605/cukurovaumfd.1410642</article-id>
                                                                <article-categories>
                                            <subj-group  xml:lang="en">
                                                            <subject>Data Models, Storage and Indexing</subject>
                                                            <subject>Computer Software</subject>
                                                    </subj-group>
                                            <subj-group  xml:lang="tr">
                                                            <subject>Veri Modelleri, Depolama ve Dizinleme</subject>
                                                            <subject>Bilgisayar Yazılımı</subject>
                                                    </subj-group>
                                    </article-categories>
                                                                                                                                                        <title-group>
                                                                                                                        <trans-title-group xml:lang="tr">
                                    <trans-title>Suç Kategorisi Tespiti için Yığınlama Topluluk Öğrenimi Modeli Kullanan Çatı Tasarımı</trans-title>
                                </trans-title-group>
                                                                                                                                                                                                <article-title>A Design of Crime Category Detection Framework using Stacking Ensemble Model</article-title>
                                                                                                    </title-group>
            
                                                    <contrib-group content-type="authors">
                                                                        <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0002-3028-0416</contrib-id>
                                                                <name>
                                    <surname>Arslan</surname>
                                    <given-names>Recep Sinan</given-names>
                                </name>
                                                                    <aff>KAYSERİ ÜNİVERSİTESİ, MÜHENDİSLİK, MİMARLIK VE TASARIM FAKÜLTESİ, BİLGİSAYAR MÜHENDİSLİĞİ BÖLÜMÜ</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0009-0000-8201-9343</contrib-id>
                                                                <name>
                                    <surname>Dülgeroğlu</surname>
                                    <given-names>Burak</given-names>
                                </name>
                                                                    <aff>KAYSERİ ÜNİVERSİTESİ, LİSANSÜSTÜ EĞİTİM ENSTİTÜSÜ</aff>
                                                            </contrib>
                                                                                </contrib-group>
                        
                                        <pub-date pub-type="pub" iso-8601-date="20231228">
                    <day>12</day>
                    <month>28</month>
                    <year>2023</year>
                </pub-date>
                                        <volume>38</volume>
                                        <issue>4</issue>
                                        <fpage>1035</fpage>
                                        <lpage>1048</lpage>
                        
                        <history>
                                    <date date-type="received" iso-8601-date="20231016">
                        <day>10</day>
                        <month>16</month>
                        <year>2023</year>
                    </date>
                                                    <date date-type="accepted" iso-8601-date="20231225">
                        <day>12</day>
                        <month>25</month>
                        <year>2023</year>
                    </date>
                            </history>
                                        <permissions>
                    <copyright-statement>Copyright © 2009, Çukurova Üniversitesi Mühendislik Fakültesi Dergisi</copyright-statement>
                    <copyright-year>2009</copyright-year>
                    <copyright-holder>Çukurova Üniversitesi Mühendislik Fakültesi Dergisi</copyright-holder>
                </permissions>
            
                                                                                                <trans-abstract xml:lang="tr">
                            <p>Suç, toplum açısından kanuni olarak zararlı olarak tanımlanmış eylemi ifade eder ve bu eylemlerin engellenmesi için suç türünün anlaşılması oldukça önemlidir. Ancak suç herhangi bir zamanda ve yerde meydana gelebilmektedir ve bu durum suçun tahmin edilebilirliğini zorlaştırmaktadır. Daha önce işlenmiş suçlara dayalı olarak oluşturulan verilerin kullanılması bu zorluğun aşılmasına katkı sağlamaktadır. Bu çalışmada suç faaliyetlerini sınıflandırma için uzunluğundan bağımsız olarak metinlerin sayısal temsilini üretebilen Doc2Vec yapısı ve 8 farklı yapay öğrenme modelini içeren bir yığınlama topluluk öğrenimi modelin kullanıldığı özgün bir model önerilmiştir. Model literatürden farklı olarak öznitelikleri kategorik olarak değil metin olarak işlemekte ve vektör haline dönüştürmektedir. Bu sayede literatürde kullanılamayan özniteliklerin kullanılmasını sağlamaktadır. Önerilen model 12 yıl boyunca işlenen suçları içeren, Francisco Crime Classification, isimli online dağıtımlı bir çevrimiçi yarışma veriseti kullanılarak test edilmiştir. En yüksek suç kaydının olduğu 15 suç kategorisi için %99,28  doğruluk değeri elde edilirken, kesinlik, geri çağırma ve f-değeri sırasıyla %99,18, %99,38 ve %99,28 olmuştur. Çapraz doğrulama (k=10) ile 0,001 std. değeri ile %99,8 başarım yakalanmıştır. Bu performans değerleri kategorik özellik yapısının kullanıldığı literatürdeki tüm çalışmalardan yüksektir. Elde edilen sonuçlar metin tabanlı özellikler barındıran suç faaliyet raporlarının kategorik olarak model eğitimlerinde kullanılması yerine Doc2Vec gibi doğal dil işleme teknikleri ile işlenebilir vektörlere dönüştürülmesinin sınıflandırma performansına doğrudan katkı sunabildiğini göstermiş ve daha az ön işlem sayesinde daha verimli bir modelin ortaya çıkmasını sağlamıştır.</p></trans-abstract>
                                                                                                                                    <abstract><p>Crime refers to an action legally defined as harmful to society, and it is important to understand the type of crime to prevent these actions. However, crime can occur at any time and place, making it difficult to predict. Data generated based on previously committed crimes contributes to overcoming this difficulty. This study proposes a novel model for classifying criminal activities using a Doc2Vec that can cause a numerical representation of texts regardless of length and a stacking ensemble model that includes 8 different machine-learning models. Unlike the literature, the model processes the features as text and converts them into vectors rather than categorically. In this way, it enables using features that cannot be used in the literature. The proposed model is tested using a distributed online competition database, Francisco Crime Classification, which contains crimes committed over 12 years. An accuracy value of 99.28% was obtained for the 15 crime categories with the highest crime records, while precision, recall, and f-score values were 99.18%, 99.38%, and 99.20%, respectively. With cross-validation (k=10), 99.80% performance was achieved with a std. value of 0.001. These performance values are higher than those of all the studies in the literature using categorical feature structures. The results show that converting criminal activity reports, which contain text-based features, into vectors that can be processed with natural language processing techniques such as Doc2vec instead of using them categorically in model training can directly contribute to the classification performance and provide a more efficient model with less preprocessing.</p></abstract>
                                                            
            
                                                                                        <kwd-group>
                                                    <kwd>Crime prediction</kwd>
                                                    <kwd>  Criminology</kwd>
                                                    <kwd>  Doc2vec</kwd>
                                                    <kwd>  Stacking ensemble model</kwd>
                                            </kwd-group>
                            
                                                <kwd-group xml:lang="tr">
                                                    <kwd>Suç tahminlemesi</kwd>
                                                    <kwd>  Kriminoloji</kwd>
                                                    <kwd>  Doc2Vec</kwd>
                                                    <kwd>  Topluluk öğrenme</kwd>
                                            </kwd-group>
                                                                                                                                        </article-meta>
    </front>
    <back>
                            <ref-list>
                                    <ref id="ref1">
                        <label>1</label>
                        <mixed-citation publication-type="journal">1.	İçli, T.G., 1993. Türkiye’de Suçlular (Sosyal Kültürel ve Ekonomik Özellikleri. Atatürk Kültür, Dil ve Tarih Kurumu Atatürk Kültür Merkezi Yayını, Ankara, 71.</mixed-citation>
                    </ref>
                                    <ref id="ref2">
                        <label>2</label>
                        <mixed-citation publication-type="journal">2.	Hochstetler, J., Hochstetler, L., Fu, S., 2016. An Optimal Police Patrol Planning Strategy for Smart City Safety. IEEE 18th International Conference on High Performance Computing and Communications, Sydney, Australia, 1256-1263.</mixed-citation>
                    </ref>
                                    <ref id="ref3">
                        <label>3</label>
                        <mixed-citation publication-type="journal">3.	Open Government, https://www.data.gov/open -gov/, Access date: Haziran 2023.</mixed-citation>
                    </ref>
                                    <ref id="ref4">
                        <label>4</label>
                        <mixed-citation publication-type="journal">4.	Data.world Crime Datasets, https://data.world/ datasets/crime, Access date: Temmuz 2023.</mixed-citation>
                    </ref>
                                    <ref id="ref5">
                        <label>5</label>
                        <mixed-citation publication-type="journal">5.	All Data Related to Crime And Justice, https://www.ons.gov.uk/peoplepopulationandcommunity/crimeandjustice/datalist?filter=datasets, Access date: Ağustos 2023.</mixed-citation>
                    </ref>
                                    <ref id="ref6">
                        <label>6</label>
                        <mixed-citation publication-type="journal">6.	Pradhan, I., Potika, K., Eirinaki, M., Potikas, P., 2019. Exploratory Data Analysis and Crime Prediction for Smart Cities. Proceedings of the 23rd International Database Applications and Engineering Symposium on - IDEAS ’19, Athens, Greece, 1-9.</mixed-citation>
                    </ref>
                                    <ref id="ref7">
                        <label>7</label>
                        <mixed-citation publication-type="journal">7.	Ke, J., Li, X., Chen, J., 2018. San Fransisco Crime Classification (Report), Jocobs School of Engineering, San Diego, 7.</mixed-citation>
                    </ref>
                                    <ref id="ref8">
                        <label>8</label>
                        <mixed-citation publication-type="journal">8.	Khan, M., Ali, A., Alharbi, Y., 2022. Predicting and Preventing Crime: A Crime Prediction Model using San Francisco Crime Data by Classification Techniques. Complexity, 1-13.</mixed-citation>
                    </ref>
                                    <ref id="ref9">
                        <label>9</label>
                        <mixed-citation publication-type="journal">9.	Wu, X., 2016. An Informative and Predictive Analysis of the San Francisco Police Department Crime Data. M.Sc., University of California, Los Angeles, 11.</mixed-citation>
                    </ref>
                                    <ref id="ref10">
                        <label>10</label>
                        <mixed-citation publication-type="journal">10.	Abouelnaga, Y., 2016. San Francisco Crime Classification”, arXiv:1607.03626.</mixed-citation>
                    </ref>
                                    <ref id="ref11">
                        <label>11</label>
                        <mixed-citation publication-type="journal">11.	Arslan, R.S., Dülgeroğlu, B., 2023. Crime Classification using Categorical Feature Engineering and Machine Learning. International Ankara Congress on Multidisciplinary Studies-VI, Ankara, Turkey, 1-8.</mixed-citation>
                    </ref>
                                    <ref id="ref12">
                        <label>12</label>
                        <mixed-citation publication-type="journal">12.	Aldossari, B.S., Alqahtani, F.M., Alshahrani, N.S., Alhammam, M.M., Alzamanan, R.M., Aslam, N.I., 2020. A Comparative Study of Decision Tree and Naive Bayes Machine Learning Model for Crime Category Prediction in Chicago. Proceedings of 2020 6th International Conference on Computing and Data Engineering, Sanya, China, 34-38.</mixed-citation>
                    </ref>
                                    <ref id="ref13">
                        <label>13</label>
                        <mixed-citation publication-type="journal">13.	Deborah, D., Jitesh, J., Kieron, D., Vincent, T., 2023. A Comparative Analysis of Multiple Methods for Predicting a Specific Type of Crime in the City of Chicago. ArXiv: 2304.13464.</mixed-citation>
                    </ref>
                                    <ref id="ref14">
                        <label>14</label>
                        <mixed-citation publication-type="journal">14.	Reier Forradellas, R.F., Náñez Alonso, S.L., Jorge-Vazquez, J., Rodriguez, M.L., 2020. Applied Machine Learning in Social Sciences: Neural Networks and Crime Prediction. Social Sciences, 10(1), 4.</mixed-citation>
                    </ref>
                                    <ref id="ref15">
                        <label>15</label>
                        <mixed-citation publication-type="journal">15.	Kim, S., Joshi, P., Kalsi, P.S., Taheri, P., 2018. Crime Analysis through Machine Learning. 2018 IEEE 9th Annual Information Technology, Electronics and Mobile Communication Conference (IEMCON), Vancouver, Canada, 1-6.</mixed-citation>
                    </ref>
                                    <ref id="ref16">
                        <label>16</label>
                        <mixed-citation publication-type="journal">16.	Alves, L.G.A., Ribeiro, H.V., Rodrigues, F.A., 2018. Crime Prediction through Urban Metrics and Statistical Learning. Physica A: Statistical Mechanics and Its Applications, 505, 435-443.</mixed-citation>
                    </ref>
                                    <ref id="ref17">
                        <label>17</label>
                        <mixed-citation publication-type="journal">17.	Wu, S., Wang, C., Cao, H., Jia, X., 2020. Crime Prediction using Data Mining and Machine Learning. Intell. Syst. Comput., Springer Verlag, 905, 360-375.</mixed-citation>
                    </ref>
                                    <ref id="ref18">
                        <label>18</label>
                        <mixed-citation publication-type="journal">18.	Bandekar, S.R., Vijayalakshmi, C., 2020. Design and Analysis of Machine Learning algorithms for the Reduction of Crime Rates in India. Procedia Computer Science, 172, 122-127.</mixed-citation>
                    </ref>
                                    <ref id="ref19">
                        <label>19</label>
                        <mixed-citation publication-type="journal">19.	Gül, S., Polat, A., 2009. Kamu Güvenlik Politikalarının Oluşturulmasında Yeni Bir Yaklaşım: Suç Tahmini. Türk İdare Dergisi. 463 (81), 131-156.</mixed-citation>
                    </ref>
                                    <ref id="ref20">
                        <label>20</label>
                        <mixed-citation publication-type="journal">20.	Iqbal, R., 2013. An Experimental Study of Classification Algorithms for Crime Prediction. Indian Journal of Science and Technology, 6(3), 1-7.</mixed-citation>
                    </ref>
                                    <ref id="ref21">
                        <label>21</label>
                        <mixed-citation publication-type="journal">21.	Saeed, U., Sarim, M., Usmani, A., Mukhtar, A., Basit, S.A., Kashif Riffat, S., 2015. Application of Machine Learning Algorithms in Crime Classification and Classification Rule Mining. Research Journal of Recent Sciences, 4(3), 106-114.</mixed-citation>
                    </ref>
                                    <ref id="ref22">
                        <label>22</label>
                        <mixed-citation publication-type="journal">22.	Shojaee, S., Mustapha, A., Fatimah, S., Jabar, A., 2013. A Study on Classification Learning Algorithms to Predict Crime Status. International Journal of Digital Content Technology and its Applications, 7(9), 361-371.</mixed-citation>
                    </ref>
                                    <ref id="ref23">
                        <label>23</label>
                        <mixed-citation publication-type="journal">23.	Arslan, R.S., 2021. Comparison of Feature Selection Methods in Security Analysis of Android. 2021 6th International Conference on Computer Science and Engineering (UBMK). Ankara, Turkey, 1-5.</mixed-citation>
                    </ref>
                                    <ref id="ref24">
                        <label>24</label>
                        <mixed-citation publication-type="journal">24.	 Lundberg, S., Lee, S., 2017. A Unified Approach to Interpreting Model Predictions. 31st Conference on Neural Information Processing Systems (NIPS 2017), Long Beach, CA, USA, 1-11.</mixed-citation>
                    </ref>
                                    <ref id="ref25">
                        <label>25</label>
                        <mixed-citation publication-type="journal">25.	Hizlisoy, S., Arslan, R.S., 2021. Text Independent Speaker Recognition Based on MFCC and Machine Learning. Selcuk University Journal of Engineering Sciences, 20(03), 073-078.</mixed-citation>
                    </ref>
                                    <ref id="ref26">
                        <label>26</label>
                        <mixed-citation publication-type="journal">26.	Hizlisoy, S., Tüfekci, Z., 2020. Türkçe Müzikten Duygu Tanıma. European Journal of Science and Technology, Special Issue, 6-12.</mixed-citation>
                    </ref>
                                    <ref id="ref27">
                        <label>27</label>
                        <mixed-citation publication-type="journal">27.	Arslan, R.S., Yurttakal, A.H., 2020. K-Nearest Neighbour Classifier Usage for Permission based Malware Detection in Android. Icontech International Journal, 4(2), 15-27.</mixed-citation>
                    </ref>
                                    <ref id="ref28">
                        <label>28</label>
                        <mixed-citation publication-type="journal">28.	Quoc, L., Tomas, M., 2014. Distributed Representations of Sentences and Documents. Proceedings of the 31st International Conference on Machine Learning, PMLR 32(2), 1188-1196.</mixed-citation>
                    </ref>
                                    <ref id="ref29">
                        <label>29</label>
                        <mixed-citation publication-type="journal">29.	Arslan, R.S., 2021. Kötücül Web Sayfalarının Tespitinde Doc2Vec Modeli ve Makine Öğrenmesi Yaklaşımı. European Journal of Science and Technology, 27, 792-801.</mixed-citation>
                    </ref>
                                    <ref id="ref30">
                        <label>30</label>
                        <mixed-citation publication-type="journal">30.	Arslan, R.S., 2021. Kötücül URL Filtreleme için Derin Öğrenme Modeli Tasarımı. European Journal of Science and Technology, 29, 122-128.</mixed-citation>
                    </ref>
                                    <ref id="ref31">
                        <label>31</label>
                        <mixed-citation publication-type="journal">31.	Arslan, R.S., 2021. Identify type of Android malware with Machine Learning Based Ensemble model. 2021 5th International Symposium on Multidisciplinary Studies and Innovative Technologies (ISMSIT), Ankara, Turkey, 1-5.</mixed-citation>
                    </ref>
                            </ref-list>
                    </back>
    </article>
