<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.4 20241031//EN"
        "https://jats.nlm.nih.gov/publishing/1.4/JATS-journalpublishing1-4.dtd">
<article  article-type="research-article"        dtd-version="1.4">
            <front>

                <journal-meta>
                                    <journal-id></journal-id>
            <journal-title-group>
                                                                                    <journal-title>Bilişim Teknolojileri Dergisi</journal-title>
            </journal-title-group>
                            <issn pub-type="ppub">1307-9697</issn>
                                        <issn pub-type="epub">2147-0715</issn>
                                                                                            <publisher>
                    <publisher-name>Gazi Üniversitesi</publisher-name>
                </publisher>
                    </journal-meta>
                <article-meta>
                                        <article-id pub-id-type="doi">10.17671/gazibtd.999960</article-id>
                                                                <article-categories>
                                            <subj-group  xml:lang="en">
                                                            <subject>Computer Software</subject>
                                                    </subj-group>
                                            <subj-group  xml:lang="tr">
                                                            <subject>Bilgisayar Yazılımı</subject>
                                                    </subj-group>
                                    </article-categories>
                                                                                                                                                        <title-group>
                                                                                                                        <article-title>Naive Bayes Sınıflandırıcısı Kullanılarak YouTube Verileri Üzerinden Çok Dilli Duygu Analizi</article-title>
                                                                                                                                                                                                <trans-title-group xml:lang="en">
                                    <trans-title>Multilingual Sentiment Analysis on YouTube Data Using Naive Bayes Classifier</trans-title>
                                </trans-title-group>
                                                                                                    </title-group>
            
                                                    <contrib-group content-type="authors">
                                                                        <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0003-2695-5078</contrib-id>
                                                                <name>
                                    <surname>Şahinaslan</surname>
                                    <given-names>Önder</given-names>
                                </name>
                                                                    <aff>MALTEPE UNIVERSITY</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0002-9440-414X</contrib-id>
                                                                <name>
                                    <surname>Dalyan</surname>
                                    <given-names>Hüseyin</given-names>
                                </name>
                                                                    <aff>MALTEPE ÜNİVERSİTESİ, MÜHENDİSLİK FAKÜLTESİ</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0001-8519-7612</contrib-id>
                                                                <name>
                                    <surname>Şahinaslan</surname>
                                    <given-names>Ender</given-names>
                                </name>
                                                                    <aff>EA SAĞLIK, EĞİTİM VE BİLİŞİM LTD. ŞTİ.</aff>
                                                            </contrib>
                                                                                </contrib-group>
                        
                                        <pub-date pub-type="pub" iso-8601-date="20220430">
                    <day>04</day>
                    <month>30</month>
                    <year>2022</year>
                </pub-date>
                                        <volume>15</volume>
                                        <issue>2</issue>
                                        <fpage>221</fpage>
                                        <lpage>229</lpage>
                        
                        <history>
                                    <date date-type="received" iso-8601-date="20211010">
                        <day>10</day>
                        <month>10</month>
                        <year>2021</year>
                    </date>
                                                    <date date-type="accepted" iso-8601-date="20220414">
                        <day>04</day>
                        <month>14</month>
                        <year>2022</year>
                    </date>
                            </history>
                                        <permissions>
                    <copyright-statement>Copyright © 2008, Bilişim Teknolojileri Dergisi</copyright-statement>
                    <copyright-year>2008</copyright-year>
                    <copyright-holder>Bilişim Teknolojileri Dergisi</copyright-holder>
                </permissions>
            
                                                                                                <abstract><p>Bu çalışma, Naive Bayes sınıflandırma algoritması kullanılarak sosyal medya verileri üzerinden dünya dillerinde yapılan yorum ve paylaşımların anlaşılmasına katkıda bulunmayı amaçlamaktadır. Duygu analizi veya fikir madenciliği, doğal dil işleme konularının bir alt bölümünde yer alır ve sosyal medya üzerinde yer alan verilerin anlamlandırabilmesi sağlanır. Yapay zekâ ve makine öğrenmesi gibi konularla birlikte günümüzde son derece popüler bir alandır. Küresel bir köye dönüşen dünyada, insanlar sosyal medya araçları üzerinden görüş, düşünce ve o konu hakkında memnuniyet durumları gibi pek çok veriyi paylaşmaktadır. Anlamlandırılmayı bekleyen bu veriler üzerinden insanların duygu ve düşünceleri ortaya çıkartabilmek mümkündür. Son dönemlerde Türkçe dilinde bir takım duygu analizi çalışmalarının yapıldığı görülmektedir. Ancak dünyadaki farklı dil ve lehçelerde yapılan yorumlar üzerinden çok dilli duygu analiz çalışması sınırlıdır. Bu çalışmada, Türkçe, İngilizce, Almanca, Fransızca, Arapça, Rusça ve Korece gibi farklı dünya dillerinden YouTube yorum verileri kullanılmıştır. PHP ile elde edilen bu ham veriler üzerinden anlamsız veriler temizlenerek belirli bir kalitede veri seti elde edilmiştir. Bu yorum verilerini İngilizce&#039;ye çevirmek için Google çeviri aracı API&#039;sı kullanılmıştır. Duygular, PHP Niiknow kütüphanesi üzerinden Naive Bayes algoritması kullanılarak pozitif, negatif ve nötr olarak sınıflandırılır. WEKA ile yapılan veri analizinde doğru sınıflandırma oranı %65,56 olarak bulunmuştur. Bu çalışma, 15.082 veri seti ve Google Çeviri aracı tarafından desteklenen 108 dil sayısı ile sınırlıdır.</p></abstract>
                                                                                                                                    <trans-abstract xml:lang="en">
                            <p>This study aims to contribute to the understanding of comments and shares made in world languages over social media data using the Naive Bayes classification algorithm. Sentiment analysis or opinion mining is a subsection of natural language processing and it is ensured that the data on social media can be interpreted. It is an extremely popular field today, along with topics such as artificial intelligence and machine learning. In the world that has turned into a global village, people share a lot of data such as opinions, thoughts and satisfaction about that subject through social media tools. It is possible to reveal people&#039;s feelings and thoughts through these data waiting to be interpreted. It is seen that some sentiment analysis studies have been carried out in Turkish language recently. However, multilingual sentiment analysis work is limited on interpretations made in different languages and dialects in the world. In this study, YouTube comment data from different world languages such as Turkish, English, German, French, Arabic, Russian and Korean have been used.  A certain quality data set has been obtained by cleaning the meaningless data over these raw data obtained with PHP. The Google translation tool API has been used to translate this comment data into English. Emotions are classified as positive, negative and neutral using the Naive Bayes algorithm via the PHP Niiknow library. In the data analysis performed with WEKA, the correct classification rate has found to be 65.56%. This study is limited to 15,082 data sets and the number of 108 languages supported by the Google Translate tool.</p></trans-abstract>
                                                            
            
                                                            <kwd-group>
                                                    <kwd>Duygu Analizi</kwd>
                                                    <kwd>  Makine Öğrenmesi</kwd>
                                                    <kwd>  Naive Bayes</kwd>
                                                    <kwd>  WEKA</kwd>
                                                    <kwd>  Youtube</kwd>
                                            </kwd-group>
                                                        
                                                                            <kwd-group xml:lang="en">
                                                    <kwd>Sentiment Analysis</kwd>
                                                    <kwd>  Machine Learning</kwd>
                                                    <kwd>  Naive Bayes</kwd>
                                                    <kwd>  WEKA</kwd>
                                                    <kwd>  Youtube</kwd>
                                            </kwd-group>
                                                                                                            </article-meta>
    </front>
    <back>
                            <ref-list>
                                    <ref id="ref1">
                        <label>1</label>
                        <mixed-citation publication-type="journal">O. Sahinaslan ve E. Sahinaslan, &quot;Cross-object information security: A study on new generation encryption&quot;, AIP Conference Proceedings, 2086, 030034, 2019, doi:10.1063/1.5095119.</mixed-citation>
                    </ref>
                                    <ref id="ref2">
                        <label>2</label>
                        <mixed-citation publication-type="journal">O. Sahinaslan, E. Sahinaslan ve E. Gunes, &quot;Review of the contributions of contactless payment technologies in the COVID-19 pandemic process&quot;,  AIP Conference Proceedings, 2334,  070002, 2021, doi:10.1063/5.0042225.</mixed-citation>
                    </ref>
                                    <ref id="ref3">
                        <label>3</label>
                        <mixed-citation publication-type="journal">E. Sahinaslan, &quot;On the internet of things: Security, threat and control&quot;, AIP Conference Proceedings, 2086, 030035, 2019.</mixed-citation>
                    </ref>
                                    <ref id="ref4">
                        <label>4</label>
                        <mixed-citation publication-type="journal">N. Tuna , A. Sebatlı Sağlam ve F. Çavdur , &quot;Covid-19 Salgını ile İlgili Paylaşımlar Üzerinde Veri Analizi&quot;, Bilişim Teknolojileri Dergisi, 15(1), 13-23, 2022, doi:10.17671/gazibtd.928990.</mixed-citation>
                    </ref>
                                    <ref id="ref5">
                        <label>5</label>
                        <mixed-citation publication-type="journal">İnternet: Most popular social networks worldwide as of July 2021, ranked by number of active users, https://www.statista.com/statistics/272014/global-social-networks-ranked-by-number-of-users/, 12.08.2021.</mixed-citation>
                    </ref>
                                    <ref id="ref6">
                        <label>6</label>
                        <mixed-citation publication-type="journal">İ. Erkan, &quot;Youtube Kullanma Amacının Youtube’da Yapılan Marka İşbirliklerine Yönelik Tutuma Etkisi&quot;, Cumhuriyet Üniversitesi İktisadi ve İdari Bilimler Dergisi, 128-145, 2020.</mixed-citation>
                    </ref>
                                    <ref id="ref7">
                        <label>7</label>
                        <mixed-citation publication-type="journal">W. Medhat, A. Hassan ve . H. Korashy, &quot;Sentiment Analysis Algorithms And Applications:A Survey&quot;, Ain Shams Engineering Journal, 1093-1113, 2014.</mixed-citation>
                    </ref>
                                    <ref id="ref8">
                        <label>8</label>
                        <mixed-citation publication-type="journal">İnternet: Makine Öğrenmesi Nedir, https://www.ibm.com/tr-tr/cloud/learn/machine-learning., IBM,20.08.2021.</mixed-citation>
                    </ref>
                                    <ref id="ref9">
                        <label>9</label>
                        <mixed-citation publication-type="journal">D. Jurafsky,  J. H. Martin, &quot;Naive Bayes and Sentiment Classification&quot;, Speech and Language Processing, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref10">
                        <label>10</label>
                        <mixed-citation publication-type="journal">A. Severyn, A. Moschitti, O. Uryupina, B. Plank ve K. Filippova, &quot;Multi-lingual Opinion Mining on YouTube&quot;, Information Processing and Management, 46-60, 2016.</mixed-citation>
                    </ref>
                                    <ref id="ref11">
                        <label>11</label>
                        <mixed-citation publication-type="journal">K. Arun ve A. Srinagesh, &quot;Multi-Lingual Twitter Sentiment Analysis Using Machine Learning&quot;, International Journal of Electrical and Computer Engineering, 5992-6000, 2020.</mixed-citation>
                    </ref>
                                    <ref id="ref12">
                        <label>12</label>
                        <mixed-citation publication-type="journal">M. M. Agüero-Torales, J. I. Abreu Salas ve A. G. López-Herrera, &quot;Deep Learning And Multilingual Sentiment Analysis On Social Media&quot;, Applied Soft Computing, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref13">
                        <label>13</label>
                        <mixed-citation publication-type="journal">A. Hogenboom, B. Heerschop, F. Frasincar, U. Kaymak ve F. De Jong, &quot;Multi-Lingual Support For Lexicon-Based Sentiment Analysis Guided&quot;, Decision Support Systems, 43-53, 2014.</mixed-citation>
                    </ref>
                                    <ref id="ref14">
                        <label>14</label>
                        <mixed-citation publication-type="journal">T. Ma Ma, K. Yamamori, A. Thida, &quot;A Comparative Approach to Naive Bayes Classifier and Support Vector Machine for Email Spam Classification&quot;, 2020 IEEE 9th Global Conference on Consumer Electronics (GCCE), 324-326, 2020.</mixed-citation>
                    </ref>
                                    <ref id="ref15">
                        <label>15</label>
                        <mixed-citation publication-type="journal">K. Asad Ullah Rafiq, K. Madiha ve M. B. Khan, &quot;Naïve Multi-label Classification Of Youtube Comments Using&quot;, Procedia Computer Science, 2016.</mixed-citation>
                    </ref>
                                    <ref id="ref16">
                        <label>16</label>
                        <mixed-citation publication-type="journal">C. R. Stephens, H. F. Huerta ve A. R. Linares, &quot;Why The Naive Bayes Approximation is Not As Naive&quot;, 2015 6th International Conference on Information, Intelligence, Systems and Applications (IISA), 2015.</mixed-citation>
                    </ref>
                                    <ref id="ref17">
                        <label>17</label>
                        <mixed-citation publication-type="journal">I. Blekanov, M. Kukarkin, A. Maksimov, S. Bodrunova, &quot;Sentiment Analysis for Ad Hoc Discussions Using Multilingual Knowledge-Based Approach&quot;, Proceedings of the 3rd International Conference on Applications in Information Technology, 2018.</mixed-citation>
                    </ref>
                                    <ref id="ref18">
                        <label>18</label>
                        <mixed-citation publication-type="journal">M. C. Yılmaz ve Z. Orman, &quot;LSTM Derin Öğrenme Yaklaşımı ile Covid-19 Pandemi Sürecinde Twitter Verilerinden Duygu Analizi&quot;, Acta Infologica, https://doi.org/10.26650/acin.947747.</mixed-citation>
                    </ref>
                                    <ref id="ref19">
                        <label>19</label>
                        <mixed-citation publication-type="journal">İ. Sel ve D. Hanbay, &quot;Ön Eğitimli Dil Modelleri Kullanarak Türkçe Tweetlerden Cinsiyet Tespiti&quot;, Fırat Üniversitesi Müh. Bil. Dergisi, 33, 2, 675-684, 20211.</mixed-citation>
                    </ref>
                                    <ref id="ref20">
                        <label>20</label>
                        <mixed-citation publication-type="journal">E. Karamehmetoğlu, S. Ersöz ve O. Karamehmetoğlu, &quot;Sosyal Ağ Tabanlı Verilerden Faydalanarak Korona Virüs Konulu Duygu Analiz Çalışması&quot;, Ergonomi, 4(1), 47 - 54, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref21">
                        <label>21</label>
                        <mixed-citation publication-type="journal">J. Samuel, G. G. M. Nawaz Ali, M. Rahman, E. Esawi ve Y. Samuel, &quot;COVID-19 Public Sentiment Insights and Machine Learning for Tweets Classification&quot;, Information, cilt 11(6), 314, 2020.</mixed-citation>
                    </ref>
                                    <ref id="ref22">
                        <label>22</label>
                        <mixed-citation publication-type="journal">İnternet: WEKA Data Mining, https://www.cs.waikato.ac.nz/~ml/WEKA, 08.09.2021.</mixed-citation>
                    </ref>
                                    <ref id="ref23">
                        <label>23</label>
                        <mixed-citation publication-type="journal">İnternet: YouTube Data API Overview, https://developers.google.com/youtube/v3/getting-started, 24.06.2021.</mixed-citation>
                    </ref>
                                    <ref id="ref24">
                        <label>24</label>
                        <mixed-citation publication-type="journal">İnternet, MySQL Database, https://www.mysql.com/, 24.09.2021.</mixed-citation>
                    </ref>
                                    <ref id="ref25">
                        <label>25</label>
                        <mixed-citation publication-type="journal">İnternet: Microsoft Veri Platformu,  https://www.microsoft.com/tr-tr/sql-server/, MsSQL, 24.09.2021</mixed-citation>
                    </ref>
                                    <ref id="ref26">
                        <label>26</label>
                        <mixed-citation publication-type="journal">İnternet: Translation APIs &amp; Reference,  https://cloud.google.com/translate/docs/apis, 18.06.2021.</mixed-citation>
                    </ref>
                                    <ref id="ref27">
                        <label>27</label>
                        <mixed-citation publication-type="journal">Internet: Niiknow-Naive Bayes, https://github.com/niiknow/bayes/blob/e754145d52900fdf4c1e620cc561132954721cf9/src/Bayes.php, 19.06.2021.</mixed-citation>
                    </ref>
                                    <ref id="ref28">
                        <label>28</label>
                        <mixed-citation publication-type="journal">S. Alqaraleh , &quot;Efficient Turkish Text Classification Approach for Crisis Management Systems&quot;, Gazi University Journal of Science, 34(3), 718-731, 2021, doi:10.35378/gujs.715296..</mixed-citation>
                    </ref>
                                    <ref id="ref29">
                        <label>29</label>
                        <mixed-citation publication-type="journal">Ö. Tonkal, H. Polat, “Traffic Classification and Comparative Analysis with Machine Learning Algorithms in Software Defined Networks”, Gazi University Journal of Science Part C: Design and Technology , 9 (1) , 71-83 . doi: 10.29109/gujsc.869418.</mixed-citation>
                    </ref>
                                    <ref id="ref30">
                        <label>30</label>
                        <mixed-citation publication-type="journal">S. A. Arpacı ve O. Kalıpsız, &quot;A Comparison of Different Naive Bayes Technıques for Software Defect Classaification&quot;, Omer Halisdemir University Journal of Engineering Sciences, c.7(1), 1-13, 2018. doi: 10.28948/ngumuh.383709.</mixed-citation>
                    </ref>
                                    <ref id="ref31">
                        <label>31</label>
                        <mixed-citation publication-type="journal">H. Deng, Y. Sun, Y. Chang ve J. Han, 2014, Probabilistic models for classification. in CC Aggarwal (ed.), Data Classification: Algorithms and Applications. CRC Press, 65-86.2014, doi:10.1201/b17320.</mixed-citation>
                    </ref>
                                    <ref id="ref32">
                        <label>32</label>
                        <mixed-citation publication-type="journal">Frank, E., Bouckaert, R. R., “Naive bayes for text classification with unbalanced classes”, In European Conference on Principles of Data Mining and Knowledge Discovery, Springer, Berlin, Heidelberg, 503-510, (2006).</mixed-citation>
                    </ref>
                                    <ref id="ref33">
                        <label>33</label>
                        <mixed-citation publication-type="journal">E. Çelik, D. Dal ve T. Aydin , &quot;Duygu Analizi İçin Veri Madenciliği Sınıflandırma Algoritmalarının Karşılaştırılması&quot;, Avrupa Bilim ve Teknoloji Dergisi, 27, 880-889, 2021, doi:10.31590/ejosat.905259.</mixed-citation>
                    </ref>
                            </ref-list>
                    </back>
    </article>
