<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.4 20241031//EN"
        "https://jats.nlm.nih.gov/publishing/1.4/JATS-journalpublishing1-4.dtd">
<article  article-type="research-article"        dtd-version="1.4">
            <front>

                <journal-meta>
                                    <journal-id></journal-id>
            <journal-title-group>
                                                                                    <journal-title>Balkan Journal of Electrical and Computer Engineering</journal-title>
            </journal-title-group>
                            <issn pub-type="ppub">2147-284X</issn>
                                        <issn pub-type="epub">2147-284X</issn>
                                                                                            <publisher>
                    <publisher-name>MUSA YILMAZ</publisher-name>
                </publisher>
                    </journal-meta>
                <article-meta>
                                        <article-id pub-id-type="doi">10.17694/bajece.1712376</article-id>
                                                                <article-categories>
                                            <subj-group  xml:lang="en">
                                                            <subject>Software Architecture</subject>
                                                            <subject>Software Testing, Verification and Validation</subject>
                                                    </subj-group>
                                            <subj-group  xml:lang="tr">
                                                            <subject>Yazılım Mimarisi</subject>
                                                            <subject>Yazılım Testi, Doğrulama ve Validasyon</subject>
                                                    </subj-group>
                                    </article-categories>
                                                                                                                                                        <title-group>
                                                                                                                        <trans-title-group xml:lang="tr">
                                    <trans-title>Sosyal Nesnelerin İnternetinden Kaynaklanan Büyük Verilerin Doğruluğu ve Gerçekliğinin Tespiti için ML Algoritmalarıyla Veri Ön İşleme Yaklaşımı ve Bir Vaka Çalışması</trans-title>
                                </trans-title-group>
                                                                                                                                                                                                <article-title>Data Pre-processing Approach with ML Algorithms for Accuracy and Authenticity Detection of Big Data Sourced from the Social Internet of Things and a Case Study</article-title>
                                                                                                    </title-group>
            
                                                    <contrib-group content-type="authors">
                                                                        <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">https://orcid.org/0009-0009-7128-4075</contrib-id>
                                                                <name>
                                    <surname>Kızılaslan</surname>
                                    <given-names>Deniz</given-names>
                                </name>
                                                                    <aff>İSTANBUL AYDIN ÜNİVERSİTESİ</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-2710-0063</contrib-id>
                                                                <name>
                                    <surname>Kaya</surname>
                                    <given-names>Şükrü Mustafa</given-names>
                                </name>
                                                                    <aff>İSTANBUL AYDIN ÜNİVERSİTESİ</aff>
                                                            </contrib>
                                                                                </contrib-group>
                        
                                        <pub-date pub-type="pub" iso-8601-date="20260328">
                    <day>28</day>
                    <month>03</month>
                    <year>2026</year>
                </pub-date>
                                        <volume>14</volume>
                                                    <fpage>63</fpage>
                                        <lpage>73</lpage>
                        
                        <history>
                                    <date date-type="received" iso-8601-date="20250603">
                        <day>03</day>
                        <month>06</month>
                        <year>2025</year>
                    </date>
                                                    <date date-type="accepted" iso-8601-date="20251203">
                        <day>03</day>
                        <month>12</month>
                        <year>2025</year>
                    </date>
                            </history>
                                        <permissions>
                    <copyright-statement>Copyright © 2013, Balkan Journal of Electrical and Computer Engineering</copyright-statement>
                    <copyright-year>2013</copyright-year>
                    <copyright-holder>Balkan Journal of Electrical and Computer Engineering</copyright-holder>
                </permissions>
            
                                                                                                <trans-abstract xml:lang="tr">
                            <p>IoT, çevremizdeki sayısız fiziksel olayı algılayan, bunları veriye dönüştüren ve bu verileri farklı ortamlara veya dijital sistemlere aktaran sensörler dünyasıdır. Nesnelerin İnterneti tabanlı teknolojilerin kullanım alanları sürekli artmakta ve IoT altyapısını destekleyecek teknolojiler geliştirilmektedir. Ancak algılama katmanında üretilen büyük miktardaki büyük verinin etkin bir şekilde yönetilebilmesi için ön işleme tabi tutulması ve büyük veri standartlarıyla uyumlu hale getirilmesi gerekmektedir. Büyük verinin etkin bir şekilde yönetilebilmesi için veri seti standartlarının iyileştirilmesi gerekmekte ve daha kaliteli bir veri seti için farklı veri işleme yöntemleri geliştirilmektedir. Bu çalışmada, mobil cihazlar kullanılarak IoT algılama katmanında üretilen verilerin doğruluğu ve güvenilirliğini belirlemek amacıyla literatür taraması yapılmıştır. Ayrıca çalışmada, mobil cihazlar ve sosyal platformlar üzerinde üretilen verilerden oluşan veri seti ML sınıflandırma algoritmaları ile incelenmiştir. Veri seti üzerinde Lojistik Regresyon (LR), Naive Bayes (NB), Rastgele Orman (RF), K-en yakın komşu (kNN), Destek Vektör Makineleri (SVM) sınıflandırma algoritmaları ile doğruluk ve güvenilirlik açısından karşılaştırmalar ve değerlendirmeler yapılmıştır. ML sınıflandırma algoritmaları üzerinde yapılan çalışmalar sonucunda, Rastgele Orman ve Destek Vektör Makineleri algoritmalarının yakın oranlarda doğruluk sağladığı görülmektedir. Bu çalışma, IoT algılama katmanında mobil cihazlar kullanılarak elde edilen verilerin doğruluğunu ve güvenilirliğini artırmak için etkili algoritmaların belirlenmesine katkıda bulunmaktadır.</p></trans-abstract>
                                                                                                                                    <abstract><p>The Social Internet of Things (SIoT), which integrates sensor data with social media interactions, produces massive volumes of unstructured data that require accurate and reliable preprocessing for meaningful analysis. This study investigates the effectiveness of various machine learning (ML) classification algorithms in detecting the accuracy and authenticity of SIoT-derived data. A dataset comprising 17,500 user records collected from mobile devices and social media platforms was analyzed using five ML classifiers: Logistic Regression, Naive Bayes, K-Nearest Neighbor (K-NN), Random Forest, and Support Vector Machines (SVM). Through extensive hyperparameter tuning and 5-fold cross-validation, the Random Forest and SVM models exhibited the highest performance, achieving accuracy scores of 0.58 and 0.57, respectively. SVM also obtained the best AUC value of 0.64, highlighting its strength in distinguishing authentic from manipulated data. Additionally, the results emphasize the need for larger, more diverse datasets, and suggest incorporating deep learning and automated bias mitigation methods in future research.</p></abstract>
                                                            
            
                                                                                        <kwd-group>
                                                    <kwd>Internet of Things</kwd>
                                                    <kwd>Social Internet of Things</kwd>
                                                    <kwd>Big Data</kwd>
                                                    <kwd>Data Processing</kwd>
                                            </kwd-group>
                            
                                                <kwd-group xml:lang="tr">
                                                    <kwd>Nesnelerin İnterneti</kwd>
                                                    <kwd>Sosyal Nesnelerin İnterneti</kwd>
                                                    <kwd>Büyük Veri</kwd>
                                                    <kwd>Veri işleme</kwd>
                                            </kwd-group>
                                                                                                                                        </article-meta>
    </front>
    <back>
                            <ref-list>
                                    <ref id="ref1">
                        <label>1</label>
                        <mixed-citation publication-type="journal">[1]	Shahab, S., Agarwal, P., Mufti, T., &amp; Obaid, A. J. (2022). SIoT (Social Internet of Things): A Review. Evolutionary Computing and Mobile Sustainable Networks, 313–323.</mixed-citation>
                    </ref>
                                    <ref id="ref2">
                        <label>2</label>
                        <mixed-citation publication-type="journal">[2]	Dhelim, S., Ning, H., Farha, F., Chen, L., Atzori, L., &amp; Daneshmand, M. (2021). IoT-Enabled Social Relationships Meet Artificial Social Intelligence. IEEE Internet of Things Journal, 8(20), 15364–15375.</mixed-citation>
                    </ref>
                                    <ref id="ref3">
                        <label>3</label>
                        <mixed-citation publication-type="journal">[3]	Nejad, H. V., Farimani, Z. M., &amp; Tavakolifar, A. (2020). Social Internet of Things and New Generation Computing—A Survey. Toward Social Internet of Things (SIoT), 846, 129–152.</mixed-citation>
                    </ref>
                                    <ref id="ref4">
                        <label>4</label>
                        <mixed-citation publication-type="journal">[4]	Kaya, Ş. M., &amp; Kaya, E. (2022). The (Un)seen Influence of S-IoT on the Political Economic Decisions. In 6th International Congress of Social Sciences, Istanbul.</mixed-citation>
                    </ref>
                                    <ref id="ref5">
                        <label>5</label>
                        <mixed-citation publication-type="journal">[5]	Rad, M. M., Rahmani, A. M., Sahafi, A., &amp; Qader, N. N. (2020). Social Internet of Things: vision, challenges, and trends. Human-centric Computing and Information Sciences, 10.</mixed-citation>
                    </ref>
                                    <ref id="ref6">
                        <label>6</label>
                        <mixed-citation publication-type="journal">[6]	Kaur, N., &amp; Sood, S. K. (2023). Social Internet of Things (SIoT): A decade’s journey and future directions. Journal of Network and Computer Applications, 210.</mixed-citation>
                    </ref>
                                    <ref id="ref7">
                        <label>7</label>
                        <mixed-citation publication-type="journal">[7]	Dhelim, S., Ning, H., Farha, F., Chen, L., Atzori, L., &amp; Daneshmand, M. (2021). IoT-Enabled Social Relationships Meet Artificial Social Intelligence. IEEE Internet of Things Journal, 8(20), 15364–15375.</mixed-citation>
                    </ref>
                                    <ref id="ref8">
                        <label>8</label>
                        <mixed-citation publication-type="journal">[8]	İşler, B., Kaya, Ş. M., &amp; Kılıç, F. R. (2025). Fog-Enabled Machine Learning Approaches for Weather Prediction in IoT Systems: A Case Study. Sensors, 25(13), 4070.</mixed-citation>
                    </ref>
                                    <ref id="ref9">
                        <label>9</label>
                        <mixed-citation publication-type="journal">[9]	Zhang, L., et al. (2021). Integrating Social Media Data with IoT for Enhanced User Experience. IEEE Internet of Things Journal, 8(3), 1540–1552.</mixed-citation>
                    </ref>
                                    <ref id="ref10">
                        <label>10</label>
                        <mixed-citation publication-type="journal">[10]	Kim, J., et al. (2020). Understanding User Characteristics and Interactions on Social Media Platforms. Journal of Interactive Advertising, 20(3).</mixed-citation>
                    </ref>
                                    <ref id="ref11">
                        <label>11</label>
                        <mixed-citation publication-type="journal">[11]	Chen, M., et al. (2019). Trust management in social Internet of Things: A survey. IEEE Communications Surveys &amp; Tutorials, 22(2), 1197–1230.</mixed-citation>
                    </ref>
                                    <ref id="ref12">
                        <label>12</label>
                        <mixed-citation publication-type="journal">[12]	Li, J., &amp; Wang, H. (2020). A sentiment-aware framework for social IoT applications based on hybrid machine learning. Future Generation Computer Systems, 108, 512–524.</mixed-citation>
                    </ref>
                                    <ref id="ref13">
                        <label>13</label>
                        <mixed-citation publication-type="journal">[13]	Gupta, R., et al. (2022). Real-time analytics for social IoT using edge computing. IEEE Transactions on Network and Service Management, 19(1), 67–80.</mixed-citation>
                    </ref>
                                    <ref id="ref14">
                        <label>14</label>
                        <mixed-citation publication-type="journal">[14]	Zhou, J., Leung, V. C., &amp; Yang, L. T. (2021). Internet of Things security and privacy: Challenges and solutions. IEEE Internet of Things Journal, 8(12), 10231–10255.</mixed-citation>
                    </ref>
                                    <ref id="ref15">
                        <label>15</label>
                        <mixed-citation publication-type="journal">[15]	Kaya, Ş. M. (2025). Edge And Fog Computing With Artificial Intelligence Methods On Iot-Based Big Data. Artificial Intelligence: Foundations, Applications and Future Directions, 347.</mixed-citation>
                    </ref>
                                    <ref id="ref16">
                        <label>16</label>
                        <mixed-citation publication-type="journal">[16]	Johnson, E. (2019). IoT Sensors and Their Applications in Smart Systems. Sensors and Actuators B: Chemical, 185, 230–245.</mixed-citation>
                    </ref>
                                    <ref id="ref17">
                        <label>17</label>
                        <mixed-citation publication-type="journal">[17]	Hatton, M. (2013, January). The global M2M market in 2013. Machina Research White Paper.</mixed-citation>
                    </ref>
                                    <ref id="ref18">
                        <label>18</label>
                        <mixed-citation publication-type="confproc">[18]	Gahi, Y., Guennoun, M., &amp; Mouftah, H. T. (2016). Big Data Analytics: Security and Privacy Challenges. In Proceedings of the 2016 IEEE Symposium on Computers and Communication (ISCC) (pp. 952–957). Messina, Italy.</mixed-citation>
                    </ref>
                                    <ref id="ref19">
                        <label>19</label>
                        <mixed-citation publication-type="book">[19]	Zikopoulos, I., Eaton, C. P., &amp; Zikopoulos, P. (2011). Understanding Big Data: Analytics for Enterprise Class Hadoop and Streaming Data (1st ed.). McGraw-Hill Osborne Media.</mixed-citation>
                    </ref>
                                    <ref id="ref20">
                        <label>20</label>
                        <mixed-citation publication-type="book">[20]	Schneider, R. D. (2012). Hadoop for Dummies (Special ed.). John Wiley &amp; Sons.</mixed-citation>
                    </ref>
                                    <ref id="ref21">
                        <label>21</label>
                        <mixed-citation publication-type="journal">[21]	Setty, K., &amp; Bakhshi, R. (2013). What Is Big Data and What Does It Have to Do with IT Audit?. ISACA Journal, 3, 23–25.</mixed-citation>
                    </ref>
                                    <ref id="ref22">
                        <label>22</label>
                        <mixed-citation publication-type="journal">[22]	Kaya, Ş. M., Bayram, V., &amp; Özkan, M. (2025). Evaluation of the intergenerational relationship of IoT awareness in businesses. Journal of Information and Optimization Sciences, 46(5), 1753–1772.</mixed-citation>
                    </ref>
                                    <ref id="ref23">
                        <label>23</label>
                        <mixed-citation publication-type="journal">[23]	Cyganek, B., et al. (2016). A Survey of Big Data Issues in Electronic Health Record Analysis. Applied Artificial Intelligence, 30(6), 497–520.</mixed-citation>
                    </ref>
                                    <ref id="ref24">
                        <label>24</label>
                        <mixed-citation publication-type="journal">[24]	Gandomi, A., &amp; Haider, M. (2015). Beyond the hype: Big data concepts, methods, and analytics. International Journal of Information Management, 35(2), 137–144.</mixed-citation>
                    </ref>
                                    <ref id="ref25">
                        <label>25</label>
                        <mixed-citation publication-type="journal">[25]	Zhang, L., et al. (2021). Integrating Social Media Data with IoT for Enhanced User Experience. IEEE Internet of Things Journal, 8(3), 450–465.</mixed-citation>
                    </ref>
                                    <ref id="ref26">
                        <label>26</label>
                        <mixed-citation publication-type="journal">[26]	Esmaili Jobani, A., &amp; Kaya, Ş. M. (2025). Hybrid IoT and AI-based Solution for Energy Management in Data Centres under Various Climate Conditions. Anadolu Bil Meslek Yüksekokulu Dergisi, 20(72), 107–124.</mixed-citation>
                    </ref>
                                    <ref id="ref27">
                        <label>27</label>
                        <mixed-citation publication-type="journal">[27]	Chen, Y., et al. (2019). Analyzing User Behavior on Social Media Platforms: Methods and Applications. ACM Transactions on Social Computing, 4(2), 75–90.</mixed-citation>
                    </ref>
                                    <ref id="ref28">
                        <label>28</label>
                        <mixed-citation publication-type="journal">[28]	Smith, E., et al. (2018). User Characteristics and Interactions on Social Media Platforms: Insights from Data Analytics. International Journal of Information Management, 45, 210–225.</mixed-citation>
                    </ref>
                                    <ref id="ref29">
                        <label>29</label>
                        <mixed-citation publication-type="journal">[29]	Hancke, G. P., &amp; Hancke Jr., G. P. (2013). The role of advanced sensing in smart cities. Sensors, 13(1), 393–425.</mixed-citation>
                    </ref>
                                    <ref id="ref30">
                        <label>30</label>
                        <mixed-citation publication-type="journal">[30]	Talari, S., et al. (2017). A Review of Smart Cities Based on the Internet of Things Concept. Energies, 10(4), 421.</mixed-citation>
                    </ref>
                                    <ref id="ref31">
                        <label>31</label>
                        <mixed-citation publication-type="journal">[31]	Sikder, A. K., Petracca, G., Aksu, H., Jaeger, T., &amp; Uluagac, A. S. (2018). A Survey on Sensor-Based Threats to Internet-of-Things (IoT) Devices and Applications. ArXiv Preprint.</mixed-citation>
                    </ref>
                                    <ref id="ref32">
                        <label>32</label>
                        <mixed-citation publication-type="journal">[32]	Kaya, Ş. M., Erdem, A., &amp; Güneş, A. (2021). A Smart Data Pre-Processing Approach to Effective Management of Big Health Data in IoT Edge. Smart Homecare Technology and TeleHealth, 9–21.</mixed-citation>
                    </ref>
                                    <ref id="ref33">
                        <label>33</label>
                        <mixed-citation publication-type="journal">[33]	Kaya, Ş. M., İşler, B., Abu-Mahfouz, A. M., Rasheed, J., &amp; AlShammari, A. (2023). An Intelligent Anomaly Detection Approach for Accurate and Reliable Weather Forecasting at IoT Edges: A Case Study. Sensors, 23(5), 2426.</mixed-citation>
                    </ref>
                                    <ref id="ref34">
                        <label>34</label>
                        <mixed-citation publication-type="journal">[34]	Ahmed, I., Saeed, A., &amp; Malik, H. (2023). A trust-aware data filtering framework for Social Internet of Things. Computer Networks, 225, 109554.</mixed-citation>
                    </ref>
                                    <ref id="ref35">
                        <label>35</label>
                        <mixed-citation publication-type="journal">[35]	Kaya, Ş. M., Erdem, A., &amp; Güneş, A. (2022). Anomaly Detection and Performance Analysis by Using Big Data Filtering Techniques For Healthcare on IoT Edges. Sakarya University Journal of Science, 26(1), 1–13.</mixed-citation>
                    </ref>
                                    <ref id="ref36">
                        <label>36</label>
                        <mixed-citation publication-type="journal">[36]	Li, S., Raymond, K. K., Sun, Q., Buchanan, W. J., &amp; Cao, J. (2015). IoT Forensics: Amazon Echo as a Use Case. Journal of Latex Class Files, 14.</mixed-citation>
                    </ref>
                                    <ref id="ref37">
                        <label>37</label>
                        <mixed-citation publication-type="book">[37]	James, G., Witten, D., Hastie, T., &amp; Tibshirani, R. (2021). An Introduction to Statistical Learning: with Applications in R (2nd ed.). Springer.</mixed-citation>
                    </ref>
                                    <ref id="ref38">
                        <label>38</label>
                        <mixed-citation publication-type="journal">[38]	Bayram, V., &amp; Kaya, M. (2023). The Contributions of Metaverse Technology on Management Information Systems in Strategic Planning and Decision-Making Processes of Businesses. Uluslararası Yönetim Akademisi Dergisi, 6(3), 794–807.</mixed-citation>
                    </ref>
                                    <ref id="ref39">
                        <label>39</label>
                        <mixed-citation publication-type="journal">[39]	Tharwat, A. (2021). Classification assessment methods. Applied Computing and Informatics, 17(1), 168–192.</mixed-citation>
                    </ref>
                                    <ref id="ref40">
                        <label>40</label>
                        <mixed-citation publication-type="journal">[40]	Kaya, Ş. M., &amp; Bayram, V. (2025). Artificial Intelligence Awareness Scale Development Study. OPUS Journal of Society Research, 22(4), 657–672.</mixed-citation>
                    </ref>
                                    <ref id="ref41">
                        <label>41</label>
                        <mixed-citation publication-type="thesis">[41]	Cihan, P. (2018). Determination of diagnosis, prognosis and risk factors in animal diseases using by data mining methods. PhD Thesis, Yildiz Technical University, Istanbul, Turkey.</mixed-citation>
                    </ref>
                            </ref-list>
                    </back>
    </article>
