<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.4 20241031//EN"
        "https://jats.nlm.nih.gov/publishing/1.4/JATS-journalpublishing1-4.dtd">
<article  article-type="research-article"        dtd-version="1.4">
            <front>

                <journal-meta>
                                    <journal-id></journal-id>
            <journal-title-group>
                                                                                    <journal-title>Balkan Journal of Electrical and Computer Engineering</journal-title>
            </journal-title-group>
                            <issn pub-type="ppub">2147-284X</issn>
                                        <issn pub-type="epub">2147-284X</issn>
                                                                                            <publisher>
                    <publisher-name>MUSA YILMAZ</publisher-name>
                </publisher>
                    </journal-meta>
                <article-meta>
                                        <article-id pub-id-type="doi">10.17694/bajece.1366812</article-id>
                                                                <article-categories>
                                            <subj-group  xml:lang="en">
                                                            <subject>Computer Software</subject>
                                                    </subj-group>
                                            <subj-group  xml:lang="tr">
                                                            <subject>Bilgisayar Yazılımı</subject>
                                                    </subj-group>
                                    </article-categories>
                                                                                                                                                        <title-group>
                                                                                                                                                            <article-title>Document Classification with Contextually Enriched Word Embeddings</article-title>
                                                                                                    </title-group>
            
                                                    <contrib-group content-type="authors">
                                                                        <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0003-0879-1989</contrib-id>
                                                                <name>
                                    <surname>Mahmood</surname>
                                    <given-names>Raad Saadi</given-names>
                                </name>
                                                                    <aff>CANKIRI KARATEKIN UNIVERSITY</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0003-2897-3894</contrib-id>
                                                                <name>
                                    <surname>Bakal</surname>
                                    <given-names>Mehmet Gökhan</given-names>
                                </name>
                                                                    <aff>ABDULLAH GUL UNIVERSITY</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">
                                        https://orcid.org/0000-0002-6425-104X</contrib-id>
                                                                <name>
                                    <surname>Akbaş</surname>
                                    <given-names>Ayhan</given-names>
                                </name>
                                                                    <aff>University of Surrey</aff>
                                                            </contrib>
                                                                                </contrib-group>
                        
                                        <pub-date pub-type="pub" iso-8601-date="20240301">
                    <day>03</day>
                    <month>01</month>
                    <year>2024</year>
                </pub-date>
                                        <volume>12</volume>
                                        <issue>1</issue>
                                        <fpage>90</fpage>
                                        <lpage>97</lpage>
                        
                        <history>
                                    <date date-type="received" iso-8601-date="20230926">
                        <day>09</day>
                        <month>26</month>
                        <year>2023</year>
                    </date>
                                                    <date date-type="accepted" iso-8601-date="20231028">
                        <day>10</day>
                        <month>28</month>
                        <year>2023</year>
                    </date>
                            </history>
                                        <permissions>
                    <copyright-statement>Copyright © 2013, Balkan Journal of Electrical and Computer Engineering</copyright-statement>
                    <copyright-year>2013</copyright-year>
                    <copyright-holder>Balkan Journal of Electrical and Computer Engineering</copyright-holder>
                </permissions>
            
                                                                                                                        <abstract><p>The text classification task has a wide range of application domains for distinct purposes, such as the classification of articles, social media posts, and sentiments. As a natural language processing application,  machine learning and deep learning techniques are intensively utilized in solving such challenges. One common approach is employing the discriminative word features comprising Bag-of-Words and n-grams to conduct text classification experiments. The other powerful approach is exploiting neural network-based (specifically deep learning models) through either sentence, word, or character levels. In this study, we proposed a novel approach to classify documents with contextually enriched word embeddings powered by the neighbor words accessible through the trigram word series. In the experiments, a well-known web of science dataset is exploited to demonstrate the novelty of the models. Consequently, we built various models constructed with and without the proposed approach to monitor the models&#039; performances. The experimental models showed that the proposed neighborhood-based word embedding enrichment has decent potential to use in further studies.</p></abstract>
                                                            
            
                                                                                        <kwd-group>
                                                    <kwd>Text classification</kwd>
                                                    <kwd>  Deep Learning</kwd>
                                                    <kwd>  LSTM</kwd>
                                                    <kwd>  Word2Vec</kwd>
                                                    <kwd>  N-grams</kwd>
                                            </kwd-group>
                            
                                                                                                                                                <funding-group specific-use="FundRef">
                    <award-group>
                                                    <funding-source>
                                <named-content content-type="funder_name">The authors received no financial support for the research, authorship, and/or publication of this article.</named-content>
                            </funding-source>
                                                                    </award-group>
                </funding-group>
                                </article-meta>
    </front>
    <back>
                            <ref-list>
                                    <ref id="ref1">
                        <label>1</label>
                        <mixed-citation publication-type="journal">[1] A. J. Trappey, F.-C. Hsu, C. V. Trappey, and C.-I. Lin, “Development
of a patent document classification and search platform using a backpropagation
network,” Expert Systems with Applications, vol. 31, no. 4,
pp. 755–765, 2006.</mixed-citation>
                    </ref>
                                    <ref id="ref2">
                        <label>2</label>
                        <mixed-citation publication-type="journal">[2] G. Aghila et al., “A survey of nan” ive bayes machine learning approach
in text document classification,” arXiv preprint arXiv:1003.1795, 2010.</mixed-citation>
                    </ref>
                                    <ref id="ref3">
                        <label>3</label>
                        <mixed-citation publication-type="journal">[3] A. Joulin, E. Grave, P. Bojanowski, and T. Mikolov, “Bag of tricks for
efficient text classification,” arXiv preprint arXiv:1607.01759, 2016.</mixed-citation>
                    </ref>
                                    <ref id="ref4">
                        <label>4</label>
                        <mixed-citation publication-type="journal">[4] Q. Chen and M. Sokolova, “Specialists, scientists, and sentiments:
Word2vec and doc2vec in analysis of scientific and medical texts,” SN
Computer Science, vol. 2, pp. 1–11, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref5">
                        <label>5</label>
                        <mixed-citation publication-type="journal">[5] G. Bakal and O. Abar, “On comparative classification of relevant covid-
19 tweets,” in 2021 6th International Conference on Computer Science
and Engineering (UBMK). IEEE, 2021, pp. 287–291.</mixed-citation>
                    </ref>
                                    <ref id="ref6">
                        <label>6</label>
                        <mixed-citation publication-type="journal">[6] B. J. Marafino, J. M. Davies, N. S. Bardach, M. L. Dean, and R. A.
Dudley, “N-gram support vector machines for scalable procedure and
diagnosis classification, with applications to clinical free text data from
the intensive care unit,” Journal of the American Medical Informatics
Association, vol. 21, no. 5, pp. 871–875, 2014.</mixed-citation>
                    </ref>
                                    <ref id="ref7">
                        <label>7</label>
                        <mixed-citation publication-type="journal">[7] A. Graves, S. Fern´andez, and J. Schmidhuber, “Bidirectional lstm networks
for improved phoneme classification and recognition,” in Artificial
Neural Networks: Formal Models and Their Applications–ICANN 2005:
15th International Conference, Warsaw, Poland, September 11-15, 2005.
Proceedings, Part II 15. Springer, 2005, pp. 799–804.</mixed-citation>
                    </ref>
                                    <ref id="ref8">
                        <label>8</label>
                        <mixed-citation publication-type="journal">[8] A. Graves and J. Schmidhuber, “Framewise phoneme classification
with bidirectional lstm and other neural network architectures,” Neural
networks, vol. 18, no. 5-6, pp. 602–610, 2005.</mixed-citation>
                    </ref>
                                    <ref id="ref9">
                        <label>9</label>
                        <mixed-citation publication-type="journal">[9] L. Xiao, G. Wang, and Y. Zuo, “Research on patent text classification
based on word2vec and lstm,” in 2018 11th International Symposium on
Computational Intelligence and Design (ISCID), vol. 1. IEEE, 2018,
pp. 71–74.</mixed-citation>
                    </ref>
                                    <ref id="ref10">
                        <label>10</label>
                        <mixed-citation publication-type="journal">[10] C. C. Aggarwal and C. C. Aggarwal, “Machine learning for text: An
introduction,” Machine learning for text, pp. 1–16, 2018.</mixed-citation>
                    </ref>
                                    <ref id="ref11">
                        <label>11</label>
                        <mixed-citation publication-type="journal">[11] P. Milhorat, S. Schl¨ogl, G. Chollet, J. Boudy, A. Esposito, and G. Pelosi,
“Building the next generation of personal digital assistants,” in 2014 1st
international conference on advanced technologies for signal and image
processing (atsip). IEEE, 2014, pp. 458–463.</mixed-citation>
                    </ref>
                                    <ref id="ref12">
                        <label>12</label>
                        <mixed-citation publication-type="journal">[12] H.-H. Chiang, “A comparison between teacher-led and online text-tospeech
dictation for students’ vocabulary performance.” English Language
Teaching, vol. 12, no. 3, pp. 77–93, 2019.</mixed-citation>
                    </ref>
                                    <ref id="ref13">
                        <label>13</label>
                        <mixed-citation publication-type="journal">[13] E. Adamopoulou and L. Moussiades, “Chatbots: History, technology,
and applications,” Machine Learning with Applications, vol. 2, p.
100006, 2020.</mixed-citation>
                    </ref>
                                    <ref id="ref14">
                        <label>14</label>
                        <mixed-citation publication-type="journal">[14] D. Martinez, O. Plchot, L. Burget, O. Glembek, and P. Matˇejka,
“Language recognition in ivectors space,” in Twelfth annual conference
of the international speech communication association, 2011.</mixed-citation>
                    </ref>
                                    <ref id="ref15">
                        <label>15</label>
                        <mixed-citation publication-type="journal">[15] T. Pedersen and R. Bruce, “Distinguishing word senses in untagged
text,” arXiv preprint cmp-lg/9706008, 1997.</mixed-citation>
                    </ref>
                                    <ref id="ref16">
                        <label>16</label>
                        <mixed-citation publication-type="journal">[16] M. Bevilacqua, T. Pasini, A. Raganato, and R. Navigli, “Recent trends
in word sense disambiguation: A survey,” in Proceedings of the Thirtieth
International Joint Conference on Artificial Intelligence, IJCAI-21.
International Joint Conference on Artificial Intelligence, Inc, 2021.</mixed-citation>
                    </ref>
                                    <ref id="ref17">
                        <label>17</label>
                        <mixed-citation publication-type="journal">[17] D. Nadeau and S. Sekine, “A survey of named entity recognition and
classification,” Lingvisticae Investigationes, vol. 30, no. 1, pp. 3–26,
2007.</mixed-citation>
                    </ref>
                                    <ref id="ref18">
                        <label>18</label>
                        <mixed-citation publication-type="journal">[18] W. Medhat, A. Hassan, and H. Korashy, “Sentiment analysis algorithms
and applications: A survey,” Ain Shams engineering journal, vol. 5,
no. 4, pp. 1093–1113, 2014.</mixed-citation>
                    </ref>
                                    <ref id="ref19">
                        <label>19</label>
                        <mixed-citation publication-type="journal">[19] E. Reiter and R. Dale, “Building applied natural language generation
systems,” Natural Language Engineering, vol. 3, no. 1, pp. 57–87, 1997.</mixed-citation>
                    </ref>
                                    <ref id="ref20">
                        <label>20</label>
                        <mixed-citation publication-type="journal">[20] B. Kolukisa, B. K. Dedeturk, B. A. Dedeturk, A. Gulsen, and G. Bakal,
“A comparative analysis on medical article classification using text
mining &amp; machine learning algorithms,” in 2021 6th International
Conference on Computer Science and Engineering (UBMK). IEEE,
2021, pp. 360–365.</mixed-citation>
                    </ref>
                                    <ref id="ref21">
                        <label>21</label>
                        <mixed-citation publication-type="journal">[21] A. Adhikari, A. Ram, R. Tang, and J. Lin, “Rethinking complex neural
network architectures for document classification,” in Proceedings of the
2019 Conference of the North American Chapter of the Association for
Computational Linguistics: Human Language Technologies, Volume 1
(Long and Short Papers), 2019, pp. 4046–4051.</mixed-citation>
                    </ref>
                            </ref-list>
                    </back>
    </article>
