<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.4 20241031//EN"
        "https://jats.nlm.nih.gov/publishing/1.4/JATS-journalpublishing1-4.dtd">
<article  article-type="research-article"        dtd-version="1.4">
            <front>

                <journal-meta>
                                                                <journal-id>meuded</journal-id>
            <journal-title-group>
                                                                                    <journal-title>Mersin Üniversitesi Dil ve Edebiyat Dergisi</journal-title>
            </journal-title-group>
                            <issn pub-type="ppub">1304-6594</issn>
                                        <issn pub-type="epub">2149-0856</issn>
                                                                                            <publisher>
                    <publisher-name>Mersin Üniversitesi</publisher-name>
                </publisher>
                    </journal-meta>
                <article-meta>
                                        <article-id/>
                                                                <article-categories>
                                            <subj-group  xml:lang="en">
                                                            <subject>Computational Linguistics</subject>
                                                            <subject>Lexicography and Semantics</subject>
                                                    </subj-group>
                                            <subj-group  xml:lang="tr">
                                                            <subject>Hesaplamalı Dilbilim</subject>
                                                            <subject>Sözlükbilim ve Anlambilim</subject>
                                                    </subj-group>
                                    </article-categories>
                    <title-group>
                        <article-title>Machine-Readable Multilingual Dictionaries: A Semi-Automatic ISO–TEI Model</article-title>
                        <trans-title-group xml:lang="tr">
                            <trans-title>Makinece Okunabilir Çok Dilli Sözlükler: Yarı Otomatik Bir ISO–TEI Modeli</trans-title>
                        </trans-title-group>
                    </title-group>
            
                                                    <contrib-group content-type="authors">
                                                                        <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-9340-5485</contrib-id>
                                                                <name>
                                    <surname>Özcan</surname>
                                    <given-names>Emrah</given-names>
                                </name>
                                                                    <aff>YILDIZ TECHNICAL UNIVERSITY</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-8278-2805</contrib-id>
                                                                <name>
                                    <surname>Erkoç</surname>
                                    <given-names>Mehmet Fatih</given-names>
                                </name>
                                                                    <aff>YILDIZ TECHNICAL UNIVERSITY</aff>
                                                            </contrib>
                                                    <contrib contrib-type="author">
                                                                    <contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-9231-4191</contrib-id>
                                                                <name>
                                    <surname>Tokatlı</surname>
                                    <given-names>Hasan</given-names>
                                </name>
                                                                    <aff>YILDIZ TECHNICAL UNIVERSITY</aff>
                                                            </contrib>
                                                                                </contrib-group>
                        
                                        <pub-date pub-type="pub" iso-8601-date="20260227">
                    <day>27</day>
                    <month>02</month>
                    <year>2026</year>
                </pub-date>
                                        <volume>22</volume>
                                        <issue>1</issue>
                                        <fpage>1</fpage>
                                        <lpage>20</lpage>
                        
                        <history>
                                    <date date-type="received" iso-8601-date="20260203">
                        <day>03</day>
                        <month>02</month>
                        <year>2026</year>
                    </date>
                                                    <date date-type="accepted" iso-8601-date="20260223">
                        <day>23</day>
                        <month>02</month>
                        <year>2026</year>
                    </date>
                            </history>
                                        <permissions>
                    <copyright-statement>Copyright © 2004, Mersin Üniversitesi Dil ve Edebiyat Dergisi</copyright-statement>
                    <copyright-year>2004</copyright-year>
                    <copyright-holder>Mersin Üniversitesi Dil ve Edebiyat Dergisi</copyright-holder>
                </permissions>
            
                                                                                                <trans-abstract xml:lang="tr">
                            <p>Sözlükbilimin dijital dönüşümü, alanı statik ve insan tarafından okunabilir ürünler üretmekten, dinamik ve makine tarafından okunabilir veritabanları geliştirmeye doğru köklü biçimde dönüştürmüştür. Bu makale, özellikle ara (pivot) diller aracılığıyla yarı otomatik türetime odaklanarak, makine tarafından okunabilir çok dilli sözlüklerin (MRD) geliştirilmesine ilişkin kuramsal ve yöntemsel temelleri incelemektedir. Yürüttüğümüz bir araştırma projesinin deneysel bulgularına dayanarak, karmaşık sözlüksel verilerin modellenmesinde Text Encoding Initiative (TEI) yönergeleri ile ISO 24613 (Lexical Markup Framework) standardının kullanım etkinliğini analiz ediyoruz. Veritabanı modellerine yönelik tarihsel eleştirileri, sözlüksel birlikte çalışabilirliğe ilişkin güncel standartlarla sentezleyerek; çok dilli sözlüklerin tamamen otomatik olarak türetilmesinin hâlen anlamsal belirsizliklerle sorunlu olduğunu, buna karşılık sağlam bir veri modellemesine ve insan doğrulamasına dayanan yarı otomatik bir iş akışının, birçok dil çifti için geçerli olan kaynak kıtlığını aşmada ölçeklenebilir bir çözüm sunduğunu savunuyoruz.</p></trans-abstract>
                                                                                                                                    <abstract><p>The digital transformation of lexicography has fundamentally shifted the discipline from the production of static, human-readable artefacts to the creation of dynamic, machine-readable databases. This article examines the theoretical and methodological foundations of developing machine-readable multilingual dictionaries (MRDs), with particular emphasis on semi-automatic derivation via pivot languages. Drawing upon the experimental results of a research project we conducted, we analyse the efficacy of utilising the Text Encoding Initiative (TEI) guidelines and ISO 24613 (Lexical Markup Framework) to model complex lexical data. By synthesising historical critiques of database models with contemporary standards for lexical interoperability, we argue that, while fully automatic induction of multilingual lexicons remains fraught with semantic ambiguity, a semi-automatic workflow, grounded in rigorous data modelling and human verification, offers a scalable solution to overcome the resource scarcity inherent in many language pairs.</p></abstract>
                                                            
            
                                                                                        <kwd-group>
                                                    <kwd>Computational lexicography</kwd>
                                                    <kwd>Machine-readable dictionaries (MRD)</kwd>
                                                    <kwd>Text Encoding Initiative (TEI)</kwd>
                                                    <kwd>ISO 24613 (LMF)</kwd>
                                                    <kwd>Multilingual dictionaries</kwd>
                                                    <kwd>Pivot language</kwd>
                                                    <kwd>Semi-automatic modelling</kwd>
                                            </kwd-group>
                            
                                                <kwd-group xml:lang="tr">
                                                    <kwd>Hesaplamalı sözlükbilim</kwd>
                                                    <kwd>Makinece okunabilir sözlükler (MRD)</kwd>
                                                    <kwd>Metin kodlama girişimi (TEI)</kwd>
                                                    <kwd>ISO 24613 (LMF)</kwd>
                                                    <kwd>Çokdilli sözlükler</kwd>
                                                    <kwd>Ara (pivot) dil</kwd>
                                                    <kwd>Yarı otomatik modelleme</kwd>
                                            </kwd-group>
                                                                                                                                    <funding-group specific-use="FundRef">
                    <award-group>
                                                    <funding-source>
                                <named-content content-type="funder_name">Yildiz Technical University Scientific Research Projects Coordination Unit</named-content>
                            </funding-source>
                                                                            <award-id>SBA-2021-4256</award-id>
                                            </award-group>
                </funding-group>
                                </article-meta>
    </front>
    <back>
                            <ref-list>
                                    <ref id="ref1">
                        <label>1</label>
                        <mixed-citation publication-type="journal">Arhar Holdt, S., &amp; Kosem, I. (2025). Using large language models to generate distractors for language games. In Proceedings of the eLex 2025 Conference (pp. 620–635). Bled, Slovenia.</mixed-citation>
                    </ref>
                                    <ref id="ref2">
                        <label>2</label>
                        <mixed-citation publication-type="journal">Aydın, C. R., Erkan, A., Güngör, T., &amp; Takçı, H. (2014). Sözlük kullanarak Türkçe için kavram madenciliği metotları geliştirme: Bir uygulama. In Proceedings of XVI. Academic Informatics Conference (pp. 801–810). Mersin, Türkiye.</mixed-citation>
                    </ref>
                                    <ref id="ref3">
                        <label>3</label>
                        <mixed-citation publication-type="journal">Boguraev, B., Briscoe, T., Carroll, J., &amp; Copestake, A. (1990). Database models for computational lexicography. In Proceedings of the 4th International Congress on Lexicography (pp. 59–78). Malaga, Spain.</mixed-citation>
                    </ref>
                                    <ref id="ref4">
                        <label>4</label>
                        <mixed-citation publication-type="journal">Chiarcos, C., Ionov, M., Apostol, E.-S., Gkirtzou, K., Kabashi, B., Khan, A. F., &amp; Truică, C.-O. (2024). Multiword expressions, collocations and the OntoLex vocabulary. In Multiword expressions in lexical resources, 187-227. Language Science Press. https://doi.org/10.5281/zenodo.10998641</mixed-citation>
                    </ref>
                                    <ref id="ref5">
                        <label>5</label>
                        <mixed-citation publication-type="journal">De Schryver, G.-M. (2010). State-of-the-art software to support intelligent lexicography. In R. Zhu (Ed.), 中華字典研究-第2輯(上下)-2009《康熙字典》曁詞典学国際学術研討会論文集 2, 584–599. 中国社会科学 = China Sociale Wetenschappen Publishing House.</mixed-citation>
                    </ref>
                                    <ref id="ref6">
                        <label>6</label>
                        <mixed-citation publication-type="journal">De Schryver, G.-M. (2023). Generative AI and Lexicography: The Current State of the Art Using ChatGPT. International Journal of Lexicography, 36(4), 355-387.</mixed-citation>
                    </ref>
                                    <ref id="ref7">
                        <label>7</label>
                        <mixed-citation publication-type="journal">Francopoulo, G., &amp; Huang, C.-R. (2014). Lexical markup framework: An ISO standard for electronic lexicons and its implications for Asian languages. Lexicography ASIALEX, 1, 37-51. https://doi.org/10.1007/s40607-014-0006-z</mixed-citation>
                    </ref>
                                    <ref id="ref8">
                        <label>8</label>
                        <mixed-citation publication-type="journal">Gantar, P. (2020). Dictionary of Modern Slovene: From Slovene lexical database to digital dictionary database. Rasprave, 46(2), 589-602.</mixed-citation>
                    </ref>
                                    <ref id="ref9">
                        <label>9</label>
                        <mixed-citation publication-type="journal">Gillis-Webber, F. (2018). Conversion of the English-Xhosa dictionary for nurses to a linguistic linked data framework. Information, 9(11), 274. https://doi.org/10.3390/info9110274</mixed-citation>
                    </ref>
                                    <ref id="ref10">
                        <label>10</label>
                        <mixed-citation publication-type="journal">Ide, N., &amp; Veronis, J. (1993). Extracting knowledge bases from machine-readable dictionaries: Have we wasted our time? Knowledge Bases &amp; Knowledge Structures 93, Tokyo, 257-266.</mixed-citation>
                    </ref>
                                    <ref id="ref11">
                        <label>11</label>
                        <mixed-citation publication-type="journal">Ide, N., &amp; Veronis, J. (1995). Encoding dictionaries. In N. Ide and J. Veronis (Eds.), The Text Encoding Initiative: Background and Context, special triple issue of Computers and the Humanities, 29(2), 167-180.</mixed-citation>
                    </ref>
                                    <ref id="ref12">
                        <label>12</label>
                        <mixed-citation publication-type="journal">Ide, N., Kilgarriff, A., &amp; Romary, L. (2000). A formal model of dictionary structure and content. Euralex 2000 Proceedings, 113-126.</mixed-citation>
                    </ref>
                                    <ref id="ref13">
                        <label>13</label>
                        <mixed-citation publication-type="journal">Jarrar, M., &amp; Amayreh, H. (2019). An Arabic-Multilingual Database with a Lexicographic Search Engine. In Lecture notes in computer science, 234-246. Springer International Publishing. https://doi.org/10.1007/978-3-030-23281-8_19</mixed-citation>
                    </ref>
                                    <ref id="ref14">
                        <label>14</label>
                        <mixed-citation publication-type="journal">Khemakhem, M., Herold, A., &amp; Romary, L. (2018). Enhancing usability for automatically structuring digitised dictionaries. GLOBALEX workshop at LREC 2018, May 2018, Miyazaki, Japan. https://hal.science/hal-01708137v1</mixed-citation>
                    </ref>
                                    <ref id="ref15">
                        <label>15</label>
                        <mixed-citation publication-type="journal">Kovarikova, D. (2021). Sharing data through specialized corpus-based tools: The case of GramatiKat. Journal of Linguistics/Jazykovedný časopis, 72, 531-544. https://doi.org/10.2478/jazcas-2021-0049</mixed-citation>
                    </ref>
                                    <ref id="ref16">
                        <label>16</label>
                        <mixed-citation publication-type="journal">Krek, S., Ponikvar, P., Repar, A., Kosem, I., &amp; Lindemann, D. (2025). DMLEX on Wikibase: Legacy dictionaries as collaboratively editable dataset. Proceedings of the eLex 2025 conference, Bled, Slovenia, 175-189.</mixed-citation>
                    </ref>
                                    <ref id="ref17">
                        <label>17</label>
                        <mixed-citation publication-type="journal">Lemnitzer, L., Romary, L., &amp; Witt, A. (2013). Representing human and machine dictionaries in markup languages. In R. Gouws, U. Heid, W. Schweickard, &amp; H. E. Wiegand (Eds.), HSK - Dictionaries. An international encyclopedia of lexicography: Supplementary volume: Recent developments with special focus on computational lexicography (Vol. 5.4, pp. 1195–1208). Mouton de Gruyter.</mixed-citation>
                    </ref>
                                    <ref id="ref18">
                        <label>18</label>
                        <mixed-citation publication-type="journal">Lindemann, D. (2025). Ontolex-Lemon in Wikidata and other Wikibase instances. Proceedings of the 5th Conference on Language, Data and Knowledge: Workshops, 287–297. https://doi.org/10.5281/zenodo.15861038</mixed-citation>
                    </ref>
                                    <ref id="ref19">
                        <label>19</label>
                        <mixed-citation publication-type="journal">Mechura, M. (2017). Introducing Lexonomy: An open-source dictionary writing and publishing system. Proceedings of eLex 2017 Conference, 662-679.</mixed-citation>
                    </ref>
                                    <ref id="ref20">
                        <label>20</label>
                        <mixed-citation publication-type="journal">Nasution, A. H., Murakami, Y., &amp; Ishida, T. (2017). Plan optimization for creating bilingual dictionaries of low-resource languages. Proceedings of IEEE International Conference on Culture and Computing, 35-41.</mixed-citation>
                    </ref>
                                    <ref id="ref21">
                        <label>21</label>
                        <mixed-citation publication-type="journal">Rabe, M., Puttkammer, M. J., &amp; van Huyssteen, G. B. (2025). Compiling a Candidate List of Taboo Constructions for an Under-Resourced Language. Proceedings of the eLex 2025 conference, 739-756.</mixed-citation>
                    </ref>
                                    <ref id="ref22">
                        <label>22</label>
                        <mixed-citation publication-type="journal">Romary, L., &amp; Wegstein, W. (2012). Consistent modeling of Heterogeneous Lexical Structures. Journal of the Text Encoding Initiative, 3, 1-43.</mixed-citation>
                    </ref>
                                    <ref id="ref23">
                        <label>23</label>
                        <mixed-citation publication-type="journal">Romary, L., Khemakhem, M., Khan, F., Bowers, J., Calzolari, N., George, M., Pet, M., &amp; Bański, P. (2019). LMF reloaded. Proceedings of the AsiaLex 2019 Conference, 533–539.</mixed-citation>
                    </ref>
                                    <ref id="ref24">
                        <label>24</label>
                        <mixed-citation publication-type="journal">Rundell, M. (2023). Automating the creation of dictionaries: Are we nearly there? Proceedings of the 16th International Conference of the Asian Association for Lexicography (ASIALEX 2023), 9-17.</mixed-citation>
                    </ref>
                                    <ref id="ref25">
                        <label>25</label>
                        <mixed-citation publication-type="journal">Saveski, M., &amp; Trajkovski, I. (2011). Development of an English–Macedonian machine readable dictionary by using parallel corpora. In M. Gusev &amp; P. Mitrevski (Eds.), ICT Innovations 2010. Communications in Computer and Information Science (Vol. 83, pp. 207–218). Springer. https://doi.org/10.1007/978-3-642-19325-5_20</mixed-citation>
                    </ref>
                                    <ref id="ref26">
                        <label>26</label>
                        <mixed-citation publication-type="journal">Sobkowiak, W. (1996). Phonetic Transcription in Machine-readable Dictionaries. Proceedings of the 7th EURALEX International Congress (EURALEX ’96), 181-188.</mixed-citation>
                    </ref>
                                    <ref id="ref27">
                        <label>27</label>
                        <mixed-citation publication-type="journal">Stöckle, P., Elsner, D., Koppensteiner, W., &amp; Korecky-Kröll, K. (2025). LLM-assisted dialect lexicography: Challenges and opportunities in processing historical Bavarian dialects. Proceedings of the eLex 2025 Conference, 453–475.</mixed-citation>
                    </ref>
                                    <ref id="ref28">
                        <label>28</label>
                        <mixed-citation publication-type="journal">TEI Consortium. (2012). TEI P5: Guidelines for electronic text encoding and interchange.</mixed-citation>
                    </ref>
                                    <ref id="ref29">
                        <label>29</label>
                        <mixed-citation publication-type="journal">Tiberius, C., Heylen, K., De Does, J., Vanroy, B., Vandeghinste, V., &amp; Van Doeselaar, J. (2024). LLMs and evidence-based lexicography: Pilot studies at INT. In S. Krek (Ed.), Book of abstracts of the workshop Large Language Models and Lexicography (pp. 44–48).</mixed-citation>
                    </ref>
                                    <ref id="ref30">
                        <label>30</label>
                        <mixed-citation publication-type="journal">Veronis, J., &amp; Ide, N. (1991). An assessment of semantic information automatically extracted from machine readable dictionaries. In J. Kunze &amp; D. Reimann (Eds.), Fifth Conference of the European Chapter of the Association for Computational Linguistics (pp. 227–232). Association for Computational Linguistics. https://aclanthology.org/E91-1040/</mixed-citation>
                    </ref>
                                    <ref id="ref31">
                        <label>31</label>
                        <mixed-citation publication-type="journal">Vulić, I., De Smet, W., &amp; Moens, M.-F. (2012). Cross-language information retrieval models based on latent topic models trained with document-aligned comparable corpora. Information Retrieval, 16(3), 331–368. https://doi.org/10.1007/s10791-012-9200-5</mixed-citation>
                    </ref>
                            </ref-list>
                    </back>
    </article>
