@article{article_1596966, title={Building An Integrated Database For {Turkish} Startups: A Systematic And Novel Framework}, journal={Bilecik Şeyh Edebali Üniversitesi Fen Bilimleri Dergisi}, volume={12}, pages={398--420}, year={2025}, DOI={10.35193/bseufbd.1596966}, author={Çelikel, İsmail Ozan and Bahar, Eda and Orman, Günce Keziban and Turhan, Sultan Nezihe}, keywords={Turkish Startup Ecosystem, Integrated Database, MongoDB, Exploratory Data Analysis, Web Scraping, DataOps}, abstract={In recent years, the Turkish startup ecosystem has grown significantly thanks to the increase in government support, diversification of private investments, the spread of startup culture worldwide, and technological developments. Despite the rapidly increasing numbers, there is no up-to-date, comprehensive, and analytically serviceable database for new entrepreneurial firms in different sectors. This study creates an integrated and centralized database for startups in Türkiye by using a hybrid methodology that combines traditional ETL processes with modern data engineering techniques. All data belonging to the companies were obtained from public databases and national techno-hub pools via the web scrape method and stored in a database on MongoDB, a document-based NoSQL database. While data preprocessing provided consistency, integrity, and structural integrity, exploratory data analysis revealed critical insights into the geographical distribution, fields of activity, and workforce metrics of the startup ecosystem in Türkiye. The findings obtained at the end of the study provide very valuable information to stakeholders, including researchers, policymakers, and firms operating in different sectors. The data pipeline construction methodology introduced in the study, characterized by its scalability and adaptability, also serves as a replicable framework for data engineering projects in other fields. 
Future research can further enhance its analytical capacity by enriching this dataset with financial metrics and sectoral impacts.}, number={2}, publisher={Bilecik Seyh Edebali University}, organization={The author(s) acknowledge that they received no external funding to support this research.}