<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.172383.3</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Research Article</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Application of K-Means Clustering for Job Applicant Analysis in Construction Firms Using R</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 3; peer review: 4 approved with reservations]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Jaya</surname>
                        <given-names>Daniel Jesayanto</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Project Administration</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0003-1940-6302</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Ramdhani</surname>
                        <given-names>Wahyu Muhammad</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0009-0000-3816-6100</uri>
                    <xref ref-type="aff" rid="a3">3</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Wati</surname>
                        <given-names>Endang</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0009-0008-4264-7984</uri>
                    <xref ref-type="aff" rid="a3">3</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Nandes</surname>
                        <given-names>Yogi Novario</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0009-0000-4028-3672</uri>
                    <xref ref-type="aff" rid="a4">4</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Nadhiroh</surname>
                        <given-names>Ilma Zahriyatun</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0009-0002-0352-2691</uri>
                    <xref ref-type="aff" rid="a4">4</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Pade</surname>
                        <given-names>Reza Bakhrun Fidianto</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0009-0009-6281-8418</uri>
                    <xref ref-type="aff" rid="a3">3</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Technology and Vocational Education and Training, Universitas Negeri Yogyakarta, Yogyakarta, Special Region of Yogyakarta, 55282, Indonesia</aff>
                <aff id="a2">
                    <label>2</label>Building Engineering Education, Universitas Negeri Jakarta, East Jakarta, Special Capital Region of Jakarta, Indonesia</aff>
                <aff id="a3">
                    <label>3</label>Educational Research and Evaluation, Universitas Negeri Yogyakarta, Yogyakarta, Special Region of Yogyakarta, 55282, Indonesia</aff>
                <aff id="a4">
                    <label>4</label>English Language Education, Universitas Negeri Yogyakarta, Yogyakarta, Special Region of Yogyakarta, 55282, Indonesia</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:danieljesayanto.2023@student.uny.ac.id">danieljesayanto.2023@student.uny.ac.id</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>16</day>
                <month>6</month>
                <year>2026</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2025</year>
            </pub-date>
            <volume>14</volume>
            <elocation-id>1388</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>8</day>
                    <month>5</month>
                    <year>2026</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Jaya DJ et al.</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/14-1388/pdf"/>
            <abstract>
                <p>This study applies K-Means clustering to segment job applicant test data from a construction consulting firm to support data-driven screening decisions. From 161 applicants, 30 candidates who met the document-screening requirements were invited for in-person testing and included in the analysis. Three assessment variables were used: AutoCAD drafting skills, planning/supervision report-writing skills, and adaptability. Using R, K-Means clustering was performed to partition candidates into three groups based on multivariate similarity patterns, and the resulting group structure was visualized using 2D and 3D scatter plots. The clustering output revealed distinct competency profiles: one group characterized by generally lower scores across the three variables, a second group with moderate and mixed scores, and a third group with consistently higher scores. Internal validity indices suggested modest separation (mean silhouette&#x00a0;=&#x00a0;0.16; Davies&#x2013;Bouldin Index&#x00a0;=&#x00a0;2.05), consistent with exploratory clustering on a small pre-screened sample. These patterns provide a structured interpretation of applicant diversity and can inform practical recruitment actions such as prioritizing candidates for interviews, identifying borderline profiles for additional evaluation, and designing targeted upskilling recommendations for specific competency gaps. Overall, this study illustrates how unsupervised clustering of routine recruitment test results may support more structured interpretation of applicant competency profiles in early-stage construction-sector recruitment, provided that the results are used cautiously alongside professional judgment and further validation.</p>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>K-Means Clustering; data-driven recruitment; workforce selection; cluster visualization; construction competencies</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1" xlink:href="https://doi.org/10.13039/501100014538">
                    <funding-source>Lembaga Pengelola Dana Pendidikan</funding-source>
                    <award-id>202407111205431</award-id>
                    <award-id>202406111204346</award-id>
                    <award-id>202406111202933</award-id>
                    <award-id>202312211239164</award-id>
                    <award-id>202404111201727</award-id>
                    <award-id>202407112005435</award-id>
                </award-group>
                <funding-statement>This research was funded by scholarships awarded by the Indonesian Endowment Fund for Education (LPDP), with Grant Numbers 202312211239164 (Daniel Jesayanto Jaya), 202407112005435 (Wahyu Muhammad Ramdhani), 202406111202933 (Endang Wati), 202406111204346 (Yogi Novario Nandes), 202407111205431 (Ilma Zahriyatun Nadhiroh), and 202404111201727 (Reza Bakhrun Fidianto Pade).</funding-statement>
                <funding-statement>
                    <italic>The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</italic>
                </funding-statement>
            </funding-group>
        </article-meta>
        <notes>
            <sec sec-type="version-changes">
                <label>Revised</label>
                <title>Amendments from Version 2</title>
                <p>This new version revises the manuscript in response to reviewer comments. The literature review has been strengthened with broader international scholarship on HR analytics, algorithm-assisted recruitment, AI-assisted hiring, fairness, transparency, and human oversight. The Methods section now provides clearer justification for analysing the 30 shortlisted candidates, clarifies preprocessing decisions, and explains the use of K-Means clustering as an exploratory decision-support technique rather than an automated hiring system. The justification for the three-cluster solution has also been expanded by discussing managerial interpretability alongside internal validity diagnostics, including silhouette coefficient and Davies&#x2013;Bouldin Index. Variable terminology has been standardized throughout the manuscript, tables, figures, and supplementary materials. The Results, Discussion, Limitations, and Conclusions have been revised to emphasize the exploratory nature of the findings and to avoid overstating recruitment effectiveness. Revised figure files and updated supplementary materials have been deposited in Zenodo to align the extended data with the revised manuscript.</p>
            </sec>
        </notes>
    </front>
    <body>
        <sec id="sec1" sec-type="intro">
            <title>1. Introduction</title>
            <sec id="sec1.1">
                <title>1.1 Research background</title>
                <p>In the modern workplace, workforce selection is a critical component of human resource development, particularly in sectors that require a combination of technical expertise and adaptive capability. Career development and career transformation are influenced not only by formal qualifications but also by individuals&#x2019; ability to adapt to changing work environments and collaborate effectively with diverse stakeholders. Data-driven approaches to workforce analysis have therefore gained attention as tools to support more structured and transparent evaluation processes (
                    <xref ref-type="bibr" rid="ref29">Pala, 2021</xref>).</p>
                <p>Recruitment involves more than sourcing candidates; it requires systematic decision-making informed by job analysis, organizational needs, and available labor characteristics (
                    <xref ref-type="bibr" rid="ref40">Widodo, 2018</xref>). Job analysis plays a central role in defining task requirements, competency expectations, and qualification standards, thereby helping organizations align applicants with role-specific demands. From the applicant&#x2019;s perspective, successful job search outcomes depend on understanding personal competencies, evaluating labor market opportunities, and developing skills that match employer expectations (
                    <xref ref-type="bibr" rid="ref25">
London, 1973</xref>).</p>
                <p>In the construction sector, technical competencies such as AutoCAD drafting, the ability to prepare planning and supervision reports, and adaptability to dynamic project environments are particularly valued (
                    <xref ref-type="bibr" rid="ref15">Gangl, 2003</xref>). These competencies are increasingly important in large-scale infrastructure development contexts. In Indonesia, national strategic projects such as the Nusantara Capital City (Ibu Kota Nusantara, IKN) development have intensified demand for construction personnel with both technical proficiency and social adaptability (
                    <xref ref-type="bibr" rid="ref19">Irmawan et al., 2023</xref>; 
                    <xref ref-type="bibr" rid="ref35">Supriyanti et al., 2023</xref>). Managing and interpreting recruitment assessment data in such contexts presents practical challenges, especially when organizations must evaluate multiple competency dimensions simultaneously.</p>
                <p>Contemporary recruitment is increasingly shaped by data-driven and technology-assisted decision-making. In human resource management, analytics can help organizations organize multidimensional applicant information, improve the transparency of assessment processes, and support more systematic screening decisions (
                    <xref ref-type="bibr" rid="ref29">Pala, 2021</xref>; 
                    <xref ref-type="bibr" rid="ref18">Hurbean et al., 2023</xref>; 
                    <xref ref-type="bibr" rid="ref26">Madanchian, 2024</xref>). However, the use of analytical tools in recruitment also requires caution because applicant evaluation is a consequential decision-making context. Recent discussions on AI-assisted hiring and algorithmic decision-making emphasize that analytics should not be treated as a substitute for professional judgment, particularly when sample size, assessment scope, and validation evidence are limited (
                    <xref ref-type="bibr" rid="ref32">Rigotti &amp; Fosch-Villaronga, 2024</xref>; 
                    <xref ref-type="bibr" rid="ref5">Dadaboyev et al., 2025</xref>). Issues such as transparency, explainability, fairness, adverse impact, and human oversight are central to responsible recruitment analytics (
                    <xref ref-type="bibr" rid="ref28">National Institute of Standards and Technology [NIST], 2023</xref>; 
                    <xref ref-type="bibr" rid="ref12">
European Union Parliament and Council, 2024</xref>; 
                    <xref ref-type="bibr" rid="ref10">
U.S. Equal Employment Opportunity Commission [EEOC], 2023</xref>).</p>
                <p>In this study, K-Means clustering is therefore positioned as an exploratory decision-support technique rather than an automated hiring or rejection system. The purpose of clustering is to describe competency patterns among candidates who had already passed document screening and completed in-person assessment. The resulting cluster labels are analytical interpretations of score similarity patterns and should be read as preliminary competency profiles that may inform further managerial review, not as definitive employment decisions (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>; 
                    <xref ref-type="bibr" rid="ref24">Kassambara, 2017</xref>).</p>
                <p>Cluster analysis offers a data-driven approach to explore patterns within applicant assessment data by grouping individuals with similar characteristics. Clustering techniques partition data into internally homogeneous and externally heterogeneous groups, thereby supporting structured interpretation of complex multivariate information (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>). Among these techniques, K-Means clustering is widely used due to its computational simplicity and interpretability, making it suitable for exploratory analysis of recruitment-related datasets. In recruitment contexts, clustering can be applied to post-screening assessment data to identify competency profiles rather than to make automated hiring decisions.</p>
                <p>Beyond operational efficiency, the use of data-driven tools in recruitment raises broader issues of transparency, governance, and fairness in algorithm-assisted selection. International guidance emphasizes that AI-enabled assessment should be accompanied by risk management, documentation, and ongoing monitoring of unintended impacts (
                    <xref ref-type="bibr" rid="ref28">NIST, 2023</xref>). In addition, U.S. Equal Employment Opportunity Commission (EEOC) guidance highlights that employers should assess whether algorithmic or AI-based selection procedures produce adverse impact under Title VII and aligns such assessment with the Uniform Guidelines on Employee Selection Procedures (
                    <xref ref-type="bibr" rid="ref10">EEOC, 2023</xref>). Similarly, the European Union Artificial Intelligence Act classifies certain AI systems used in employment-related contexts as high-risk, reinforcing expectations for accountability and safeguards when analytics influence employment decisions (
                    <xref ref-type="bibr" rid="ref12">
European Union Parliament and Council, 2024</xref>). Accordingly, this study positions K-Means clustering as an exploratory decision-support technique rather than an automated hiring system; cluster labels are interpreted cautiously as descriptive competency profiles and are intended to complement human review rather than replace managerial judgment.</p>
                <p>This study applies K-Means clustering to recruitment test data from a construction consulting firm, focusing on candidates who passed document screening and completed in-person assessments. Using three core variables&#x2014;AutoCAD drafting skills, planning/supervision report-writing skills, and adaptability&#x2014;the study demonstrates how unsupervised clustering can support exploratory analysis of applicant competency profiles within a real organizational context.</p>
            </sec>
            <sec id="sec1.2">
                <title>1.2 Literature review</title>
                <p>Clustering is an unsupervised analytical technique used to group objects into clusters based on attribute similarity, such that objects within the same cluster exhibit higher similarity than those in other clusters (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>). By minimizing within-cluster variation and maximizing between-cluster differences, clustering supports pattern discovery and interpretation in complex datasets (
                    <xref ref-type="bibr" rid="ref27">Manikandan et al., 2018</xref>; 
                    <xref ref-type="bibr" rid="ref6">Darmi &amp; Setiawan, 2016</xref>). For organizational and workforce analytics, clustering provides a data-driven means of understanding heterogeneity among individuals without requiring predefined class labels.</p>
                <p>Among various clustering approaches, K-Means clustering is one of the most widely applied methods due to its simplicity, efficiency, and interpretability. K-Means partitions data into 
                    <italic toggle="yes">k</italic> clusters by iteratively assigning observations to the nearest centroid and updating centroid positions until convergence is achieved (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>). Because of its relatively low computational cost, K-Means is suitable for applied settings where rapid analysis and transparent interpretation are required (
                    <xref ref-type="bibr" rid="ref13">Fadhli, 2017</xref>).</p>
                <p>Previous studies demonstrate applicability across domains. In educational research, K-Means has been used to analyze student preferences and learning achievement patterns (
                    <xref ref-type="bibr" rid="ref14">Firza &amp; Sarjono, 2020</xref>). In organizational contexts, it has been applied to group employees based on discipline and performance indicators to support human resource decision-making (
                    <xref ref-type="bibr" rid="ref2">Agustina &amp; Prihandoko, 2018</xref>). Comparative studies suggest that while alternatives such as Fuzzy C-Means may offer advantages in some conditions, K-Means remains computationally efficient and practical for many real-world applications (
                    <xref ref-type="bibr" rid="ref41">Wiharto &amp; Suryani, 2020</xref>).</p>
                <p>

                    <bold>1.2.1 K-Means algorithm</bold>
                </p>
                <p>K-Means is a partition-based clustering algorithm that divides data into a predefined number of clusters by minimizing the average distance between data points and their respective cluster centroids (
                    <xref ref-type="bibr" rid="ref39">Widiyaningtyas et al., 2017</xref>). The algorithm operates iteratively, beginning with the selection of initial centroid values and proceeding through repeated reassignment of data points based on distance calculations until cluster membership stabilizes (
                    <xref ref-type="bibr" rid="ref30">Purba et al., 2018</xref>). Prior work emphasizes that K-Means can be sensitive to initialization and the scale of input variables, highlighting the need for transparent methodological choices in applied studies (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>).</p>
                <p>

                    <bold>1.2.2 Worker recruitment</bold>
                </p>
                <p>Recruitment is a strategic organizational process aimed at attracting and selecting individuals whose competencies align with job requirements and organizational objectives. Job analysis plays a critical role in defining tasks, responsibilities, and qualification standards, thereby guiding recruitment and selection decisions (
                    <xref ref-type="bibr" rid="ref40">Widodo, 2018</xref>). In the construction sector, recruitment emphasizes a combination of technical competencies&#x2014;such as drafting and report preparation&#x2014;and adaptive capabilities, reflecting the dynamic and collaborative nature of construction projects (
                    <xref ref-type="bibr" rid="ref15">Gangl, 2003</xref>). The job search process seeks to match job seekers with appropriate opportunities and can be supported through technology-enabled and data-driven methods (
                    <xref ref-type="bibr" rid="ref17">Green et al., 2011</xref>). Given the multidimensionality of applicant data, clustering methods such as K-Means offer a way to organize assessment results into interpretable competency profiles that can support early-stage evaluation (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>).</p>
                <p>

                    <bold>1.2.3 HR analytics and algorithm-assisted recruitment</bold>
                </p>
                <p>HR analytics refers to the systematic use of workforce-related data to support organizational decision-making. In recruitment, HR analytics can assist decision-makers by structuring applicant information, identifying patterns across competency dimensions, and supporting more consistent interpretation of assessment results (
                    <xref ref-type="bibr" rid="ref29">Pala, 2021</xref>; 
                    <xref ref-type="bibr" rid="ref18">Hurbean et al., 2023</xref>; 
                    <xref ref-type="bibr" rid="ref37">Venugopal et al., 2024</xref>). This is particularly relevant in sectors such as construction consulting, where applicants may need to demonstrate both technical skills and adaptive capabilities. From a human resource development perspective, recruitment is not only a selection activity but also part of a broader workforce capability system because it determines how organizations identify, develop, and allocate human talent (
                    <xref ref-type="bibr" rid="ref40">Widodo, 2018</xref>; 
                    <xref ref-type="bibr" rid="ref11">El Achmar &amp; Bhagat, 2023</xref>; 
                    <xref ref-type="bibr" rid="ref21">Jaya et al., 2026a</xref>).</p>
                <p>The growing use of analytics and artificial intelligence in recruitment has also generated debate about fairness, transparency, and accountability. AI-assisted hiring systems may improve efficiency in screening and assessment, but recent literature cautions that these systems can reproduce bias, create opacity in decision-making, and produce adverse impacts when used without proper validation and oversight (
                    <xref ref-type="bibr" rid="ref26">Madanchian, 2024</xref>; 
                    <xref ref-type="bibr" rid="ref32">Rigotti &amp; Fosch-Villaronga, 2024</xref>; 
                    <xref ref-type="bibr" rid="ref5">Dadaboyev et al., 2025</xref>). Therefore, algorithm-assisted recruitment should be accompanied by clear documentation, human review, and careful interpretation of results (
                    <xref ref-type="bibr" rid="ref28">NIST, 2023</xref>; 
                    <xref ref-type="bibr" rid="ref10">EEOC, 2023</xref>; 
                    <xref ref-type="bibr" rid="ref12">
European Union Parliament and Council, 2024</xref>).</p>
                <p>In this context, clustering offers a comparatively transparent exploratory method. Unlike predictive models that estimate hiring outcomes or job performance, clustering groups applicants based on similarity in observed assessment scores (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>; 
                    <xref ref-type="bibr" rid="ref24">Kassambara, 2017</xref>). This makes the method useful for descriptive segmentation and early-stage decision support. Nevertheless, cluster labels should not be interpreted as evidence of actual job performance or recruitment effectiveness unless they are externally validated using hiring outcomes, supervisor evaluations, or post-employment performance data (
                    <xref ref-type="bibr" rid="ref22">Jaya et al., 2026b</xref>). Accordingly, this study uses K-Means clustering to generate interpretable applicant competency profiles while acknowledging the methodological and ethical limits of using analytical tools in recruitment decision-making.</p>
            </sec>
        </sec>
        <sec id="sec2" sec-type="methods">
            <title>2. Methods</title>
            <sec id="sec2.1">
                <title>2.1 Research design</title>
                <p>This study employed a quantitative, exploratory research design using unsupervised clustering to analyze recruitment assessment data from a construction consulting firm. The primary objective was to explore competency-based grouping patterns among job applicants using K-Means clustering as a decision-support tool, rather than to predict hiring outcomes or evaluate post-employment performance. The overall research workflow is illustrated in 
                    <xref ref-type="fig" rid="f1">
Figure 1</xref>.</p>
                <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                    <label>
Figure 1. </label>
                    <caption>
                        <title>Workflow research diagram.</title>
                    </caption>
                    <graphic id="gr1" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/201201/6a2483f6-f530-4706-b1d5-948b3587a9da_figure1.gif"/>
                </fig>
            </sec>
            <sec id="sec2.2">
                <title>2.2 Data source and participant selection</title>
                <p>The data were obtained from CV Ardantama Putra Perkasa as part of its internal recruitment process. Although the vacancy was advertised through JobStreet Indonesia, all data analyzed in this study originated exclusively from the company&#x2019;s internal screening and testing procedures.</p>
                <p>A total of 161 applicants applied for the position. Applicants were shortlisted through the company&#x2019;s standard document-screening procedure conducted by the HR team and the hiring unit. Screening focused on administrative completeness and role relevance, including: (i) completeness of required documents; (ii) educational background and relevance to construction consulting work; (iii) evidence of relevant technical exposure, such as drafting/reporting-related tasks or portfolio where available; and (iv) basic eligibility criteria specified in the vacancy announcement. From this process, 30 candidates met the minimum document-screening requirements and were invited to complete in-person competency testing.</p>
                <p>Only these 30 shortlisted candidates were included in the clustering analysis because complete assessment scores were available for all three variables: AutoCAD drafting skills, planning/supervision report-writing skills, and adaptability. This sampling decision means that the analysis represents competency patterns among a pre-screened analytical sample rather than the full applicant pool. Following STROBE-style reporting principles, this sampling boundary is explicitly stated to clarify the analytical population, eligibility process, and limitations of inference (
                    <xref ref-type="bibr" rid="ref38">von Elm et al., 2007</xref>). The results therefore should not be generalized to all 161 applicants or to construction job applicants more broadly. Instead, the analysis illustrates how clustering can be used to organize assessment data after an initial administrative screening stage has already occurred.</p>
            </sec>
            <sec id="sec2.3">
                <title>2.3 Assessment variables</title>
                <p>Candidates were evaluated using three competency indicators relevant to construction consulting roles:
                    <list list-type="order">
                        <list-item>
                            <label>1.</label>
                            <p>AutoCAD drafting skills;</p>
                        </list-item>
                        <list-item>
                            <label>2.</label>
                            <p>planning/supervision report-writing skills;</p>
                        </list-item>
                        <list-item>
                            <label>3.</label>
                            <p>adaptability.</p>
                        </list-item>
                    </list>
                </p>
                <p>AutoCAD drafting skills refer to candidates&#x2019; ability to produce and interpret technical drawings using AutoCAD. Planning/supervision report-writing skills refer to candidates&#x2019; ability to prepare structured reports related to construction planning and supervision activities. Adaptability refers to candidates&#x2019; ability to adjust to changing project conditions, work demands, and organizational expectations. These indicators reflect the need to combine technical competence with adaptive and work-relevant capability in construction-related occupational settings (
                    <xref ref-type="bibr" rid="ref15">Gangl, 2003</xref>; 
                    <xref ref-type="bibr" rid="ref40">Widodo, 2018</xref>; 
                    <xref ref-type="bibr" rid="ref21">Jaya et al., 2026a</xref>).</p>
                <p>Each variable was assessed on a numerical scale from 0 to 100, with higher scores indicating stronger performance. Because all three variables used the same scale, the raw scores were retained for clustering analysis to preserve the original meaning of the assessment results.</p>
            </sec>
            <sec id="sec2.4">
                <title>2.4 Data preprocessing, outlier, and sensitivity checks</title>
                <p>The dataset was reviewed for completeness and consistency before clustering. All 30 shortlisted candidates had complete scores across the three assessment variables; therefore, no candidate records were removed because of missing data. The variable names were standardized throughout the dataset and manuscript as AutoCAD drafting skills, planning/supervision report-writing skills, and adaptability. Clear reporting of data eligibility, exclusions, and analytical decisions is important for reproducibility in observational data analysis (
                    <xref ref-type="bibr" rid="ref38">von Elm et al., 2007</xref>).</p>
                <p>Because all variables were measured on the same 0&#x2013;100 scale, the analysis used raw scores without additional normalization or standardization. This decision was made to preserve the practical interpretation of the original assessment scores. Euclidean distance was used as the distance metric because K-Means clustering groups observations by minimizing within-cluster squared distances (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>; 
                    <xref ref-type="bibr" rid="ref24">Kassambara, 2017</xref>). Basic outlier and sensitivity checks were conducted by inspecting score distributions, distances to cluster centroids, and two-dimensional and three-dimensional visualizations. These checks were used to determine whether any individual observation disproportionately shaped the cluster interpretation.</p>
            </sec>
            <sec id="sec2.5">
                <title>2.5 Clustering procedure</title>
                <p>K-Means clustering was applied to group candidates based on similarity across the three assessment variables. The number of clusters was set to k&#x00a0;=&#x00a0;3 because the company required an interpretable decision-support structure that could distinguish lower, intermediate, and higher competency profiles for managerial review. However, this three-cluster solution is not interpreted as proof that the dataset contains three naturally distinct applicant groups. Rather, k&#x00a0;=&#x00a0;3 was used as a practically meaningful segmentation structure and was examined using internal diagnostic checks.</p>
                <p>The analysis used Euclidean squared distance to assign each candidate to the nearest centroid. Because K-Means can be sensitive to centroid initialization, variable scaling, and the predefined number of clusters, the initial centroids and iteration procedure were explicitly reported in the supplementary materials. Methodological transparency is particularly important when applying K-Means to small applied datasets (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>; 
                    <xref ref-type="bibr" rid="ref24">Kassambara, 2017</xref>). Cluster-number justification was examined using the elbow method and additional internal diagnostics, including the silhouette coefficient and Davies&#x2013;Bouldin Index (
                    <xref ref-type="bibr" rid="ref33">Rousseeuw, 1987</xref>; 
                    <xref ref-type="bibr" rid="ref7">Davies &amp; Bouldin, 1979</xref>). These diagnostics were used to assess whether the three-cluster solution was reasonably interpretable while acknowledging that internal validation metrics in small, pre-screened datasets should be interpreted cautiously.</p>
                <p>The clustering workflow was implemented using spreadsheet-based calculations for transparency of manual steps and R programming for reproducibility, validity checks, and visualization. Intermediate iteration tables, R scripts, and visualization outputs are provided as extended data.</p>
                <p>The final clustering procedure was implemented in R using a custom K-Means function with fixed initial centroids derived from the spreadsheet-based clustering workflow. The algorithm calculated Euclidean squared distances, assigned each candidate to the nearest centroid, recalculated cluster centroids, and repeated the process until centroid values stabilized. Because the initial centroids were fixed and explicitly reported, the clustering procedure is deterministic for the reported dataset. The R script, supporting tables, and visualization outputs are provided as extended data.</p>
            </sec>
            <sec id="sec2.6">
                <title>2.5.1 Cluster-number justification and stability checks</title>
                <p>Because the number of clusters in K-Means must be specified before analysis, the choice of k was evaluated using both practical and diagnostic considerations. Practically, k&#x00a0;=&#x00a0;3 corresponded to the company&#x2019;s need for three interpretable competency profiles that could support recruitment discussion: lower, intermediate, and higher competency profiles. Analytically, the three-cluster solution was examined using the elbow method, silhouette coefficient, and Davies&#x2013;Bouldin Index.</p>
                <p>The elbow method was used to compare the reduction in within-cluster sum of squares across alternative cluster numbers. The silhouette coefficient was used to evaluate the degree to which candidates were closer to their assigned cluster than to other clusters (
                    <xref ref-type="bibr" rid="ref33">Rousseeuw, 1987</xref>). The Davies&#x2013;Bouldin Index was used to assess within-cluster compactness relative to between-cluster separation (
                    <xref ref-type="bibr" rid="ref7">Davies &amp; Bouldin, 1979</xref>). Because the final workflow used fixed initial centroids, the analysis was reproducible without stochastic initialization. The diagnostic indices were therefore used primarily to evaluate the interpretability of the selected three-cluster solution rather than to claim strong natural cluster separation. These diagnostic checks are commonly recommended because internal validity indices provide useful but incomplete evidence, particularly when clusters overlap or sample sizes are small (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>; 
                    <xref ref-type="bibr" rid="ref24">Kassambara, 2017</xref>; 
                    <xref ref-type="bibr" rid="ref22">Jaya et al., 2026b</xref>).</p>
                <p>These diagnostics were not used to claim that k&#x00a0;=&#x00a0;3 represents a definitive natural structure in the data. Instead, they were used to examine whether the selected three-cluster solution was defensible as an exploratory and managerially interpretable grouping of shortlisted candidates.</p>
            </sec>
            <sec id="sec2.7">
                <title>2.6 Visualization and interpretation</title>
                <p>Clustering results were visualized using two-dimensional and three-dimensional scatter plots. Two-dimensional plots illustrated relationships between AutoCAD drafting skills and planning/supervision report-writing skills, while three-dimensional plots incorporated adaptability as a third axis.</p>
                <p>Clusters were subsequently labeled as &#x201c;Lower competency profile,&#x201d; &#x201c;Intermediate/mixed competency profile,&#x201d; and &#x201c;Higher competency profile&#x201d; based on their relative position in the multivariate competency space. These labels represent analytical interpretations of score patterns and do not constitute formal hiring decisions made by the company.</p>
            </sec>
            <sec id="sec2.8">
                <title>2.7 Scope and methodological limitations</title>
                <p>This study focuses on exploratory grouping of recruitment assessment data from a pre-screened subset of applicants. The clustering results were not validated against final hiring decisions or post-employment performance outcomes. Accordingly, findings should be interpreted as structured analytical support rather than definitive evidence of selection effectiveness.</p>
            </sec>
            <sec id="sec2.9">
                <title>2.8 Cluster validity assessment</title>
                <p>To provide quantitative support for the cluster structure, internal validity indices were calculated. The silhouette coefficient was computed using Euclidean distances to estimate how well each candidate matched its assigned cluster relative to other clusters. The Davies&#x2013;Bouldin Index (DBI) was calculated to evaluate average cluster similarity based on within-cluster dispersion relative to between-cluster centroid distances. These indices were interpreted as descriptive diagnostics of separation quality rather than evidence of predictive utility.</p>
            </sec>
        </sec>
        <sec id="sec3">
            <title>3. Results and discussion</title>
            <sec id="sec3.1">
                <title>3.1 Applicant characteristics</title>
                <p>This study analysed recruitment assessment records from CV Ardantama Putra Perkasa, obtained from the company&#x2019;s internal testing and selection process. A total of 161 applicants submitted applications, of whom 30 candidates meeting minimum screening criteria were invited for in-person testing. Each candidate was assessed on three indicators measured on a 0&#x2013;100 scale: AutoCAD drafting skills (X), planning/supervision report-writing skills (Y), and adaptability (Z). Candidate characteristics and scores are summarised in 
                    <xref ref-type="table" rid="T1">
Table 1</xref>.</p>
                <table-wrap id="T1" orientation="portrait" position="float">
                    <label>
Table 1. </label>
                    <caption>
                        <title>Shortlisted candidate characteristics and assessment scores.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Respondent code</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Gender</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
AutoCAD drafting skills (X)</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Planning/supervision 
report-writing skills (Y)</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Adaptability (Z)</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">92</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">75</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">68</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">68</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">65</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">66</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">73</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">86</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">87</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp4</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">69</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">74</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">73</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp5</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">78</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">72</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">91</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp6</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">84</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">90</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">92</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp7</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">69</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">76</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">87</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp8</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">95</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">73</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">76</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp9</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">90</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">80</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">85</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp10</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">68</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">82</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">68</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">63</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">75</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">71</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp12</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">75</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">93</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">77</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp13</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">62</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">72</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">68</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp14</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">90</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">61</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">72</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp15</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">84</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">63</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">90</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp16</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">94</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">70</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">89</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp17</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">73</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">87</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">80</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp18</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">71</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">73</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">95</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp19</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">93</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">62</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">70</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp20</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">90</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">68</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">89</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp21</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">87</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">94</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">87</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp22</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">60</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">90</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">64</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp23</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Female</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">65</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">64</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">93</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp24</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">69</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">84</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">75</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp25</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">66</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">63</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">72</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp26</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">95</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">85</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">93</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp27</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">75</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">80</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">83</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp28</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">92</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">85</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">93</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp29</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">71</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">71</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">85</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp30</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Male</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">92</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">61</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">88</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>Overall, the score distribution shows meaningful heterogeneity across candidates&#x2014;particularly in adaptability and planning/supervision report-writing&#x2014;indicating variation in both technical and interpersonal readiness. This variability provides a suitable basis for exploratory clustering analysis.</p>
            </sec>
            <sec id="sec3.2">
                <title>3.2 K-Means clustering results</title>
                <p>Using K-Means clustering with k&#x00a0;=&#x00a0;3, the 30 assessed candidates were grouped based on similarity across AutoCAD drafting skills, planning/supervision report-writing skills, and adaptability. The three-cluster solution was selected because it provided a practically interpretable structure for recruitment discussion while remaining consistent with the exploratory purpose of the study. The clusters should therefore be interpreted as descriptive competency profiles rather than as statistically definitive applicant classes or formal hiring decisions (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>; 
                    <xref ref-type="bibr" rid="ref24">Kassambara, 2017</xref>).</p>
                <p>The first cluster represents candidates with comparatively lower overall competency profiles across the assessed variables. The second cluster represents candidates with mixed or intermediate competency profiles, indicating that further assessment or managerial consideration may be appropriate. The third cluster represents candidates with comparatively stronger combined technical and adaptive competency profiles. These labels are interpretive and intended to support structured review rather than automate recruitment outcomes, consistent with responsible use of analytics in consequential employment-related decisions (
                    <xref ref-type="bibr" rid="ref28">NIST, 2023</xref>; 
                    <xref ref-type="bibr" rid="ref10">EEOC, 2023</xref>; 
                    <xref ref-type="bibr" rid="ref12">
European Union Parliament and Council, 2024</xref>).</p>
                <p>The first cluster is characterized by relatively lower combined scores across the three assessed competencies. The second cluster consists of candidates with moderate and mixed competency scores, reflecting intermediate profiles that may warrant further evaluation. The third cluster comprises candidates with comparatively higher scores across technical and adaptive dimensions, indicating stronger and more balanced competency profiles.</p>
                <p>The clustering process involved iterative centroid updates until cluster memberships stabilized. To maintain readability, detailed distance-to-centroid and iteration tables are provided as extended data, while the main text reports the final centroid summary and stabilized cluster assignment.</p>
                <p>The final stabilized cluster assignment is presented in 
                    <xref ref-type="table" rid="T3">
Table 3</xref>. Respondent codes correspond to the candidate codes reported in 
                    <xref ref-type="table" rid="T1">
Table 1</xref>. Detailed distance-to-centroid calculations and iteration outputs are provided in the Zenodo supplementary materials to support reproducibility without overloading the main manuscript. The final cluster centroid and size summary for the three interpretive profiles is presented in 
                    <xref ref-type="table" rid="T2">
Table 2</xref>.</p>
                <table-wrap id="T2" orientation="portrait" position="float">
                    <label>
Table 2. </label>
                    <caption>
                        <title>Cluster centroid and size summary.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Cluster</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">n</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
AutoCAD drafting skills, mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Planning/supervision 
report-writing skills, mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Adaptability, mean</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Interpretive profile</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">8</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">65.13</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">73.13</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">71.88</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Lower competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">79.45</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">75.73</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">80.00</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">87.09</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">77.82</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">88.36</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap id="T3" orientation="portrait" position="float">
                    <label>
Table 3. </label>
                    <caption>
                        <title>Final cluster assignment by respondent code.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Respondent code</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Cluster</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">
Category</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Lower competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp4</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Lower competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp10</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Lower competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Lower competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp13</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Lower competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp22</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Lower competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp25</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Lower competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp23</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Lower competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp24</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp17</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp12</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp29</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp18</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp27</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp14</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp19</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp1</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp30</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Intermediate/mixed competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp7</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp5</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp15</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp6</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp8</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp9</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp16</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp20</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp21</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp26</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Resp28</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">Higher competency profile</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
            <sec id="sec3.3">
                <title>3.2.1 Cluster validity metrics</title>
                <p>Internal validity diagnostics were calculated to evaluate the interpretability of the selected cluster solution. For the three-cluster solution, the mean silhouette coefficient was 0.16, indicating modest and weak-to-moderate separation among applicant competency profiles. The Davies&#x2013;Bouldin Index was 2.05, suggesting limited compactness and separation between clusters. These values indicate that the clusters are interpretable for exploratory and managerial discussion, but they do not demonstrate strong natural separation in the data.</p>
                <p>The elbow method was also used to compare the reduction in within-cluster sum of squares across alternative cluster numbers. The elbow pattern did not provide decisive evidence that three clusters represented a clearly optimal natural structure. Therefore, the three-cluster solution was retained primarily because it aligned with the company&#x2019;s need for a practical and interpretable decision-support structure, while the internal validity indices were interpreted cautiously. These indicators are useful for assessing internal cluster structure, although they do not provide external validation of hiring effectiveness or job performance outcomes (
                    <xref ref-type="bibr" rid="ref7">Davies &amp; Bouldin, 1979</xref>; 
                    <xref ref-type="bibr" rid="ref33">Rousseeuw, 1987</xref>; 
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>).</p>
            </sec>
            <sec id="sec3.4">
                <title>3.3 Visualization of cluster structure</title>
                <p>To support interpretation, two-dimensional and three-dimensional visualizations were generated. 
                    <xref ref-type="fig" rid="f2">
Figure 2</xref> presents a 2D scatter plot based on AutoCAD drafting skills and planning/supervision report-writing skills, showing visible separation between lower, intermediate, and higher competency profiles along key technical dimensions.</p>
                <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                    <label>
Figure 2. </label>
                    <caption>
                        <title>K-means clustering visualization in a 2D scatter plot.</title>
                    </caption>
                    <graphic id="gr2" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/201201/6a2483f6-f530-4706-b1d5-948b3587a9da_figure2.gif"/>
                </fig>
                <p>
                    <xref ref-type="fig" rid="f3">
Figure 3</xref> extends the visualization into three dimensions by incorporating adaptability as a third axis. The 3D scatter plot reveals clearer spatial separation among clusters, particularly distinguishing candidates who combine strong technical skills with high adaptability from those with lower overall competency scores.</p>
                <fig fig-type="figure" id="f3" orientation="portrait" position="float">
                    <label>
Figure 3. </label>
                    <caption>
                        <title>K-means clustering visualization in a 3D scatter plot.</title>
                    </caption>
                    <graphic id="gr3" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/201201/6a2483f6-f530-4706-b1d5-948b3587a9da_figure3.gif"/>
                </fig>
                <p>To further examine structural consistency, hierarchical clustering projected onto principal component space is presented in 
                    <xref ref-type="fig" rid="f4">
Figure 4</xref>. Although hierarchical clustering was not employed as the primary analytical method, the observed grouping patterns broadly align with the K-Means classification, providing additional support for the stability of the three-cluster structure within this dataset.</p>
                <fig fig-type="figure" id="f4" orientation="portrait" position="float">
                    <label>
Figure 4. </label>
                    <caption>
                        <title>Hierarchical clustering visualization using PCA-projected dimensions.</title>
                    </caption>
                    <graphic id="gr4" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/201201/6a2483f6-f530-4706-b1d5-948b3587a9da_figure4.gif"/>
                </fig>
            </sec>
            <sec id="sec3.5">
                <title>3.4 Interpretation and discussion</title>
                <p>The clustering results illustrate how K-Means can be used as an exploratory tool to organize recruitment assessment data into interpretable competency profiles within a construction consulting context. The findings suggest that candidates can be descriptively grouped according to combinations of technical and adaptive competencies. However, the results should not be interpreted as evidence that clustering improves recruitment effectiveness because the analysis was conducted on a small, pre-screened sample and was not externally validated against final hiring decisions, supervisor evaluations, or post-employment performance outcomes. This interpretation is consistent with methodological cautions in clustering research, where internal cluster structure does not automatically demonstrate practical or predictive validity (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>; 
                    <xref ref-type="bibr" rid="ref24">Kassambara, 2017</xref>; 
                    <xref ref-type="bibr" rid="ref22">Jaya et al., 2026b</xref>).</p>
                <p>The intermediate cluster is particularly important from a managerial perspective because it represents candidates with mixed competency profiles. Rather than treating this group as a fixed decision category, organizations may use it to identify applicants who require follow-up interviews, additional assessment, or targeted development consideration. In this sense, clustering functions as a decision-support lens that helps structure discussion but does not replace professional judgment (
                    <xref ref-type="bibr" rid="ref29">Pala, 2021</xref>; 
                    <xref ref-type="bibr" rid="ref18">Hurbean et al., 2023</xref>; 
                    <xref ref-type="bibr" rid="ref26">Madanchian, 2024</xref>).</p>
                <p>From an ethical and governance perspective, the use of analytics in recruitment should remain transparent, documented, and subject to human oversight. Cluster labels such as &#x201c;Lower competency profile,&#x201d; &#x201c;Intermediate/mixed competency profile,&#x201d; and &#x201c;Higher competency profile&#x201d; should be understood as descriptive analytical labels rather than automated employment decisions. When analytical tools are used in recruitment contexts, organizations should ensure that their use is aligned with fairness, accountability, and validation principles (
                    <xref ref-type="bibr" rid="ref32">Rigotti &amp; Fosch-Villaronga, 2024</xref>; 
                    <xref ref-type="bibr" rid="ref28">NIST, 2023</xref>; 
                    <xref ref-type="bibr" rid="ref10">EEOC, 2023</xref>; 
                    <xref ref-type="bibr" rid="ref12">
European Union Parliament and Council, 2024</xref>).</p>
            </sec>
            <sec id="sec3.6">
                <title>3.5 Methodological considerations and limitations</title>
                <p>Several limitations should be considered when interpreting these findings. First, the analysis was limited to 30 candidates who had already passed document screening and completed in-person testing. Therefore, the results describe competency patterns within a pre-screened analytical sample and cannot be generalized to the full pool of 161 applicants. Second, the sample size was small for clustering analysis, which limits the strength of claims regarding cluster stability and natural group structure. Third, the study relied on three assessment variables only; additional indicators such as interview performance, portfolio quality, work experience, certification, or supervisor-rated performance could produce a more comprehensive applicant profile. These reporting boundaries are important for transparency in observational data analysis (
                    <xref ref-type="bibr" rid="ref38">von Elm et al., 2007</xref>).</p>
                <p>Fourth, the cluster results were not externally validated against actual hiring outcomes or post-employment job performance. As a result, the study cannot claim that the clustering procedure improves recruitment effectiveness. Instead, the findings should be interpreted as an illustrative application of clustering for organizing multidimensional assessment data. Future research should test this approach using larger applicant pools, additional competency indicators, longitudinal job-performance data, and fairness or adverse-impact analysis (
                    <xref ref-type="bibr" rid="ref20">Jain et al., 1999</xref>; 
                    <xref ref-type="bibr" rid="ref10">EEOC, 2023</xref>; 
                    <xref ref-type="bibr" rid="ref22">Jaya et al., 2026b</xref>).</p>
            </sec>
        </sec>
        <sec id="sec4" sec-type="conclusions">
            <title>4. Conclusions</title>
            <p>This study explored the use of K-Means clustering as an exploratory analytical approach for organizing recruitment assessment data in a construction consulting context. Using data from 30 shortlisted candidates who completed in-person testing, the analysis grouped applicants based on three competency indicators: AutoCAD drafting skills, planning/supervision report-writing skills, and adaptability.</p>
            <p>The three-cluster solution provided an interpretable structure for describing lower, intermediate, and higher competency profiles among the shortlisted candidates. However, these clusters should not be interpreted as definitive hiring categories or as evidence of improved recruitment effectiveness. The analysis was based on a small, pre-screened sample and was not externally validated using final hiring decisions or post-employment performance outcomes.</p>
            <p>The main contribution of this study is therefore methodological and illustrative. It shows how clustering can help structure multidimensional recruitment assessment data and support transparent discussion among decision-makers. Used appropriately, clustering may complement professional judgment by making applicant competency patterns easier to interpret. Nevertheless, the method should be applied cautiously, with clear documentation, human oversight, and further validation before being used in consequential recruitment decisions (
                <xref ref-type="bibr" rid="ref28">NIST, 2023</xref>; 
                <xref ref-type="bibr" rid="ref10">EEOC, 2023</xref>; 
                <xref ref-type="bibr" rid="ref12">
European Union Parliament and Council, 2024</xref>).</p>
            <p>Future studies should apply this approach to larger and more diverse applicant datasets, include additional competency and background variables, compare alternative clustering methods, and examine whether cluster membership relates to actual hiring outcomes or subsequent job performance. Further work should also consider fairness, transparency, and adverse-impact assessment when analytics are used to support recruitment decisions (
                <xref ref-type="bibr" rid="ref32">Rigotti &amp; Fosch-Villaronga, 2024</xref>; 
                <xref ref-type="bibr" rid="ref5">Dadaboyev et al., 2025</xref>).</p>
        </sec>
        <sec id="sec5">
            <title>Ethical approval</title>
            <p>Ethical review and approval were not required for this study because the researchers analyzed fully anonymized secondary data that had been lawfully transferred by CV Ardantama Putra Perkasa under a formal Data Usage Agreement (No. 12/X/S-K/APP/2024). According to Indonesian national research ethics regulations (Permenkes RI No. 74/2016, Article 11) and the general principles of the Declaration of Helsinki, research involving secondary anonymized non-clinical data that cannot identify individuals is exempt from institutional ethical review. Therefore, this study qualifies for an ethics exemption.</p>
        </sec>
        <sec id="sec6">
            <title>Informed consent</title>
            <p>Informed consent for data use was not obtained directly by the researchers, as all data were collected by CV Ardantama Putra Perkasa under standard recruitment procedures. The company confirmed, through the Data Usage Agreement (No. 12/X/S-K/APP/2024), that job applicants had authorized the use of their anonymized recruitment test results for evaluation and administrative purposes in accordance with Indonesian data protection regulations (UU ITE and PP 71/2019). Because the researchers received only anonymized secondary data and had no access to identifiable information, this study meets the criteria for consent exemption.</p>
        </sec>
    </body>
    <back>
        <sec id="sec7">
            <title>Clinical trial registration</title>
            <p>Not applicable.</p>
        </sec>
        <sec id="sec9" sec-type="dataAvailability">
            <title>Data availability statement</title>
            <sec id="sec10">
                <title>Underlying data</title>
                <p>The anonymized job applicant dataset is not publicly available due to confidentiality agreements with CV Ardantama Putra Perkasa. Access may be granted for legitimate academic research upon reasonable request to the corresponding author (
                    <email xlink:href="mailto:danieljesayanto.2023@student.uny.ac.id">danieljesayanto.2023@student.uny.ac.id</email>), subject to approval by the data owner and compliance with Indonesian data protection regulations (UU ITE and PP 71/2019), including signing a Data Use Agreement and a commitment not to attempt re-identification.</p>
            </sec>
            <sec id="sec11">
                <title>Extended data</title>
                <p>Extended data supporting this study, including R scripts, clustering iteration tables, visualizations, and documentation, are openly available in Zenodo at 
                    <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.20070567">https://doi.org/10.5281/zenodo.20070567</ext-link> (
                    <xref ref-type="bibr" rid="ref23">Jaya, 2026</xref>) under the 
                    <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution 4.0 International</ext-link> (CC BY 4.0) license.</p>
            </sec>
        </sec>
        <ack>
            <title>Acknowledgement</title>
            <p>The authors gratefully acknowledge the financial support provided by the Indonesian Endowment Fund for Education (LPDP) as the official sponsor of the scholarships that supported this publication. The authors also thank CV Ardantama Putra Perkasa for granting formal permission to use anonymized job applicant data for research and academic purposes.</p>
        </ack>
        <ref-list>
            <title>References</title>
            <ref id="ref1">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Akkermans</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Donald</surname>
                            <given-names>WE</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Jackson</surname>
                            <given-names>D</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Are we talking about the same thing? The case for stronger connections between graduate and worker employability research.</article-title>
                    <source>

                        <italic toggle="yes">Career Dev. Int.</italic>
</source>
                    <year>2024</year>;<volume>29</volume>(<issue>1</issue>):<fpage>80</fpage>&#x2013;<lpage>92</lpage>.
                    <pub-id pub-id-type="doi">10.1108/CDI-08-2023-0278</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref2">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Agustina</surname>
                            <given-names>N</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Prihandoko</surname>
                            <given-names>P</given-names>
                        </name>
</person-group>:
                    <article-title>Perbandingan algoritma K-Means dengan Fuzzy C-Means untuk clustering tingkat kedisiplinan kinerja karyawan.</article-title>
                    <source>

                        <italic toggle="yes">Jurnal RESTI (Rekayasa Sistem dan Teknologi Informasi).</italic>
</source>
                    <year>2018</year>;<volume>2</volume>(<issue>3</issue>):<fpage>621</fpage>&#x2013;<lpage>626</lpage>.
                    <pub-id pub-id-type="doi">10.29207/resti.v2i3.492</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref3">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Brown</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hesketh</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>The mismanagement of talent: Employability and jobs in the knowledge economy.</article-title>
                    <source>

                        <italic toggle="yes">Ind. Labor Relat. Rev.</italic>
</source>
                    <year>2005</year>.
                    <pub-id pub-id-type="doi">10.2189/asqu.2005.50.2.306</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref4">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Chen Yu</surname>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">K-Means clustering.</italic>
</source>
                    <publisher-name>Indiana University</publisher-name>;<year>2020</year>.</mixed-citation>
            </ref>
            <ref id="ref5">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Dadaboyev</surname>
                            <given-names>SMU</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Soomro</surname>
                            <given-names>TR</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bakhsh</surname>
                            <given-names>FA</given-names>
                        </name>
</person-group>:
                    <article-title>Role of artificial intelligence in employee recruitment: a systematic literature review.</article-title>
                    <source>

                        <italic toggle="yes">Int. J. Inf. Technol.</italic>
</source>
                    <year>2025</year>.
                    <pub-id pub-id-type="doi">10.1007/s44282-025-00246-w</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref6">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Darmi</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Setiawan</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <article-title>Penerapan metode clustering K-Means dalam pengelompokan penjualan produk.</article-title>
                    <source>

                        <italic toggle="yes">Jurnal Media Infotama.</italic>
</source>
                    <year>2016</year>;<volume>12</volume>(<issue>2</issue>):<fpage>148</fpage>&#x2013;<lpage>157</lpage>.</mixed-citation>
            </ref>
            <ref id="ref7">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Davies</surname>
                            <given-names>DL</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bouldin</surname>
                            <given-names>DW</given-names>
                        </name>
</person-group>:
                    <article-title>A cluster separation measure.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Transactions on Pattern Analysis and Machine Intelligence.</italic>
</source>
                    <year>1979</year>;<volume>PAMI-1</volume>:<fpage>224</fpage>&#x2013;<lpage>227</lpage>.
                    <pub-id pub-id-type="doi">10.1109/TPAMI.1979.4766909</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref8">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Div&#x00e1;n</surname>
                            <given-names>M</given-names>
                        </name>
</person-group>:
                    <chapter-title>Data-driven decision making.</chapter-title>
                    <source>

                        <italic toggle="yes">2017 IEEE International Conference on Technological Innovations in ICT for Agriculture and Rural Development (TIAR).</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>2017</year>; pp.<fpage>50</fpage>&#x2013;<lpage>56</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ICTUS.2017.8285973</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref9">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Donald</surname>
                            <given-names>WE</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Van der Heijden</surname>
                            <given-names>BIJM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Manville</surname>
                            <given-names>G</given-names>
                        </name>
</person-group>:
                    <article-title>(Re) Framing sustainable careers: Toward a conceptual model and future research agenda.</article-title>
                    <source>

                        <italic toggle="yes">Career Dev. Int.</italic>
</source>
                    <year>2024</year>;<volume>29</volume>(<issue>5</issue>):<fpage>513</fpage>&#x2013;<lpage>526</lpage>.
                    <pub-id pub-id-type="doi">10.1108/CDI-02-2024-0073</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref10">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <collab>EEOC</collab>
</person-group>:
                    <source>

                        <italic toggle="yes">Select Issues: Assessing Adverse Impact in Software, Algorithms, and Artificial Intelligence Used in Employment Selection Procedures Under Title VII of the Civil Rights Act of 1964 (Technical Assistance; 
                            <bold>EEOC-NVTA-2023-2</bold>, Issue Date: 
                            <bold>2023-05-18</bold>).</italic>
</source>
                    <publisher-name>U.S. Equal Employment Opportunity Commission</publisher-name>;<year>2023</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://data.aclum.org/storage/2025/01/EOCC_www_eeoc_gov_laws_guidance_select-issues-assessing-adverse-impact-software-algorithms-and-artificial.pdf">https://data.aclum.org/storage/2025/01/EOCC_www_eeoc_gov_laws_guidance_select-issues-assessing-adverse-impact-software-algorithms-and-artificial.pdf</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref11">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>El Achmar</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bhagat</surname>
                            <given-names>R</given-names>
                        </name>
</person-group>:
                    <article-title>The conceptual relation between human resource management (HRM) and competency mapping.</article-title>
                    <source>

                        <italic toggle="yes">International Journal of Teaching &amp; Education.</italic>
</source>
                    <year>2023</year>.</mixed-citation>
            </ref>
            <ref id="ref12">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <collab>European Union Parliament and Council</collab>
</person-group>:
                    <italic toggle="yes">Regulation (EU) 2024/1689 &#x2026; (Artificial Intelligence Act).</italic>Official Journal of the European Union, OJ L, 2024/1689, 12.7.2024. EUR-Lex.<year>2024</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://data.europa.eu/eli/reg/2024/1689/oj">https://data.europa.eu/eli/reg/2024/1689/oj</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref13">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Fadhli</surname>
                            <given-names>M</given-names>
                        </name>
</person-group>:
                    <article-title>Manajemen peningkatan mutu pendidikan.</article-title>
                    <source>

                        <italic toggle="yes">Tadbir: Jurnal Studi Manajemen Pendidikan.</italic>
</source>
                    <year>2017</year>;<volume>1</volume>(<issue>2</issue>):<fpage>215</fpage>&#x2013;<lpage>240</lpage>.
                    <pub-id pub-id-type="doi">10.29240/jsmp.v1i2.295</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref14">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Firza</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sarjono</surname>
                            <given-names>S</given-names>
                        </name>
</person-group>:
                    <article-title>Penerapan algoritma K-Means dalam metode clustering untuk peminatan jurusan bagi siswa Swasta Pelita Raya Kota Jambi.</article-title>
                    <source>

                        <italic toggle="yes">Jurnal Manajemen Sistem Informasi.</italic>
</source>
                    <year>2020</year>;<volume>5</volume>(<issue>3</issue>):<fpage>371</fpage>&#x2013;<lpage>382</lpage>.</mixed-citation>
            </ref>
            <ref id="ref15">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Gangl</surname>
                            <given-names>M</given-names>
                        </name>
</person-group>:
                    <article-title>Labor market structure and re-employment rates: Unemployment dynamics in West Germany and the United States.</article-title>
                    <source>

                        <italic toggle="yes">Research in Social Stratification and Mobility.</italic>
</source>
                    <year>2003</year>;<volume>20</volume>:<fpage>185</fpage>&#x2013;<lpage>224</lpage>.
                    <pub-id pub-id-type="doi">10.1016/S0276-5624(03)20004-4</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref16">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Gie</surname>
                            <given-names>W</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Jollyta</surname>
                            <given-names>D</given-names>
                        </name>
</person-group>:
                    <article-title>Perbandingan Euclidean dan Manhattan untuk optimasi cluster menggunakan Davies-Bouldin Index: Status COVID-19 wilayah Riau.</article-title>
                    <source>

                        <italic toggle="yes">Prosiding Seminar Nasional Riset Information Science (SENARIS).</italic>
</source>
                    <year>2020, July</year>;<volume>2</volume>:<fpage>187</fpage>&#x2013;<lpage>191</lpage>.</mixed-citation>
            </ref>
            <ref id="ref17">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Green</surname>
                            <given-names>AE</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hoyos</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>Y</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <source>

                        <italic toggle="yes">Job search study: Literature review and analysis of the Labour Force Survey.</italic>
</source>
                    <publisher-loc>London</publisher-loc>:
                    <publisher-name>Department for Work and Pensions</publisher-name>;<year>2011</year>.</mixed-citation>
            </ref>
            <ref id="ref18">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Hurbean</surname>
                            <given-names>L</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Miliaru</surname>
                            <given-names>F</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Muntean</surname>
                            <given-names>M</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>The impact of business intelligence and analytics adoption on decision-making effectiveness and managerial work performance.</article-title>
                    <source>

                        <italic toggle="yes">Scientific Annals of Economics and Business.</italic>
</source>
                    <year>2023</year>;<volume>70</volume>:<fpage>43</fpage>&#x2013;<lpage>54</lpage>.
                    <pub-id pub-id-type="doi">10.47743/saeb-2023-0012</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref19">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Irmawan</surname>
                            <given-names>I</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sagharmata</surname>
                            <given-names>FA</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ruthriana</surname>
                            <given-names>F</given-names>
                        </name>
</person-group>:
                    <article-title>Analisis dampak pembangunan Kota Hutan (Forest City) (Studi kasus: Ibu Kota Nusantara (IKN), Kalimantan).</article-title>
                    <source>

                        <italic toggle="yes">Prosiding Seminar Rekayasa Teknologi (SemResTek).</italic>
</source>
                    <year>2023</year>;<fpage>299</fpage>&#x2013;<lpage>304</lpage>.</mixed-citation>
            </ref>
            <ref id="ref20">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Jain</surname>
                            <given-names>AK</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Murty</surname>
                            <given-names>MN</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Flynn</surname>
                            <given-names>PJ</given-names>
                        </name>
</person-group>:
                    <article-title>Data clustering: A review.</article-title>
                    <source>

                        <italic toggle="yes">ACM Computing Surveys (CSUR).</italic>
</source>
                    <year>1999</year>;<volume>31</volume>(<issue>3</issue>):<fpage>264</fpage>&#x2013;<lpage>323</lpage>.
                    <pub-id pub-id-type="doi">10.1145/331499.331504</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref21">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Jaya</surname>
                            <given-names>DJ</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sudira</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Raharjo</surname>
                            <given-names>NE</given-names>
                        </name>
</person-group>:
                    <article-title>Vocational teacher professionalisation as human resource development: policy reflections from Indonesia.</article-title>
                    <source>

                        <italic toggle="yes">Int. J. Train. Res.</italic>
</source>
                    <year>2026a</year>:<fpage>1</fpage>&#x2013;<lpage>11</lpage>.
                    <pub-id pub-id-type="doi">10.1080/14480220.2026.2630821</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref22">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Jaya</surname>
                            <given-names>DJ</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ramdhani</surname>
                            <given-names>WM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hamid</surname>
                            <given-names>HWR</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Integrating fuzzy C-means clustering and Random Forest for multivariate performance prediction in vocational education.</article-title>
                    <source>

                        <italic toggle="yes">Commun. Stat. Case Stud. Data Anal. Appl.</italic>
</source>
                    <year>2026b</year>.
                    <pub-id pub-id-type="doi">10.1080/23737484.2026.2640437</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref23">
                <mixed-citation publication-type="data">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Jaya</surname>
                            <given-names>DJ</given-names>
                        </name>
</person-group>:
                    <data-title>Supplementary Materials R2 for &#x201c;Application of K-Means Clustering for Job Applicant Analysis in Construction Firms Using R&#x201d;</data-title>. [Data set].
                    <source>

                        <italic toggle="yes">Zenodo.</italic>
</source>
                    <year>2026</year>.
                    <pub-id pub-id-type="doi">10.5281/zenodo.20070567</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref24">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Kassambara</surname>
                            <given-names>A</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Practical guide to cluster analysis in R.</italic>
</source>
                    <publisher-name>STHDA</publisher-name>;
                    <edition>1st ed. </edition>
                    <year>2017</year>.
                    <ext-link ext-link-type="uri" xlink:href="http://www.sthda.com">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref25">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>London</surname>
                            <given-names>HH</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Principles and techniques of vocational guidance.</italic>
</source>
                    <publisher-loc>Ohio</publisher-loc>:
                    <publisher-name>Charles E. Merrill Publishing Company</publisher-name>;<year>1973</year>.</mixed-citation>
            </ref>
            <ref id="ref26">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Madanchian</surname>
                            <given-names>M</given-names>
                        </name>
</person-group>:
                    <article-title>From Recruitment to Retention: AI Tools for Human Resource Decision-Making.</article-title>
                    <source>

                        <italic toggle="yes">Appl Sci.</italic>
</source>
                    <year>2024</year>;<volume>14</volume>(<issue>24</issue>):<fpage>11750</fpage>.
                    <pub-id pub-id-type="doi">10.3390/app142411750</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref27">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Manikandan</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Caroline</surname>
                            <given-names>AL</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kanniamma</surname>
                            <given-names>D</given-names>
                        </name>
</person-group>:
                    <article-title>The study on clustering analysis in data mining.</article-title>
                    <source>

                        <italic toggle="yes">International Journal of Data Mining Techniques and Applications.</italic>
</source>
                    <year>2018</year>;<volume>7</volume>(<issue>1</issue>):<fpage>46</fpage>&#x2013;<lpage>49</lpage>.</mixed-citation>
            </ref>
            <ref id="ref28">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <collab>National Institute of Standards and Technology (NIST)</collab>
</person-group>:
                    <italic toggle="yes">Artificial Intelligence Risk Management Framework (AI RMF 1.0).</italic>
                    <year>2023</year>.
                    <pub-id pub-id-type="doi">https://doi.org/10.6028/NIST.AI.100-1</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref29">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Pala</surname>
                            <given-names>SK</given-names>
                        </name>
</person-group>:
                    <article-title>Use and applications of data analytics in human resource management and talent acquisition.</article-title>
                    <source>

                        <italic toggle="yes">International Journal of Enhanced Research in Science, Technology &amp; Engineering.</italic>
</source>
                    <year>2021</year>;<volume>10</volume>:<fpage>2319</fpage>&#x2013;<lpage>7463</lpage>.</mixed-citation>
            </ref>
            <ref id="ref30">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Purba</surname>
                            <given-names>W</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Tamba</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Saragih</surname>
                            <given-names>J</given-names>
                        </name>
</person-group>:
                    <article-title>The effect of mining data K-Means clustering toward students profile model drop out potential.</article-title>
                    <source>

                        <italic toggle="yes">IOP Conference Series: Journal of Physics.</italic>
</source>
                    <year>2018</year>;<volume>1007</volume>(<issue>1</issue>):<fpage>012046</fpage>&#x2013;<lpage>012049</lpage>.
                    <pub-id pub-id-type="doi">10.1088/1742-6596/1007/1/012049</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref31">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rawat</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Nadavulakere</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Isenhour</surname>
                            <given-names>L</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Career enhancement strategies, supportive work relationships and subjective career success: The moderating role of family&#x2013;work conflict.</article-title>
                    <source>

                        <italic toggle="yes">Career Dev. Int.</italic>
</source>
                    <year>2024</year>;<volume>29</volume>(<issue>4</issue>):<fpage>421</fpage>&#x2013;<lpage>433</lpage>.
                    <pub-id pub-id-type="doi">10.1108/CDI-06-2023-0160</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref32">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rigotti</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Fosch-Villaronga</surname>
                            <given-names>E</given-names>
                        </name>
</person-group>:
                    <article-title>Fairness, AI &amp; recruitment.</article-title>
                    <source>

                        <italic toggle="yes">Comput. Law Secur. Rev.</italic>
</source>
                    <year>2024</year>;<volume>53</volume>:<fpage>105966</fpage>.
                    <pub-id pub-id-type="doi">10.1016/j.clsr.2024.105966</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref33">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rousseeuw</surname>
                            <given-names>PJ</given-names>
                        </name>
</person-group>:
                    <article-title>Silhouettes: A graphical aid to the interpretation and validation of cluster analysis.</article-title>
                    <source>

                        <italic toggle="yes">J. Comput. Appl. Math.</italic>
</source>
                    <year>1987</year>;<volume>20</volume>:<fpage>53</fpage>&#x2013;<lpage>65</lpage>.
                    <pub-id pub-id-type="doi">10.1016/0377-0427(87)90125-7</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref34">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Smith</surname>
                            <given-names>SC</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Todaro</surname>
                            <given-names>MP</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Economic development.</italic>
</source>
                    <publisher-loc>Boston</publisher-loc>:
                    <publisher-name>Pearson Education</publisher-name>;
                    <edition>12th ed. </edition>
                    <year>2015</year>.</mixed-citation>
            </ref>
            <ref id="ref35">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Supriyanti</surname>
                            <given-names>SS</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kusmayanti</surname>
                            <given-names>JD</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Paluseri</surname>
                            <given-names>ARA</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Pemberdayaan masyarakat sekitar di wilayah Ibu Kota Nusantara.</article-title>
                    <source>

                        <italic toggle="yes">Masyarakat Indonesia.</italic>
</source>
                    <year>2023</year>;<volume>49</volume>(<issue>1</issue>):<fpage>93</fpage>&#x2013;<lpage>102</lpage>.</mixed-citation>
            </ref>
            <ref id="ref36">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Van der Heijden</surname>
                            <given-names>BIJM</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hofer</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Semeijn</surname>
                            <given-names>J</given-names>
                        </name>
</person-group>:
                    <article-title>&#x201c;Don&#x2019;t you worry &#x2019;bout a thing&#x201d; &#x2013; The moderating role of age in the relationship between qualitative job insecurity and career sustainability.</article-title>
                    <source>

                        <italic toggle="yes">Career Dev. Int.</italic>
</source>
                    <year>2024</year>;<volume>29</volume>(<issue>5</issue>):<fpage>527</fpage>&#x2013;<lpage>543</lpage>.
                    <pub-id pub-id-type="doi">10.1108/CDI-08-2023-0280</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref37">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Venugopal</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Madhavan</surname>
                            <given-names>V</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Prasad</surname>
                            <given-names>R</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Transformative AI in human resource management: enhancing workforce planning with topic modeling.</article-title>
                    <source>

                        <italic toggle="yes">Cogent Bus. Manag.</italic>
</source>
                    <year>2024</year>;<volume>11</volume>(<issue>1</issue>):<fpage>2432550</fpage>.
                    <pub-id pub-id-type="doi">10.1080/23311975.2024.2432550</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref38">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Elm</surname>
                            <given-names>E</given-names>
                            <prefix>von</prefix>
                        </name>

                        <name name-style="western">
                            <surname>Altman</surname>
                            <given-names>DG</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Egger</surname>
                            <given-names>M</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>The Strengthening the Reporting of Observational Studies in Epidemiology (STROBE) Statement: Guidelines for Reporting Observational Studies.</article-title>
                    <source>

                        <italic toggle="yes">PLoS Med.</italic>
</source>
                    <year>2007</year>;<volume>4</volume>(<issue>10</issue>):<fpage>e296</fpage>.
                    <pub-id pub-id-type="pmid">17941714</pub-id>
                    <pub-id pub-id-type="doi">10.1371/journal.pmed.0040296</pub-id>
                    <pub-id pub-id-type="pmcid">PMC2020495</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref39">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Widiyaningtyas</surname>
                            <given-names>T</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Prabowo</surname>
                            <given-names>MIW</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Pratama</surname>
                            <given-names>MAM</given-names>
                        </name>
</person-group>:
                    <chapter-title>Implementation of K-Means clustering to distribution of high school teachers.</chapter-title>
                    <source>

                        <italic toggle="yes">Proceeding EECSI, Yogyakarta, 19&#x2013;21 September.</italic>
</source>
                    <year>2017, September</year>;<fpage>49</fpage>&#x2013;<lpage>54</lpage>.</mixed-citation>
            </ref>
            <ref id="ref40">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Widodo</surname>
                            <given-names>SE</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Manajemen pengembangan sumber daya manusia.</italic>
</source>
                    <publisher-loc>Yogyakarta</publisher-loc>:
                    <publisher-name>Pustaka Pelajar</publisher-name>;<year>2018</year>.</mixed-citation>
            </ref>
            <ref id="ref41">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Wiharto</surname>
                            <given-names>W</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Suryani</surname>
                            <given-names>E</given-names>
                        </name>
</person-group>:
                    <article-title>The comparison of clustering algorithms K-Means and Fuzzy C-Means for segmentation retinal blood vessels.</article-title>
                    <source>

                        <italic toggle="yes">Acta Informatica Medica.</italic>
</source>
                    <year>2020</year>;<volume>28</volume>(<issue>1</issue>):<fpage>42</fpage>&#x2013;<lpage>46</lpage>.
                    <pub-id pub-id-type="doi">10.5455/aim.2020.28.42-47</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref42">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Wu</surname>
                            <given-names>Y</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Pressure from social media: Influence of social media usage on career exploration.</article-title>
                    <source>

                        <italic toggle="yes">Career Dev. Int.</italic>
</source>
                    <year>2024</year>;<volume>29</volume>(<issue>1</issue>):<fpage>93</fpage>&#x2013;<lpage>112</lpage>.
                    <pub-id pub-id-type="doi">10.1108/CDI-01-2023-0016</pub-id>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report468949">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.196340.r468949</article-id>
            <title-group>
                <article-title>Reviewer response for version 2</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Pi&#x015f;irgen</surname>
                        <given-names>Ali</given-names>
                    </name>
                    <xref ref-type="aff" rid="r468949a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0001-7257-2938</uri>
                </contrib>
                <aff id="r468949a1">
                    <label>1</label>Karamano&#x011f;lu Mehmetbey University, Karaman, Turkey</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>20</day>
                <month>4</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Pi&#x015f;irgen A</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport468949" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.172383.2"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>
                <bold>Choosing the number of clusters</bold>
            </p>
            <p> There is an inherent tension: K=3 is motivated by desired recruitment categories, but K should be justified from the data structure as well, otherwise the analysis becomes forced classification by clustering.</p>
            <p> The manuscript should present cluster-number justification more rigorously (e.g., elbow method plus at least one additional diagnostic such as silhouette/gap or stability), and explain that &#x201c;three clusters&#x201d; may be a managerial convenience rather than a natural structure.</p>
            <p> </p>
            <p> 
                <bold>Terminology discipline:</bold>
            </p>
            <p> Use one consistent naming scheme for variables (e.g., &#x201c;AutoCAD drafting&#x201d; vs &#x201c;AutoCAD drawing&#x201d;; &#x201c;planning/supervision report writing&#x201d;). Inconsistencies make reproducibility and interpretation harder, especially if extended data uses different names. Particularly Table 1 and Table 4. Ensure that variable names match</p>
            <p> </p>
            <p> 
                <bold>Reproducibility</bold>
            </p>
            <p> Because this is an applied observational dataset analysis (not a clinical trial, systematic review, or animal study), CONSORT/PRISMA/ARRIVE are not directly applicable; however, STROBE-style completeness standards are useful for reporting observational data and analysis decisions.
                <sup>1</sup>
            </p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Yes</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>No source data required</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Partly</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>My research focuses on data analytics and decision support systems within the field of information systems, with particular emphasis on machine learning, clustering techniques, and data-driven modeling of socio-economic systems such as scientometrics, tourism, marketing.</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <back>
            <ref-list>
                <title>References</title>
                <ref id="rep-ref-468949-1">
                    <label>1</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>The Strengthening the Reporting of Observational Studies in Epidemiology (STROBE) Statement: Guidelines for Reporting Observational Studies</article-title>.
                        <source>
                            <italic>PLoS Medicine</italic>
                        </source>.<year>2007</year>;<volume>4</volume>(<issue>10</issue>) :
                        <elocation-id>10.1371/journal.pmed.0040296</elocation-id>
                        <pub-id pub-id-type="doi">10.1371/journal.pmed.0040296</pub-id>
                    </mixed-citation>
                </ref>
            </ref-list>
        </back>
        <sub-article article-type="response" id="comment16156-468949">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Ramdhani</surname>
                            <given-names>Wahyu Muhammad</given-names>
                        </name>
                        <aff>Educational Research and Evalu, Universitas Negeri Yogyakarta, Yogyakarta, Special Region of Yogyakarta, Indonesia</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>we declare that we have no competing interest in this work.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>7</day>
                    <month>5</month>
                    <year>2026</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Dear Reviewer,</p>
                <p> </p>
                <p> Thank you for your careful and constructive review of our manuscript and for approving the work with reservations. We have revised the manuscript to address each of your comments.</p>
                <p> </p>
                <p> 1. Choosing the number of clusters</p>
                <p> </p>
                <p> Comment:</p>
                <p> There is an inherent tension: K = 3 is motivated by desired recruitment categories, but K should be justified from the data structure as well. The manuscript should present cluster-number justification more rigorously and explain that three clusters may be a managerial convenience rather than a natural structure.</p>
                <p> </p>
                <p> Response:</p>
                <p> We agree with this important point. In the revised manuscript, we now explicitly state that the three-cluster solution was selected partly because it corresponded to the organization&#x2019;s need for an interpretable decision-support structure, but that it should not be interpreted as proof of three naturally distinct applicant groups. We have reframed the three-cluster solution as a managerially interpretable exploratory grouping rather than a definitive natural classification.</p>
                <p> </p>
                <p> We also expanded the cluster-number justification by discussing internal validity diagnostics, including the elbow method, silhouette coefficient, and Davies&#x2013;Bouldin Index. The revised manuscript reports a mean silhouette coefficient of 0.16 and a Davies&#x2013;Bouldin Index of 2.05, which are interpreted cautiously as indicating modest separation rather than strong natural cluster structure.</p>
                <p> </p>
                <p> Changes made:</p>
                <p> The Methods and Results sections now include clearer discussion of cluster-number justification, managerial interpretability, and internal validity diagnostics. The Results, Discussion, and Conclusions have also been revised to avoid overstating the strength or naturalness of the three-cluster solution.</p>
                <p> </p>
                <p> 2. Terminology discipline</p>
                <p> </p>
                <p> Comment:</p>
                <p> Use one consistent naming scheme for variables, especially in Table 1 and Table 4. Inconsistencies make reproducibility and interpretation harder.</p>
                <p> </p>
                <p> Response:</p>
                <p> We agree. We have standardized the terminology across the manuscript, tables, figures, and supplementary materials. The revised manuscript consistently uses the following terms: &#x201c;AutoCAD drafting skills,&#x201d; &#x201c;planning/supervision report-writing skills,&#x201d; and &#x201c;adaptability.&#x201d; We also revised the tables and figure labels to align with this terminology. The previous decision-style labels were replaced with neutral interpretive profile labels to avoid implying automated hiring decisions.</p>
                <p> </p>
                <p> Changes made:</p>
                <p> Table 1 and the results tables have been revised using consistent terminology. The labels &#x201c;Rejected,&#x201d; &#x201c;Under Consideration,&#x201d; and &#x201c;Accepted&#x201d; were replaced with &#x201c;Lower competency profile,&#x201d; &#x201c;Intermediate/mixed competency profile,&#x201d; and &#x201c;Higher competency profile.&#x201d; Revised figures and supplementary materials were also provided.</p>
                <p> </p>
                <p> 3. Reproducibility and reporting completeness</p>
                <p> </p>
                <p> Comment:</p>
                <p> Because this is an applied observational dataset analysis, CONSORT/PRISMA/ARRIVE are not directly applicable; however, STROBE-style completeness standards are useful for reporting observational data and analysis decisions.</p>
                <p> </p>
                <p> Response:</p>
                <p> We agree. We have revised the manuscript to follow STROBE-style completeness principles where relevant. The revised Methods section now clarifies the source of the data, the applicant screening process, the reason for analysing only the 30 shortlisted candidates, the assessment variables, preprocessing decisions, clustering parameters, and limitations of inference.</p>
                <p> </p>
                <p> Changes made:</p>
                <p> We added explicit explanation of the analytical sample, eligibility process, preprocessing decisions, and reporting boundaries. We also cited the STROBE statement and revised the limitations section to clarify the observational and exploratory nature of the study.</p>
                <p> </p>
                <p> 4. Use of supplementary materials</p>
                <p> </p>
                <p> Response:</p>
                <p> We also updated the supplementary materials to improve consistency and reproducibility. The revised extended data include the final R script, clustering outputs, revised figure files, and supporting documentation. The supplementary terminology was updated to match the revised manuscript.</p>
                <p> </p>
                <p> We appreciate the reviewer&#x2019;s comments, which helped us improve the methodological discipline, terminology consistency, and interpretation of the clustering results.</p>
            </body>
        </sub-article>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report467509">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.196340.r467509</article-id>
            <title-group>
                <article-title>Reviewer response for version 2</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Kembuan</surname>
                        <given-names>Olivia</given-names>
                    </name>
                    <xref ref-type="aff" rid="r467509a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0003-4549-0544</uri>
                </contrib>
                <contrib contrib-type="author">
                    <name>
                        <surname>Sangkop</surname>
                        <given-names>Ferdinan</given-names>
                    </name>
                    <xref ref-type="aff" rid="r467509a2">2</xref>
                    <role>Co-referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-6361-7919</uri>
                </contrib>
                <aff id="r467509a1">
                    <label>1</label>Universitas Negeri Manado, Sulawesi Utara, Indonesia</aff>
                <aff id="r467509a2">
                    <label>2</label>informatics, Universitas Negeri Manado (Ringgold ID: 175496), Tondano, North Sulawes, Indonesia</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>23</day>
                <month>3</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Kembuan O and Sangkop F</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport467509" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.172383.2"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>
                <bold>Is the work clearly and accurately presented and does it cite the current literature?</bold>
            </p>
            <p> The manuscript is generally clearly structured and readable.&#x00a0; However, the literature review focuses primarily on clustering algorithms and includes a number of regional or context-specific references. The manuscript would benefit from stronger engagement with more recent international literature on HR analytics, algorithmic decision-making in recruitment, and AI-assisted hiring systems. Incorporating broader global scholarship would strengthen the theoretical grounding of the study.</p>
            <p> 
                <bold>Is the study design appropriate and is the work technically sound?</bold>
            </p>
            <p> Provide a clearer justification for analyzing only the 30 shortlisted candidates and discuss the implications of this sampling decision.</p>
            <p> Although some methodological details are provided, additional clarification of analytical parameters and preprocessing decisions would improve reproducibility.</p>
            <p> 
                <bold>Are the conclusions drawn adequately supported by the results?</bold>
            </p>
            <p> The conclusions generally align with the exploratory nature of the study; however, some claims regarding the usefulness of clustering for improving recruitment decision-making are somewhat stronger than the evidence supports. Because the analysis is based on a small, pre-screened sample and lacks external validation against actual hiring outcomes or job performance, the conclusions should emphasize the illustrative and exploratory nature of the findings rather than suggesting demonstrated improvements in recruitment effectiveness.</p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Partly</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>I cannot comment. A qualified statistician is required.</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>No source data required</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Partly</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Partly</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Data Science</p>
            <p>We confirm that we have read this submission and believe that we have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however we have significant reservations, as outlined above.</p>
        </body>
        <sub-article article-type="response" id="comment16155-467509">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Ramdhani</surname>
                            <given-names>Wahyu Muhammad</given-names>
                        </name>
                        <aff>Educational Research and Evalu, Universitas Negeri Yogyakarta, Yogyakarta, Special Region of Yogyakarta, Indonesia</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>We declare that we have no competing interest on this work.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>7</day>
                    <month>5</month>
                    <year>2026</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Dear Reviewers,</p>
                <p> </p>
                <p> Thank you for your constructive evaluation of our manuscript and for approving the work with reservations. We have revised the manuscript substantially to address your comments.</p>
                <p> </p>
                <p> 1. Engagement with broader international literature</p>
                <p> </p>
                <p> Comment:</p>
                <p> The literature review focused primarily on clustering algorithms and included several regional or context-specific references. The manuscript would benefit from stronger engagement with more recent international literature on HR analytics, algorithmic decision-making in recruitment, and AI-assisted hiring systems.</p>
                <p> </p>
                <p> Response:</p>
                <p> We agree with this comment. In the revised manuscript, we have expanded the literature review by adding a new discussion of HR analytics, algorithm-assisted recruitment, AI-assisted hiring, fairness, transparency, explainability, adverse impact, and human oversight. We incorporated broader international literature and governance-oriented sources to strengthen the theoretical grounding of the study. The revised manuscript now positions K-Means clustering within the wider context of responsible recruitment analytics and decision support rather than only within clustering methodology.</p>
                <p> </p>
                <p> Changes made:</p>
                <p> We revised the Introduction and added a new literature review subsection on HR analytics and algorithm-assisted recruitment. We also added recent international references on AI-assisted recruitment, HR analytics, algorithmic fairness, and AI governance.</p>
                <p> </p>
                <p> 2. Justification for analysing only 30 shortlisted candidates</p>
                <p> </p>
                <p> Comment:</p>
                <p> Provide a clearer justification for analyzing only the 30 shortlisted candidates and discuss the implications of this sampling decision.</p>
                <p> </p>
                <p> Response:</p>
                <p> We agree. The revised manuscript now explains that 161 applicants initially applied, but only 30 candidates passed the company&#x2019;s document-screening procedure and completed in-person competency testing. Only these 30 candidates had complete scores for all three assessment variables. We have clarified that this is a pre-screened analytical sample and that the findings should not be generalized to the full applicant pool or to construction applicants more broadly.</p>
                <p> </p>
                <p> Changes made:</p>
                <p> The Methods section now includes a clearer explanation of the screening procedure, the reason for limiting the analysis to 30 candidates, and the implications of this sampling decision for interpretation and generalizability.</p>
                <p> </p>
                <p> 3. Clarification of analytical parameters and preprocessing decisions</p>
                <p> </p>
                <p> Comment:</p>
                <p> Additional clarification of analytical parameters and preprocessing decisions would improve reproducibility.</p>
                <p> </p>
                <p> Response:</p>
                <p> We have revised the Methods section to clarify the preprocessing and clustering workflow. The revised manuscript states that all variables were measured on the same 0&#x2013;100 scale, that raw scores were retained, that no additional normalization was applied, and that Euclidean squared distance was used in the clustering procedure. We also clarified that detailed clustering outputs and supporting materials are provided as extended data.</p>
                <p> </p>
                <p> Changes made:</p>
                <p> We revised the Methods section on assessment variables, preprocessing, outlier/sensitivity checks, and clustering procedure. We also updated the supplementary materials to align with the revised manuscript terminology.</p>
                <p> </p>
                <p> 4. Claims regarding usefulness of clustering for recruitment decision-making</p>
                <p> </p>
                <p> Comment:</p>
                <p> Some claims regarding the usefulness of clustering for improving recruitment decision-making were stronger than the evidence supports. Because the analysis is based on a small, pre-screened sample and lacks external validation against actual hiring outcomes or job performance, the conclusions should emphasize the illustrative and exploratory nature of the findings.</p>
                <p> </p>
                <p> Response:</p>
                <p> We agree and have revised the manuscript accordingly. The revised version no longer presents clustering as evidence of demonstrated improvement in recruitment effectiveness. Instead, clustering is framed as an exploratory and illustrative decision-support technique for organizing applicant assessment data. We explicitly acknowledge that the analysis was based on a small, pre-screened sample and was not externally validated against hiring outcomes or job performance.</p>
                <p> </p>
                <p> Changes made:</p>
                <p> We revised the Abstract, Results, Discussion, Limitations, and Conclusions to emphasize the exploratory nature of the findings. We also added explicit limitations regarding sample size, pre-screening, lack of external validation, and the need for future studies using larger datasets and job-performance outcomes.</p>
                <p> </p>
                <p> We appreciate the reviewers&#x2019; comments, which helped us strengthen the theoretical framing, methodological transparency, and cautious interpretation of the manuscript.</p>
            </body>
        </sub-article>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report446627">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.190104.r446627</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Gupta</surname>
                        <given-names>Deepak</given-names>
                    </name>
                    <xref ref-type="aff" rid="r446627a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0003-0069-7488</uri>
                </contrib>
                <aff id="r446627a1">
                    <label>1</label>Penn State University, University Park, PA, USA</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>3</day>
                <month>2</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Gupta D</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport446627" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.172383.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>The manuscript addresses a relevant and practically important topic of using K&#x2011;Means clustering to support recruitment decisions in a construction consulting firm. The use of real organizational data, clear cluster descriptions, and intuitive 2D/3D visualizations makes the work accessible and potentially useful for practitioners interested in HR analytics and R-based implementations. However, the current version has substantial methodological and presentation limitations that need to be addressed before the article can be considered for indexing. 
                <list list-type="order">
                    <list-item>
                        <p>The study starts from 161 applicants but analyzes only 30 shortlisted candidates who &#x201c;met the minimum requirements,&#x201d; with no clear justification of the selection criteria or their implications. This design means the clustering is applied to a highly pre-filtered subset rather than the full applicant pool, which severely limits generalizability to &#x201c;recruitment strategies&#x201d; or &#x201c;workforce selection&#x201d; more broadly. The authors should explicitly describe the screening rules used to select the 30 candidates (cut&#x2011;offs, qualitative judgments, etc.). The authors should re-run the analysis on the full set of 161 applicants (if possible and ethically permissible) or reframe the paper as a methodological demonstration on a small, filtered sample and tone down claims about recruitment optimization.</p>
                    </list-item>
                    <list-item>
                        <p>Initial centroids are chosen manually as &#x201c;Rejected = (60,75,85); Considered = (62,77,88); Accepted = (70,84,92)&#x201d; with no methodological justification beyond being &#x201c;chosen randomly,&#x201d; which they are not. These values embed prior expectations about the three groups and risk steering the solution toward a desired structure, rather than letting the algorithm discover patterns in the data. The authors should justify the chosen centroids and make that explicit. In addition, run at least one standard initialization strategy (e.g., built&#x2011;in k-means in R with multiple random starts, or k-means++). The authors should also report whether the manually initialized solution is stable across different initializations; and if not, the conclusions about three clusters and their interpretation need to be more cautious.</p>
                    </list-item>
                    <list-item>
                        <p>The methods mention Euclidean distance and cite general clustering references, but there is no clear statement on whether the three variables were standardized or used in raw form. There is also no discussion of data cleaning beyond a vague reference to removing &#x201c;irrelevant or incomplete data.&#x201d; How many records, if any, were excluded and why? Whether any outliers were identified and how they were handled. The authors should explicitly state whether they standardized the variables before clustering; if not, justify why not and show at least descriptive ranges/variances. They should also provide a proper description of data-cleaning procedure. If outliers exist (some points in the 3D plot appear distant from cluster centers), please clarify whether they influence centroid placement and consider sensitivity analyses.</p>
                    </list-item>
                    <list-item>
                        <p>The discussion and conclusions repeatedly assert that K&#x2011;Means is &#x201c;effective&#x201d; and &#x201c;improves recruitment decision-making,&#x201d; yet there is no external validation. There is no comparison with actual hiring decisions made by the firm. No HR-expert assessment of whether clusters align with real performance or selection outcomes. If such data are not available, please qualify all claims about decision-making benefits as exploratory.</p>
                    </list-item>
                    <list-item>
                        <p>The author states in the &#x201c;Underlying data&#x201d; section that the dataset is not publicly available due to confidentiality and must be requested via the corresponding author. At the same time, the text refers to R scripts and supplementary materials in a Zenodo repository as extended data. The authors should clarify precisely what is in the Zenodo archive (R code, example data, figures, documentation) and referencing it consistently in the methods and data availability sections. If contractual and legal constraints allow, please consider publishing an anonymized dataset (at least the 30 shortlisted candidates; ideally all 161) with no identifying information. If this is impossible, explicitly justify the restriction and explain how others can still verify the methodology (e.g., via synthetic data included in the Zenodo package).</p>
                    </list-item>
                    <list-item>
                        <p>The conclusions and parts of the discussion are phrased quite strongly (e.g., &#x201c;confirm that the K&#x2011;Means Clustering algorithm is an effective tool&#x201d; and &#x201c;this approach not only addresses challenges in evaluating applicants but also builds a foundation for sustainable talent management&#x201d;), which is not fully justified given the small, preselected sample and lack of external validation.</p>
                    </list-item>
                    <list-item>
                        <p>Minor comments: The authors are suggested to modify the text in the abstract, discussion, and conclusions to reflect that findings are preliminary and illustrative for one firm and one small dataset.</p>
                    </list-item>
                    <list-item>
                        <p>The literature review is generally coherent but heavily focused on clustering and Indonesian/sector-specific references. There is relatively little engagement with the broader international work on AI in recruitment, algorithmic decision-making, or HR analytics.</p>
                    </list-item>
                    <list-item>
                        <p>Tables 2-7 list centroid updates and distances in excessive detail. It is pedagogically useful but makes the manuscript long and difficult to navigate. Some of the tables can be moved to the supplementary information with their summary in the main text.</p>
                    </list-item>
                    <list-item>
                        <p>There are some grammatical errors, please perform a proofread of the manuscript carefully.</p>
                    </list-item>
                </list>
            </p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Partly</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Partly</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Partly</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Partly</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Partly</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>Healthcare, 3D Printing, Artificial Intelligence</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <sub-article article-type="response" id="comment15419-446627">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Ramdhani</surname>
                            <given-names>Wahyu Muhammad</given-names>
                        </name>
                        <aff>Educational Research and Evalu, Universitas Negeri Yogyakarta, Yogyakarta, Special Region of Yogyakarta, Indonesia</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>The authors declare that they have no competing interests.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>6</day>
                    <month>2</month>
                    <year>2026</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Response to Reviewer 2</p>
                <p> 
                    <bold>Deepak Gupta (Penn State University, USA)</bold>
                </p>
                <p> We thank the reviewer for the detailed and technically informed evaluation of our manuscript. The feedback has been instrumental in improving methodological rigor, transparency, and interpretive clarity. Our responses are provided below.</p>
                <p> 
                    <bold>Comment 1: Pre-filtered sample and limited generalizability</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> We fully agree. The manuscript has been explicitly reframed to clarify that the clustering analysis was applied to a 
                    <italic>pre-screened subset</italic> of applicants who passed document screening. This design choice is now clearly justified in the Methods section, and all claims have been moderated accordingly. The study is presented as an 
                    <italic>exploratory analytical illustration</italic> rather than a full recruitment optimization model.</p>
                <p> 
                    <bold>Comment 2: Manual centroid bias and need for robustness checks</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> This concern has been directly addressed. In addition to clarifying the rationale for initial centroid selection, we now report results from 
                    <bold>multiple random initializations</bold> (nstart = 50) using R&#x2019;s kmeans() function. The three-cluster structure remained largely stable across runs, with only minor variation among borderline profiles. These findings are now reported and discussed in the revised manuscript.</p>
                <p> 
                    <bold>Comment 3: Data normalization, outliers, and cleaning</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> The Methods section now explicitly states that all variables were measured on the same 0&#x2013;100 scale, and therefore raw scores were used without normalization. We also added an 
                    <bold>outlier and sensitivity analysis</bold>, including a leave-one-out test removing the most distant observation. This test did not materially change the cluster structure, and validation metrics showed only marginal changes. These results are now reported to support robustness.</p>
                <p> 
                    <bold>Comment 4: Lack of validation against real hiring outcomes</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> We explicitly acknowledge this limitation. The revised manuscript clearly states that no comparison with actual hiring decisions or post-employment performance was possible. All statements regarding recruitment support are now framed as 
                    <italic>illustrative and exploratory</italic>, not empirically validated improvements.</p>
                <p> 
                    <bold>Comment 5: Data availability and Zenodo clarification</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> This issue has been resolved by clearly distinguishing: 
                    <list list-type="bullet">
                        <list-item>
                            <p>Confidential underlying data (not publicly shareable);</p>
                        </list-item>
                        <list-item>
                            <p>Publicly available extended data hosted on Zenodo, including R scripts, figures, clustering outputs, and documentation.</p>
                        </list-item>
                    </list> The Data availability section has been rewritten for clarity and compliance with journal policy.</p>
                <p> 
                    <bold>Comment 6: Excessive tables and manuscript length</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> In line with the suggestion, detailed centroid iteration tables have been moved to 
                    <bold>extended data</bold>. The main text now focuses on final clustering outcomes, visual interpretation, and discussion, substantially improving readability.</p>
                <p> 
                    <bold>Comment 7: Language and proofreading</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> The manuscript has been carefully proofread and revised to improve clarity, reduce repetition, and ensure consistent terminology throughout.</p>
                <p> 
                    <bold>Final note:</bold>
                </p>
                <p> We thank the reviewer for the rigorous and constructive critique. The revisions have significantly strengthened the manuscript&#x2019;s technical soundness, transparency, and responsible positioning within data-driven recruitment research.</p>
            </body>
        </sub-article>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report446632">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.190104.r446632</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Shaikh</surname>
                        <given-names>Sonia Najam</given-names>
                    </name>
                    <xref ref-type="aff" rid="r446632a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0001-7365-1064</uri>
                </contrib>
                <aff id="r446632a1">
                    <label>1</label>Jiangsu University, Zhenjiang, China</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>8</day>
                <month>1</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Shaikh SN</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport446632" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.172383.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>
                <list list-type="bullet">
                    <list-item>
                        <p>The paper presents an interesting and practically valuable idea by using K-Means clustering to support recruitment decision-making in a construction firm. The study groups applicants into rejected, under consideration, and accepted categories based on AutoCAD skills, planning/supervision report ability, and adaptability, and it makes good use of R and visualization techniques to demonstrate the results. The topic is timely and relevant to HR analytics and industry needs, and overall the manuscript is readable, logically structured, and supported by real organizational data, which gives it strong applied significance.</p>
                    </list-item>
                    <list-item>
                        <p>However, while the work is clearly presented, it is only partly sufficient in terms of scientific rigor and presentation quality. The manuscript sometimes becomes repetitive and uses very long tables that make it difficult to follow the narrative smoothly. The literature review is decent, but it leans heavily on regional or context-specific studies, and it would benefit greatly from integrating more current international literature on AI-driven recruitment, algorithmic hiring, fairness, and HR analytics trends. Adding such perspectives would make the study more globally relevant and intellectually grounded.</p>
                    </list-item>
                    <list-item>
                        <p>In terms of study design, the concept is appropriate, but there are some important weaknesses that affect technical soundness. The biggest issue is that the study only analyzed 30 shortlisted candidates out of 161 applicants, without providing a clear justification. This introduces bias and limits how generalizable the findings are. Another concern is the selection of initial centroids, which appears subjective rather than determined using a standard procedure such as random initialization or k-means++. There is also no explanation of whether data normalization was applied, which is important since K-Means relies on Euclidean distance and differences in scale can significantly affect results. These issues really need to be addressed for the paper to be scientifically strong.</p>
                    </list-item>
                    <list-item>
                        <p>The paper partly allows replication because the clustering process is explained carefully and tables clearly trace centroid iterations and cluster formation. However, critical methodological details are missing. There is no detailed explanation of data cleaning, whether any applicants were excluded and why, how outliers were treated, whether ethical permission or company approval was obtained, and what settings were used in R. To make the study convincingly reproducible, the authors should provide anonymized raw data, the R script, and a clearer explanation of all methodological choices.</p>
                    </list-item>
                    <list-item>
                        <p>The analysis and interpretation are also only partly sufficient. Although clustering has been correctly applied and visualizations are very good, the study does not present objective validation of the clusters. There is no numerical reporting of validation metrics such as silhouette score, Davies&#x2013;Bouldin index, or any form of comparison with real hiring outcomes or expert HR evaluation. Without such validation, the findings are mostly descriptive, and the claim that clustering improves recruitment decision-making is not empirically proven. Adding cluster validity results and some form of comparison or evaluation would significantly strengthen the credibility of the conclusions.</p>
                    </list-item>
                    <list-item>
                        <p>Data availability is partly fulfilled. While applicant scores are shown in tables, there is no formal dataset sharing, no supplementary files, and no data availability statement. Reproducibility is an important expectation, so providing anonymized data and the analysis code will help readers trust and build upon the work.</p>
                    </list-item>
                    <list-item>
                        <p>The conclusions are relevant and aligned with the results, but they are currently expressed too strongly considering the methodological limitations and lack of validation. The study needs to acknowledge its limitations, including the small selective sample, potential bias, lack of external validation, and ethical concerns such as fairness and transparency in automated hiring. The tone of the conclusions should be slightly moderated to reflect that the findings are promising but not definitively proven.</p>
                    </list-item>
                    <list-item>
                        <p>Overall, this is a promising and meaningful study with clear practical relevance, strong visualization, and a good foundation. However, to make it scientifically sound and suitable for indexing, the authors must justify or expand the sample, apply standard centroid initialization or explain theirs clearly, normalize or justify scale handling, provide quantitative cluster validation, share data and code, strengthen literature support, and include a more explicit discussion of limitations and ethical considerations.&#x00a0;</p>
                    </list-item>
                </list>
            </p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Partly</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Partly</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Partly</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Partly</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Partly</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>Human Resource Management, Artificial intelligence, Big data analytics capability</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <sub-article article-type="response" id="comment15418-446632">
            <front-stub>
                <contrib-group>
                    <contrib contrib-type="author">
                        <name>
                            <surname>Ramdhani</surname>
                            <given-names>Wahyu Muhammad</given-names>
                        </name>
                        <aff>Educational Research and Evalu, Universitas Negeri Yogyakarta, Yogyakarta, Special Region of Yogyakarta, Indonesia</aff>
                    </contrib>
                </contrib-group>
                <author-notes>
                    <fn fn-type="conflict">
                        <p>
                            <bold>Competing interests: </bold>The authors declare that they have no competing interests.</p>
                    </fn>
                </author-notes>
                <pub-date pub-type="epub">
                    <day>6</day>
                    <month>2</month>
                    <year>2026</year>
                </pub-date>
            </front-stub>
            <body>
                <p>Response to Reviewer 1</p>
                <p> 
                    <bold>Sonia Najam Shaikh (Jiangsu University, China)</bold>
                </p>
                <p> We sincerely thank the reviewer for the careful reading of our manuscript and for the constructive and detailed feedback. We have revised the manuscript substantially to address all major concerns raised. Our point-by-point responses are provided below.</p>
                <p> 
                    <bold>Comment 1: Limited international literature and lack of broader AI/HR analytics perspective</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> Thank you for this important suggestion. We have expanded the literature review and discussion to better situate the study within international debates on data-driven recruitment, employability, and HR analytics. Specifically, we incorporated recent global literature addressing analytical decision support, adaptability, and career sustainability (e.g., Akkermans et al., 2024; Donald et al., 2024; Rawat et al., 2024; Zhang et al., 2024; Van der Heijden et al., 2024).</p>
                <p> In addition, we explicitly positioned clustering as an 
                    <italic>exploratory decision-support tool</italic>, aligned with international guidance on responsible and transparent use of analytics in employment contexts.</p>
                <p> 
                    <bold>Comment 2: Analysis limited to 30 candidates out of 161 applicants</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> We fully agree that this required clearer justification. The revised manuscript now explicitly explains that the clustering analysis was conducted on 30 candidates who passed formal document screening conducted by the company as part of standard recruitment procedures. We clearly state that the study analyzes a 
                    <italic>pre-screened assessment sample</italic>, not the full applicant pool.</p>
                <p> Accordingly, the study has been reframed as an 
                    <italic>exploratory methodological illustration</italic> rather than a comprehensive recruitment optimization model. Limitations related to selection bias and generalizability are now explicitly acknowledged in the Methods, Results, and Conclusions sections.</p>
                <p> 
                    <bold>Comment 3: Subjective centroid selection and lack of standard initialization</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> Thank you for highlighting this critical methodological issue. We have clarified that the manually specified initial centroids were derived from preliminary inspection of score distributions and used for transparency and pedagogical traceability.</p>
                <p> To address concerns regarding subjectivity and robustness, we have now: 
                    <list list-type="order">
                        <list-item>
                            <p>Added a dedicated subsection describing 
                                <bold>multiple random initializations</bold> using the built-in kmeans() function in R (nstart = 50);</p>
                        </list-item>
                        <list-item>
                            <p>Reported 
                                <bold>stability checks</bold>, showing that the three-cluster structure was largely consistent across runs, with only minor variations among borderline cases;</p>
                        </list-item>
                        <list-item>
                            <p>Moderated all interpretations to emphasize that clusters reflect 
                                <italic>similarity patterns</italic>, not predefined hiring categories.</p>
                        </list-item>
                    </list> </p>
                <p> 
                    <bold>Comment 4: Missing details on data cleaning, ethics, and reproducibility</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> This concern has been fully addressed. The revised manuscript now includes: 
                    <list list-type="bullet">
                        <list-item>
                            <p>A clearer description of document screening and data preprocessing;</p>
                        </list-item>
                        <list-item>
                            <p>Explicit confirmation that all analyzed records were complete and measured on the same 0&#x2013;100 scale;</p>
                        </list-item>
                        <list-item>
                            <p>A detailed 
                                <bold>Ethical approval and informed consent</bold> section clarifying the use of fully anonymized secondary data under a formal Data Usage Agreement;</p>
                        </list-item>
                        <list-item>
                            <p>An updated 
                                <bold>Data availability statement</bold>;</p>
                        </list-item>
                        <list-item>
                            <p>An updated 
                                <bold>Zenodo repository</bold> containing R scripts, clustering outputs, and documentation to support reproducibility.</p>
                        </list-item>
                    </list> </p>
                <p> 
                    <bold>Comment 5: Lack of objective cluster validation</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> We agree with this observation. To strengthen technical rigor, we have added a dedicated 
                    <bold>cluster validity assessment</bold> section reporting internal validation metrics. Specifically, we report: 
                    <list list-type="bullet">
                        <list-item>
                            <p>Mean silhouette coefficient (0.16);</p>
                        </list-item>
                        <list-item>
                            <p>Davies&#x2013;Bouldin Index (DBI = 2.05).</p>
                        </list-item>
                    </list> We explicitly interpret these values as 
                    <italic>diagnostic indicators</italic> of modest separation, appropriate for exploratory analysis, and avoid presenting them as evidence of predictive effectiveness.</p>
                <p> 
                    <bold>Comment 6: Overly strong conclusions</bold>
                </p>
                <p> 
                    <bold>Response:</bold>
                </p>
                <p> The Conclusions section has been revised to adopt a more cautious and balanced tone. Claims regarding effectiveness and decision-making improvement are now framed as 
                    <italic>exploratory and context-specific</italic>. Limitations related to sample size, pre-screening, lack of external validation, and ethical considerations are explicitly acknowledged.</p>
                <p> 
                    <bold>Final note:</bold>
                </p>
                <p> We sincerely appreciate the reviewer&#x2019;s thoughtful comments, which have significantly strengthened the manuscript&#x2019;s methodological transparency, analytical caution, and international relevance.</p>
            </body>
        </sub-article>
    </sub-article>
</article>
