<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="data-paper" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.179164.1</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Data Note</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Dataset of multi-focus (Z-stack) images derived from liquid-based cervical cancer cytology specimens</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 1; peer review: awaiting peer review]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Onishi</surname>
                        <given-names>Takafumi</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-2494-1265</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Miyamoto</surname>
                        <given-names>Tomoyuki</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a3">3</xref>
                    <xref ref-type="aff" rid="a4">4</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Osawa</surname>
                        <given-names>Yukihiko</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Shibahara</surname>
                        <given-names>Kazuki</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0009-0003-7060-5857</uri>
                    <xref ref-type="aff" rid="a3">3</xref>
                    <xref ref-type="aff" rid="a4">4</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Nishimori</surname>
                        <given-names>Makoto</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a3">3</xref>
                    <xref ref-type="aff" rid="a4">4</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Yakushiji</surname>
                        <given-names>Hiromasa</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0003-1674-1359</uri>
                    <xref ref-type="aff" rid="a3">3</xref>
                    <xref ref-type="aff" rid="a4">4</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Ohno</surname>
                        <given-names>Setsuyo</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Ohno</surname>
                        <given-names>Eiji</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Funding Acquisition</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Project Administration</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Department of Medical Technology and Sciences, Faculty of Health Sciences, Kyoto Tachibana University, Kyoto, Kyoto, Japan</aff>
                <aff id="a2">
                    <label>2</label>Research Center for Life and Health Sciences, KyotoTachibana University, Kyoto, Kyoto, Japan</aff>
                <aff id="a3">
                    <label>3</label>Department of Medical Life Sciences, School of Medical Life Sciences, Kyushu University of Medical Science, Nobeoka, Miyazaki, Japan</aff>
                <aff id="a4">
                    <label>4</label>Cancer Cell Institute, Kyushu University of Medical Science, Nobeoka, Miyazaki, Japan</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:onishi-ta@tachibana-u.ac.jp">onishi-ta@tachibana-u.ac.jp</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>10</day>
                <month>4</month>
                <year>2026</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2026</year>
            </pub-date>
            <volume>15</volume>
            <elocation-id>502</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>19</day>
                    <month>3</month>
                    <year>2026</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Onishi T et al.</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/15-502/pdf"/>
            <abstract>
                <title>Abstract*</title>
                <sec>
                    <title>Background</title>
                    <p>In cervical cancer screening, cytotechnologists and cytopathologists integrate three-dimensional information by continuously adjusting the microscope&#x2019;s focus to evaluate chromatin structure and nuclear morphology. However, most existing public datasets consist of single-focus 2D images, which do not fully reflect this clinical diagnostic workflow. This study presents the Cervical Cancer Cell Image Database: Multi-focus Cytology Dataset (CCCID) to bridge this gap.</p>
                </sec>
                <sec>
                    <title>Methods</title>
                    <p>Cervical specimens were processed using the BD SurePath&#x2122; LBC technique and Papanicolaou staining. Digitization was performed using a NanoZoomer-XR scanner. For 639 unique fields of view (FOVs), a Z-stack consisting of 11 focal planes was captured at 1.0&#x00a0;&#x03bc;m intervals, resulting in 7,029 images (384&#x00a0;&#x00d7;&#x00a0;384 pixels). Ground-truth labels were established only when six board-certified expert cytotechnologists reached 100% consensus.</p>
                </sec>
                <sec>
                    <title>Conclusions</title>
                    <p>The CCCID provides a high-reliability benchmark for developing machine-learning models that utilize axial (Z-axis) information. It is highly valuable for advancing three-dimensional nuclear morphology analysis, cell segmentation in overlapping clusters, and the evaluation of focus-fusion algorithms in digital cytopathology.</p>
                </sec>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>Multi-focus imaging; Z-stack; Cervical cancer; Liquid-based cytology; Deep learning; Pap smear; cytology; cytopathology.</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1" xlink:href="https://doi.org/10.13039/501100001695">
                    <funding-source>JST CREST</funding-source>
                    <award-id>JPMJCR1786</award-id>
                </award-group>
                <award-group id="fund-2">
                    <funding-source>JST CREST</funding-source>
                    <award-id>JPMJCR20F3</award-id>
                </award-group>
                <award-group id="fund-3">
                    <funding-source>JST AIP Acceleration Research</funding-source>
                    <award-id>JPMJCR23U4</award-id>
                </award-group>
                <funding-statement> &#13;
This work was supported by JST CREST Grant Number JPMJCR1786, JST CREST Grant Number JPMJCR20F3, and JST AIP Acceleration Research Grant Number JPMJCR23U4.&#13;
</funding-statement>
                <funding-statement>
                    <italic>The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</italic>
                </funding-statement>
            </funding-group>
        </article-meta>
    </front>
    <body>
        <sec id="sec4" sec-type="intro">
            <title>Introduction</title>
            <p>Cervical cancer remains a leading cause of cancer-related deaths among women globally, and cytology is central to its early detection.
                <sup>
                    <xref ref-type="bibr" rid="ref1">1</xref>
                </sup> Liquid-based cytology (LBC) is a widely used standard method because of its specimen uniformity. Although image analysis using deep learning has flourished, existing public datasets such as the Herlev dataset,
                <sup>
                    <xref ref-type="bibr" rid="ref2">2</xref>
                </sup> Cervix93,
                <sup>
                    <xref ref-type="bibr" rid="ref3">3</xref>
                </sup> SIPaKMeD,
                <sup>
                    <xref ref-type="bibr" rid="ref4">4</xref>
                </sup> and CRIC Cervix
                <sup>
                    <xref ref-type="bibr" rid="ref5">5</xref>
                </sup> primarily consist of single-focus 2D static images. These do not fully reflect the actual diagnostic process in which cytotechnologists and pathologists integrate three-dimensional information by continuously adjusting the focus to evaluate chromatin structure, nuclear membrane irregularities, and cell overlapping.
                <sup>
                    <xref ref-type="bibr" rid="ref6">6</xref>
                </sup> Even with LBC, cells and nuclei retain a thickness of several to over 10 micrometers. Single-plane 2D images risk losing critical information, such as 3D nuclear morphology. Therefore, this dataset was constructed to provide multi-focus image sequences (Z-stacks) of cervical LBC specimens. By including continuous focal depths for each field of view, this dataset enables the development of analytical methods and artificial intelligence models that consider 3D morphological information, thus reflecting conditions closer to real-world clinical practice.</p>
        </sec>
        <sec id="sec5">
            <title>Materials and methods</title>
            <p>

                <list list-type="order">
                    <list-item>
                        <label>1.</label>
                        <p>Specimen Preparation and LBC Processing</p>
                        <p>Cervical cytology specimens were collected from patients at Nobeoka Prefectural Hospital and Kawasaki Medical University. All samples were processed using the BD SurePath&#x2122; LBC system (BD Diagnostics, Burlington, NC, USA), which employs a density gradient enrichment process to provide a representative monolayer of cells. The processed slides were stained using the standard Papanicolaou staining method to visualize nuclear and cytoplasmic features. This study was conducted in accordance with the Declaration of Helsinki and was approved by the Institutional Review Boards of all participating institutions, including the Ethics Committee of Kyushu University of Medical Science (Approval No. 17&#x2013;19). Informed consent was obtained using an opt-out procedure approved by the ethics committees. The study included only adult participants, and all data were anonymized prior to image extraction and annotation. Written informed consent was waived in accordance with the opt-out procedure approved by the ethics committees, given the retrospective nature of the study and the use of fully anonymized samples.</p>
                    </list-item>
                    <list-item>
                        <label>2.</label>
                        <p>Whole-slide imaging and Digital Acquisition</p>
                        <p>The prepared LBC slides were digitized using a NanoZoomer-XR whole slide imaging scanner (Hamamatsu Photonics, Shizuoka, Japan). Scanning was performed using a 20&#x00d7; objective lens. The proprietary software of the scanner was used to generate whole-slide images in the .ndpi format.</p>
                    </list-item>
                    <list-item>
                        <label>3.</label>
                        <p>Fields of view (FOVs) Selection and Multi-focus (Z-stack) Extraction</p>
                        <p>Specific FOVs representing typical cytological features of each Bethesda category were identified from whole-slide images. For each selected FOV, a multi-focus image sequence (Z-stack) was generated. The extraction process involved capturing 11 distinct focal planes with a vertical interval of 1.0&#x00a0;&#x03bc;m between each plane. The focal range was centered on the optimal focus determined by the expert system, covering a total depth of 10&#x00a0;&#x03bc;m (5&#x00a0;&#x03bc;m above and below the center). The extracted images were cropped into 384&#x00a0;&#x00d7;&#x00a0;384 pixel tiles and converted from the raw.ndpi format to the JPG format with a resolution of 96 dpi for standardized use in machine-learning workflows.</p>
                    </list-item>
                    <list-item>
                        <label>4.</label>
                        <p>Annotation and Consensus Validation</p>
                        <p>The annotation of the dataset was conducted by six board-certified expert cytotechnologists. To facilitate the annotation process, a custom software, &#x201c;Annotation Image Creation Tool,&#x201d; developed by Proassist Ltd., (Osaka, Japan) was used. The annotation protocol was as follows. Each expert independently reviewed the multi-focus image sequences for each FOV. The FOVs were classified into one of the following four categories based on the Bethesda System: negative for intraepithelial lesion or malignancy (NILM), low-grade squamous intraepithelial lesion (LSIL), high-grade squamous intraepithelial lesion (HSIL), squamous cell carcinoma (SCC). In this dataset, these are categorized as &#x201c;SCC_etc,&#x201d; which includes both SCC and adenocarcinoma (AC). A strict consensus rule was applied for inclusion in the final dataset; an FOV was included only if all six experts reached a 100% agreement on the diagnostic classification. The FOVs that did not achieve unanimous agreement were excluded from the dataset to ensure the highest possible ground-truth reliability.</p>
                    </list-item>
                    <list-item>
                        <label>5.</label>
                        <p>Final Dataset Organization</p>
                        <p>The final validated dataset, consisting of 639 FOVs (7,029 total images), was organized into the directory structure described in the Data description section. Each file was named according to its diagnostic class, FOV index, and Z-stack index to facilitate automated processing.</p>
                    </list-item>
                </list>
            </p>
            <sec id="sec6">
                <title>Data description</title>
                <p>CCCID is organized into four main directories named according to the Bethesda System: &#x201c;NILM,&#x201d; &#x201c;LSIL,&#x201d; &#x201c;HSIL,&#x201d; and &#x201c;SCC_etc&#x201d; (
                    <xref ref-type="table" rid="T1">
Table 1</xref>). Each directory contains subfolders corresponding to specific cellular or pathological types (
                    <xref ref-type="table" rid="T2">
Table 2</xref>). The &#x201c;NILM&#x201d; directory contains nine subfolders representing normal or benign cellular components: 1. Superficial-Intermediate Cells, 2. Parabasal-Basal Cells, 3. Glandular Cells (Isolated), 4. Glandular Cells (Cluster), 5. Squamous Metaplastic Cells, 6. Repair Cells, 7. Atrophic Vaginitis, 8. Macrophages, and 9. Neutrophils. The &#x201c;LSIL&#x201d; directory contains four subfolders: 10. Superficial-type Dysplastic Cells, 11. Intermediate-type Dysplastic Cells, 12. Superficial-type Koilocyte, and 13. Intermediate-type Koilocyte. The &#x201c;HSIL&#x201d; directory contains two subfolders: 14. Deep-layer Dysplastic Cells and 15. Carcinoma in situ Cells. The &#x201c;SCC_etc&#x201d; directory contains two subfolders: 16. Squamous Cell Carcinoma and 17. Adenocarcinoma.</p>
                <table-wrap id="T1" orientation="portrait" position="float">
                    <label>
Table 1. </label>
                    <caption>
                        <title>Dataset composition of the cervical cancer cell image database: Multi-focus cytology dataset.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Category</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Folder name</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">No. of FOVs</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Images per FOV</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Total JPG files</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Negative for intraepithelial lesion or malignancy</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">NILM</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">273</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">3,003</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Low-grade squamous intraepithelial lesion</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">LSIL</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">93</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1,023</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">High-grade squamous intraepithelial lesion</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">HSIL</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">69</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">759</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Squamous cell carcinoma and Adenocarcinoma</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">SCC_etc</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">204</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">2,244</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">Total</td>
                                <td colspan="1" rowspan="1"/>
                                <td align="left" colspan="1" rowspan="1" valign="top">639</td>
                                <td colspan="1" rowspan="1"/>
                                <td align="left" colspan="1" rowspan="1" valign="top">7,029</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <p>Fields of view (FOVs), negative for intraepithelial lesion or malignancy (NILM), low-grade squamous intraepithelial lesion (LSIL), high-grade squamous intraepithelial lesion (HSIL), squamous cell carcinoma (SCC_etc).</p>
                    </table-wrap-foot>
                </table-wrap>
                <table-wrap id="T2" orientation="portrait" position="float">
                    <label>
Table 2. </label>
                    <caption>
                        <title>Detailed cellular composition of the cervical cancer cell image database: Multi-focus cytology dataset.</title>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Main folder name</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Subfolder name (cell type)</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">No. of FOVs</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Images per FOV</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Total JPG files</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="left" colspan="1" rowspan="9" valign="middle">NILM</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1. Superficial-Intermediate Cells</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">30</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">330</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">2. Parabasal-Basal Cells</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">30</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">330</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">3. Glandular Cells (Isolated)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">30</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">330</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">4. Glandular Cells (Cluster)</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">13</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">143</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">5. Squamous Metaplastic Cells</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">21</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">231</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">6. Repair Cells</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">6</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">66</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">7. Atrophic Vaginitis</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">21</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">231</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">8. Macrophages</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">91</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1,001</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">9. Neutrophils</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">31</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">341</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="4" valign="middle">LSIL</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">10. Superficial-type Dysplastic Cells</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">121</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">11. Intermediate-type Dysplastic Cells</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">29</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">319</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">12. Superficial-type Koilocyte</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">32</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">352</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">13. Intermediate-type Koilocyte</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">21</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">231</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="2" valign="middle">HSIL</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">14. Deep-layer Dysplastic Cells</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">121</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">15. Carcinoma In Situ Cells</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">58</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">638</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="2" valign="middle">SCC_etc</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">16. Squamous Cell Carcinoma</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">175</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">1,925</td>
                            </tr>
                            <tr>
                                <td align="left" colspan="1" rowspan="1" valign="top">17. Adenocarcinoma</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">29</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">11</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">319</td>
                            </tr>
                            <tr>
                                <td colspan="1" rowspan="1"/>
                                <td align="left" colspan="1" rowspan="1" valign="top">Total</td>
                                <td align="left" colspan="1" rowspan="1" valign="top">639</td>
                                <td colspan="1" rowspan="1"/>
                                <td align="left" colspan="1" rowspan="1" valign="top">7,029</td>
                            </tr>
                        </tbody>
                    </table>
                    <table-wrap-foot>
                        <p>Fields of view (FOVs), negative for intraepithelial lesion or malignancy (NILM), low-grade squamous intraepithelial lesion (LSIL), high-grade squamous intraepithelial lesion (HSIL), squamous cell carcinoma (SCC_etc).</p>
                    </table-wrap-foot>
                </table-wrap>
                <p>Each subfolder contains individual image files in JPG format, representing specific FOVs and their corresponding multi-focus planes.</p>
                <p>The image files follow the naming convention: [Serial Number]_(CenterX, CenterY, Z-stack Index).jpg.
                    <list list-type="bullet">
                        <list-item>
                            <label>&#x2022;</label>
                            <p>[Serial Number]: A unique sequential identifier assigned to each captured FOV.</p>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>[Center X, Center Y]: X and Y coordinates of the center of the FOV within the specimen (&#x03bc;m).</p>
                        </list-item>
                        <list-item>
                            <label>&#x2022;</label>
                            <p>[Z-stack Index]: The focal plane number, ranging from 0 to 10 (representing 11 layers).</p>
                        </list-item>
                    </list>
                </p>
                <p>For example, the file &#x201c;001_(3059,11012,0).jpg&#x201d; represents the first captured image, located at specimen coordinates (3059&#x00a0;&#x03bc;m, 11012&#x00a0;&#x03bc;m), with a focal plane index of 0. The files &#x201c;001_(3059,11012,0).jpg&#x201d; through &#x201c;001_(3059,11012,10).jpg&#x201d; constitute the complete 11-layer Z-stack for the first FOV.</p>
                <p>All images are 384&#x00a0;&#x00d7;&#x00a0;384 pixels with a resolution of 96 dpi. The Z-stack index 0 to 10 corresponds to a focal range captured at 1&#x00a0;&#x03bc;m intervals, providing a comprehensive volumetric view of the cellular and nuclear morphology. A representative image is shown in 
                    <xref ref-type="fig" rid="f1">
Figure 1</xref>.</p>
                <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                    <label>
Figure 1. </label>
                    <caption>
                        <title>The representative multi-focus (Z-stack) images for each category contained in the Cervical Cancer Cell Image Database: Multi-focus Cytology Dataset.</title>
                        <p>Negative for intraepithelial lesion or malignancy (NILM), low-grade squamous intraepithelial lesion (LSIL), high-grade squamous intraepithelial lesion (HSIL), squamous cell carcinoma (SCC), and adenocarcinoma (AC).</p>
                    </caption>
                    <graphic id="gr1" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/197645/c4bf605c-06ec-47a5-8cbf-f5b4db193000_figure1.gif"/>
                </fig>
            </sec>
            <sec id="sec7">
                <title>Value of the data</title>
                <p>CCCID provides unique multi-focus (Z-stack) image sequences of cervical cytology, addressing the limitations of existing single-focus 2D datasets by reflecting the actual diagnostic process used by cytotechnologists and cytopathologists. These data are valuable for developing and evaluating deep learning models that require three-dimensional morphological information, such as chromatin distribution and nuclear membrane irregularities, which are often blurred or lost in single-plane images. The dataset features high ground-truth reliability, as every included image was validated through 100% consensus among six expert cytotechnologists, minimizing interobserver variability in the training data. Researchers can reuse this dataset to benchmark computer-aided diagnosis systems, specifically for testing algorithms designed to handle overlapping cells or thick cell clusters common in LBC specimens. The inclusion of 11 focus layers at 1&#x00a0;&#x03bc;m intervals allows for the exploration of focus-fusion (Extended Depth of Field) algorithms and the study of how vertical focal shifts impact the accuracy of automated cell classification.</p>
            </sec>
            <sec id="sec8">
                <title>Limitations</title>
                <p>Although CCCID provides a high-quality multi-focus resource, several limitations should be noted. First, the data were collected using a specific Whole Slide Imaging scanner (NanoZoomer-XR) and a single LBC preparation method (BD SurePath&#x2122;). Therefore, the visual characteristics of the images may differ from those produced by other scanners or preparation techniques, such as ThinPrep. Second, the dataset focuses on typical diagnostic images where six expert cytotechnologists reached a 100% consensus. This means that highly atypical or &#x201c;borderline&#x201d; cases, which often cause diagnostic disagreement in clinical practice, were intentionally excluded. Third, the number of FOVs varies across categories, resulting in class imbalance among the different cell types. Finally, the Z-stack range is fixed at 11 layers with 1&#x00a0;&#x03bc;m intervals.</p>
            </sec>
        </sec>
        <sec id="sec9">
            <title>Ethical considerations</title>
            <p>In all cases, informed consent was obtained from the patients using an opt-out procedure. This study was conducted in accordance with the Declaration of Helsinki and was approved by the Institutional Review Boards of all participating institutions, including the Ethics Committee of Kyushu University of Medical Science (Approval No. 17&#x2013;19). All patient data were fully anonymized prior to the image extraction and annotation process to ensure the protection of personal information.</p>
        </sec>
        <sec id="sec10">
            <title>Consent to publish</title>
            <p>Cytology samples were used in anonymized form. Consent for the use of clinical samples and associated images for research and publication was obtained through an opt-out procedure approved by the institutional ethics committees, including the Ethics Committee of Kyushu University of Medical Science (Approval No. 17&#x2013;19).</p>
        </sec>
    </body>
    <back>
        <sec id="sec13" sec-type="data-availability">
            <title>Data availability</title>
            <p>Zenodo: Cervical Cancer Cell Image Database: Multi-focus Cytology Dataset (CCCID). 
                <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.5281/zenodo.18904734">https://doi.org/10.5281/zenodo.18904734</ext-link>.
                <sup>
                    <xref ref-type="bibr" rid="ref7">7</xref>
                </sup>
            </p>
            <p>This project contains the following underlying data:
                <list list-type="bullet">
                    <list-item>
                        <label>&#x2022;</label>
                        <p>
CCCID_NILM_part1.zip.7z</p>
                        <p>This file contains image data for: 1. Superficial-Intermediate Cells, 2. Parabasal-Basal Cells, 3. Glandular Cells (Isolated), and 4. Glandular Cells (Cluster).</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>
CCCID_NILM_part2.zip.7z</p>
                        <p>This file contains image data for: 5. Squamous Metaplastic Cells, 6. Repair Cells, 7. Atrophic Vaginitis, 8. Macrophages, and 9. Neutrophils.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>CCCID_LSIL.zip.7z</p>
                        <p>This file contains image data for: 10. Superficial-type Dysplastic Cells, 11. Intermediate-type Dysplastic Cells, 12. Superficial-type Koilocyte, and 13. Intermediate-type Koilocyte.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>CCCID_HSIL.zip.7z</p>
                        <p>This file contains image data for: 14. Deep-layer Dysplastic Cells and 15. Carcinoma in situ Cells.</p>
                    </list-item>
                    <list-item>
                        <label>&#x2022;</label>
                        <p>
CCCID_SCC_etc.zip.7z</p>
                        <p>This file contains image data for: 16. Squamous Cell Carcinoma and 17. Adenocarcinoma.</p>
                    </list-item>
                </list>
            </p>
            <p>Data are available under the terms of the 
                <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution 4.0 International license</ext-link> (CC-BY 4.0).</p>
        </sec>
        <ack>
            <title>Acknowledgements</title>
            <p>We thank Mr. Hideki Hashimoto of Proassist Ltd. for creating the Annotation Image Creation Tool used to construct this dataset.</p>
        </ack>
        <ref-list>
            <title>References</title>
            <ref id="ref1">
                <label>1</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Giansanti</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lastrucci</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Pirrera</surname>
                            <given-names>A</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>AI in cervical cancer cytology diagnostics: A narrative review of cutting-edge studies.</article-title>
                    <source>

                        <italic toggle="yes">Bioengineering (Basel).</italic>
</source>
                    <year>2025</year>;<volume>12</volume>(<issue>7</issue>):<fpage>769</fpage>.
                    <pub-id pub-id-type="pmid">40722461</pub-id>
                    <pub-id pub-id-type="doi">10.3390/bioengineering12070769</pub-id>
                    <pub-id pub-id-type="pmcid">PMC12292208</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Jantzen</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Norup</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Dounias</surname>
                            <given-names>G</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Pap-smear benchmark data for pattern classification, Nature Inspired Smart Information Systems (NiSIS 2005).</article-title>
                    <year>2005</year>;<fpage>1</fpage>&#x2013;<lpage>9</lpage>.</mixed-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Phoulady</surname>
                            <given-names>HA</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Mouton</surname>
                            <given-names>PR</given-names>
                        </name>
</person-group>:
                    <article-title>A new cervical cytology dataset for nucleus detection and image classification (Cervix93) and methods for cervical nucleus detection.</article-title>
                    <year>2018</year>.
                    <pub-id pub-id-type="doi">10.48550/arXiv.1811.09651</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Plissiti</surname>
                            <given-names>ME</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Dimitrakopoulos</surname>
                            <given-names>P</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sfikas</surname>
                            <given-names>G</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>Sipakmed: A new dataset for feature and image based classification of normal and pathological cervical cells in Pap smear images.</chapter-title>
                    <source>

                        <italic toggle="yes">2018 25th IEEE International Conference on Image Processing (ICIP)</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>2018</year>;<fpage>3144</fpage>&#x2013;<lpage>3148</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ICIP.2018.8451588</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Rezende</surname>
                            <given-names>MT</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Silva</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Bernardo</surname>
                            <given-names>F d O</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Cric searchable image database as a public platform for conventional Pap smear cytology data.</article-title>
                    <source>

                        <italic toggle="yes">Sci. Data</italic>
</source>
                    <year>2021</year>;<volume>8</volume>(<issue>1</issue>):<fpage>151</fpage>.
                    <pub-id pub-id-type="pmid">34112812</pub-id>
                    <pub-id pub-id-type="doi">10.1038/s41597-021-00933-8</pub-id>
                    <pub-id pub-id-type="pmcid">PMC8192784</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Miyamoto</surname>
                            <given-names>T</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Osawa</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Nishimori</surname>
                            <given-names>M</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Evaluating the efficacy of multi-focus images in digital cytopathology.</article-title>
                    <source>

                        <italic toggle="yes">Journal of health and welfare investigation.</italic>
</source>
                    <year>2025</year>;<volume>9</volume>:<fpage>1</fpage>&#x2013;<lpage>4</lpage>.
                    <pub-id pub-id-type="doi">10.15069/0002000161</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <mixed-citation publication-type="data">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ohno</surname>
                            <given-names>E</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ohno</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Miyamoto</surname>
                            <given-names>T</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <data-title>Cervical Cancer Cell Image Database: Multi-focus Cytology Dataset (CCCID) (1.0.0).</data-title>[Data set].
                    <source>

                        <italic toggle="yes">Zenodo.</italic>
</source>
                    <year>2026</year>.
                    <pub-id pub-id-type="doi">10.5281/zenodo.18904734</pub-id>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
</article>
