<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="data-paper" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.177481.1</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Data Note</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>CYCLIST+IMU: A synchronized visual&#x2013;inertial dataset for cyclist orientation and perception in urban environments</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 1; peer review: 2 approved with reservations]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>G&#x00f3;mez-Meneses</surname>
                        <given-names>Luis</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Project Administration</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Visualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-0667-7472</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Arias-Correa</surname>
                        <given-names>Mauricio</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Resources</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <xref ref-type="aff" rid="a2">2</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Herrera-Ram&#x00ed;rez</surname>
                        <given-names>Jorge</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Supervision</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a3">3</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Ballesteros</surname>
                        <given-names>John R.</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Data Curation</role>
                    <role content-type="http://credit.niso.org/">Investigation</role>
                    <role content-type="http://credit.niso.org/">Validation</role>
                    <xref ref-type="aff" rid="a4">4</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Faculty of Engineering, Instituto Tecnol&#x00f3;gico Metropolitano, Medell&#x00ed;n, Antioquia, Colombia</aff>
                <aff id="a2">
                    <label>2</label>Design Engineering Research Group (GRID), Universidad EAFIT, Medell&#x00ed;n, Antioquia, Colombia</aff>
                <aff id="a3">
                    <label>3</label>Faculty of Exact and Applied Sciences, Instituto Tecnol&#x00f3;gico Metropolitano, Medell&#x00ed;n, Antioquia, Colombia</aff>
                <aff id="a4">
                    <label>4</label>Department of Computer Science and Decision Sciences, Universidad Nacional de Colombia Sede Medell&#x00ed;n, Medell&#x00ed;n, Antioquia, Colombia</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:luisgomez251811@correo.itm.edu.co">luisgomez251811@correo.itm.edu.co</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>15</day>
                <month>4</month>
                <year>2026</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2026</year>
            </pub-date>
            <volume>15</volume>
            <elocation-id>527</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>13</day>
                    <month>3</month>
                    <year>2026</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 G&#x00f3;mez-Meneses L et al.</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/15-527/pdf"/>
            <abstract>
                <sec>
                    <title>Background</title>
                    <p>Cyclists are among the most vulnerable road users in urban traffic environments. For autonomous vehicles to interact safely and effectively with cyclists, perception systems must go beyond detection and segmentation to include an explicit understanding of cyclist orientation. However, most existing cyclist datasets lack synchronized inertial metadata describing body orientation, limiting their use in multimodal and orientation-aware perception studies.</p>
                </sec>
                <sec>
                    <title>Methods</title>
                    <p>This Data Note presents a multimodal visual&#x2013;inertial dataset acquired using the CYCLIST+IMU framework, which synchronizes monocular RGB images captured from a vehicle-mounted camera with inertial measurements recorded by bicycle-mounted and vehicle-mounted inertial measurement units. Data were collected during multiple real-world urban acquisition sessions, resulting in 3,606 RGB images, each temporally aligned with inertial measurements, including cyclist orientation angles (yaw and roll). From these acquisitions, cyclist-centered image crops were generated and manually annotated, resulting in polygon-based semantic segmentation labels, region-of-interest detection files, and relative depth maps estimated from the RGB images. To improve angular coverage, a targeted data augmentation strategy based on horizontal image flipping was applied to underrepresented orientation ranges, resulting in the generation of 718 additional samples. The final dataset comprises 4,324 synchronized multimodal samples organized in a hierarchical directory structure that preserves one-to-one correspondence across all data modalities.</p>
                </sec>
                <sec>
                    <title>Conclusions</title>
                    <p>The CYCLIST+IMU dataset provides synchronized RGB image crops, inertial orientation metadata, semantic segmentation annotations, relative depth maps, and detection files for 4,324 cyclist instances captured under real urban traffic conditions. By explicitly integrating visual and inertial data with precise temporal alignment and detailed documentation, this dataset enables reproducible research on cyclist orientation estimation, semantic segmentation, and multimodal sensor fusion for intelligent transportation systems.</p>
                </sec>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>Cyclist dataset</kwd>
                <kwd>Visual&#x2013;inertial dataset</kwd>
                <kwd>Cyclist orientation</kwd>
                <kwd>Yaw and roll angles</kwd>
                <kwd>Vulnerable road users</kwd>
                <kwd>Semantic segmentation</kwd>
                <kwd>Depth maps</kwd>
                <kwd>Urban traffic scene</kwd>
            </kwd-group>
            <funding-group>
                <funding-statement>The author(s) declared that no grants were involved in supporting this work.</funding-statement>
            </funding-group>
        </article-meta>
    </front>
    <body>
        <sec id="sec4" sec-type="intro">
            <title>1. Introduction</title>
            <p>Time has proven that conventional cars are remarkably inefficient. They not only consume energy but also erode human health and productivity. The paradox of private ownership exacerbates this, as vehicles spend most of their existence idle, wasting precious space and materials. Driven by these shortcomings, global interest in autonomous vehicles (AVs) has surged since the 1980s, mobilizing universities and industry leaders to rethink the very nature of mobility (
                <xref ref-type="bibr" rid="ref2">Badue et al., 2019</xref>; 
                <xref ref-type="bibr" rid="ref18">Thrun, 2010</xref>; 
                <xref ref-type="bibr" rid="ref17">Narula &amp; Tyagi, 2023</xref>).</p>
            <p>The integration of AVs&#x2014;whether for personal or public use&#x2014;into heterogeneous traffic settings demands an interactive capability that transcends rudimentary obstacle recognition. These systems must interface harmoniously and safely with manual drivers, cyclists, and pedestrians. Within these shared environments, human participants navigate through an intricate web of implicit cues, such as nuanced adjustments in approach speed, alongside explicit signals like eye contact or hand gestures. These interactions establish a mutual consensus that enables the fluid synchronization of future maneuvers among road participants. However, contemporary AV architectures tend to prioritize a strict, rationalist framework of collision avoidance over social negotiation. Consequently, these vehicles frequently manifest non-human patterns, including abrupt halts, hesitant movements, or excessive delays at junctions. Such behaviors disrupt the temporal rhythm of traffic and can, paradoxically, undermine overall systemic safety (
                <xref ref-type="bibr" rid="ref4">Brown &amp; Laurier, 2017</xref>; 
                <xref ref-type="bibr" rid="ref5">Brown, Broth &amp; Vinkhuyzen, 2023</xref>).</p>
            <p>The operational scope of an AV necessitates the accurate identification of both road signage and traffic participants, specifically those lacking a protective mechanical framework&#x2014;such as pedestrians and cyclists. Categorized as &#x2018;Vulnerable Road Users&#x2019; (VRUs), these individuals are exposed to a disproportionate risk of sustaining severe injuries or fatalities in the event of traffic accidents (
                <xref ref-type="bibr" rid="ref10">Flohr, 2018</xref>; 
                <xref ref-type="bibr" rid="ref16">Mannion, 2019</xref>).</p>
            <p>Road traffic injuries have persisted as the twelfth leading cause of death across all age groups globally. Within this context, VRUs account for more than half of the 1.19 million annual fatalities reported by the World Health Organization (
                <xref ref-type="bibr" rid="ref20">WHO, 2023</xref>). As seen in 
                <xref ref-type="fig" rid="f1">
Figure 1</xref>, cyclists account for 5% of these global deaths, a percentage that has increased by nearly 20% over the last decade. This vulnerability is further intensified when cyclists must navigate mixed traffic environments, where safety is predicated on the mutual understanding of motion; a form of social coordination that contemporary autonomous systems still struggle to replicate (
                <xref ref-type="bibr" rid="ref12">Ghoul &amp; Sayed, 2025</xref>; 
                <xref ref-type="bibr" rid="ref15">Lu et al., 2025</xref>).</p>
            <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                <label>
Figure 1. </label>
                <caption>
                    <title>Global percentage distribution of country-reported deaths by road users.</title>
                    <p>Source: (
                        <xref ref-type="bibr" rid="ref20">World Health Organization, 2023</xref>).</p>
                </caption>
                <graphic id="gr1" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195711/91a06d8a-217c-4e82-a684-5f62058a4302_figure1.gif"/>
            </fig>
            <p>Cyclist detection persists as a challenge for AV perception systems, primarily due to the inherent visual complexity associated with non-rigid articulations, highly variable aspect ratios, and a diverse range of spatial orientations. Beyond the technical impediments posed by occlusions and cluttered urban environments, contemporary research underscores that mere classification is insufficient. Systems must achieve a sophisticated understanding of behavioral intent through advanced frameworks (
                <xref ref-type="bibr" rid="ref8">Corral-Soto et al., 2025b</xref>). Consequently, the estimation of orientation angles has transitioned from a secondary metric to a critical precursor for the &#x2018;reflexive adjustment&#x2019; required for an AV to safely navigate and avoid collisions with cyclists (
                <xref ref-type="bibr" rid="ref5">Brown et al., 2023</xref>).</p>
            <p>Despite the technical and social imperatives discussed above, a systematic examination of cyclist datasets published between 2023 and 2025 reveals a significant deficit in metadata fidelity. Contemporary repositories fail to provide three-dimensional orientation parameters (Roll, Pitch, Yaw) integrated with the cyclist&#x2019;s posture within the image frame, as illustrated in 
                <xref ref-type="table" rid="T1">
Table 1</xref>. This lack of data limits the ability of AVs to interpret the cyclist&#x2019;s body language and, consequently, delays the achievement of what 
                <xref ref-type="bibr" rid="ref5">Brown et al. (2023)</xref> term the &#x2018;sociality of traffic&#x2019; for AVs.</p>
            <table-wrap id="T1" orientation="portrait" position="float">
                <label>
Table 1. </label>
                <caption>
                    <title>Comparative analysis of cyclist datasets (2023&#x2013;2025).</title>
                    <p>Source: Authors.</p>
                </caption>
                <table content-type="article-table" frame="hsides">
                    <thead>
                        <tr>
                            <th align="left" colspan="1" rowspan="1" valign="top">Work (APA citation)</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">Dataset characteristics</th>
                            <th align="left" colspan="1" rowspan="1" valign="top">
Does it include orientation angles (Roll, Pitch, Yaw) and acquisition method</th>
                        </tr>
                    </thead>
                    <tbody>
                        <tr>
                            <td align="center" colspan="1" rowspan="1" valign="middle">
                                <xref ref-type="bibr" rid="ref6">Chiang, C. Y., et al. (2024)</xref>. 
                                <italic toggle="yes">AllTheDocks road safety dataset: A cyclist&#x2019;s perspective and experience.</italic>
</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">AllTheDocks: Collected in London through citizen science. Includes video (61.68&#x00a0;km), accelerometer, GPS, and gyroscope data.</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">
                                <bold>No (for cyclists in the image).</bold> The dataset includes gyroscope data (GyroX, GyroY, GyroZ), but these correspond exclusively to the ego-cyclist carrying the camera. Method: Telemetry extracted from helmet-mounted GoPro cameras.</td>
                        </tr>
                        <tr>
                            <td align="center" colspan="1" rowspan="1" valign="middle">
                                <xref ref-type="bibr" rid="ref22">Yan, Z., Li, J., Hang, P., &amp; Sun, J. (2025)</xref>. 
                                <italic toggle="yes">OnSiteVRU: A high-resolution trajectory dataset for high-density vulnerable road users.</italic>
</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">OnSiteVRU: High-resolution trajectory data (0.04&#x00a0;s) collected in China. Covers intersections, road segments, and urban villages with 17,429 VRU trajectories.</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">
                                <bold>No (partial).</bold> Only includes the heading angle (direction of motion relative to the X-axis). Roll and pitch for the cyclist posture in the image are not provided. Method: Extraction using elevated vision cameras (YOLOv7/DeepSORT) and onboard vehicle sensors (LiDAR/IMU).</td>
                        </tr>
                        <tr>
                            <td align="center" colspan="1" rowspan="1" valign="middle">
                                <xref ref-type="bibr" rid="ref11">Goren, D., &amp; Caesar, H. (2025)</xref>. 
                                <italic toggle="yes">BikeScenes: Online LiDAR semantic segmentation for bicycles.</italic>
</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">BikeScenes-lidarseg: LiDAR semantic segmentation dataset captured from a bicycle perspective. Contains 3,021 scans annotated into 29 semantic classes.</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">
                                <bold>No.</bold> Although the SenseBike platform includes an IMU for ego-motion compensation, cyclist metadata corresponds only to semantic segmentation labels, not orientation angles. Method: Offline LiDAR point cloud registration with GLIM and manual scan-level annotation.</td>
                        </tr>
                        <tr>
                            <td align="center" colspan="1" rowspan="1" valign="middle">
                                <xref ref-type="bibr" rid="ref14">Li, M., et al. (2025)</xref>. 
                                <italic toggle="yes">A benchmark for cycling close pass detection from video streams.</italic>
</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">Cyc-CP: Benchmark combining Victorian On-road Cycling (VOC) data and CARLA synthetic data. Focuses on close pass overtaking events.</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">
                                <bold>No (partial).</bold> Predicts allocentric orientation angle (&#x03b8;) of the overtaking vehicle. Roll, pitch, and yaw for cyclist posture are not defined. Method: Monocular 3D detection using FCOS3D on single-view video.</td>
                        </tr>
                        <tr>
                            <td align="center" colspan="1" rowspan="1" valign="middle">
                                <xref ref-type="bibr" rid="ref9">Desai, N. P., Etemad, A., &amp; Greenspan, M. (2025)</xref>. 
                                <italic toggle="yes">CycleCrash: A dataset of bicycle collision videos for collision prediction and analysis.</italic>
</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">CycleCrash: 3,000 dashcam videos with 436,347 frames depicting cyclist collisions and near-miss events.</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">
                                <bold>No.</bold> Direction annotations are limited to five discrete classes (forward, backward, left, right, stationary). Method: Web video curation and manual annotation based on traffic rules.</td>
                        </tr>
                        <tr>
                            <td align="center" colspan="1" rowspan="1" valign="middle">
                                <xref ref-type="bibr" rid="ref7">Corral-Soto, E. R., et al. (2025a)</xref>. 
                                <italic toggle="yes">3DArticCyclists: Generating synthetic articulated 8D pose-controllable cyclist data for computer vision applications.</italic>
</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">3DArticBikes/3DArticCyclists: Hybrid synthetic&#x2013;real dataset addressing cyclist data scarcity for autonomous driving. Includes 11,086 cyclist&#x2013;bicycle configurations.</td>
                            <td align="left" colspan="1" rowspan="1" valign="middle">
                                <bold>Yes.</bold> Provides full 3D orientation parameters (&#x03b8;x, &#x03b8;y, &#x03b8;z corresponding to roll, pitch, and yaw). Method: Synthetic generation using Blender and 3D Gaussian Splatting, with pose refinement via inverse kinematics based on real video data processed with CLIFF.</td>
                        </tr>
                    </tbody>
                </table>
            </table-wrap>
            <p>To address the identified lack of data, this paper presents a multimodal cyclist dataset that synchronizes real-world RGB imagery, depth maps, and semantic segmentation with precise, frame-by-frame inertial telemetry. Unlike contemporary synthetic frameworks&#x2014;such as 3DArticCyclists (
                <xref ref-type="bibr" rid="ref7">Corral-Soto et al., 2025a</xref>)&#x2014;this dataset provides empirical ground truth for three-axis orientation (Roll, Pitch, Yaw) and triaxial acceleration (Ax, Ay, Az). By integrating these dynamic parameters, the proposed dataset enables the training of autonomous navigation models that move beyond rudimentary collision avoidance, facilitating the complex social coordination required to achieve the &#x2018;sociality of traffic&#x2019; (
                <xref ref-type="bibr" rid="ref5">Brown et al., 2023</xref>).</p>
        </sec>
        <sec id="sec5">
            <title>2. Materials and methods</title>
            <sec id="sec6">
                <title>2.1 Data acquisition system</title>
                <p>Cyclist images and synchronized visual&#x2013;inertial data were captured using the CYCLOPS system (cyclists&#x2019; orientation data acquisition system using RGB camera and inertial measurement units). This original development consists of a node located on a vehicle and another on a bicycle. The vehicle node includes a monocular RGB camera, an inertial measurement unit (IMU), an RF transceiver, and a microcontroller. The bicycle node includes an IMU, an RF transceiver, and a microcontroller. The system facilitates the acquisition of images of a moving cyclist and associates each image with both acceleration and orientation angles (Ax, Ay, Az, Roll, Pitch, Yaw), as illustrated in 
                    <xref ref-type="fig" rid="f2">
Figure 2</xref>. Similarly, camera acceleration and orientation angles are acquired at the vehicle to subsequently obtain relative values (cyclist relative to camera) and establish the cyclist&#x2019;s real orientation in each image acquired from the vehicle while both are moving in an urban environment.</p>
                <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                    <label>
Figure 2. </label>
                    <caption>
                        <title>Frame assignment for both the camera attached to a car&#x2019;s windshield (vehicle) and the bicycle&#x2019;s top tube (cyclist).</title>
                        <p>For the vehicle, the axes have been named Xv, Yv, and Zv, and rotations around these axes are ROLLv, PITCHv, and YAWv (respectively). Similarly, the frame for the cyclist has axes Xc, Yc, and Zc, and rotations around these axes are ROLLc, PITCHc, and YAWc (respectively). Source: Adapted from the original in 
                            <xref ref-type="bibr" rid="ref1">Arias-Correa et al. (2024)</xref>.</p>
                    </caption>
                    <graphic id="gr2" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195711/91a06d8a-217c-4e82-a684-5f62058a4302_figure2.gif"/>
                </fig>
                <p>A significant achievement of the CYCLOPS acquisition system lies in the synchronization between images and 6-axis motion data for both actors. Full details regarding the open-source hardware architecture, the IMU-based sensor fusion, and the software suite (VideoCapture) are documented in 
                    <xref ref-type="bibr" rid="ref1">Arias-Correa et al. (2024)</xref>, ensuring complete experimental reproducibility. A general diagram of the hardware and software for each node (cyclist node and camera node) of the CYCLOPS system is presented in 
                    <xref ref-type="fig" rid="f3">
Figure 3</xref>.</p>
                <fig fig-type="figure" id="f3" orientation="portrait" position="float">
                    <label>
Figure 3. </label>
                    <caption>
                        <title>Diagram of the hardware and software for each node of the CYCLOPS system.</title>
                        <p>The block Cyclist includes a printed circuit board (PCB), which comprises an IMU, an Arduino Nano board (Microcontroller-C), and a transceiver HC12 in transmission mode (Transceiver-C) with an antenna. Similarly, the block camera includes the RGB camera mounted on the vehicle&#x2019;s windshield, an IMU (IMU-V), an Arduino Nano board (Microcontroller-V), and a transceiver HC12 (Transceiver-V) with an antenna. Both the camera and the PCB send data to the acquisition software running on a computer. Source: Adapted from the original in 
                            <xref ref-type="bibr" rid="ref1">Arias-Correa et al. (2024)</xref>.</p>
                    </caption>
                    <graphic id="gr3" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195711/91a06d8a-217c-4e82-a684-5f62058a4302_figure3.gif"/>
                </fig>
            </sec>
            <sec id="sec7">
                <title>2.2 Visual&#x2013;inertial data synchronization</title>
                <p>The CYCLOPS system implements a hardware-level synchronization protocol to ensure precise temporal registration between the visual data from the RGB camera and the high-frequency inertial data from the IMU sensors. This synchronization is executed at the point of acquisition via a deterministic software architecture that manages concurrent sensor triggering and logging across both bicycle-mounted and vehicle-mounted nodes. Specifically, each RGB frame is synchronized at the hardware level with a discrete set of inertial measurements captured at the exact timestamp 
                    <italic toggle="yes">t<sub>k</sub></italic> of the camera&#x2019;s shutter release. This one-to-one temporal mapping constitutes the fundamental visual&#x2013;inertial sample of the dataset. For every image captured by the vehicle node, the system captures the cyclist&#x2019;s instantaneous kinematic state, including orientation variables such as yaw<sub>b</sub> and roll<sub>b</sub> referenced to the coordinate frames established during system calibration. Crucially, this process is managed in real time using a unified system clock, which precludes the need for subsequent corrections such as temporal interpolation, resampling, or offline alignment. By avoiding these post-processing steps, the CYCLOPS dataset maintains the integrity of the raw sensor data, providing a high-fidelity, temporally consistent snapshot of the cyclist&#x2019;s pose and motion at the precise moment of visual capture, as seen in 
                    <xref ref-type="fig" rid="f4">
Figure 4</xref>.</p>
                <fig fig-type="figure" id="f4" orientation="portrait" position="float">
                    <label>
Figure 4. </label>
                    <caption>
                        <title>Result of the CYCLOPS acquisition process.</title>
                        <p>The figure shows the output generated by the CYCLOPS system for several consecutive RGB image frames acquired by the vehicle-mounted camera, together with their corresponding inertial measurements stored in format. Each image frame is temporally synchronized with a discrete set of inertial data captured at the exact acquisition instant, establishing a one-to-one correspondence between visual and inertial information. This synchronized visual&#x2013;inertial data product represents the final output of the CYCLOPS framework.</p>
                    </caption>
                    <graphic id="gr4" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195711/91a06d8a-217c-4e82-a684-5f62058a4302_figure4.gif"/>
                </fig>
                <p>All details regarding the CYCLOPS hardware components (including camera and IMU models), synchronization strategy, calibration procedures, and data verification experiments are fully described and validated in 
                    <xref ref-type="bibr" rid="ref1">Arias-Correa et al. (2024)</xref> and are therefore not repeated here.</p>
                <p>Each RGB image captured by the vehicle-mounted camera is associated with a corresponding set of inertial measurements describing the cyclist&#x2019;s motion and orientation at the time of capture. Orientation variables, including yaw and roll, are derived from the inertial measurements and expressed in their respective reference frames as defined by the system configuration. Although the dataset also includes pitch measurements, this variable is not explicitly discussed here because the subsequent analysis and data augmentation procedures focus exclusively on yaw and roll.</p>
            </sec>
            <sec id="sec8">
                <title>2.3 Data Acquisition Protocol</title>
                <p>Data were collected across multiple independent acquisition sessions conducted in urban environments. Each session is identified using the label Adq_x and corresponds to a continuous recording sequence acquired while the cyclist and the acquisition vehicle were in motion under real traffic conditions.</p>
                <p>
During each acquisition session, RGB images of the cyclist were recorded using the vehicle-mounted camera, while inertial measurements describing the cyclist&#x2019;s motion and orientation were simultaneously captured by the bicycle-mounted and vehicle-mounted IMUs. A single sample is defined as an RGB image associated with its corresponding synchronized inertial measurements, including orientation angles such as yaw and roll, as described in 
                    <xref ref-type="sec" rid="sec7">Section 2.2</xref>.</p>
                <p>The acquisition protocol was designed to capture natural cyclist behavior in unconstrained urban scenarios. Data were collected under daytime lighting conditions on public roads, without imposing specific trajectories or maneuvers on the cyclist beyond normal riding behavior.</p>
                <p>Following data collection, a basic quality control process was applied to the acquired data. Samples exhibiting acquisition failures, severe occlusions of the cyclist, or loss of visual&#x2013;inertial synchronization were excluded from the dataset. Only samples in which the cyclist was clearly visible and the corresponding inertial data were successfully recorded were retained for further processing and inclusion in the dataset.</p>
                <p>In this work, a total of 3,606 RGB images were acquired, each associated with its corresponding inertial measurements obtained from the IMU units of the CYCLOPS system. Images and inertial data are stored following a hierarchical file structure designed to preserve the temporal correspondence between each image and its associated orientation and acceleration records. After data acquisition, the RGB images were manually annotated using the DarkLabel tool (
                    <ext-link ext-link-type="uri" xlink:href="https://github.com/darkpgmr/DarkLabel">

                        <italic toggle="yes">https://github.com/darkpgmr/DarkLabel</italic>
</ext-link>) to identify and delineate the cyclist region of interest (ROI). The resulting annotations were exported in YOLO format (*.txt files), providing normalized bounding box coordinates for each cyclist and enabling their direct use in object detection and subsequent analysis pipelines.</p>
            </sec>
            <sec id="sec9">
                <title>2.4 Image processing</title>
                <p>To construct a dataset suitable for computer vision tasks, additional processing was applied to the cyclist region-of-interest (ROI) images extracted from the original RGB images. This processing stage includes manual semantic segmentation of the cyclist and the generation of relative depth maps, as illustrated in 
                    <xref ref-type="fig" rid="f5">
Figure 5</xref>.</p>
                <fig fig-type="figure" id="f5" orientation="portrait" position="float">
                    <label>
Figure 5. </label>
                    <caption>
                        <title>RGB image processing stages.</title>
                        <p>(a) Manual segmentation of the cyclist from RGB images using the LabelMe annotation tool, where the region corresponding to the cyclist is precisely delineated. (b) Depth map estimation from RGB images using an encoder&#x2013;decoder model, generating a complementary geometric representation of the cyclist and the surrounding environment.</p>
                    </caption>
                    <graphic id="gr5" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195711/91a06d8a-217c-4e82-a684-5f62058a4302_figure5.gif"/>
                </fig>
                <p>Polygon-based semantic segmentation of the cyclist was performed using the LabelMe annotation tool (
                    <xref ref-type="bibr" rid="ref19">Russell et al., 2008</xref>), which supports polygon-based annotation and is widely used in computer vision applications. As illustrated in 
                    <xref ref-type="fig" rid="f5">
Figure 5a</xref>, for each RGB image, the region corresponding to the cyclist was manually delineated using polygonal annotations. This procedure was applied to the entire dataset to ensure a consistent and precise definition of the region of interest across all samples. The resulting annotations were stored in JSON format, preserving the geometric information required for subsequent processing and reuse.</p>
                <p>In parallel, the RGB images were processed to obtain depth maps using the Depth Anything model (
                    <xref ref-type="bibr" rid="ref21">Yang et al., 2024</xref>), as shown in 
                    <xref ref-type="fig" rid="f5">
Figure 5b</xref>. Depth Anything follows a foundation-model paradigm and is trained at large scale using unlabeled data, enabling robust generalization across diverse visual scenes. Although alternative approaches such as MiDaS have demonstrated strong performance through supervised and weakly supervised training on curated datasets (
                    <xref ref-type="bibr" rid="ref18">Ranftl et al., 2020</xref>; 
                    <xref ref-type="bibr" rid="ref3">Birkl et al., 2023</xref>), the Depth Anything model was selected due to its ability to produce consistent relative depth estimates without relying on task-specific supervision. The depth maps included in the CYCLIST+IMU dataset represent relative depth and have been stored as 8-bit grayscale images, where depth values (non-metric) were normalized and linearly mapped to the range [0, 255] before saving in JPEG format. These depth maps are provided as complementary geometric context to the RGB images and semantic annotations.</p>
            </sec>
            <sec id="sec10">
                <title>2.5 Data augmentation</title>
                <p>To enhance the coverage of cyclist orientations and increase the angular diversity of the dataset, a data augmentation strategy based on geometric transformations was applied. This strategy was designed to expand the range of represented orientations while preserving the physical coherence and visual consistency of the samples.</p>
                <p>Data augmentation was performed using a horizontal flipping transformation applied to the RGB images. This operation generates additional samples by flipping the original images along the vertical axis, thereby increasing orientation diversity without introducing artificial visual artifacts or altering the geometric structure of the cyclist and the surrounding environment.</p>
                <p>To maintain consistency between the visual content and the associated orientation labels, yaw and roll values were deterministically updated following the transformation. Under horizontal flipping, yaw angles were transformed according to: 
                    <italic toggle="yes">yaw&#x2032;</italic>&#x00a0;=&#x00a0;360&#x00b0;&#x00a0;&#x2212;&#x00a0;
                    <italic toggle="yes">yaw.</italic> Meanwhile, roll values were inverted as: 
                    <italic toggle="yes">roll&#x2032;</italic>&#x00a0;=&#x00a0;&#x2212;
                    <italic toggle="yes">roll.</italic> This transformation was applied only to samples belonging to selected underrepresented yaw intervals, as identified during the dataset validation stage (
                    <xref ref-type="sec" rid="sec13">Section 3.1</xref>).</p>
                <p>An illustrative example of the data augmentation process is shown in 
                    <xref ref-type="fig" rid="f6">
Figure 6</xref>, where the original image, the augmented image, and the corresponding updates to yaw and roll angles are presented.</p>
                <fig fig-type="figure" id="f6" orientation="portrait" position="float">
                    <label>
Figure 6. </label>
                    <caption>
                        <title>Example of data augmentation using horizontal image flipping.</title>
                        <p>The original RGB image and the corresponding augmented image obtained by horizontal flipping are shown. Yaw and roll angles are deterministically updated to preserve geometric consistency, with (
                            <italic toggle="yes">yaw&#x2032;&#x00a0;=&#x00a0;360&#x00b0;&#x00a0;&#x2212;&#x00a0;yaw</italic>) and (
                            <italic toggle="yes">roll&#x2032;&#x00a0;=&#x00a0;&#x2212;roll</italic>
).</p>
                    </caption>
                    <graphic id="gr6" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195711/91a06d8a-217c-4e82-a684-5f62058a4302_figure6.gif"/>
                </fig>
            </sec>
            <sec id="sec11">
                <title>2.6 Dataset structure and organization</title>
                <p>The dataset is organized using a hierarchical directory structure designed to preserve traceability between original acquisitions and all derived data products. At the top level, the dataset is divided into two main directories: Original_Image, containing the raw RGB images, and Image_Crops, which stores all processed cyclist-centered
 data.</p>
                <p>Within Image_Crops, data are grouped into acquisition-level subdirectories labeled Adq_x, where x denotes an independent synchronized recording session, integrating RGB imagery and inertial measurement unit (IMU) data. Each Adq_x directory contains four modality-specific subfolders: RGB_IMAGE (cropped RGB images), Detection (region-of-interest detection files), Polygons (polygon-based semantic segmentation annotations in JSON format), and Depth_Map (relative depth maps).</p>
                <p>Each acquisition session also includes a metadata file (Adq_x.xlsx) consolidating inertial information, including cyclist orientation parameters (yaw and roll), and unique identifiers linking all data modalities. File naming follows the convention Adq_x (n), ensuring a strict one-to-one correspondence among RGB images, detection files, segmentation annotations, depth maps, and inertial measurements.</p>
                <p>An overview of the dataset structure is provided in 
                    <xref ref-type="fig" rid="f7">
Figure 7</xref>, and a summary of dataset contents and file formats is presented in 
                    <xref ref-type="table" rid="T2">
Table 2</xref>.</p>
                <fig fig-type="figure" id="f7" orientation="portrait" position="float">
                    <label>
Figure 7. </label>
                    <caption>
                        <title>Hierarchical organization of the CYCLIST+IMU dataset.</title>
                        <p>The dataset is structured to preserve traceability between the original multimodal acquisitions and all derived data products. Raw RGB images are stored in the Original_Image directory, while processed cyclist-centered data are organized under Image_Crops by acquisition session (Adq_x). Each Adq_x represents a synchronized acquisition unit integrating RGB imagery and inertial measurement unit (IMU) data, including cyclist orientation parameters such as yaw and roll observed from the acquisition vehicle. For each session, cropped RGB images, region-of-interest detection files, relative depth maps, and polygon-based semantic segmentation annotations are stored in modality-specific subdirectories using a consistent naming convention that ensures a strict one-to-one correspondence across data types.</p>
                    </caption>
                    <graphic id="gr7" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195711/91a06d8a-217c-4e82-a684-5f62058a4302_figure7.gif"/>
                </fig>
                <table-wrap id="T2" orientation="portrait" position="float">
                    <label>
Table 2. </label>
                    <caption>
                        <title>Summary of the generated dataset structure.</title>
                        <p>Source: Authors.</p>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Data type</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Format</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Quantity</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Cyclist RGB images</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">.JPG</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">4324</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Segmentation polygons</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">.JSON</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">4324</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Depth maps</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">.JPG</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">4324</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Cyclist detection annotations</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">.TXT</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">4324</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">IMU data</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">.XLSX</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">4324</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>
                    <xref ref-type="table" rid="T2">
Table 2</xref> presents the complete description of the dataset generated in this work.</p>
            </sec>
        </sec>
        <sec id="sec12">
            <title>3. Dataset validation</title>
            <p>A dataset validation procedure was conducted to assess the internal consistency, angular coverage, and coherence of the visual&#x2013;inertial orientation metadata. Validation focuses on descriptive and structural properties of the dataset rather than on model performance, in accordance with the scope of a Data Note.</p>
            <sec id="sec13">
                <title>3.1 Angular consistency and coverage</title>
                <p>The CYCLOPS orientation angles include yaw and roll, which require different statistical treatments due to their measurement domains. Yaw is a periodic variable defined over [0&#x00b0;, 360&#x00b0;), while roll is restricted to a narrow, non-periodic range around zero (approximately &#x2212;20&#x00b0; to 20&#x00b0;).</p>
                <p>Yaw distributions were analysed using circular statistics to avoid discontinuities at the 0&#x00b0;/360&#x00b0; boundary, computing circular mean, median, and deviation with the pycircstat Python library. Roll values were characterised using standard linear descriptive statistics (mean, median, and standard deviation).</p>
                <p>
                    <xref ref-type="fig" rid="f8">
Figure 8</xref> shows the yaw and roll distributions prior to data augmentation, and 
                    <xref ref-type="table" rid="T3">
Table 3</xref> reports the corresponding descriptive statistics, confirming adequate angular coverage of cyclist orientations under real-world riding conditions.</p>
                <fig fig-type="figure" id="f8" orientation="portrait" position="float">
                    <label>
Figure 8. </label>
                    <caption>
                        <title>Distribution of angular variables acquired by the CYCLOPS system.</title>
                        <p>(a) Circular distribution of cyclist orientation angles (yaw), represented using circular statistics to account for the periodic nature of the variable over the [0&#x00b0;, 360&#x00b0;) range. (b) Linear distribution of cyclist inclination angles (roll), analysed using linear statistics due to their bounded range around 0&#x00b0;.</p>
                    </caption>
                    <graphic id="gr8" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195711/91a06d8a-217c-4e82-a684-5f62058a4302_figure8.gif"/>
                </fig>
                <table-wrap id="T3" orientation="portrait" position="float">
                    <label>
Table 3. </label>
                    <caption>
                        <title>Descriptive statistics of the angular variables (
                            <italic toggle="yes">yaw</italic> and 
                            <italic toggle="yes">roll</italic>
) in the CYCLIST+IMU dataset.</title>
                        <p>Source: Authors.</p>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Yaw</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Roll</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Total samples: 3606</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">Total samples: 3606</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Circular mean: 297.05&#x00b0;</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">Mean: 0.44&#x00b0;</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Circular median: 283.81&#x00b0;</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">Median: &#x2212;0.81&#x00b0;</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Circular deviation: 141.12&#x00b0;</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">Standard deviation: 9.68&#x00b0;</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
            <sec id="sec14">
                <title>3.2 Validation of the data augmentation strategy</title>
                <p>The data augmentation procedure based on horizontal image flipping was validated to ensure geometric consistency between RGB images and orientation angles. After augmentation, yaw and roll values were deterministically updated following the transformation rules defined in the Methods section.</p>
                <p>Consistency between augmented images, updated orientation angles, and the associated segmentation polygons, detection files, and relative depth maps was verified through visual inspection. 
                    <xref ref-type="fig" rid="f6">
Figure 6</xref> illustrates the augmentation process, while 
                    <xref ref-type="fig" rid="f9">
Figure 9</xref> shows the post-augmentation distributions of yaw and roll, highlighting the angular regions targeted to improve coverage.</p>
                <fig fig-type="figure" id="f9" orientation="portrait" position="float">
                    <label>
Figure 9. </label>
                    <caption>
                        <title>Post-augmentation distribution of cyclist orientation and inclination variables.</title>
                        <p>(a) Circular distribution of orientation angles (
                            <italic toggle="yes">yaw</italic>) after data augmentation. Angular bins highlighted in red indicate the yaw intervals selected for horizontal flipping and sample augmentation. (b) Linear distribution of inclination angles (
                            <italic toggle="yes">roll</italic>
) after data augmentation. Red-highlighted bins correspond to the roll range associated with the augmented samples, while blue bins represent the remaining original and augmented data.</p>
                    </caption>
                    <graphic id="gr9" orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/195711/91a06d8a-217c-4e82-a684-5f62058a4302_figure9.gif"/>
                </fig>
                <p>
                    <xref ref-type="table" rid="T4">
Table 4</xref> summarizes the descriptive statistics after augmentation, confirming enhanced angular coverage without altering the overall structure of the original dataset.</p>
                <table-wrap id="T4" orientation="portrait" position="float">
                    <label>
Table 4. </label>
                    <caption>
                        <title>Descriptive statistics of the angular variables (
                            <italic toggle="yes">yaw</italic> and 
                            <italic toggle="yes">roll</italic>
) after data augmentation in the CYCLIST+IMU dataset.</title>
                        <p>Source: Authors.</p>
                    </caption>
                    <table content-type="article-table" frame="hsides">
                        <thead>
                            <tr>
                                <th align="left" colspan="1" rowspan="1" valign="top">Yaw</th>
                                <th align="left" colspan="1" rowspan="1" valign="top">Roll</th>
                            </tr>
                        </thead>
                        <tbody>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Total samples: 4324</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">Total samples: 4324</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Circular mean: 307.15&#x00b0;</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">Mean: &#x2212;0.34&#x00b0;</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Circular median: 295.56&#x00b0;</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">Median: &#x2212;0.56&#x00b0;</td>
                            </tr>
                            <tr>
                                <td align="center" colspan="1" rowspan="1" valign="middle">Circular deviation: 140.22&#x00b0;</td>
                                <td align="left" colspan="1" rowspan="1" valign="middle">Standard deviation: 8.94&#x00b0;</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
            </sec>
        </sec>
        <sec id="sec15">
            <title>Ethical considerations</title>
            <p>The data presented in this Data Note were collected in public urban environments under natural traffic conditions. The acquisition protocol consisted of recording cyclist behavior in real-world settings without clinical intervention, behavioral manipulation, or collection of personal identifiers.</p>
            <p>
All cyclists recorded in this dataset were adult volunteers known to the research team and were fully informed about the purpose of the data acquisition and the intended public release of the dataset. Informed consent for participation and publication of anonymized data was obtained verbally prior to data collection. Written consent was not deemed necessary because no personally identifiable information was collected, and all visual data were anonymized prior to public release.</p>
            <p>No personal data such as names, identification numbers, contact information, or biometric identifiers were collected or stored during acquisition. Prior to publication, all captured visual images included in both the publicly released dataset and this manuscript were automatically processed using a YOLO-based face detection model, and any detected facial regions were anonymized through Gaussian blurring (21&#x00a0;&#x00d7;&#x00a0;21 kernel) to prevent individual identification. This anonymization procedure was systematically applied to all applicable captured images before public release.</p>
            <p>Derived data products such as segmentation masks, depth maps, and inertial metadata do not contain identifiable facial information.</p>
            <p>Because the released dataset does not contain personally identifiable information and consists of non-interventional observational recordings conducted with informed adult volunteers in public environments, this study qualifies as research without risk according to Colombian national regulations governing health research involving human participants (Resolution 8430 of 1993, Ministry of Health of Colombia). Under these regulations and applicable institutional guidelines, formal approval from an Institutional Review Board (IRB) or ethics committee was not required.</p>
            <p>The individuals shown in 
                <xref ref-type="fig" rid="f4">
Figures 4</xref>, 
                <xref ref-type="fig" rid="f5">5</xref>, and 
                <xref ref-type="fig" rid="f6">6</xref>, as well as all individuals appearing in the publicly released dataset, correspond to the same adult volunteers who provided informed consent for participation and publication of anonymized images. No third-party individuals were intentionally included in the dataset.</p>
            <p>The study was conducted in accordance with the ethical principles outlined in the Declaration of Helsinki, insofar as applicable to non-interventional observational data collection.</p>
        </sec>
    </body>
    <back>
        <sec id="sec18" sec-type="data-availability">
            <title>Data availability</title>
            <p>Open Science Framework (OSF). CYCLIST+IMU: A synchronized visual&#x2013;inertial dataset for cyclist orientation and perception in urban environments. 
                <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.17605/OSF.IO/HVPKZ">https://doi.org/10.17605/OSF.IO/HVPKZ</ext-link> (
                <xref ref-type="bibr" rid="ref13">G&#x00f3;mez-Meneses et al., 2026</xref>).</p>
            <p>This project contains the following underlying data:
                <list list-type="bullet">
                    <list-item>
                        <label>&#x2022;</label>
                        <p>
CYCLIST_IMU_Dataset.zip (Complete dataset including RGB images, cyclist-centered image crops, inertial measurement files (.xlsx), semantic segmentation polygons (.json), region-of-interest detection annotations (.txt), and relative depth maps (.jpg), organized by acquisition session.)</p>
                    </list-item>
                </list>
            </p>
            <p>Data are available under the terms of the 
                <ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution 4.0 International license</ext-link> (CC BY 4.0).</p>
        </sec>
        <ack>
            <title>Acknowledgements</title>
            <p>The authors have no acknowledgements to declare.</p>
        </ack>
        <ref-list>
            <title>References</title>
            <ref id="ref1">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Arias-Correa</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Robledo</surname>
                            <given-names>S</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Londo&#x00f1;o</surname>
                            <given-names>M</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>CYCLOPS: A cyclists&#x2019; orientation data acquisition system using RGB camera and inertial measurement units (IMU).</article-title>
                    <source>

                        <italic toggle="yes">HardwareX.</italic>
</source>
                    <year>2024</year>;<volume>18</volume>:<fpage>e00534</fpage>.
                    <pub-id pub-id-type="pmid">38690150</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.ohx.2024.e00534</pub-id>
                    <pub-id pub-id-type="pmcid">PMC11059332</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref2">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Badue</surname>
                            <given-names>C</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Guidolini</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Carneiro</surname>
                            <given-names>RV</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Self-driving cars: A survey.</article-title>
                    <source>

                        <italic toggle="yes">Expert Syst. Appl.</italic>
</source>
                    <year>2021</year>;<volume>165</volume>:<fpage>113816</fpage>.
                    <pub-id pub-id-type="doi">10.1016/j.eswa.2020.113816</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref3">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Birkl</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Wofk</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>M&#x00fc;ller</surname>
                            <given-names>M</given-names>
                        </name>
</person-group>:
                    <article-title>MiDaS v3.1 &#x2013; A model zoo for robust monocular relative depth estimation.</article-title>
                    <source>

                        <italic toggle="yes">arXiv preprint arXiv:2307.14460.</italic>
</source>
                    <year>2023</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2307.14460">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref4">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Brown</surname>
                            <given-names>B</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Laurier</surname>
                            <given-names>E</given-names>
                        </name>
</person-group>:
                    <chapter-title>The trouble with autopilots: Assisted and autonomous driving on the social road.</chapter-title>
                    <source>

                        <italic toggle="yes">Proceedings of the 2017 CHI Conference on Human Factors in Computing Systems.</italic>
</source>
                    <publisher-name>ACM</publisher-name>;<year>2017</year>; pp.<fpage>416</fpage>&#x2013;<lpage>429</lpage>.
                    <pub-id pub-id-type="doi">10.1145/3025453.3025462</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref5">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Brown</surname>
                            <given-names>B</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Broth</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Vinkhuyzen</surname>
                            <given-names>E</given-names>
                        </name>
</person-group>:
                    <chapter-title>The halting problem: Video analysis of self-driving cars in traffic.</chapter-title>
                    <source>

                        <italic toggle="yes">Proceedings of the 2023 CHI Conference on Human Factors in Computing Systems.</italic>
</source>
                    <publisher-name>ACM</publisher-name>;<year>2023</year>; pp.<fpage>1</fpage>&#x2013;<lpage>14</lpage>.
                    <pub-id pub-id-type="doi">10.1145/3544548.3581045</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref6">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Chiang</surname>
                            <given-names>CY</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhong</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ding</surname>
                            <given-names>J</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>AllTheDocks road safety dataset: A cyclist's perspective and experience.</chapter-title>
                    <source>

                        <italic toggle="yes">2024 IEEE 99th Vehicular Technology Conference (VTC2024-Spring).</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>2024</year>, <month>June</month>; pp.<fpage>1</fpage>&#x2013;<lpage>5</lpage>.</mixed-citation>
            </ref>
            <ref id="ref7">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Corral-Soto</surname>
                            <given-names>ER</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Liu</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ren</surname>
                            <given-names>Y</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <chapter-title>3DArticCyclists: Generating Synthetic Articulated 8D Pose-Controllable Cyclist Data for Computer Vision Applications.</chapter-title>
                    <source>

                        <italic toggle="yes">2025 IEEE Intelligent Vehicles Symposium (IV).</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>2025</year>, <month>June</month>; pp.<fpage>2114</fpage>&#x2013;<lpage>2121</lpage>.</mixed-citation>
            </ref>
            <ref id="ref8">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Corral-Soto</surname>
                            <given-names>ER</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Liu</surname>
                            <given-names>Y</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Ren</surname>
                            <given-names>Y</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Monocular Visual 8D Pose Estimation for Articulated Bicycles and Cyclists.</article-title>
                    <source>

                        <italic toggle="yes">arXiv preprint arXiv:2510.20158.</italic>
</source>
                    <year>2025</year>.</mixed-citation>
            </ref>
            <ref id="ref9">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Desai</surname>
                            <given-names>NP</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Etemad</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Greenspan</surname>
                            <given-names>M</given-names>
                        </name>
</person-group>:
                    <chapter-title>CycleCrash: A Dataset of Bicycle Collision Videos for Collision Prediction and Analysis.</chapter-title>
                    <source>

                        <italic toggle="yes">2025 IEEE/CVF Winter Conference on Applications of Computer Vision (WACV).</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>2025</year>, <month>February</month>; pp.<fpage>6688</fpage>&#x2013;<lpage>6698</lpage>.</mixed-citation>
            </ref>
            <ref id="ref10">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Flohr</surname>
                            <given-names>FB</given-names>
                        </name>
</person-group>:
                    <source>

                        <italic toggle="yes">Vulnerable road user detection and orientation estimation for context-aware automated driving.</italic>
</source>
                    <publisher-name>Universiteit van Amsterdam</publisher-name>;<year>2018</year>. (Doctoral dissertation). UvA-DARE (Digital Academic Repository).</mixed-citation>
            </ref>
            <ref id="ref11">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Goren</surname>
                            <given-names>D</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Caesar</surname>
                            <given-names>H</given-names>
                        </name>
</person-group>:
                    <article-title>BikeScenes: Online LiDAR Semantic Segmentation for Bicycles.</article-title>
                    <source>

                        <italic toggle="yes">arXiv preprint arXiv:2510.25901.</italic>
</source>
                    <year>2025</year>.</mixed-citation>
            </ref>
            <ref id="ref12">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ghoul</surname>
                            <given-names>T</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Sayed</surname>
                            <given-names>T</given-names>
                        </name>
</person-group>:
                    <article-title>Cyclist safety assessment using autonomous vehicles.</article-title>
                    <source>

                        <italic toggle="yes">Accid. Anal. Prev.</italic>
</source>
                    <year>2025</year>;<volume>212</volume>:<fpage>107923</fpage>.
                    <pub-id pub-id-type="pmid">39837243</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.aap.2025.107923</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref13">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>G&#x00f3;mez-Meneses</surname>
                            <given-names>L</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Arias-Correa</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Herrera-Ram&#x00ed;rez</surname>
                            <given-names>J</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>CYCLIST+IMU: A synchronized visual&#x2013;inertial dataset for cyclist orientation and perception in urban environments [Data set].</article-title>
                    <source>

                        <italic toggle="yes">Open Science Framework.</italic>
</source>
                    <year>2026</year>.
                    <pub-id pub-id-type="doi">10.17605/OSF.IO/HVPKZ</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref14">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Beck</surname>
                            <given-names>B</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Rathnayake</surname>
                            <given-names>T</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>A benchmark for cycling close pass detection from video streams.</article-title>
                    <source>

                        <italic toggle="yes">Transportation Research Part C: Emerging Technologies.</italic>
</source>
                    <year>2025</year>;<volume>174</volume>:<fpage>105112</fpage>.
                    <pub-id pub-id-type="doi">10.1016/j.trc.2025.105112</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref15">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Lu</surname>
                            <given-names>H</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Zhu</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lu</surname>
                            <given-names>C</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Empowering safer socially sensitive autonomous vehicles using human-plausible cognitive encoding.</article-title>
                    <source>

                        <italic toggle="yes">Proc. Natl. Acad. Sci.</italic>
</source>
                    <year>2025</year>;<volume>122</volume>(<issue>21</issue>):<fpage>e2401626122</fpage>.
                    <pub-id pub-id-type="pmid">40388625</pub-id>
                    <pub-id pub-id-type="doi">10.1073/pnas.2401626122</pub-id>
                    <pub-id pub-id-type="pmcid">PMC12130892</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref16">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Mannion</surname>
                            <given-names>P</given-names>
                        </name>
</person-group>:
                    <article-title>Vulnerable road user detection: State-of-the-art and open challenges.</article-title>
                    <source>

                        <italic toggle="yes">arXiv preprint arXiv:1902.03601.</italic>
</source>
                    <year>2019</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/1902.03601">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref17">
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Narula</surname>
                            <given-names>M</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Tyagi</surname>
                            <given-names>D</given-names>
                        </name>
</person-group>:
                    <chapter-title>Autonomous cars: A comprehensive survey.</chapter-title>
                    <source>

                        <italic toggle="yes">2023 Seventh International Conference on Image Information Processing (ICIIP).</italic>
</source>
                    <publisher-name>IEEE</publisher-name>;<year>2023</year>; pp.<fpage>586</fpage>&#x2013;<lpage>590</lpage>.
                    <pub-id pub-id-type="doi">10.1109/ICIIP61524.2023.10537704</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref18">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Thrun</surname>
                            <given-names>S</given-names>
                        </name>
</person-group>:
                    <article-title>Toward robotic cars.</article-title>
                    <source>

                        <italic toggle="yes">Commun. ACM.</italic>
</source>
                    <year>2010</year>;<volume>53</volume>(<issue>4</issue>):<fpage>99</fpage>&#x2013;<lpage>106</lpage>.
                    <pub-id pub-id-type="doi">10.1145/1721654.1721679</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref81">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Ranftl</surname>
                            <given-names>R</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Lasinger</surname>
                            <given-names>K</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hafner</surname>
                            <given-names>D</given-names>
                        </name>
                        <etal/>
</person-group>:
                    <article-title>Towards robust monocular depth estimation: Mixing datasets for zero-shot cross-dataset transfer.</article-title>
                    <source>

                        <italic toggle="yes">IEEE Transactions on Pattern Analysis and Machine Intelligence.</italic>
</source>
                    <year>2022</year>;<volume>44</volume>(<issue>3</issue>):<fpage>1623</fpage>&#x2013;<lpage>1637</lpage>.
                    <pub-id pub-id-type="doi">10.1109/TPAMI.2020.3019967</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref19">
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Russell</surname>
                            <given-names>BC</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Torralba</surname>
                            <given-names>A</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Murphy</surname>
                            <given-names>KP</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>LabelMe: A Database and Web-Based Tool for Image Annotation.</article-title>
                    <source>

                        <italic toggle="yes">Int. J. Comput. Vis.</italic>
</source>
                    <year>2008</year>;<volume>77</volume>(<issue>1&#x2013;3</issue>):<fpage>157</fpage>&#x2013;<lpage>173</lpage>.
                    <pub-id pub-id-type="doi">10.1007/s11263-007-0090-8</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref20">
                <mixed-citation publication-type="other">
                    <collab>World Health Organization</collab>:
                    <article-title>Global status report on road safety 2023.</article-title>
                    <year>2023</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://www.who.int/publications/i/item/9789240086517">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref21">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Yang</surname>
                            <given-names>L</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Kang</surname>
                            <given-names>B</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Huang</surname>
                            <given-names>Z</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>Depth anything: Unleashing the power of large-scale unlabeled data.</article-title>
                    <source>

                        <italic toggle="yes">arXiv preprint arXiv:2401.10891.</italic>
</source>
                    <year>2024</year>.
                    <ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2401.10891">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref22">
                <mixed-citation publication-type="other">
                    <person-group person-group-type="author">

                        <name name-style="western">
                            <surname>Yan</surname>
                            <given-names>Z</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Li</surname>
                            <given-names>J</given-names>
                        </name>

                        <name name-style="western">
                            <surname>Hang</surname>
                            <given-names>P</given-names>
                        </name>

                        <etal/>
</person-group>:
                    <article-title>OnSiteVRU: A High-Resolution Trajectory Dataset for High-Density Vulnerable Road Users.</article-title>
                    <source>

                        <italic toggle="yes">arXiv preprint arXiv:2503.23365.</italic>
</source>
                    <year>2025</year>.</mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report483535">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.195711.r483535</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Al-Taie</surname>
                        <given-names>Ammar</given-names>
                    </name>
                    <xref ref-type="aff" rid="r483535a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-5156-6245</uri>
                </contrib>
                <aff id="r483535a1">
                    <label>1</label>KAIST, Daejeon, South Korea</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>1</day>
                <month>6</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Al-Taie A</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport483535" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.177481.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>Thank you to the authors for submitting this dataset of cyclists across different angles to support automated vehicle (AV)&#x2013;cyclist interactions.&#x00a0;</p>
            <p> </p>
            <p> The researchers clearly show a strong need for this dataset, as AVs must safely detect and interact with cyclists on shared roads. However, I felt that the authors could make the introduction more accessible to readers as it is currently too technical. For example, rather than saying "Cyclist detection persists as a challenge for AV perception systems, primarily due to the inherent visual complexity associated with non-rigid articulations, highly variable aspect ratios, and a diverse range of spatial orientations" the authors can clearly explain that cyclists are likely to encounter AVs across a range of traffic scenarios, such as intersections, roundabouts or lane merging. This would ground the justification to real use cases and make the introduction more accessible.&#x00a0;</p>
            <p> </p>
            <p> The authors also only determine the orientation of the cyclists in the dataset; I would have liked to see a more elaborate labeling, e.g., specifying the traffic scenario, such as whether it is a roundabout. This could help AVs predict the likely cyclist orientation across different scenarios.&#x00a0;</p>
            <p> </p>
            <p> Moreover, the paper is lacking key citations from the field, including the work of Al-Taie, Von Sawitzky, and Matviienko, who have researched how AVs can communicate with cyclists.</p>
            <p> </p>
            <p> Overall, I feel this is a well-justified dataset. However, it needs a discussion and motivation that would further ground the dataset into real-world scenarios, and citations of key papers in the field.</p>
            <p>Are sufficient details of methods and materials provided to allow replication by others?</p>
            <p>Partly</p>
            <p>Is the rationale for creating the dataset(s) clearly described?</p>
            <p>Yes</p>
            <p>Are the datasets clearly presented in a useable and accessible format?</p>
            <p>Yes</p>
            <p>Are the protocols appropriate and is the work technically sound?</p>
            <p>Partly</p>
            <p>Reviewer Expertise:</p>
            <p>I am a Human-Computer Interaction researcher investigating how Automated Vehicles can successfully and safely communicate their intentions to surrounding road users.</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report479065">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.195711.r479065</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Pappalardo</surname>
                        <given-names>Giuseppina</given-names>
                    </name>
                    <xref ref-type="aff" rid="r479065a1">1</xref>
                    <role>Referee</role>
                </contrib>
                <aff id="r479065a1">
                    <label>1</label>University of Catania, Catania, Italy</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>13</day>
                <month>5</month>
                <year>2026</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2026 Pappalardo G</copyright-statement>
                <copyright-year>2026</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport479065" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.177481.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>The paper presents a valuable multimodal dataset (CYCLIST+IMU) that combines visual and inertial data to improve cyclist perception in urban environments. The dataset is well-structured, technically sound, and addresses a relevant gap in current research by including cyclist orientation information.</p>
            <p> However, several key issues need to be addressed to ensure scientific robustness: 
                <list list-type="bullet">
                    <list-item>
                        <p>
                            <bold>Participant description is insufficient</bold>: there is no clear information on the number, demographics, or variability of cyclists, limiting representativeness.</p>
                    </list-item>
                    <list-item>
                        <p>
                            <bold>Limited scenario diversity</bold>: data are collected under constrained conditions (e.g., daytime only), reducing generalizability.</p>
                    </list-item>
                    <list-item>
                        <p>
                            <bold>Validation is weak</bold>: it relies mainly on descriptive statistics, without assessing annotation quality, synchronization accuracy, or practical usability.</p>
                    </list-item>
                    <list-item>
                        <p>
                            <bold>Figures are unclear</bold>: their size and design make it difficult to interpret results and understand improvements (e.g., after data augmentation).</p>
                    </list-item>
                </list>
            </p>
            <p>Are sufficient details of methods and materials provided to allow replication by others?</p>
            <p>No</p>
            <p>Is the rationale for creating the dataset(s) clearly described?</p>
            <p>Yes</p>
            <p>Are the datasets clearly presented in a useable and accessible format?</p>
            <p>Yes</p>
            <p>Are the protocols appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Cyclist safety</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
    </sub-article>
</article>
