<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.2 20190208//EN" "http://jats.nlm.nih.gov/publishing/1.2/JATS-journalpublishing1.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="1.2" xml:lang="en">
    <front>
        <journal-meta>
            <journal-id journal-id-type="pmc">F1000Research</journal-id>
            <journal-title-group>
                <journal-title>F1000Research</journal-title>
            </journal-title-group>
            <issn pub-type="epub">2046-1402</issn>
            <publisher>
                <publisher-name>F1000 Research Limited</publisher-name>
                <publisher-loc>London, UK</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="doi">10.12688/f1000research.15620.1</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Research Article</subject>
                </subj-group>
                <subj-group>
                    <subject>Articles</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Exploring machine learning: A bibliometric general approach using SciMAT</article-title>
                <fn-group content-type="pub-status">
                    <fn>
                        <p>[version 1; peer review: 2 approved with reservations]</p>
                    </fn>
                </fn-group>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Rincon-Patino</surname>
                        <given-names>Juan</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Formal Analysis</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Software</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-3709-4878</uri>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="yes">
                    <name>
                        <surname>Ramirez-Gonzalez</surname>
                        <given-names>Gustavo</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Methodology</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-1338-8820</uri>
                    <xref ref-type="corresp" rid="c1">a</xref>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <contrib contrib-type="author" corresp="no">
                    <name>
                        <surname>Corrales</surname>
                        <given-names>Juan Carlos</given-names>
                    </name>
                    <role content-type="http://credit.niso.org/">Conceptualization</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Original Draft Preparation</role>
                    <role content-type="http://credit.niso.org/">Writing &#x2013; Review &amp; Editing</role>
                    <xref ref-type="aff" rid="a1">1</xref>
                </contrib>
                <aff id="a1">
                    <label>1</label>Telematic Engineering Department, University of Cauca, Popay&#x00e1;n, Cauca, 190001, Colombia</aff>
            </contrib-group>
            <author-notes>
                <corresp id="c1">
                    <label>a</label>
                    <email xlink:href="mailto:gramirez@unicauca.edu.co">gramirez@unicauca.edu.co</email>
                </corresp>
                <fn fn-type="conflict">
                    <p>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>7</day>
                <month>8</month>
                <year>2018</year>
            </pub-date>
            <pub-date pub-type="collection">
                <year>2018</year>
            </pub-date>
            <volume>7</volume>
            <elocation-id>1210</elocation-id>
            <history>
                <date date-type="accepted">
                    <day>26</day>
                    <month>7</month>
                    <year>2018</year>
                </date>
            </history>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2018 Rincon-Patino J et al.</copyright-statement>
                <copyright-year>2018</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access article distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <self-uri content-type="pdf" xlink:href="https://f1000research.com/articles/7-1210/pdf"/>
            <abstract>
                <p>
                    <bold>Background:</bold> Machine learning is becoming increasingly important for companies and the scientific community. In this study, we perform a bibliometric analysis on machine learning research, in order to provide an overview of the scientific work during the period 2007&#x2013;2017 in this area and to show trends that could be the basis for future developments in the field.</p>
                <p>
                    <bold>Methods:</bold> This study is carried out using the SciMAT tool based on results extracted from Scopus. This analysis shows the strategic diagrams of evolution and a set of thematic networks. The results provide information on broad tendencies of machine learning.</p>
                <p>
                    <bold>Results:</bold> The results show that SciMAT is a useful tool to carry out a science mapping analysis, and emphasize the premise that machine learning has boundless applications and will continue to be an interesting research field in the future.</p>
                <p>
                    <bold>Conclusions:</bold> Some of the conclusions presented in this study show that classification algorithms have been widely studied and represent a relevant tool for generating different machine learning applications. Nonetheless, regression algorithms are becoming increasingly important in the scientific community, allowing the generation of solutions to predict diseases, sales, and yields, for example.</p>
            </abstract>
            <kwd-group kwd-group-type="author">
                <kwd>machine learning</kwd>
                <kwd>science mapping</kwd>
                <kwd>bibliometrics</kwd>
                <kwd>topic analysis</kwd>
                <kwd>SciMAT</kwd>
            </kwd-group>
            <funding-group>
                <award-group id="fund-1" xlink:href="http://dx.doi.org/10.13039/501100005682">
                    <funding-source>Universidad del Cauca</funding-source>
                </award-group>
                <funding-statement>The authors are grateful to the Telematics Engineering Group (GIT) of the University of Cauca for scientific support and to the Innovacci&#x00f3;n Cauca project for the master's scholarship granted to J. Rincon-Patino.</funding-statement>
                <funding-statement>
                    <italic>The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript.</italic>
                </funding-statement>
            </funding-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="intro">
            <title>Introduction</title>
            <p>The machine learning field researches different human learning processes, the theoretical analysis of possible learning algorithms and methods for several application domains
                <sup>
                    <xref ref-type="bibr" rid="ref-1">1</xref>
                </sup>. Studies based on machine learning have allowed scientists and companies to predict mass mortality events
                <sup>
                    <xref ref-type="bibr" rid="ref-2">2</xref>
                </sup>, the quality of water
                <sup>
                    <xref ref-type="bibr" rid="ref-3">3</xref>
                </sup>, segment clients in private banking
                <sup>
                    <xref ref-type="bibr" rid="ref-4">4</xref>
                </sup>, automatically classify text
                <sup>
                    <xref ref-type="bibr" rid="ref-5">5</xref>
                </sup> or support the production of crops, such as cocoa
                <sup>
                    <xref ref-type="bibr" rid="ref-6">6</xref>
                </sup>. Considering the growing interest of the scientific community in machine learning research and its challenges, it is interesting and necessary to analyze the field. A good approach for that purpose is science mapping analysis because it is a different way of visualizing information that allows a new researcher to become familiar with a field. An example of science mapping analysis providing an overview of the conceptual evolution of a field in medicine is proposed in 
                <xref ref-type="bibr" rid="ref-7">7</xref>. In this study, we perform a science mapping analysis to explore machine learning research. The objective of the study is to allow new data analysts to know the current knowledge base about machine learning and to have an initial point to explore applications in this field.</p>
            <p>This article has the following structure: In the 
                <italic toggle="yes">Methods</italic> section, we describe the research methodology, the dataset used, the tool configuration, and how the analysis was performed. The 
                <italic toggle="yes">Results</italic> section presents the results of the science mapping analysis. The conclusions are at the end of the article.</p>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <sec>
                <title>Dataset for visualization analysis</title>
                <p>We used 
                    <ext-link ext-link-type="uri" xlink:href="https://www.scopus.com/">Scopus</ext-link> as the bibliographic source. We looked, in the third quarter of 2017, for references of articles and conferences about machine learning, using this concept as the search keyword (&#x2018;machine AND learning&#x2019;), with results ranging from 2007 to 2017(Q2). The concept was searched for in the article title, abstract and keywords of articles found. These articles were sorted by date (newest first). All the articles, between 2007 and 2017, were taken into account for performing the analysis with the aim of obtaining a general vision of the field.</p>
                <p>We obtained 67,475 records that were saved using RIS format in different files sorted by year. 
                    <xref ref-type="fig" rid="f1">Figure 1</xref> shows a summary of the records, and shows that research in the field of machine learning has been growing steadily. It is important to observe that the results for 2017 are not in the figure since the records extend only to the second quarter (Q2) of the year and the database is continually updated. However, these results were used for the analysis because they show trends, which is the primary objective of the present study.</p>
                <fig fig-type="figure" id="f1" orientation="portrait" position="float">
                    <label>Figure 1. </label>
                    <caption>
                        <title>Number of documents for Scopus per year for machine learning 2007&#x2013;2017(Q2).</title>
                    </caption>
                    <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure1.gif"/>
                </fig>
            </sec>
            <sec>
                <title>Parameter design</title>
                <p>We used the records from Scopus for executing the analysis with 
                    <ext-link ext-link-type="uri" xlink:href="http://sci2s.ugr.es/scimat/">SciMAT version 1.1.04</ext-link>. In this tool, the unit of analysis was Words. First, we performed a deduplication process, grouping similar words (by plurals) and looking for synonyms or duplicates in words with the highest number of documents and repetitions, always trying to avoid bias to include the largest number of terms. After that, we divided the time interval (2007&#x2013;2017) into six smaller periods: 2007&#x2013;2009, 2010&#x2013;2012, 2013&#x2013;2014, 2015, 2016, 2017(Q2 &#x2013; published papers up to the second quarter of the year). We distributed the gaps this way in order to have a comparable number of articles in each one of them. Finally, we carried out the analysis with the following configuration: all the periods, author&#x2019;s words as the unit of analysis, a minimum frequency for data reduction of 100 (except for 2017 (Q2) with 50) and co-occurrence as a kind of network. Other configurations were: network reduction equal to one, association strength as a normalization measure, Simple centers algorithm with a maximum net size of seven and a minimum of five, core mapper for the document mapper, h-index and Sum citations as the quality measures and, lastly, association strength for the evolution and overlapping map.</p>
            </sec>
            <sec>
                <title>Analysis design</title>
                <p>SciMAT shows a spatial representation of the way disciplines, fields, specialties and documents or authors are related to one another
                    <sup>
                        <xref ref-type="bibr" rid="ref-8">8</xref>&#x2013;
                        <xref ref-type="bibr" rid="ref-10">10</xref>
                    </sup>. For this purpose, the tool implements a longitudinal framework, which takes as its base a co-word analysis and the h-index. Co-word analysis firstly provides information on the themes of a research field and, secondly, enables the analysis and tracking of the evolution of a study field throughout consecutive periods of time
                    <sup>
                        <xref ref-type="bibr" rid="ref-11">11</xref>
                    </sup>. The h-index is used to measure the impact of the various identified thematic areas
                    <sup>
                        <xref ref-type="bibr" rid="ref-8">8</xref>
                    </sup>.</p>
                <p>In this tool, we follow four steps as mentioned by 
                    <xref ref-type="bibr" rid="ref-10">10</xref>: detecting research clusters, drawing strategic diagrams, plotting thematic areas and carrying out a performance analysis. For the first one, the tool creates a keyword co-occurrence network based on 
                    <xref ref-type="bibr" rid="ref-12">12</xref> and 
                    <xref ref-type="bibr" rid="ref-13">13</xref> and clusters the keywords into topics, using the Simple centers algorithm. For the second step, according to 
                    <xref ref-type="bibr" rid="ref-13">13</xref>, the cluster centrality and density rank values are relevant. The centrality measures the intensity of the interaction of a group with the others; if the cluster is strongly related to the field of research, then the link will be stronger. The density measures the intensity of internal links inside the group. According to 
                    <xref ref-type="bibr" rid="ref-8">8</xref> and 
                    <xref ref-type="bibr" rid="ref-10">10</xref>, the themes of the clusters can be classified into four groups using these two measures: (1) Motor themes, which are both well developed and central to the research field; (2) basic and transversal themes, which are not sufficiently developed topics but significant for the area of investigation; (3) emerging or declining themes, which are weakly studied and marginal; (4) highly developed and isolated themes, which have well-developed internal links, but reduced external links and have only minimal importance to the field. The third step is the plotting of thematic areas, and the last one is to conduct the performance analysis. In this study, we analyzed quantitative measures, such as the number of documents and authors.</p>
            </sec>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <p>To analyze the most relevant topics of investigation in different years, SciMAT uses strategic diagrams. We generated a diagram for each period of the study. The charts are divided into four quadrants: the upper-right quadrant alludes to the motor themes, the upper-left quadrant to the highly developed and isolated themes, the lower-right one to the basic and transversal themes, and the lower-left one to the emerging or declining topics
                <sup>
                    <xref ref-type="bibr" rid="ref-9">9</xref>
                </sup>.</p>
            <p>
                <xref ref-type="fig" rid="f2">Figure 2</xref> shows the strategic diagram of the period 2007&#x2013;2009, which has 27 themes. During this time span, OPTIMIZATION, CONTROL-THEORY, and IMAGE-CLASSIFICATION are some of the emerging topics. SEQUENCE-ANALYSIS-PROTEIN appears as the motor theme with the highest density (0.83) and centrality (3.21) values, followed by DATABASES-PROTEIN, with centrality equal to 2.97 and density equal to 0.43. This suggests that machine learning was widely used to study the protein molecule in that period, covering, for example, studies to predict the structure or function of that molecule.</p>
            <fig fig-type="figure" id="f2" orientation="portrait" position="float">
                <label>Figure 2. </label>
                <caption>
                    <title>Strategic diagram of the period 2007&#x2013;2009 for machine learning using data from Scopus.</title>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure2.gif"/>
            </fig>
            <p>Due to the great number of themes that appear in the strategic diagram, we decided to choose three themes, giving priority to those that may have a high impact application. 
                <xref ref-type="fig" rid="f3">Figure 3A</xref> shows the net for the theme DATABASES-PROTEIN, which has a density of 0.43, a centrality of 2.97 and a document count of 322. In this net, we can observe that an important topic is PROTEIN-STRUCTURE. 
                <xref ref-type="fig" rid="f3">Figure 3B</xref> presents the network for the theme DATASETS, which has a density of 0.06, a centrality of 1.37, a document count of 273 and strongly related topics such as CLASSIFIERS, SEMI-SUPERVISED-LEARNING and RANDOM-FOREST. 
                <xref ref-type="fig" rid="f3">Figure 3C</xref> shows the network for the theme IMAGE-CLASSIFICATION, which has a density of 0.11, a centrality of 1.3, a document count of 273 and relevant concepts, such as NEURAL-NETWORKS, SUPPORT-VECTOR-MACHINE (SVM) and IMAGE-PROCESSING.</p>
            <fig fig-type="figure" id="f3" orientation="portrait" position="float">
                <label>Figure 3. </label>
                <caption>
                    <title>Selected thematic networks for period 2007&#x2013;2009 for machine learning using data from Scopus.</title>
                    <p>(
                        <bold>A</bold>) DATABASES-PROTEIN; (
                        <bold>B</bold>) DATASETS; (
                        <bold>C</bold>) IMAGE-CLASSIFICATION.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure3.gif"/>
            </fig>
            <p>
                <xref ref-type="fig" rid="f4">Figure 4</xref> shows the strategic diagram of the period 2010&#x2013;2012. The diagram has 35 themes. During this time span, VIRTUAL-REALITY, ROBOTS, and METADATA are some of the emerging themes, while CLASSIFICATION-ALGORITHM is one of the basic and transversal topics. AGED and PROTEIN-ANALYSIS appear as the motor subjects with the highest density (0.72 and 0.58, respectively) and centrality (1.91 and 2.18, respectively) values. Other important themes are CHEMISTRY and GENETICS. This is a sign that during this period, topics on biology and health began to become relevant in applied machine learning research.</p>
            <fig fig-type="figure" id="f4" orientation="portrait" position="float">
                <label>Figure 4. </label>
                <caption>
                    <title>Strategic diagram of the period 2010&#x2013;2012 for machine learning using data from Scopus.</title>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure4.gif"/>
            </fig>
            <p>From the second period, we selected three thematic networks. 
                <xref ref-type="fig" rid="f5">Figure 5A</xref> shows the net for the theme PROTEIN-ANALYSIS, which has a density of 0.58, a centrality of 2.18 and a document count of 229. This shows us that topics about proteins continue to be important in this period. 
                <xref ref-type="fig" rid="f5">Figure 5B</xref> presents the network for the theme CHEMISTRY, which is an emergent theme and has a density of 0.32, a centrality of 2.24 and a document count of 346. 
                <xref ref-type="fig" rid="f5">Figure 5C</xref> shows the network for the subject VIRTUAL-REALITY, which has a density of 0.07, a centrality of 0.98, a document count of 65 and is another emerging theme for the period 2010&#x2013;2012.</p>
            <fig fig-type="figure" id="f5" orientation="portrait" position="float">
                <label>Figure 5. </label>
                <caption>
                    <title>Selected thematic networks for period 2010&#x2013;2012 for machine learning using data from Scopus.</title>
                    <p>(
                        <bold>A</bold>) PROTEIN-ANALYSIS; (
                        <bold>B</bold>) CHEMISTRY; (
                        <bold>C</bold>) VIRTUAL-REALITY.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure5.gif"/>
            </fig>
            <p>The strategic diagram of the period 2013&#x2013;2014 is shown in 
                <xref ref-type="fig" rid="f6">Figure 6</xref>, which has 32 themes. During this time frame, SENSORS, FACE-RECOGNITION and COMMERCE are some of the emerging topics. The IMAGE-INTERPRETATION-COMPUTER-ASSISTED topic appears as the motor theme, with the highest density (0.58) and centrality (2.61) values. This suggests that in this period there were studies on machine learning applied to different topics, such as sensor data, costs, and gesture recognition.</p>
            <fig fig-type="figure" id="f6" orientation="portrait" position="float">
                <label>Figure 6. </label>
                <caption>
                    <title>Strategic diagram of the period 2013&#x2013;2014 for machine learning using data from Scopus.</title>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure6.gif"/>
            </fig>
            <p>We selected three thematic networks from the third period (2013&#x2013;2014). 
                <xref ref-type="fig" rid="f7">Figure 7A</xref> shows the network for the theme AMINO-ACID-SEQUENCE, which has a density of 0.42, a centrality of 1.91 and a document count of 276. 
                <xref ref-type="fig" rid="f7">Figure 7B</xref> presents the network for the theme MOBILE-DEVICES, which has a density of 0.21, a centrality of 0.76, a document count of 159 and strongly related topics such as HUMAN-COMPUTER-INTERACTION, E-LEARNING, and UBIQUITOUS-COMPUTING. 
                <xref ref-type="fig" rid="f7">Figure 7C</xref> shows the network for the theme COMMERCE, which has a density of 0.07, a centrality of 0.88, a document count of 205 and relevant concepts, such as SOCIAL-NETWORKING and COSTS.</p>
            <fig fig-type="figure" id="f7" orientation="portrait" position="float">
                <label>Figure 7. </label>
                <caption>
                    <title>Selected thematic networks for period 2013&#x2013;2014 for machine learning using data from Scopus.</title>
                    <p>(
                        <bold>A</bold>) AMINO-ACID-SEQUENCE; (
                        <bold>B</bold>) MOBILE-DEVICES; (
                        <bold>C</bold>) COMMERCE.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure7.gif"/>
            </fig>
            <p>
                <xref ref-type="fig" rid="f8">Figure 8</xref> shows the strategic diagram of the period 2015. The diagram has 25 themes. During this time span, SMARTPHONES, FACE-RECOGNITION and FORESTRY (label generated for algorithms such as Random-Forest or Decision-Trees) are some of the emerging themes. NUCLEAR-MAGNETIC-RESONANCE-IMAGING appears as the motor subject with the highest density (0.57) and centrality (2.81) values. Other important themes are COMPUTATIONAL-BIOLOGY and MEDICAL-IMAGING. We found that during this period biology and health were once again relevant topics in machine learning research.</p>
            <fig fig-type="figure" id="f8" orientation="portrait" position="float">
                <label>Figure 8. </label>
                <caption>
                    <title>Strategic diagram of the period 2015 for machine learning using data from Scopus.</title>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure8.gif"/>
            </fig>
            <p>From the fourth time frame, we selected three thematic networks. 
                <xref ref-type="fig" rid="f9">Figure 9A</xref> shows the network for the theme NUCLEAR-MAGNETIC-RESONANCE-IMAGING, which has a density of 0.57, a centrality of 2.81 and a document count of 251. 
                <xref ref-type="fig" rid="f9">Figure 9B</xref> presents the network for the theme COMPUTATIONAL-BIOLOGY, which is an emergent theme and has a density of 0.44, a centrality of 1.8 and a document count of 320. 
                <xref ref-type="fig" rid="f9">Figure 9C</xref> shows the network for the topic SMARTPHONES, which has a density of 0.07, a centrality of 0.13, a document count of 144 and is another emerging theme for the 2015 period.</p>
            <fig fig-type="figure" id="f9" orientation="portrait" position="float">
                <label>Figure 9. </label>
                <caption>
                    <title>Selected thematic networks for period 2015 for machine learning using data from Scopus.</title>
                    <p>(
                        <bold>A</bold>) NUCLEAR-MAGNETIC-RESONANCE-IMAGING; (
                        <bold>B</bold>) COMPUTATIONAL-BIOLOGY; (
                        <bold>C</bold>) SMARTPHONES.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure9.gif"/>
            </fig>
            <p>The strategic diagram of the period 2016 is shown in 
                <xref ref-type="fig" rid="f10">Figure 10</xref>, which has 24 themes. During this time span, UBIQUITOUS-COMPUTING and COMMERCE are some of the emerging themes. The MIDDLE-AGED theme &#x2013;which refers to applications developed for middle-aged people&#x2013; appears as the motor topic with the highest density (0.76) and centrality (2.04) values.</p>
            <fig fig-type="figure" id="f10" orientation="portrait" position="float">
                <label>Figure 10. </label>
                <caption>
                    <title>Strategic diagram of the period 2016 for machine learning using data from Scopus.</title>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure10.gif"/>
            </fig>
            <p>We selected three thematic networks from the fifth period (2016). 
                <xref ref-type="fig" rid="f11">Figure 11A</xref> shows the network for the theme MEDICAL-IMAGING, which has a density of 0.26, a centrality of 1.45 and a document count of 312. 
                <xref ref-type="fig" rid="f11">Figure 11B</xref> presents the network for the theme INTRUSION-DETECTION, which has a density of 0.3, a centrality of 0.89 and a document count of 289. 
                <xref ref-type="fig" rid="f11">Figure 11C</xref> shows the network for the theme UBIQUITOUS-COMPUTING, which has a density of 0.07, a centrality of 1.07, a document count of 132 and relevant concepts, such as AUTOMATION, SMARTPHONES and the INTERNET.</p>
            <fig fig-type="figure" id="f11" orientation="portrait" position="float">
                <label>Figure 11. </label>
                <caption>
                    <title>Selected thematic networks for period 2016 for machine learning using data from Scopus.</title>
                    <p>(
                        <bold>A</bold>) MEDICAL-IMAGING; (
                        <bold>B</bold>) INTRUSION-DETECTION; (
                        <bold>C</bold>) UBIQUITOUS-COMPUTING.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure11.gif"/>
            </fig>
            <p>
                <xref ref-type="fig" rid="f12">Figure 12</xref> shows the strategic diagram of the period 2017(Q2). The diagram has 16 themes. During this time span, HUMAN is the only emerging theme, while FORESTRY is one of the basic and transversal topics. This shows us the importance of algorithms such as Random-Forest or Decision-Trees during the last decade in the research on machine learning. MEDICAL-IMAGING appears as the motor theme with the highest density (0.51) and centrality (2.05) values. Once again, topics on health are relevant in machine learning research.</p>
            <fig fig-type="figure" id="f12" orientation="portrait" position="float">
                <label>Figure 12. </label>
                <caption>
                    <title>Strategic diagram of the period 2017(Q2) for machine learning using data from Scopus.</title>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure12.gif"/>
            </fig>
            <p>From 2017(Q2), we selected two thematic networks. 
                <xref ref-type="fig" rid="f13">Figure 13A</xref> shows the network for the theme MEDICAL-IMAGING, which has a document count of 137. 
                <xref ref-type="fig" rid="f13">Figure 13B</xref> presents the network for the topic FORESTRY (label generated for algorithms such as Random-Forest or Decision-Trees), which has a density of 0.17, a centrality of 1.84 and a document count of 220.</p>
            <fig fig-type="figure" id="f13" orientation="portrait" position="float">
                <label>Figure 13. </label>
                <caption>
                    <title>Selected thematic networks for period 2017(Q2) for machine learning using data from Scopus.</title>
                    <p>(
                        <bold>A</bold>) MEDICAL-IMAGING; (
                        <bold>B</bold>) FORESTRY.</p>
                </caption>
                <graphic orientation="portrait" position="float" xlink:href="https://f1000research-files.f1000.com/manuscripts/17040/649f156e-e43a-4670-aec5-fba6ed833c44_figure13.gif"/>
            </fig>
            <supplementary-material id="DS0" orientation="portrait" position="float" xlink:href="https://f1000researchdata.s3.amazonaws.com/datasets/15620/f809b5c7-6721-4d9b-a16e-ae4887a3e91b_Dataset_1.zip">
                <label>Data obtained from Scopus and SciMat project file, to be opened in SciMat</label>
            </supplementary-material>
        </sec>
        <sec sec-type="conclusions">
            <title>Conclusions</title>
            <p>Exposing emerging trends in the field of machine learning allows researchers to increase their understanding of the changes and the evolution over time of this research field. One of the primary objectives of a science mapping analysis is to highlight trends and possible relationships between the relevant topics of a research field. SciMAT is a useful tool for carrying out a study based on this approach, as it identifies the fundamental themes of a field through cluster generation. The results of the present study show that machine learning is an important and widely studied scientific area. The trends indicate that machine learning applications will continue to be of interest to the scientific community. The use of machine learning to predict diseases such as cancer
                <sup>
                    <xref ref-type="bibr" rid="ref-14">14</xref>
                </sup> or Alzheimer&#x2019;s disease
                <sup>
                    <xref ref-type="bibr" rid="ref-15">15</xref>
                </sup>, and in fields such as biology
                <sup>
                    <xref ref-type="bibr" rid="ref-16">16</xref>
                </sup>, rehabilitation systems
                <sup>
                    <xref ref-type="bibr" rid="ref-17">17</xref>
                </sup>, commerce
                <sup>
                    <xref ref-type="bibr" rid="ref-18">18</xref>
                </sup>, smartphones
                <sup>
                    <xref ref-type="bibr" rid="ref-19">19</xref>
                </sup> and ubiquitous computing
                <sup>
                    <xref ref-type="bibr" rid="ref-20">20</xref>
                </sup>, will be a trend in the near future.</p>
        </sec>
        <sec>
            <title>Data availability</title>
            <p>The data referenced by this article are under copyright with the following copyright statement: Copyright: &#x00a9; 2018 Rincon-Patino J et al.</p>
            <p>Data associated with the article are available under the terms of the Creative Commons Zero "No rights reserved" data waiver (<ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/publicdomain/zero/1.0/">CC0 1.0 Public domain dedication</ext-link>).</p>
            <p>Dataset 1: Data obtained from Scopus and SciMat project file, to be opened in SciMat. DOI, 
                <ext-link ext-link-type="uri" xlink:href="http://dx.doi.org/10.5256/f1000research.15620.d212425">10.5256/f1000research.15620.d212425</ext-link>
                <sup>
                    <xref ref-type="bibr" rid="ref-21">21</xref>
                </sup>
            </p>
        </sec>
    </body>
    <back>
        <ref-list>
            <ref id="ref-1">
                <label>1</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Michalski</surname>
                            <given-names>RS</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Carbonell</surname>
                            <given-names>JG</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Mitchell</surname>
                            <given-names>TM</given-names>
                        </name>
					</person-group>:
                    <article-title>Machine Learning: An Artificial Intelligence Approach.</article-title> Springer Berlin Heidelberg, <year>2013</year>.
                    <pub-id pub-id-type="doi">10.1007/978-3-662-12405-5</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-2">
                <label>2</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Crisci</surname>
                            <given-names>C</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Ghattas</surname>
                            <given-names>B</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Perera</surname>
                            <given-names>G</given-names>
                        </name>
					</person-group>:
                    <article-title>A review of supervised machine learning algorithms and their applications to ecological data.</article-title>
                    <source>
						
                        <italic toggle="yes">Ecol Modell.</italic>
					</source>
                    <year>2012</year>;<volume>240</volume>:<fpage>113</fpage>&#x2013;<lpage>122</lpage>.
                    <pub-id pub-id-type="doi">10.1016/j.ecolmodel.2012.03.001</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-3">
                <label>3</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>L&#x00f3;pez</surname>
                            <given-names>ID</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Figueroa</surname>
                            <given-names>A</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Corrales</surname>
                            <given-names>JC</given-names>
                        </name>
					</person-group>:
                    <article-title>Adaptive Prediction of Water Quality Using Computational Intelligence Techniques</article-title>. In
                    <italic toggle="yes">Computational Science and Its Applications -- ICCSA 2017: 17th International Conference, Trieste, Italy, July 3-6, 2017, Proceedings, Part II,</italic> Cham: Springer International Publishing, <year>2017</year>;<fpage>45</fpage>&#x2013;<lpage>59</lpage>.
                    <pub-id pub-id-type="doi">10.1007/978-3-319-62395-5_4</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-4">
                <label>4</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Smeureanu</surname>
                            <given-names>I</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Ruxanda</surname>
                            <given-names>G</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Badea</surname>
                            <given-names>LM</given-names>
                        </name>
					</person-group>:
                    <article-title>Customer segmentation in private banking sector using machine learning techniques.</article-title>
                    <source>
						
                        <italic toggle="yes">J Bus Econ Manag.</italic>
					</source>
                    <year>2013</year>;<volume>14</volume>(<issue>5</issue>):<fpage>923</fpage>&#x2013;<lpage>939</lpage>.
                    <pub-id pub-id-type="doi">10.3846/16111699.2012.749807</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-5">
                <label>5</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Sebastiani</surname>
                            <given-names>F</given-names>
                        </name>
					</person-group>:
                    <article-title>Machine Learning in Automated Text Categorization.</article-title>
                    <source>
						
                        <italic toggle="yes">ACM Comput Surv.</italic>
					</source>
                    <year>2002</year>;<volume>34</volume>(<issue>1</issue>):<fpage>1</fpage>&#x2013;<lpage>47</lpage>.
                    <pub-id pub-id-type="doi">10.1145/505282.505283</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-6">
                <label>6</label>
                <mixed-citation publication-type="book">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Plazas</surname>
                            <given-names>JE</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>L&#x00f3;pez</surname>
                            <given-names>ID</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Corrales</surname>
                            <given-names>JC</given-names>
                        </name>
					</person-group>:
                    <article-title>A Tool for Classification of Cacao Production in Colombia Based on Multiple Classifier Systems.</article-title> In
                    <italic toggle="yes">Computational Science and Its Applications -- ICCSA 2017: 17th International Conference, Trieste, Italy, July 3-6, 2017, Proceedings, Part II,</italic> Cham: Springer International Publishing, <year>2017</year>;<fpage>60</fpage>&#x2013;<lpage>69</lpage>.
                    <pub-id pub-id-type="doi">10.1007/978-3-319-62395-5_5</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-7">
                <label>7</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Moral-Mu&#x00f1;oz</surname>
                            <given-names>JA</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Cobo</surname>
                            <given-names>MJ</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Peis</surname>
                            <given-names>E</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Analyzing the research in 
                        <italic toggle="yes">Integrative</italic> &amp; 
                        <italic toggle="yes">Complementary Medicine</italic> by means of science mapping.</article-title>
                    <source>
						
                        <italic toggle="yes">Complement Ther Med.</italic>
					</source>
                    <year>2014</year>;<volume>22</volume>(<issue>2</issue>):<fpage>409</fpage>&#x2013;<lpage>418</lpage>.
                    <pub-id pub-id-type="pmid">24731913</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.ctim.2014.02.003</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-8">
                <label>8</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Mart&#x00ed;nez</surname>
                            <given-names>MA</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Cobo</surname>
                            <given-names>MJ</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Herrera</surname>
                            <given-names>M</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Analyzing the Scientific Evolution of Social Work Using Science Mapping.</article-title>
                    <source>
						
                        <italic toggle="yes">Res Soc Work Pract.</italic>
					</source>
                    <year>2015</year>;<volume>25</volume>(<issue>2</issue>):<fpage>257</fpage>&#x2013;<lpage>277</lpage>.
                    <pub-id pub-id-type="doi">10.1177/1049731514522101</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-9">
                <label>9</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Cobo</surname>
                            <given-names>MJ</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>L&#x00f3;pez-Herrera</surname>
                            <given-names>AG</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Herrera-Viedma</surname>
                            <given-names>E</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>SciMAT: A new science mapping analysis software tool.</article-title>
                    <source>
						
                        <italic toggle="yes">J Am Soc Inf Sci Technol.</italic>
					</source>
                    <year>2012</year>;<volume>63</volume>(<issue>8</issue>):<fpage>1609</fpage>&#x2013;<lpage>1630</lpage>.
                    <pub-id pub-id-type="doi">10.1002/asi.22688</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-10">
                <label>10</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Cobo</surname>
                            <given-names>MJ</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>L&#x00f3;pez-Herrera</surname>
                            <given-names>AG</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Herrera-Viedma</surname>
                            <given-names>E</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>An approach for detecting, quantifying, and visualizing the evolution of a research field: A practical application to the Fuzzy Sets Theory field.</article-title>
                    <source>
						
                        <italic toggle="yes">J Informetr.</italic>
					</source>
                    <year>2011</year>;<volume>5</volume>(<issue>1</issue>):<fpage>146</fpage>&#x2013;<lpage>166</lpage>.
                    <pub-id pub-id-type="doi">10.1016/j.joi.2010.10.002</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-11">
                <label>11</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Garfield</surname>
                            <given-names>E</given-names>
                        </name>
					</person-group>:
                    <article-title>Scientography: Mapping the tracks of science.</article-title>
                    <source>
						
                        <italic toggle="yes">Curr Contents Soc Behav Sci.</italic>
					</source>
                    <year>1994</year>;<volume>7</volume>(<issue>45</issue>):<fpage>5</fpage>&#x2013;<lpage>10</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="https://wenku.baidu.com/view/1b8b7d2658fb770bf78a55cd.html">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-12">
                <label>12</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Callon</surname>
                            <given-names>M</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Courtial</surname>
                            <given-names>JP</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Turner</surname>
                            <given-names>WA</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>From translations to problematic networks: An introduction to co-word analysis.</article-title>
                    <source>
						
                        <italic toggle="yes">Soc Sc Inform.</italic>
					</source>
                    <year>1983</year>;<volume>22</volume>(<issue>2</issue>):<fpage>191</fpage>&#x2013;<lpage>235</lpage>.
                    <pub-id pub-id-type="doi">10.1177/053901883022002003</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-13">
                <label>13</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Callon</surname>
                            <given-names>M</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Courtial</surname>
                            <given-names>JP</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Laville</surname>
                            <given-names>F</given-names>
                        </name>
					</person-group>:
                    <article-title>Co-word analysis as a tool for describing the network of interactions between basic and technological research: The case of polymer chemistry.</article-title>
                    <source>
						
                        <italic toggle="yes">Scientometrics.</italic>
					</source>
                    <year>1991</year>;<volume>22</volume>(<issue>1</issue>):<fpage>155</fpage>&#x2013;<lpage>205</lpage>.
                    <pub-id pub-id-type="doi">10.1007/BF02019280</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-14">
                <label>14</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>Y</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Tetko</surname>
                            <given-names>IV</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Hall</surname>
                            <given-names>MA</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Gene selection from microarray data for cancer classification&#x2014;a machine learning approach.</article-title>
                    <source>
						
                        <italic toggle="yes">Comput Biol Chem.</italic>
					</source>
                    <year>2005</year>;<volume>29</volume>(<issue>1</issue>):<fpage>37</fpage>&#x2013;<lpage>46</lpage>.
                    <pub-id pub-id-type="pmid">15680584</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.compbiolchem.2004.11.001</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-15">
                <label>15</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Moradi</surname>
                            <given-names>E</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Pepe</surname>
                            <given-names>A</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Gaser</surname>
                            <given-names>C</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Machine learning framework for early MRI-based Alzheimer&#x2019;s conversion prediction in MCI subjects.</article-title>
                    <source>
						
                        <italic toggle="yes">Neuroimage.</italic>
					</source>
                    <year>2015</year>;<volume>104</volume>:<fpage>398</fpage>&#x2013;<lpage>412</lpage>.
                    <pub-id pub-id-type="pmid">25312773</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.neuroimage.2014.10.002</pub-id>
                    <pub-id pub-id-type="pmcid">5957071</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-16">
                <label>16</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Swan</surname>
                            <given-names>AL</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Mobasheri</surname>
                            <given-names>A</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Allaway</surname>
                            <given-names>D</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Application of Machine Learning to Proteomics Data: Classification and Biomarker Identification in Postgenomics Biology.</article-title>
                    <source>
						
                        <italic toggle="yes">OMICS.</italic>
					</source>
                    <year>2013</year>;<volume>17</volume>(<issue>12</issue>):<fpage>595</fpage>&#x2013;<lpage>610</lpage>.
                    <pub-id pub-id-type="pmid">24116388</pub-id>
                    <pub-id pub-id-type="doi">10.1089/omi.2013.0017</pub-id>
                    <pub-id pub-id-type="pmcid">3837439</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-17">
                <label>17</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Yeh</surname>
                            <given-names>SC</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Huang</surname>
                            <given-names>MC</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>PC</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>Machine learning-based assessment tool for imbalance and vestibular dysfunction with virtual reality rehabilitation system.</article-title>
                    <source>
						
                        <italic toggle="yes">Comput Methods Programs Biomed.</italic>
					</source>
                    <year>2014</year>;<volume>116</volume>(<issue>3</issue>):<fpage>311</fpage>&#x2013;<lpage>318</lpage>.
                    <pub-id pub-id-type="pmid">24894180</pub-id>
                    <pub-id pub-id-type="doi">10.1016/j.cmpb.2014.04.014</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-18">
                <label>18</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Yan</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>C</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Zha</surname>
                            <given-names>H</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>On Machine Learning Towards Predictive Sales Pipeline Analytics</article-title>. In
                    <italic toggle="yes">Proceedings of the Twenty-Ninth AAAI Conference on Artificial Intelligence</italic>. <year>2015</year>;<fpage>1945</fpage>&#x2013;<lpage>1951</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="https://www.semanticscholar.org/paper/On-Machine-Learning-towards-Predictive-Sales-Yan-Zhang/95762eb04f0c99b3b1428a670e054a5d8c6ec1fc">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-19">
                <label>19</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Faragher</surname>
                            <given-names>RM</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Harle</surname>
                            <given-names>RK</given-names>
                        </name>
					</person-group>:
                    <article-title>SmartSLAM - An Efficient Smartphone Indoor Positioning System Exploiting Machine Learning and Opportunistic Sensing</article-title>. In
                    <italic toggle="yes">Proceedings of the 26th International Technical Meeting of The Satellite Division of the Institute of Navigation (ION GNSS+ 2013)</italic>. <year>2013</year>;<fpage>1006</fpage>&#x2013;<lpage>1019</lpage>.
                    <ext-link ext-link-type="uri" xlink:href="https://www.ion.org/publications/abstract.cfm?articleID=11308">Reference Source</ext-link>
                </mixed-citation>
            </ref>
            <ref id="ref-20">
                <label>20</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Ventura</surname>
                            <given-names>D</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Casado-Mansilla</surname>
                            <given-names>D</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>L&#x00f3;pez-de-Armentia</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <etal/>
					</person-group>:
                    <article-title>ARIIMA: A Real IoT Implementation of a Machine-Learning Architecture for Reducing Energy Consumption</article-title>. In
                    <italic toggle="yes">Ubiquitous Computing and Ambient Intelligence. Personalisation and User Adapted Services: 8th International Conference, UCAmI 2014, Belfast, UK</italic>, Cham: Springer International Publishing, <year>2014</year>;<fpage>444</fpage>&#x2013;<lpage>451</lpage>.
                    <pub-id pub-id-type="doi">10.1007/978-3-319-13102-3_72</pub-id>
                </mixed-citation>
            </ref>
            <ref id="ref-21">
                <label>21</label>
                <mixed-citation publication-type="journal">
                    <person-group person-group-type="author">
						
                        <name name-style="western">
                            <surname>Rincon-Patino</surname>
                            <given-names>J</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Ramirez-Gonzalez</surname>
                            <given-names>G</given-names>
                        </name>
						
                        <name name-style="western">
                            <surname>Corrales</surname>
                            <given-names>JC</given-names>
                        </name>
					</person-group>:
                    <article-title>Dataset 1 in: Exploring machine learning: A bibliometric general approach using SciMAT.</article-title>
                    <source>
						
                        <italic toggle="yes">F1000Research.</italic>
					</source>
                    <year>2018</year>.
                    <ext-link ext-link-type="uri" xlink:href="http://www.doi.org/10.5256/f1000research.15620.d212425">http://www.doi.org/10.5256/f1000research.15620.d212425</ext-link>
                </mixed-citation>
            </ref>
        </ref-list>
    </back>
    <sub-article article-type="reviewer-report" id="report37068">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.17040.r37068</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Dozmorov</surname>
                        <given-names>Mikhail G.</given-names>
                    </name>
                    <xref ref-type="aff" rid="r37068a1">1</xref>
                    <role>Referee</role>
                    <uri content-type="orcid">https://orcid.org/0000-0002-0086-8358</uri>
                </contrib>
                <aff id="r37068a1">
                    <label>1</label>Department of Biostatistics, Virginia Commonwealth University, Richmond, VA, USA</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>15</day>
                <month>8</month>
                <year>2018</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2018 Dozmorov MG</copyright-statement>
                <copyright-year>2018</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport37068" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.15620.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>The paper &#x201c;Exploring machine learning: A&#x00a0;bibliometric general approach using SciMAT&#x201d; by Rincon-Patino 
                <italic>et al.</italic> presents an overview of areas of machine learning applications. The study is conducted using science mapping analysis with the SciMAT tool. A bibliography containing &#x201c;machine&#x201d; and &#x201c;learning&#x201d; keywords over the 10-year period (2007-2017) was extracted from Scopus. This period was split into six smaller periods, and the state of machine learning in each period was illustrated by two figures: a strategic diagram and a selected thematic network. The paper is well written. The following recommendations are intended to improve the readability and message of the paper. 
                <list list-type="bullet">
                    <list-item>
                        <p>Strategic diagrams may not be familiar for users who aren&#x2019;t familiar with the SciMAT tool. Thus, the description of strategic diagrams given at the beginning of the Results section would be better placed in the legend of the first figure. Also, clarify the meaning of &#x201c;the basic and transversal themes.&#x201d; Furthermore, the description of the lower-left quadrant, &#x201c;the emerging or declining topics,&#x201d; is confusing; it should be one or the other.</p>
                    </list-item>
                    <list-item>
                        <p>Although the study claims to present a longitudinal analysis of the development of machine learning areas, it is the analysis and the description of individual time periods, presented on individual figures. I am missing the compare-and-contrast view of the analysis, which would have been possible if the figures would be presented side-by-side. Given the good readability of the strategic diagrams, it is perfectly possible to combine them into one figure. The same can be done for the selected thematic networks, by making edges shorter, thicker, and fonts - larger.</p>
                    </list-item>
                    <list-item>
                        <p>It is unclear whether the manuscript is about the overview of machine learning fields, or the tool SciMAT and the science mapping analysis. Besides simply describing what the results are at each time period, it would be good to have some conclusions about the longitudinal trends of the field.</p>
                    </list-item>
                    <list-item>
                        <p>Although the rationale for choosing the non-equal smaller periods is understandable, the periods themselves should be better defined. At the very least, state that the presented periods are inclusive, that is, 2007-2009 spans the 3-year period. Better, adopt (MM/DD/YYYY-MM/DD/YYYY] notation.</p>
                    </list-item>
                    <list-item>
                        <p>Figure 1 shows the growing number of documents containing &#x201c;machine&#x201d; and &#x201c;learning&#x201d; keywords. However, it is known that the number of publications per year grows by itself. It would be more informative to show the proportion of published documents that contain &#x201c;machine&#x201d; and &#x201c;learning&#x201d; keywords. The usefulness of representing the proportion of publications can be illustrated with the following R code:</p>
                    </list-item>
                </list> library(MDmisc) # devtools::install_github('mdozmorov/MDmisc')</p>
            <p> library(ggplot2)</p>
            <p> p &lt;- get_pubmed_graph("machine learning", yearstart = 2007, yearend = 2017, normalize = TRUE, xlab = "Year", ylab = "Proportion of all publications")</p>
            <p> p</p>
            <p> ggsave("pubmed_machine_learning.png", p, device = "png", height = 4)</p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Yes</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Yes</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Partly</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>NA</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
    </sub-article>
    <sub-article article-type="reviewer-report" id="report36927">
        <front-stub>
            <article-id pub-id-type="doi">10.5256/f1000research.17040.r36927</article-id>
            <title-group>
                <article-title>Reviewer response for version 1</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="author">
                    <name>
                        <surname>Tiwari</surname>
                        <given-names>Rajesh Kumar</given-names>
                    </name>
                    <xref ref-type="aff" rid="r36927a1">1</xref>
                    <role>Referee</role>
                </contrib>
                <aff id="r36927a1">
                    <label>1</label>Amity Institute of Biotechnology, Amity University Uttar Pradesh, Lucknow, India</aff>
            </contrib-group>
            <author-notes>
                <fn fn-type="conflict">
                    <p>
                        <bold>Competing interests: </bold>No competing interests were disclosed.</p>
                </fn>
            </author-notes>
            <pub-date pub-type="epub">
                <day>9</day>
                <month>8</month>
                <year>2018</year>
            </pub-date>
            <permissions>
                <copyright-statement>Copyright: &#x00a9; 2018 Tiwari RK</copyright-statement>
                <copyright-year>2018</copyright-year>
                <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
                    <license-p>This is an open access peer review report distributed under the terms of the Creative Commons Attribution Licence, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
                </license>
            </permissions>
            <related-article ext-link-type="doi" id="relatedArticleReport36927" related-article-type="peer-reviewed-article" xlink:href="10.12688/f1000research.15620.1"/>
            <custom-meta-group>
                <custom-meta>
                    <meta-name>recommendation</meta-name>
                    <meta-value>approve-with-reservations</meta-value>
                </custom-meta>
            </custom-meta-group>
        </front-stub>
        <body>
            <p>The article presents a bibliometric analysis of scientific works in the area of machine learning, published in Scopus-indexed journals during the period 2007-2017. The manuscript is well written. However, I have the following suggestions to make:</p>
            <p>
                <list list-type="order">
                    <list-item>
                        <p>Correction in title of Manuscript: Exploring machine learning: A bibliometric general approach using SciMAT 
                            <bold>Tool</bold>
                        </p>
                    </list-item>
                    <list-item>
                        <p>Definition of Machine learning should be incorporated in the introduction Part. Authors can refer and cite following articles: PMID: 23740390
                            <sup>
                                <xref ref-type="bibr" rid="rep-ref-36927-1">1</xref>
                            </sup>&#x00a0;and PMID: 28302041
                            <sup>
                                <xref ref-type="bibr" rid="rep-ref-36927-2">2</xref>
                            </sup>
                        </p>
                    </list-item>
                    <list-item>
                        <p>Apart from mass mortality events, the quality of water, segment clients in private banking, automatically classify text, production of crops, machine learning applications are also widely used in drug design in the pharmaceutical industry, academia and research. Authors should mention the same in the introduction part of the article and can refer and cite the following articles with PMID: 22346230
                            <sup>
                                <xref ref-type="bibr" rid="rep-ref-36927-3">3</xref>
                            </sup>, PMID: 26526829
                            <sup>
                                <xref ref-type="bibr" rid="rep-ref-36927-4">4</xref>
                            </sup>, PMID: 28382857
                            <sup>
                                <xref ref-type="bibr" rid="rep-ref-36927-5">5</xref>
                            </sup>, PMID: 29256344
                            <sup>
                                <xref ref-type="bibr" rid="rep-ref-36927-6">6</xref>
                            </sup>
                        </p>
                    </list-item>
                    <list-item>
                        <p>Methods: As the data set is collected from Scopus, the same should be cited in the manuscript.</p>
                    </list-item>
                    <list-item>
                        <p>The original source of SciMAT Tool should be cited in the manuscript.</p>
                    </list-item>
                    <list-item>
                        <p>The authors must elaborate more about the basis of division of the data set. It is mentioned that the time interval was divided into six smaller periods: 2007&#x2013;2009, 2010&#x2013;2012, 2013&#x2013;2014, 2015, 2016, 2017. As the division is not uniform, was the gap chosen only so as to have a comparable number of articles in each one of them?</p>
                    </list-item>
                    <list-item>
                        <p>The machine learning algorithms are widely used in robotics and pharmaceutical properties prediction. They can also be included in conclusion part.</p>
                    </list-item>
                    <list-item>
                        <p>Apart from SciMAT, are other similar tools available? Can a comparative analysis of results using the same data set with different tools be done, to assess how conclusive the reported results are? This can be included as a future prospect of the current research.</p>
                    </list-item>
                </list>
            </p>
            <p>Is the work clearly and accurately presented and does it cite the current literature?</p>
            <p>Yes</p>
            <p>If applicable, is the statistical analysis and its interpretation appropriate?</p>
            <p>Yes</p>
            <p>Are all the source data underlying the results available to ensure full reproducibility?</p>
            <p>Yes</p>
            <p>Is the study design appropriate and is the work technically sound?</p>
            <p>Yes</p>
            <p>Are the conclusions drawn adequately supported by the results?</p>
            <p>Yes</p>
            <p>Are sufficient details of methods and analysis provided to allow replication by others?</p>
            <p>Yes</p>
            <p>Reviewer Expertise:</p>
            <p>Machine learning classification, prediction models using Artificial Intelligence, Statistical analysis, Computational Biology</p>
            <p>I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above.</p>
        </body>
        <back>
            <ref-list>
                <title>References</title>
                <ref id="rep-ref-36927-1">
                    <label>1</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Can we predict blood brain barrier permeability of ligands using computational approaches?</article-title>
                        <source>
                            <italic>Interdiscip Sci</italic>
                        </source>.<year>2013</year>;<volume>5</volume>(<issue>2</issue>) :<fpage>95</fpage>-<lpage>101</lpage>
                        <pub-id pub-id-type="pmid">23740390</pub-id>
                        <pub-id pub-id-type="doi">10.1007/s12539-013-0158-9</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-36927-2">
                    <label>2</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Promises of Machine Learning Approaches in Prediction of Absorption of Compounds.</article-title>
                        <source>
                            <italic>Mini Rev Med Chem</italic>
                        </source>.<year>2018</year>;<volume>18</volume>(<issue>3</issue>) :<fpage>196</fpage>-<lpage>207</lpage>
                        <pub-id pub-id-type="pmid">28302041</pub-id>
                        <pub-id pub-id-type="doi">10.2174/1389557517666170315150116</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-36927-3">
                    <label>3</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>A prediction model for oral bioavailability of drugs using physicochemical properties by support vector machine.</article-title>
                        <source>
                            <italic>J Nat Sci Biol Med</italic>
                        </source>.<year>2011</year>;<volume>2</volume>(<issue>2</issue>) :<fpage>168</fpage>-<lpage>73</lpage>
                        <pub-id pub-id-type="pmid">22346230</pub-id>
                        <pub-id pub-id-type="doi">10.4103/0976-9668.92325</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-36927-4">
                    <label>4</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Prediction of Metabolism of Drugs using Artificial Intelligence: How far have we reached?</article-title>
                        <source>
                            <italic>Curr Drug Metab</italic>
                        </source>.<year>2016</year>;<volume>17</volume>(<issue>2</issue>) :<fpage>129</fpage>-<lpage>41</lpage>
                        <pub-id pub-id-type="pmid">26526829</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-36927-5">
                    <label>5</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Prediction of Human Intestinal Absorption of Compounds Using Artificial Intelligence Techniques.</article-title>
                        <source>
                            <italic>Curr Drug Discov Technol</italic>
                        </source>.<year>2017</year>;<volume>14</volume>(<issue>4</issue>) :<fpage>244</fpage>-<lpage>254</lpage>
                        <pub-id pub-id-type="pmid">28382857</pub-id>
                        <pub-id pub-id-type="doi">10.2174/1570163814666170404160911</pub-id>
                    </mixed-citation>
                </ref>
                <ref id="rep-ref-36927-6">
                    <label>6</label>
                    <mixed-citation publication-type="journal">
                        <person-group person-group-type="author"/>:
                        <article-title>Prediction of Drug-Plasma Protein Binding Using Artificial Intelligence Based Algorithms.</article-title>
                        <source>
                            <italic>Comb Chem High Throughput Screen</italic>
                        </source>.<year>2018</year>;<volume>21</volume>(<issue>1</issue>) :<fpage>57</fpage>-<lpage>64</lpage>
                        <pub-id pub-id-type="pmid">29256344</pub-id>
                        <pub-id pub-id-type="doi">10.2174/1386207321666171218121557</pub-id>
                    </mixed-citation>
                </ref>
            </ref-list>
        </back>
    </sub-article>
</article>
