<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMH</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Ment Health</journal-id>
      <journal-title>JMIR Mental Health</journal-title>
      <issn pub-type="epub">2368-7959</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v10i1e42420</article-id>
      <article-id pub-id-type="pmid">37163323</article-id>
      <article-id pub-id-type="doi">10.2196/42420</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Prediction of Mental Health Problem Using Annual Student Health Survey: Machine Learning Approach</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Torous</surname>
            <given-names>John</given-names>
          </name>
        </contrib>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Li</surname>
            <given-names>Chun Hung</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Teles</surname>
            <given-names>Ariel</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author" corresp="yes" equal-contrib="yes">
          <name name-style="western">
            <surname>Baba</surname>
            <given-names>Ayako</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Health Service Center</institution>
            <institution>Kanazawa University</institution>
            <addr-line>Kakuma-machi, Kanazawa-city</addr-line>
            <addr-line>Ishikawa, 9201192</addr-line>
            <country>Japan</country>
            <phone>81 762645254</phone>
            <email>a_baba@staff.kanazawa-u.ac.jp</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1409-3482</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" equal-contrib="yes">
          <name name-style="western">
            <surname>Bunji</surname>
            <given-names>Kyosuke</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9512-7439</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Health Service Center</institution>
        <institution>Kanazawa University</institution>
        <addr-line>Ishikawa</addr-line>
        <country>Japan</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Graduate School of Business Administration</institution>
        <institution>Kobe University</institution>
        <addr-line>Hyogo</addr-line>
        <country>Japan</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Ayako Baba <email>a_baba@staff.kanazawa-u.ac.jp</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <year>2023</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>10</day>
        <month>5</month>
        <year>2023</year>
      </pub-date>
      <volume>10</volume>
      <elocation-id>e42420</elocation-id>
      <history>
        <date date-type="received">
          <day>3</day>
          <month>9</month>
          <year>2022</year>
        </date>
        <date date-type="rev-request">
          <day>29</day>
          <month>12</month>
          <year>2022</year>
        </date>
        <date date-type="rev-recd">
          <day>19</day>
          <month>2</month>
          <year>2023</year>
        </date>
        <date date-type="accepted">
          <day>19</day>
          <month>2</month>
          <year>2023</year>
        </date>
      </history>
      <copyright-statement>©Ayako Baba, Kyosuke Bunji. Originally published in JMIR Mental Health (https://mental.jmir.org), 10.05.2023.</copyright-statement>
      <copyright-year>2023</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Mental Health, is properly cited. The complete bibliographic information, a link to the original publication on https://mental.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://mental.jmir.org/2023/1/e42420" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>One of the reasons why students go to counseling is being called on based on self-reported health survey results. However, there is no concordant standard for such calls.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aims to develop a machine learning (ML) model to predict students’ mental health problems in 1 year and the following year using the health survey’s content and answering time (response time, response time stamp, and answer date).</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>Data were obtained from the responses of 3561 (62.58%) of 5690 undergraduate students from University A in Japan (a national university) who completed the health survey in 2020 and 2021. We performed 2 analyses; in analysis 1, a mental health problem in 2020 was predicted from demographics, answers for the health survey, and answering time in the same year, and in analysis 2, a mental health problem in 2021 was predicted from the same input variables as in analysis 1. We compared the results from different ML models, such as logistic regression, elastic net, random forest, XGBoost, and LightGBM. The results with and without <italic>answering time</italic> conditions were compared using the adopted model.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>On the basis of the comparison of the models, we adopted the LightGBM model. In this model, both analyses and conditions achieved adequate performance (eg, Matthews correlation coefficient [MCC] of with <italic>answering time</italic> condition in analysis 1 was 0.970 and MCC of without <italic>answering time</italic> condition in analysis 1 was 0.976; MCC of with <italic>answering time</italic> condition in analysis 2 was 0.986 and that of without <italic>answering time</italic> condition in analysis 2 was 0.971). In both analyses and in both conditions, the response to the questions about campus life (eg, anxiety and future) had the highest impact (Gain 0.131-0.216; Shapley additive explanations 0.018-0.028). Shapley additive explanations of 5 to 6 input variables from questions about campus life were included in the top 10. In contrast to our expectation, the inclusion of answering time–related variables did not exhibit substantial improvement in the prediction of students’ mental health problems. However, certain variables generated based on the answering time are apparently helpful in improving the prediction and affecting the prediction probability.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>These results demonstrate the possibility of predicting mental health across years using health survey data. Demographic and behavioral data, including answering time, were effective as well as self-rating items. This model demonstrates the possibility of synergistically using the characteristics of health surveys and advantages of ML. These findings can improve health survey items and calling criteria.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>student counseling</kwd>
        <kwd>health survey</kwd>
        <kwd>machine learning</kwd>
        <kwd>mental health problem</kwd>
        <kwd>response time</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>In Japan, 57% of female and 48% of male students seek counseling voluntarily [<xref ref-type="bibr" rid="ref1">1</xref>]. Others seek counseling after being referred by teachers, families, friends, or health service centers. Health service centers use health surveys as clues for counseling calls. A health survey is mainly conducted as a self-reported screening test or an interview along with health checkups [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
        <p>The style of mental health surveys differs among universities. Participants in the survey range from first-year students to undergraduate students to all students, including graduate students. The content is also diverse, with the University Personality Inventory (UPI) [<xref ref-type="bibr" rid="ref3">3</xref>] and General Health Questionnaire (GHQ) [<xref ref-type="bibr" rid="ref4">4</xref>,<xref ref-type="bibr" rid="ref5">5</xref>] being frequently used [<xref ref-type="bibr" rid="ref6">6</xref>]. Similarly, the criteria for calling using a mental health survey are inconsistent [<xref ref-type="bibr" rid="ref7">7</xref>]. It is challenging to devise uniform criteria that will aid in efficient calling. To address this issue, we propose that machine learning (ML) would aid in developing a universal method for detecting and predicting mental health problems among students.</p>
        <p>ML has several advantages in modeling highly individual phenomena with many variables, such as allowing the simultaneous testing of numerous input variables and their complex interactions [<xref ref-type="bibr" rid="ref8">8</xref>], permitting nonlinearity in producing predictive algorithms [<xref ref-type="bibr" rid="ref9">9</xref>], and having the ability to test all possible relationships to identify the superlative algorithm and model without a priori hypothesis by researchers [<xref ref-type="bibr" rid="ref8">8</xref>]. These advantages of ML can help detect and predict mental health problems.</p>
      </sec>
      <sec>
        <title>Related Work</title>
        <p>Many trials detect mental health problems using biological, behavioral, and subjective data [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref11">11</xref>]. Some studies have diagnosed suicidal ideation or behavior using various predictors, such as psychological problems and self-injuries [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>]. To predict mental health problems, the following broader variables were tested: birth information; physical illness; environmental factors; behavioral data (eg, number of naps, study duration, and use of a cell phone); biological data (eg, sleep onset time, skin conductance, and temperature) collected with wearable sensors, and text data posted on social media [<xref ref-type="bibr" rid="ref14">14</xref>-<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        <p>There are also some examples of ML with on-campus data, known as learning analytics and educational data mining [<xref ref-type="bibr" rid="ref18">18</xref>]. In some studies, repeaters and dropouts have been predicted using log data from a learning management system or e-learning, information about entrance examinations, registered courses, attendance, grades, and submission status of assignments [<xref ref-type="bibr" rid="ref19">19</xref>-<xref ref-type="bibr" rid="ref24">24</xref>].</p>
        <p>On-campus mental health surveys are insufficiently used as ML predictors. We consider them suitable for statistical analysis for 3 reasons. First, the mental health survey is open to all students, and the response rate is high. They must complete it to receive health checkups. Second, mental health surveys are conducted annually at many universities. Thus, it is possible to observe a change over time. Third, web-based mental health surveys, which have become a standard under COVID-19, can collect well-organized self-reported data and <italic>answering time</italic> data.</p>
        <p>We use the word <italic>answering time</italic> as a broad concept, including response time (RT), which is the amount of time in which a student responds to the question item after it is shown on the screen; RT stamp (the time of day when a student accesses the survey form); and answer date (the number of days elapsed in which a student completes the survey after it was announced). In particular, RT has recently attracted attention mainly in psychological assessment and educational testing; however, little is known about how to use RT in mental health measurement [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref26">26</xref>]. A few studies have shown that RT is related to depression estimation and the prediction of suicide ideation and attempt status [<xref ref-type="bibr" rid="ref25">25</xref>,<xref ref-type="bibr" rid="ref27">27</xref>]. RT would be worth investigating for predicting mental health based on the response behavior.</p>
      </sec>
      <sec>
        <title>Goal of This Study</title>
        <p>This study aimed to predict students’ mental health problems even without a specific mental health score. In this study, we conducted 2 analyses. In analysis 1, we attempted to predict mental health problems from other items when responding to the survey. Analysis 2 attempted to predict mental health problems in 2021 from the responses in the survey conducted in 2020 (1 year later). We also tested the effect of answering time on the prediction of mental health problems.</p>
        <p>The main objective of this study was to build an exploratory predictive model. We also attempted to evaluate the impact of each input variable on the outcome based on ML and examine the interpretable relationship between input variables and mental health problems.</p>
        <p>This study demonstrates the possibility of using data collected from health surveys conducted at most universities to precisely detect students experiencing mental health problems and reduce call costs. This will also pave the way to using existing health survey data even without mental health scores.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Collection</title>
        <p>The data set was obtained from a closed health survey conducted at the beginning of 2020 and 2021 school years at University A, a national university in Japan. According to the email announcement of the annual health checkup, all students were asked to answer the survey on the learning management system. Although incentives were not offered and penalties were not levied, the students were required to answer this survey to obtain a health certification. However, the survey did not comprise adaptive questions. There were 28 nonrandomized questions (health survey in <xref ref-type="table" rid="table1">Table 1</xref>) that were presented one per page without completeness check. Students could review their answers before submission and resubmit them before the deadline. When there were duplicate submissions from identical IDs, the last submission was recorded.</p>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>List of items in the health survey.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="30"/>
            <col width="380"/>
            <col width="0"/>
            <col width="560"/>
            <thead>
              <tr valign="top">
                <td colspan="4">Item</td>
                <td>Options</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="5">
                  <bold>Individual data</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Faculty and department</td>
                <td>24 categories</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Sex</td>
                <td>Male and female</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">International student</td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Age</td>
                <td>(Free description)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Years of university</td>
                <td>1, 2, 3, 4, 5, and 6</td>
              </tr>
              <tr valign="top">
                <td colspan="5">
                  <bold>Health survey</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Case history</bold>
                </td>
                <td>Yes, no, and do not know</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Circulatory problem</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Digestive problem</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Cranial nerve and mental disorders</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Respiratory problem</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Allergic disease</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Measles</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Rubella</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Mumps</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Varicella</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Other diseases</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Currently under medical treatment</td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Health concerns or worries</td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Physical or mental disability</td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Physical or mental disability certificate</td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Needs for consultation or support from the university</td>
                <td>Yes, no, and do not know</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Blood type</td>
                <td>A, B, O, AB, and do not know</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Tuberculin skin test result</td>
                <td>Negative, positive, and do not know</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Vaccination</bold>
                </td>
                <td>1 time, ≥2 times, never, and do not know</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Measles</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Rubella</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Mumps</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Varicella</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Have meals</bold>
                </td>
                <td>Every day, sometimes, and never</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Breakfast</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Lunch</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Dinner</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Sleeping hours</td>
                <td>15 categories (1-hour increments; from &#60;3 to &#62;17 hours)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Exercise</td>
                <td>Every day, sometimes, and never</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Drinking</td>
                <td>Every day, sometimes, and never</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Smoking</td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Thoughts on quitting smoking</td>
                <td>Want, do not want, and nonsmoker</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Residence</td>
                <td>Home, apartment, student dormitory, and others</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Commuting method</td>
                <td>Walking, bus, train and bus, bicycle, motorbike, car, and others</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Club activities</td>
                <td>Yes, used to be, and never</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Hours of internet use</td>
                <td>20 categories (1-hour increments; from &#60;0.5 to &#62;19 hours)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Nine questions about campus life</bold>
                </td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>This is not the university or major that I wanted.</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>I have a strong anxiety about my campus life.</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>It takes me a long time to get used to new surroundings.</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>I am worried about my relationships with other people.</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>I am worried about my future.</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>I had some trouble with someone close to me.</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>I feel like my life rhythm has been upset recently.</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>I am worried that I may not be able to take credit as I think.</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>I always feel busy with my academic work.</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Kessler 6 (mental health scale) [<xref ref-type="bibr" rid="ref28">28</xref>]</td>
                <td>4=all of the time, 3=most of the time, 2=some of the time, 1=a little of the time, and 0=none of the time</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Have lost &#62;3 kg in a month</bold>
                </td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Presently</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>In the past (&#62;18 years old)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>In the past (&#60;18 years old)</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">What you want to tell us and questions</td>
                <td>Free description</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Menstrual trouble (for women only)</td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Coping with menstrual trouble (for women only)</td>
                <td>Seeing a physician at a hospital, want to consult Health Service Center, and would like to wait and see how it goes</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Menstrual cycle (for women only)</td>
                <td>Regular every 26-32 days, not every 26-32 days but comes regularly, not regular but more than once every 3 months, and not more than once every 3 months</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">Menstrual pain (for women only)</td>
                <td>No pain, no need to take painkillers, need to take painkillers, and painkillers do not alleviate my pain</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td colspan="3">
                  <bold>Birth-control pills or oral contraceptives (for women only)</bold>
                </td>
                <td>Yes and no</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>Taking</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>To improve menstrual cycle</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>To improve menstrual pain</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>
                  <break/>
                </td>
                <td>For other reasons</td>
                <td colspan="2">
                  <break/>
                </td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <p>In this study, data that met the following conditions were excluded: during the 2020 or 2021 survey, the participant was, not an undergraduate, did not answer by the deadline (27 days in 2020 and 39 days in 2021), did not respond to any items, did not respond to all items on the Kessler 6 mental health scale [<xref ref-type="bibr" rid="ref29">29</xref>] (it was used as an outcome and detailed in Outcome and Input Variables section), was a nonregular student (eg, credited auditors), and did not give consent for data use. Incomplete submissions or atypical response duration were not excluded.</p>
        <p>In 2020 and 2021, a total of 5690 students may have been affiliated with the university based on student enrollment conditions in 2020. In both the 2020 and 2021 surveys, 3680 students answered the survey. In total, 119 (3.23%) students’ data were excluded: 10 (8.4%) students did not consent, 105 (88.2%) students did not complete Kessler 6 scale in 2020 or 2021 survey, and 4 (3.3%) students belonged to old affiliations. The resulting data set used for the analysis contains 3561 students (<xref ref-type="table" rid="table2">Table 2</xref>).</p>
        <p>The mean age was 20.54 (SD 1.75) years. The distribution of students by sex was 1941 (54.51%) male and 1620 (45.49%) female students. The data set included 1234 (34.65%) first-year students, 1005 (28.22%) second-year students, 1018 (28.59%) third-year students, and 304 (8.54%) fourth- or higher-year students. The distribution of students by faculty was 1361 (38.22%) in humanities and social sciences (6 departments); 943 (26.48%) in science and engineering (8 departments); 1175 (33%) in medical, pharmaceutical, and health (4 departments); and 82 (2.3%) in others (2 departments). Furthermore, 10 (0.28%) students were international students.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Demographic characteristics of participants in the 2020 school year (N=3561).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="540"/>
            <col width="430"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Variables</td>
                <td>Values</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="2">Age (years), mean (SD)</td>
                <td>20.54 (1.75)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Sex, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Male</td>
                <td>1941 (54.51)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Female</td>
                <td>1620 (45.49)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Years of university, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>First-year students</td>
                <td>1234 (34.65)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Second-year students</td>
                <td>1005 (28.22)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Third-year students</td>
                <td>1018 (28.59)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Fourth-year or higher-year students</td>
                <td>304 (8.54)</td>
              </tr>
              <tr valign="top">
                <td colspan="3">
                  <bold>Faculty, n (%)</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Humanities and social sciences (6 departments)</td>
                <td>1361 (38.22)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Science and engineering (8 departments)</td>
                <td>943 (26.48)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Medical, pharmaceutical, and health (4 departments)</td>
                <td>1175 (33)</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Others (2 departments)</td>
                <td>82 (2.3)</td>
              </tr>
              <tr valign="top">
                <td colspan="2">International students, n (%)</td>
                <td> 10 (0.28)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
      <sec>
        <title>Ethics Approval and Informed Consent</title>
        <p>This study received ethics approval from the Medical Ethics Committee of Kanazawa University (test number:2011-113 [017]). All students were asked to complete the survey; however, they had the option to not consent for its use for research purposes. We obtained written informed consent from all participants. Data were anonymized and saved offline. The usability and technical functionality were tested by staff members in advance. The research was performed according to relevant guidelines and regulations.</p>
      </sec>
      <sec>
        <title>Outcome and Input Variables</title>
        <p>Our model did not use the diagnosis but used the Japanese version of the Kessler 6 [<xref ref-type="bibr" rid="ref28">28</xref>] as an indicator of mental health problems. Diagnoses of the students were not necessarily shared with the university, whereas Kessler 6 could be obtained from the health survey conducted in the university. The Japanese version of the Kessler 6 demonstrates high performance in detecting mood or anxiety disorders according to the Diagnostic and Statistical Manual of Mental Disorders Fourth Edition [<xref ref-type="bibr" rid="ref28">28</xref>,<xref ref-type="bibr" rid="ref30">30</xref>]. Although diagnoses are not made based only on Kessler 6 scores and need consultations with physicians, they have been used widely for screening and surveys [<xref ref-type="bibr" rid="ref31">31</xref>]. Analyses 1 and 2 used the Kessler 6 scores for 2020 and 2021, respectively, as outcomes. Both analyses divided scores into a dichotomous variable (1: problem and 0: no problem) according to a ≥13 cutoff point [<xref ref-type="bibr" rid="ref29">29</xref>,<xref ref-type="bibr" rid="ref30">30</xref>].</p>
        <p>In this study, we examined several candidate ML models to determine which model to use. All candidate models are probabilistic prediction models: logistic regression, elastic net, random forest, XGBoost, and LightGBM. Elastic net is a logistic regression model with L1 and L2 regularization. Random forest combines independent decision trees and outputs the most popular class as a prediction [<xref ref-type="bibr" rid="ref32">32</xref>]. XGBoost and LightGBM are implementations of the gradient boosting decision tree (GBDT) [<xref ref-type="bibr" rid="ref33">33</xref>,<xref ref-type="bibr" rid="ref34">34</xref>]. The GBDT is known to achieve high performance in many ML tasks, such as predicting diseases [<xref ref-type="bibr" rid="ref35">35</xref>] or identifying psychological health risk factors [<xref ref-type="bibr" rid="ref36">36</xref>].</p>
        <p>We used the same input variables for analyses 1 and 2. All the responses to the 2020 questionnaire listed in <xref ref-type="table" rid="table1">Table 1</xref> were coded differently according to the model. For tree-based models (random forest, XGBoost, and LightGBM), they were coded numerically, with missing values filled with −99. For example, the answer for <italic>blood type</italic> item, which was one among A, B, O, AB, do not know, and no response, was coded as 1, 2, 3, 4, 5, and −99, respectively. For the regression models (logistic regression and elastic net), different coding schemes were applied based on the type of input variables. Continuous or ordinal variables such as <italic>hours of internet use</italic> or <italic>age</italic> were numerically coded in the same manner as tree-based models, except that missing or nonresponse data were filled with the grand mean. In contrast, effect coding was applied to nominal variables such as <italic>case history</italic> or <italic>blood type</italic>. Missing data were treated as independent categories. As a result, the response to <italic>blood type</italic> (Q7), for instance, was transformed into 5 input variables: ANS7_B, ANS7_O, ANS7_AB, ANS7_DN (do not know), and ANS7_NA (missing). When the respondent answered “B,” ANS7_B was coded as 1 and the remaining 4 were coded as 0.</p>
        <p>Because the aim of this study was to investigate which type of input variables were useful in the prediction of mental health problems, we used all variables except RT without dimensionality reduction. Notably, the tree-based models are less susceptible to the inclusion of irrelevant variables. In addition, an elastic net can reduce the number of input variables because of regularization.</p>
        <p>In addition to the raw response variables in <xref ref-type="table" rid="table1">Table 1</xref>, we generated several input variables with the expectation that some patterns would appear on each variable, as shown in <xref ref-type="table" rid="table3">Table 3</xref>. These conjectures are based on existing studies on students’ mental health and suicide [<xref ref-type="bibr" rid="ref37">37</xref>], shared knowledge among experts, or authors’ clinical experiences at the university.</p>
        <p>To deal with the content of answers to the free description question (<italic>What you want to tell us and questions</italic>), the answers were analyzed using KH Coder [<xref ref-type="bibr" rid="ref38">38</xref>,<xref ref-type="bibr" rid="ref39">39</xref>], a free text mining analysis software. First, words that appeared ≥10 times were clustered using the Ward method, and Jaccard distances between clusters were calculated. Six clusters were adopted for interpretation. Second, each free description was labeled as 0 or 1 for each cluster. If words in a cluster did not appear in a free description, the description was labeled as 0 for the cluster; if words contained in the cluster appeared even once in a free description, the description was labeled as 1 for the cluster. Cluster 1 contained, among other words, “counseling,” “current,” and “under treatment.” Cluster 2 contained, among other words, “syndrome,” “surgery,” and “diagnosis.” Cluster 3 contained, among other words, “menstruation” and “anemia.” Cluster 4 contained, among other words, “left,” “ear,” and “right.” Cluster 5 contained, among other words, “depression,” “mental,” “stress,” and “anxiety.” Cluster 6 contained, among other words, “hospital,” “allergy,” and “skin.”</p>
        <p>This study examined the effectiveness of answering time in predicting mental health problems. <xref ref-type="table" rid="table4">Table 4</xref> lists the answering time–related input variables.</p>
        <p>The 2 coordinates Xs and Ys represent the position of the time stamp in a 24-hour clock and are introduced to indicate that 0:00 and 24:00 are identical. They were calculated by</p>
        <disp-formula>
        X<sub>s</sub> = cos([s / 43200]π), Y<sub>s</sub> = sin([s / 43200]π) <bold>(1)</bold>
        </disp-formula>
        <p>where <italic>s</italic> is the number of seconds elapsed in a day; for instance, when the time stamp is 13:34:42, <italic>s</italic> will be 13 × 3600 + 34 × 60 + 42 = 48882. RT-related variables were included as the first and second principal component scores because the RT of every single item is difficult to interpret, and these RTs can moderately affect the prediction.</p>
        <p>Except for the text-mining analysis, the abovementioned feature engineering processes were executed using the R programming language [<xref ref-type="bibr" rid="ref40">40</xref>] on a Windows 10 machine, with the missMDA package [<xref ref-type="bibr" rid="ref41">41</xref>] for principal components analysis with missing data.</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Generated variables and possible conjecture.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="550"/>
            <col width="450"/>
            <thead>
              <tr valign="top">
                <td>Item</td>
                <td>Conjecture</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>The academic year of admission (the values in the data were between 2012 and 2020)</td>
                <td>There may be a cohort effect.</td>
              </tr>
              <tr valign="top">
                <td>An indicator to show how many years after age 18 (standard in Japan) the student was enrolled (2750 students were never retained , while 811 were retained)</td>
                <td>Some enrollments over the standard age may have reflected or caused some problems including mental health problems.</td>
              </tr>
              <tr valign="top">
                <td>An indicator to show how many years the respondent had ever been retained (3527 students were never retained, while 34 were retained)</td>
                <td>Some students who repeated school years may have had some mental health problems.</td>
              </tr>
              <tr valign="top">
                <td>The number of unanswered items</td>
                <td>Students with mental health problems may hesitate to answer or miss many items.</td>
              </tr>
              <tr valign="top">
                <td>The number of characters in answer to the free description question, <italic>what you want to tell us and questions</italic></td>
                <td>Students with mental health problems may write a lot in free descriptions to make the university aware of their difficulty.</td>
              </tr>
              <tr valign="top">
                <td>Dummy variables for including 6 specific word clusters<sup>a</sup></td>
                <td>Some students with mental health problems may have used specific words in common and expressions in the free description.</td>
              </tr>
              <tr valign="top">
                <td>Number of “yes” answers in <italic>case history</italic> and <italic>nine questions about campus life</italic></td>
                <td>Students with mental health problems may have experienced some diseases or campus life problems.</td>
              </tr>
              <tr valign="top">
                <td>The proportion of “yes” answers to each item in <italic>nine questions about campus life</italic> in the respondent’s department</td>
                <td>Some students who belonged to departments with many students with campus life problems may have felt stress.</td>
              </tr>
              <tr valign="top">
                <td>The number of students and the proportion of same-sex students in the respondent’s department</td>
                <td>Some students who belonged to the departments which have few same-sex students may have had difficulty in communication and relationships.</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table3fn1">
              <p><sup>a</sup>Cluster 1 contained, among other words, “counseling,” “current,” and “under treatment.” Cluster 2 contained, among other words, “syndrome,” “surgery,” and “diagnosis.” Cluster 3 contained, among other words, “menstruation” and “anemia.” Cluster 4 contained, among other words, “left,” “ear,” and “right.” Cluster 5 contained, among other words, “depression,” “mental,” “stress,” and “anxiety.” Cluster 6 contained, among other words, “hospital,” “allergy,” and “skin.”</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
        <table-wrap position="float" id="table4">
          <label>Table 4</label>
          <caption>
            <p>Generated variables based on answering time and possible conjecture.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Item</td>
                <td>Conjecture</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>Answer date (the number of days elapsed between the survey announcement and the completion of survey by a student)</td>
                <td>Students with mental health problems (eg, procrastination traits and, lack of information gathering) may answer the survey later.</td>
              </tr>
              <tr valign="top">
                <td>RT<sup>a</sup> per character in the free description question <italic>what you want to tell us and questions</italic></td>
                <td>Some students who wrote smooth free descriptions may have had some health problem to tell the university.</td>
              </tr>
              <tr valign="top">
                <td>2D-dimensional coordinates of response time stamps<sup>b</sup></td>
                <td>Response time stamps may have reflected students’ life rhythm and sleep quality, which may be related to mental health state.</td>
              </tr>
              <tr valign="top">
                <td>Kernel density of <italic>s</italic></td>
                <td>Some students who answered at different times compared with others may have had problems with life rhythm and sleep quality, which may be related to mental health problems.</td>
              </tr>
              <tr valign="top">
                <td>2 principal components scores of log-transformed standardized RTs of all items</td>
                <td>Students with mental health problems may spend a longer or shorter time on specific items than other students.</td>
              </tr>
              <tr valign="top">
                <td>Individual mean and SD of standardized log RTs calculated using all valid responses</td>
                <td>Students with mental health problems may spend, on average, a longer or shorter time answering. Students with mental health problems may spend very different time on different items.</td>
              </tr>
              <tr valign="top">
                <td>2 principal components scores of differences between the standardized log RTs of all items and the individual mean</td>
                <td>Students with mental health problems may spend longer or shorter time on answering specific items than others.</td>
              </tr>
              <tr valign="top">
                <td>2 principal components scores of kernel density of the standardized log RTs of all items</td>
                <td>Students with mental health problems may show peculiar RT patterns.</td>
              </tr>
            </tbody>
          </table>
          <table-wrap-foot>
            <fn id="table4fn1">
              <p><sup>a</sup>RT: response time.</p>
            </fn>
            <fn id="table4fn2">
              <p><sup>b</sup>They were calculated with equation 1.</p>
            </fn>
          </table-wrap-foot>
        </table-wrap>
      </sec>
      <sec>
        <title>Procedure</title>
        <p>In this procedure, we did not split the data into training and test data. This is because the values for the obtained metrics varied considerably depending on the data split owing to data imbalance. Thus, only 5.5% (196/3561) of the students in 2020 and 6.88% (245/3561) in 2021 had a higher risk of mental illness problems as assessed by Kessler 6, including 2.33% (83/3561) of the students who had problems both in 2020 and 2021. Typically, such imbalanced data are dealt with by applying sample weight to equal the total number of positive and negative observations. However, our preliminary comparison performed better when we did not impose sample weights on all candidate models. Therefore, we did not use any particular procedures for dealing with imbalanced data.</p>
        <p>First, we compared the performance of candidate ML models to determine which model to use. The procedure was divided into 2 parts: parameter tuning and performance evaluation. Both parts were conducted based on the following procedure (<italic>K</italic> repeats of 5-fold cross-validation; <xref rid="figure1" ref-type="fig">Figure 1</xref> shows the schema of the procedure):</p>
        <list list-type="order">
          <list-item>
            <p>Randomly shuffle the entire data set and split it into 5 folds so that the positive:negative ratio of the outcome variable is nearly the same among the data sets.</p>
          </list-item>
          <list-item>
            <p>Choose 1 of the 5 data sets as the test data, and train the model using the remaining 4 data sets.</p>
          </list-item>
          <list-item>
            <p>Evaluate the trained model on the test data.</p>
          </list-item>
          <list-item>
            <p>Repeat steps 2 and 3 for each data set.</p>
          </list-item>
          <list-item>
            <p>Calculate the means of 5 data sets on each evaluation metric.</p>
          </list-item>
          <list-item>
            <p>Repeat steps 1 through 5 <italic>K</italic> times.</p>
          </list-item>
          <list-item>
            <p>Calculate the means of <italic>K</italic> repeats on each evaluation metric.</p>
          </list-item>
        </list>
        <p>In the parameter tuning part, the model’s hyperparameters were optimized based on the tree-structured Parzen estimator [<xref ref-type="bibr" rid="ref42">42</xref>]. The log-loss, as a model performance measure, in a specific parameter set was measured by <italic>K</italic>=50 repeats of 5-fold cross-validation. Log-loss at fold <italic>f</italic> of the <italic>k</italic>-th repeat is calculated by</p>
        <disp-formula>
        LogLoss(k,f) = − (1 / n)Σ([y<sub>i</sub>]log[p<sub>i</sub>] + [1 − y<sub>i</sub>]log[1 − p<sub>i</sub>]) <bold>(2)</bold>
        </disp-formula>
        <p>where <italic>y<sub>i</sub></italic> and <italic>p<sub>i</sub></italic> are the realized value and predicted probability of respondent <italic>i</italic>, respectively, and <italic>n</italic> is the number of observations in the fold <italic>f</italic>. As a result, the log-loss for a specific parameter set was obtained by</p>
        <disp-formula>
        LogLoss = (1 / K)Σ(1 / 5)ΣLogLoss(k,f) <bold>(3)</bold>
        </disp-formula>
        <p>All the hyperparameters tuned in this study are summarized in <xref ref-type="table" rid="table5">Table 5</xref> [<xref ref-type="bibr" rid="ref43">43</xref>-<xref ref-type="bibr" rid="ref46">46</xref>]. These parameters can cope with overfitting if they are appropriately tuned. In addition, the learning rate parameters in the GBDT models (eta in XGBoost and learning rate in LightGBM) were fixed at 0.01. Generally, the smaller the learning rate, the more accurate is the prediction, although the computation time increases.</p>
        <p>As a result, the performance in each parameter set was measured as the average of <italic>K</italic>=50 log-losses. Finally, the parameter values that minimize the objective performance measure were adopted, and we proceeded to the performance evaluation. By using the optimized parameter set, we obtained 8 model performance measures (log-loss, Brier loss, area under the curve of receiver operating characteristic curve [AUC-ROC], area under the curve of precision-recall curve [AUC-PR], specificity, precision, recall [also known as sensitivity], and Matthews correlation coefficient [MCC]). Log-loss, Brier loss, AUC-ROC, and AUC-PR are measures based on predictive probability (<italic>p<sub>i</sub></italic>). In contrast, the specificity, precision, recall, and MCC are obtained from the confusion matrix. For example, MCC is calculated as follows:</p>
        <disp-formula><italic>(TP</italic> × <italic>TN</italic> – <italic>FP</italic> × <italic>FN) / √(</italic>[<italic>TP + FP</italic>] × [<italic>TP + FN</italic>] × [<italic>TN + FP</italic>] × [<italic>TN + FN</italic>]<italic>)</italic> <bold>(4)</bold>
        </disp-formula>
        <p>where <italic>TP, TN, FP,</italic> and <italic>FN</italic> are the numbers of true-positive, true-negative, false-positive, and false-negative respondents, respectively. As previously mentioned, this study used imbalanced data. Therefore, we included the AUC-PR and MCC, which are commonly used in such cases [<xref ref-type="bibr" rid="ref47">47</xref>].</p>
        <p>On the basis of the performance measures obtained, we selected the best model. To test the extent to which answering time–related variables contribute to prediction performance in the selected model, we also conducted parameter tuning and performance evaluation phases without all answering time–related variables (shown in <xref ref-type="table" rid="table4">Table 4</xref>). We call the analysis without answering time–related variables “<italic>without</italic> condition, whereas the analysis with all input variables is called <italic>with</italic> condition.</p>
        <p>Furthermore, we calculated feature importance measures (Gain and Shapley additive explanations [SHAP]) on both <italic>with</italic> and <italic>without</italic> conditions. SHAP is based on the Shapley values, the average marginal contribution in game theory. With the firm theoretical basis of game theory, SHAP can explain the extent to which each input variable contributes to the model’s prediction [<xref ref-type="bibr" rid="ref48">48</xref>]. Although several approaches exist for interpreting the prediction, we used SHAP because it is easy to implement and understand. Using the SHAP dependence plot, we can understand the relationship between the actual input value and its effect on the predicted probability. The abovementioned procedures were executed using all the data in <italic>K</italic>=100 repeats of 5-fold cross-validation. After model evaluation, we obtained SHAP dependence plots on several variables to interpret the model prediction.</p>
        <p>All the procedures described in this section were executed using the Julia programming language [<xref ref-type="bibr" rid="ref49">49</xref>] with several libraries: MLJ.jl [<xref ref-type="bibr" rid="ref50">50</xref>], TreeParzen.jl [<xref ref-type="bibr" rid="ref51">51</xref>], ScikitLearn.jl [<xref ref-type="bibr" rid="ref52">52</xref>], LightGBM.jl [<xref ref-type="bibr" rid="ref53">53</xref>], and ShapML.jl [<xref ref-type="bibr" rid="ref54">54</xref>]. Compared with several famous languages, such as R and Python, Julia is still a young language and is rapidly developing. However, it is already perceived as sufficiently stable to be used for research purposes [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Flowchart of 5-fold cross-validation in each part.</p>
          </caption>
          <graphic xlink:href="mental_v10i1e42420_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table5">
          <label>Table 5</label>
          <caption>
            <p>Hyperparameters of each model tuned in the parameter tuning part.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="420"/>
            <col width="0"/>
            <col width="550"/>
            <thead>
              <tr valign="top">
                <td colspan="3">Model and hyperparameter</td>
                <td>Description</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Elastic net</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>gamma</td>
                <td colspan="2">Strength of the L1 regularization</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>lambda</td>
                <td colspan="2">Strength of the L2 regularization</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Random forest</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>n_estimators</td>
                <td colspan="2">The number of trees in the forest</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>max_depth</td>
                <td colspan="2">The maximum depth of the tree</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>min_samples_leaf</td>
                <td colspan="2">The minimum number of samples required to be at a leaf node.</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>max_features</td>
                <td colspan="2">The proportion of features used in each tree</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>max_samples</td>
                <td colspan="2">The proportion of samples used in each tree</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>XGBoost</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>num_round</td>
                <td colspan="2">The number of boosting iterations</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>max_depth</td>
                <td colspan="2">The maximum depth of the tree</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>min_child_weight</td>
                <td colspan="2">Minimum sum of instance weight needed in a child</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>alpha</td>
                <td colspan="2">Strength of the L1 regularization</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>lambda</td>
                <td colspan="2">Strength of the L2 regularization</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>colsample_bytree</td>
                <td colspan="2">The proportion of features used in each tree</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>subsample</td>
                <td colspan="2">The proportion of samples used in each tree</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>LightGBM</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>num_iterations</td>
                <td colspan="2">The number of boosting iterations</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>num_leaves</td>
                <td colspan="2">The maximum number of leaves in 1 tree</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>max_depth</td>
                <td colspan="2">The maximum depth of the tree</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>min_deta_in_leaf</td>
                <td colspan="2">The minimal amount of data in 1 leaf</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>lambda_l1</td>
                <td colspan="2">Strength of the L1 regularization</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>lambda_l2</td>
                <td colspan="2">Strength of the L2 regularization</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>feature_fraction</td>
                <td colspan="2">The proportion of features used in each tree</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>bagging_fraction</td>
                <td colspan="2">The proportion of samples used in each tree</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p><xref ref-type="table" rid="table6">Tables 6</xref> and <xref ref-type="table" rid="table7">7</xref> summarize mean and SD of each model’s performance measures. As explained in <italic>Procedure</italic> section, the resultant values shown in <xref ref-type="table" rid="table6">Tables 6</xref> and <xref ref-type="table" rid="table7">7</xref> are the means and SDs calculated from 100 trials. Italicized variables indicate the best model in terms of each measure. Evidently, the elastic net and LightGBM performed best. Regarding probabilistic measures (<xref ref-type="table" rid="table6">Table 6</xref>), elastic net afforded slightly better values than LightGBM. By contrast, binary measures, which were calculated from the confusion matrix (<xref ref-type="table" rid="table7">Table 7</xref>), were apparently better at LightGBM. <xref rid="figure2" ref-type="fig">Figure 2</xref> shows the confusion matrix obtained from the elastic net and LightGBM in analyses 1 and 2. The actual values given below the percentages in each cell are the averages of K=100 repeats. In analysis 1, LightGBM misclassified only 11.27 (SD 1.75) observations (5.02, SD 1.58 false positives and 6.25, SD 1.18 false negatives) out of 3561 on average, whereas elastic net misclassified more than twice (average 25.94, SD 2.49) as many observations as LightGBM. Similar results were obtained in analysis 2. On the basis of these outcomes, we report the results for LightGBM.</p>
      <p><xref ref-type="table" rid="table8">Table 8</xref> presents a comparison of the performances of LightGBM measures between <italic>with</italic> and <italic>without</italic> conditions. In contrast to our expectations, these results were mixed. This implies that the use of answering time–related variables does not necessarily improve the prediction.</p>
      <p><xref ref-type="table" rid="table9">Tables 9</xref>-<xref ref-type="table" rid="table12">12</xref> show the top 10 input variables ranked by Gain and SHAP importance. SHAP importance was calculated as the average absolute value of all respondents. The number of “yes” answers to nine questions about campus life had the highest impact regardless of the analyses, conditions, and feature importance measures (<xref ref-type="table" rid="table9">Tables 9</xref>-<xref ref-type="table" rid="table12">12</xref>). In <xref ref-type="table" rid="table9">Table 9</xref> (Gain in with condition), 5 of the top 10 input variables are answering time–related variables. In <xref ref-type="table" rid="table10">Table 10</xref> (Gain in without condition), hours of internet use, years of university, and proportion of the same sex in the department were ranked common to both analyses 1 and 2, in addition to variables related to nine questions about campus life. In <xref ref-type="table" rid="table11">Table 11</xref> (SHAP in with condition), input variables from nine questions about campus life and answering time–related input variables mainly occupied the top 10 variables in analysis 1. In analysis 2, answering time–related input variables were out of rank, whereas years of university, the academic year of admission, diet-related variables, and proportion of the same sex in the department were ranked. In <xref ref-type="table" rid="table12">Table 12</xref> (SHAP in without condition), years of university, academic year of admission, and diet-related variables were ranked common to both analyses 1 and 2 in addition to variables related to nine questions about campus life.</p>
      <table-wrap position="float" id="table6">
        <label>Table 6</label>
        <caption>
          <p>Probabilistic performance measures of each model.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="210"/>
          <col width="180"/>
          <col width="180"/>
          <col width="180"/>
          <col width="220"/>
          <thead>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td>Log-loss, mean (SD)</td>
              <td>Brier loss, mean (SD)</td>
              <td>AUC-ROC<sup>a</sup>, mean (SD)</td>
              <td>AUC-PR<sup>b</sup>, mean (SD)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="6">
                <bold>Analysis 1</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Logistic regression</td>
              <td>0.252 (0.012)</td>
              <td>0.109 (0.003)</td>
              <td>0.760 (0.012)</td>
              <td>0.215 (0.013)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Elastic net</td>
              <td>
                <italic>0.164 (0.001)</italic>
                <sup>c</sup>
              </td>
              <td>
                <italic>0.090 (0.001)</italic>
              </td>
              <td>
                <italic>0.862 (0.003)</italic>
              </td>
              <td>
                <italic>0.292 (0.010)</italic>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Random forest</td>
              <td>0.210 (0.008)</td>
              <td>0.113 (0.001)</td>
              <td>0.833 (0.005)</td>
              <td>0.218 (0.010)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>XGBoost</td>
              <td>0.165 (0.001)</td>
              <td>0.091 (0.001)</td>
              <td>0.855 (0.003)</td>
              <td>0.278 (0.009)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>LightGBM</td>
              <td>0.165 (0.001)</td>
              <td>
                <italic>0.090 (0.001)</italic>
              </td>
              <td>0.857 (0.003)</td>
              <td>0.281 (0.010)</td>
            </tr>
            <tr valign="top">
              <td colspan="6">
                <bold>Analysis 2</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Logistic regression</td>
              <td>0.342 (0.015)</td>
              <td>0.140 (0.003)</td>
              <td>0.696 (0.009)</td>
              <td>0.178 (0.011)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Elastic net</td>
              <td>
                <italic>0.211 (0.001)</italic>
              </td>
              <td>
                <italic>0.115 (0.001)</italic>
              </td>
              <td>
                <italic>0.796 (0.004)</italic>
              </td>
              <td>
                <italic>0.264 (0.008)</italic>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Random forest</td>
              <td>0.250 (0.002)</td>
              <td>0.140 (0.001)</td>
              <td>0.768 (0.005)</td>
              <td>0.200 (0.007)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>XGBoost</td>
              <td>0.213 (0.001)</td>
              <td>0.116 (0.001)</td>
              <td>0.791 (0.004)</td>
              <td>0.249 (0.008)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>LightGBM</td>
              <td>0.213 (0.001)</td>
              <td>0.116 (0.001)</td>
              <td>0.789 (0.004)</td>
              <td>0.246 (0.009)</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table6fn1">
            <p><sup>a</sup>AUC-ROC: area under the curve of receiver operating characteristic curve.</p>
          </fn>
          <fn id="table6fn2">
            <p><sup>b</sup>AUC-PR: area under the curve of precision-recall curve.</p>
          </fn>
          <fn id="table6fn3">
            <p><sup>c</sup>Italicized variables indicate the best model in terms of each measure.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table7">
        <label>Table 7</label>
        <caption>
          <p>Performance measures on each model from confusion matrix.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="230"/>
          <col width="180"/>
          <col width="180"/>
          <col width="180"/>
          <col width="200"/>
          <thead>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td>Specificity, mean (SD)</td>
              <td>Precision, mean (SD)</td>
              <td>Recall, mean (SD)</td>
              <td>MCC<sup>a</sup>, mean (SD)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="6">
                <bold>Analysis 1</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Logistic regression</td>
              <td>0.977 (0.002)</td>
              <td>0.681 (0.020)</td>
              <td>0.823 (0.015)</td>
              <td>0.732 (0.016)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Elastic net</td>
              <td>0.996 (0.001)</td>
              <td>0.934 (0.009)</td>
              <td>0.936 (0.009)</td>
              <td>0.931 (0.007)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Random forest</td>
              <td>0.976 (0.002)</td>
              <td>0.681 (0.022)</td>
              <td>0.859 (0.018)</td>
              <td>0.749 (0.017)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>XGBoost</td>
              <td>0.998 (0.001)</td>
              <td>0.963 (0.008)</td>
              <td>0.963 (0.006)</td>
              <td>0.961 (0.005)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>LightGBM</td>
              <td>
                <italic>0.999 (0.000)</italic>
                <sup>b</sup>
              </td>
              <td>
                <italic>0.975 (0.008)</italic>
              </td>
              <td>
                <italic>0.968 (0.006)</italic>
              </td>
              <td>
                <italic>0.970 (0.005)</italic>
              </td>
            </tr>
            <tr valign="top">
              <td colspan="6">
                <bold>Analysis 2</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Logistic regression</td>
              <td>0.976 (0.002)</td>
              <td>0.730 (0.018)</td>
              <td>0.884 (0.012)</td>
              <td>0.787 (0.013)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Elastic net</td>
              <td>0.998 (0.001)</td>
              <td>0.970 (0.006)</td>
              <td>0.963 (0.005)</td>
              <td>0.964 (0.004)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Random forest</td>
              <td>0.967 (0.002)</td>
              <td>0.662 (0.017)</td>
              <td>0.857 (0.015)</td>
              <td>0.732 (0.014)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>XGBoost</td>
              <td>0.998 (0.000)</td>
              <td>0.977 (0.005)</td>
              <td>0.987 (0.004)</td>
              <td>0.981 (0.004)</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>LightGBM</td>
              <td>
                <italic>0.999 (0.000)</italic>
              </td>
              <td>
                <italic>0.984 (0.005)</italic>
              </td>
              <td>
                <italic>0.990 (0.004)</italic>
              </td>
              <td>
                <italic>0.986 (0.003)</italic>
              </td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table7fn1">
            <p><sup>a</sup>MCC: Matthews correlation coefficient.</p>
          </fn>
          <fn id="table7fn2">
            <p><sup>b</sup>Italicized variables indicate the best model in terms of each measure.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <fig id="figure2" position="float">
        <label>Figure 2</label>
        <caption>
          <p>Confusion matrices on the elastic net (left half) and LightGBM (right half).</p>
        </caption>
        <graphic xlink:href="mental_v10i1e42420_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <table-wrap position="float" id="table8">
        <label>Table 8</label>
        <caption>
          <p>Performance measures of with and without conditions on LightGBM.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="310"/>
          <col width="140"/>
          <col width="150"/>
          <col width="0"/>
          <col width="140"/>
          <col width="260"/>
          <thead>
            <tr valign="top">
              <td>Measure</td>
              <td colspan="3">Analysis 1</td>
              <td colspan="2">Analysis 2</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td><italic>With</italic>, mean (SD)</td>
              <td><italic>Without</italic>, mean (SD)</td>
              <td colspan="2"><italic>With</italic>, mean (SD)</td>
              <td><italic>Without</italic>, mean (SD)</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td>Log-loss</td>
              <td>
                <italic>0.165 (0.001)</italic>
                <sup>a</sup>
              </td>
              <td>
                <italic>0.165 (0.001)</italic>
              </td>
              <td colspan="2">0.213 (0.001)</td>
              <td>
                <italic>0.211 (0.001)</italic>
              </td>
            </tr>
            <tr valign="top">
              <td>Brier loss</td>
              <td>
                <italic>0.090 (0.001)</italic>
              </td>
              <td>
                <italic>0.090 (0.001)</italic>
              </td>
              <td colspan="2">0.116 (0.001)</td>
              <td>
                <italic>0.115 (0.001)</italic>
              </td>
            </tr>
            <tr valign="top">
              <td>AUC-ROC<sup>b</sup></td>
              <td>0.857 (0.003)</td>
              <td>
                <italic>0.858 (0.003)</italic>
              </td>
              <td colspan="2">0.789 (0.004)</td>
              <td>
                <italic>0.798 (0.004)</italic>
              </td>
            </tr>
            <tr valign="top">
              <td>AUC-PR<sup>c</sup></td>
              <td>
                <italic>0.281 (0.010)</italic>
              </td>
              <td>0.276 (0.010)</td>
              <td colspan="2">0.246 (0.009)</td>
              <td>
                <italic>0.260 (0.010)</italic>
              </td>
            </tr>
            <tr valign="top">
              <td>Specificity</td>
              <td>
                <italic>0.999 (0.000)</italic>
              </td>
              <td>0.998 (0.000)</td>
              <td colspan="2">
                <italic>0.999 (0.000)</italic>
              </td>
              <td>0.998 (0.001)</td>
            </tr>
            <tr valign="top">
              <td>Precision</td>
              <td>
                <italic>0.975 (0.008)</italic>
              </td>
              <td>0.974 (0.008)</td>
              <td colspan="2">
                <italic>0.984 (0.005)</italic>
              </td>
              <td>0.970 (0.007)</td>
            </tr>
            <tr valign="top">
              <td>Recall</td>
              <td>0.968 (0.006)</td>
              <td>
                <italic>0.981 (0.007)</italic>
              </td>
              <td colspan="2">
                <italic>0.990 (0.004)</italic>
              </td>
              <td>0.977 (0.005)</td>
            </tr>
            <tr valign="top">
              <td>MCC<sup>d</sup></td>
              <td>0.970 (0.005)</td>
              <td>
                <italic>0.976 (0.005)</italic>
              </td>
              <td colspan="2">
                <italic>0.986 (0.003)</italic>
              </td>
              <td>0.971 (0.004)</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table8fn1">
            <p><sup>a</sup>Italicized variables indicate the best model in terms of each measure.</p>
          </fn>
          <fn id="table8fn2">
            <p><sup>b</sup>AUC-ROC: area under the curve of receiver operating characteristic curve.</p>
          </fn>
          <fn id="table8fn3">
            <p><sup>c</sup>AUC-PR: area under the curve of precision-recall curve.</p>
          </fn>
          <fn id="table8fn4">
            <p><sup>d</sup>MCC: Matthews correlation coefficient.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table9">
        <label>Table 9</label>
        <caption>
          <p>Top 10 input variables ranked by Gain (with answering time condition).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="700"/>
          <col width="270"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Input variable</td>
              <td>Gain</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="3">
                <bold>Analysis 1</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Nine questions about campus life (number of “yes”)</td>
              <td>0.216</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I have a strong anxiety about my campus life.”</td>
              <td>0.088</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I’m worried about my future.”</td>
              <td>0.033</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2nd principal component score of <italic>Diff</italic><sub><italic>RT</italic></sub><sup>a</sup></td>
              <td>0.031</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2nd principal component score of <italic>Dens</italic><sub><italic>RT</italic></sub><sup>b</sup></td>
              <td>0.030</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>x coordinate of response time stamp</td>
              <td>0.026</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Mean of “I had some trouble with someone close to me” in department</td>
              <td>0.025</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Individual mean of standardized log RT<sup>c</sup></td>
              <td>0.021</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>1st principal component score of <italic>Diff</italic><sub><italic>RT</italic></sub></td>
              <td>0.021</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I always feel busy with my academic work.”</td>
              <td>0.020</td>
            </tr>
            <tr valign="top">
              <td colspan="3">
                <bold>Analysis 2</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Nine questions about campus life (number of “yes”)</td>
              <td>0.131</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I have a strong anxiety about my campus life.”</td>
              <td>0.080</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>y coordinate of response time stamp</td>
              <td>0.029</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2nd principal component score of <italic>Diff</italic><sub><italic>RT</italic></sub></td>
              <td>0.028</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Years of university</td>
              <td>0.026</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Individual SD of <italic>Dens</italic><sub><italic>RT</italic></sub></td>
              <td>0.024</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>1st principal component score of standardized log RT</td>
              <td>0.024</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I’m worried about my future.”</td>
              <td>0.023</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Individual SD of standardized log RT</td>
              <td>0.023</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Kernel density of <italic>s</italic></td>
              <td>0.023</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table9fn1">
            <p><sup>a</sup><italic>Diff<sub>RT</sub></italic> is the difference between the standardized log RT of each item and individual mean.</p>
          </fn>
          <fn id="table9fn2">
            <p><sup>b</sup><italic>Dens<sub>RT</sub></italic> is the kernel density of the standardized log RT of each item.</p>
          </fn>
          <fn id="table9fn3">
            <p><sup>c</sup>RT: response time.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table10">
        <label>Table 10</label>
        <caption>
          <p>Top 10 input variables ranked by Gain (without answering time condition).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="700"/>
          <col width="270"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Input variable</td>
              <td>Gain</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="3">
                <bold>Analysis 1</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Nine questions about campus life (number of “yes”)</td>
              <td>0.200</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I have a strong anxiety about my campus life.”</td>
              <td>0.089</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Mean of “I had some trouble with someone close to me.” in department</td>
              <td>0.035</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>sleeping hours</td>
              <td>0.032</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I'm worried about my future.”</td>
              <td>0.029</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Faculty and department</td>
              <td>0.024</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>years of university</td>
              <td>0.023</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I always feel busy with my academic work.”</td>
              <td>0.023</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Proportion of the same sex in department</td>
              <td>0.023</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Hours of internet use</td>
              <td>0.022</td>
            </tr>
            <tr valign="top">
              <td colspan="3">
                <bold>Analysis 2</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Nine questions about campus life (number of “yes”)</td>
              <td>0.143</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I have a strong anxiety about my campus life.”</td>
              <td>0.119</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I'm worried about my future.”</td>
              <td>0.047</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I always feel busy with my academic work.”</td>
              <td>0.031</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Proportion of the same sex in department</td>
              <td>0.031</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Years of university</td>
              <td>0.030</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“It takes me a long time to get used to new surroundings.”</td>
              <td>0.030</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>The academic year of admission</td>
              <td>0.028</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Hours of internet use</td>
              <td>0.027</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Mean of “I have a strong anxiety about my campus life” in department</td>
              <td>0.023</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <table-wrap position="float" id="table11">
        <label>Table 11</label>
        <caption>
          <p>Top 10 input variables ranked by Shapley additive explanations (SHAP; with answering time condition).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="700"/>
          <col width="270"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Input variable</td>
              <td>SHAP</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="3">
                <bold>Analysis 1</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Nine questions about campus life (number of “yes”)</td>
              <td>0.027</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I have a strong anxiety about my campus life.”</td>
              <td>0.015</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I’m worried about my future.”</td>
              <td>0.006</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Mean of “I had some trouble with someone close to me.” in department</td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2nd principal component score of <italic>Dens</italic><sub><italic>RT</italic></sub><sup><italic>a</italic></sup></td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I always feel busy with my academic work.”</td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>2nd principal component score of <italic>Diff</italic><sub><italic>RT</italic></sub><sup><italic>b</italic></sup></td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Years of university</td>
              <td>0.004</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“It takes me a long time to get used to new surroundings.”</td>
              <td>0.004</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>x coordinate of response time stamp</td>
              <td>0.003</td>
            </tr>
            <tr valign="top">
              <td colspan="3">
                <bold>Analysis 2</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Nine questions about campus life (number of “yes”)</td>
              <td>0.019</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I have a strong anxiety about my campus life.”</td>
              <td>0.016</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Years of university</td>
              <td>0.006</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I’m worried about my future.”</td>
              <td>0.006</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>The academic year of admission</td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“It takes me a long time to get used to new surroundings.”</td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Have meals (breakfast)</td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I always feel busy with my academic work.”</td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Have lost over 3 kg in a month (presently)</td>
              <td>0.004</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Proportion of the same sex in department</td>
              <td>0.004</td>
            </tr>
          </tbody>
        </table>
        <table-wrap-foot>
          <fn id="table11fn1">
            <p><sup>a</sup><italic>Dens<sub>RT</sub></italic> is the kernel density of the standardized log RT of each item.</p>
          </fn>
          <fn id="table11fn2">
            <p><sup>b</sup><italic>Diff<sub>RT</sub></italic> is the difference between the standardized log RT of each item and individual mean.</p>
          </fn>
        </table-wrap-foot>
      </table-wrap>
      <table-wrap position="float" id="table12">
        <label>Table 12</label>
        <caption>
          <p>Top 10 input variables ranked by Shapley additive explanations (SHAP; without answering time condition).</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="700"/>
          <col width="270"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Input variable</td>
              <td>SHAP</td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="3">
                <bold>Analysis 1</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Nine questions about campus life (number of “yes”)</td>
              <td>0.028</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I have a strong anxiety about my campus life.”</td>
              <td>0.015</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Mean of “I had some trouble with someone close to me.” in department</td>
              <td>0.006</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I’m worried about my future.”</td>
              <td>0.006</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Years of university</td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I always feel busy with my academic work.”</td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>The academic year of admission</td>
              <td>0.003</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“It takes me a long time to get used to new surroundings.”</td>
              <td>0.003</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Sleeping hours</td>
              <td>0.003</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Have lost over 3 kg in a month</td>
              <td>0.003</td>
            </tr>
            <tr valign="top">
              <td colspan="3">
                <bold>Analysis 2</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I have a strong anxiety about my campus life.”</td>
              <td>0.018</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Nine questions about campus life (number of “yes”)</td>
              <td>0.016</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I’m worried about my future.”</td>
              <td>0.008</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>The academic year of admission</td>
              <td>0.007</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“I always feel busy with my academic work.”</td>
              <td>0.007</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Years of university</td>
              <td>0.007</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>“It takes me a long time to get used to new surroundings.”</td>
              <td>0.007</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Have meals (breakfast)</td>
              <td>0.006</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Have lost over 3 kg in a month (presently)</td>
              <td>0.005</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Age</td>
              <td>0.004</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <p><xref rid="figure3" ref-type="fig">Figures 3</xref>-<xref rid="figure8" ref-type="fig">8</xref> show SHAP dependence plots or violin plots of some interpretable input variables with high feature importance on average: the number of “yes” answers to <italic>nine questions about campus life</italic>, sleeping hours, years of university, proportion of the same sex in respondent’s department, xy coordinates of RT stamp, and answer date. The blue lines indicate smoothed conditional mean based on the generalized additive model. <xref rid="figure3" ref-type="fig">Figure 3</xref> shows that the averages of the SHAP effect were positive for ≥5 “yes” answers in 9 questions in common to both analyses 1 and 2, indicating that many campus life problems increased predictive probability. <xref rid="figure4" ref-type="fig">Figure 4</xref> shows that the averages of the SHAP effect were positive for &#60;6 hours or &#62;8 hours of sleep, indicating that too short or too long sleep increased predictive probability. <xref rid="figure5" ref-type="fig">Figure 5</xref> shows that the averages of the SHAP effect were positive for third- or higher-year students. Focusing on second-year students, the averages of the SHAP effect were positive in analysis 1 and negative in analysis 2, indicating that predictive probability decreased. <xref rid="figure6" ref-type="fig">Figure 6</xref> shows that the averages of the SHAP effect were positive for fewer proportion of the same sex in the department, indicating high predictive probability. All the top 5 departments with a low proportion of the same sex were in the faculty of science and engineering; female students were 2.8% (4/141) to 14.4% (18/125). The proportion of men in the international department was only 17.1% (32/187).</p>
      <p><xref rid="figure7" ref-type="fig">Figure 7</xref> shows the SHAP dependence plot on xy coordinates of the RT stamp. Both axes represent the realized values of the input. The correspondence between the RT stamp and the coordinates is shown in the graph. For example, if an answer was recorded at 00:00 (midnight), its RT stamp was transformed to (x,y)=(1,0). Red dots were plotted in conjunction with the sum of the SHAP values on the x and x coordinates. Their dots move outside the thick black circle (x<sup>2</sup> + y<sup>2</sup> = 1) if the sum is positive. As a result, if a respondent’s answer was recorded at 00:00 (midnight) and the sum of SHAP values was 0.02, a red dot according to the respondent was plotted at (x,y)=(1,0)*0.02*10=(1.2,0). Note that 10 is the magnification ratio determined arbitrarily for visibility. The thin black lines are circles of x<sup>2</sup>+y<sup>2</sup>=0.8,0.9,1.1,1.2, indicating SHAP values of −0.02, −0.01, 0.01, and 0.02. The figure suggests that respondents whose answers were recorded at midnight tended to show large SHAP values, indicating a high predictive probability. By contrast, those whose answers were recorded in the morning (approximately 7:00-11:00) or afternoon (approximately 13:00-17:00) were plotted inside the thick black circle, indicating negative SHAP values. <xref rid="figure8" ref-type="fig">Figure 8</xref> suggests that an ascending relationship exists between the answer date and SHAP. This indicates that students who responded to the survey more than 9 to 10 days after the announcement were more likely to be predicted as having mental health problems.</p>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Shapley additive explanations (SHAP) dependence plot of the number of “yes” answers to 9 questions about campus life on “with” condition (left: analysis 1; right: analysis 2).</p>
        </caption>
        <graphic xlink:href="mental_v10i1e42420_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure4" position="float">
        <label>Figure 4</label>
        <caption>
          <p>Shapley additive explanations (SHAP) dependence plot of sleeping hours (analysis 1, “without” condition).</p>
        </caption>
        <graphic xlink:href="mental_v10i1e42420_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure5" position="float">
        <label>Figure 5</label>
        <caption>
          <p>Shapley additive explanations (SHAP) violin plot of years of university on “with” condition (left: analysis 1; right: analysis 2).</p>
        </caption>
        <graphic xlink:href="mental_v10i1e42420_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure6" position="float">
        <label>Figure 6</label>
        <caption>
          <p>Shapley additive explanations (SHAP) dependence plot of the proportion of the same sex in respondent’s department (analysis 2, “with” condition).</p>
        </caption>
        <graphic xlink:href="mental_v10i1e42420_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure7" position="float">
        <label>Figure 7</label>
        <caption>
          <p>Shapley additive explanations (SHAP) dependence plot of xy coordinates of response time stamp (analysis 1, “with” condition).</p>
        </caption>
        <graphic xlink:href="mental_v10i1e42420_fig7.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <fig id="figure8" position="float">
        <label>Figure 8</label>
        <caption>
          <p>Shapley additive explanations (SHAP) dependence plot of answer date (analysis 2, “with” condition).</p>
        </caption>
        <graphic xlink:href="mental_v10i1e42420_fig8.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Among all the models, elastic net and LightGBM performed the best in analyses 1 and 2 (<xref ref-type="table" rid="table6">Tables 6</xref> and <xref ref-type="table" rid="table7">7</xref>). We adopted the LightGBM in this study based on the confusion matrix (<xref rid="figure2" ref-type="fig">Figure 2</xref>); however, the elastic net can also have an adequate ability to predict mental health problems not only in real time but also 1 year in the future.</p>
        <p>Some of the answering time findings are listed in <xref ref-type="table" rid="table8">Table 8</xref>. Whether the <italic>with</italic> condition outperformed the <italic>without</italic> condition depended on the performance measure considered. This is possibly because the LightGBM can obtain excellent performance even without answering time–related variables on these data. However, as shown in <xref ref-type="table" rid="table9">Tables 9</xref> and <xref ref-type="table" rid="table11">11</xref>, certain variables are apparently helpful in improving the prediction and affecting the prediction probability. In summary, it is difficult to determine whether we should use answering time–related variables to predict mental health problems.</p>
        <p>Focusing on input variables, those from <italic>nine questions about campus life</italic> improved performance (<xref ref-type="table" rid="table9">Tables 9</xref> and <xref ref-type="table" rid="table10">10</xref>) and were commonly effective for prediction (<xref ref-type="table" rid="table1">Tables 11</xref> and <xref ref-type="table" rid="table12">12</xref>). Comparing Gain and SHAP in <italic>with</italic> condition (<xref ref-type="table" rid="table9">Tables 9</xref> and <xref ref-type="table" rid="table11">11</xref>), it is suggested that some input variables converted from the answering time substantially impacted the learning. With respect to the <italic>without</italic> condition (<xref ref-type="table" rid="table1">Tables 10</xref> and <xref ref-type="table" rid="table12">12</xref>), it is suggested that the input variable, years of university, could improve the prediction to some extent.</p>
      </sec>
      <sec>
        <title>Detailed Discussion on Input Variables</title>
        <p>In <xref ref-type="table" rid="table9">Tables 9</xref>-<xref ref-type="table" rid="table12">12</xref>, the input variables from <italic>nine questions about campus life</italic> held a top-ranking position. In particular, the item “I have a strong anxiety about my campus life” had a stable and powerful influence on prediction. The questions were easy to use because there were only 9 yes or no questions. <xref rid="figure3" ref-type="fig">Figure 3</xref> suggests that students were more likely to have mental health problems when they responded positively to ≥5 items of the 9 questions. Furthermore, the variable <italic>nine questions about campus life</italic> could be used by faculty members to advise student orally in addition to health staff members. Their response will be useful for whole-university support and for early detection.</p>
        <p>Sleeping hours affected learning and prediction more in analysis 2 than in analysis 1 on the “without” condition (<xref ref-type="table" rid="table1">Tables 10</xref> and <xref ref-type="table" rid="table11">11</xref>). This implies that sleeping hours were less effective in learning and predicting mental health problems within 1 year. Sleeping hours may be a fluid measure that is affected by lifestyle and busyness. <xref rid="figure4" ref-type="fig">Figure 4</xref> suggested that 6 to 8 hours of sleep were desirable in terms of mental health.</p>
        <p>In Japan, 7 hours and 22 minutes are the average sleeping hours [<xref ref-type="bibr" rid="ref57">57</xref>]. More than one-third of the students in this survey slept for 7 hours. Sleeping too little or too much is a representative symptom of mental health disorder (eg, depressive disorders) [<xref ref-type="bibr" rid="ref58">58</xref>]. Even without any disorder, sleep diminution because of overwork and busyness could cause mental health problems, and sleeping too much may cause problems in academics. It can be useful for students sleeping &#60;6 or &#62;8 hours to be instructed on how to improve their life rhythm using flyers. Faculty members should keep in mind the need for students to sleep for &#62;6 hours when handing assignments.</p>
        <p>Years of university was an effective parameter in both analyses 1 and 2, and in both with and without conditions (<xref rid="figure5" ref-type="fig">Figure 5</xref>). The average SHAP effect of second-year students indicated that predictive probability decreased in the second year. It was reported that first- and last-year students tend to experience academic stress [<xref ref-type="bibr" rid="ref59">59</xref>]. The results depicted in <xref rid="figure5" ref-type="fig">Figure 5</xref> may imply that students adapt to the campus life from the beginning of the second year to their third year. Although some universities hold health surveys only for first-year students, this study indicated that third- or higher-year students should also be monitored.</p>
        <p><xref rid="figure6" ref-type="fig">Figure 6</xref> is consistent with the hypothesis that some students who belonged to departments with few same-sex students may have had difficulties. By contrast, a low proportion of the same sex in a department equals a high proportion of the other sex in that department, indicating a low predictive probability of the other sex. Considering that even an approximately 0.50 proportion of the same sex in the department showed positive averages of the SHAP effect, it is unclear how much the male:female ratio is desirable for students’ mental health. A low proportion of female students in the science and engineering departments reflected the gap in field of science, technology, engineering, and mathematics. The aspect of sex associated with these data was only male or female; the lesbian, gay, bisexual, transgender, queer community should be considered in future studies. Regardless of sex, being in a minority in a department should be a parameter to be examined; such examinations may afford opportunities for interaction.</p>
        <p>There are certain findings regarding the input variables generated based on answering time. Concerning the RT stamp, the results depicted in <xref rid="figure7" ref-type="fig">Figure 7</xref> were partly consistent with the hypothesis that RT stamps may reflect students’ life rhythm and sleep quality, which may be related to their mental health state. Students whose answers were recorded at midnight may have stayed up late, which may have been related to mental health problems. In contrast, it is unclear why students whose answers were recorded at noon (approximately 12:00) or evening (approximately 18:00) had negative SHAP values. This might suggest that they had been alone when groups of other students enjoyed lunch or after school. RT stamp data have not been used before; such data can be informative for understanding students’ lifestyles. Although the answer date was not ranked in <xref ref-type="table" rid="table9">Tables 9</xref>-<xref ref-type="table" rid="table12">12</xref>, the results depicted in <xref rid="figure8" ref-type="fig">Figure 8</xref> were consistent with the hypothesis that late answer data may have reflected some problems. We believe that the high SHAP of late responses may be caused by the lack of ability to check their emails and obtain essential information from them. Students who answered the survey at a later date should be asked about difficulty in schoolwork (eg, submission of assignments) in health checkup interview. Demonstrating that answering time affects the prediction and learning of mental health problems is meaningful because this parameter can easily be collected through a web survey.</p>
      </sec>
      <sec>
        <title>Limitations</title>
        <p>The data were collected from only one university during COVID-19; therefore, the model cannot be generalized to other universities and ages, whereas the approach can be. Campus life during COVID-19 differed from that without the virus. Moreover, this study could not reveal the condition of the 1994 students who did not provide answers in 2020 and 2021, even though they accounted for a major proportion of the population and may have had some mental health problems. The <italic>nine questions about campus life</italic>, which were the most powerful items in this study, are unique to University A and are not widely used. This model should be tested in other time periods or with other universities’ data. Using this model to call for psychological counseling for students at risk in a specific field is entirely different. This model should be evaluated to determine whether it helps in precisely detecting students experiencing mental health problems and to estimate the impact on cost reduction.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>Students’ mental health problems were predicted in real time and for 1 year in the future. The <italic>nine questions about campus life</italic>, especially the question “I have a strong anxiety about my campus life” was an overwhelmingly powerful item. It was indicated that demographic data (eg, years of university, proportion of the same sex in department, etc) and behavioral data (sleeping hours and answering time), as well as self-rating items were effective.</p>
        <p>The developed model itself should be adjusted for each university because it depends on the items used in the survey of the cooperating university. Nevertheless, this model demonstrates the possibility of synergistically using the characteristics of health surveys and advantages of ML. Consequently, it can be used for predicting mental health status from existing health data without a mental health scale.</p>
        <p>Furthermore, the impact of some items on the prediction was discussed. These findings can improve health survey items and define the criteria for inviting to student counseling. Accurate calls for student counseling will lead to early detection and intervention and operational efficiency.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">AUC-PR</term>
          <def>
            <p>area under the curve of precision-recall curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">AUC-ROC</term>
          <def>
            <p>area under the curve of receiver operating characteristic curve</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">GBDT</term>
          <def>
            <p>gradient boosting decision tree</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">MCC</term>
          <def>
            <p>Matthews correlation coefficient</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb5">ML</term>
          <def>
            <p>machine learning</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb6">RT</term>
          <def>
            <p>response time</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb7">SHAP</term>
          <def>
            <p>Shapley additive explanations</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>During the study, a portion of the interim results was presented at a briefing of the Research Support System for Female Researchers at Kanazawa University and the 85th Annual Convention of the Japanese Psychological Association. The staff at the Health Service Center at Kanazawa University performed data collection. Dr Satoshi Sugiyama (Keio University) and Dr Hiroshi Matsui (Hokkaido University) advised on our analysis. Prof Yumi Adachi (Kanazawa University) supported all processes. The authors would like to thank Editage for English editing.</p>
      <p>The Research Support System supported this work for Female Researchers at Kanazawa University.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>AB contributed to the conceptualization, methodology, investigation, resources, data curation, writing—original draft, writing—review and editing, visualization, supervision, project administration, and funding acquisition. KB contributed to conceptualization, methodology, software, formal analysis, data curation, writing—original draft, writing—review and editing, and visualization.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Furukawa</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Outcomes in psychological counseling. Shinri sodan ni okeru tenki ni tsuite</article-title>
          <source>Campus Health</source>
          <year>2020</year>
          <month>6</month>
          <volume>57</volume>
          <issue>2</issue>
          <fpage>56</fpage>
          <lpage>63</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://health-uv.umin.ac.jp/members/pdf/ch57_2/11.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hayakawa</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Implementation of the mental health survey: limitations and future challenges of the survey. Seishin kenko chosa no jisshi jyokyo: chosa no genkai to kongo no kadai</article-title>
          <source>Campus Health</source>
          <year>2020</year>
          <month>6</month>
          <volume>57</volume>
          <issue>2</issue>
          <fpage>51</fpage>
          <lpage>5</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://health-uv.umin.ac.jp/members/pdf/ch57_2/10.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hirayama</surname>
              <given-names>K</given-names>
            </name>
            <collab>Japanese Association for College Mental Health</collab>
          </person-group>
          <source>User Guide for the UPI. UPI riyo no tebiki</source>
          <year>2011</year>
          <publisher-loc>Tokyo, Japan</publisher-loc>
          <publisher-name>Sozo-shuppan</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>DP</given-names>
            </name>
          </person-group>
          <source>Manual of the General Health Questionnaire</source>
          <year>1978</year>
          <publisher-loc>Berkshire, UK</publisher-loc>
          <publisher-name>NFER-Nelson Publishers</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Goldberg</surname>
              <given-names>DP</given-names>
            </name>
            <name name-style="western">
              <surname>Hillier</surname>
              <given-names>VF</given-names>
            </name>
          </person-group>
          <article-title>A scaled version of the General Health Questionnaire</article-title>
          <source>Psychol Med</source>
          <year>1979</year>
          <month>02</month>
          <volume>9</volume>
          <issue>1</issue>
          <fpage>139</fpage>
          <lpage>45</lpage>
          <pub-id pub-id-type="doi">10.1017/s0033291700021644</pub-id>
          <pub-id pub-id-type="medline">424481</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sakai</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Noguchi</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Comparison of tests of mental health for student counseling: formation of a common measure. Daigakusei wo taisyo toshita seishintekikenkodochosa no kyotsusyakudoka niyoru hikakukento</article-title>
          <source>Jpn J Educ Psychol</source>
          <year>2015</year>
          <volume>63</volume>
          <issue>2</issue>
          <fpage>111</fpage>
          <lpage>20</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jstage.jst.go.jp/article/jjep/63/2/63_111/_article/-char/ja/"/>
          </comment>
          <pub-id pub-id-type="doi">10.5926/jjep.63.111</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Inaki</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Arai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kato</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Takeuch</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Early detection and support of mental health issues through the university personality inventory (UPI) in student counseling</article-title>
          <source>Bull Research Jin-Ai Univ Faculty of Human Studies</source>
          <year>2020</year>
          <month>02</month>
          <day>20</day>
          <volume>18</volume>
          <fpage>1</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.57426/00000868</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McArdle</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Ritschard</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <source>Contemporary Issues in Exploratory Data Mining in the Behavioral Sciences</source>
          <year>2013</year>
          <publisher-loc>London, UK</publisher-loc>
          <publisher-name>Routledge</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobucci</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ammerman</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Alloy</surname>
              <given-names>LB</given-names>
            </name>
            <name name-style="western">
              <surname>Diamond</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Using machine learning to classify suicide attempt history among youth in medical care settings</article-title>
          <source>J Affect Disord</source>
          <year>2020</year>
          <month>05</month>
          <day>01</day>
          <volume>268</volume>
          <fpage>206</fpage>
          <lpage>14</lpage>
          <pub-id pub-id-type="doi">10.1016/j.jad.2020.02.048</pub-id>
          <pub-id pub-id-type="medline">32174479</pub-id>
          <pub-id pub-id-type="pii">S0165-0327(19)33569-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shatte</surname>
              <given-names>AB</given-names>
            </name>
            <name name-style="western">
              <surname>Hutchinson</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Teague</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>Machine learning in mental health: a scoping review of methods and applications</article-title>
          <source>Psychol Med</source>
          <year>2019</year>
          <month>07</month>
          <volume>49</volume>
          <issue>9</issue>
          <fpage>1426</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.1017/S0033291719000151</pub-id>
          <pub-id pub-id-type="medline">30744717</pub-id>
          <pub-id pub-id-type="pii">S0033291719000151</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Thieme</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Belgrave</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Doherty</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Machine learning in mental health: a systematic review of the HCI literature to support the development of effective and implementable ML systems</article-title>
          <source>ACM Trans Comput Hum Interact</source>
          <year>2020</year>
          <month>10</month>
          <day>31</day>
          <volume>27</volume>
          <issue>5</issue>
          <fpage>1</fpage>
          <lpage>53</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/pdf/10.1145/3398069"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3398069</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Naghavi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Teismann</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Asgari</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Mohebbian</surname>
              <given-names>MR</given-names>
            </name>
            <name name-style="western">
              <surname>Mansourian</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mañanas</surname>
              <given-names>MÁ</given-names>
            </name>
          </person-group>
          <article-title>Accurate diagnosis of suicide ideation/behavior using robust ensemble machine learning: a university student population in the Middle East and North Africa (MENA) region</article-title>
          <source>Diagnostics (Basel)</source>
          <year>2020</year>
          <month>11</month>
          <day>16</day>
          <volume>10</volume>
          <issue>11</issue>
          <fpage>956</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=diagnostics10110956"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/diagnostics10110956</pub-id>
          <pub-id pub-id-type="medline">33207776</pub-id>
          <pub-id pub-id-type="pii">diagnostics10110956</pub-id>
          <pub-id pub-id-type="pmcid">PMC7696788</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Burke</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Jacobucci</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Ammerman</surname>
              <given-names>BA</given-names>
            </name>
            <name name-style="western">
              <surname>Piccirillo</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>McCloskey</surname>
              <given-names>MS</given-names>
            </name>
            <name name-style="western">
              <surname>Heimberg</surname>
              <given-names>RG</given-names>
            </name>
            <name name-style="western">
              <surname>Alloy</surname>
              <given-names>LB</given-names>
            </name>
          </person-group>
          <article-title>Identifying the relative importance of non-suicidal self-injury features in classifying suicidal ideation, plans, and behavior using exploratory data mining</article-title>
          <source>Psychiatry Res</source>
          <year>2018</year>
          <month>04</month>
          <volume>262</volume>
          <fpage>175</fpage>
          <lpage>83</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/29453036"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.psychres.2018.01.045</pub-id>
          <pub-id pub-id-type="medline">29453036</pub-id>
          <pub-id pub-id-type="pii">S0165-1781(17)31048-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC6684203</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bagroy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Kumaraguru</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>De Choudhury</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A social media based index of mental well-being in college campuses</article-title>
          <source>Proc SIGCHI Conf Hum Factor Comput Syst</source>
          <year>2017</year>
          <month>05</month>
          <volume>2017</volume>
          <fpage>1634</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28840202"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/3025453.3025909</pub-id>
          <pub-id pub-id-type="medline">28840202</pub-id>
          <pub-id pub-id-type="pmcid">PMC5565736</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sano</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>McHill</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Jaques</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Czeisler</surname>
              <given-names>CA</given-names>
            </name>
            <name name-style="western">
              <surname>Klerman</surname>
              <given-names>EB</given-names>
            </name>
            <name name-style="western">
              <surname>Picard</surname>
              <given-names>RW</given-names>
            </name>
          </person-group>
          <article-title>Recognizing academic performance, sleep quality, stress level, and mental health using personality traits, wearable sensors and mobile phones</article-title>
          <source>Int Conf Wearable Implant Body Sens Netw</source>
          <year>2015</year>
          <month>06</month>
          <volume>2015</volume>
          <fpage>7299420</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/28516162"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/BSN.2015.7299420</pub-id>
          <pub-id pub-id-type="medline">28516162</pub-id>
          <pub-id pub-id-type="pmcid">PMC5431072</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sano</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Taylor</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McHill</surname>
              <given-names>AW</given-names>
            </name>
            <name name-style="western">
              <surname>Phillips</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Barger</surname>
              <given-names>LK</given-names>
            </name>
            <name name-style="western">
              <surname>Klerman</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Picard</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Identifying objective physiological markers and modifiable behaviors for self-reported stress and mental health status using wearable sensors and mobile phones: observational study</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <month>06</month>
          <day>08</day>
          <volume>20</volume>
          <issue>6</issue>
          <fpage>e210</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/6/e210/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.9410</pub-id>
          <pub-id pub-id-type="medline">29884610</pub-id>
          <pub-id pub-id-type="pii">v20i6e210</pub-id>
          <pub-id pub-id-type="pmcid">PMC6015266</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tate</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>McCabe</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Larsson</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lundström</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Lichtenstein</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Kuja-Halkola</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Predicting mental health problems in adolescence using machine learning techniques</article-title>
          <source>PLoS One</source>
          <year>2020</year>
          <month>04</month>
          <day>06</day>
          <volume>15</volume>
          <issue>4</issue>
          <fpage>e0230389</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0230389"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0230389</pub-id>
          <pub-id pub-id-type="medline">32251439</pub-id>
          <pub-id pub-id-type="pii">PONE-D-19-24985</pub-id>
          <pub-id pub-id-type="pmcid">PMC7135284</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Siemens</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>RS</given-names>
            </name>
          </person-group>
          <article-title>Learning analytics and educational data mining: towards communication and collaboration</article-title>
          <source>Proceedings of the 2nd International Conference on Learning Analytics and Knowledge</source>
          <year>2012</year>
          <conf-name>LAK '12</conf-name>
          <conf-date>April 29-May 2, 2012</conf-date>
          <conf-loc>Vancouver, Canada</conf-loc>
          <fpage>252</fpage>
          <lpage>4</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/2330601.2330661"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2330601.2330661</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Djulovic</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Towards freshman retention prediction: a comparative study</article-title>
          <source>Int J Inf Educ</source>
          <year>2013</year>
          <volume>3</volume>
          <issue>5</issue>
          <fpage>494</fpage>
          <lpage>500</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://ijiet.org/papers/324-K045.pdf"/>
          </comment>
          <pub-id pub-id-type="doi">10.7763/IJIET.2013.V3.324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jayaprakash</surname>
              <given-names>SM</given-names>
            </name>
            <name name-style="western">
              <surname>Moody</surname>
              <given-names>EW</given-names>
            </name>
            <name name-style="western">
              <surname>Lauría</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Regan</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Baron</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Early alert of academically at-risk students: an open source analytics initiative</article-title>
          <source>J Learn Anal</source>
          <year>2014</year>
          <volume>1</volume>
          <issue>1</issue>
          <fpage>6</fpage>
          <lpage>47</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://learning-analytics.info/index.php/JLA/article/view/3249/4011"/>
          </comment>
          <pub-id pub-id-type="doi">10.18608/jla.2014.11.3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kondo</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Hatanaka</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Modelling of students' learning states using big data of students through the baccalaureate degree program. Gakushi katei ni okeru daikibo data ni motoduku gakushu jotai no moderu ka</article-title>
          <source>Jpn Soc Info Sys Edu</source>
          <year>2016</year>
          <volume>33</volume>
          <issue>2</issue>
          <fpage>94</fpage>
          <lpage>103</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jstage.jst.go.jp/article/jsise/33/2/33_330204/_article/-char/ja/"/>
          </comment>
          <pub-id pub-id-type="doi">10.14926/jsise.33.94</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Otomo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Iwayama</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Mohri</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>On-campus data utilization: Working on IR (institutional research) in universities. Gakunai data no katsuyo: Daigaku ni okeru IR (institutional research) heno torikumi</article-title>
          <source>Fujitsu</source>
          <year>2014</year>
          <month>05</month>
          <volume>65</volume>
          <issue>3</issue>
          <fpage>41</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.fujitsu.com/downloads/JP/archive/imgjp/jmag/vol65-3/paper08.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Takaoka</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Nakai</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sugiyama</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Nozue</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Shimizu</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>The proposal for multi- faceted student support based on student data base: the collaboration of early detection of at-risk students and student counseling services. Gakusei no syugaku data wo katuyo shita takakuteki na gakuseishien no teian: youchui gakusei no sokihakken to gakuseisoudan tono kyodo</article-title>
          <source>Meiji Gakuin University bulletin of psychology</source>
          <year>2017</year>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>81</fpage>
          <lpage>93</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://meigaku.repo.nii.ac.jp/?action=pages_view_main&#38;active_action=repository_view_main_item_detail&#38;item_id=1527&#38;item_no=1&#38;page_id=13&#38;block_id=21"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Vihavainen</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Luukkainen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kurhila</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using students' programming behavior to predict success in an introductory mathematics course</article-title>
          <source>Proceedings of the 6th International Conference on Educational Data Mining</source>
          <year>2013</year>
          <conf-name>EDM '13</conf-name>
          <conf-date>July 6-9, 2013</conf-date>
          <conf-loc>Memphis, TN, USA</conf-loc>
          <fpage>300</fpage>
          <lpage>3</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.educationaldatamining.org/EDM2013/papers/rn_paper_52.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Iwata</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Kikuchi</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Fujihara</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>The usability of CAT system for assessing the depressive level of Japanese-a study on psychometric properties and response behavior</article-title>
          <source>Int J Behav Med</source>
          <year>2016</year>
          <month>08</month>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>427</fpage>
          <lpage>37</lpage>
          <pub-id pub-id-type="doi">10.1007/s12529-015-9503-1</pub-id>
          <pub-id pub-id-type="medline">26272358</pub-id>
          <pub-id pub-id-type="pii">10.1007/s12529-015-9503-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>DJ</given-names>
            </name>
            <name name-style="western">
              <surname>Su</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Modeling response time and responses in multidimensional health measurement</article-title>
          <source>Front Psychol</source>
          <year>2019</year>
          <month>01</month>
          <day>29</day>
          <volume>10</volume>
          <fpage>51</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/30761036"/>
          </comment>
          <pub-id pub-id-type="doi">10.3389/fpsyg.2019.00051</pub-id>
          <pub-id pub-id-type="medline">30761036</pub-id>
          <pub-id pub-id-type="pmcid">PMC6361798</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nock</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Banaji</surname>
              <given-names>MR</given-names>
            </name>
          </person-group>
          <article-title>Prediction of suicide ideation and attempts among adolescents using a brief performance-based test</article-title>
          <source>J Consult Clin Psychol</source>
          <year>2007</year>
          <month>10</month>
          <volume>75</volume>
          <issue>5</issue>
          <fpage>707</fpage>
          <lpage>15</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/17907852"/>
          </comment>
          <pub-id pub-id-type="doi">10.1037/0022-006X.75.5.707</pub-id>
          <pub-id pub-id-type="medline">17907852</pub-id>
          <pub-id pub-id-type="pii">2007-13640-004</pub-id>
          <pub-id pub-id-type="pmcid">PMC2043087</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Furukawa</surname>
              <given-names>TA</given-names>
            </name>
            <name name-style="western">
              <surname>Kawakami</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Saitoh</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Ono</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Nakane</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Nakamura</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Tachimori</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Iwata</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Uda</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Nakane</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Watanabe</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Naganuma</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hata</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kobayashi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Miyake</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Takeshima</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Kikkawa</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>The performance of the Japanese version of the K6 and K10 in the World Mental Health Survey Japan</article-title>
          <source>Int J Methods Psychiatr Res</source>
          <year>2008</year>
          <volume>17</volume>
          <issue>3</issue>
          <fpage>152</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://europepmc.org/abstract/MED/18763695"/>
          </comment>
          <pub-id pub-id-type="doi">10.1002/mpr.257</pub-id>
          <pub-id pub-id-type="medline">18763695</pub-id>
          <pub-id pub-id-type="pmcid">PMC6878390</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kessler</surname>
              <given-names>RC</given-names>
            </name>
            <name name-style="western">
              <surname>Barker</surname>
              <given-names>PR</given-names>
            </name>
            <name name-style="western">
              <surname>Colpe</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Epstein</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Gfroerer</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Hiripi</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Howes</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Normand</surname>
              <given-names>SL</given-names>
            </name>
            <name name-style="western">
              <surname>Manderscheid</surname>
              <given-names>RW</given-names>
            </name>
            <name name-style="western">
              <surname>Walters</surname>
              <given-names>EE</given-names>
            </name>
            <name name-style="western">
              <surname>Zaslavsky</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Screening for serious mental illness in the general population</article-title>
          <source>Arch Gen Psychiatry</source>
          <year>2003</year>
          <month>02</month>
          <volume>60</volume>
          <issue>2</issue>
          <fpage>184</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1001/archpsyc.60.2.184</pub-id>
          <pub-id pub-id-type="medline">12578436</pub-id>
          <pub-id pub-id-type="pii">yoa20567</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sakurai</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Nishi</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kondo</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Yanagida</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Kawakami</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Screening performance of K6/K10 and other screening instruments for mood and anxiety disorders in Japan</article-title>
          <source>Psychiatry Clin Neurosci</source>
          <year>2011</year>
          <month>08</month>
          <volume>65</volume>
          <issue>5</issue>
          <fpage>434</fpage>
          <lpage>41</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://onlinelibrary.wiley.com/doi/10.1111/j.1440-1819.2011.02236.x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1440-1819.2011.02236.x</pub-id>
          <pub-id pub-id-type="medline">21851452</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="web">
          <article-title>Comprehensive survey of living condition of the people on health and welfare 2019</article-title>
          <source>Ministry of Health, Labour and Welfare</source>
          <year>2019</year>
          <access-date>2023-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mhlw.go.jp/toukei/saikin/hw/k-tyosa/k-tyosa19/dl/07.pdf">https://www.mhlw.go.jp/toukei/saikin/hw/k-tyosa/k-tyosa19/dl/07.pdf</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Breiman</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Random forests</article-title>
          <source>Mach Lang</source>
          <year>2001</year>
          <month>10</month>
          <day>01</day>
          <volume>45</volume>
          <issue>1</issue>
          <fpage>5</fpage>
          <lpage>32</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1023/A%3A1010933404324"/>
          </comment>
          <pub-id pub-id-type="doi">10.1023/A:1010933404324</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ke</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Finley</surname>
              <given-names>TW</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>WY</given-names>
            </name>
            <name name-style="western">
              <surname>Ma</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ye</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>TY</given-names>
            </name>
          </person-group>
          <article-title>LightGBM: a highly efficient gradient boosting decision tree</article-title>
          <source>Proceedings of the 31st International Conference on Neural Information Processing Systems</source>
          <year>2017</year>
          <conf-name>NIPS'17</conf-name>
          <conf-date>Long Beach, CA, USA</conf-date>
          <conf-loc>December 4-9, 2017</conf-loc>
          <fpage>3149</fpage>
          <lpage>57</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.5555/3294996.3295074"/>
          </comment>
          <pub-id pub-id-type="doi">10.5555/3294996.3295074</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Guestrin</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>XGBoost: a scalable tree boosting system</article-title>
          <source>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</source>
          <year>2016</year>
          <conf-name>KDD '16</conf-name>
          <conf-date>August 13-17, 2016</conf-date>
          <conf-loc>San Francisco, CA, USA</conf-loc>
          <fpage>785</fpage>
          <lpage>94</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1145/2939672.2939785"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Which risk factors matter more for psychological distress during the COVID-19 pandemic? An application approach of gradient boosting decision trees</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2021</year>
          <month>05</month>
          <day>30</day>
          <volume>18</volume>
          <issue>11</issue>
          <fpage>5879</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph18115879"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph18115879</pub-id>
          <pub-id pub-id-type="medline">34070829</pub-id>
          <pub-id pub-id-type="pii">ijerph18115879</pub-id>
          <pub-id pub-id-type="pmcid">PMC8199069</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yuan</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>A stable AI-based binary and multiple class heart disease prediction model for IoMT</article-title>
          <source>IEEE Trans Industr Inform</source>
          <year>2022</year>
          <month>3</month>
          <volume>18</volume>
          <issue>3</issue>
          <fpage>2032</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ieeexplore.ieee.org/document/9517094"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/tii.2021.3098306</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Uchida</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Suicide among Japanese university students from the results of a 21 year survey: a clue to prevent suicide among university students. 21nenkan no chosa karamita daigakusei no jisatsu no tokucho to kikeninshi: yobo heno tegakari wo saguru. Article in Japanese</article-title>
          <source>Psychiatria et neurologia Japonica</source>
          <year>2010</year>
          <volume>112</volume>
          <issue>6</issue>
          <fpage>543</fpage>
          <lpage>60</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journal.jspn.or.jp/jspn/openpdf/1120060543.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Higuchi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A two-step approach to quantitative content analysis: KH coder tutorial using anne of green gables (part I)</article-title>
          <source>Retsumeikan Soc Sci Rev</source>
          <year>2016</year>
          <volume>52</volume>
          <issue>3</issue>
          <fpage>77</fpage>
          <lpage>91</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://ritsumei.repo.nii.ac.jp/?action=pages_view_main&#38;active_action=repository_view_main_item_detail&#38;item_id=3738&#38;item_no=1&#38;page_id=13&#38;block_id=21"/>
          </comment>
          <pub-id pub-id-type="doi">10.34382/00003706</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Higuchi</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>A two-step approach to quantitative content analysis: KH coder tutorial using anne of green gables (part II)</article-title>
          <source>Retsumeikan Soc Sci Rev</source>
          <year>2017</year>
          <volume>53</volume>
          <issue>1</issue>
          <fpage>137</fpage>
          <lpage>47</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.ritsumei.ac.jp/file.jsp?id=325881"/>
          </comment>
          <pub-id pub-id-type="doi">10.34382/00003731</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>R Core Team</collab>
          </person-group>
          <article-title>R: a language and environment for statistical computing</article-title>
          <source>R Foundation for Statistical Computing</source>
          <year>2019</year>
          <access-date>2023-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.R-project.org/">https://www.R-project.org/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Josse</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Husson</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>missMDA: a package for handling missing values in multivariate data analysis</article-title>
          <source>J Stat Softw</source>
          <year>2016</year>
          <volume>70</volume>
          <issue>1</issue>
          <fpage>1</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jstatsoft.org/article/view/v070i01"/>
          </comment>
          <pub-id pub-id-type="doi">10.18637/jss.v070.i01</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bergstra</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Bardenet</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Bengio</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Kégl</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Algorithms for hyper-parameter optimization</article-title>
          <source>Proceedings of the 24th International Conference on Neural Information Processing Systems</source>
          <year>2011</year>
          <conf-name>NIPS'11</conf-name>
          <conf-date>December 12-15, 2011</conf-date>
          <conf-loc>Granada, Spain</conf-loc>
          <fpage>2546</fpage>
          <lpage>54</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.5555/2986459.2986743"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>JuliaAI</collab>
            <collab>The Alan Turing Institute</collab>
          </person-group>
          <article-title>API: MLJLinearModels</article-title>
          <source>GitHub</source>
          <year>2020</year>
          <access-date>2023-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://juliaai.github.io/MLJLinearModels.jl/dev/api/">https://juliaai.github.io/MLJLinearModels.jl/dev/api/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pedregosa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Varoquaux</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Gramfort</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Michel</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Thirion</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Grisel</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Blondel</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Prettenhofer</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Weiss</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Dubourg</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Vanderplas</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Passos</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Cournapeau</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Brucher</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Perrot</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Duchesnay</surname>
              <given-names>É</given-names>
            </name>
          </person-group>
          <article-title>Scikit-learn: machine learning in Python</article-title>
          <source>J Mach Learn Res</source>
          <year>2011</year>
          <volume>12</volume>
          <fpage>2825</fpage>
          <lpage>30</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jmlr.csail.mit.edu/papers/v12/pedregosa11a.html"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2786984.2786995</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>xgboost developers</collab>
          </person-group>
          <article-title>XGBoost parameters</article-title>
          <source>XGBoost</source>
          <year>2022</year>
          <access-date>2023-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://xgboost.readthedocs.io/en/stable/parameter.html">https://xgboost.readthedocs.io/en/stable/parameter.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="web">
          <article-title>Parameters</article-title>
          <source>LightGBM 3.3.2.99</source>
          <year>2022</year>
          <access-date>2023-01-13</access-date>
          <publisher-loc>Redmond, WA, USA</publisher-loc>
          <publisher-name>Microsoft Corporation</publisher-name>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://lightgbm.readthedocs.io/en/latest/Parameters.html">https://lightgbm.readthedocs.io/en/latest/Parameters.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Fernández</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Galar</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>García</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Herrera</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Krawczyk</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Prati</surname>
              <given-names>RC</given-names>
            </name>
          </person-group>
          <source>Learning from Imbalanced Data Sets</source>
          <year>2018</year>
          <publisher-loc>Basel, Switzerland</publisher-loc>
          <publisher-name>Springer</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Molnar</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <source>Interpretable Machine Learning: A Guide for Making Black Box Models Explainable. 2nd edition</source>
          <year>2022</year>
          <publisher-loc>Victoria, Canada</publisher-loc>
          <publisher-name>Leanpub</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bezanson</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Edelman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Karpinski</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>VB</given-names>
            </name>
          </person-group>
          <article-title>Julia: a fresh approach to numerical computing</article-title>
          <source>SIAM Rev</source>
          <year>2017</year>
          <month>01</month>
          <volume>59</volume>
          <issue>1</issue>
          <fpage>65</fpage>
          <lpage>98</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dl.acm.org/doi/10.1137/141000671"/>
          </comment>
          <pub-id pub-id-type="doi">10.1137/141000671</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blaom</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kiraly</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lienart</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Simillides</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Arenas</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Vollmer</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>MLJ: a Julia package for composable machine learning</article-title>
          <source>J Open Source Softw</source>
          <year>2020</year>
          <month>11</month>
          <day>07</day>
          <volume>5</volume>
          <issue>55</issue>
          <fpage>2704</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://joss.theoj.org/papers/10.21105/joss.02704"/>
          </comment>
          <pub-id pub-id-type="doi">10.21105/joss.02704</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bergstra</surname>
              <given-names>J</given-names>
            </name>
            <collab>IQVIA</collab>
          </person-group>
          <article-title>TreeParzen.jl</article-title>
          <source>GiHub</source>
          <year>2022</year>
          <access-date>2023-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/IQVIA-ML/TreeParzen.jl">https://github.com/IQVIA-ML/TreeParzen.jl</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>The scikit-learn developers</collab>
            <collab>The ScikitLearn.jl developers</collab>
          </person-group>
          <article-title>ScikitLearn.jl</article-title>
          <source>GitHub</source>
          <year>2022</year>
          <access-date>2023-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/cstjean/ScikitLearn.jl">https://github.com/cstjean/ScikitLearn.jl</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Mossel</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>LightGBM.jl</article-title>
          <source>GitHub</source>
          <year>2022</year>
          <access-date>2023-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/IQVIA-ML/LightGBM.jl">https://github.com/IQVIA-ML/LightGBM.jl</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Redell</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>ShapML.jl</article-title>
          <source>GitHub</source>
          <year>2022</year>
          <access-date>2023-02-01</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://github.com/nredell/ShapML.jl">https://github.com/nredell/ShapML.jl</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gao</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Mei</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Piccialli</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Cuomo</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Huo</surname>
              <given-names>Z</given-names>
            </name>
          </person-group>
          <article-title>Julia language in machine learning: algorithms, applications, and open issues</article-title>
          <source>Comput Sci Rev</source>
          <year>2020</year>
          <month>08</month>
          <volume>37</volume>
          <fpage>100254</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.sciencedirect.com/science/article/pii/S157401372030071X"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.cosrev.2020.100254</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perkel</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>Julia: come for the syntax, stay for the speed</article-title>
          <source>Nature</source>
          <year>2019</year>
          <month>08</month>
          <volume>572</volume>
          <issue>7767</issue>
          <fpage>141</fpage>
          <lpage>2</lpage>
          <pub-id pub-id-type="doi">10.1038/d41586-019-02310-3</pub-id>
          <pub-id pub-id-type="medline">31363196</pub-id>
          <pub-id pub-id-type="pii">10.1038/d41586-019-02310-3</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="web">
          <article-title>Gender data portal time use across the world</article-title>
          <source>Organisation for Economic Co-operation and Development</source>
          <access-date>2023-02-12</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.oecd.org/gender/data/">https://www.oecd.org/gender/data/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <collab>American Psychiatric Association</collab>
          </person-group>
          <source>Diagnostic and Statistical Manual of Mental Disorders (DSM-5). 5th edition</source>
          <year>2013</year>
          <publisher-loc>Washington, DC, USA</publisher-loc>
          <publisher-name>American Psychiatric Association</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bedewy</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gabriel</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Examining perceptions of academic stress and its sources among university students: the perception of academic stress scale</article-title>
          <source>Health Psychol Open</source>
          <year>2015</year>
          <month>07</month>
          <volume>2</volume>
          <issue>2</issue>
          <fpage>2055102915596714</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/abs/10.1177/2055102915596714?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub  0pubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2055102915596714</pub-id>
          <pub-id pub-id-type="medline">28070363</pub-id>
          <pub-id pub-id-type="pii">10.1177_2055102915596714</pub-id>
          <pub-id pub-id-type="pmcid">PMC5193280</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
