<?xml version="1.0" encoding="utf-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.0 20120330//EN" "JATS-journalpublishing1.dtd">
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">NEJSDS</journal-id>
<journal-title-group><journal-title>The New England Journal of Statistics in Data Science</journal-title></journal-title-group>
<issn pub-type="ppub">2693-7166</issn><issn-l>2693-7166</issn-l>
<publisher>
<publisher-name>New England Statistical Society</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">NEJSDS105</article-id>
<article-id pub-id-type="doi">10.51387/26-NEJSDS105</article-id>
<article-categories><subj-group subj-group-type="heading">
<subject>Case Study, Application, and/or Practice Article</subject></subj-group><subj-group subj-group-type="area">
<subject>NextGen</subject></subj-group></article-categories>
<title-group>
<article-title>Comparative Analysis of NLP Methods for Emotion Detection in Student Responses During COVID-19</article-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name><surname>Maret</surname><given-names>Alexander</given-names></name><email xlink:href="mailto:maret@upenn.edu">maret@upenn.edu</email><xref ref-type="aff" rid="j_nejsds105_aff_001"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Dees</surname><given-names>Cade</given-names></name><email xlink:href="mailto:cade.dees@yahoo.com">cade.dees@yahoo.com</email><xref ref-type="aff" rid="j_nejsds105_aff_002"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Fu</surname><given-names>Yule</given-names></name><email xlink:href="mailto:yule.fu@duke.edu">yule.fu@duke.edu</email><xref ref-type="aff" rid="j_nejsds105_aff_003"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Qian</surname><given-names>Yanjun</given-names></name><email xlink:href="mailto:yqian3@vcu.edu">yqian3@vcu.edu</email><xref ref-type="aff" rid="j_nejsds105_aff_004"/><xref ref-type="corresp" rid="cor1">∗</xref>
</contrib>
<contrib contrib-type="author">
<name><surname>Chan</surname><given-names>David</given-names></name><email xlink:href="mailto:dmchan@vcu.edu">dmchan@vcu.edu</email><xref ref-type="aff" rid="j_nejsds105_aff_005"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Gandhi</surname><given-names>Punit</given-names></name><email xlink:href="mailto:gandhipr@vcu.edu">gandhipr@vcu.edu</email><xref ref-type="aff" rid="j_nejsds105_aff_006"/>
</contrib>
<contrib contrib-type="author">
<name><surname>Sahoo</surname><given-names>Indranil</given-names></name><email xlink:href="mailto:sahooi@vcu.edu">sahooi@vcu.edu</email><xref ref-type="aff" rid="j_nejsds105_aff_007"/>
</contrib>
<aff id="j_nejsds105_aff_001">Department of Mathematics, <institution>University of Pennsylvania</institution>, <country>United States</country>. E-mail address: <email xlink:href="mailto:maret@upenn.edu">maret@upenn.edu</email></aff>
<aff id="j_nejsds105_aff_002">Department of Computer Science, <institution>University of Alabama</institution>, <country>United States</country>. E-mail address: <email xlink:href="mailto:cade.dees@yahoo.com">cade.dees@yahoo.com</email></aff>
<aff id="j_nejsds105_aff_003">Department of Mathematics, <institution>Duke University</institution>, <country>United States</country>. E-mail address: <email xlink:href="mailto:yule.fu@duke.edu">yule.fu@duke.edu</email></aff>
<aff id="j_nejsds105_aff_004">Department of Statistical Sciences and Operations Research, <institution>Virginia Commonwealth University</institution>, <country>United States</country>. E-mail address: <email xlink:href="mailto:yqian3@vcu.edu">yqian3@vcu.edu</email></aff>
<aff id="j_nejsds105_aff_005">Department of Mathematics and Applied Mathematics, <institution>Virginia Commonwealth University</institution>, <country>United States</country>. E-mail address: <email xlink:href="mailto:dmchan@vcu.edu">dmchan@vcu.edu</email></aff>
<aff id="j_nejsds105_aff_006">Department of Mathematics and Applied Mathematics, <institution>Virginia Commonwealth University</institution>, <country>United States</country>. E-mail address: <email xlink:href="mailto:gandhipr@vcu.edu">gandhipr@vcu.edu</email></aff>
<aff id="j_nejsds105_aff_007">Department of Statistical Sciences and Operations Research, <institution>Virginia Commonwealth University</institution>, <country>United States</country>. E-mail address: <email xlink:href="mailto:sahooi@vcu.edu">sahooi@vcu.edu</email></aff>
</contrib-group>
<author-notes>
<corresp id="cor1"><label>∗</label>Corresponding author.</corresp>
</author-notes>
<pub-date pub-type="ppub"><year>2026</year></pub-date><pub-date pub-type="epub"><day>1</day><month>6</month><year>2026</year></pub-date><volume content-type="ahead-of-print">0</volume><issue>0</issue><fpage>1</fpage><lpage>18</lpage><history><date date-type="accepted"><day>19</day><month>5</month><year>2026</year></date></history>
<permissions><copyright-statement>© 2026 New England Statistical Society</copyright-statement><copyright-year>2026</copyright-year>
<license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/4.0/">
<license-p>Open access article under the <ext-link ext-link-type="uri" xlink:href="http://creativecommons.org/licenses/by/4.0/">CC BY</ext-link> license.</license-p></license></permissions>
<abstract>
<p>Natural language processing (NLP) algorithms have demonstrated significant capabilities in understanding responses to open-ended questions in survey data. However, the reliability and uncertainty of these methods on this task still need to be thoroughly investigated. To address this issue, this paper presents a comprehensive comparative analysis of various NLP methods for detecting fine-grained emotions in student responses about their mental health during the COVID-19 pandemic. The evaluated models include a Lexicon-based approach, the bag-of-words (BoW) model, Term Frequency-Inverse Document Frequency (TF-IDF), a pre-trained Bidirectional Encoder Representations from Transformers (BERT) model, MentalBERT, and OpenAI’s GPT-3.5. We carefully assess the efficacy of these models in accurately classifying emotions into predetermined categories using performance metrics such as accuracy and F1 score. Furthermore, model stability and distinguishing ability are quantified through repeated cross-validation and the Area Under the Receiver Operating Characteristic Curve (AUC). The consistency of emotion detection across different models is also evaluated. The study highlights that the effectiveness of employing NLP methods for mental health analysis may vary depending on the emotions being analyzed, and their stability and uncertainty require thorough examination. Our work can provide valuable guidance for data scientists on applying NLP methods to survey data, particularly for understanding survey respondents’ emotions.</p>
</abstract>
<kwd-group>
<label>Keywords and phrases</label>
<kwd>Survey responses</kwd>
<kwd>COVID-19</kwd>
<kwd>Natural language processing</kwd>
<kwd>Emotion detection</kwd>
</kwd-group>
<funding-group><funding-statement>This research was supported by NSF Research Experiences for Undergraduates (REU), grant number DMS1950015, and by the VCU College of Humanities and Sciences Catalyst.</funding-statement></funding-group>
</article-meta>
</front>
<body>
<sec id="j_nejsds105_s_001">
<label>1</label>
<title>Introduction</title>
<p>In the early 2020s, the lives of university students were significantly impacted by the COVID-19 pandemic. The abrupt transition to online learning, loss of contact with family and friends, and social and financial uncertainty had a considerable impact on students’ mental health. Many surveys [<xref ref-type="bibr" rid="j_nejsds105_ref_035">35</xref>, <xref ref-type="bibr" rid="j_nejsds105_ref_042">42</xref>, <xref ref-type="bibr" rid="j_nejsds105_ref_009">9</xref>, <xref ref-type="bibr" rid="j_nejsds105_ref_018">18</xref>] have been conducted in colleges and universities to assess the pandemic’s impact and long-term effects. These surveys typically included two types of questions: quantitative questions that measure agreement or disagreement with specific statements, and open-ended questions that invite students to describe their personal feelings and experiences. Traditional survey analysis [<xref ref-type="bibr" rid="j_nejsds105_ref_024">24</xref>] often focuses on the quantitative responses, as these numerical responses can be easily analyzed using mathematical and statistical models. However, the responses to open-ended questions can provide more details and personalized insights into students’ mental health, which can then lead to studying the reasons behind these impacts. To analyze this information in large data sets, it is necessary to apply Natural Language Processing (NLP) techniques [<xref ref-type="bibr" rid="j_nejsds105_ref_023">23</xref>] to detect emotions within the students’ responses.</p>
<p>Advancements in NLP for emotion detection have been significant over the past few decades. Early researchers developed the Lexicon-based method [<xref ref-type="bibr" rid="j_nejsds105_ref_038">38</xref>] to create a dictionary that scores the emotions associated with individual words. Subsequently, techniques like the Bag-of-Words (BoW) model [<xref ref-type="bibr" rid="j_nejsds105_ref_029">29</xref>] and Term Frequency-Inverse Document Frequency (TF-IDF) [<xref ref-type="bibr" rid="j_nejsds105_ref_032">32</xref>] were introduced to convert texts into numerical vectors. Machine learning algorithms, such as logistic regression [<xref ref-type="bibr" rid="j_nejsds105_ref_036">36</xref>] and Support Vector Machines (SVM) [<xref ref-type="bibr" rid="j_nejsds105_ref_034">34</xref>], can then be trained using these vectors to classify texts into different emotion categories. Since 2017, the Transformer architecture [<xref ref-type="bibr" rid="j_nejsds105_ref_041">41</xref>] in deep learning has achieved remarkable success in NLP. Large Language Models (LLMs) [<xref ref-type="bibr" rid="j_nejsds105_ref_026">26</xref>], such as the Bidirectional Encoder Representations from Transformers (BERT) [<xref ref-type="bibr" rid="j_nejsds105_ref_012">12</xref>] and the Generative Pre-trained Transformer (GPT) [<xref ref-type="bibr" rid="j_nejsds105_ref_030">30</xref>], have demonstrated strong capabilities in various NLP tasks. We can either use these LLMs directly for emotion detection or fine-tune them for specific emotions to further enhance accuracy.</p>
<p>Despite the success of NLP methods, two significant challenges remain when applying them to understand the mental health of college students through open-ended survey questions. First, mental health encompasses a range of nuanced emotions, such as depression, anxiety, stress, and isolation. However, many traditional sentiment analysis methods [<xref ref-type="bibr" rid="j_nejsds105_ref_024">24</xref>] only consider general positive or negative sentiments in texts. This limitation can lead to the neglect of personal emotions expressed in open-ended survey responses, making it difficult to identify subtle differences in mental health. Second, using NLP to analyze mental health can yield educational and psychological insights; thus, the stability and distinguishing ability of these methods are crucial for reliable studies. There has been some effort to explore differences between such methods in the context of social media text [<xref ref-type="bibr" rid="j_nejsds105_ref_004">4</xref>, <xref ref-type="bibr" rid="j_nejsds105_ref_025">25</xref>] and free response surveys [<xref ref-type="bibr" rid="j_nejsds105_ref_044">44</xref>, <xref ref-type="bibr" rid="j_nejsds105_ref_043">43</xref>, <xref ref-type="bibr" rid="j_nejsds105_ref_019">19</xref>] related to COVID. However, most of those studies only focus on the consistency in the general sentiment prediction, not on fine-grained emotion detection [<xref ref-type="bibr" rid="j_nejsds105_ref_010">10</xref>] that we are concerned with.</p>
<p>To address the challenges of reliable emotion detection, we conduct a comparative analysis of various NLP methods based on a recent study of college student responses during COVID-19 [<xref ref-type="bibr" rid="j_nejsds105_ref_001">1</xref>]. This study surveyed students at a large mid-Atlantic university in the U.S. during the early months of the COVID-19 pandemic to assess its impact on their mental health. The survey included both traditional quantitative scoring questions and open-ended responses. In their research, Amona et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_001">1</xref>] carefully annotated ten common emotions—such as isolation, depression, and anxiety—derived from the students’ responses to the question, “How is COVID affecting your mental health?” They then examined how these emotions impacted different subgroups within the student population.</p>
<p>Here, we compare a wide range of NLP methods, including Lexicon-based approaches, BoW, TF-IDF, fine-tuned BERT, and zero-shot GPT, for the automatic detection of emotions in these survey responses. First, we assess the performance of various NLP methods across all identified emotions. We find that despite the complicated Transformer method achieving the best overall performance, simpler methods, such as Lexicon, can effectively identify specific emotions. Next, we evaluate the stability and distinguishing ability of these models, demonstrating the performance-complexity trade-off when applying NLP methods. Finally, we evaluate the consistency of emotion detection between NLP methods and the true labels, assessing whether these methods yield similar results or not. This comprehensive study highlights that the effectiveness of employing NLP methods to analyze mental health through survey data varies with the emotions being analyzed. Moreover, for the methods with top overall performance, their stability and uncertainty need to be thoroughly examined. We summarize insights from our experimental studies and offer method selection recommendations for NLP analysis of survey data to guide future data science practices.</p>
<p>The paper is organized as follows: In Section <xref rid="j_nejsds105_s_002">2</xref>, we introduce related work that examines students’ mental health during COVID-19 and advancements in NLP methods for emotion detection. Section <xref rid="j_nejsds105_s_005">3</xref> outlines three aspects of our methodology: data collection and annotation, the implementation of NLP methods, and the comparison framework. In Section <xref rid="j_nejsds105_s_016">4</xref>, we present our results and discuss the outcomes of emotion detection using NLP methods in relation to mental health. Finally, Section <xref rid="j_nejsds105_s_021">5</xref> summarizes the conclusions of our study.</p>
</sec>
<sec id="j_nejsds105_s_002">
<label>2</label>
<title>Related Work</title>
<sec id="j_nejsds105_s_003">
<label>2.1</label>
<title>NLP Methods in Comparison Study</title>
<p>First, we will review the related NLP methods in our comparison study. Traditional methods include the Lexicon-based approach, where predefined dictionaries of emotional words are used to identify emotions in text. For example, Mohammad et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_021">21</xref>] developed the National Research Council of Canada (NRC) Emotion Lexicon (EmoLex), a widely used resource for Lexicon-based emotion detection. The model establishes connections between words and basic emotions, including anger, joy, and sadness. This Lexicon was developed through crowdsourcing, ensuring a diverse and comprehensive set of word-emotion associations. Mohammad [<xref ref-type="bibr" rid="j_nejsds105_ref_020">20</xref>] later extended their work by adding real-valued scores of intensity to emotions to create the NRC Affect Intensity Lexicon (AIL), enabling more fine-grained analysis.</p>
<p>The next school of methods for text classification involves converting sentences to numeric vectors using BoW or TF-IDF and applying machine learning algorithms to them. Sebastiani [<xref ref-type="bibr" rid="j_nejsds105_ref_033">33</xref>] provided a thorough analysis of these algorithms, highlighting their performance across different datasets and establishing their strengths and limitations in text classification. BoW is a technique that turns text or images into a histogram of words. BoW models convert text into a matrix of token counts, representing the frequency of each word in the text. This representation is then used as input for machine learning classifiers such as logistic regression, SVM, or Naive Bayes. Based on the study in [<xref ref-type="bibr" rid="j_nejsds105_ref_029">29</xref>], this makes BoW computationally simple, helping it score well on performance tests. Barry [<xref ref-type="bibr" rid="j_nejsds105_ref_002">2</xref>] studied using BoW on Amazon and Yelp food reviews to classify whether they were positive or negative. With their best machine learning model, they achieved an accuracy score of over <inline-formula id="j_nejsds105_ineq_001"><alternatives><mml:math>
<mml:mn>95</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$95\% $]]></tex-math></alternatives></inline-formula>. Desmet and Hoste [<xref ref-type="bibr" rid="j_nejsds105_ref_011">11</xref>] used BoW to detect 15 emotions. Their results varied by emotion, but six of the seven most common emotions had acceptable accuracy.</p>
<p>TF-IDF improves upon BoW by weighting terms based on their importance, calculated as the product of Term Frequency (TF) and Inverse Document Frequency (IDF). Ramos et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_032">32</xref>] explained that the less frequently a word appears in documents, the greater the weight it should receive. This weighting helps to emphasize significant words while downplaying common ones, enhancing the model’s ability to distinguish between different classes. Rahman et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_031">31</xref>] conducted sentiment classification by tweaking TF-IDF with various vectorization methods and classifiers. With the correct classifier, they achieved <inline-formula id="j_nejsds105_ineq_002"><alternatives><mml:math>
<mml:mn>100</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$100\% $]]></tex-math></alternatives></inline-formula> accuracy. Sundaram et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_037">37</xref>] used TF-IDF for six emotions. For emotions with large training sets, they had an accuracy of about <inline-formula id="j_nejsds105_ineq_003"><alternatives><mml:math>
<mml:mn>85</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$85\% $]]></tex-math></alternatives></inline-formula>.</p>
<p>The advent of the Transformer architecture in deep learning, such as BERT and GPT, has revolutionized NLP. BERT, introduced in [<xref ref-type="bibr" rid="j_nejsds105_ref_012">12</xref>], employs a bidirectional training approach to understand the context of words in a sentence. BERT’s architecture comprises multiple layers of encoders within the Transformer, enabling it to capture intricate relationships between words. BERT can be fine-tuned for specific tasks, such as emotion detection, which involves additional training on a labeled dataset to optimize the model’s performance for that particular task. Tang et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_039">39</xref>] further explored the fine-tuning of BERT for multi-label sentiment analysis, showcasing its effectiveness in handling multiple co-occurring emotions under unbalanced class distributions. Ji et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_017">17</xref>] developed MentalBERT, a BERT-based model fine-tuned on mental health-related text, demonstrating significant improvements in understanding and classifying emotional content compared to standard BERT models.</p>
<p>GPT models [<xref ref-type="bibr" rid="j_nejsds105_ref_030">30</xref>, <xref ref-type="bibr" rid="j_nejsds105_ref_027">27</xref>], such as GPT-3.5, leverage generative pre-training on a vast corpus of text to generate human-like responses. Floridi and Chiriatti [<xref ref-type="bibr" rid="j_nejsds105_ref_013">13</xref>] explained that such models will transform the writing process and are capable of producing texts on the level of some humans. These models can be adapted for emotion detection by fine-tuning them on specific datasets or using prompt engineering to elicit desired outputs. Jain et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_016">16</xref>] used two GPT models for emotion detection, achieving an accuracy score of 0.98 on the mental health datasets on which they were tested. The BERT and GPT models show much promise, with the GPT models being the most cutting-edge technology available.</p>
</sec>
<sec id="j_nejsds105_s_004">
<label>2.2</label>
<title>Fine-Grained Emotion Detection</title>
<p>For this study, multiple fine-grained emotions related to mental health, such as isolation, anxiety, and depression, need to be detected from students’ responses to the open-ended question. Bouazizi et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_005">5</xref>] tackled the challenging task of multi-class emotion detection on Twitter posts, achieving <inline-formula id="j_nejsds105_ineq_004"><alternatives><mml:math>
<mml:mn>60.2</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$60.2\% $]]></tex-math></alternatives></inline-formula> accuracy for seven emotion classes. Their study emphasized the complexity of multi-class classification and proposed a model to better extract and understand emotions present in text rather than classifying them into predefined categories. The authors introduced a system that first classifies text as positive or negative and then assigns scores for corresponding emotion subclasses, improving the robustness and accuracy of emotion classification. Demszky et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_010">10</xref>] created a labeled dataset of 58<italic>k</italic> comments for 27 emotions, including gratitude, confusion, and remorse. They also trained a BERT-based model, achieving an F1 score of 0.46. Mustafa et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_022">22</xref>] leveraged Twitter data and machine learning to classify depression severity, achieving <inline-formula id="j_nejsds105_ineq_005"><alternatives><mml:math>
<mml:mn>91</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$91\% $]]></tex-math></alternatives></inline-formula> accuracy by analyzing the top 100 words used by individuals and their psychological attributes. The study highlighted the importance of feature selection in enhancing classifier performance and proposed incorporating additional data, such as emojis and images, to improve future analyses. Guo et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_014">14</xref>] introduced a multi-way matching deep neural network model for fine-grained emotion detection of user reviews. Their approach predicted scores for specific attributes within reviews, such as location, service, price, and environment. The model consists of two steps: attribute detection and attribute classification. In the first step, the model identifies the relevant attributes mentioned in the text. In the second step, it assigns a score ranging from <inline-formula id="j_nejsds105_ineq_006"><alternatives><mml:math>
<mml:mo>−</mml:mo>
<mml:mn>5</mml:mn></mml:math><tex-math><![CDATA[$-5$]]></tex-math></alternatives></inline-formula> to 5 for each emotion, reflecting the user’s opinion. This fine-grained analysis offers a more detailed understanding of user emotions by focusing on specific aspects of their reviews, demonstrating that NLP methods can effectively distinguish between various emotion categories.</p>
</sec>
</sec>
<sec id="j_nejsds105_s_005" sec-type="methods">
<label>3</label>
<title>Methodology</title>
<sec id="j_nejsds105_s_006">
<label>3.1</label>
<title>Data Collection and Labeling</title>
<p>The dataset has been previously studied in [<xref ref-type="bibr" rid="j_nejsds105_ref_001">1</xref>] and [<xref ref-type="bibr" rid="j_nejsds105_ref_007">7</xref>], and was collected from students at a large mid-Atlantic university in the U.S. between April and June 2020. We focus on one part of the collected data containing short-answer responses from students concerning the impact of COVID-19 on their mental health. The students had to answer the question, “How is coronavirus/COVID-19 affecting your mental health?” The responses are labeled manually by our research team with various emotional indicators, which serve as the ground truth for our emotion detection models. Each response is annotated with binary labels for 10 emotions: <italic>Isolation</italic>, <italic>Depression</italic>, <italic>Anxiety</italic>, <italic>Negative Feelings</italic>, <italic>Lack of Motivation</italic>, <italic>All Stress</italic>, <italic>Issues With Home Life</italic>, <italic>No/Positive Effects</italic>, <italic>Lack of Routine</italic>, <italic>Miscellaneous</italic>. The binary labels (1 if positive, 0 if negative) indicate whether the labelers believed the respondent’s answers expressed the corresponding emotions.</p>
<p>The ten categories of emotions are inspired by [<xref ref-type="bibr" rid="j_nejsds105_ref_006">6</xref>] and [<xref ref-type="bibr" rid="j_nejsds105_ref_035">35</xref>]. In Appendix <xref rid="j_nejsds105_app_001">A</xref>, we provide an example for each emotion, and explain our definitions of <italic>Negative Feelings</italic>, <italic>All Stress</italic>, and <italic>Miscellaneous</italic>. A response could be assigned to more than one emotion category. To ensure the labeling quality, two team members collaboratively categorized emotions for each response. For any questionable answers, they consulted additional team members to reach a consensus on labeling. In preparation for our analysis, the data were cleaned by removing responses with no emotion detected, which typically occurred when there was no response or only random characters. We also removed responses that lacked demographic information to facilitate future analysis. This left 398 responses in the dataset. The percentages of the remaining responses labeled as 1 for each emotion, ordered from largest to smallest, are illustrated in Figure <xref rid="j_nejsds105_fig_001">1</xref>.</p>
<fig id="j_nejsds105_fig_001">
<label>Figure 1</label>
<caption>
<p>The proportions of the responses expressing the corresponding emotions from the human labeling results. The ten emotions are ordered from the largest to the smallest.</p>
</caption>
<graphic xlink:href="nejsds105_g001.jpg"/>
</fig>
<p>In Figure <xref rid="j_nejsds105_fig_002">2</xref>, we analyze correlation and hierarchical clustering for all emotions. We find that most of the emotion pairs have near-zero correlations. The clustering analysis shows that “Depression” and “Anxiety” are the closest emotions. However, their correlation is only 0.3. Other close emotions also show small correlation coefficients of <inline-formula id="j_nejsds105_ineq_007"><alternatives><mml:math>
<mml:mo stretchy="false">∼</mml:mo>
<mml:mn>0.1</mml:mn></mml:math><tex-math><![CDATA[$\sim 0.1$]]></tex-math></alternatives></inline-formula>. Thus, we simplify this multi-label classification problem into 10 binary classification problems. For every NLP method, we train ten models, each using labels for a single emotion. This simplification will provide a fair method-comparison framework.</p>
<fig id="j_nejsds105_fig_002">
<label>Figure 2</label>
<caption>
<p>The correlation matrix (left) and dendrogram clustering (right) of the labels for ten emotions.</p>
</caption>
<graphic xlink:href="nejsds105_g002.jpg"/>
</fig>
</sec>
<sec id="j_nejsds105_s_007">
<label>3.2</label>
<title>Emotion Detection Using NLP</title>
<sec id="j_nejsds105_s_008">
<label>3.2.1</label>
<title>Text Preprocessing</title>
<p>We follow the common steps in NLP [<xref ref-type="bibr" rid="j_nejsds105_ref_023">23</xref>] to preprocess the students’ responses in all the following methods, except GPT, which takes the original text as input. The preprocessing steps include: 
<list>
<list-item id="j_nejsds105_li_001">
<label>•</label>
<p>Text cleaning: Removal of special characters, numbers, and extraneous whitespace.</p>
</list-item>
<list-item id="j_nejsds105_li_002">
<label>•</label>
<p>Tokenization: Splitting text into individual words or tokens.</p>
</list-item>
<list-item id="j_nejsds105_li_003">
<label>•</label>
<p>Lowercasing: Converting all text to lowercase to ensure uniformity.</p>
</list-item>
<list-item id="j_nejsds105_li_004">
<label>•</label>
<p>Stop words removal: Removing common words that do not contribute to emotional meaning, such as “and,” “the,” etc.</p>
</list-item>
<list-item id="j_nejsds105_li_005">
<label>•</label>
<p>Lemmatization: Reducing words to their base or root form.</p>
</list-item>
</list> 
After the preprocessing, the tokenized text will serve as input to the following NLP models to detect emotions expressed in the responses.</p>
</sec>
<sec id="j_nejsds105_s_009">
<label>3.2.2</label>
<title>Lexicon-Based Method</title>
<p>The Lexicon-based model uses a custom dictionary created from a human-encoded text dataset. After the preprocessing, the word frequencies are calculated to understand the distribution of terms within the dataset. Words are then scored based on their association with emotion labels, using metrics such as pointwise mutual information (PMI) to quantify the strength of association between words and emotions.</p>
<p>For a response <italic>r</italic> with words <inline-formula id="j_nejsds105_ineq_008"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mo>…</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">n</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${w_{1}},{w_{2}},\dots ,{w_{n}}$]]></tex-math></alternatives></inline-formula>, its probability of including the emotion <inline-formula id="j_nejsds105_ineq_009"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${\textbf{E}_{j}}$]]></tex-math></alternatives></inline-formula> is: 
<disp-formula id="j_nejsds105_eq_001">
<label>(3.1)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:mi mathvariant="italic">p</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mi mathvariant="italic">σ</mml:mi>
<mml:mo fence="true" stretchy="false">{</mml:mo>
<mml:munderover accentunder="false" accent="false">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:mo largeop="true" movablelimits="false">∑</mml:mo></mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">i</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">n</mml:mi>
</mml:mrow>
</mml:munderover>
<mml:mtext>Score</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>+</mml:mo>
<mml:mtext>Intercept</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo fence="true" stretchy="false">}</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ p(r,{\textbf{E}_{j}})=\sigma \{{\sum \limits_{i=1}^{n}}\text{Score}({w_{i}},{\textbf{E}_{j}})+\text{Intercept}({\textbf{E}_{j}})\}\]]]></tex-math></alternatives>
</disp-formula> 
where <inline-formula id="j_nejsds105_ineq_010"><alternatives><mml:math>
<mml:mtext>Score</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[$\text{Score}({w_{i}},{\textbf{E}_{j}})$]]></tex-math></alternatives></inline-formula> represents the score of word <inline-formula id="j_nejsds105_ineq_011"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${w_{i}}$]]></tex-math></alternatives></inline-formula> for emotion <inline-formula id="j_nejsds105_ineq_012"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${\textbf{E}_{j}}$]]></tex-math></alternatives></inline-formula>, <inline-formula id="j_nejsds105_ineq_013"><alternatives><mml:math>
<mml:mtext>Intercept</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[$\text{Intercept}({\textbf{E}_{j}})$]]></tex-math></alternatives></inline-formula> is the intercept for emotion <inline-formula id="j_nejsds105_ineq_014"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${\textbf{E}_{j}}$]]></tex-math></alternatives></inline-formula>, and <inline-formula id="j_nejsds105_ineq_015"><alternatives><mml:math>
<mml:mi mathvariant="italic">σ</mml:mi>
<mml:mo fence="true" stretchy="false">{</mml:mo>
<mml:mo>·</mml:mo>
<mml:mo fence="true" stretchy="false">}</mml:mo></mml:math><tex-math><![CDATA[$\sigma \{\cdot \}$]]></tex-math></alternatives></inline-formula> is the sigmoid function. The Lexicon model will conclude that a response expresses an emotion when its predicted probability is at least 0.50.</p>
<p>Our study implemented the Lexicon-based model using R’s <monospace>SentimentAnalysis</monospace> package [<xref ref-type="bibr" rid="j_nejsds105_ref_028">28</xref>]. All responses were scanned to create a custom dictionary for each emotion. The scores of top words for the three typical emotions identified in Section <xref rid="j_nejsds105_s_017">4.1</xref>, as well as their intercepts, are presented in Table <xref rid="j_nejsds105_tab_001">1</xref>. We find that most of the words with coefficients different from 0 are explainable. For the <italic>“Depression”</italic> emotion, “depress” is associated with positive instances, while “routin”, “tend”, and “schedul” are associated with negative instances. For <italic>“Lack of Motivation”</italic>, “motiv”, “focus”, and “bed” are associated with positive ones. For <italic>“Miscellaneous”</italic>, the method only finds two words. The word “sleep” shows a clear positive association, indicating the labelers put the sleep issues in this category. On the other hand, the words with near-zero coefficients are less explainable. They might be introduced in the dictionaries due to random sampling of positive/negative instances.</p>
<table-wrap id="j_nejsds105_tab_001">
<label>Table 1</label>
<caption>
<p>The word scores and intercepts of three typical emotions in the customized dictionary for our dataset.</p>
</caption>
<table>
<thead>
<tr>
<td colspan="2" style="vertical-align: top; text-align: center; border-top: double; border-bottom: solid thin"><italic>Depression</italic></td>
<td colspan="2" style="vertical-align: top; text-align: center; border-top: double; border-bottom: solid thin"><italic>Lack of Motivation</italic></td>
<td colspan="2" style="vertical-align: top; text-align: center; border-top: double; border-bottom: solid thin"><italic>Miscellaneous</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: left; border-bottom: solid thin"><bold>Word</bold></td>
<td style="vertical-align: top; text-align: right; border-bottom: solid thin"><bold>Score</bold></td>
<td style="vertical-align: top; text-align: left; border-bottom: solid thin"><bold>Word</bold></td>
<td style="vertical-align: top; text-align: right; border-bottom: solid thin"><bold>Score</bold></td>
<td style="vertical-align: top; text-align: left; border-bottom: solid thin"><bold>Word</bold></td>
<td style="vertical-align: top; text-align: right; border-bottom: solid thin"><bold>Score</bold></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: left">depress</td>
<td style="vertical-align: top; text-align: right">0.321</td>
<td style="vertical-align: top; text-align: left">motiv</td>
<td style="vertical-align: top; text-align: right">0.138</td>
<td style="vertical-align: top; text-align: left">sleep</td>
<td style="vertical-align: top; text-align: right">0.028</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: left">routin</td>
<td style="vertical-align: top; text-align: right"><inline-formula id="j_nejsds105_ineq_016"><alternatives><mml:math>
<mml:mo>−</mml:mo>
<mml:mn>0.033</mml:mn></mml:math><tex-math><![CDATA[$-0.033$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: left">focus</td>
<td style="vertical-align: top; text-align: right">0.075</td>
<td style="vertical-align: top; text-align: left">focus</td>
<td style="vertical-align: top; text-align: right">0.003</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: left">tend</td>
<td style="vertical-align: top; text-align: right"><inline-formula id="j_nejsds105_ineq_017"><alternatives><mml:math>
<mml:mo>−</mml:mo>
<mml:mn>0.023</mml:mn></mml:math><tex-math><![CDATA[$-0.023$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: left">bed</td>
<td style="vertical-align: top; text-align: right">0.044</td>
<td style="vertical-align: top; text-align: left"/>
<td style="vertical-align: top; text-align: right"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: left">schedul</td>
<td style="vertical-align: top; text-align: right"><inline-formula id="j_nejsds105_ineq_018"><alternatives><mml:math>
<mml:mo>−</mml:mo>
<mml:mn>0.016</mml:mn></mml:math><tex-math><![CDATA[$-0.016$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: left">there</td>
<td style="vertical-align: top; text-align: right">0.020</td>
<td style="vertical-align: top; text-align: left"/>
<td style="vertical-align: top; text-align: right"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: left">becom</td>
<td style="vertical-align: top; text-align: right"><inline-formula id="j_nejsds105_ineq_019"><alternatives><mml:math>
<mml:mo>−</mml:mo>
<mml:mn>0.005</mml:mn></mml:math><tex-math><![CDATA[$-0.005$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: left">anymore</td>
<td style="vertical-align: top; text-align: right">0.012</td>
<td style="vertical-align: top; text-align: left"/>
<td style="vertical-align: top; text-align: right"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: left">effect</td>
<td style="vertical-align: top; text-align: right"><inline-formula id="j_nejsds105_ineq_020"><alternatives><mml:math>
<mml:mo>−</mml:mo>
<mml:mn>0.003</mml:mn></mml:math><tex-math><![CDATA[$-0.003$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: left">cant</td>
<td style="vertical-align: top; text-align: right">0.001</td>
<td style="vertical-align: top; text-align: left"/>
<td style="vertical-align: top; text-align: right"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: left; border-bottom: solid thin">Intercept</td>
<td style="vertical-align: top; text-align: right; border-bottom: solid thin">0.036</td>
<td style="vertical-align: top; text-align: left; border-bottom: solid thin">Intercept</td>
<td style="vertical-align: top; text-align: right; border-bottom: solid thin">0.086</td>
<td style="vertical-align: top; text-align: left; border-bottom: solid thin">Intercept</td>
<td style="vertical-align: top; text-align: right; border-bottom: solid thin">0.059</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="j_nejsds105_s_010">
<label>3.2.3</label>
<title>BoW and TF-IDF</title>
<p>The BoW [<xref ref-type="bibr" rid="j_nejsds105_ref_029">29</xref>] and TF-IDF [<xref ref-type="bibr" rid="j_nejsds105_ref_032">32</xref>] methods will convert the tokenized text into a vector or matrix, and then train machine learning models for emotion detection. The BoW model transforms text into a matrix of token counts. Each response is represented as a vector <bold>v</bold> indicating the frequency of each word in the text. For a response <italic>r</italic> with words <inline-formula id="j_nejsds105_ineq_021"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mo>…</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">n</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${w_{1}},{w_{2}},\dots ,{w_{n}}$]]></tex-math></alternatives></inline-formula>, the vector representation <inline-formula id="j_nejsds105_ineq_022"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold">v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>BoW</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[${\mathbf{v}_{\text{BoW}}}(r)$]]></tex-math></alternatives></inline-formula> is given by: 
<disp-formula id="j_nejsds105_eq_002">
<label>(3.2)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold">v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>BoW</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo fence="true" stretchy="false">[</mml:mo>
<mml:mi mathvariant="italic">f</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">f</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mo>…</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">f</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">n</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo fence="true" stretchy="false">]</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ {\mathbf{v}_{\text{BoW}}}(r)=[f({w_{1}},r),f({w_{2}},r),\dots ,f({w_{n}},r)]\]]]></tex-math></alternatives>
</disp-formula> 
where <inline-formula id="j_nejsds105_ineq_023"><alternatives><mml:math>
<mml:mi mathvariant="italic">f</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[$f({w_{i}},r)$]]></tex-math></alternatives></inline-formula> is the frequency of word <inline-formula id="j_nejsds105_ineq_024"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">i</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${w_{i}}$]]></tex-math></alternatives></inline-formula> in response <italic>r</italic>.</p>
<p>The TF-IDF model improves upon the BoW model by weighting terms based on their importance. The term frequency (TF) measures how often a word appears in a document, while the inverse document frequency (IDF) measures how unique or rare a word is across all documents. The TF-IDF score for a word <italic>w</italic> in response <italic>r</italic> is calculated as: 
<disp-formula id="j_nejsds105_eq_003">
<label>(3.3)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:mtext>TF-IDF</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">w</mml:mi>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mtext>TF</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">w</mml:mi>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>×</mml:mo>
<mml:mtext>IDF</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">w</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ \text{TF-IDF}(w,r)=\text{TF}(w,r)\times \text{IDF}(w)\]]]></tex-math></alternatives>
</disp-formula> 
where: 
<disp-formula id="j_nejsds105_eq_004">
<label>(3.4)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:mtext>TF</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">w</mml:mi>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo><mml:mstyle displaystyle="true">
<mml:mfrac>
<mml:mrow>
<mml:mi mathvariant="italic">f</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">w</mml:mi>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mo largeop="false" movablelimits="false">∑</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:msup>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>′</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo stretchy="false">∈</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mi mathvariant="italic">f</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo>′</mml:mo>
</mml:mrow>
</mml:msup>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:mstyle>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ \text{TF}(w,r)=\frac{f(w,r)}{{\textstyle\sum _{{w^{\prime }}\in r}}f({w^{\prime }},r)}\]]]></tex-math></alternatives>
</disp-formula> 
and 
<disp-formula id="j_nejsds105_eq_005">
<label>(3.5)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:mtext>IDF</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">w</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mo movablelimits="false">log</mml:mo>
<mml:mfenced separators="" open="(" close=")">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:mfrac>
<mml:mrow>
<mml:mi mathvariant="italic">N</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mo stretchy="false">|</mml:mo>
<mml:mo fence="true" stretchy="false">{</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo stretchy="false">∈</mml:mo>
<mml:mi mathvariant="italic">R</mml:mi>
<mml:mo>:</mml:mo>
<mml:mi mathvariant="italic">w</mml:mi>
<mml:mo stretchy="false">∈</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo fence="true" stretchy="false">}</mml:mo>
<mml:mo stretchy="false">|</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:mstyle>
</mml:mrow>
</mml:mfenced>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ \text{IDF}(w)=\log \left(\frac{N}{|\{r\in R:w\in r\}|}\right)\]]]></tex-math></alternatives>
</disp-formula> 
where <inline-formula id="j_nejsds105_ineq_025"><alternatives><mml:math>
<mml:mi mathvariant="italic">f</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">w</mml:mi>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[$f(w,r)$]]></tex-math></alternatives></inline-formula> is the frequency of word <italic>w</italic> in response <italic>r</italic>, <italic>N</italic> is the total number of responses, and <inline-formula id="j_nejsds105_ineq_026"><alternatives><mml:math>
<mml:mo stretchy="false">|</mml:mo>
<mml:mo fence="true" stretchy="false">{</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo stretchy="false">∈</mml:mo>
<mml:mi mathvariant="italic">R</mml:mi>
<mml:mo>:</mml:mo>
<mml:mi mathvariant="italic">w</mml:mi>
<mml:mo stretchy="false">∈</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo fence="true" stretchy="false">}</mml:mo>
<mml:mo stretchy="false">|</mml:mo></mml:math><tex-math><![CDATA[$|\{r\in R:w\in r\}|$]]></tex-math></alternatives></inline-formula> is the number of responses containing the word <italic>w</italic>. Finally, for a response <italic>r</italic> with words <inline-formula id="j_nejsds105_ineq_027"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mo>…</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">n</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${w_{1}},{w_{2}},\dots ,{w_{n}}$]]></tex-math></alternatives></inline-formula>, the vector representation <inline-formula id="j_nejsds105_ineq_028"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold">v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>TF-IDF</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[${\mathbf{v}_{\text{TF-IDF}}}(r)$]]></tex-math></alternatives></inline-formula> is given by: 
<disp-formula id="j_nejsds105_eq_006">
<alternatives><mml:math display="block">
<mml:mtable displaystyle="true" columnalign="right left" columnspacing="0pt">
<mml:mtr>
<mml:mtd class="align-odd">
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="bold">v</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mtext>TF-IDF</mml:mtext>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
</mml:mtd>
<mml:mtd class="align-even">
<mml:mo fence="true" stretchy="false">[</mml:mo>
<mml:mtext>TF-IDF</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mtext>TF-IDF</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd class="align-odd"/>
<mml:mtd class="align-even">
<mml:mo>…</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mtext>TF-IDF</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">w</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">n</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo fence="true" stretchy="false">]</mml:mo>
<mml:mo>.</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[\begin{aligned}{}{\mathbf{v}_{\text{TF-IDF}}}(r)=& [\text{TF-IDF}({w_{1}},r),\text{TF-IDF}({w_{2}},r),\\ {} & \dots ,\text{TF-IDF}({w_{n}},r)].\end{aligned}\]]]></tex-math></alternatives>
</disp-formula>
</p>
<p>After transforming each response into a vector, we adopt machine learning methods to train classifiers to detect each emotion. In this study, we consider two methods: logistic regression [<xref ref-type="bibr" rid="j_nejsds105_ref_036">36</xref>] and SVM [<xref ref-type="bibr" rid="j_nejsds105_ref_034">34</xref>]. Logistic regression predicts the probability of a class by applying a logistic function to a linear combination of input features, whereas SVM finds the hyperplane that best separates the data into classes by maximizing the margin between the classes. With the kernel method [<xref ref-type="bibr" rid="j_nejsds105_ref_015">15</xref>], those linear classifiers can be extended for non-linear classification. However, the performance of non-linear classifiers depends on the careful choice of kernels and their hyper-parameters for specific problems and datasets. To avoid excessive parameter tuning, we only consider the linear classifiers in the BoW and TF-IDF methods. To handle imbalanced data, we can also use the Synthetic Minority Over-sampling Technique (SMOTE) [<xref ref-type="bibr" rid="j_nejsds105_ref_008">8</xref>] to generate synthetic samples for the minority class, balancing the dataset. After conducting preliminary experiments, we employ the SVM with a linear kernel for the BoW method and logistic regression with SMOTE for the TF-IDF method, as these combinations provide generally better accuracy across different emotions.</p>
</sec>
<sec id="j_nejsds105_s_011">
<label>3.2.4</label>
<title>Fine-Tuned MentalBERT</title>
<p>BERT [<xref ref-type="bibr" rid="j_nejsds105_ref_012">12</xref>] is a transformer-based model designed to understand the context of words in a sentence through bidirectional training. MentalBERT [<xref ref-type="bibr" rid="j_nejsds105_ref_017">17</xref>] is a pre-trained BERT model specialized in mental health-related text. We first load the pretrained network “mental-bert-base-uncased”. Then, we fine-tune MentalBERT using our dataset to tailor it to the emotions related to student mental health during the COVID-19 pandemic. The model was trained for 5 epochs with a batch size of 16, a learning rate of <inline-formula id="j_nejsds105_ineq_029"><alternatives><mml:math>
<mml:mn>2</mml:mn>
<mml:mo>×</mml:mo>
<mml:msup>
<mml:mrow>
<mml:mn>10</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mo>−</mml:mo>
<mml:mn>5</mml:mn>
</mml:mrow>
</mml:msup></mml:math><tex-math><![CDATA[$2\times {10^{-5}}$]]></tex-math></alternatives></inline-formula>, and a maximum sequence length of 128 tokens. The fine-tuning process adjusts the pre-trained model’s parameters to minimize the loss on the training data using the true emotion labels in our dataset.</p>
</sec>
<sec id="j_nejsds105_s_012">
<label>3.2.5</label>
<title>Zero-Shot GPT</title>
<p>GPT [<xref ref-type="bibr" rid="j_nejsds105_ref_030">30</xref>], a generative LLM, has revolutionized NLP and artificial intelligence since ChatGPT was introduced in 2022. In this study, we utilize OpenAI’s GPT-3.5 [<xref ref-type="bibr" rid="j_nejsds105_ref_027">27</xref>] to generate emotion predictions for each response, as a baseline method. Given its ability to understand and generate human-like text, GPT-3.5 can be prompted with the students’ responses and asked whether the input paragraph expresses specific emotions. The predictions are then mapped to the binary labels for further evaluation. The details of GPT’s prompts are listed in Appendix <xref rid="j_nejsds105_app_002">B</xref>. We do not input the human labeling into the GPT prompt; thus, the method can be considered a zero-shot one. The experiment was conducted using GPT-3.5-turbo, the July 2024 version.</p>
<p>In Table <xref rid="j_nejsds105_tab_002">2</xref>, we summarize the training complexity of the five methods compared in this paper.</p>
<table-wrap id="j_nejsds105_tab_002">
<label>Table 2</label>
<caption>
<p>Comparison of the model complexity of the five methods considered in this study.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: center; border-top: double; border-bottom: solid thin">Model</td>
<td style="vertical-align: top; text-align: center; border-top: double; border-bottom: solid thin">Complexity</td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: center">Lexicon</td>
<td style="vertical-align: top; text-align: center">Build a customized dictionary for each emotion, usually including around 10 words in our application.</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: center">BoW</td>
<td style="vertical-align: top; text-align: center">Convert each instance to a vector with maximum length 1000, and train a linear SVM (parameters &lt; 1k).</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: center">TF-IDF</td>
<td style="vertical-align: top; text-align: center">Convert each instance to a vector with maximum length 1000, and train a logistic regression (parameters &lt; 1k).</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: center">MentalBERT</td>
<td style="vertical-align: top; text-align: center">Pretrained 110M parameters, fine-tuning for each emotion.</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">GPT-3.5</td>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">Pretrained 20B parameters, training is not needed.</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="j_nejsds105_s_013">
<label>3.3</label>
<title>Comparison Framework</title>
<sec id="j_nejsds105_s_014">
<label>3.3.1</label>
<title>Performance Criterion</title>
<p>To compare the performance of the different models, we use several standard evaluation metrics: True Positive (TP), True Negative (TN), False Positive (FP), False Negative (FN), Accuracy, Precision, Recall, F1 Score, Receiver Operating Characteristic (ROC) Curve, and Area Under the ROC Curve (AUC). For a response <italic>r</italic>, we set <inline-formula id="j_nejsds105_ineq_030"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn></mml:math><tex-math><![CDATA[${y_{r}}({\textbf{E}_{j}})=1$]]></tex-math></alternatives></inline-formula> if human labeling considers that it includes the emotion <inline-formula id="j_nejsds105_ineq_031"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${\textbf{E}_{j}}$]]></tex-math></alternatives></inline-formula>, otherwise <inline-formula id="j_nejsds105_ineq_032"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn></mml:math><tex-math><![CDATA[${y_{r}}({\textbf{E}_{j}})=0$]]></tex-math></alternatives></inline-formula>. Then, for an NLP method, its prediction result is <inline-formula id="j_nejsds105_ineq_033"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[${\hat{y}_{r}}({\textbf{E}_{j}})$]]></tex-math></alternatives></inline-formula>. The first four metrics are calculated as: 
<disp-formula id="j_nejsds105_eq_007">
<alternatives><mml:math display="block">
<mml:mtable displaystyle="true" columnalign="right left" columnspacing="0pt">
<mml:mtr>
<mml:mtd class="align-odd">
<mml:msub>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mtd>
<mml:mtd class="align-even">
<mml:mo>=</mml:mo>
<mml:munderover accentunder="false" accent="false">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:mo largeop="true" movablelimits="false">∑</mml:mo></mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">R</mml:mi>
</mml:mrow>
</mml:munderover>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo fence="true" maxsize="1.61em" minsize="1.61em">{</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo fence="true" maxsize="1.61em" minsize="1.61em">}</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd class="align-odd">
<mml:msub>
<mml:mrow>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mtd>
<mml:mtd class="align-even">
<mml:mo>=</mml:mo>
<mml:munderover accentunder="false" accent="false">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:mo largeop="true" movablelimits="false">∑</mml:mo></mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">R</mml:mi>
</mml:mrow>
</mml:munderover>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo fence="true" maxsize="1.61em" minsize="1.61em">{</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo stretchy="false">≠</mml:mo>
<mml:mn>1</mml:mn>
<mml:mspace width="2.5pt"/>
<mml:mtext>and</mml:mtext>
<mml:mspace width="2.5pt"/>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo fence="true" maxsize="1.61em" minsize="1.61em">}</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd class="align-odd">
<mml:msub>
<mml:mrow>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mtd>
<mml:mtd class="align-even">
<mml:mo>=</mml:mo>
<mml:munderover accentunder="false" accent="false">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:mo largeop="true" movablelimits="false">∑</mml:mo></mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">R</mml:mi>
</mml:mrow>
</mml:munderover>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo fence="true" maxsize="1.61em" minsize="1.61em">{</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mspace width="2.5pt"/>
<mml:mtext>and</mml:mtext>
<mml:mspace width="2.5pt"/>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo stretchy="false">≠</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo fence="true" maxsize="1.61em" minsize="1.61em">}</mml:mo>
</mml:mtd>
</mml:mtr>
<mml:mtr>
<mml:mtd class="align-odd">
<mml:msub>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mtd>
<mml:mtd class="align-even">
<mml:mo>=</mml:mo>
<mml:munderover accentunder="false" accent="false">
<mml:mrow>
<mml:mstyle displaystyle="true">
<mml:mo largeop="true" movablelimits="false">∑</mml:mo></mml:mstyle>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">R</mml:mi>
</mml:mrow>
</mml:munderover>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo fence="true" maxsize="1.61em" minsize="1.61em">{</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo stretchy="false">≠</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo fence="true" maxsize="1.61em" minsize="1.61em">}</mml:mo>
<mml:mo mathvariant="normal">,</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[\begin{aligned}{}{\text{TP}_{{\textbf{E}_{j}}}}& ={\sum \limits_{r=1}^{R}}\mathbf{1}\Big\{{y_{r}}({\textbf{E}_{j}})={\hat{y}_{r}}({\textbf{E}_{j}})=1\Big\}\\ {} {\text{FP}_{{\textbf{E}_{j}}}}& ={\sum \limits_{r=1}^{R}}\mathbf{1}\Big\{{y_{r}}({\textbf{E}_{j}})\ne 1\hspace{2.5pt}\text{and}\hspace{2.5pt}{\hat{y}_{r}}({\textbf{E}_{j}})=1\Big\}\\ {} {\text{FN}_{{\textbf{E}_{j}}}}& ={\sum \limits_{r=1}^{R}}\mathbf{1}\Big\{{y_{r}}({\textbf{E}_{j}})=1\hspace{2.5pt}\text{and}\hspace{2.5pt}{\hat{y}_{r}}({\textbf{E}_{j}})\ne 1\Big\}\\ {} {\text{TN}_{{\textbf{E}_{j}}}}& ={\sum \limits_{r=1}^{R}}\mathbf{1}\Big\{{y_{r}}({\textbf{E}_{j}})={\hat{y}_{r}}({\textbf{E}_{j}})\ne 1\Big\},\end{aligned}\]]]></tex-math></alternatives>
</disp-formula> 
where <inline-formula id="j_nejsds105_ineq_034"><alternatives><mml:math>
<mml:mn mathvariant="bold">1</mml:mn>
<mml:mo fence="true" stretchy="false">{</mml:mo>
<mml:mo>·</mml:mo>
<mml:mo fence="true" stretchy="false">}</mml:mo></mml:math><tex-math><![CDATA[$\mathbf{1}\{\cdot \}$]]></tex-math></alternatives></inline-formula> denotes an indicator function. Then, accuracy measures the proportion of correct predictions (both TP and TN) out of the total number of predictions, calculated as: 
<disp-formula id="j_nejsds105_eq_008">
<label>(3.6)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mrow>
<mml:mtext>ACC</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo><mml:mstyle displaystyle="true">
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mstyle>
<mml:mo>.</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ {\text{ACC}_{{\textbf{E}_{j}}}}=\frac{{\text{TP}_{{\textbf{E}_{j}}}}+{\text{TN}_{{\textbf{E}_{j}}}}}{{\text{TP}_{{\textbf{E}_{j}}}}+{\text{TN}_{{\textbf{E}_{j}}}}+{\text{FP}_{{\textbf{E}_{j}}}}+{\text{FN}_{{\textbf{E}_{j}}}}}.\]]]></tex-math></alternatives>
</disp-formula>
</p>
<p>Precision measures the proportion of true positive predictions out of all positive predictions (TP and FP), calculated as: 
<disp-formula id="j_nejsds105_eq_009">
<label>(3.7)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mrow>
<mml:mtext>Precision</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo><mml:mstyle displaystyle="true">
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mstyle>
<mml:mo>.</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ {\text{Precision}_{{\textbf{E}_{j}}}}=\frac{{\text{TP}_{{\textbf{E}_{j}}}}}{{\text{TP}_{{\textbf{E}_{j}}}}+{\text{FP}_{{\textbf{E}_{j}}}}}.\]]]></tex-math></alternatives>
</disp-formula>
</p>
<p>Recall measures the proportion of true positive predictions out of all actual positive cases (TP and FN), calculated as: 
<disp-formula id="j_nejsds105_eq_010">
<label>(3.8)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mrow>
<mml:mtext>Recall</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo><mml:mstyle displaystyle="true">
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>TP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>FN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mstyle>
<mml:mo>.</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ {\text{Recall}_{{\textbf{E}_{j}}}}=\frac{{\text{TP}_{{\textbf{E}_{j}}}}}{{\text{TP}_{{\textbf{E}_{j}}}}+{\text{FN}_{{\textbf{E}_{j}}}}}.\]]]></tex-math></alternatives>
</disp-formula>
</p>
<p>Finally, the F1 Score is the harmonic mean of Precision and Recall, providing a single metric that balances both concerns, calculated as: 
<disp-formula id="j_nejsds105_eq_011">
<label>(3.9)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mrow>
<mml:mtext>F1</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo>
<mml:mn>2</mml:mn>
<mml:mo>×</mml:mo><mml:mstyle displaystyle="true">
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>Precision</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>×</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>Recall</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>Precision</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>Recall</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mstyle>
<mml:mo>.</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ {\text{F1}_{{\textbf{E}_{j}}}}=2\times \frac{{\text{Precision}_{{\textbf{E}_{j}}}}\times {\text{Recall}_{{\textbf{E}_{j}}}}}{{\text{Precision}_{{\textbf{E}_{j}}}}+{\text{Recall}_{{\textbf{E}_{j}}}}}.\]]]></tex-math></alternatives>
</disp-formula>
</p>
<p>The Receiver Operating Characteristic (ROC) Curve is a graphical representation of a model’s diagnostic ability. It plots the True Positive Rate (Recall) against the False Positive Rate (FPR) with different thresholds, where FPR is defined as: 
<disp-formula id="j_nejsds105_eq_012">
<label>(3.10)</label><alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:msub>
<mml:mrow>
<mml:mtext>FPR</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>=</mml:mo><mml:mstyle displaystyle="true">
<mml:mfrac>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>FP</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
<mml:mo>+</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>TN</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:mfrac>
</mml:mstyle>
<mml:mo>.</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ {\text{FPR}_{{\textbf{E}_{j}}}}=\frac{{\text{FP}_{{\textbf{E}_{j}}}}}{{\text{FP}_{{\textbf{E}_{j}}}}+{\text{TN}_{{\textbf{E}_{j}}}}}.\]]]></tex-math></alternatives>
</disp-formula> 
Then, we can calculate the Area Under the ROC Curve (AUC), which quantifies the model’s overall ability to discriminate between positive and negative classes. A higher AUC indicates a better-performing model.</p>
</sec>
<sec id="j_nejsds105_s_015">
<label>3.3.2</label>
<title>Comparison Steps</title>
<p>To give a comprehensive comparison of the NLP methods for emotion detection in students’ responses, our study includes the following three steps: 
<list>
<list-item id="j_nejsds105_li_006">
<label>1.</label>
<p>Compare the emotion detection performance of the five NLP methods. We use the accuracy and F1 scores as the criteria. For the four trainable methods, i.e., Lexicon, BoW, TF-IDF, and MentalBERT, we vary the size of the training data using <inline-formula id="j_nejsds105_ineq_035"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula>, <inline-formula id="j_nejsds105_ineq_036"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% $]]></tex-math></alternatives></inline-formula>, and <inline-formula id="j_nejsds105_ineq_037"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> of the entire dataset, to evaluate how the sample size affects the performance. We repeat the training/testing splits 100 times and report the average accuracy and F1 scores on the testing set. The zero-shot method, GPT-3.5, is used as the baseline.</p>
</list-item>
<list-item id="j_nejsds105_li_007">
<label>2.</label>
<p>Evaluate the stability and distinguishing ability of the NLP methods. We perform 5-fold stratified cross-validation [<xref ref-type="bibr" rid="j_nejsds105_ref_045">45</xref>] 100 times with different data separations. In each stratified cross-validation, the data is split into five stratified folds, ensuring proportional representation of the positive/negative instances. The model is trained on four folds and tested on the remaining fold to evaluate performance. The process is repeated five times, once for each fold as the testing set. By doing so, we reduce variability caused by differences in the proportions of positive/negative instances between the training and testing datasets. The standard deviations of the accuracy and F1 scores are calculated to assess whether the model’s performance is sensitive to data splitting. Then, we obtain the predicted probabilities for emotions and calculate the average AUC for each model across 100 stratified cross-validations to assess their distinguishing abilities.</p>
</list-item>
<list-item id="j_nejsds105_li_008">
<label>3.</label>
<p>Show the consistency of the detection results among the five NLP methods for different emotions. We conduct pairwise comparisons to determine whether the detection results of one approach are consistent with those of another. This analysis highlights the similarities and differences among the five NLP methods.</p>
</list-item>
</list>
</p>
</sec>
</sec>
</sec>
<sec id="j_nejsds105_s_016">
<label>4</label>
<title>Comparison Results and Discussion</title>
<sec id="j_nejsds105_s_017">
<label>4.1</label>
<title>Detection Performance Comparison</title>
<p>In this section, we examine the performance of four trainable methods – Lexicon, BoW, TF-IDF, and MentalBERT – as well as the zero-shot method, GPT. For the four trainable methods, we consider training data splits of <inline-formula id="j_nejsds105_ineq_038"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula>, <inline-formula id="j_nejsds105_ineq_039"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% $]]></tex-math></alternatives></inline-formula>, and <inline-formula id="j_nejsds105_ineq_040"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula> to evaluate the impact of training sample size. We choose accuracy and F1 scores from the testing data, as defined in Section <xref rid="j_nejsds105_s_005">3</xref>, as the performance criteria. For each percentage, we repeat the training/testing splits 100 times, and report the average performance criteria. The original results are presented in the tables in Appendix <xref rid="j_nejsds105_s_022">C.1</xref>.</p>
<p>To compare the performance of the five methods, we show the boxplots of their accuracy (upper panel) and F1-scores (lower panel) with various training percentages in Figure <xref rid="j_nejsds105_fig_003">3</xref>. We observe that the training percentage has a limited effect on the Lexicon’s performance. The median F1 score of the Lexicon with a <inline-formula id="j_nejsds105_ineq_041"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula> training split is even slightly higher than those with <inline-formula id="j_nejsds105_ineq_042"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> and <inline-formula id="j_nejsds105_ineq_043"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% $]]></tex-math></alternatives></inline-formula> training percentages. The performance of BoW and TF-IDF is modestly affected by the training percentage, and their overall trends are similar to each other. Finally, the performance of MentalBERT, especially its F1 score, is significantly impacted by the training percentage. The median F1 score of MentalBERT with <inline-formula id="j_nejsds105_ineq_044"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> is the highest among all NLP methods; however, its median F1 score with <inline-formula id="j_nejsds105_ineq_045"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula> is the lowest. A possible reason is that <inline-formula id="j_nejsds105_ineq_046"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula> of the dataset, comprising only 80 instances, is insufficient to fine-tune the 110M parameters in the MentalBERT model. The zero-shot GPT demonstrates modest performance, similar to BoW and TF-IDF with a <inline-formula id="j_nejsds105_ineq_047"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% $]]></tex-math></alternatives></inline-formula> training percentage. However, its F1 scores surpass BoW, TF-IDF, and MentalBERT with a <inline-formula id="j_nejsds105_ineq_048"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula> training percentage. Overall, the Lexicon method is relatively resistant to decreases in the training set size, while MentalBERT is the most sensitive. Meanwhile, the performance changes in BoW and TF-IDF with varying training set sizes are moderate.</p>
<fig id="j_nejsds105_fig_003">
<label>Figure 3</label>
<caption>
<p>The boxplots of accuracy and F1 scores from the testing data among 10 emotions for the four trainable methods with <inline-formula id="j_nejsds105_ineq_049"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula>, <inline-formula id="j_nejsds105_ineq_050"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% $]]></tex-math></alternatives></inline-formula>, and <inline-formula id="j_nejsds105_ineq_051"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula> training percentages and the zero-shot GPT. The values of the three typical emotions, <italic>Depression</italic>, <italic>Lack of Motivation</italic>, and <italic>Miscellaneous</italic>, are also highlighted.</p>
</caption>
<graphic xlink:href="nejsds105_g003.jpg"/>
</fig>
<p>We next examine the performance of these methods for individual emotions. We select three emotions: <italic>Depression</italic>, <italic>Lack of Motivation</italic>, and <italic>Miscellaneous</italic>, which present various levels of detection performance. The emotion with good performance, <italic>Depression</italic>, can be identified by keywords such as “depression” and “depressed” in the responses. The emotion associated with poor performance, <italic>Miscellaneous</italic>, is ambiguous and has only a small positive sample size. The moderate one, <italic>Lack of Motivation</italic>, has a clear definition but requires a comprehensive understanding of the responses to detect it. The accuracies and F1 scores of the NLP methods for the three typical emotions with various training percentages are shown in Figure <xref rid="j_nejsds105_fig_004">4</xref>. We also highlight the values of the three typical emotions in Figure <xref rid="j_nejsds105_fig_003">3</xref>.</p>
<fig id="j_nejsds105_fig_004">
<label>Figure 4</label>
<caption>
<p>The accuracy and F1 score of the four trainable methods with <inline-formula id="j_nejsds105_ineq_052"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula>, <inline-formula id="j_nejsds105_ineq_053"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% $]]></tex-math></alternatives></inline-formula>, and <inline-formula id="j_nejsds105_ineq_054"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula> training data split, and the zero-shot GPT for three typical emotions spanning different levels of detection performance.</p>
</caption>
<graphic xlink:href="nejsds105_g004.jpg"/>
</fig>
<p>For <italic>Depression</italic>, the four trainable NLP methods with <inline-formula id="j_nejsds105_ineq_055"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> training percentages achieve high performance with an accuracy of <inline-formula id="j_nejsds105_ineq_056"><alternatives><mml:math>
<mml:mn>0.9</mml:mn>
<mml:mo stretchy="false">∼</mml:mo>
<mml:mn>1.0</mml:mn></mml:math><tex-math><![CDATA[$0.9\sim 1.0$]]></tex-math></alternatives></inline-formula> and F1 scores of <inline-formula id="j_nejsds105_ineq_057"><alternatives><mml:math>
<mml:mn>0.8</mml:mn>
<mml:mo stretchy="false">∼</mml:mo>
<mml:mn>1.0</mml:mn></mml:math><tex-math><![CDATA[$0.8\sim 1.0$]]></tex-math></alternatives></inline-formula>. Moreover, Lexicon, BoW, and MentalBERT all achieve significant improvements in both accuracy and F1 score compared to GPT, when the training percentage exceeds <inline-formula id="j_nejsds105_ineq_058"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% $]]></tex-math></alternatives></inline-formula>, whereas TF-IDF yields a minor improvement. However, with a <inline-formula id="j_nejsds105_ineq_059"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula> training percentage, the performance of TF-IDF and MentalBERT drops dramatically, while the performance of Lexicon and BoW remains stable.</p>
<p>For the emotion with moderate detection difficulty, <italic>Lack of Motivation</italic>, the four trainable methods, with an <inline-formula id="j_nejsds105_ineq_060"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> training percentage, can achieve higher or similar accuracy or F1 scores compared to the zero-shot GPT. However, the improvement of the trainable methods over GPT is smaller than that in the <italic>Depression</italic> case. The F1 score of MentalBERT is superior to that of the other methods, demonstrating its capability to understand the context of the responses. When the training percentage drops to <inline-formula id="j_nejsds105_ineq_061"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% $]]></tex-math></alternatives></inline-formula> and <inline-formula id="j_nejsds105_ineq_062"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula>, the F1 scores of most trainable methods decrease to levels below or similar to those of GPT. This suggests that we require a sufficiently large dataset to train the model for this emotion.</p>
<p>For the challenging emotion, <italic>Miscellaneous</italic>, the four trainable methods, along with GPT, achieve high accuracy of around <inline-formula id="j_nejsds105_ineq_063"><alternatives><mml:math>
<mml:mn>0.90</mml:mn>
<mml:mo stretchy="false">∼</mml:mo>
<mml:mn>0.95</mml:mn></mml:math><tex-math><![CDATA[$0.90\sim 0.95$]]></tex-math></alternatives></inline-formula> and low F1-scores of around <inline-formula id="j_nejsds105_ineq_064"><alternatives><mml:math>
<mml:mn>0</mml:mn>
<mml:mo stretchy="false">∼</mml:mo>
<mml:mn>0.1</mml:mn></mml:math><tex-math><![CDATA[$0\sim 0.1$]]></tex-math></alternatives></inline-formula>. These results reflect the very small number of positive data points for the <italic>Miscellaneous</italic> emotion, which leads the NLP methods to predict almost all sentences as negative. Due to this issue, increasing the training percentage cannot improve the performance of the four trainable methods. Moreover, the zero-shot GPT also fails to recognize this ambiguous definition, yielding a near-zero F1 score.</p>
</sec>
<sec id="j_nejsds105_s_018">
<label>4.2</label>
<title>Model Stability and Distinguishing Ability</title>
<p>The next step is to evaluate the stability and distinguishing ability of the four trainable methods: Lexicon, BoW, TF-IDF, and MentalBERT. We find the mean and standard deviation of the accuracies and F1 scores from 100 repetitions of stratified 5-fold cross-validation. The means are similar to those with an <inline-formula id="j_nejsds105_ineq_065"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> training percentage in Section <xref rid="j_nejsds105_s_017">4.1</xref>, as the models using 5-fold cross-validation were also fitted from <inline-formula id="j_nejsds105_ineq_066"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> of the data. The standard deviation tells us how the performance measurements change depending on which <inline-formula id="j_nejsds105_ineq_067"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> of the data they are trained with, showing the stability of the methods. Then, we calculate the average AUC of the 100 repetitions, which indicates the model’s ability to separate each emotion. The AUC is close to 1 when a method is capable of identifying all instances of an emotion with very few false positives. At the same time, an AUC of 0.5 means the method distinguishes an emotion no better than a random guess. The original results are presented in the tables in Appendix <xref rid="j_nejsds105_s_023">C.2</xref>.</p>
<fig id="j_nejsds105_fig_005">
<label>Figure 5</label>
<caption>
<p>The boxplots of stability and distinguishing ability measurements among 10 emotions of the four trainable methods using 100 repetitions of 5-fold cross-validation. The values of the three typical emotions, <italic>Depression</italic>, <italic>Lack of Motivation</italic>, and <italic>Miscellaneous</italic>, are also highlighted.</p>
</caption>
<graphic xlink:href="nejsds105_g005.jpg"/>
</fig>
<p>The left and middle plots in Figure <xref rid="j_nejsds105_fig_005">5</xref> show the boxplots of the standard deviations of the accuracy and F1 scores, and the right plot illustrates the boxplots of average AUCs among 10 emotions for the four trainable methods. There is no result for GPT, as it does not require a training process and cannot produce a probability of a positive detection. For the accuracy, it is clear that Lexicon has the smallest standard deviations, while MentalBERT has the largest. For the standard deviations of F1 scores, the trend is less obvious. However, the lower bound of Lexicon’s boxplot is lower than that of the other three trainable methods, showing that it can achieve the highest stability for some emotions. Those plots show that Lexicon excels in the stability measurements, while MentalBERT’s performance is sensitive to the part of the data with which it is trained. In the right plot, the upper bounds of the boxplots are all close to 1.0, but their lower bounds are different. Among the four methods, TF-IDF shows the highest average AUCs, and Lexicon and MentalBERT have the lowest values. Thus, when using AUC as the criterion, TF-IDF shows the highest distinguishing ability for some challenging emotions.</p>
<p>We show the stability and distinguishing ability measurements for the three typical emotions identified in Section <xref rid="j_nejsds105_s_017">4.1</xref> in Figure <xref rid="j_nejsds105_fig_006">6</xref>. Their values are also highlighted in Figure <xref rid="j_nejsds105_fig_005">5</xref> with special legends. For the emotion with good detection performance, <italic>Depression</italic>, the standard deviations of accuracy and F1 score are close to 0 for Lexicon, and slightly increase from BoW and TF-IDF to MentalBERT. The AUCs of all four methods are almost 1, showing excellent distinguishing ability. For the moderate one, <italic>Lack of Motivation</italic>, the standard deviation of accuracy again increases from Lexicon, BoW, TF-IDF, to MentalBERT. However, MentalBERT achieves the smallest standard deviation of F1 scores. One possible reason is that MentalBERT is better able to understand the concept of <italic>Lack of Motivation</italic>, thereby improving its stability. The AUCs of the four methods lie between about 0.75 and 0.85, and TF-IDF achieves the highest AUC.</p>
<p>For the emotion with poor performance, <italic>Miscellaneous</italic>, the standard deviations of Lexicon are still low despite its overall poor averages shown in Section <xref rid="j_nejsds105_s_017">4.1</xref>. MentalBERT again has the largest standard deviation in its accuracy and F1 scores. The AUCs lie between about 0.5 and 0.6, indicating that the models’ predictions are only slightly better than a random guess. Among the four methods, TF-IDF has the highest AUC, while Lexicon and MentalBERT have the lowest. We can conclude that for both easy and challenging emotions, Lexicon exhibits the highest stability, while MentalBERT shows the lowest. For the moderate one, MentalBERT’s stability becomes better. For moderate and challenging emotions, TF-IDF’s distinguishing ability outperforms others when using AUC as the criterion.</p>
<fig id="j_nejsds105_fig_006">
<label>Figure 6</label>
<caption>
<p>The stability and distinguishing ability measurements of the four trainable methods using 5-fold cross-validation for three typical emotions spanning different levels of detection performance.</p>
</caption>
<graphic xlink:href="nejsds105_g006.jpg"/>
</fig>
</sec>
<sec id="j_nejsds105_s_019">
<label>4.3</label>
<title>Prediction Consistency</title>
<p>In this section, we aim to compare the consistency between the detections of different NLP methods, which indicates whether they yield identical predictions for each student’s response. To handle emotions with a very small number of positive samples, we choose the Jaccard index, also known as the Jaccard similarity, to measure consistency. The Jaccard index between the two methods for a certain emotion can be calculated as: 
<disp-formula id="j_nejsds105_eq_013">
<alternatives><mml:math display="block">
<mml:mtable displaystyle="true">
<mml:mtr>
<mml:mtd>
<mml:mtext>Jac</mml:mtext>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>Meth</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal">,</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext>Meth</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo><mml:mstyle displaystyle="true">
<mml:mfrac>
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mo largeop="false" movablelimits="false">∑</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">R</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:mi mathvariant="italic">I</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>Meth</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mspace width="2.5pt"/>
<mml:mtext>and</mml:mtext>
<mml:mspace width="2.5pt"/>
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>Meth</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:msubsup>
<mml:mrow>
<mml:mo largeop="false" movablelimits="false">∑</mml:mo>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">R</mml:mi>
</mml:mrow>
</mml:msubsup>
<mml:mi mathvariant="italic">I</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>Meth</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mspace width="2.5pt"/>
<mml:mtext>or</mml:mtext>
<mml:mspace width="2.5pt"/>
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>Meth</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup>
<mml:mo>=</mml:mo>
<mml:mn>1</mml:mn>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
</mml:mrow>
</mml:mfrac>
</mml:mstyle>
<mml:mo mathvariant="normal">,</mml:mo>
</mml:mtd>
</mml:mtr>
</mml:mtable></mml:math><tex-math><![CDATA[\[ \text{Jac}({\text{Meth}_{1}},{\text{Meth}_{2}})=\frac{{\textstyle\textstyle\sum _{r=1}^{R}}I({\hat{y}_{r}^{{\text{Meth}_{1}}}}=1\hspace{2.5pt}\text{and}\hspace{2.5pt}{\hat{y}_{r}^{{\text{Meth}_{2}}}}=1)}{{\textstyle\textstyle\sum _{r=1}^{R}}I({\hat{y}_{r}^{{\text{Meth}_{1}}}}=1\hspace{2.5pt}\text{or}\hspace{2.5pt}{\hat{y}_{r}^{{\text{Meth}_{2}}}}=1)},\]]]></tex-math></alternatives>
</disp-formula> 
where <inline-formula id="j_nejsds105_ineq_068"><alternatives><mml:math>
<mml:mi mathvariant="italic">I</mml:mi>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:mo>·</mml:mo>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[$I(\cdot )$]]></tex-math></alternatives></inline-formula> is the indicator function, and <inline-formula id="j_nejsds105_ineq_069"><alternatives><mml:math>
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>Meth</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mn>1</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup></mml:math><tex-math><![CDATA[${\hat{y}_{r}^{{\text{Meth}_{1}}}}$]]></tex-math></alternatives></inline-formula> and <inline-formula id="j_nejsds105_ineq_070"><alternatives><mml:math>
<mml:msubsup>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msub>
<mml:mrow>
<mml:mtext>Meth</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mn>2</mml:mn>
</mml:mrow>
</mml:msub>
</mml:mrow>
</mml:msubsup></mml:math><tex-math><![CDATA[${\hat{y}_{r}^{{\text{Meth}_{2}}}}$]]></tex-math></alternatives></inline-formula> denote whether each of the two methods predicts that the emotion is expressed in response <italic>r</italic>. The prediction results are based on the first repetition of the 100 5-fold cross-validation processes in Section <xref rid="j_nejsds105_s_018">4.2</xref>. We calculate the Jaccard indices from the 15 pairwise comparisons among the five NLP methods and the true labels, and the results of the ten emotions are listed in Appendix <xref rid="j_nejsds105_s_024">C.3</xref>. Figure <xref rid="j_nejsds105_fig_007">7</xref> presents the average pairwise consistencies over the ten emotions. MentalBERT vs. true labels (0.5) and BoW vs. TF-IDF (0.48) have the two highest average Jaccard indices. The first pair demonstrates the capability of trainable Transformer models to predict results close to the true labels. Meanwhile, the high consistency of the second pair is possibly due to the similar mechanisms of the two methods, which first convert the responses to vectors and then train a machine learning classifier. Then, we examine the leftmost column, which shows the consistency of the five NLP methods with the true labels. MentalBERT has the highest score (0.5), followed by BoW (0.43), and Lexicon, TF-IDF, and GPT have the lowest scores (0.37).</p>
<fig id="j_nejsds105_fig_007">
<label>Figure 7</label>
<caption>
<p>The average Jaccard indices among 10 emotions between five NLP methods and the true labels.</p>
</caption>
<graphic xlink:href="nejsds105_g007.jpg"/>
</fig>
<p>Finally, we present the Jaccard indices for the three typical emotions in Figure <xref rid="j_nejsds105_fig_008">8</xref>. For the emotion with good detection performance, <italic>Depression</italic>, almost all pairwise consistencies are above 0.5, and the consistencies among the true labels, Lexicon, BoW, and MentalBERT are higher than 0.75. However, TF-IDF and GPT generate relatively inconsistent predictions, with a Jaccard index lower than 0.5, which is consistent with the results in Figure <xref rid="j_nejsds105_fig_004">4</xref>, where these two methods show lower accuracies and F1 scores. For the emotion with moderate detection performance, <italic>Lack of Motivation</italic>, we find that MentalBERT achieves the highest consistency with the true labels, which is around 0.6, while the other Jaccard indices range from 0.22 to 0.57. This result highlights the capabilities of trainable LLMs. For the emotion with poor performance, <italic>Miscellaneous</italic>, every pairwise Jaccard index is below 0.1, indicating that none of the NLP methods, whether trainable or not, can capture the ambiguous concept of <italic>Miscellaneous</italic>.</p>
<fig id="j_nejsds105_fig_008">
<label>Figure 8</label>
<caption>
<p>The Jaccard indices between five NLP methods and the true labels for three typical emotions spanning different levels of detection performance.</p>
</caption>
<graphic xlink:href="nejsds105_g008.jpg"/>
</fig>
</sec>
<sec id="j_nejsds105_s_020">
<label>4.4</label>
<title>Discussion</title>
<p><bold>Performance and Complexity Trade-off:</bold> The NLP methods investigated in this study exhibit dramatically different levels of complexity. The Lexicon-based method requires learning scores for only dozens of keywords, while MentalBERT must fine-tune over 100 million parameters in its Transformer architecture [<xref ref-type="bibr" rid="j_nejsds105_ref_017">17</xref>]. These complexity differences translate into distinct performance patterns. The Lexicon-based method achieves stable performance across training sample sizes ranging from <inline-formula id="j_nejsds105_ineq_071"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula> to <inline-formula id="j_nejsds105_ineq_072"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula>, demonstrating the lowest standard deviations in both accuracy and F1 scores. However, its peak performance cannot compete with more sophisticated methods. In contrast, fine-tuned MentalBERT demonstrates the highest accuracy and F1 scores with <inline-formula id="j_nejsds105_ineq_073"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> training data and achieves the best Jaccard Index agreement with true labels. Yet its performance drops dramatically with limited training data (<inline-formula id="j_nejsds105_ineq_074"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% $]]></tex-math></alternatives></inline-formula>), and it exhibits the highest variability in repeated cross-validation experiments.</p>
<p>BoW and TF-IDF methods, both of which convert responses into numeric vectors before training traditional machine learning models, demonstrate balanced performance, complexity, and stability. Their methodological similarity is reflected in their relatively high pairwise Jaccard index. While TF-IDF achieves better AUC scores than BoW, indicating good distinguishing ability for challenging emotions, its performance declines more rapidly with reduced training data.</p>
<p>The zero-shot GPT method, implemented through OpenAI’s API, requires no training process and achieves performance comparable to BoW and TF-IDF models trained on <inline-formula id="j_nejsds105_ineq_075"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% $]]></tex-math></alternatives></inline-formula> of the data, though it underperforms compared to MentalBERT trained on <inline-formula id="j_nejsds105_ineq_076"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% $]]></tex-math></alternatives></inline-formula> of the data. Notably, Lossio-Ventura et al. [<xref ref-type="bibr" rid="j_nejsds105_ref_019">19</xref>] found that zero-shot ChatGPT outperformed fine-tuned Transformers in sentiment analysis for COVID-19 survey data. This apparent discrepancy likely stems from task complexity differences: sentiment analysis predicts general positive/negative sentiment, a more universal task that ChatGPT’s vast training data can handle effectively. In contrast, our fine-grained emotion detection requires distinguishing among ten mental health-related emotions, many specifically defined by our research team. Without access to labeled training data, the zero-shot GPT model cannot accurately detect these domain-specific emotional categories.</p>
<p><bold>Method Selection Suggestions:</bold> Based on our performance observations, we offer the following guidelines for NLP method selection. The Lexicon-based method proves particularly effective for detecting well-defined emotions with clear linguistic indicators, especially when training data is limited or stability is prioritized over peak performance. Fine-tuned MentalBERT is most suitable for detecting contextually complex emotions when sufficient training data (<inline-formula id="j_nejsds105_ineq_077"><alternatives><mml:math>
<mml:mo mathvariant="normal">&gt;</mml:mo>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$\gt 50\% $]]></tex-math></alternatives></inline-formula> of available samples) and computational resources are available. Traditional machine learning methods, such as BoW and TF-IDF, provide effective predictions when labeled data or computational resources are insufficient for Transformer models. Finally, zero-shot GPT can generate quick assessments when no training data is available, though performance will be limited for domain-specific emotions.</p>
<p><bold>Uncertainty in Mental Health Studies:</bold> When deploying NLP methods for emotion detection in mental health research, their inherent uncertainty must be carefully examined, as detection results can have serious consequences for both research conclusions and potential interventions. Uncertainty arises from multiple sources, beginning with the training dataset itself. As demonstrated by our experiments, most NLP methods show performance sensitivity to training size variations. Additionally, repeated cross-validation reveals that resampling the training dataset while maintaining the same sample size yields variable predictions, particularly for high-complexity models like fine-tuned MentalBERT. Therefore, sensitivity analysis for training sample size and cross-validation repetitions is essential for evaluating model stability.</p>
<p>A second source of uncertainty stems from the binarization of predicted probabilities. All four trainable methods output probabilities indicating the likelihood of emotion presence, with positive detection determined by a 0.5 threshold. However, a response with 0.99 prediction probability represents a different uncertainty level compared to one with 0.51 probability. In this study, we employed AUC to evaluate the distinguishing ability of NLP models based on predicted probabilities, and ROC curves can provide additional insights into model uncertainty characteristics.</p>
<p><bold>Emotion Labeling Impact:</bold> A crucial finding is that the target emotion significantly impacts NLP method performance. Figures <xref rid="j_nejsds105_fig_003">3</xref> and <xref rid="j_nejsds105_fig_005">5</xref> demonstrate that accuracy and stability measurements for the same method vary substantially across the ten emotions studied. Training sample size sensitivity also depends on the specific emotions being detected. Consequently, method comparisons yield different conclusions for different emotion types, as illustrated by our analysis of <italic>Depression</italic>, <italic>Lack of Motivation</italic>, and <italic>Miscellaneous</italic> categories. Such performance disparities across emotions can lead to inconsistent findings in studies relying on NLP detection results. While traditional mental health studies, such as [<xref ref-type="bibr" rid="j_nejsds105_ref_001">1</xref>], design emotion categories based on domain knowledge, the increasing role of NLP methods in data analysis necessitates careful selection and design of emotion categories to ensure both performance and stability of automated detection algorithms. For instance, <italic>Miscellaneous</italic>, a convenient category for human labelers, leads to poor performance for all NLP methods. Such categories should be avoided when incorporating NLP methods for data analysis.</p>
<p>We note that all four trainable methods can improve the model’s consistency in producing predictions that are similar to those of human labelers. Thus, the zero-shot GPT-3.5 performs relatively poorly compared to other methods when we use human labels as the “gold standard”. However, as pre-trained LLMs become more powerful, their predictions could be more valuable when the quality of human labels cannot be ensured. Collaboration between LLMs and human experts can be beneficial for mental health research.</p>
<p><bold>Multi-label Classification:</bold> There is a body of machine learning research on multi-label classification [<xref ref-type="bibr" rid="j_nejsds105_ref_003">3</xref>, <xref ref-type="bibr" rid="j_nejsds105_ref_040">40</xref>]. These studies found that by adopting specialized methods, such as problem transformation and algorithm selection, we can capture the inner structure of the labels to improve accuracy. In Figure <xref rid="j_nejsds105_fig_002">2</xref>, there are weak associations among our ten emotions. For example, <italic>No/Positive Effects</italic> has <inline-formula id="j_nejsds105_ineq_078"><alternatives><mml:math>
<mml:mo>−</mml:mo>
<mml:mn>0.20</mml:mn>
<mml:mo stretchy="false">∼</mml:mo>
<mml:mo>−</mml:mo>
<mml:mn>0.03</mml:mn></mml:math><tex-math><![CDATA[$-0.20\sim -0.03$]]></tex-math></alternatives></inline-formula> correlations with the other nine emotions. Employing multi-label classification to improve the efficiency of emotion detection would be an interesting future study.</p>
</sec>
</sec>
<sec id="j_nejsds105_s_021">
<label>5</label>
<title>Conclusion</title>
<p>This paper presents a comprehensive comparative study of NLP methods for detecting fine-grained emotions in college student responses regarding their mental health during the COVID-19 pandemic. We evaluated five distinct approaches: Lexicon, BoW, TF-IDF, fine-tuned MentalBERT, and zero-shot GPT, examining their performance, training sample size sensitivity, stability, distinguishing ability, and inter-method consistency. Our experimental results reveal performance-complexity trade-offs among NLP methods and provide evidence-based guidelines for method selection. We demonstrate the critical importance of recognizing uncertainty inherent in NLP detections and emphasize the need for careful emotion category design to ensure detection quality. Our insights bridge a critical gap in NLP analysis between data science and mental health studies, utilizing survey data with various applications.</p>
<p>This work establishes a foundation for future NLP development in mental health survey research through several promising directions. First, hybrid or mixture-of-experts frameworks could be designed to balance performance-complexity trade-offs by selecting appropriate models based on emotion type and available training sample size, thereby providing stable detection results across diverse conditions. Second, uncertainty-aware algorithms could be developed based on our analytical framework, incorporating prediction probabilities, cross-validation standard deviations, and inter-method consistency scores to generate uncertainty estimates. In mental health applications, such systems could restrict automated decisions to low-uncertainty cases while flagging high-uncertainty responses for human review. Finally, our findings highlight the need for developing emotion categories that balance mental-health insights with computational detectability, potentially through collaborative efforts between domain experts and NLP researchers.</p>
</sec>
</body>
<back>
<app-group>
<app id="j_nejsds105_app_001"><label>Appendix A</label>
<title>Labeling Criteria for Ten Emotions</title>
<p>Table <xref rid="j_nejsds105_tab_003">3</xref> gives an example for each emotion in our labeling process. Most of these emotions are self-explanatory, except the last three. We list our labeling criteria here:</p>
<list>
<list-item id="j_nejsds105_li_009">
<label>•</label>
<p><italic>Negative Feelings</italic> include fear, grief or sorrow, sadness, hopelessness, lack of purpose or control;</p>
</list-item>
<list-item id="j_nejsds105_li_010">
<label>•</label>
<p><italic>All Stress</italic> includes stress or worry related to academics, finances and jobs, health, or general reasons;</p>
</list-item>
<list-item id="j_nejsds105_li_011">
<label>•</label>
<p><italic>Miscellaneous</italic> includes miscellaneous mental health issues, such as self-harm, substance abuse, trauma, eating disorders, sleep issues, etc.</p>
</list-item>
</list> 
<table-wrap id="j_nejsds105_tab_003">
<label>Table 3</label>
<caption>
<p>Examples of the 10 emotions in manual labeling in our dataset.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: center; border-top: solid thin; border-bottom: solid thin"><bold>Emotions affecting mental health</bold></td>
<td style="vertical-align: middle; text-align: left; border-top: solid thin; border-bottom: solid thin"><bold>Sample of positive responses</bold></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">Isolation</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“I’m extroverted and the isolation is very taxing.”</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">Depression</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“I am deeply depressed from watching the world collapse and feeling so helpless and useless.”</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">Anxiety</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“I had general anxiety even before the pandemic, so this has just been adding to it.”</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">Issues With Home Life</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“Being away from campus has taken my independence away which has taken a toll on me.”</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">Lack of Routine</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“I experience a lack of routine or structure due to the coronavirus.”</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">Lack of Motivation</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“The lack of a concrete schedule from not attending classes and extracurricular activities has distorted the passage of time and days feel much longer than they should be.”</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">No/Positive Effects</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“Giving me time to really focus on myself and develop new hobbies.”</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">Negative Feelings</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“I constantly have panic attacks or moments of sadness.”</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">All Stress</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“I feel like I am constantly stressed about me or my family contracting it, and it worries me because I care about my health, but even more about their health.”</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: center; border-bottom: solid thin">Miscellaneous</td>
<td style="vertical-align: middle; text-align: left; border-bottom: solid thin">“This situation has caused me to struggle even more with my recovery from an eating disorder.”</td>
</tr>
</tbody>
</table>
</table-wrap> 
<table-wrap id="j_nejsds105_tab_004">
<label>Table 4</label>
<caption>
<p>The accuracy and F1 score of each method with <inline-formula id="j_nejsds105_ineq_079"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi>
<mml:mo mathvariant="normal" stretchy="false">/</mml:mo>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% /20\% $]]></tex-math></alternatives></inline-formula> training/testing splitting.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"/>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Isolation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Depression</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Anxiety</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Issues With Home Life</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Routine</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>Lexicon</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.793</td>
<td style="vertical-align: top; text-align: justify">0.990</td>
<td style="vertical-align: top; text-align: justify">0.972</td>
<td style="vertical-align: top; text-align: justify">0.852</td>
<td style="vertical-align: top; text-align: justify">0.946</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.693</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.967</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.937</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.282</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.211</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>BoW</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.799</td>
<td style="vertical-align: top; text-align: justify">0.982</td>
<td style="vertical-align: top; text-align: justify">0.979</td>
<td style="vertical-align: top; text-align: justify">0.850</td>
<td style="vertical-align: top; text-align: justify">0.957</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.748</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.942</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.953</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.459</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.524</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>TF-IDF</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.817</td>
<td style="vertical-align: top; text-align: justify">0.944</td>
<td style="vertical-align: top; text-align: justify">0.918</td>
<td style="vertical-align: top; text-align: justify">0.847</td>
<td style="vertical-align: top; text-align: justify">0.956</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.758</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.794</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.793</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.441</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.467</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>MentalBERT</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.833</td>
<td style="vertical-align: top; text-align: justify">0.980</td>
<td style="vertical-align: top; text-align: justify">0.967</td>
<td style="vertical-align: top; text-align: justify">0.860</td>
<td style="vertical-align: top; text-align: justify">0.953</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.797</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.942</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.929</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.470</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.461</td>
</tr>
</tbody>
</table>
</table-wrap>
</app>
<app id="j_nejsds105_app_002"><label>Appendix B</label>
<title>Prompts for GPT-3.5</title>
<p>Using OpenAI’s API, we first write the following prompt:</p><graphic xlink:href="nejsds105_g009.jpg"/> 
<p>where <monospace>response</monospace> is a student’s response <italic>r</italic> in the survey. We then send the message to GPT-3.5:</p><graphic xlink:href="nejsds105_g010.jpg"/> 
<p>After receiving the answer from GPT-3.5, we will check whether it includes each emotion <inline-formula id="j_nejsds105_ineq_080"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub></mml:math><tex-math><![CDATA[${\textbf{E}_{j}}$]]></tex-math></alternatives></inline-formula>. If so, the corresponding detection <inline-formula id="j_nejsds105_ineq_081"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo></mml:math><tex-math><![CDATA[${\hat{y}_{r}}({\textbf{E}_{j}})$]]></tex-math></alternatives></inline-formula> will be set to 1; otherwise <inline-formula id="j_nejsds105_ineq_082"><alternatives><mml:math>
<mml:msub>
<mml:mrow>
<mml:mover accent="true">
<mml:mrow>
<mml:mi mathvariant="italic">y</mml:mi>
</mml:mrow>
<mml:mo stretchy="false">ˆ</mml:mo></mml:mover>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">r</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">(</mml:mo>
<mml:msub>
<mml:mrow>
<mml:mtext mathvariant="bold">E</mml:mtext>
</mml:mrow>
<mml:mrow>
<mml:mi mathvariant="italic">j</mml:mi>
</mml:mrow>
</mml:msub>
<mml:mo mathvariant="normal" fence="true" stretchy="false">)</mml:mo>
<mml:mo>=</mml:mo>
<mml:mn>0</mml:mn></mml:math><tex-math><![CDATA[${\hat{y}_{r}}({\textbf{E}_{j}})=0$]]></tex-math></alternatives></inline-formula>.</p></app>
<app id="j_nejsds105_app_003"><label>Appendix C</label>
<title>Original Results</title>
<sec id="j_nejsds105_s_022">
<label>C.1</label>
<title>Accuracy and F1 Scores with Various Training Sample Sizes</title>
<p>For the four trainable NLP methods, the accuracy and F1 scores on the testing dataset with various training sample sizes for the ten emotions are listed in Tables <xref rid="j_nejsds105_tab_004">4</xref> and <xref rid="j_nejsds105_tab_005">5</xref> (<inline-formula id="j_nejsds105_ineq_083"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi>
<mml:mo mathvariant="normal" stretchy="false">/</mml:mo>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% /20\% $]]></tex-math></alternatives></inline-formula> training/testing), Tables <xref rid="j_nejsds105_tab_006">6</xref> and <xref rid="j_nejsds105_tab_007">7</xref> (<inline-formula id="j_nejsds105_ineq_084"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi>
<mml:mo mathvariant="normal" stretchy="false">/</mml:mo>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% /50\% $]]></tex-math></alternatives></inline-formula> training/testing), Tables <xref rid="j_nejsds105_tab_008">8</xref> and <xref rid="j_nejsds105_tab_009">9</xref> (<inline-formula id="j_nejsds105_ineq_085"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi>
<mml:mo mathvariant="normal" stretchy="false">/</mml:mo>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% /80\% $]]></tex-math></alternatives></inline-formula> training/testing). The accuracy and F1 scores of the zero-shot GPT are listed in Table <xref rid="j_nejsds105_tab_010">10</xref>. We repeat the splitting 100 times and report the average of each performance metric.</p>
<table-wrap id="j_nejsds105_tab_005">
<label>Table 5</label>
<caption>
<p>The accuracy and F1 score of each method with <inline-formula id="j_nejsds105_ineq_086"><alternatives><mml:math>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi>
<mml:mo mathvariant="normal" stretchy="false">/</mml:mo>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$80\% /20\% $]]></tex-math></alternatives></inline-formula> training/testing splitting.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"/>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Motivation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>No/Positive Effects</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Negative Feelings</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Miscellaneous</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>All Stress</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>Lexicon</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.916</td>
<td style="vertical-align: top; text-align: justify">0.873</td>
<td style="vertical-align: top; text-align: justify">0.803</td>
<td style="vertical-align: top; text-align: justify">0.938</td>
<td style="vertical-align: top; text-align: justify">0.828</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.639</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.030</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.344</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.000</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.551</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>BoW</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.905</td>
<td style="vertical-align: top; text-align: justify">0.886</td>
<td style="vertical-align: top; text-align: justify">0.749</td>
<td style="vertical-align: top; text-align: justify">0.922</td>
<td style="vertical-align: top; text-align: justify">0.813</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.619</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.353</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.391</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.071</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.557</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>TF-IDF</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.900</td>
<td style="vertical-align: top; text-align: justify">0.890</td>
<td style="vertical-align: top; text-align: justify">0.757</td>
<td style="vertical-align: top; text-align: justify">0.929</td>
<td style="vertical-align: top; text-align: justify">0.805</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.583</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.395</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.418</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.125</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.531</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>MentalBERT</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.933</td>
<td style="vertical-align: top; text-align: justify">0.944</td>
<td style="vertical-align: top; text-align: justify">0.780</td>
<td style="vertical-align: top; text-align: justify">0.929</td>
<td style="vertical-align: top; text-align: justify">0.851</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.768</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.749</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.431</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.091</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.770</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="j_nejsds105_tab_006">
<label>Table 6</label>
<caption>
<p>The accuracy and F1 score of each method with <inline-formula id="j_nejsds105_ineq_087"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi>
<mml:mo mathvariant="normal" stretchy="false">/</mml:mo>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% /50\% $]]></tex-math></alternatives></inline-formula> training/testing splitting.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"/>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Isolation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Depression</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Anxiety</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Issues With Home Life</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Routine</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>Lexicon</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.771</td>
<td style="vertical-align: top; text-align: justify">0.990</td>
<td style="vertical-align: top; text-align: justify">0.973</td>
<td style="vertical-align: top; text-align: justify">0.846</td>
<td style="vertical-align: top; text-align: justify">0.944</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.658</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.970</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.942</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.227</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.205</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>BoW</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.767</td>
<td style="vertical-align: top; text-align: justify">0.978</td>
<td style="vertical-align: top; text-align: justify">0.974</td>
<td style="vertical-align: top; text-align: justify">0.849</td>
<td style="vertical-align: top; text-align: justify">0.954</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.706</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.930</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.943</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.425</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.500</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>TF-IDF</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.789</td>
<td style="vertical-align: top; text-align: justify">0.933</td>
<td style="vertical-align: top; text-align: justify">0.898</td>
<td style="vertical-align: top; text-align: justify">0.846</td>
<td style="vertical-align: top; text-align: justify">0.954</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.717</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.753</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.737</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.389</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.439</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>MentalBERT</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.805</td>
<td style="vertical-align: top; text-align: justify">0.976</td>
<td style="vertical-align: top; text-align: justify">0.962</td>
<td style="vertical-align: top; text-align: justify">0.855</td>
<td style="vertical-align: top; text-align: justify">0.948</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.762</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.927</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.917</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.092</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.245</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="j_nejsds105_tab_007">
<label>Table 7</label>
<caption>
<p>The accuracy and F1 score of each method with <inline-formula id="j_nejsds105_ineq_088"><alternatives><mml:math>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi>
<mml:mo mathvariant="normal" stretchy="false">/</mml:mo>
<mml:mn>50</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$50\% /50\% $]]></tex-math></alternatives></inline-formula> training/testing splitting.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"/>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Motivation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>No/Positive Effects</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Negative Feelings</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Miscellaneous</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>All Stress</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>Lexicon</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.913</td>
<td style="vertical-align: top; text-align: justify">0.872</td>
<td style="vertical-align: top; text-align: justify">0.793</td>
<td style="vertical-align: top; text-align: justify">0.936</td>
<td style="vertical-align: top; text-align: justify">0.827</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.619</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.039</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.280</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.001</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.531</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>BoW</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.889</td>
<td style="vertical-align: top; text-align: justify">0.878</td>
<td style="vertical-align: top; text-align: justify">0.750</td>
<td style="vertical-align: top; text-align: justify">0.928</td>
<td style="vertical-align: top; text-align: justify">0.798</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.543</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.298</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.376</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.067</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.503</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>TF-IDF</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.884</td>
<td style="vertical-align: top; text-align: justify">0.888</td>
<td style="vertical-align: top; text-align: justify">0.758</td>
<td style="vertical-align: top; text-align: justify">0.933</td>
<td style="vertical-align: top; text-align: justify">0.796</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.496</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.339</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.357</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.082</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.483</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>MentalBERT</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.918</td>
<td style="vertical-align: top; text-align: justify">0.929</td>
<td style="vertical-align: top; text-align: justify">0.767</td>
<td style="vertical-align: top; text-align: justify">0.936</td>
<td style="vertical-align: top; text-align: justify">0.829</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.699</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.637</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.336</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.023</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.730</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="j_nejsds105_tab_008">
<label>Table 8</label>
<caption>
<p>The accuracy and F1 score of each method with <inline-formula id="j_nejsds105_ineq_089"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi>
<mml:mo mathvariant="normal" stretchy="false">/</mml:mo>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% /80\% $]]></tex-math></alternatives></inline-formula> training/testing splitting.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"/>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Isolation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Depression</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Anxiety</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Issues With Home Life</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Routine</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>Lexicon</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.720</td>
<td style="vertical-align: top; text-align: justify">0.988</td>
<td style="vertical-align: top; text-align: justify">0.958</td>
<td style="vertical-align: top; text-align: justify">0.838</td>
<td style="vertical-align: top; text-align: justify">NA</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.546</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.960</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.894</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.141</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">NA</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>BoW</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.720</td>
<td style="vertical-align: top; text-align: justify">0.943</td>
<td style="vertical-align: top; text-align: justify">0.947</td>
<td style="vertical-align: top; text-align: justify">0.843</td>
<td style="vertical-align: top; text-align: justify">0.948</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.621</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.793</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.874</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.302</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.283</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>TF-IDF</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.728</td>
<td style="vertical-align: top; text-align: justify">0.890</td>
<td style="vertical-align: top; text-align: justify">0.858</td>
<td style="vertical-align: top; text-align: justify">0.841</td>
<td style="vertical-align: top; text-align: justify">NA</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.607</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.529</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.576</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.187</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">NA</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>MentalBERT</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.701</td>
<td style="vertical-align: top; text-align: justify">0.840</td>
<td style="vertical-align: top; text-align: justify">0.812</td>
<td style="vertical-align: top; text-align: justify">0.940</td>
<td style="vertical-align: top; text-align: justify">0.941</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.591</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.107</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.342</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.035</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.000</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="j_nejsds105_tab_009">
<label>Table 9</label>
<caption>
<p>The accuracy and F1 score of each method with <inline-formula id="j_nejsds105_ineq_090"><alternatives><mml:math>
<mml:mn>20</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi>
<mml:mo mathvariant="normal" stretchy="false">/</mml:mo>
<mml:mn>80</mml:mn>
<mml:mi mathvariant="normal">%</mml:mi></mml:math><tex-math><![CDATA[$20\% /80\% $]]></tex-math></alternatives></inline-formula> training/testing splitting.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"/>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Motivation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>No/Positive Effects</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Negative Feelings</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Miscellaneous</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>All Stress</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>Lexicon</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.896</td>
<td style="vertical-align: top; text-align: justify">0.866</td>
<td style="vertical-align: top; text-align: justify">0.772</td>
<td style="vertical-align: top; text-align: justify">NA</td>
<td style="vertical-align: top; text-align: justify">0.814</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.515</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.042</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.158</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">NA</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.463</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>BoW</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.857</td>
<td style="vertical-align: top; text-align: justify">0.872</td>
<td style="vertical-align: top; text-align: justify">0.752</td>
<td style="vertical-align: top; text-align: justify">0.935</td>
<td style="vertical-align: top; text-align: justify">0.785</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.311</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.104</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.299</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.031</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.401</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>TF-IDF</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.854</td>
<td style="vertical-align: top; text-align: justify">NA</td>
<td style="vertical-align: top; text-align: justify">0.758</td>
<td style="vertical-align: top; text-align: justify">NA</td>
<td style="vertical-align: top; text-align: justify">0.772</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.222</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">NA</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.216</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">NA</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.305</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>MentalBERT</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify">Accuracy</td>
<td style="vertical-align: top; text-align: justify">0.848</td>
<td style="vertical-align: top; text-align: justify">0.878</td>
<td style="vertical-align: top; text-align: justify">0.765</td>
<td style="vertical-align: top; text-align: justify">0.940</td>
<td style="vertical-align: top; text-align: justify">0.715</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.038</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.047</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.032</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.000</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.383</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="j_nejsds105_tab_010">
<label>Table 10</label>
<caption>
<p>The accuracy and F1 score of the zero-shot GPT method.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"/>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Isolation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Depression</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Anxiety</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Issues With Home Life</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Routine</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>GPT</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>Accuracy</bold></td>
<td style="vertical-align: top; text-align: justify">0.788</td>
<td style="vertical-align: top; text-align: justify">0.861</td>
<td style="vertical-align: top; text-align: justify">0.827</td>
<td style="vertical-align: top; text-align: justify">0.827</td>
<td style="vertical-align: top; text-align: justify">0.832</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><bold>F1</bold></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.782</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.708</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.717</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.523</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.367</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"/>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><italic>Lack of Motivation</italic></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><italic>No/Positive Effects</italic></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><italic>Negative Feelings</italic></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><italic>Miscellaneous</italic></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><italic>All Stress</italic></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>GPT</bold></td>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
<td style="vertical-align: top; text-align: justify"/>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify"><bold>Accuracy</bold></td>
<td style="vertical-align: top; text-align: justify">0.842</td>
<td style="vertical-align: top; text-align: justify">0.891</td>
<td style="vertical-align: top; text-align: justify">0.686</td>
<td style="vertical-align: top; text-align: justify">0.939</td>
<td style="vertical-align: top; text-align: justify">0.725</td>
</tr>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><bold>F1</bold></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.575</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.505</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.31</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.577</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="j_nejsds105_tab_011">
<label>Table 11</label>
<caption>
<p>The standard deviations of the accuracy and F1 scores obtained from 100 repetitions of five-fold cross-validation for the four trainable NLP methods.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><bold>5-fold Cross Validation</bold></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Isolation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Depression</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Anxiety</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Issues With Home Life</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Routine</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Motivation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>No/Positive Effects</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Negative Feelings</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Miscellaneous</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>All Stress</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td colspan="11" style="vertical-align: top; text-align: center; border-bottom: solid thin"><bold>Lexicon</bold></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">Accuracy</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_091"><alternatives><mml:math>
<mml:mn>0.793</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.010</mml:mn></mml:math><tex-math><![CDATA[$0.793\pm 0.010$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_092"><alternatives><mml:math>
<mml:mn>0.990</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.000</mml:mn></mml:math><tex-math><![CDATA[$0.990\pm 0.000$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_093"><alternatives><mml:math>
<mml:mn>0.976</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.000</mml:mn></mml:math><tex-math><![CDATA[$0.976\pm 0.000$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_094"><alternatives><mml:math>
<mml:mn>0.852</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.006</mml:mn></mml:math><tex-math><![CDATA[$0.852\pm 0.006$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_095"><alternatives><mml:math>
<mml:mn>0.944</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.003</mml:mn></mml:math><tex-math><![CDATA[$0.944\pm 0.003$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_096"><alternatives><mml:math>
<mml:mn>0.915</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.006</mml:mn></mml:math><tex-math><![CDATA[$0.915\pm 0.006$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_097"><alternatives><mml:math>
<mml:mn>0.871</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.004</mml:mn></mml:math><tex-math><![CDATA[$0.871\pm 0.004$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_098"><alternatives><mml:math>
<mml:mn>0.802</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.008</mml:mn></mml:math><tex-math><![CDATA[$0.802\pm 0.008$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_099"><alternatives><mml:math>
<mml:mn>0.938</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.002</mml:mn></mml:math><tex-math><![CDATA[$0.938\pm 0.002$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_100"><alternatives><mml:math>
<mml:mn>0.831</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.011</mml:mn></mml:math><tex-math><![CDATA[$0.831\pm 0.011$]]></tex-math></alternatives></inline-formula></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_101"><alternatives><mml:math>
<mml:mn>0.696</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.017</mml:mn></mml:math><tex-math><![CDATA[$0.696\pm 0.017$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_102"><alternatives><mml:math>
<mml:mn>0.971</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.001</mml:mn></mml:math><tex-math><![CDATA[$0.971\pm 0.001$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_103"><alternatives><mml:math>
<mml:mn>0.947</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.000</mml:mn></mml:math><tex-math><![CDATA[$0.947\pm 0.000$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_104"><alternatives><mml:math>
<mml:mn>0.275</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.041</mml:mn></mml:math><tex-math><![CDATA[$0.275\pm 0.041$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_105"><alternatives><mml:math>
<mml:mn>0.202</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.072</mml:mn></mml:math><tex-math><![CDATA[$0.202\pm 0.072$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_106"><alternatives><mml:math>
<mml:mn>0.633</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.032</mml:mn></mml:math><tex-math><![CDATA[$0.633\pm 0.032$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_107"><alternatives><mml:math>
<mml:mn>0.037</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.031</mml:mn></mml:math><tex-math><![CDATA[$0.037\pm 0.031$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_108"><alternatives><mml:math>
<mml:mn>0.335</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.039</mml:mn></mml:math><tex-math><![CDATA[$0.335\pm 0.039$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_109"><alternatives><mml:math>
<mml:mn>0.000</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.000</mml:mn></mml:math><tex-math><![CDATA[$0.000\pm 0.000$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_110"><alternatives><mml:math>
<mml:mn>0.555</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.041</mml:mn></mml:math><tex-math><![CDATA[$0.555\pm 0.041$]]></tex-math></alternatives></inline-formula></td>
</tr>
</tbody><tbody>
<tr>
<td colspan="11" style="vertical-align: top; text-align: center; border-bottom: solid thin"><bold>BoW</bold></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">Accuracy</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_111"><alternatives><mml:math>
<mml:mn>0.797</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.011</mml:mn></mml:math><tex-math><![CDATA[$0.797\pm 0.011$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_112"><alternatives><mml:math>
<mml:mn>0.982</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.002</mml:mn></mml:math><tex-math><![CDATA[$0.982\pm 0.002$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_113"><alternatives><mml:math>
<mml:mn>0.977</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.001</mml:mn></mml:math><tex-math><![CDATA[$0.977\pm 0.001$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_114"><alternatives><mml:math>
<mml:mn>0.851</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.009</mml:mn></mml:math><tex-math><![CDATA[$0.851\pm 0.009$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_115"><alternatives><mml:math>
<mml:mn>0.958</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.003</mml:mn></mml:math><tex-math><![CDATA[$0.958\pm 0.003$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_116"><alternatives><mml:math>
<mml:mn>0.901</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.007</mml:mn></mml:math><tex-math><![CDATA[$0.901\pm 0.007$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_117"><alternatives><mml:math>
<mml:mn>0.889</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.007</mml:mn></mml:math><tex-math><![CDATA[$0.889\pm 0.007$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_118"><alternatives><mml:math>
<mml:mn>0.751</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.012</mml:mn></mml:math><tex-math><![CDATA[$0.751\pm 0.012$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_119"><alternatives><mml:math>
<mml:mn>0.922</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.006</mml:mn></mml:math><tex-math><![CDATA[$0.922\pm 0.006$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_120"><alternatives><mml:math>
<mml:mn>0.813</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.010</mml:mn></mml:math><tex-math><![CDATA[$0.813\pm 0.010$]]></tex-math></alternatives></inline-formula></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_121"><alternatives><mml:math>
<mml:mn>0.748</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.014</mml:mn></mml:math><tex-math><![CDATA[$0.748\pm 0.014$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_122"><alternatives><mml:math>
<mml:mn>0.944</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.005</mml:mn></mml:math><tex-math><![CDATA[$0.944\pm 0.005$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_123"><alternatives><mml:math>
<mml:mn>0.949</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.003</mml:mn></mml:math><tex-math><![CDATA[$0.949\pm 0.003$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_124"><alternatives><mml:math>
<mml:mn>0.468</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.033</mml:mn></mml:math><tex-math><![CDATA[$0.468\pm 0.033$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_125"><alternatives><mml:math>
<mml:mn>0.567</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.038</mml:mn></mml:math><tex-math><![CDATA[$0.567\pm 0.038$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_126"><alternatives><mml:math>
<mml:mn>0.618</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.028</mml:mn></mml:math><tex-math><![CDATA[$0.618\pm 0.028$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_127"><alternatives><mml:math>
<mml:mn>0.403</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.040</mml:mn></mml:math><tex-math><![CDATA[$0.403\pm 0.040$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_128"><alternatives><mml:math>
<mml:mn>0.398</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.028</mml:mn></mml:math><tex-math><![CDATA[$0.398\pm 0.028$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_129"><alternatives><mml:math>
<mml:mn>0.091</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.045</mml:mn></mml:math><tex-math><![CDATA[$0.091\pm 0.045$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_130"><alternatives><mml:math>
<mml:mn>0.562</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.026</mml:mn></mml:math><tex-math><![CDATA[$0.562\pm 0.026$]]></tex-math></alternatives></inline-formula></td>
</tr>
</tbody><tbody>
<tr>
<td colspan="11" style="vertical-align: top; text-align: center; border-bottom: solid thin"><bold>TF-IDF</bold></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">Accuracy</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_131"><alternatives><mml:math>
<mml:mn>0.818</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.011</mml:mn></mml:math><tex-math><![CDATA[$0.818\pm 0.011$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_132"><alternatives><mml:math>
<mml:mn>0.943</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.003</mml:mn></mml:math><tex-math><![CDATA[$0.943\pm 0.003$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_133"><alternatives><mml:math>
<mml:mn>0.916</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.005</mml:mn></mml:math><tex-math><![CDATA[$0.916\pm 0.005$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_134"><alternatives><mml:math>
<mml:mn>0.847</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.008</mml:mn></mml:math><tex-math><![CDATA[$0.847\pm 0.008$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_135"><alternatives><mml:math>
<mml:mn>0.957</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.003</mml:mn></mml:math><tex-math><![CDATA[$0.957\pm 0.003$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_136"><alternatives><mml:math>
<mml:mn>0.900</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.008</mml:mn></mml:math><tex-math><![CDATA[$0.900\pm 0.008$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_137"><alternatives><mml:math>
<mml:mn>0.891</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.006</mml:mn></mml:math><tex-math><![CDATA[$0.891\pm 0.006$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_138"><alternatives><mml:math>
<mml:mn>0.759</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.011</mml:mn></mml:math><tex-math><![CDATA[$0.759\pm 0.011$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_139"><alternatives><mml:math>
<mml:mn>0.930</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.004</mml:mn></mml:math><tex-math><![CDATA[$0.930\pm 0.004$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_140"><alternatives><mml:math>
<mml:mn>0.805</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.009</mml:mn></mml:math><tex-math><![CDATA[$0.805\pm 0.009$]]></tex-math></alternatives></inline-formula></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_141"><alternatives><mml:math>
<mml:mn>0.761</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.016</mml:mn></mml:math><tex-math><![CDATA[$0.761\pm 0.016$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_142"><alternatives><mml:math>
<mml:mn>0.802</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.013</mml:mn></mml:math><tex-math><![CDATA[$0.802\pm 0.013$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_143"><alternatives><mml:math>
<mml:mn>0.793</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.015</mml:mn></mml:math><tex-math><![CDATA[$0.793\pm 0.015$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_144"><alternatives><mml:math>
<mml:mn>0.458</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.024</mml:mn></mml:math><tex-math><![CDATA[$0.458\pm 0.024$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_145"><alternatives><mml:math>
<mml:mn>0.511</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.030</mml:mn></mml:math><tex-math><![CDATA[$0.511\pm 0.030$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_146"><alternatives><mml:math>
<mml:mn>0.600</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.033</mml:mn></mml:math><tex-math><![CDATA[$0.600\pm 0.033$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_147"><alternatives><mml:math>
<mml:mn>0.402</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.039</mml:mn></mml:math><tex-math><![CDATA[$0.402\pm 0.039$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_148"><alternatives><mml:math>
<mml:mn>0.428</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.026</mml:mn></mml:math><tex-math><![CDATA[$0.428\pm 0.026$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_149"><alternatives><mml:math>
<mml:mn>0.143</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.036</mml:mn></mml:math><tex-math><![CDATA[$0.143\pm 0.036$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_150"><alternatives><mml:math>
<mml:mn>0.541</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.022</mml:mn></mml:math><tex-math><![CDATA[$0.541\pm 0.022$]]></tex-math></alternatives></inline-formula></td>
</tr>
</tbody><tbody>
<tr>
<td colspan="11" style="vertical-align: top; text-align: center; border-bottom: solid thin"><bold>MentalBERT</bold></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">Accuracy</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_151"><alternatives><mml:math>
<mml:mn>0.822</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.009</mml:mn></mml:math><tex-math><![CDATA[$0.822\pm 0.009$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_152"><alternatives><mml:math>
<mml:mn>0.981</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.005</mml:mn></mml:math><tex-math><![CDATA[$0.981\pm 0.005$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_153"><alternatives><mml:math>
<mml:mn>0.967</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.005</mml:mn></mml:math><tex-math><![CDATA[$0.967\pm 0.005$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_154"><alternatives><mml:math>
<mml:mn>0.865</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.009</mml:mn></mml:math><tex-math><![CDATA[$0.865\pm 0.009$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_155"><alternatives><mml:math>
<mml:mn>0.954</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.005</mml:mn></mml:math><tex-math><![CDATA[$0.954\pm 0.005$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_156"><alternatives><mml:math>
<mml:mn>0.930</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.010</mml:mn></mml:math><tex-math><![CDATA[$0.930\pm 0.010$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_157"><alternatives><mml:math>
<mml:mn>0.942</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.007</mml:mn></mml:math><tex-math><![CDATA[$0.942\pm 0.007$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_158"><alternatives><mml:math>
<mml:mn>0.783</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.011</mml:mn></mml:math><tex-math><![CDATA[$0.783\pm 0.011$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_159"><alternatives><mml:math>
<mml:mn>0.934</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.007</mml:mn></mml:math><tex-math><![CDATA[$0.934\pm 0.007$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_160"><alternatives><mml:math>
<mml:mn>0.853</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.012</mml:mn></mml:math><tex-math><![CDATA[$0.853\pm 0.012$]]></tex-math></alternatives></inline-formula></td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">F1</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_161"><alternatives><mml:math>
<mml:mn>0.789</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.012</mml:mn></mml:math><tex-math><![CDATA[$0.789\pm 0.012$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_162"><alternatives><mml:math>
<mml:mn>0.943</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.013</mml:mn></mml:math><tex-math><![CDATA[$0.943\pm 0.013$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_163"><alternatives><mml:math>
<mml:mn>0.929</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.011</mml:mn></mml:math><tex-math><![CDATA[$0.929\pm 0.011$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_164"><alternatives><mml:math>
<mml:mn>0.503</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.046</mml:mn></mml:math><tex-math><![CDATA[$0.503\pm 0.046$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_165"><alternatives><mml:math>
<mml:mn>0.471</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.070</mml:mn></mml:math><tex-math><![CDATA[$0.471\pm 0.070$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_166"><alternatives><mml:math>
<mml:mn>0.765</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.027</mml:mn></mml:math><tex-math><![CDATA[$0.765\pm 0.027$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_167"><alternatives><mml:math>
<mml:mn>0.741</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.032</mml:mn></mml:math><tex-math><![CDATA[$0.741\pm 0.032$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_168"><alternatives><mml:math>
<mml:mn>0.456</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.037</mml:mn></mml:math><tex-math><![CDATA[$0.456\pm 0.037$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_169"><alternatives><mml:math>
<mml:mn>0.159</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.078</mml:mn></mml:math><tex-math><![CDATA[$0.159\pm 0.078$]]></tex-math></alternatives></inline-formula></td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin"><inline-formula id="j_nejsds105_ineq_170"><alternatives><mml:math>
<mml:mn>0.776</mml:mn>
<mml:mo>±</mml:mo>
<mml:mn>0.019</mml:mn></mml:math><tex-math><![CDATA[$0.776\pm 0.019$]]></tex-math></alternatives></inline-formula></td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="j_nejsds105_s_023">
<label>C.2</label>
<title>Stability and Distinguishing Ability</title>
<p>Table <xref rid="j_nejsds105_tab_011">11</xref> shows the standard deviations of the accuracy and F1 scores obtained from 100 repetitions of five-fold cross-validation for the four trainable NLP methods. Table <xref rid="j_nejsds105_tab_012">12</xref> lists the average area under the ROC curve (AUC) obtained from the stratified cross-validation for the four trainable NLP methods.</p>
<table-wrap id="j_nejsds105_tab_012">
<label>Table 12</label>
<caption>
<p>The average area under the ROC curve (AUC) obtained from the first five-fold cross-validation for the four trainable NLP methods.</p>
</caption>
<table>
<thead>
<tr>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"/>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Isolation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Depression</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Anxiety</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Issues With Home Life</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Routine</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Lack of Motivation</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>No/ Positive Effects</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Negative Feelings</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>Miscellaneous</italic></td>
<td style="vertical-align: top; text-align: justify; border-top: solid thin; border-bottom: solid thin"><italic>All Stress</italic></td>
</tr>
</thead>
<tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">Lexicon</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.855</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.977</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.965</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.843</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.767</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.829</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.631</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.714</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.487</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.813</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">BoW</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.860</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.960</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.980</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.810</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.830</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.850</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.770</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.670</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.630</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.790</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">TF-IDF</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.880</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.950</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.970</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.840</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.860</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.880</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.810</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.720</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.700</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.830</td>
</tr>
</tbody><tbody>
<tr>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">MentalBERT</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.820</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.970</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.960</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.690</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.670</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.850</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.820</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.650</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.550</td>
<td style="vertical-align: top; text-align: justify; border-bottom: solid thin">0.830</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="j_nejsds105_s_024">
<label>C.3</label>
<title>Pairwise Consistency</title>
<p>Pairwise consistency between the five NLP methods and the true labels for each emotion is shown in Figure <xref rid="j_nejsds105_fig_009">9</xref>.</p>
<fig id="j_nejsds105_fig_009">
<label>Figure 9</label>
<caption>
<p>The pairwise comparison between the five NLP methods and the true labels for the ten emotions.</p>
</caption>
<graphic xlink:href="nejsds105_g011.jpg"/>
</fig>
</sec>
</app></app-group>
<ack id="j_nejsds105_ack_001">
<title>Acknowledgements</title>
<p>The authors thank Alexis West and Afton White from Virginia Commonwealth University for categorizing emotions to produce human labeling results.</p></ack>
<ref-list id="j_nejsds105_reflist_001">
<title>References</title>
<ref id="j_nejsds105_ref_001">
<label>[1]</label><mixed-citation publication-type="journal"><string-name><surname>Amona</surname>, <given-names>E.</given-names></string-name>, <string-name><surname>West</surname>, <given-names>A.</given-names></string-name>, <string-name><surname>White</surname>, <given-names>A.</given-names></string-name>, <string-name><surname>Sahoo</surname>, <given-names>I.</given-names></string-name>, <string-name><surname>Chan</surname>, <given-names>D. M.</given-names></string-name>, <string-name><surname>Gandhi</surname>, <given-names>P.</given-names></string-name> and <string-name><surname>Qian</surname>, <given-names>Y.</given-names></string-name> (<year>2025</year>). <article-title>Breakdown of COVID effects on students’ mental health at the beginning of the pandemic</article-title>. <source>PLOS Mental Health</source> <volume>2</volume>(<issue>6</issue>) <fpage>0000363</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_002">
<label>[2]</label><mixed-citation publication-type="chapter"><string-name><surname>Barry</surname>, <given-names>J.</given-names></string-name> (<year>2017</year>). <chapter-title>Sentiment Analysis of Online Reviews Using Bag-of-Words and LSTM Approaches</chapter-title>. In <source>AICS</source> <fpage>272</fpage>–<lpage>274</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_003">
<label>[3]</label><mixed-citation publication-type="journal"><string-name><surname>Bogatinovski</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Todorovski</surname>, <given-names>L.</given-names></string-name>, <string-name><surname>Džeroski</surname>, <given-names>S.</given-names></string-name> and <string-name><surname>Kocev</surname>, <given-names>D.</given-names></string-name> (<year>2022</year>). <article-title>Comprehensive comparative study of multi-label classification methods</article-title>. <source>Expert Systems with Applications</source> <volume>203</volume> <fpage>117215</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_004">
<label>[4]</label><mixed-citation publication-type="journal"><string-name><surname>Boon-Itt</surname>, <given-names>S.</given-names></string-name>, <string-name><surname>Skunkan</surname>, <given-names>Y.</given-names></string-name> <etal>et al.</etal> (<year>2020</year>). <article-title>Public perception of the COVID-19 pandemic on Twitter: sentiment analysis and topic modeling study</article-title>. <source>JMIR Public Health and Surveillance</source> <volume>6</volume>(<issue>4</issue>) <fpage>21978</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_005">
<label>[5]</label><mixed-citation publication-type="journal"><string-name><surname>Bouazizi</surname>, <given-names>M.</given-names></string-name> and <string-name><surname>Ohtsuki</surname>, <given-names>T.</given-names></string-name> (<year>2019</year>). <article-title>Multi-class sentiment analysis on Twitter: Classification performance and challenges</article-title>. <source>IEEE Access</source> <volume>7</volume> <fpage>46273</fpage>–<lpage>46284</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_006">
<label>[6]</label><mixed-citation publication-type="journal"><string-name><surname>Browning</surname>, <given-names>M. H.</given-names></string-name>, <string-name><surname>Larson</surname>, <given-names>L. R.</given-names></string-name>, <string-name><surname>Sharaievska</surname>, <given-names>I.</given-names></string-name>, <string-name><surname>Rigolon</surname>, <given-names>A.</given-names></string-name>, <string-name><surname>McAnirlin</surname>, <given-names>O.</given-names></string-name>, <string-name><surname>Mullenbach</surname>, <given-names>L.</given-names></string-name>, <string-name><surname>Cloutier</surname>, <given-names>S.</given-names></string-name>, <string-name><surname>Vu</surname>, <given-names>T. M.</given-names></string-name>, <string-name><surname>Thomsen</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Reigner</surname>, <given-names>N.</given-names></string-name> <etal>et al.</etal> (<year>2021</year>). <article-title>Psychological impacts from COVID-19 among university students: Risk factors across seven states in the United States</article-title>. <source>PloS One</source> <volume>16</volume>(<issue>1</issue>) <fpage>0245327</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_007">
<label>[7]</label><mixed-citation publication-type="journal"><string-name><surname>Chan</surname>, <given-names>D. M.</given-names></string-name>, <string-name><surname>Broda</surname>, <given-names>M. D.</given-names></string-name>, <string-name><surname>Winslow</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Jones</surname>, <given-names>Q.</given-names></string-name>, <string-name><surname>Luce</surname>, <given-names>C.</given-names></string-name>, <string-name><surname>McGinnis</surname>, <given-names>H. A.</given-names></string-name>, <string-name><surname>Tomlinson</surname>, <given-names>C. A.</given-names></string-name>, <string-name><surname>Hamid</surname>, <given-names>H.</given-names></string-name> and <string-name><surname>Ma</surname>, <given-names>J.</given-names></string-name> (<year>2022</year>). <article-title>The Effects of Prime Supporters within a College Student’s Support Network</article-title>. <source>Nonlinear Dynamics, Psychology &amp; Life Sciences</source> <volume>26</volume>(<issue>4</issue>).</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_008">
<label>[8]</label><mixed-citation publication-type="journal"><string-name><surname>Chawla</surname>, <given-names>N. V.</given-names></string-name>, <string-name><surname>Bowyer</surname>, <given-names>K. W.</given-names></string-name>, <string-name><surname>Hall</surname>, <given-names>L. O.</given-names></string-name> and <string-name><surname>Kegelmeyer</surname>, <given-names>W. P.</given-names></string-name> (<year>2002</year>). <article-title>SMOTE: synthetic minority over-sampling technique</article-title>. <source>Journal of Artificial Intelligence Research</source> <volume>16</volume> <fpage>321</fpage>–<lpage>357</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_009">
<label>[9]</label><mixed-citation publication-type="journal"><string-name><surname>Copeland</surname>, <given-names>W. E.</given-names></string-name>, <string-name><surname>McGinnis</surname>, <given-names>E.</given-names></string-name>, <string-name><surname>Bai</surname>, <given-names>Y.</given-names></string-name>, <string-name><surname>Adams</surname>, <given-names>Z.</given-names></string-name>, <string-name><surname>Nardone</surname>, <given-names>H.</given-names></string-name>, <string-name><surname>Devadanam</surname>, <given-names>V.</given-names></string-name>, <string-name><surname>Rettew</surname>, <given-names>J.</given-names></string-name> and <string-name><surname>Hudziak</surname>, <given-names>J. J.</given-names></string-name> (<year>2021</year>). <article-title>Impact of COVID-19 pandemic on college student mental health and wellness</article-title>. <source>Journal of the American Academy of Child &amp; Adolescent Psychiatry</source> <volume>60</volume>(<issue>1</issue>) <fpage>134</fpage>–<lpage>141</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_010">
<label>[10]</label><mixed-citation publication-type="chapter"><string-name><surname>Demszky</surname>, <given-names>D.</given-names></string-name>, <string-name><surname>Movshovitz-Attias</surname>, <given-names>D.</given-names></string-name>, <string-name><surname>Ko</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Cowen</surname>, <given-names>A.</given-names></string-name>, <string-name><surname>Nemade</surname>, <given-names>G.</given-names></string-name> and <string-name><surname>Ravi</surname>, <given-names>S.</given-names></string-name> (<year>2020</year>). <chapter-title>GoEmotions: A Dataset of Fine-Grained Emotions</chapter-title>. In <source>Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics</source> <fpage>4040</fpage>–<lpage>4054</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_011">
<label>[11]</label><mixed-citation publication-type="journal"><string-name><surname>Desmet</surname>, <given-names>B.</given-names></string-name> and <string-name><surname>Hoste</surname>, <given-names>V.</given-names></string-name> (<year>2013</year>). <article-title>Emotion detection in suicide notes</article-title>. <source>Expert Systems with Applications</source> <volume>40</volume>(<issue>16</issue>) <fpage>6351</fpage>–<lpage>6358</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1016/j.eswa.2013.05.050" xlink:type="simple">https://doi.org/10.1016/j.eswa.2013.05.050</ext-link>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_012">
<label>[12]</label><mixed-citation publication-type="chapter"><string-name><surname>Devlin</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Chang</surname>, <given-names>M.-W.</given-names></string-name>, <string-name><surname>Lee</surname>, <given-names>K.</given-names></string-name> and <string-name><surname>Toutanova</surname>, <given-names>K.</given-names></string-name> (<year>2019</year>). <chapter-title>BERT: Pre-training of deep bidirectional transformers for language understanding</chapter-title>. In <source>Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies</source> <fpage>4171</fpage>–<lpage>4186</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_013">
<label>[13]</label><mixed-citation publication-type="journal"><string-name><surname>Floridi</surname>, <given-names>L.</given-names></string-name> and <string-name><surname>Chiriatti</surname>, <given-names>M.</given-names></string-name> (<year>2020</year>). <article-title>GPT-3: Its nature, scope, limits, and consequences</article-title>. <source>Minds and Machines</source> <volume>30</volume> <fpage>681</fpage>–<lpage>694</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_014">
<label>[14]</label><mixed-citation publication-type="journal"><string-name><surname>Guo</surname>, <given-names>X.</given-names></string-name>, <string-name><surname>Zhang</surname>, <given-names>G.</given-names></string-name>, <string-name><surname>Wang</surname>, <given-names>S.</given-names></string-name> and <string-name><surname>Chen</surname>, <given-names>Q.</given-names></string-name> (<year>2020</year>). <article-title>Multi-way matching based fine-grained sentiment analysis for user reviews</article-title>. <source>Neural Computing and Applications</source> <volume>32</volume>(<issue>12</issue>) <fpage>7729</fpage>–<lpage>7743</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_015">
<label>[15]</label><mixed-citation publication-type="journal"><string-name><surname>Hofmann</surname>, <given-names>T.</given-names></string-name>, <string-name><surname>Schölkopf</surname>, <given-names>B.</given-names></string-name> and <string-name><surname>Smola</surname>, <given-names>A. J.</given-names></string-name> (<year>2008</year>). <article-title>Kernel methods in machine learning</article-title>. <source>The Annals of Statistics</source> <volume>36</volume>(<issue>3</issue>) <fpage>1171</fpage>–<lpage>1220</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1214/009053607000000677" xlink:type="simple">https://doi.org/10.1214/009053607000000677</ext-link>. <ext-link ext-link-type="uri" xlink:href="https://mathscinet.ams.org/mathscinet-getitem?mr=2418654">MR2418654</ext-link></mixed-citation>
</ref>
<ref id="j_nejsds105_ref_016">
<label>[16]</label><mixed-citation publication-type="chapter"><string-name><surname>Jain</surname>, <given-names>B.</given-names></string-name>, <string-name><surname>Goyal</surname>, <given-names>G.</given-names></string-name> and <string-name><surname>Sharma</surname>, <given-names>M.</given-names></string-name> (<year>2024</year>). <chapter-title>Evaluating Emotional Detection &amp; Classification Capabilities of GPT-2 &amp; GPT-Neo Using Textual Data</chapter-title>. In <source>2024 14th International Conference on Cloud Computing, Data Science &amp; Engineering (Confluence)</source> <fpage>12</fpage>–<lpage>18</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1109/Confluence60223.2024.10463396" xlink:type="simple">https://doi.org/10.1109/Confluence60223.2024.10463396</ext-link>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_017">
<label>[17]</label><mixed-citation publication-type="chapter"><string-name><surname>Ji</surname>, <given-names>S.</given-names></string-name>, <string-name><surname>Zhang</surname>, <given-names>T.</given-names></string-name>, <string-name><surname>Ansari</surname>, <given-names>L.</given-names></string-name>, <string-name><surname>Fu</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Tiwari</surname>, <given-names>P.</given-names></string-name> and <string-name><surname>Cambria</surname>, <given-names>E.</given-names></string-name> (<year>2022</year>). <chapter-title>MentalBERT: Publicly available pretrained language models for mental healthcare</chapter-title>. In <source>Proceedings of the 13th Language Resources and Evaluation Conference</source> <fpage>7184</fpage>–<lpage>7190</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_018">
<label>[18]</label><mixed-citation publication-type="journal"><string-name><surname>Kim</surname>, <given-names>H.</given-names></string-name>, <string-name><surname>Rackoff</surname>, <given-names>G. N.</given-names></string-name>, <string-name><surname>Fitzsimmons-Craft</surname>, <given-names>E. E.</given-names></string-name>, <string-name><surname>Shin</surname>, <given-names>K. E.</given-names></string-name>, <string-name><surname>Zainal</surname>, <given-names>N. H.</given-names></string-name>, <string-name><surname>Schwob</surname>, <given-names>J. T.</given-names></string-name>, <string-name><surname>Eisenberg</surname>, <given-names>D.</given-names></string-name>, <string-name><surname>Wilfley</surname>, <given-names>D. E.</given-names></string-name>, <string-name><surname>Taylor</surname>, <given-names>C. B.</given-names></string-name> and <string-name><surname>Newman</surname>, <given-names>M. G.</given-names></string-name> (<year>2022</year>). <article-title>College mental health before and during the COVID-19 pandemic: results from a nationwide survey</article-title>. <source>Cognitive Therapy and Research</source> <volume>46</volume>(<issue>1</issue>) <fpage>1</fpage>–<lpage>10</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_019">
<label>[19]</label><mixed-citation publication-type="journal"><string-name><surname>Lossio-Ventura</surname>, <given-names>J. A.</given-names></string-name>, <string-name><surname>Weger</surname>, <given-names>R.</given-names></string-name>, <string-name><surname>Lee</surname>, <given-names>A. Y.</given-names></string-name>, <string-name><surname>Guinee</surname>, <given-names>E. P.</given-names></string-name>, <string-name><surname>Chung</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Atlas</surname>, <given-names>L.</given-names></string-name>, <string-name><surname>Linos</surname>, <given-names>E.</given-names></string-name> and <string-name><surname>Pereira</surname>, <given-names>F.</given-names></string-name> (<year>2024</year>). <article-title>A comparison of ChatGPT and fine-tuned open pre-trained transformers (OPT) against widely used sentiment analysis tools: sentiment analysis of COVID-19 survey data</article-title>. <source>JMIR Mental Health</source> <volume>11</volume> <fpage>50150</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_020">
<label>[20]</label><mixed-citation publication-type="chapter"><string-name><surname>Mohammad</surname>, <given-names>S. M.</given-names></string-name> (<year>2018</year>). <chapter-title>Word Affect Intensities</chapter-title>. In <source>Proceedings of the Eleventh International Conference on Language Resources and Evaluation (LREC 2018)</source>. <publisher-name>European Language Resources Association (ELRA)</publisher-name>, <publisher-loc>Miyazaki, Japan</publisher-loc>. <uri>https://aclanthology.org/L18-1027</uri>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_021">
<label>[21]</label><mixed-citation publication-type="journal"><string-name><surname>Mohammad</surname>, <given-names>S. M.</given-names></string-name> and <string-name><surname>Turney</surname>, <given-names>P. D.</given-names></string-name> (<year>2013</year>). <article-title>Crowdsourcing a word–emotion association lexicon</article-title>. <source>Computational Intelligence</source> <volume>29</volume>(<issue>3</issue>) <fpage>436</fpage>–<lpage>465</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1111/j.1467-8640.2012.00460.x" xlink:type="simple">https://doi.org/10.1111/j.1467-8640.2012.00460.x</ext-link>. <ext-link ext-link-type="uri" xlink:href="https://mathscinet.ams.org/mathscinet-getitem?mr=3093841">MR3093841</ext-link></mixed-citation>
</ref>
<ref id="j_nejsds105_ref_022">
<label>[22]</label><mixed-citation publication-type="chapter"><string-name><surname>Mustafa</surname>, <given-names>R. U.</given-names></string-name>, <string-name><surname>Ashraf</surname>, <given-names>N.</given-names></string-name>, <string-name><surname>Ahmed</surname>, <given-names>F. S.</given-names></string-name>, <string-name><surname>Ferzund</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Shahzad</surname>, <given-names>B.</given-names></string-name> and <string-name><surname>Gelbukh</surname>, <given-names>A.</given-names></string-name> (<year>2020</year>). <chapter-title>A Multiclass Depression Detection in Social Media Based on Sentiment Analysis</chapter-title>. In <source>International Conference on Intelligent Systems Design and Applications</source> <fpage>879</fpage>–<lpage>889</lpage>. <publisher-name>Springer</publisher-name>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_023">
<label>[23]</label><mixed-citation publication-type="journal"><string-name><surname>Nadkarni</surname>, <given-names>P. M.</given-names></string-name>, <string-name><surname>Ohno-Machado</surname>, <given-names>L.</given-names></string-name> and <string-name><surname>Chapman</surname>, <given-names>W. W.</given-names></string-name> (<year>2011</year>). <article-title>Natural language processing: an introduction</article-title>. <source>Journal of the American Medical Informatics Association</source> <volume>18</volume>(<issue>5</issue>) <fpage>544</fpage>–<lpage>551</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_024">
<label>[24]</label><mixed-citation publication-type="book"><string-name><surname>Nardi</surname>, <given-names>P. M.</given-names></string-name> (<year>2018</year>). <source>Doing survey research: A guide to quantitative methods</source>. <publisher-name>Routledge, an imprint of the Taylor &amp; Francis Group</publisher-name>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_025">
<label>[25]</label><mixed-citation publication-type="journal"><string-name><surname>Naseem</surname>, <given-names>U.</given-names></string-name>, <string-name><surname>Razzak</surname>, <given-names>I.</given-names></string-name>, <string-name><surname>Khushi</surname>, <given-names>M.</given-names></string-name>, <string-name><surname>Eklund</surname>, <given-names>P. W.</given-names></string-name> and <string-name><surname>Kim</surname>, <given-names>J.</given-names></string-name> (<year>2021</year>). <article-title>COVIDSenti: A large-scale benchmark Twitter data set for COVID-19 sentiment analysis</article-title>. <source>IEEE Transactions on Computational Social Systems</source> <volume>8</volume>(<issue>4</issue>) <fpage>1003</fpage>–<lpage>1015</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_026">
<label>[26]</label><mixed-citation publication-type="journal"><string-name><surname>Naveed</surname>, <given-names>H.</given-names></string-name>, <string-name><surname>Khan</surname>, <given-names>A. U.</given-names></string-name>, <string-name><surname>Qiu</surname>, <given-names>S.</given-names></string-name>, <string-name><surname>Saqib</surname>, <given-names>M.</given-names></string-name>, <string-name><surname>Anwar</surname>, <given-names>S.</given-names></string-name>, <string-name><surname>Usman</surname>, <given-names>M.</given-names></string-name>, <string-name><surname>Akhtar</surname>, <given-names>N.</given-names></string-name>, <string-name><surname>Barnes</surname>, <given-names>N.</given-names></string-name> and <string-name><surname>Mian</surname>, <given-names>A.</given-names></string-name> (<year>2023</year>). <article-title>A comprehensive overview of large language models</article-title>. <source>ACM Transactions on Intelligent Systems and Technology</source>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_027">
<label>[27]</label><mixed-citation publication-type="other"><string-name><surname>OpenAI</surname></string-name> (<year>2023</year>). GPT-4 Technical Report. <italic>arXiv preprint arXiv:</italic><ext-link ext-link-type="uri" xlink:href="https://arxiv.org/abs/2303.08774"><italic>2303.08774</italic></ext-link>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_028">
<label>[28]</label><mixed-citation publication-type="journal"><string-name><surname>Pröllochs</surname>, <given-names>N.</given-names></string-name>, <string-name><surname>Feuerriegel</surname>, <given-names>S.</given-names></string-name> and <string-name><surname>Neumann</surname>, <given-names>D.</given-names></string-name> (<year>2018</year>). <article-title>Statistical inferences for polarity identification in natural language</article-title>. <source>PloS One</source> <volume>13</volume>(<issue>12</issue>) <fpage>0209323</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_029">
<label>[29]</label><mixed-citation publication-type="chapter"><string-name><surname>Qader</surname>, <given-names>W. A.</given-names></string-name>, <string-name><surname>Ameen</surname>, <given-names>M. M.</given-names></string-name> and <string-name><surname>Ahmed</surname>, <given-names>B. I.</given-names></string-name> (<year>2019</year>). <chapter-title>An Overview of Bag of Words: Importance, Implementation, Applications, and Challenges</chapter-title>. In <source>2019 International Engineering Conference (IEC)</source> <fpage>200</fpage>–<lpage>204</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1109/IEC47844.2019.8950616" xlink:type="simple">https://doi.org/10.1109/IEC47844.2019.8950616</ext-link>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_030">
<label>[30]</label><mixed-citation publication-type="other"><string-name><surname>Radford</surname>, <given-names>A.</given-names></string-name>, <string-name><surname>Narasimhan</surname>, <given-names>K.</given-names></string-name>, <string-name><surname>Salimans</surname>, <given-names>T.</given-names></string-name>, <string-name><surname>Sutskever</surname>, <given-names>I.</given-names></string-name> <etal>et al.</etal> (<year>2018</year>). Improving language understanding by generative pre-training. Technical Report, OpenAI. <uri>https://cdn.openai.com/research-covers/language-unsupervised/</uri>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_031">
<label>[31]</label><mixed-citation publication-type="chapter"><string-name><surname>Rahman</surname>, <given-names>S. S. M. M.</given-names></string-name>, <string-name><surname>Biplob</surname>, <given-names>K. B. M. B.</given-names></string-name>, <string-name><surname>Rahman</surname>, <given-names>M. H.</given-names></string-name>, <string-name><surname>Sarker</surname>, <given-names>K.</given-names></string-name> and <string-name><surname>Islam</surname>, <given-names>T.</given-names></string-name> (<year>2020</year>). <chapter-title>An investigation and evaluation of N-Gram, TF-IDF and ensemble methods in sentiment classification</chapter-title>. In <source>Cyber Security and Computer Science: Second EAI International Conference, ICONCS 2020, Dhaka, Bangladesh, February 15-16, 2020, Proceedings 2</source> <fpage>391</fpage>–<lpage>402</lpage>. <publisher-name>Springer</publisher-name>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_032">
<label>[32]</label><mixed-citation publication-type="chapter"><string-name><surname>Ramos</surname>, <given-names>J.</given-names></string-name> <etal>et al.</etal> (<year>2003</year>). <chapter-title>Using TF-IDF to determine word relevance in document queries</chapter-title>. In <source>Proceedings of the first instructional conference on machine learning</source> <volume>242</volume> <fpage>29</fpage>–<lpage>48</lpage>. <publisher-name>Citeseer</publisher-name>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_033">
<label>[33]</label><mixed-citation publication-type="journal"><string-name><surname>Sebastiani</surname>, <given-names>F.</given-names></string-name> (<year>2002</year>). <article-title>Machine learning in automated text categorization</article-title>. <source>ACM Computing Surveys (CSUR)</source> <volume>34</volume>(<issue>1</issue>) <fpage>1</fpage>–<lpage>47</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_034">
<label>[34]</label><mixed-citation publication-type="journal"><string-name><surname>Smola</surname>, <given-names>A. J.</given-names></string-name> and <string-name><surname>Schölkopf</surname>, <given-names>B.</given-names></string-name> (<year>2004</year>). <article-title>A tutorial on support vector regression</article-title>. <source>Statistics and Computing</source> <volume>14</volume> <fpage>199</fpage>–<lpage>222</lpage>. <ext-link ext-link-type="doi" xlink:href="https://doi.org/10.1023/B:STCO.0000035301.49549.88" xlink:type="simple">https://doi.org/10.1023/B:STCO.0000035301.49549.88</ext-link>. <ext-link ext-link-type="uri" xlink:href="https://mathscinet.ams.org/mathscinet-getitem?mr=2086398">MR2086398</ext-link></mixed-citation>
</ref>
<ref id="j_nejsds105_ref_035">
<label>[35]</label><mixed-citation publication-type="journal"><string-name><surname>Son</surname>, <given-names>C.</given-names></string-name>, <string-name><surname>Hegde</surname>, <given-names>S.</given-names></string-name>, <string-name><surname>Smith</surname>, <given-names>A.</given-names></string-name>, <string-name><surname>Wang</surname>, <given-names>X.</given-names></string-name> and <string-name><surname>Sasangohar</surname>, <given-names>F.</given-names></string-name> (<year>2020</year>). <article-title>Effects of COVID-19 on college students’ mental health in the United States: Interview survey study</article-title>. <source>Journal of Medical Internet Research</source> <volume>22</volume>(<issue>9</issue>) <fpage>21279</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_036">
<label>[36]</label><mixed-citation publication-type="journal"><string-name><surname>Stoltzfus</surname>, <given-names>J. C.</given-names></string-name> (<year>2011</year>). <article-title>Logistic regression: a brief primer</article-title>. <source>Academic Emergency Medicine</source> <volume>18</volume>(<issue>10</issue>) <fpage>1099</fpage>–<lpage>1104</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_037">
<label>[37]</label><mixed-citation publication-type="chapter"><string-name><surname>Sundaram</surname>, <given-names>V.</given-names></string-name>, <string-name><surname>Ahmed</surname>, <given-names>S.</given-names></string-name>, <string-name><surname>Muqtadeer</surname>, <given-names>S. A.</given-names></string-name> and <string-name><surname>Reddy</surname>, <given-names>R. R.</given-names></string-name> (<year>2021</year>). <chapter-title>Emotion analysis in text using TF-IDF</chapter-title>. In <source>2021 11th International Conference on Cloud Computing, Data Science &amp; Engineering (Confluence)</source> <fpage>292</fpage>–<lpage>297</lpage>. <publisher-name>IEEE</publisher-name>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_038">
<label>[38]</label><mixed-citation publication-type="journal"><string-name><surname>Taboada</surname>, <given-names>M.</given-names></string-name>, <string-name><surname>Brooke</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Tofiloski</surname>, <given-names>M.</given-names></string-name>, <string-name><surname>Voll</surname>, <given-names>K.</given-names></string-name> and <string-name><surname>Stede</surname>, <given-names>M.</given-names></string-name> (<year>2011</year>). <article-title>Lexicon-based methods for sentiment analysis</article-title>. <source>Computational Linguistics</source> <volume>37</volume>(<issue>2</issue>) <fpage>267</fpage>–<lpage>307</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_039">
<label>[39]</label><mixed-citation publication-type="journal"><string-name><surname>Tang</surname>, <given-names>T.</given-names></string-name>, <string-name><surname>Tang</surname>, <given-names>X.</given-names></string-name> and <string-name><surname>Yuan</surname>, <given-names>T.</given-names></string-name> (<year>2020</year>). <article-title>Fine-tuning BERT for multi-label sentiment analysis in unbalanced code-switching text</article-title>. <source>IEEE Access</source> <volume>8</volume> <fpage>193248</fpage>–<lpage>193256</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_040">
<label>[40]</label><mixed-citation publication-type="journal"><string-name><surname>Tsoumakas</surname>, <given-names>G.</given-names></string-name> and <string-name><surname>Katakis</surname>, <given-names>I.</given-names></string-name> (<year>2007</year>). <article-title>Multi-label classification: An overview</article-title>. <source>International Journal of Data Warehousing and Mining</source> <volume>3</volume>(<issue>3</issue>) <fpage>1</fpage>–<lpage>13</lpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_041">
<label>[41]</label><mixed-citation publication-type="journal"><string-name><surname>Vaswani</surname>, <given-names>A.</given-names></string-name>, <string-name><surname>Shazeer</surname>, <given-names>N.</given-names></string-name>, <string-name><surname>Parmar</surname>, <given-names>N.</given-names></string-name>, <string-name><surname>Uszkoreit</surname>, <given-names>J.</given-names></string-name>, <string-name><surname>Jones</surname>, <given-names>L.</given-names></string-name>, <string-name><surname>Gomez</surname>, <given-names>A. N.</given-names></string-name>, <string-name><surname>Kaiser</surname>, <given-names>Ł.</given-names></string-name> and <string-name><surname>Polosukhin</surname>, <given-names>I.</given-names></string-name> (<year>2017</year>). <article-title>Attention is all you need</article-title>. <source>Advances in Neural Information Processing Systems</source> <volume>30</volume>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_042">
<label>[42]</label><mixed-citation publication-type="journal"><string-name><surname>Wang</surname>, <given-names>X.</given-names></string-name>, <string-name><surname>Hegde</surname>, <given-names>S.</given-names></string-name>, <string-name><surname>Son</surname>, <given-names>C.</given-names></string-name>, <string-name><surname>Keller</surname>, <given-names>B.</given-names></string-name>, <string-name><surname>Smith</surname>, <given-names>A.</given-names></string-name> and <string-name><surname>Sasangohar</surname>, <given-names>F.</given-names></string-name> (<year>2020</year>). <article-title>Investigating mental health of US college students during the COVID-19 pandemic: Cross-sectional survey study</article-title>. <source>Journal of Medical Internet Research</source> <volume>22</volume>(<issue>9</issue>) <fpage>22817</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_043">
<label>[43]</label><mixed-citation publication-type="journal"><string-name><surname>Weger</surname>, <given-names>R.</given-names></string-name>, <string-name><surname>Lossio-Ventura</surname>, <given-names>J. A.</given-names></string-name>, <string-name><surname>Rose-McCandlish</surname>, <given-names>M.</given-names></string-name>, <string-name><surname>Shaw</surname>, <given-names>J. S.</given-names></string-name>, <string-name><surname>Sinclair</surname>, <given-names>S.</given-names></string-name>, <string-name><surname>Pereira</surname>, <given-names>F.</given-names></string-name>, <string-name><surname>Chung</surname>, <given-names>J. Y.</given-names></string-name>, <string-name><surname>Atlas</surname>, <given-names>L. Y.</given-names></string-name> <etal>et al.</etal> (<year>2023</year>). <article-title>Trends in language use during the COVID-19 pandemic and relationship between language use and mental health: text analysis based on free responses from a longitudinal study</article-title>. <source>JMIR Mental Health</source> <volume>10</volume>(<issue>1</issue>) <fpage>40899</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_044">
<label>[44]</label><mixed-citation publication-type="journal"><string-name><surname>Wright</surname>, <given-names>L.</given-names></string-name>, <string-name><surname>Burton</surname>, <given-names>A.</given-names></string-name>, <string-name><surname>McKinlay</surname>, <given-names>A.</given-names></string-name>, <string-name><surname>Steptoe</surname>, <given-names>A.</given-names></string-name> and <string-name><surname>Fancourt</surname>, <given-names>D.</given-names></string-name> (<year>2022</year>). <article-title>Public opinion about the UK government during COVID-19 and implications for public health: A topic modeling analysis of open-ended survey response data</article-title>. <source>PloS One</source> <volume>17</volume>(<issue>4</issue>) <fpage>0264134</fpage>.</mixed-citation>
</ref>
<ref id="j_nejsds105_ref_045">
<label>[45]</label><mixed-citation publication-type="journal"><string-name><surname>Zeng</surname>, <given-names>X.</given-names></string-name> and <string-name><surname>Martinez</surname>, <given-names>T. R.</given-names></string-name> (<year>2000</year>). <article-title>Distribution-balanced stratified cross-validation for accuracy estimation</article-title>. <source>Journal of Experimental &amp; Theoretical Artificial Intelligence</source> <volume>12</volume>(<issue>1</issue>) <fpage>1</fpage>–<lpage>12</lpage>.</mixed-citation>
</ref>
</ref-list>
</back>
</article>
