<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1 20151215//EN" "http://jats.nlm.nih.gov/publishing/1.1/JATS-journalpublishing1.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xml:lang="en" article-type="research-article" dtd-version="1.1">
<front>
<journal-meta>
<journal-id journal-id-type="pmc">CMC</journal-id>
<journal-id journal-id-type="nlm-ta">CMC</journal-id>
<journal-id journal-id-type="publisher-id">CMC</journal-id>
<journal-title-group>
<journal-title>Computers, Materials &#x0026; Continua</journal-title>
</journal-title-group>
<issn pub-type="epub">1546-2226</issn>
<issn pub-type="ppub">1546-2218</issn>
<publisher>
<publisher-name>Tech Science Press</publisher-name>
<publisher-loc>USA</publisher-loc>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">36779</article-id>
<article-id pub-id-type="doi">10.32604/cmc.2023.036779</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Article</subject>
</subj-group>
</article-categories>
<title-group>
<article-title>Ensemble Deep Learning Framework for Situational Aspects-Based Annotation and Classification of International Student&#x2019;s Tweets during COVID-19</article-title>
<alt-title alt-title-type="left-running-head">Ensemble Deep Learning Framework for Situational Aspects-Based Annotation and Classification of International Student&#x2019;s Tweets during COVID-19</alt-title>
<alt-title alt-title-type="right-running-head">Ensemble Deep Learning Framework for Situational Aspects-Based Annotation and Classification of International Student&#x2019;s Tweets during COVID-19</alt-title>
</title-group>
<contrib-group>
<contrib id="author-1" contrib-type="author">
<name name-style="western"><surname>Hussain</surname><given-names>Shabir</given-names></name><xref ref-type="aff" rid="aff-1">1</xref></contrib>
<contrib id="author-2" contrib-type="author">
<name name-style="western"><surname>Ayoub</surname><given-names>Muhammad</given-names></name><xref ref-type="aff" rid="aff-2">2</xref></contrib>
<contrib id="author-3" contrib-type="author">
<name name-style="western"><surname>Yu</surname><given-names>Yang</given-names></name><xref ref-type="aff" rid="aff-1">1</xref></contrib>
<contrib id="author-4" contrib-type="author">
<name name-style="western"><surname>Wahid</surname><given-names>Junaid Abdul</given-names></name><xref ref-type="aff" rid="aff-1">1</xref></contrib>
<contrib id="author-5" contrib-type="author">
<name name-style="western"><surname>Khan</surname><given-names>Akmal</given-names></name><xref ref-type="aff" rid="aff-3">3</xref></contrib>
<contrib id="author-6" contrib-type="author">
<name name-style="western"><surname>Moller</surname><given-names>Dietmar P. F.</given-names></name><xref ref-type="aff" rid="aff-4">4</xref></contrib>
<contrib id="author-7" contrib-type="author" corresp="yes">
<name name-style="western"><surname>Weiyan</surname><given-names>Hou</given-names></name><xref ref-type="aff" rid="aff-1">1</xref><email>houwy@139.com</email></contrib>
<aff id="aff-1"><label>1</label><institution>School of Information Engineering, Zhengzhou University</institution>, <addr-line>Zhengzhou</addr-line>, <country>China</country></aff>
<aff id="aff-2"><label>2</label><institution>School of Computer Science and Engineering, Central South University</institution>, <addr-line>Changsha</addr-line>, <country>China</country></aff>
<aff id="aff-3"><label>3</label><institution>Department of Data Science, The Islamia University of Bahawalpur</institution>, <addr-line>Bahawalpur</addr-line>, <country>Pakistan</country></aff>
<aff id="aff-4"><label>4</label><institution>Clausthal University of Technology</institution>, <addr-line>Clausthal-Zellerfeld</addr-line>, <country>Germany</country></aff>
</contrib-group>
<author-notes>
<corresp id="cor1"><label>&#x002A;</label>Corresponding Author: Hou Weiyan. Email: <email>houwy@139.com</email></corresp>
</author-notes>
<pub-date date-type="collection" publication-format="electronic"><year>2023</year></pub-date>
<pub-date date-type="pub" publication-format="electronic"><day>1</day><month>5</month><year>2023</year></pub-date>
<volume>75</volume>
<issue>3</issue>
<fpage>5355</fpage>
<lpage>5377</lpage>
<history>
<date date-type="received"><day>12</day><month>10</month><year>2022</year>
</date>
<date date-type="accepted"><day>29</day><month>1</month><year>2023</year>
</date>
</history>
<permissions>
<copyright-statement>&#x00A9; 2023 Hussain et al.</copyright-statement>
<copyright-year>2023</copyright-year>
<copyright-holder>Hussain et al.</copyright-holder>
<license xlink:href="https://creativecommons.org/licenses/by/4.0/">
<license-p>This work is licensed under a <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution 4.0 International License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
</license>
</permissions>
<self-uri content-type="pdf" xlink:href="TSP_CMC_36779.pdf"></self-uri>
<abstract>
<p>As the COVID-19 pandemic swept the globe, social media platforms became an essential source of information and communication for many. International students, particularly, turned to Twitter to express their struggles and hardships during this difficult time. To better understand the sentiments and experiences of these international students, we developed the Situational Aspect-Based Annotation and Classification (SABAC) text mining framework. This framework uses a three-layer approach, combining baseline Deep Learning (DL) models with Machine Learning (ML) models as meta-classifiers to accurately predict the sentiments and aspects expressed in tweets from our collected Student-COVID-19 dataset. Using the proposed aspect2class annotation algorithm, we labeled bulk unlabeled tweets according to their contained aspect terms. However, we also recognized the challenges of reducing data&#x2019;s high dimensionality and sparsity to improve performance and annotation on unlabeled datasets. To address this issue, we proposed the Volatile Stopwords Filtering (VSF) technique to reduce sparsity and enhance classifier performance. The resulting Student-COVID Twitter dataset achieved a sophisticated accuracy of 93.21% when using the random forest as a meta-classifier. Through testing on three benchmark datasets, we found that the SABAC ensemble framework performed exceptionally well. Our findings showed that international students during the pandemic faced various issues, including stress, uncertainty, health concerns, financial stress, and difficulties with online classes and returning to school. By analyzing and summarizing these annotated tweets, decision-makers can better understand and address the real-time problems international students face during the ongoing pandemic.</p>
</abstract>
<kwd-group kwd-group-type="author">
<kwd>COVID-19 pandemic</kwd>
<kwd>situational awareness</kwd>
<kwd>ensemble learning</kwd>
<kwd>aspect-based text classification</kwd>
<kwd>deep learning models</kwd>
<kwd>international students</kwd>
<kwd>topic modeling</kwd>
</kwd-group>
<funding-group>
<award-group id="awg1">
<funding-source>National Natural Science Foundation of China</funding-source>
<award-id>92067106</award-id>
</award-group>
<award-group id="awg2">
<funding-source>Ministry of Education of the People&#x2019;s Republic of China</funding-source>
<award-id>E-GCCRC20200309</award-id>
</award-group>
</funding-group>
</article-meta>
</front>
<body>
<sec id="s1">
<label>1</label>
<title>Introduction</title>
<p>The COVID-19 pandemic affected the whole world and changed every human life. Its devastation begins in China Wuhan and spreads worldwide, ruining human lives, health, and economies. The World Health Organization (WHO) [<xref ref-type="bibr" rid="ref-1">1</xref>] declared the COVID-19 pandemic on March 11, 2020, due to its destructive behavior. After discerning the rapid spread of COVID-19 [<xref ref-type="bibr" rid="ref-2">2</xref>], all nations and their governments adopted harsh preventive measures to manage this terrible epidemic and stop it from spreading. About 3.9 billion people have been affected and under lockdown or quarantined in their houses, and international travelers have been quarantined in quarantine centers reserved by different countries to contain the virus [<xref ref-type="bibr" rid="ref-3">3</xref>]. After the surge of COVID-19 cases, every field of life has faced troubles, and this disease disturbed their lives. Its aftershocks will be observed and felt for many years. The student community is one of the influential groups that has been disturbed pathetically and is missing from the vulnerable group&#x2019;s list. This vulnerable group of international students has been facing social and economic obstacles, and no one has addressed their issues globally [<xref ref-type="bibr" rid="ref-4">4</xref>]. Globally lockdown policies were also affected, and universities shut down their campuses by following the government&#x2019;s directives. Developed countries financially helped their citizens in this time of pandemic emergency. Unluckily, international students suffer social and economic costs and are ignored by the authorities [<xref ref-type="bibr" rid="ref-5">5</xref>,<xref ref-type="bibr" rid="ref-6">6</xref>]. International students from developing countries have already experienced difficulties with financial circumstances to continue their studies abroad [<xref ref-type="bibr" rid="ref-7">7</xref>]. The sudden shutdown of university campuses has created problems for students from developing countries. Most of the work found in the literature is survey-based, and the researchers performed statistical analysis on the collected data. A study revealed that 13% of students had faced late graduation concerns, and 4% of students lost their jobs due to the COVID-19 pandemic. Another survey [<xref ref-type="bibr" rid="ref-8">8</xref>] was conducted at &#x201C;<ext-link ext-link-type="uri" xlink:href="http://education.com">education.com</ext-link>&#x201D; to evaluate &#x201C;how COVID-19 affected your study abroad plans&#x201D;, in which they estimated that 4.7% of students intend to cancel their study abroad plans. The number of students who returned to their homes due to the shutdown of university campuses and now want to return to their universities to resume their studies is 47.2%. Moreover, 68.2% of students are interested in studying abroad online. Before the COVID-19 situation, a global investment of $18.66 billion in 2019 and $350 was estimated to reach 2025 in educational technology. Over the decades, social media has become an active technological tool and a news and communication channel for the general public worldwide. It plays an influential role in the COVID-19 pandemic by dismantling information around the globe [<xref ref-type="bibr" rid="ref-9">9</xref>]. The public has used the social media platform more frequently during the COVID-19 pandemic to express their sentiments. The information about any issue and trends on social media spread as COVID-19 spread rapidly. We analyzed many trends that international students influence by using different hashtags like &#x201C;#takeusback&#x201D; to address their study regarding issues [<xref ref-type="bibr" rid="ref-4">4</xref>,<xref ref-type="bibr" rid="ref-10">10</xref>]. They want to return to their universities to continue their studies. To the best of our knowledge, there is no study yet to analyze and understand international students&#x2019; perceptions and problems during the COVID-19 pandemic using text mining. This paper has addressed and explored students&#x2019; sentiments and aspects regarding their financial distress, emotional distress, self-worth, and academic performance distress. The effect of COVID-19 on international students is heterogeneous. This study aims to answer the following research questions.
<list list-type="bullet">
<list-item>
<p>How does international students&#x2019; perception change due to COVID-19, and what problems do they face in this pandemic?</p></list-item>
<list-item>
<p>Using Natural Language Processing (NLP), how do we mine and explore students&#x2019; issues from their given textual feedback on different social media platforms?</p></list-item>
</list></p>
<p>To answer the above research questions and uncover international students&#x2019; issues and views, NLP and Artificial Intelligence (AI) models are used widely to process textual data [<xref ref-type="bibr" rid="ref-11">11</xref>]. We proposed an ensemble deep learning framework (SABAC) for topic extraction, annotation, and classification. The purpose of SABAC is to annotate a large amount of unlabeled textual data automatically according to the situational aspects. In traditional text mining, most of the data is labeled and balanced, and labeling the unbalanced data according to the situational aspects is a laborious and time-consuming task. Therefore, we proposed three layers based SABAC framework. In the first layer of SABAC, we used an ensemble deep learning-based four different models to analyze international students&#x2019; tweets to explore and extract their situational emotions regarding their situation in the COVID-19 pandemic. We proposed and implemented an annotation algorithm in the second layer to annotate the extracted aspect terms as class labels. The third layer of SABAC used annotated tweets, which were annotated from the previous layer for the classification using deep learning algorithms in an ensemble learning manner to classify students&#x2019; textual data according to extracted class labels. In addition to the above-mentioned two research questions, we aim to answer the following research questions to examine issues of international students.
<list list-type="bullet">
<list-item>
<p>Does our proposed framework improve the aspect extraction process from textual feedback given by international students?</p></list-item>
<list-item>
<p>Does our proposed SABAC framework improve topic classification and annotation process accuracy?</p></list-item>
</list></p>
<p>Analyzing the student&#x2019;s tweets about the uncertainty in their future goals due to the COVID-19 pandemic is necessary to uncover hidden aspects in their feedback. Higher authorities can take essential measures regarding their study plans by analyzing international students&#x2019; views. This study will help understand the factors and issues regarding students&#x2019; situational information. Our main contributions to this paper are as follows:
<list list-type="bullet">
<list-item>
<p>We scrapped and collected Twitter dataset in which international students expressed their situational perceptions and opinion, and we named our dataset Student-COVID-19.</p></list-item>
<list-item>
<p>We have proposed a novel ensemble deep learning-based topic modeling and classification framework named SABAC to mine the accurate and robust aspect terms from the international students&#x2019; feedback dataset.</p></list-item>
<list-item>
<p>We also proposed a new ensemble machine learning-based model to perform topic classification and annotate unlabeled Twitter datasets using mined topic terms.</p></list-item>
<list-item>
<p>We proposed and implemented a data filtering technique. We analyzed that using Volatile Stop words Filtering (VSF) improved the performance of machine learning classifiers.</p></list-item>
<list-item>
<p>The results of this study may help international universities and governments to understand the situational aspect and sentiments of international students.</p></list-item>
</list></p>
<p>In the next section of this paper, we discussed related works. It is followed by a description of the research methodology, procedures, and data collection in Section 3. Results and discussion are presented in Section 4. Finally, the research conclusion is in Section 5.</p>
</sec>
<sec id="s2">
<label>2</label>
<title>Literature Review</title>
<p>Since the COVID-19 pandemic started, the interest of researchers has diverted to explore and analyze the effect of COVID-19 from many perspectives. China was the first country to force the regional lockdown strategy in Hubei province, especially Wuhan city, for 76 days [<xref ref-type="bibr" rid="ref-12">12</xref>]. Quarantine centers use IoT systems to monitor the suspected individuals and restrict them from interactions [<xref ref-type="bibr" rid="ref-13">13</xref>]. According to [<xref ref-type="bibr" rid="ref-14">14</xref>], the absence of these social connections leads to depression, anxiety, extreme mental stress, and many other aspects of life. In contrast to mental health, the authors [<xref ref-type="bibr" rid="ref-15">15</xref>] surveyed Liaoning Province, mainland China, to assess the influence of COVID-19 on people&#x2019;s mental health. According to their findings, 52.1% of the 263 participants were terrified and worried due to the epidemic. However, 53.3% of those polled did not feel helpless due to the pandemic. Nowadays, deep learning is being used in various domains of life to improve performance, including face emotion recognition [<xref ref-type="bibr" rid="ref-16">16</xref>], comparative analysis of social communication apps [<xref ref-type="bibr" rid="ref-17">17</xref>], to evaluate the business insides [<xref ref-type="bibr" rid="ref-18">18</xref>], and many more. In this study, we reviewed previous work on text classification using ensemble deep learning  techniques <xref ref-type="table" rid="table-1">Table 1</xref>.</p>
<table-wrap id="table-1">
<label>Table 1</label>
<caption>
<title>Previous work on text classification using ensemble deep learning techniques</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Studies</th>
<th>Models</th>
<th>Ensemble techniques</th>
<th>Dataset</th>
</tr>
</thead>
<tbody>
<tr>
<td>[<xref ref-type="bibr" rid="ref-19">19</xref>]</td>
<td>Decision Tree, Random Forest (RF), Artificial Neural Network (ANN), Support Vector Machine (SVM)</td>
<td>Stacking</td>
<td>Patients survey data</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-20">20</xref>]</td>
<td>ANN, Adaboost</td>
<td>Bagging &#x002B; Boosting</td>
<td>Tweets COVID-19</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-21">21</xref>]</td>
<td>Multi-layer Long Short Term Memory (LSTM)</td>
<td>No</td>
<td>Twitter tweets</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-22">22</xref>]</td>
<td>BERT and LSTM</td>
<td>No</td>
<td>Twitter tweets</td>
</tr>
<tr>
<td/>
<td>Convolutional Neural Network (CNN),</td>
<td></td>
<td>Google trends &#x0026;</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-23">23</xref>]</td>
<td>BiGuru, DistilBert</td>
<td>Boosting</td>
<td>Twitter data</td>
</tr>
<tr>
<td/>
<td>Latent Dirichlet Allocation (LDA), Linear Regression (LR), SVM</td>
<td>Stacking, AdaBoost, bagging</td>
<td>Services reviews datasets</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-24">24</xref>]</td>
<td>LSTM, Bi-Directional Long Short-Term Memory (Bi-LSTM)</td>
<td>Voting, bagging,</td>
<td>Services reviews</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-25">25</xref>]</td>
<td></td>
<td>Stacking</td>
<td>Datasets</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-26">26</xref>]</td>
<td>LSTM, CNN, GRU</td>
<td>Voting, stacking</td>
<td>Twitter tweets</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-27">27</xref>]</td>
<td>CNN</td>
<td>Voting</td>
<td>Health reviews dataset</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-28">28</xref>]</td>
<td>CNN, LSTM, GRU, Bi-LSTM</td>
<td>Stacking</td>
<td>SemEval2016</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The authors [<xref ref-type="bibr" rid="ref-3">3</xref>,<xref ref-type="bibr" rid="ref-32">32</xref>] used machine learning and natural language processing techniques to analyze the 840000 tweets. Their sentiment results showed that the death and lockdown due to the COVID-19 are the aspects that mainly caused stress, anxiety, and Trauma among Indian citizens. COVID-19 increased depression, anxiety, and stress levels in individual life. Their results showed that the lockdown in the country increased depression in individuals. To understand the sentiment of an individual through social media posts, the authors of [<xref ref-type="bibr" rid="ref-33">33</xref>] used an adaptive model for automatic hate speech identification that is ensemble learning-based, enhancing cross-dataset generalization. Base learners in ensemble learning are reliant on the outcomes of base learners in the past. Furthermore, we reported previous ensemble studies and their implementation for text classification using machine learning, as shown in <xref ref-type="table" rid="table-2">Table 2</xref>. As COVID-19 was declared a pandemic by WHO, people started sharing their opinion about mental stress and anxiety due to COVID-19 on Twitter [<xref ref-type="bibr" rid="ref-34">34</xref>]. Meanwhile, to analyze the students&#x2019; mental health and behavior toward COVID-19, the authors [<xref ref-type="bibr" rid="ref-35">35</xref>] surveyed 1182 students of different age groups. Their findings revealed that students used various social media platforms and other coping techniques to minimize worry and mental stress and obtained aid from their friends and family. Due to COVID-19, universities led to online classes, and students were asked to leave dorms; hence, students faced mental health issues. To examine the students&#x2019; mental health and evaluate their online academic performance, the study [<xref ref-type="bibr" rid="ref-36">36</xref>] conducted a general health Questionnaire-based survey among 1123 participants. The results of their experiments were considered significant at a <italic>p</italic>-value set of 0.05. 76.96% of the participants manifested psycho-pathological symptoms measured by this survey. To address and predict international students&#x2019; satisfaction, the researchers [<xref ref-type="bibr" rid="ref-37">37</xref>] gathered survey data from 425 students from different departments in Hong Kong. They performed different machine learning algorithms like regression and random forest; however, they achieved the highest accuracy using elastic net regression, and 65.2% explained variance. Their findings reported that it is critical to rule out the underlying reasons why students from different programs prefer face-to-face learning.</p>
<table-wrap id="table-2">
<label>Table 2</label>
<caption>
<title>Previous work on ensemble deep learning approach for COVID-19 text analytics</title>
</caption>
<table frame="hsides" >
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Studies</th>
<th>Models</th>
<th>Ensemble techniques</th>
<th>Dataset</th>
</tr>
</thead>
<tbody>
<tr>
<td>[<xref ref-type="bibr" rid="ref-29">29</xref>]</td>
<td>Decision Tree (DT), SVM, RF</td>
<td>Stacking</td>
<td>Twitter data from IEEE</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-20">20</xref>]</td>
<td>ANN, Adaboost</td>
<td>Bagging, boosting</td>
<td>Tweets COVID-19</td>
</tr>
<tr>
<td></td>
<td>SVM, RF, DT</td>
<td>Boosting</td>
<td>Twitter API</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-30">30</xref>]</td>
<td>RoBerta, DeBerta,</td>
<td></td>
<td>CONSTRAINT</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-31">31</xref>]</td>
<td>XLNet</td>
<td>Soft, hard voting</td>
<td>COVID-19 dataset</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-19">19</xref>]</td>
<td>DT, RF, ANN, SVM</td>
<td>Stacking</td>
<td>Patients survey data</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-27">27</xref>]</td>
<td>CNN</td>
<td>Voting</td>
<td>Health reviews dataset</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s3">
<label>3</label>
<title>Proposed Framework</title>
<p>This section has discussed significant components of the manuscript, including dataset collection, pre-processing, feature extraction using several NLP techniques, and statistical analysis. The current study consists of two parts: In the first part, we performed aspect extraction using an ensemble learning approach to explore students&#x2019; situational perceptions or aspect terms from the Tweets. The proposed Emergency Situational Awareness (ESA) model is a fusion of different deep learning and machine learning models to improve Situational Understanding (SU), as shown in <xref ref-type="fig" rid="fig-1">Fig. 1</xref>. We further divided our approach into three layers; in the first layer, we used different deep learning models as weak learners (weak classifiers) for Aspect Extraction (AE) from textual data using the ensemble learning approach. After extracting situational aspects from the dataset, we performed annotation of each tweet according to its extracted aspect term using aspect2class Algorithm 1 in the second layer of the proposed SABAC framework. The third layer includes training of deep learning weak classifiers using annotated Tweets according to aspect terms as class labels to perform classification. In this manner, our proposed model is different from other existing solutions, and the results of deep weak classifiers are passed to machine learning-based meta-classifiers as the proposed ensemble technique for the final prediction of class labels on the test dataset.</p>
<fig id="fig-1">
<label>Figure 1</label>
<caption>
<title>Ensemble learning framework for situational awareness</title>
</caption>
<graphic mimetype="image" mime-subtype="tif" xlink:href="CMC_36779-fig-1.tif"/>
</fig>
<p>All experiments in this paper are conducted on Intel(R) Celeron(R) CPU N3150 @ 1.60 GHz. The operating system is Windows 64-bit, Python 3.6.6, TensorFlow deep Learning framework 1.8.0, and CUDA 10.1.</p>
<sec id="s3_1">
<label>3.1</label>
<title>Data Collection and Pre-processing</title>
<p>The dataset used for this study is obtained from Twitter. The Twitter dataset was collected using Twitter API from March 2020 to December 2021, and we extracted 13.4k tweets using diffident hashtags represented by trends of international students. We named our collected Twitter dataset Student-COVID-19. The process of collecting data is shown in <xref ref-type="fig" rid="fig-2">Fig. 2</xref>.</p>
<fig id="fig-2">
<label>Figure 2</label>
<caption>
<title>Student-COVID-19 dataset collection</title>
</caption>
<graphic mimetype="image" mime-subtype="tif" xlink:href="CMC_36779-fig-2.tif"/>
</fig>
<p>We analyzed different studies [<xref ref-type="bibr" rid="ref-38">38</xref>,<xref ref-type="bibr" rid="ref-39">39</xref>] in this domain and also analyzed various tweets by international students on Twitter and collected &#x201C;back to school&#x201D;, &#x201C;open border&#x201D;, &#x201C;online education&#x201D;, &#x201C;stress&#x201D;, and &#x201C;uncertainty&#x201D; hashtags based on the previous studies and trends of international students tweets [<xref ref-type="bibr" rid="ref-4">4</xref>,<xref ref-type="bibr" rid="ref-5">5</xref>,<xref ref-type="bibr" rid="ref-6">6</xref>]. The combination of these hashtags only posed by the international students who were suffering from mental stress and no study outcome due to online education and requesting for the border opening to go back to school for physical classes, and these hashtags were also considered of the scope by previous studies as well [<xref ref-type="bibr" rid="ref-38">38</xref>,<xref ref-type="bibr" rid="ref-39">39</xref>]. We also performed experiments on our collected and previous benchmark datasets to evaluate the proposed ensemble deep learning framework (SABAC). A detailed description of the benchmark and our collected datasets is shown in <xref ref-type="table" rid="table-3">Table 3</xref>.</p>
<table-wrap id="table-3">
<label>Table 3</label>
<caption>
<title>Detailed dataset description</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Dataset</th>
<th>Description</th>
<th>Class</th>
<th>No. of observation</th>
</tr>
</thead>
<tbody>
<tr>
<td>[<xref ref-type="bibr" rid="ref-28">28</xref>]</td>
<td>English language Tweet collected on 12th workshop on semantic evaluation</td>
<td>3</td>
<td>20634</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-40">40</xref>]</td>
<td>English language text from 20 different newsgroups</td>
<td>2</td>
<td>18000</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-41">41</xref>]</td>
<td>English language text about COVID-19 and English language Tweet</td>
<td>2</td>
<td>10700</td>
</tr>
<tr>
<td>Our collected dataset</td>
<td>Related to COVID-19 and international students</td>
<td>6</td>
<td>13400</td>
</tr>
</tbody>
</table>
</table-wrap>
<sec id="s3_1_1">
<label>3.1.1</label>
<title>Pre-processing</title>
<p>Data pre-processing involves many techniques to make data consistent to perform the experiments. We removed @ symbol, which represents the user&#x2019;s name, RT used for retweets, and the hashtag symbol. We replaced slang words with actual words using <italic>n</italic>-gram according to the procedure defined by [<xref ref-type="bibr" rid="ref-42">42</xref>]. For the second and third datasets, we performed traditional data pre-processing, in which we performed the following techniques to remove the noise from the data.
<list list-type="bullet">
<list-item>
<p>We performed basic pre-processing techniques to clean the data by removing unnecessary and irrelevant information and text, i.e., from these hashtags #takeusback, and #openborders, we removed # symbols.</p></list-item>
<list-item>
<p>We observed that students use many words in combination to create hashtags, such as &#x201C;takeusback&#x201D;, but these words need to be separate for processing take us back. We performed segmentation to void such kinds of issues.</p></list-item>
<list-item>
<p>Stopword removal is also a prevalent method to remove noisy data from the text without affecting the sentence&#x2019;s meaning. We also removed Stopwords from the data in the aspect extraction module.</p></list-item>
<list-item>
<p>Next, we used the lemmatization technique to preserve morphological aspects of words by converting them into their basic form. We performed this task by using the &#x201C;nltk&#x201D; library in python.</p></list-item>
<list-item>
<p>We also removed punctuation, numbers, hyphens, and special symbols from raw text to make data consistent and noise-free.</p></list-item>
<list-item>
<p>To capture and preserve syntactic features from the texts, we performed Part of Speech (POS) tagging to denote each word, i.e., noun, verb, adjective, and adverb.</p></list-item>
</list></p>
</sec>
<sec id="s3_1_2">
<label>3.1.2</label>
<title>Reducing Sparsity</title>
<p>We used the Volatile Stopwords Filtering (VSF) technique to reduce the sparsity problem. The VSF list is generated from the current dataset and is not pre-defined. According to our data&#x2019;s vocabulary analysis, 79% of the terms appeared less than five times in the corpus. Exploring these terms revealed that almost all words with a frequency of fewer than five are less significant, so we excluded all these terms from the feature space. Using the VSF technique improved the accuracy of the classification process.</p>
</sec>
</sec>
<sec id="s3_2">
<label>3.2</label>
<title>Ensemble Learning</title>
<p>In the traditional machine learning classification process, a single classifier is trained on training data at one time [<xref ref-type="bibr" rid="ref-43">43</xref>]. Usually, every classifier produces a different result in accuracy on the same training dataset. It is more complex to determine which classifier could attain adequate accuracy on a particular training dataset if we use multiple classifiers [<xref ref-type="bibr" rid="ref-44">44</xref>] as a base or weak classifier to obtain optimal results. In the ensemble machine learning approach, meta-classifiers produce an optimal generalized output by aggregating the results of weak classifiers [<xref ref-type="bibr" rid="ref-45">45</xref>]. The workflow of our proposed situational awareness ensemble deep learning topic modeling for aspect classification is shown in <xref ref-type="fig" rid="fig-3">Fig. 3</xref>. To ensemble the weak learner&#x2019;s predictions, there are three commonly applicable techniques, bagging, boosting, and stacking. This paper uses a stacking ensemble deep learning approach for topic modeling and aspect classification. The reason for not choosing the bagging and boosting is that it works only with weak homogeneous learners, leading to more bias in models and being computationally expensive. However, we implemented heterogeneous weak classifiers and performed training parallelly using the stacking approach. We parallelly trained multiple deep learning models in our stacked ensemble approach and combined weak learners&#x2019; output. The output of the weak learners is finally used as input for the meta-classifier for the final prediction. We have used Naive Bayes (NB), Logistic Regression (LR), and Support Vector Machines (SVM) as meta-classifiers for the final prediction.</p>
<fig id="fig-3">
<label>Figure 3</label>
<caption>
<title>Aspect extraction using ensemble learning framework for situational awareness<break/></title>
</caption>
<graphic mimetype="image" mime-subtype="tif" xlink:href="CMC_36779-fig-3.tif"/>
</fig>
</sec>
<sec id="s3_3">
<label>3.3</label>
<title>Aspect Extraction as Ensemble Learning</title>
<p>To extract the best and most accurate topic terms as aspect terms from the tweets, we first need to constitute the topic models as baseline classifiers used for topic modeling. We used the first baseline model, Latent Dirichlet allocation (LDA) [<xref ref-type="bibr" rid="ref-34">34</xref>], and a generative probabilistic corpus model, which can identify and describe latent thematic structures within collections of text documents. LDA inputs our document-term matrix and generates an output yielding an <italic>N</italic>X<italic>N</italic> topic matrix, in which <italic>N</italic> is the number of topics assigned to six topics. The LDA algorithm [<xref ref-type="bibr" rid="ref-46">46</xref>] attempts to build a complete representation of the corpus by inferring latent content variables known as topics. For instance, a given corpus <italic>D</italic> consisting of <italic>M</italic> documents, with document d having <italic>N</italic><sub><italic>d</italic></sub> words <inline-formula id="ieqn-1"><mml:math id="mml-ieqn-1"><mml:mo stretchy="false">(</mml:mo><mml:mi>d</mml:mi><mml:mi>&#x03F5;</mml:mi><mml:mn>1</mml:mn><mml:mo>,</mml:mo><mml:mo>&#x2026;</mml:mo><mml:mo>,</mml:mo><mml:mi>M</mml:mi><mml:mo stretchy="false">)</mml:mo></mml:math></inline-formula> LDA model <italic>D</italic> according to the following generative process [<xref ref-type="bibr" rid="ref-46">46</xref>,<xref ref-type="bibr" rid="ref-47">47</xref>].
<list list-type="bullet">
<list-item>
<p>Select a multinomial distribution <inline-formula id="ieqn-2"><mml:math id="mml-ieqn-2"><mml:msub><mml:mi>&#x03B1;</mml:mi><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> for topic <italic>t</italic>, from a Dirichlet distribution with parameter <inline-formula id="ieqn-3"><mml:math id="mml-ieqn-3"><mml:mi>&#x03B2;</mml:mi></mml:math></inline-formula>.</p></list-item>
<list-item>
<p>From a Dirichlet distribution with parameter <inline-formula id="ieqn-4"><mml:math id="mml-ieqn-4"><mml:mi>&#x03B1;</mml:mi></mml:math></inline-formula>, select multinomial distribution <inline-formula id="ieqn-5"><mml:math id="mml-ieqn-5"><mml:msub><mml:mi>&#x03B8;</mml:mi><mml:mrow><mml:mi>t</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> for document <italic>d</italic>.</p></list-item>
<list-item>
<p>Choose a topic <inline-formula id="ieqn-6"><mml:math id="mml-ieqn-6"><mml:msub><mml:mi>z</mml:mi><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> from <inline-formula id="ieqn-7"><mml:math id="mml-ieqn-7"><mml:msub><mml:mrow><mml:mi>&#x2205;</mml:mi></mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> and word <inline-formula id="ieqn-8"><mml:math id="mml-ieqn-8"><mml:msub><mml:mi>w</mml:mi><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> from <inline-formula id="ieqn-9"><mml:math id="mml-ieqn-9"><mml:msub><mml:mrow><mml:mi>&#x2205;</mml:mi></mml:mrow><mml:mrow><mml:mi>z</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula> for the word <inline-formula id="ieqn-10"><mml:math id="mml-ieqn-10"><mml:msub><mml:mi>w</mml:mi><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:msub></mml:math></inline-formula>.</p></list-item>
</list></p>
<p>The probability of observed data <italic>D</italic> of a corpus is computed and acquired as shown in <xref ref-type="disp-formula" rid="eqn-1">Eq. (1)</xref>.</p>
<p><disp-formula id="eqn-1"><label>(1)</label><mml:math id="mml-eqn-1" display="block"><mml:mrow><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mrow><mml:mo stretchy="false">|</mml:mo></mml:mrow><mml:mrow><mml:mi>&#x03B1;</mml:mi></mml:mrow><mml:mo>,</mml:mo><mml:mrow><mml:mi>&#x03B2;</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:munderover><mml:mo movablelimits="false">&#x220F;</mml:mo><mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:mrow><mml:mrow><mml:mrow><mml:mi>M</mml:mi></mml:mrow></mml:mrow></mml:munderover><mml:mo>&#x222B;</mml:mo><mml:mrow><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>&#x03B8;</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>|</mml:mo></mml:mrow><mml:mrow><mml:mi>&#x03B1;</mml:mi></mml:mrow><mml:mo stretchy="false">)</mml:mo><mml:mrow><mml:mo>(</mml:mo><mml:munderover><mml:mo movablelimits="false">&#x220F;</mml:mo><mml:mrow><mml:mrow><mml:mi>d</mml:mi></mml:mrow></mml:mrow><mml:mrow><mml:mrow><mml:mi>N</mml:mi></mml:mrow></mml:mrow></mml:munderover><mml:mrow><mml:mi>N</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mn>1</mml:mn></mml:mrow><mml:munder><mml:mo movablelimits="false">&#x2211;</mml:mo><mml:mrow><mml:mrow><mml:mi>z</mml:mi></mml:mrow></mml:mrow></mml:munder><mml:msub><mml:mrow><mml:mi>d</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mrow><mml:mi>p</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>|</mml:mo></mml:mrow><mml:msub><mml:mrow><mml:mi>&#x03B8;</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>D</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo stretchy="false">)</mml:mo><mml:mrow><mml:mi>p</mml:mi></mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mrow><mml:mi>w</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>n</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mrow><mml:mo stretchy="false">|</mml:mo></mml:mrow><mml:msub><mml:mrow><mml:mi>z</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>d</mml:mi><mml:mi>n</mml:mi></mml:mrow><mml:mo>,</mml:mo><mml:mrow><mml:mi>&#x03B2;</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo stretchy="false">)</mml:mo><mml:mo>)</mml:mo></mml:mrow></mml:math></disp-formula></p>
<p>In <xref ref-type="disp-formula" rid="eqn-1">Eq. (1)</xref>, <inline-formula id="ieqn-11"><mml:math id="mml-ieqn-11"><mml:mi>&#x03B1;</mml:mi></mml:math></inline-formula> represents the parameters of the topic Dirichlet prior and the distribution of words over topics, which, drawn from the Dirichlet distribution, given <inline-formula id="ieqn-12"><mml:math id="mml-ieqn-12"><mml:mi>&#x03B2;</mml:mi></mml:math></inline-formula>. While <italic>T</italic> represents the number of topics, <italic>N</italic> is the vocabulary size, and <italic>M</italic> is the number of documents. On the left side of <xref ref-type="disp-formula" rid="eqn-1">Eq. (1)</xref>, we have a probability of the document that appears for the mixture over latent topics. On the right-hand side of the equations, there are four factors; the first two factors work as the setting of LDA, and the last two factors work as gears of the LDA. Before performing topic modeling using LDA, we performed pre-processing, using the CountVectorizer object from the <italic>SKLearn</italic> library to convert each string to a numerical vector. LDA takes input from our document-term matrix and generates an output yielding an <italic>N</italic> &#x00D7; <italic>N</italic> topic matrix, in which <italic>N</italic> is the number of topics assigned, and 6 is the number of topics. Furthermore, we used the <italic>arg Max</italic> method for each tweet text in the topic matrix. We also adjust hyper-parameters of LDA according to our dataset, as shown in <xref ref-type="table" rid="table-4">Table 4</xref>. The experimental results in extracted topics, their relevant terms, and coherence score are shown in <xref ref-type="table" rid="table-7">Table 7</xref>.</p>
<table-wrap id="table-4">
<label>Table 4</label>
<caption>
<title>Summary of hyper-parameters of baseline models for topic extraction</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Model</th>
<th>No. of components</th>
<th>No. of iteration</th>
<th>Random state</th>
<th>Batch size</th>
</tr>
</thead>
<tbody>
<tr>
<td>LDA</td>
<td>10</td>
<td>100</td>
<td>None</td>
<td>128</td>
</tr>
<tr>
<td>Bert</td>
<td>10</td>
<td>5</td>
<td>None</td>
<td>&#x2013;</td>
</tr>
<tr>
<td>HDP</td>
<td>10</td>
<td>5</td>
<td>None</td>
<td>&#x2013;</td>
</tr>
<tr>
<td>Zero-shot</td>
<td>50</td>
<td>20</td>
<td>&#x2013;</td>
<td>64</td>
</tr>
</tbody>
</table>
</table-wrap>

<fig id="fig-9">
<graphic mimetype="image" mime-subtype="tif" xlink:href="CMC_36779-fig-9.tif"/>
</fig>
<p>The second baseline model used for topic modeling is the Hierarchical Dirichlet Process (HDP), which uses a Dirichlet process for each data group, with the Dirichlet processes for all groups sharing a base distribution drawn from a Dirichlet process [<xref ref-type="bibr" rid="ref-48">48</xref>]. We used a hierarchical Dirichlet process from the gensim library. We used cosine similarity to compute the feature vector&#x2019;s similarity, as shown in <xref ref-type="disp-formula" rid="eqn-2">Eq. (2)</xref>.</p>
<p><disp-formula id="eqn-2"><label>(2)</label><mml:math id="mml-eqn-2" display="block"><mml:mrow><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>n</mml:mi><mml:mi>e</mml:mi></mml:mrow><mml:mtext>&#x00A0;</mml:mtext><mml:mrow><mml:mi>s</mml:mi><mml:mi>i</mml:mi><mml:mi>m</mml:mi><mml:mi>i</mml:mi><mml:mi>l</mml:mi><mml:mi>a</mml:mi><mml:mi>r</mml:mi><mml:mi>i</mml:mi><mml:mi>t</mml:mi><mml:mi>y</mml:mi></mml:mrow><mml:mrow><mml:mo>(</mml:mo><mml:mrow><mml:mi>&#x03B8;</mml:mi></mml:mrow><mml:mo>)</mml:mo></mml:mrow><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mo>&#x22C5;</mml:mo><mml:mrow><mml:mi>B</mml:mi></mml:mrow></mml:mrow><mml:mrow><mml:mrow><mml:mo>|</mml:mo><mml:mrow><mml:mo>|</mml:mo><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mo>|</mml:mo></mml:mrow><mml:mo>|</mml:mo></mml:mrow><mml:mrow><mml:mo stretchy="false">|</mml:mo></mml:mrow><mml:mrow><mml:mo>|</mml:mo><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mo>|</mml:mo></mml:mrow><mml:mrow><mml:mo stretchy="false">|</mml:mo></mml:mrow></mml:mrow></mml:mfrac><mml:mo>=</mml:mo><mml:mfrac><mml:mrow><mml:msubsup><mml:mo movablelimits="false">&#x2211;</mml:mo><mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:mrow><mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:mrow></mml:msubsup><mml:msub><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:msub><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:mrow></mml:msub></mml:mrow><mml:mrow><mml:msqrt><mml:msubsup><mml:mo movablelimits="false">&#x2211;</mml:mo><mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:mrow><mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:mrow></mml:msubsup><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>A</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mrow><mml:mn>2</mml:mn></mml:mrow></mml:mrow></mml:msup></mml:msqrt><mml:mrow><mml:mi>X</mml:mi></mml:mrow><mml:msqrt><mml:munderover><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mrow><mml:mn>1</mml:mn></mml:mrow></mml:mrow><mml:mrow><mml:mrow><mml:mi>n</mml:mi></mml:mrow></mml:mrow></mml:munderover><mml:msup><mml:mrow><mml:mo>(</mml:mo><mml:msub><mml:mrow><mml:mi>B</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>)</mml:mo></mml:mrow><mml:mrow><mml:mrow><mml:msup><mml:mn>2</mml:mn><mml:mo>&#x2032;</mml:mo></mml:msup></mml:mrow></mml:mrow></mml:msup></mml:msqrt></mml:mrow></mml:mfrac></mml:math></disp-formula></p>
<p>In <xref ref-type="disp-formula" rid="eqn-2">Eq. (2)</xref>, A and B are the feature vector, <italic>n</italic> is each feature vector&#x2019;s size, and <italic>i</italic> is the index of each feature value in the feature vector. We also adjust the hyper-parameters of the HDP model according to our dataset, as shown in <xref ref-type="table" rid="table-4">Table 4</xref>. The experimental results in extracted topics, their relevant terms, and coherence score are shown in <xref ref-type="table" rid="table-8">Table 8</xref>. The third technique used for topic extraction is the Zero-Shot Learning transfer learning approach [<xref ref-type="bibr" rid="ref-49">49</xref>]. We have also adjusted hyper-parameters of Zero-Shot Learning according to our dataset, as shown in <xref ref-type="table" rid="table-4">Table 4</xref>. The experimental results in extracted topics, their relevant terms, and coherence score are shown in <xref ref-type="table" rid="table-9">Table 9</xref>. Last but not least Bidirectional Encoder Representations from Transformers (BERT) is used as a base learner for topic extraction. BERT uses a transformer, an attention mechanism that learns contextual relations between words (or sub-words) in a text. We also adjust the hyper-parameters of BERT according to our dataset, as shown in <xref ref-type="table" rid="table-4">Table 4</xref>. The experimental results in extracted topics, their relevant terms, and coherence score are shown in <xref ref-type="table" rid="table-6">Table 6</xref>. Algorithm 1 shows the formal procedure of aspect terms annotation on the unlabeled dataset. The output of the first layer is used as input for the second layer. We extracted six topics and their related terms {<italic>t</italic><sub><italic>i1</italic></sub>, <italic>t</italic><sub><italic>i2</italic></sub>, <italic>t</italic><sub><italic>i3</italic></sub><italic>&#x2026;t</italic><sub><italic>n</italic></sub>} by using different deep learning models. As a result of each topic term, we mapped each aspect term with a related tweet and assigned where the relevant terms and associated synonyms matched.</p>
</sec>
<sec id="s3_4">
<label>3.4</label>
<title>Text Classification as Ensemble Learning</title>
<p>The classification process used as an ensemble approach is illustrated in <xref ref-type="fig" rid="fig-4">Fig. 4</xref>. We construct a set of deep baseline models based on several architectures of networks for each benchmark dataset. The first weak classifier used for extracted aspect classification is the Convolutional Neural Network Model (CNN) [<xref ref-type="bibr" rid="ref-50">50</xref>], which stimulates biological neurons. In recent years it has been widely used for NLP tasks. We adjust the hyper-parameters of CNN according to our classification task, as shown in <xref ref-type="table" rid="table-5">Table 5</xref>. The confusion matrix&#x2019;s experimental results are shown in <xref ref-type="fig" rid="fig-6">Fig. 6</xref>, which shows the classification values. <xref ref-type="fig" rid="fig-6">Fig. 6a</xref> reported the highest classification accuracy by accurately classifying the text into topic 2. The second model for classification as base learner Long Short-Term Memory (LSTM) is a three-gated neural network. We also adjust hyper-parameters of LSTM according to our classification task for six topics, as shown in <xref ref-type="table" rid="table-5">Table 5</xref>. The experimental results in terms of the confusion matrix as shown in <xref ref-type="fig" rid="fig-6">Fig. 6b</xref>. The third base learner for classification is Bi-Directional Long Short-Term Memory (Bi-LSTM). Its bi-directional approach increases efficiency and effectively results in text classification as forward and preceding text [<xref ref-type="bibr" rid="ref-51">51</xref>]. However, in bi-directional, we can flow the input in both directions to preserve future and past information. We also adjust the hyper-parameters of Bi-LSTM according to our classification task for six topics, as shown in <xref ref-type="table" rid="table-6">Table 6</xref> and the confusion matrix in <xref ref-type="fig" rid="fig-6">Fig. 6c</xref>. The fourth weak learner used for classification tasks is the Robustly Optimized BERT pre-trained approach (RoBERTa); BERT&#x2019;s extension changes the pre-training procedure. The base version of the model has 12 layers and 110M parameters. We also adjust hyper-parameters of Bi-LSTM according to our classification task for six topics, as shown in <xref ref-type="table" rid="table-5">Table 5</xref>. The experimental results in the confusion matrix as shown in <xref ref-type="fig" rid="fig-6">Fig. 6d</xref>, show the classification values for all six topics using the RoBERTa on our Twitter tweet datasets.</p>
<fig id="fig-4">
<label>Figure 4</label>
<caption>
<title>Aspect terms classification using ensemble learning framework for situational awareness</title>
</caption>
<graphic mimetype="image" mime-subtype="tif" xlink:href="CMC_36779-fig-4.tif"/>
</fig>
<table-wrap id="table-5">
<label>Table 5</label>
<caption>
<title>Summary of deep learning models and its hyper-parameters</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Model</th>
<th>Type</th>
<th>Layers</th>
<th>Trainable parameter</th>
</tr>
</thead>
<tbody>
<tr>
<td>CNN</td>
<td>Sequential</td>
<td>Embedding, Conv1D, Max Pooling, Dense</td>
<td>17942826</td>
</tr>
<tr>
<td>LSTM</td>
<td>Sequential</td>
<td>Embedding, Spatial dropout, LSTM, Dense</td>
<td>581006</td>
</tr>
<tr>
<td>Bi-LSTM</td>
<td>Sequential</td>
<td>Embedding, Spatial dropout, Dense</td>
<td>581006</td>
</tr>
<tr>
<td>BERT</td>
<td>&#x2013;</td>
<td>Keras Layers, Dropout Layer</td>
<td>109483010</td>
</tr>
<tr>
<td>RoBERTa</td>
<td>&#x2013;</td>
<td>TF RoBerta, Dropout, Flatten, Dense</td>
<td>174978821</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="table-6">
<label>Table 6</label>
<caption>
<title>Topics with their relevant terms and coherence score using Bert-topic library</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Topics</th>
<th>Relevant terms</th>
<th>Coherence value</th>
</tr>
</thead>
<tbody>
<tr>
<td>Topic 0</td>
<td>Mental stress</td>
<td>0.034206</td>
</tr>
<tr>
<td/>
<td>Fear</td>
<td>0.02721</td>
</tr>
<tr>
<td/>
<td>Friends</td>
<td>0.0246248</td>
</tr>
<tr>
<td/>
<td>Depressed</td>
<td>0.0153</td>
</tr>
<tr>
<td>Topic 1</td>
<td>Symptoms</td>
<td>0.049454</td>
</tr>
<tr>
<td/>
<td>Stuck</td>
<td>0.0493</td>
</tr>
<tr>
<td/>
<td>Health</td>
<td>0.04677</td>
</tr>
<tr>
<td/>
<td>COVID-19</td>
<td>0.035276</td>
</tr>
<tr>
<td>Topic 2</td>
<td>Hope</td>
<td>0.0483</td>
</tr>
<tr>
<td/>
<td>No learning</td>
<td>0.04541</td>
</tr>
<tr>
<td/>
<td>Tuition fee</td>
<td>0.034158</td>
</tr>
<tr>
<td/>
<td>Future learning</td>
<td>0.0517</td>
</tr>
<tr>
<td>Topic 3</td>
<td>Lockdown</td>
<td>0.0807</td>
</tr>
<tr>
<td/>
<td>Late graduation</td>
<td>0.08794</td>
</tr>
<tr>
<td/>
<td>Routine adjustment</td>
<td>0.08602</td>
</tr>
<tr>
<td/>
<td>Gathering</td>
<td>0.06853</td>
</tr>
<tr>
<td>Topic 4</td>
<td>Save student</td>
<td>0.07634</td>
</tr>
<tr>
<td/>
<td>Anxiety</td>
<td>0.069562</td>
</tr>
<tr>
<td/>
<td>Request</td>
<td>0.03654</td>
</tr>
<tr>
<td/>
<td>Open border</td>
<td>0.02936</td>
</tr>
<tr>
<td>Topic 5</td>
<td>Jobless</td>
<td>0.0352</td>
</tr>
<tr>
<td/>
<td>Stipend</td>
<td>0.02461</td>
</tr>
<tr>
<td/>
<td>China</td>
<td>0.23654</td>
</tr>
<tr>
<td/>
<td>Scholarship</td>
<td>0.01936</td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
</sec>
<sec id="s4">
<label>4</label>
<title>Results and Discussion</title>
<p>This study focuses on a novel Situational Aspect-Based Annotation and Classification (SABAC) framework to uncover international students&#x2019; situational aspects. As discussed in the methodology section, our proposed framework consists of three layers. The dataset used for this study was collected from Twitter using diffident hashtags represented by trends on Twitter from international students.</p>
<p>In the first layer, we used four deep learning models, such as LDA, BERT, HDP, and Zero-Shot Learning, as base learner (weak classifiers) models in the ensemble technique to mine accurate aspect terms from the Twitter dataset. The experimental results in extracted topics with their relevant terms and coherence score are shown in <xref ref-type="table" rid="table-6">Tables 6</xref>&#x2013;<xref ref-type="table" rid="table-9">9</xref>.</p>
<table-wrap id="table-7">
<label>Table 7</label>
<caption>
<title>Topics with their relevant terms and coherence score using LDA</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Topics</th>
<th>Relevant terms</th>
<th>Coherence value</th>
</tr>
</thead>
<tbody>
<tr>
<td>Topic 0</td>
<td>Open border</td>
<td>0.108</td>
</tr>
<tr>
<td/>
<td>Open flights</td>
<td>0.106</td>
</tr>
<tr>
<td/>
<td>Fever</td>
<td>0.028</td>
</tr>
<tr>
<td/>
<td>Crisis</td>
<td>0.015</td>
</tr>
<tr>
<td>Topic 1</td>
<td>Practical knowledge</td>
<td>0.346</td>
</tr>
<tr>
<td/>
<td>International students</td>
<td>0.106</td>
</tr>
<tr>
<td/>
<td>Future goals</td>
<td>0.027</td>
</tr>
<tr>
<td/>
<td>Take us back</td>
<td>0.05</td>
</tr>
<tr>
<td>Topic 2</td>
<td>Internet access</td>
<td>0.149</td>
</tr>
<tr>
<td/>
<td>Online learning</td>
<td>0.092</td>
</tr>
<tr>
<td/>
<td>Symptom</td>
<td>0.055</td>
</tr>
<tr>
<td/>
<td>Tuition fee</td>
<td>0.052</td>
</tr>
<tr>
<td>Topic 3</td>
<td>Worry</td>
<td>0.057</td>
</tr>
<tr>
<td/>
<td>Research work</td>
<td>0.033</td>
</tr>
<tr>
<td/>
<td>Stuck</td>
<td>0.021</td>
</tr>
<tr>
<td/>
<td>Student goal</td>
<td>0.12</td>
</tr>
<tr>
<td>Topic 4</td>
<td>Campaign</td>
<td>0.061</td>
</tr>
<tr>
<td/>
<td>Stress</td>
<td>0.052</td>
</tr>
<tr>
<td/>
<td>Gathering</td>
<td>0.024</td>
</tr>
<tr>
<td/>
<td>Students not thieves</td>
<td>0.016</td>
</tr>
<tr>
<td>Topic 5</td>
<td>Jobless</td>
<td>0.0352</td>
</tr>
<tr>
<td/>
<td>Student</td>
<td>0.02461</td>
</tr>
<tr>
<td/>
<td>Stipend</td>
<td>0.23654</td>
</tr>
<tr>
<td/>
<td>Jobless</td>
<td>0.01936</td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="table-8">
<label>Table 8</label>
<caption>
<title>Topics with their relevant terms and coherence score using HDP</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Topics</th>
<th>Relevant terms</th>
<th>Coherence value</th>
</tr>
</thead>
<tbody>
<tr>
<td>Topic 0</td>
<td>Fear</td>
<td>0.015</td>
</tr>
<tr>
<td/>
<td>Symptoms</td>
<td>0.013</td>
</tr>
<tr>
<td/>
<td>Academic loss</td>
<td>0.005</td>
</tr>
<tr>
<td/>
<td>Failure</td>
<td>0.004</td>
</tr>
<tr>
<td>Topic 1</td>
<td>Stipend</td>
<td>0.004</td>
</tr>
<tr>
<td/>
<td>Academic loss</td>
<td>0.003</td>
</tr>
<tr>
<td/>
<td>Future goal</td>
<td>0.003</td>
</tr>
<tr>
<td/>
<td>Living expenses</td>
<td>0.002</td>
</tr>
<tr>
<td>Topic 2</td>
<td>Visa</td>
<td>0.003</td>
</tr>
<tr>
<td/>
<td>Border policy</td>
<td>0.003</td>
</tr>
<tr>
<td/>
<td>Lockdown routine</td>
<td>0.003</td>
</tr>
<tr>
<td/>
<td>Friends gathering</td>
<td>0.002</td>
</tr>
<tr>
<td>Topic 3</td>
<td>Students not thieves</td>
<td>0.452</td>
</tr>
<tr>
<td/>
<td>Open flights</td>
<td>0.357</td>
</tr>
<tr>
<td/>
<td>Depression</td>
<td>0.3222</td>
</tr>
<tr>
<td/>
<td>University</td>
<td>0.374</td>
</tr>
<tr>
<td>Topic 4</td>
<td>Jobless</td>
<td>0.0352</td>
</tr>
<tr>
<td/>
<td>Stipend</td>
<td>0.02461</td>
</tr>
<tr>
<td/>
<td>China</td>
<td>0.23654</td>
</tr>
<tr>
<td/>
<td>Scholarship</td>
<td>0.01936</td>
</tr>
<tr>
<td>Topic 5</td>
<td>Scholarship</td>
<td>0.322</td>
</tr>
<tr>
<td/>
<td>Remote learning</td>
<td>0.299</td>
</tr>
<tr>
<td/>
<td>Late degree</td>
<td>0.168</td>
</tr>
<tr>
<td/>
<td>Symptom</td>
<td>0.155</td>
</tr>
</tbody>
</table>
</table-wrap><table-wrap id="table-9">
<label>Table 9</label>
<caption>
<title>Topics with their relevant terms and coherence score using Zero-Shot learning</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Topics</th>
<th>Relevant terms</th>
<th>Coherence value</th>
</tr>
</thead>
<tbody>
<tr>
<td>Topic 0</td>
<td>Entry</td>
<td>0.000682</td>
</tr>
<tr>
<td/>
<td>Future folded</td>
<td>0.0005499</td>
</tr>
<tr>
<td/>
<td>Lockdown</td>
<td>0.0005565</td>
</tr>
<tr>
<td/>
<td>Borders</td>
<td>0.00055</td>
</tr>
<tr>
<td>Topic 1</td>
<td>Facing</td>
<td>0.00083</td>
</tr>
<tr>
<td/>
<td>Issue</td>
<td>0.000805</td>
</tr>
<tr>
<td/>
<td>Losses</td>
<td>0.0007826</td>
</tr>
<tr>
<td/>
<td>Take us back to China</td>
<td>0.0006406</td>
</tr>
<tr>
<td>Topic 2</td>
<td>Student</td>
<td>0.0352</td>
</tr>
<tr>
<td/>
<td>No funding</td>
<td>0.02461</td>
</tr>
<tr>
<td/>
<td>China</td>
<td>0.23654</td>
</tr>
<tr>
<td/>
<td>Scholarship</td>
<td>0.01936</td>
</tr>
<tr>
<td>Topic 3</td>
<td>Save international student</td>
<td>0.000895</td>
</tr>
<tr>
<td/>
<td>Social connections</td>
<td>0.000778</td>
</tr>
<tr>
<td/>
<td>Disappointing</td>
<td>0.0007617</td>
</tr>
<tr>
<td/>
<td>Return policy</td>
<td>0.000752</td>
</tr>
<tr>
<td>Topic 4</td>
<td>Lockdown routine</td>
<td>0.00089</td>
</tr>
<tr>
<td/>
<td>Late graduation</td>
<td>0.0007828</td>
</tr>
<tr>
<td/>
<td>Stuck</td>
<td>0.00076436</td>
</tr>
<tr>
<td/>
<td>Return policy</td>
<td>0.000732229</td>
</tr>
<tr>
<td>Topic 5</td>
<td>Discarded</td>
<td>0.000885349</td>
</tr>
<tr>
<td/>
<td>Open border</td>
<td>0.000673</td>
</tr>
<tr>
<td/>
<td>Stipend</td>
<td>0.23654</td>
</tr>
<tr>
<td/>
<td>Jobless</td>
<td>0.01936</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Assessing the results shown in <xref ref-type="table" rid="table-6">Tables 6</xref>&#x2013;<xref ref-type="table" rid="table-9">9</xref>, we can conclude that on the Student-COVID-19 dataset, the SABAC provides better results and coherent topics by selecting six topics and five relevant terms. Our topic modeling techniques&#x2019; performance according to each extracted topic is reported using a word cloud. In addition, the words that dominate the word cloud are most likely directly related to the topic term of the word cloud, as we can see in <xref ref-type="fig" rid="fig-5">Fig. 5a</xref> reporting Topic-0, which talks about the &#x201C;returning to school&#x201D; of international students.</p>
<fig id="fig-5">
<label>Figure 5</label>
<caption>
<title>Word cloud representation of each extracted topic</title>
</caption>
<graphic mimetype="image" mime-subtype="tif" xlink:href="CMC_36779-fig-5.tif"/>
</fig>
<p>There are some dominant words in <xref ref-type="fig" rid="fig-5">Fig. 5a</xref> that represent the topic of returning to school, such as &#x201C;school&#x201D; &#x201C;open&#x201D; &#x201C;back&#x201D; and &#x201C;border&#x201D; these words illustrate the issue of international students about their returning to school for physical classes.</p>

<p><disp-formula id="eqn-3"><label>(3)</label><mml:math id="mml-eqn-3" display="block"><mml:mrow><mml:mi>c</mml:mi><mml:mi>v</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:mo>&#x2211;</mml:mo><mml:mrow><mml:mi>i</mml:mi></mml:mrow><mml:mo>&#x003C;</mml:mo><mml:mrow><mml:mi>j</mml:mi></mml:mrow><mml:mtext>&#x00A0;</mml:mtext><mml:mrow><mml:mi>s</mml:mi><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi></mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mrow><mml:mi>w</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mrow><mml:mi>w</mml:mi></mml:mrow><mml:mrow><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:mrow></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:math></disp-formula></p>
<p>Similarly, <xref ref-type="fig" rid="fig-5">Figs. 5b</xref>, <xref ref-type="fig" rid="fig-5">5c</xref>, <xref ref-type="fig" rid="fig-5">5d</xref> and <xref ref-type="fig" rid="fig-5">5f</xref> represents Topic-1, Topic-2, Topic-3, Topic-4, and Topic-5, which show Financial Stress, Health, Online Education, Stress, and uncertainty, respectively. In contrast, the word cloud for each topic (Topic-1 to Topic5) contains dominant words representing each topic&#x2019;s authenticity and relevant term score for each topic term. The topic extraction and relevant terms extraction results are shown below using Bert-Topic Library. For the topic extraction and modeling, we used different deep-learning approaches. The complete list of models and their parameters used in this study is shown in <xref ref-type="table" rid="table-4">Table 4</xref>. Similarly, we used other deep learning models to evaluate the topic modeling results. The complete list of models and their architecture summary is shown in <xref ref-type="table" rid="table-5">Table 5</xref>. The coherence score is for accessing the quality of learned topics through different models. We used a coherence score as it is essential to find the optimal number of topics because these topics will ultimately convert into labels for annotating the dataset. As shown in <xref ref-type="disp-formula" rid="eqn-3">Eq. (3)</xref>, for one topic, the words <italic>i</italic>, <italic>j</italic> is scored in <inline-formula id="ieqn-13"><mml:math id="mml-ieqn-13"><mml:mo>&#x2211;</mml:mo><mml:mi>i</mml:mi><mml:mo>&#x003C;</mml:mo><mml:mrow><mml:mi>j</mml:mi><mml:mtext>&#x00A0;</mml:mtext><mml:mi>s</mml:mi><mml:mi>c</mml:mi><mml:mi>o</mml:mi><mml:mi>r</mml:mi><mml:mi>e</mml:mi></mml:mrow><mml:mo stretchy="false">(</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mrow><mml:mi>i</mml:mi></mml:mrow></mml:msub><mml:mo>,</mml:mo><mml:msub><mml:mi>w</mml:mi><mml:mrow><mml:mi>j</mml:mi></mml:mrow></mml:msub><mml:mo stretchy="false">)</mml:mo></mml:math></inline-formula> have the highest probability of occurring for that topic. Furthermore, <xref ref-type="table" rid="table-6">Tables 6</xref>&#x2013;<xref ref-type="table" rid="table-9">9</xref> reported the extracted topics with relevant terms and coherence scores using Bert, LDA, HDP, and Zero-Shot Learning, respectively.</p>

<p>Moreover, the extracted topics have also demonstrated the situation of international students, such as mental stress or fear in the students whose degree is delayed due to lab work. Hence <xref ref-type="table" rid="table-8">Table 8</xref> also represents these terms as relevant terms, similar to <xref ref-type="table" rid="table-6">Table 6</xref>, demonstrating the fear and being stuck. These terms also represent the international student&#x2019;s situation as they are stuck in their rooms and home countries. Hence it represents fear of being late for graduation and unemployment. To better understand the extracted terms from the tweets, we also represent the co-occurrence of words within sentences, as shown in <xref ref-type="fig" rid="fig-7">Fig. 7</xref>. We can conclude that our proposed SABAC model accurately extracts the situational aspects of international students to uncover their issues during the pandemic. The second layer of the proposed SABAC framework used Algorithm 1 to annotate a more significant number of unlabeled tweets into six mined aspect terms. Our proposed framework used the aspect2class algorithm and text similarity matrix to annotate unlabeled tweets into six mined aspect terms. In the third layer of the proposed framework, we used ensemble learning techniques to classify unlabeled Twitter tweets into six mined aspect terms. Using the ensemble technique, we used CNN, LSTM, Bi-LSTM, and RoBERTa models as base-learner classifiers in the third layer to classify our Twitter dataset into six mined aspect terms. The results of the base-learner classifier in the form of precision, recall, and f1-support are shown in <xref ref-type="table" rid="table-11">Table 11</xref>. We used four different ensemble learning techniques in this classification layer of the proposed SABAC. These ensemble techniques include soft prediction, hard prediction, SABAC (soft prediction &#x002B; VSF), and SABAC (Hard prediction &#x002B; VSF). Moreover, we used logistic regression, support vector machine, naive Bayes, and random forest machine learning models as meta-classifiers in Layer-1 to evaluate the final prediction for aspect classification. The results of meta-classifiers&#x2019; using different ensemble techniques are shown in <xref ref-type="table" rid="table-10">Table 10</xref>. We plotted the confusion matrix to depict our four meta-classifiers&#x2019; performances on the test dataset shown in <xref ref-type="fig" rid="fig-6">Fig. 6</xref>.</p>
<fig id="fig-6">
<label>Figure 6</label>
<caption>
<title>Confusion matrix for each aspect topic using meta-classifiers (a) LR, (b) NB, (c) RF, (d) SVM</title>
</caption>
<graphic mimetype="image" mime-subtype="tif" xlink:href="CMC_36779-fig-6.tif"/>
</fig>
<fig id="fig-7">
<label>Figure 7</label>
<caption>
<title>Co-occurrences within sentences and words following one another</title>
</caption>
<graphic mimetype="image" mime-subtype="tif" xlink:href="CMC_36779-fig-7.tif"/>
</fig>
<table-wrap id="table-10">
<label>Table 10</label>
<caption>
<title>The accuracy of the proposed ensemble framework on our Student-COVID-19 dataset</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>Ensemble technique</th>
<th align="center" colspan="4">Meta classifiers</th>
</tr>
<tr>
<th></th>
<th>Logistic regression</th>
<th>Support vector machine</th>
<th>Na&#x00EF;ve Bayes</th>
<th>Random forest</th>
</tr>
</thead>
<tbody>
<tr>
<td>Hard prediction</td>
<td>91.21</td>
<td>91.32</td>
<td>90.98</td>
<td>91.78</td>
</tr>
<tr>
<td>Soft prediction</td>
<td>91.85</td>
<td>89.29</td>
<td>90.56</td>
<td>89.94</td>
</tr>
<tr>
<td>SABAC (Hard prediction &#x002B; VSF)</td>
<td>92.03</td>
<td>91.98</td>
<td>91.29</td>
<td>92.64</td>
</tr>
<tr>
<td><bold>SABAC (Soft prediction &#x002B; VSF)</bold></td>
<td><bold>92.87</bold></td>
<td><bold>92.87</bold></td>
<td><bold>92.87</bold></td>
<td><bold>92.87</bold></td>
</tr>
</tbody>
</table>
</table-wrap>
<table-wrap id="table-11">
<label>Table 11</label>
<caption>
<title>Performance metrics of baseline models for each topic</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>DL baseline models</th>
<th>Performance matrices</th>
<th>Back to school</th>
<th>Stress</th>
<th>Financial stress</th>
<th>Uncertainty</th>
<th>Online learning</th>
<th>Health</th>
</tr>
</thead>
<tbody>
<tr>
<td>CNN</td>
<td>Precision</td>
<td>0.9</td>
<td>0.87</td>
<td>0.85</td>
<td>0.86</td>
<td>0.85</td>
<td>0.9</td>
</tr>
<tr>
<td/>
<td>Recall</td>
<td>0.93</td>
<td>0.84</td>
<td>0.85</td>
<td>0.82</td>
<td>0.76</td>
<td>1</td>
</tr>
<tr>
<td/>
<td>F1 score</td>
<td>0.91</td>
<td>0.85</td>
<td>0.85</td>
<td>0.84</td>
<td>0.8</td>
<td>0.94</td>
</tr>
<tr>
<td>LSTM</td>
<td>Precision</td>
<td>0.86</td>
<td>0.83</td>
<td>1</td>
<td>0.89</td>
<td>0.95</td>
<td>0.87</td>
</tr>
<tr>
<td/>
<td>Recall</td>
<td>0.94</td>
<td>0.87</td>
<td>0.89</td>
<td>0.7</td>
<td>0.83</td>
<td>1</td>
</tr>
<tr>
<td/>
<td>F1 score</td>
<td>0.9</td>
<td>0.85</td>
<td>0.94</td>
<td>0.78</td>
<td>0.88</td>
<td>0.93</td>
</tr>
<tr>
<td>Bi-LSTM</td>
<td>Precision</td>
<td>0.9</td>
<td>0.92</td>
<td>1</td>
<td>0.85</td>
<td>0.98</td>
<td>0.88</td>
</tr>
<tr>
<td/>
<td>Recall</td>
<td>0.94</td>
<td>0.89</td>
<td>0.96</td>
<td>0.8</td>
<td>0.87</td>
<td>1</td>
</tr>
<tr>
<td/>
<td>F1 score</td>
<td>0.92</td>
<td>0.91</td>
<td>0.98</td>
<td>0.82</td>
<td>0.92</td>
<td>0.94</td>
</tr>
<tr>
<td>RoBERTa</td>
<td>Precision</td>
<td>0.78</td>
<td>0.79</td>
<td>0.92</td>
<td>0.7</td>
<td>0.97</td>
<td>0.89</td>
</tr>
<tr>
<td/>
<td>Recall</td>
<td>0.87</td>
<td>0.84</td>
<td>0.81</td>
<td>0.75</td>
<td>0.67</td>
<td>0.95</td>
</tr>
<tr>
<td/>
<td>F1 score</td>
<td>0.82</td>
<td>0.81</td>
<td>0.86</td>
<td>0.73</td>
<td>0.79</td>
<td>0.92</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>Finally, to evaluate the performance of baseline models and the ensemble approach for each topic, we used different performance metrics such as precision, recall, and F1 score. The comparative values of performance metrics for each topic are shown in <xref ref-type="table" rid="table-11">Table 11</xref>. We conducted several experiments on the previous benchmark datasets to validate our proposed model in the text classification task and compared the ensemble&#x2019;s performance to the best individual baseline models. According to the Pareto principle, we divided each benchmark dataset into training and validation test sets with a ratio of 80% and 20%. The comparative result of an ensemble model on different benchmark datasets is shown in <xref ref-type="table" rid="table-12">Table 12</xref>.</p>
<table-wrap id="table-12">
<label>Table 12</label>
<caption>
<title>Comparative accuracy of proposed ensemble SABAC framework on benchmark datasets and our collected Student-COVID-19 dataset</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th></th>
<th>Baseline model</th>
<th>Voting (%)</th>
<th>Stacking (%)</th>
<th>Proposed SABAC approach (%)</th>
</tr>
</thead>
<tbody>
<tr>
<td>SemEval-2018</td>
<td>CNN &#x003D; 78.33%</td>
<td>82.45</td>
<td>83.21</td>
<td>85.42</td>
</tr>
<tr>
<td/>
<td>LSTM &#x003D; 76.75%</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td/>
<td>Bi-LSTM &#x003D; 75.23%</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td/>
<td>RoBERTa &#x003D; 86.32%</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td>20-newsgroup</td>
<td>CNN &#x003D; 82.57%</td>
<td>85.67</td>
<td>85.98</td>
<td>86.76</td>
</tr>
<tr>
<td/>
<td>LSTM &#x003D; 83.75%</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td/>
<td>Bi-LSTM &#x003D; 84.23%</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td/>
<td>RoBERTa &#x003D; 81.41%</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td>COVID19-fake</td>
<td>CNN &#x003D; 89.98%</td>
<td>87.31</td>
<td>88.41</td>
<td>88.98</td>
</tr>
<tr>
<td/>
<td>LSTM &#x003D; 87.91%</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td/>
<td>Bi-LSTM &#x003D; 90.03%</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td/>
<td>RoBERTa &#x003D; 83.51%</td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td><bold>Our dataset</bold></td>
<td><bold>CNN &#x003D; 90.15%</bold></td>
<td><bold>91.78</bold></td>
<td><bold>91.78</bold></td>
<td><bold>91.78</bold></td>
</tr>
<tr>
<td><bold>(Students-COVID-19)</bold></td>
<td><bold>LSTM &#x003D; 88.47%</bold></td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td/>
<td><bold>Bi-LSTM &#x003D; 87.03%</bold></td>
<td/>
<td/>
<td/>
</tr>
<tr>
<td/>
<td><bold>RoBERTa &#x003D; 87.32%</bold></td>
<td/>
<td/>
<td/>
</tr>
</tbody>
</table>
</table-wrap>
<p>The proposed ensemble SABAC approach results on the previous benchmark datasets and our Students-COVID-19 dataset are demonstrated in <xref ref-type="table" rid="table-12">Table 12</xref>, improving accuracy. Compared to the baseline models, the ensemble approaches improved the class prediction accuracy. Using the voting ensemble technique for final prediction, we achieved 82.45% accuracy on the SemEval-2018 dataset, 85.65% on the 20-newsgroup, 87.31% on the COVID19-Fake, and 91.31% on our collected Student-COVID dataset. Furthermore, using the stacking approach for final prediction, we achieved 83.21% accuracy on the SemEval-2018 dataset, 85.98% on the 20-newsgroup, 88.41% on the COVID19-Fake dataset, and 92.47 on our collected Student-COVID dataset. Likewise, we achieved the best results using the proposed SABAC approach in which we used ML models as meta-classifiers for final prediction, and we achieved 85.52% accuracy on the SemEval-2018 dataset, 86.76% accuracy on the 20-newsgroup, 88.98% accuracy on the COVID19-Fake dataset, and 93.21% on our collected Student-COVID-19 dataset. Moreover, <xref ref-type="fig" rid="fig-8">Fig. 8</xref> demonstrates the comparative results of used ensemble techniques on different datasets. The results reveal that the proposed SABAC framework is an improved approach that can perform robust topic extraction, annotation, and classification tasks. Finally, we compared the performance of our proposed approach with previous studies using ensemble techniques, as shown in <xref ref-type="table" rid="table-13">Table 13</xref>.</p>
<fig id="fig-8">
<label>Figure 8</label>
<caption>
<title>The comparative performance evaluation of different ensemble techniques on three benchmarks and our (Student-COVID) datasets</title>
</caption>
<graphic mimetype="image" mime-subtype="tif" xlink:href="CMC_36779-fig-8.tif"/>
</fig>
<table-wrap id="table-13">
<label>Table 13</label>
<caption>
<title>Result comparison with prior study and our proposed approach</title>
</caption>
<table frame="hsides">
<colgroup>
<col align="left"/>
<col align="left"/>
<col align="left"/>
</colgroup>
<thead>
<tr>
<th>References</th>
<th>Approach</th>
<th>Accuracy (%)</th>
</tr>
</thead>
<tbody>
<tr>
<td>[<xref ref-type="bibr" rid="ref-52">52</xref>]</td>
<td>Majority voting</td>
<td>92.21</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-53">53</xref>]</td>
<td>Aggregate</td>
<td>92.3</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-53">53</xref>]</td>
<td>AE1-WELM</td>
<td>88.4</td>
</tr>
<tr>
<td>[<xref ref-type="bibr" rid="ref-54">54</xref>]</td>
<td>Boosting</td>
<td>84.61</td>
</tr>
<tr>
<td><bold>Proposed study</bold></td>
<td><bold>SABAC approach</bold></td>
<td><bold>93.21</bold></td>
</tr>
</tbody>
</table>
</table-wrap>
</sec>
<sec id="s5">
<label>5</label>
<title>Conclusion</title>
<p>In this study, we proposed an improved text mining approach named SABAC to uncover the situational topic terms from the international students&#x2019; tweets. Our findings show that international students face uncertainty, health, financial stress, job stress, online classes stress, and returning to school-related issues. To uncover these findings, an ensemble deep learning framework is proposed and implemented in this paper. Using our proposed framework, we have performed topic modeling to extract aspect terms and performed annotation on unlabeled tweets. After labeling the unlabeled dataset, we performed classification using deep learning models using ensemble stacking and boosting techniques. We achieved 89.94% accuracy on our proposed baseline soft prediction, and performance has been enhanced using Volatile Stopwords Filtering (VSF) method. We gained promising results using our proposed SABAC &#x002B; VSF technique. We achieved 93.21% accuracy on our proposed model and compared our results with the latest reported work in the text mining domain. The study concluded that our proposed SABAC framework would help the authorities appropriately understand international students&#x2019; situational aspects and take the necessary steps for students in the COVID-19 pandemic. In future work, we will like to improve the accuracy of SABAC by handling high dimensional feature space on textual datasets transfer-learning techniques.</p>
</sec>
</body>
<back>
<sec><title>Funding Statement</title>
<p>This research work is supported by the National Natural Science Foundation of China [Grant Number: 92067106] and the Ministry of Education of the People&#x2019;s Republic of China [Grant Number: E-GCCRC20200309].</p>
</sec>
<sec sec-type="COI-statement"><title>Conflicts of Interest</title>
<p>The authors declare they have no conflicts of interest to report regarding the present study.</p>
</sec>
<ref-list content-type="authoryear">
<title>References</title>
<ref id="ref-1"><label>[1]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>B.</given-names> <surname>Kheovichai</surname></string-name> and <string-name><given-names>A. R.</given-names> <surname>Network</surname></string-name></person-group>, &#x201C;<article-title>Collocation and discursive construction of COVID-19 in WHO director general&#x2019;s discourse: A corpus-based study</article-title>,&#x201D; <source>LEARN Journal</source>, vol. <volume>15</volume>, no. <issue>1</issue>, pp. <fpage>10</fpage>&#x2013;<lpage>32</lpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-2"><label>[2]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>S.</given-names> <surname>Hussain</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Yu</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Ayoub</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Khan</surname></string-name>, <string-name><given-names>R.</given-names> <surname>Rehman</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>IoT and deep learning based approach for rapid screening and face mask detection for infection spread control of COVID-19</article-title>,&#x201D; <source>Applied Sciences</source>, vol. <volume>11</volume>, no. <issue>8</issue>, pp. <fpage>3495</fpage>, <year>2021</year>.</mixed-citation></ref>
<ref id="ref-3"><label>[3]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>S.</given-names> <surname>Praveen</surname></string-name>, <string-name><given-names>R.</given-names> <surname>Ittamalla</surname></string-name> and <string-name><given-names>G.</given-names> <surname>Deepak</surname></string-name></person-group>, &#x201C;<article-title>Analyzing Indian general public&#x2019;s perspective on anxiety, stress and trauma during COVID-19-a machine learning study of 840,000 tweets</article-title>,&#x201D; <source>Diabetes &#x0026; Metabolic Syndrome: Clinical Research &#x0026; Reviews</source>, vol. <volume>15</volume>, no. <issue>3</issue>, pp. <fpage>667</fpage>&#x2013;<lpage>671</lpage>, <year>2021</year>.</mixed-citation></ref>
<ref id="ref-4"><label>[4]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>H.</given-names> <surname>Ma</surname></string-name> and <string-name><given-names>C. J. H. C.</given-names> <surname>Miller</surname></string-name></person-group>, &#x201C;<article-title>Trapped in a double bind: Chinese overseas student anxiety during the COVID-19 pandemic</article-title>,&#x201D; <source>Health Communication</source>, vol. <volume>36</volume>, no. <issue>13</issue>, pp. <fpage>1598</fpage>&#x2013;<lpage>1605</lpage>, <year>2021</year>; <pub-id pub-id-type="pmid">32530311</pub-id></mixed-citation></ref>
<ref id="ref-5"><label>[5]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>D.</given-names> <surname>Firang</surname></string-name></person-group>, &#x201C;<article-title>The impact of COVID-19 pandemic on international students in Canada</article-title>,&#x201D; <source>International Social Work</source>, vol. <volume>63</volume>, no. <issue>6</issue>, pp. <fpage>820</fpage>&#x2013;<lpage>824</lpage>, <year>2020</year>.</mixed-citation></ref>
<ref id="ref-6"><label>[6]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>M. A.</given-names> <surname>Islam</surname></string-name>, <string-name><given-names>S. D.</given-names> <surname>Barna</surname></string-name>, <string-name><given-names>H.</given-names> <surname>Raihan</surname></string-name>, <string-name><given-names>M. N. A.</given-names> <surname>Khan</surname></string-name> and <string-name><given-names>M. T. J. P. O.</given-names> <surname>Hossain</surname></string-name></person-group>, &#x201C;<article-title>Depression and anxiety among university students during the COVID-19 pandemic in Bangladesh: A web-based cross-sectional survey</article-title>,&#x201D; <source>PLoS One</source>, vol. <volume>15</volume>, no. <issue>8</issue>, pp. <fpage>e0238162</fpage>, <year>2020</year>; <pub-id pub-id-type="pmid">32845928</pub-id></mixed-citation></ref>
<ref id="ref-7"><label>[7]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>R.</given-names> <surname>Choudaha</surname></string-name></person-group>, &#x201C;<article-title>Three waves of international student mobility (1999&#x2013;2020)</article-title>,&#x201D; <source>Studies in Higher Education</source>, vol. <volume>42</volume>, no. <issue>5</issue>, pp. <fpage>825</fpage>&#x2013;<lpage>832</lpage>, <year>2017</year>.</mixed-citation></ref>
<ref id="ref-8"><label>[8]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>E. M.</given-names> <surname>Aucejo</surname></string-name>, <string-name><given-names>J.</given-names> <surname>French</surname></string-name>, <string-name><given-names>M. P. U.</given-names> <surname>Araya</surname></string-name> and <string-name><given-names>B. J. J. O. P. E.</given-names> <surname>Zafar</surname></string-name></person-group>, &#x201C;<article-title>The impact of COVID-19 on student experiences and expectations: Evidence from a survey</article-title>,&#x201D; <source>Journal of Public Economics</source>, vol. <volume>191</volume>, no. <issue>3</issue>, pp. <fpage>104271</fpage>, <year>2020</year>; <pub-id pub-id-type="pmid">32873994</pub-id></mixed-citation></ref>
<ref id="ref-9"><label>[9]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>T.</given-names> <surname>Kaya</surname></string-name></person-group>, &#x201C;<article-title>The changes in the effects of social media use of Cypriots due to COVID-19 pandemic</article-title>,&#x201D; <source>Technology in Society</source>, vol. <volume>63</volume>, no. <issue>4</issue>, pp. <fpage>101380</fpage>, <year>2020</year>; <pub-id pub-id-type="pmid">33518848</pub-id></mixed-citation></ref>
<ref id="ref-10"><label>[10]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>A. K.</given-names> <surname>Yadav</surname></string-name></person-group>, &#x201C;<article-title>Impact of online teaching on students&#x2019; education and health in India during the pandemic of COVID-19</article-title>,&#x201D; <source>Ingenta</source>, vol. <volume>2</volume>, no. <issue>4</issue>, pp. <fpage>516</fpage>&#x2013;<lpage>520</lpage>, <year>2021</year>.</mixed-citation></ref>
<ref id="ref-11"><label>[11]</label><mixed-citation publication-type="conf-proc"><person-group person-group-type="author"><string-name><given-names>J. A.</given-names> <surname>Wahid</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Hussain</surname></string-name>, <string-name><given-names>H.</given-names> <surname>Wang</surname></string-name>, <string-name><given-names>Z.</given-names> <surname>Wu</surname></string-name>, <string-name><given-names>L.</given-names> <surname>Shi</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Aspect oriented sentiment classification of COVID-19 twitter data; an enhanced LDA based text analytic approach</article-title>,&#x201D; in <conf-name>2021 Int. Conf. on Computer Engineering and Artificial Intelligence (ICCEAI)</conf-name>, <publisher-loc>Shanghai, China</publisher-loc>, <publisher-name>IEEE</publisher-name>, pp. <fpage>271</fpage>&#x2013;<lpage>275</lpage>, <year>2021</year>. </mixed-citation></ref>
<ref id="ref-12"><label>[12]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>T.</given-names> <surname>Zhou</surname></string-name>, <string-name><given-names>T. -V. T.</given-names> <surname>Nguyen</surname></string-name>, <string-name><given-names>J.</given-names> <surname>Zhong</surname></string-name> and <string-name><given-names>J.</given-names> <surname>Liu</surname></string-name></person-group>, &#x201C;<article-title>A COVID-19 descriptive study of life after lockdown in Wuhan, China</article-title>,&#x201D; <source>Royal Society of Open Science</source>, vol. <volume>7</volume>, no. <issue>9</issue>, pp. <fpage>200705</fpage>, <year>2020</year>.</mixed-citation></ref>
<ref id="ref-13"><label>[13]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>Y.</given-names> <surname>Yu</surname></string-name>, <string-name><given-names>X.</given-names> <surname>Qin</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Hussain</surname></string-name>, <string-name><given-names>W.</given-names> <surname>Hou</surname></string-name> and <string-name><given-names>T.</given-names> <surname>Weis</surname></string-name></person-group>, &#x201C;<article-title>Pedestrian counting based on piezoelectric vibration sensor</article-title>,&#x201D; <source>Applied Sciences</source>, vol. <volume>12</volume>, no. <issue>4</issue>, pp. <fpage>1920</fpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-14"><label>[14]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>J.</given-names> <surname>Singh</surname></string-name> and <string-name><given-names>S.</given-names> <surname>Singh</surname></string-name></person-group>, &#x201C;<article-title>COVID-19 and its impact on society</article-title>,&#x201D; <source>Electronic Research Journal of Social Sciences and Humanities</source>, vol. <volume>2</volume>, no. <issue>1</issue>, pp. <fpage>168</fpage>&#x2013;<lpage>172</lpage>, <year>2020</year>.</mixed-citation></ref>
<ref id="ref-15"><label>[15]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>Y.</given-names> <surname>Zhang</surname></string-name> and <string-name><given-names>Z. F.</given-names> <surname>Ma</surname></string-name></person-group>, &#x201C;<article-title>Impact of the COVID-19 pandemic on mental health and quality of life among local residents in Liaoning Province, China: A cross-sectional study</article-title>,&#x201D; <source>International Journal of Environmental Research and Public Health</source>, vol. <volume>17</volume>, no. <issue>7</issue>, pp. <fpage>2381</fpage>, <year>2020</year>; <pub-id pub-id-type="pmid">32244498</pub-id></mixed-citation></ref>
<ref id="ref-16"><label>[16]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>N.</given-names> <surname>Bukhari</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Hussain</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Ayoub</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Yu</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Khan</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Deep learning based framework for emotion recognition using facial expression</article-title>,&#x201D; <source>Pakistan Journal of Engineering and Technology</source>, vol. <volume>5</volume>, no. <issue>3</issue>, pp. <fpage>51</fpage>&#x2013;<lpage>57</lpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-17"><label>[17]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>L.</given-names> <surname>Irfan</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Hussain</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Ayoub</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Yu</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Khan</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>A comparative analysis of social communication applications using aspect based sentiment analysis</article-title>,&#x201D; <source>Pakistan Journal of Engineering and Technology</source>, vol. <volume>5</volume>, no. <issue>3</issue>, pp. <fpage>44</fpage>&#x2013;<lpage>50</lpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-18"><label>[18]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>A.</given-names> <surname>Sahar</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Ayoub</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Hussain</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Yu</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Khan</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Transfer learning-based framework for sentiment classification of cosmetics products reviews</article-title>,&#x201D; <source>Pakistan Journal of Engineering and Technology</source>, vol. <volume>5</volume>, no. <issue>3</issue>, pp. <fpage>38</fpage>&#x2013;<lpage>43</lpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-19"><label>[19]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>A.</given-names> <surname>Gupta</surname></string-name>, <string-name><given-names>V.</given-names> <surname>Jain</surname></string-name> and <string-name><given-names>A. J. N. G. C.</given-names> <surname>Singh</surname></string-name></person-group>, &#x201C;<article-title>Stacking ensemble-based intelligent machine learning model for predicting post-COVID-19 complications</article-title>,&#x201D; <source>New Generation Computing</source>, vol. <volume>40</volume>, no. <issue>1</issue>, pp. <fpage>1</fpage>&#x2013;<lpage>21</lpage>, <year>2021</year>.</mixed-citation></ref>
<ref id="ref-20"><label>[20]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>P.</given-names> <surname>Vaishali</surname></string-name> and <string-name><given-names>P.</given-names> <surname>Kumari</surname></string-name></person-group>, &#x201C;<article-title>Ensemble learning baThe impact of policymeasures on human mobilitysed classifier to predict depression caused due to pandemic</article-title>,&#x201D; <source>Journal of Physics: Conference Series</source>, <comment>IOP Publishing</comment>, vol. <volume>2089</volume>, no. <issue>1</issue>, pp. <fpage>012026</fpage>, <year>2021</year>.</mixed-citation></ref>
<ref id="ref-21"><label>[21]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>A. S.</given-names> <surname>Imran</surname></string-name>, <string-name><given-names>S. M.</given-names> <surname>Daudpota</surname></string-name>, <string-name><given-names>Z.</given-names> <surname>Kastrati</surname></string-name> and <string-name><given-names>R. J. I. A.</given-names> <surname>Batra</surname></string-name></person-group>, &#x201C;<article-title>Cross-cultural polarity and emotion detection using sentiment analysis and deep learning on COVID-19 related tweets</article-title>,&#x201D; <source>IEEE Access</source>, vol. <volume>8</volume>, pp. <fpage>181074</fpage>&#x2013;<lpage>181090</lpage>, <year>2020</year>; <pub-id pub-id-type="pmid">34812358</pub-id></mixed-citation></ref>
<ref id="ref-22"><label>[22]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>N.</given-names> <surname>Chintalapudi</surname></string-name>, <string-name><given-names>G.</given-names> <surname>Battineni</surname></string-name> and <string-name><given-names>F. J. I. D. R.</given-names> <surname>Amenta</surname></string-name></person-group>, &#x201C;<article-title>Sentimental analysis of COVID-19 tweets using deep learning models</article-title>,&#x201D; <source>Infectious Disease Reports</source>, vol. <volume>13</volume>, no. <issue>2</issue>, pp. <fpage>329</fpage>&#x2013;<lpage>339</lpage>, <year>2021</year>; <pub-id pub-id-type="pmid">33916139</pub-id></mixed-citation></ref>
<ref id="ref-23"><label>[23]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>M. E.</given-names> <surname>Basiri</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Nemati</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Abdar</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Asadi</surname></string-name> and <string-name><given-names>U. R. J. K. -B. S.</given-names> <surname>Acharrya</surname></string-name></person-group>, &#x201C;<article-title>A novel fusion-based deep learning model for sentiment analysis of COVID-19 tweets</article-title>,&#x201D; <source>Knowledge-Based Systems</source>, vol. <volume>228</volume>, no. <issue>2020</issue>, pp. <fpage>107242</fpage>, <year>2021</year>; <pub-id pub-id-type="pmid">36570870</pub-id></mixed-citation></ref>
<ref id="ref-24"><label>[24]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>A.</given-names> <surname>Onan</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Koruko&#x011F;lu</surname></string-name> and <string-name><given-names>H. J. E. S. W. A.</given-names> <surname>Bulut</surname></string-name></person-group>, &#x201C;<article-title>A multiobjective weighted voting ensemble classifier based on differential evolution algorithm for text sentiment classification</article-title>,&#x201D; <source>Expert Systems with Applications</source>, vol. <volume>62</volume>, no. <issue>21</issue>, pp. <fpage>1</fpage>&#x2013;<lpage>16</lpage>, <year>2016</year>.</mixed-citation></ref>
<ref id="ref-25"><label>[25]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>I. E.</given-names> <surname>Livieris</surname></string-name>, <string-name><given-names>L.</given-names> <surname>Iliadis</surname></string-name> and <string-name><given-names>P. J. E. S.</given-names> <surname>Pintelas</surname></string-name></person-group>, &#x201C;<article-title>On ensemble techniques of weight-constrained neural networks</article-title>,&#x201D; <source>Evolving Systems</source>, vol. <volume>12</volume>, no. <issue>1</issue>, pp. <fpage>155</fpage>&#x2013;<lpage>167</lpage>, <year>2021</year>.</mixed-citation></ref>
<ref id="ref-26"><label>[26]</label><mixed-citation publication-type="other"><person-group person-group-type="author"><string-name><given-names>M. S.</given-names> <surname>Akhtar</surname></string-name>, <string-name><given-names>D.</given-names> <surname>Ghosal</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Ekbal</surname></string-name>, <string-name><given-names>P.</given-names> <surname>Bhattacharyya</surname></string-name> and <string-name><given-names>S. J. A. P. A.</given-names> <surname>Kurohashi</surname></string-name></person-group>, &#x201C;<article-title>A multi-task ensemble framework for emotion, sentiment and intensity prediction</article-title>,&#x201D; <comment>arXiv preprint arXiv:1808.01216</comment>, <year>2018</year>.</mixed-citation></ref>
<ref id="ref-27"><label>[27]</label><mixed-citation publication-type="conf-proc"><person-group person-group-type="author"><string-name><given-names>L.</given-names> <surname>Akhtyamova</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Ignatov</surname></string-name> and <string-name><given-names>J.</given-names> <surname>Cardiff</surname></string-name></person-group>, &#x201C;<article-title>A large-scale CNN ensemble for medication safety analysis</article-title>,&#x201D; in <conf-name>Int. Conf. on Applications of Natural Language to Information Systems</conf-name>, <publisher-loc>Saarbr&#x00FC;cken, Germany</publisher-loc>, <publisher-name>Springer</publisher-name>, pp. <fpage>247</fpage>&#x2013;<lpage>253</lpage>, <year>2017</year>. </mixed-citation></ref>
<ref id="ref-28"><label>[28]</label><mixed-citation publication-type="conf-proc"><person-group person-group-type="author"><string-name><given-names>S.</given-names> <surname>Mohammad</surname></string-name>, <string-name><given-names>F.</given-names> <surname>Bravo-Marquez</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Salameh</surname></string-name> and <string-name><given-names>S.</given-names> <surname>Kiritchenko</surname></string-name></person-group>, &#x201C;<article-title>Semeval-2018 task 1: Affect in tweets</article-title>,&#x201D; in <conf-name>Proc. of the 12th Int. Workshop on Semantic Evaluation</conf-name>, <publisher-loc> New Orleans, United States</publisher-loc>, pp. <fpage>1</fpage>&#x2013;<lpage>17</lpage>, <year>2018</year>. </mixed-citation></ref>
<ref id="ref-29"><label>[29]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>V.</given-names> <surname>Kandasamy</surname></string-name>, <string-name><given-names>P.</given-names> <surname>Trojovsk&#x00FD;</surname></string-name>, <string-name><given-names>F. A.</given-names> <surname>Machot</surname></string-name>, <string-name><given-names>K.</given-names> <surname>Kyamakya</surname></string-name>, <string-name><given-names>N.</given-names> <surname>Bacanin</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Sentimental analysis of COVID-19 related messages in social networks by involving an N-gram stacked autoencoder integrated in an ensemble learning scheme</article-title>,&#x201D; <source>Sensors</source>, vol. <volume>21</volume>, no. <issue>22</issue>, pp. <fpage>7582</fpage>, <year>2021</year>; <pub-id pub-id-type="pmid">34833656</pub-id></mixed-citation></ref>
<ref id="ref-30"><label>[30]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>M.</given-names> <surname>Ra</surname></string-name>, <string-name><given-names>B.</given-names> <surname>Ab</surname></string-name> and <string-name><given-names>S. J. G. O. R.</given-names> <surname>Kc</surname></string-name></person-group>, &#x201C;<article-title>COVID-19 outbreak: Tweet based analysis and visualization towards the influence of coronavirus in the world</article-title>,&#x201D; <source>Gedrag. Organ</source>, vol. <volume>33</volume>, pp. <fpage>8</fpage>&#x2013;<lpage>9</lpage>, <year>2020</year>.</mixed-citation></ref>
<ref id="ref-31"><label>[31]</label><mixed-citation publication-type="conf-proc"><person-group person-group-type="author"><string-name><given-names>S. D.</given-names> <surname>Das</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Basak</surname></string-name> and <string-name><given-names>S.</given-names> <surname>Dutta</surname></string-name></person-group>, &#x201C;<article-title>A heuristic-driven ensemble framework for COVID-19 fake news detection</article-title>,&#x201D; in <conf-name>Int. Workshop on Combating Online Hostile Posts in Regional Languages During Emergency Situation</conf-name>, <publisher-loc>Dublin, Ireland</publisher-loc>, <publisher-name>Springer</publisher-name>, pp. <fpage>164</fpage>&#x2013;<lpage>176</lpage>, <year>2021</year>. </mixed-citation></ref>
<ref id="ref-32"><label>[32]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>S.</given-names> <surname>Hussain</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Ayoub</surname></string-name>, <string-name><given-names>G.</given-names> <surname>Jilani</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Yu</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Khan</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Aspect2Labels: A novelistic decision support system for higher educational institutions by using multi-layer topic modelling approach</article-title>,&#x201D; <source>Expert Systems with Applications</source>, vol. <volume>209</volume>, no. <issue>1</issue>, pp. <fpage>118119</fpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-33"><label>[33]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>S.</given-names> <surname>Agarwal</surname></string-name> and <string-name><given-names>C. R.</given-names> <surname>Chowdary</surname></string-name></person-group>, &#x201C;<article-title>Combating hate speech using an adaptive ensemble learning model with a case study on COVID-19</article-title>,&#x201D; <source>Expert Systems with Applications</source>, vol. <volume>185</volume>, pp. <fpage>115632</fpage>, <year>2021</year>; <pub-id pub-id-type="pmid">36567759</pub-id></mixed-citation></ref>
<ref id="ref-34"><label>[34]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>J. A.</given-names> <surname>Wahid</surname></string-name>, <string-name><given-names>L.</given-names> <surname>Shi</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Gao</surname></string-name>, <string-name><given-names>B.</given-names> <surname>Yang</surname></string-name>, <string-name><given-names>L.</given-names> <surname>Wei</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Topic2Labels: A framework to annotate and classify the social media data through LDA topics and deep learning models for crisis response</article-title>,&#x201D; <source>Expert Systems with Applications</source>, vol. <volume>195</volume>, no. <issue>1</issue>, pp. <fpage>116562</fpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-35"><label>[35]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>K.</given-names> <surname>Chaturvedi</surname></string-name>, <string-name><given-names>D. K.</given-names> <surname>Vishwakarma</surname></string-name>, <string-name><given-names>N. J. C.</given-names> <surname>Singh</surname></string-name> and <string-name><given-names>Y. S.</given-names> <surname>Review</surname></string-name></person-group>, &#x201C;<article-title>COVID-19 and its impact on education, social life and mental health of students: A survey</article-title>,&#x201D; <source>Children and Youth Services Review</source>, vol. <volume>121</volume>, pp. <fpage>105866</fpage>, <year>2021</year>; <pub-id pub-id-type="pmid">33390636</pub-id></mixed-citation></ref>
<ref id="ref-36"><label>[36]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>Y.</given-names> <surname>Li</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Li</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Rice</surname></string-name>, <string-name><given-names>H.</given-names> <surname>Zhang</surname></string-name>, <string-name><given-names>D.</given-names> <surname>Sha</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>The impact of policy measures on human mobility, COVID-19 cases, and mortality in the US: A spatiotemporal perspective</article-title>,&#x201D; <source>Children and Youth Services Review</source>, vol. <volume>18</volume>, no. <issue>3</issue>, pp. <fpage>996</fpage>, <year>2021</year>.</mixed-citation></ref>
<ref id="ref-37"><label>[37]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>C.</given-names> <surname>Hou</surname></string-name>, <string-name><given-names>J.</given-names> <surname>Chen</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Zhou</surname></string-name>, <string-name><given-names>L.</given-names> <surname>Hua</surname></string-name>, <string-name><given-names>J.</given-names> <surname>Yuan</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>The effectiveness of quarantine of Wuhan city against the Corona Virus Disease 2019 (COVID-19): A well-mixed SEIR model analysis</article-title>,&#x201D; <source>Journal of Medical Virology</source>, vol. <volume>92</volume>, no. <issue>7</issue>, pp. <fpage>841</fpage>&#x2013;<lpage>848</lpage>, <year>2020</year>; <pub-id pub-id-type="pmid">32243599</pub-id></mixed-citation></ref>
<ref id="ref-38"><label>[38]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>K.</given-names> <surname>Kedraka</surname></string-name> and <string-name><given-names>C. J. E. J. O. E. S.</given-names> <surname>Kaltsidis</surname></string-name></person-group>, &#x201C;<article-title>Effects of the COVID-19 pandemic on university pedagogy: Students&#x2019; experiences and considerations</article-title>,&#x201D; <source>European Journal of Education Studies</source>, vol. <volume>7</volume>, no. <issue>8</issue>, pp. <fpage>17</fpage>&#x2013;<lpage>30</lpage>, <year>2020</year>.</mixed-citation></ref>
<ref id="ref-39"><label>[39]</label><mixed-citation publication-type="other"><person-group person-group-type="author"><string-name><given-names>J.</given-names> <surname>Mittelmeier</surname></string-name> and <string-name><given-names>H. J. A. A. S.</given-names> <surname>Cockayne</surname></string-name></person-group>, &#x201C;<article-title>Global depictions of international students in a time of crisis: A thematic analysis of Twitter data during COVID-19</article-title>,&#x201D; <source>International Studies in Sociology of Education</source>, vol. <volume>1</volume>, no. <issue>1</issue>, pp. <fpage>1</fpage>&#x2013;<lpage>24</lpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-40"><label>[40]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>Q.</given-names> <surname>Du</surname></string-name>, <string-name><given-names>N.</given-names> <surname>Li</surname></string-name>, <string-name><given-names>W.</given-names> <surname>Liu</surname></string-name>, <string-name><given-names>D.</given-names> <surname>Sun</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Yang</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>A topic recognition method of news text based on word embedding enhancement</article-title>,&#x201D; <source>Computational Intelligence and Neuroscience</source>, vol. <volume>2022</volume>, no. <issue>7</issue>, pp. <fpage>1</fpage>&#x2013;<lpage>15</lpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-41"><label>[41]</label><mixed-citation publication-type="book"><person-group person-group-type="author"><string-name><given-names>S.</given-names> <surname>Srivastava</surname></string-name>, <string-name><given-names>R.</given-names> <surname>Raj</surname></string-name> and <string-name><given-names>S.</given-names> <surname>Saumya</surname></string-name></person-group>, &#x201C;<chapter-title>COVID-19 fake news identification using multi-layer convolutional neural network</chapter-title>,&#x201D; in <source>Advanced Computational Paradigms and Hybrid Intelligent Computing</source>, <publisher-loc>Singapore</publisher-loc>: <publisher-name>Springer</publisher-name>, pp. <fpage>149</fpage>&#x2013;<lpage>157</lpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-42"><label>[42]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>T.</given-names> <surname>Singh</surname></string-name> and <string-name><given-names>M. J. P. C. S.</given-names> <surname>Kumari</surname></string-name></person-group>, &#x201C;<article-title>Role of text pre-processing in Twitter sentiment analysis</article-title>,&#x201D; <source>Procedia Computer Science</source>, vol. <volume>89</volume>, pp. <fpage>549</fpage>&#x2013;<lpage>554</lpage>, <year>2016</year>.</mixed-citation></ref>
<ref id="ref-43"><label>[43]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>L. K.</given-names> <surname>Shrivastav</surname></string-name> and <string-name><given-names>S. K. J. A. I.</given-names> <surname>Jha</surname></string-name></person-group>, &#x201C;<article-title>A gradient boosting machine learning approach in modeling the impact of temperature and humidity on the transmission rate of COVID-19 in India</article-title>,&#x201D; <source>Applied Intelligence</source>, vol. <volume>51</volume>, no. <issue>5</issue>, pp. <fpage>2727</fpage>&#x2013;<lpage>2739</lpage>, <year>2021</year>; <pub-id pub-id-type="pmid">34764559</pub-id></mixed-citation></ref>
<ref id="ref-44"><label>[44]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>C.</given-names> <surname>Janiesch</surname></string-name>, <string-name><given-names>P.</given-names> <surname>Zschech</surname></string-name> and <string-name><given-names>K. J. E. M.</given-names> <surname>Heinrich</surname></string-name></person-group>, &#x201C;<article-title>Machine learning and deep learning</article-title>,&#x201D; <source>Electronic Markets</source>, vol. <volume>31</volume>, no. <issue>3</issue>, pp. <fpage>685</fpage>&#x2013;<lpage>695</lpage>, <year>2021</year>.</mixed-citation></ref>
<ref id="ref-45"><label>[45]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>A.</given-names> <surname>Onan</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Koruko&#x011F;lu</surname></string-name> and <string-name><given-names>H. J. E. S. W. A.</given-names> <surname>Bulut</surname></string-name></person-group>, &#x201C;<article-title>Ensemble of keyword extraction methods and classifiers in text classification</article-title>,&#x201D; <source>Expert Systems with Applications</source>, vol. <volume>57</volume>, no. <issue>8</issue>, pp. <fpage>232</fpage>&#x2013;<lpage>247</lpage>, <year>2016</year>.</mixed-citation></ref>
<ref id="ref-46"><label>[46]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>H.</given-names> <surname>Jelodar</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Wang</surname></string-name>, <string-name><given-names>C.</given-names> <surname>Yuan</surname></string-name>, <string-name><given-names>X.</given-names> <surname>Feng</surname></string-name>, <string-name><given-names>X.</given-names> <surname>Jiang</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Latent dirichlet allocation (LDA) and topic modeling: Models, applications, a survey</article-title>,&#x201D; <source>Multimedia Tools and Applications</source>, vol. <volume>78</volume>, no. <issue>11</issue>, pp. <fpage>15169</fpage>&#x2013;<lpage>15211</lpage>, <year>2019</year>.</mixed-citation></ref>
<ref id="ref-47"><label>[47]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>D.</given-names> <surname>Maier</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Waldherr</surname></string-name>, <string-name><given-names>P.</given-names> <surname>Miltner</surname></string-name>, <string-name><given-names>G.</given-names> <surname>Wiedemann</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Niekler</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Applying LDA topic modeling in communication research: Toward a valid and reliable methodology</article-title>,&#x201D; <source>Communication Methods and Measures</source>, vol. <volume>12</volume>, no. <issue>2&#x2013;3</issue>, pp. <fpage>93</fpage>&#x2013;<lpage>118</lpage>, <year>2018</year>.</mixed-citation></ref>
<ref id="ref-48"><label>[48]</label><mixed-citation publication-type="conf-proc"><person-group person-group-type="author"><string-name><given-names>S.</given-names> <surname>Park</surname></string-name>, <string-name><given-names>D.</given-names> <surname>Lee</surname></string-name>, <string-name><given-names>J.</given-names> <surname>Choi</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Ryu</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Kim</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Hierarchical Dirichlet process topic modeling for large number of answer types classification in open domain question answering</article-title>,&#x201D; in <conf-name>Asia Information Retrieval Symp.,</conf-name> <publisher-loc>Sarawak, Malaysia</publisher-loc>, <publisher-name>Springer</publisher-name>, pp. <fpage>418</fpage>&#x2013;<lpage>428</lpage>, <year>2014</year>. </mixed-citation></ref>
<ref id="ref-49"><label>[49]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>T.</given-names> <surname>Long</surname></string-name>, <string-name><given-names>X.</given-names> <surname>Xu</surname></string-name>, <string-name><given-names>F.</given-names> <surname>Shen</surname></string-name>, <string-name><given-names>L.</given-names> <surname>Liu</surname></string-name>, <string-name><given-names>N.</given-names> <surname>Xie</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>Zero-shot learning via discriminative representation extraction</article-title>,&#x201D; <source>Pattern Recognition Letters</source>, vol. <volume>109</volume>, no. <issue>10</issue>, pp. <fpage>27</fpage>&#x2013;<lpage>34</lpage>, <year>2018</year>.</mixed-citation></ref>
<ref id="ref-50"><label>[50]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>M.</given-names> <surname>Ayoub</surname></string-name>, <string-name><given-names>S.</given-names> <surname>Hussain</surname></string-name>, <string-name><given-names>A.</given-names> <surname>Khan</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Zahid</surname></string-name>, <string-name><given-names>J. A.</given-names> <surname>Wahid</surname></string-name> <etal>et al.</etal></person-group><italic>,</italic> &#x201C;<article-title>A predictive machine learning and deep learning approach on agriculture datasets for new moringa oleifera varieties prediction</article-title>,&#x201D; <source>Pakistan Journal of Engineering and Technology</source>, vol. <volume>5</volume>, no. <issue>1</issue>, pp. <fpage>68</fpage>&#x2013;<lpage>77</lpage>, <year>2022</year>.</mixed-citation></ref>
<ref id="ref-51"><label>[51]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>B.</given-names> <surname>Jang</surname></string-name>, <string-name><given-names>M.</given-names> <surname>Kim</surname></string-name>, <string-name><given-names>G.</given-names> <surname>Harerimana</surname></string-name>, <string-name><given-names>S. -U</given-names> <surname>Kang</surname></string-name> and <string-name><given-names>J. W. J. A. S.</given-names> <surname>Kim</surname></string-name></person-group>, &#x201C;<article-title>Bi-LSTM model to increase accuracy in text classification: Combining Word2vec CNN and attention mechanism</article-title>,&#x201D; <source>Applied Sciences</source>, vol. <volume>10</volume>, no. <issue>17</issue>, pp. <fpage>5841</fpage>, <year>2020</year>.</mixed-citation></ref>
<ref id="ref-52"><label>[52]</label><mixed-citation publication-type="conf-proc"><person-group person-group-type="author"><string-name><given-names>A.</given-names> <surname>Elnagar</surname></string-name>, <string-name><given-names>O.</given-names> <surname>Einea</surname></string-name> and <string-name><given-names>R.</given-names> <surname>Al-Debsi</surname></string-name></person-group>, &#x201C;<article-title>Automatic text tagging of Arabic news articles using ensemble deep learning models</article-title>,&#x201D; in <conf-name>Proc. of the 3rd Int. Conf. on Natural Language and Speech Processing</conf-name>, <publisher-loc>Trento, Italy</publisher-loc>, pp. <fpage>59</fpage>&#x2013;<lpage>66</lpage>, <year>2019</year>. </mixed-citation></ref>
<ref id="ref-53"><label>[53]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>M.</given-names> <surname>Kang</surname></string-name>, <string-name><given-names>J.</given-names> <surname>Ahn</surname></string-name> and <string-name><given-names> K. J. E. S. W. A.</given-names> <surname>Lee</surname></string-name></person-group>, &#x201C;<article-title>Opinion mining using ensemble text hidden Markov models for text classification</article-title>,&#x201D; <source>Expert Systems with Applications</source>, vol. <volume>94</volume>, no. <issue>6</issue>, pp. <fpage>218</fpage>&#x2013;<lpage>227</lpage>, <year>2018</year>.</mixed-citation></ref>
<ref id="ref-54"><label>[54]</label><mixed-citation publication-type="journal"><person-group person-group-type="author"><string-name><given-names>K.</given-names> <surname>Zeng</surname></string-name>, <string-name><given-names>Z.</given-names> <surname>Pan</surname></string-name>, <string-name><given-names>Y.</given-names> <surname>Xu</surname></string-name> and <string-name><given-names>Y.</given-names> <surname>Qu</surname></string-name></person-group>, &#x201C;<article-title>An ensemble learning strategy for eligibility criteria text classification for clinical trial recruitment: Algorithm development and validation</article-title>,&#x201D; <source>JMIR Medical Informatics</source>, vol. <volume>8</volume>, no. <issue>7</issue>, pp. <fpage>e17832</fpage>, <year>2020</year>; <pub-id pub-id-type="pmid">32609092</pub-id></mixed-citation></ref>
</ref-list>
</back>
</article>