<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.3 20070202//EN" "journalpublishing.dtd">
<?covid-19-tdm?>
<article article-type="other" dtd-version="2.3" xml:lang="EN" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink">
<front>
<journal-meta>
<journal-id journal-id-type="publisher-id">Int J Public Health</journal-id>
<journal-title>International Journal of Public Health</journal-title>
<abbrev-journal-title abbrev-type="pubmed">Int J Public Health</abbrev-journal-title>
<issn pub-type="epub">1661-8564</issn>
<publisher>
<publisher-name>Frontiers Media S.A.</publisher-name>
</publisher>
</journal-meta>
<article-meta>
<article-id pub-id-type="publisher-id">1604658</article-id>
<article-id pub-id-type="doi">10.3389/ijph.2022.1604658</article-id>
<article-categories>
<subj-group subj-group-type="heading">
<subject>Public Health Archive</subject>
<subj-group>
<subject>Original Article</subject>
</subj-group>
</subj-group>
</article-categories>
<title-group>
<article-title>Public Attitudes During the Second Lockdown: Sentiment and Topic Analyses Using Tweets From Ontario, Canada</article-title>
<alt-title alt-title-type="left-running-head">Tsao et&#x20;al.</alt-title>
<alt-title alt-title-type="right-running-head">Canadian Attitudes During Second Lockdown</alt-title>
</title-group>
<contrib-group>
<contrib contrib-type="author">
<name>
<surname>Tsao</surname>
<given-names>Shu-Feng</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1580264/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>MacLean</surname>
<given-names>Alexander</given-names>
</name>
<xref ref-type="aff" rid="aff2">
<sup>2</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1674315/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Chen</surname>
<given-names>Helen</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1059723/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Li</surname>
<given-names>Lianghua</given-names>
</name>
<xref ref-type="aff" rid="aff3">
<sup>3</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1664196/overview"/>
</contrib>
<contrib contrib-type="author">
<name>
<surname>Yang</surname>
<given-names>Yang</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1595688/overview"/>
</contrib>
<contrib contrib-type="author" corresp="yes">
<name>
<surname>Butt</surname>
<given-names>Zahid Ahmad</given-names>
</name>
<xref ref-type="aff" rid="aff1">
<sup>1</sup>
</xref>
<xref ref-type="corresp" rid="c001">&#x2a;</xref>
<uri xlink:href="https://loop.frontiersin.org/people/1077068/overview"/>
</contrib>
</contrib-group>
<aff id="aff1">
<sup>1</sup>
<institution>School of Public Health Sciences</institution>
<institution>University of Waterloo</institution>, <addr-line>Waterloo</addr-line>, <addr-line>ON</addr-line>, <country>Canada</country>
</aff>
<aff id="aff2">
<sup>2</sup>
<institution>Systems Design Engineering</institution>, <institution>University of Waterloo</institution>, <addr-line>Waterloo</addr-line>, <addr-line>ON</addr-line>, <country>Canada</country>
</aff>
<aff id="aff3">
<sup>3</sup>
<institution>Faculty of Science</institution>, <institution>University of Waterloo</institution>, <addr-line>Waterloo</addr-line>, <addr-line>ON</addr-line>, <country>Canada</country>
</aff>
<author-notes>
<fn fn-type="edited-by">
<p>
<bold>Edited by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1261362/overview">L. Suzanne Suggs</ext-link>, University of Italian Switzerland, Switzerland</p>
</fn>
<fn fn-type="edited-by">
<p>
<bold>Reviewed by:</bold> <ext-link ext-link-type="uri" xlink:href="https://loop.frontiersin.org/people/1610885/overview">Yana Samuel</ext-link>, Northeastern University, United&#x20;States</p>
</fn>
<corresp id="c001">&#x2a;Correspondence: Zahid Ahmad Butt, <email>zahid.butt@uwaterloo.ca</email>
</corresp>
</author-notes>
<pub-date pub-type="epub">
<day>21</day>
<month>02</month>
<year>2022</year>
</pub-date>
<pub-date pub-type="collection">
<year>2022</year>
</pub-date>
<volume>67</volume>
<elocation-id>1604658</elocation-id>
<history>
<date date-type="received">
<day>30</day>
<month>11</month>
<year>2021</year>
</date>
<date date-type="accepted">
<day>03</day>
<month>02</month>
<year>2022</year>
</date>
</history>
<permissions>
<copyright-statement>Copyright &#xa9; 2022 Tsao, MacLean, Chen, Li, Yang and Butt.</copyright-statement>
<copyright-year>2022</copyright-year>
<copyright-holder>Tsao, MacLean, Chen, Li, Yang and Butt</copyright-holder>
<license xlink:href="http://creativecommons.org/licenses/by/4.0/">
<p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (CC BY). The use, distribution or reproduction in other forums is permitted, provided the original author(s) and the copyright owner(s) are credited and that the original publication in this journal is cited, in accordance with accepted academic practice. No use, distribution or reproduction is permitted which does not comply with these&#x20;terms.</p>
</license>
</permissions>
<abstract>
<p>
<bold>Objective:</bold> This study aimed to explore topics and sentiments using tweets from Ontario, Canada, during the second wave of the COVID-19 pandemic.</p>
<p>
<bold>Methods:</bold> Tweets were collected from December 5, 2020, to March 6, 2021, excluding non-individual accounts. Dates of vaccine-related events and policy changes were collected from public health units in Ontario. The daily number of COVID-19 cases was retrieved from the Ontario provincial government&#x2019;s public health database. Latent Dirichlet Allocation was used for unsupervised topic modelling. VADER was used to calculate daily and average sentiment compound scores for topics identified.</p>
<p>
<bold>Results:</bold> Vaccine, pandemic, business, lockdown, mask, and Ontario were six topics identified from the unsupervised topic modelling. The average sentiment compound score for each topic appeared to be slightly positive, yet the daily sentiment compound scores varied greatly between positive and negative emotions for each&#x20;topic.</p>
<p>
<bold>Conclusion:</bold> Our study results have shown a slightly positive sentiment on average during the second wave of the COVID-19 pandemic in Ontario, along with six topics. Our research has also demonstrated a social listening approach to identify what the public sentiments and opinions are in a timely manner.</p>
</abstract>
<kwd-group>
<kwd>social media</kwd>
<kwd>COVID-19</kwd>
<kwd>sentiment analysis</kwd>
<kwd>lockdown</kwd>
<kwd>topic modelling</kwd>
<kwd>mask</kwd>
<kwd>vaccine</kwd>
</kwd-group>
</article-meta>
</front>
<body>
<sec id="s1">
<title>Introduction</title>
<p>The Coronavirus disease (COVID-19) pandemic has persisted for more than a year and resulted in over 141 million infections with over 3 million deaths worldwide [<xref ref-type="bibr" rid="B1">1</xref>]. In Canada, it has led to over 1 million positive cases and caused more than 24,000 deaths [<xref ref-type="bibr" rid="B2">2</xref>]. During this global crisis, when people have been forced to stay at home and connect virtually, social media platforms have played an increasingly significant role in communications now more than ever before. Therefore, social media data, such as tweets, have become even more important in health research associated with the current pandemic. Understanding public discourses and sentiments from social media data has been critical for researchers and decision makers since it correlates with our behaviours that help or fail to eliminate the COVID-19 infections. Scholars have conducted various topic modelling and sentiment analysis to understand public concerns or attitudes toward the pandemic and public health measures, such as mask wearing, handwashing, travel restrictions, and lockdowns since the early pandemic [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>]. For example, Abd-Alrazaq et&#x20;al identified 10 themes with positive sentiments and two topics with negative sentiments from 2.8 million English tweets between February 2 and March 15, 2020 [<xref ref-type="bibr" rid="B3">3</xref>]. Furthermore, Boon-Itt and Skunkan found topics changed over time, but negative sentiments persisted when analyzing almost 11 million English tweets from December 13, 2019, to March 9, 2020 [<xref ref-type="bibr" rid="B4">4</xref>]. Similarly, Chandrasekaran et&#x20;al. collected 13.9 million English tweets posted by individuals between January 1 and May 9, 2020. 
Their findings show a consistent negative sentiment towards topics related to the spread and growth of COVID-19, origin of virus, political perspectives, and racial discrimination, whereas sentiments toward topics associated with preventive measures and treatments, economic impacts, government implementations, healthcare industry changed from negative to positive [<xref ref-type="bibr" rid="B5">5</xref>]. Additionally, Valdez et&#x20;al. collected 86 million English tweets from the United&#x20;States (US) between January 22 and April 9, 2020 and found the number of tweets and ranking of eight identified topics&#x2014;&#x201c;China, Trump, US, lockdown, pandemic, social distancing, home, deaths&#x201d;&#x2014;rose and fell over time with the overall sentiment steadily shifting from negative to positive&#x20;[<xref ref-type="bibr" rid="B6">6</xref>].</p>
<p>Machine learning (ML) techniques have been applied to such research in topic modelling and sentiment analysis. For instance, Latent Dirichlet Allocation (LDA) is commonly applied to topic modelling, and Valence Aware Dictionary and sEntiment Reasoner (VADER) is widely used for sentiment analysis [<xref ref-type="bibr" rid="B4">4</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>]. LDA identifies topics from documents by classifying relevant individual words or phrases together modelled by Dirichlet distributions [<xref ref-type="bibr" rid="B7">7</xref>]. VADER is a lexicon and rule-based sentiment analysis tool that classifies words as positive or negative [<xref ref-type="bibr" rid="B8">8</xref>]. Such advanced ML approaches have gained popularity among quantitative studies in which scholars analyze a large volume of social media data. For example, the World Health Organization (WHO) has developed an Early AI-supported Response with Social Listening (EARS) to understand the public discourses in different countries with data from social media and Internet search queries using a semi-supervised ML algorithm&#x20;[<xref ref-type="bibr" rid="B9">9</xref>].</p>
<p>Social media and Internet query data have also been used to predict the number of COVID-19 cases [<xref ref-type="bibr" rid="B10">10</xref>&#x2013;<xref ref-type="bibr" rid="B13">13</xref>], especially in China, where about 1 billion of its 1.4 billion population have access to the Internet and social media [<xref ref-type="bibr" rid="B14">14</xref>]. Although methods to construct predictive models vary across these studies, researchers, in general, can correctly predict the number of COVID-19 cases in China 6&#x2013;14&#xa0;days before these cases are officially confirmed by lab tests [<xref ref-type="bibr" rid="B9">9</xref>&#x2013;<xref ref-type="bibr" rid="B11">11</xref>]. On the other hand, Shen et&#x20;al. found a ratio of 1:4 between the number of cases and social posts in Wuhan, China [<xref ref-type="bibr" rid="B13">13</xref>]. Additionally, social media data with self-disclosed geolocations have been used to explore the public adherence to social distancing to eliminate the COVID transmissions [<xref ref-type="bibr" rid="B15">15</xref>, <xref ref-type="bibr" rid="B16">16</xref>] or the spread of the pandemic [<xref ref-type="bibr" rid="B17">17</xref>,&#x20;<xref ref-type="bibr" rid="B18">18</xref>].</p>
<p>Although recent literature has demonstrated the utility of social media data for various research, unsupervised ML approaches have not been studied as extensively as supervised ML techniques. In other words, data collection in current literature is conducted with pre-identified keywords or hashtags of research interest, and these pre-defined keywords have also been used as criteria for topic classifications [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>, <xref ref-type="bibr" rid="B10">10</xref>&#x2013;<xref ref-type="bibr" rid="B18">18</xref>]. In addition, each country has its unique context that may not be reflected in global studies as scholars have collected and analyzed social media data limited to English but not to specific countries. In Canada, the second wave of the COVID-19 pandemic occurred from December 5, 2020, to March 6, 2021, and Ontario implemented its second lockdown between December 26, 2020, and January 2021. Mask-wearing was mandated after the province moved out of the lockdown. However, in the United&#x20;States (US), lockdowns were rarely implemented throughout the pandemic, except in New York and California. Furthermore, mask-wearing wasn&#x2019;t mandated. Jang et&#x20;al. compared tweets from Canada with those from the US and found that while Canadians shared some similar topics with Americans in factors associated with COVID-19 transmissions, US president, and Wuhan initial outbreak, Canadians expressed appreciation and border restrictions for travel, whereas Americans discussed the similarity between COVID-19 and influenza and lockdown impacts [<xref ref-type="bibr" rid="B19">19</xref>]. In the case of face mask-wearing, people in Asian countries have higher adherence to wearing masks as recommended by public health authorities than those in western culture&#x20;[<xref ref-type="bibr" rid="B20">20</xref>].</p>
<p>While LDA and VADER have been commonly used for topic modelling and sentiment analysis, respectively, deep learning techniques, such as Long Short-Term Memory (LSTM) and Bidirectional Encoder Representations from Transformers (BERT), have become more successful and have been adopted in more recent literature for sentiment analysis [<xref ref-type="bibr" rid="B21">21</xref>&#x2013;<xref ref-type="bibr" rid="B24">24</xref>]. For example, Chandra and Krishna [<xref ref-type="bibr" rid="B21">21</xref>] used deep learning models for COVID-19 tweet sentiment analysis in India from March to September 2021. The study classified 11 more granular emotions rather than the three general sentiments (i.e.,&#x20;positive, negative, and neutral) from the conventional VADER [<xref ref-type="bibr" rid="B21">21</xref>]. Similarly, Imran et&#x20;al. [<xref ref-type="bibr" rid="B22">22</xref>] used a supervised multi-layer LSTM to classify and compare six emotions across Pakistan, India, Norway, Sweden, Canada, and the US [<xref ref-type="bibr" rid="B22">22</xref>]. Das and Kolya [<xref ref-type="bibr" rid="B23">23</xref>] also proposed a supervised deep convolutional neural network (CNN) to evaluate sentiments and predict COVID-19 cases globally since data were retrieved from 15 countries [<xref ref-type="bibr" rid="B23">23</xref>]. Yet they classified emotions expressed in tweets only as either positive or negative [<xref ref-type="bibr" rid="B23">23</xref>]. However, deep learning techniques still have some limitations. For instance, the deep learning techniques demonstrated in existing literature have been applied in a supervised manner, and this requires large and correctly labelled training datasets [<xref ref-type="bibr" rid="B22">22</xref>&#x2013;<xref ref-type="bibr" rid="B24">24</xref>]. 
Interpretability is another issue because public health professionals may not have deep understanding of deep learning models, which have been more complicated than conventional LDA and VADER. In other words, although deep learning has more optimal performance than conventional techniques, it has been a &#x201c;black box&#x201d; viewed by many public health professionals [<xref ref-type="bibr" rid="B24">24</xref>]. Additionally, compared to conventional methods, deep learning techniques generally require more computing power, leading to limited implementation in practice.</p>
<p>On the other hand, most studies conducted in the first wave analyzed data with a relatively shorter time frame, several weeks or 1&#xa0;month, for example [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>]. Furthermore, the existing literature still lacks follow-up research to investigate how sentiments and topics have changed over time after the first wave of the COVID-19 pandemic in Canada. Moreover, given Canada&#x2019;s cultural diversity and the greater autonomy of the provinces relative to the federal government, each province has tackled the pandemic differently in Canada. It is of our research interest to investigate at a more focused, local level. Therefore, this study aimed to apply an unsupervised ML approach with minimal manual validations to explore both topics and corresponding sentiments using tweets from Ontario, Canada, from December 5, 2020, to March 6,&#x20;2021.</p>
</sec>
<sec sec-type="methods" id="s2">
<title>Methods</title>
<sec id="s2-1">
<title>Tweet Collection</title>
<p>English tweets originated in Ontario, Canada, were collected between December 5, 2020, and March 6, 2021, without being filtered by COVID-19 related keywords or hashtags. This is because our study aimed to apply an unsupervised ML approach to identify possible patterns beyond those explicitly mentioning COVID-19 related keywords or hashtags. Instead, major metropolitan areas in Ontario, namely geolocation tags from Toronto and Ottawa, were identified to limit the scope of data collection to a level allowed by available resources. With these query parameters limited to two cities and the timeframe, 569,467 tweets from Toronto and 141,469 tweets from Ottawa were returned from December 5, 2020, to March 6, 2021, <italic>via</italic> the Twitter Developer API&#x20;[<xref ref-type="bibr" rid="B25">25</xref>].</p>
</sec>
<sec id="s2-2">
<title>Public Health Policy Data Collection</title>
<p>Data were collected on Ontario public health policy changes by each public health unit as a means of comparison against daily case changes and Twitter sentiment from December 5, 2020, to March 6, 2021. Public health policy changes include major vaccine approvals, lockdown announcements, school closures and other public health related enforcement of policies regarding COVID-19 by reviewing each public health unit&#x2019;s COVID-19 information page within the applicable regions.</p>
</sec>
<sec id="s2-3">
<title>Daily Case Count Collection</title>
<p>The daily case counts of all public health units in Ontario from December 5, 2020, to March 6, 2021 were retrieved from the Ontario provincial government&#x2019;s public health database. The extracted data were organized by active cases, resolved cases, and deaths as defined by the Government of Ontario&#x2019;s health&#x20;unit.</p>
</sec>
<sec id="s2-4">
<title>Data Processing</title>
<p>
<xref ref-type="fig" rid="F1">Figure&#x20;1</xref> shows the overall flow diagram. All tweets were transformed to lowercase. Next, non-texts were removed, including punctuations (&#x201c;[&#x201d;, &#x201c;]&#x201d;, &#x201c;,&#x201d;, &#x201c;\&#x201d;, &#x201c;.&#x201d;, &#x201c;:&#x201d;, &#x201c;!&#x201d;, &#x201c;/&#x201d;), special characters (&#x201c;&#x23;&#x201d;, &#x201c;%&#x201d;, &#x201c;$&#x201d;, &#x201c;@&#x201d;), uniform resource locator (URL), emoji, and stop words following standard data preprocessing procedure as previous studies [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>]. Unsupervised LDA topic modelling was firstly applied by using Python&#x2019;s Gensim package to generate potential keywords for each identified topic in previous literature [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>]. Three researchers&#x2014;S-FT, HC, and ZB&#x2014;then reviewed the preliminary keywords for each topic generated by the unsupervised topic modelling to collaboratively interpret topics for further data cleansing before conducting the sentiment analysis. All disagreements were resolved through discussions among the three researchers. To reduce noise irrelevant to the pandemic, such as the 2020 United&#x20;States presidential election, from the sample and to better understand the sentiment around various components of the public discourses in Ontario, Canada, the full dataset was further filtered down, and a subset was created by using the topics and keywords identified. The filtering was done by searching for substrings in a tweet matching one of the keywords for a given topic. In addition, to ensure that the sentiment score reflects public sentiment as closely as possible, emojis were added back to the tweets since VADER can recognise them when calculating sentiment scores [<xref ref-type="bibr" rid="B8">8</xref>]. 
Furthermore, tweets from public health agencies, government agencies, and political organizations were excluded from the subset as described in a previous study&#x20;[<xref ref-type="bibr" rid="B26">26</xref>].</p>
<fig id="F1" position="float">
<label>FIGURE 1</label>
<caption>
<p>Flow diagram [Public Attitudes during the Second Lockdown: Sentiment and Topic Analyses using Tweets from Ontario, Canada, Canada, 2020].</p>
</caption>
<graphic xlink:href="ijph-67-1604658-g001.tif"/>
</fig>
<p>VADER is used to identify sentiment as it calculates the sentiment attached to individual tokens in text and is adjusted to understand specific tokens commonly used in English social media text [<xref ref-type="bibr" rid="B8">8</xref>]. For each tweet, VADER provides an empirically found sentiment value for individual terms, emoticons, and punctuation marks, modified by defined rules for combinations of terms. From these values, a compound overall sentiment score is calculated by taking the sum of the individual sentiments, with positive values for positive sentiments and negative values for negative ones. This raw score is normalized using the equation <inline-formula id="inf1">
<mml:math id="m1">
<mml:mrow>
<mml:mi>C</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>m</mml:mi>
<mml:mi>p</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>u</mml:mi>
<mml:mi>n</mml:mi>
<mml:mi>d</mml:mi>
<mml:mo>&#x3d;</mml:mo>
<mml:mo>&#xa0;</mml:mo>
<mml:mfrac>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>w</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
<mml:mi>e</mml:mi>
</mml:mrow>
<mml:mrow>
<mml:msqrt>
<mml:mrow>
<mml:mi>R</mml:mi>
<mml:mi>a</mml:mi>
<mml:mi>w</mml:mi>
<mml:mi>S</mml:mi>
<mml:mi>c</mml:mi>
<mml:mi>o</mml:mi>
<mml:mi>r</mml:mi>
<mml:msup>
<mml:mi>e</mml:mi>
<mml:mn>2</mml:mn>
</mml:msup>
<mml:mo>&#x2b;</mml:mo>
<mml:mi>&#x3b1;</mml:mi>
</mml:mrow>
</mml:msqrt>
</mml:mrow>
</mml:mfrac>
</mml:mrow>
</mml:math>
</inline-formula>, where &#x3b1; is set to the value of 15 based on the maximum values seen by the authors in training sets and then normalized to ensure that the normalized value is indeed between &#x2212;1 and &#x2b;1 [<xref ref-type="bibr" rid="B8">8</xref>]. The compound score was therefore used for our sentiment analysis. However, it is difficult for humans to understand numeric sentiment scores. Therefore, the compound sentiment scores are categorized as &#x201c;positive&#x201d; if they are equal to or greater than &#x2b;0.05, &#x201c;negative&#x201d; if they are equal to or lower than &#x2212;0.05, and &#x201c;neutral&#x201d; if neither, based on prior research&#x20;[<xref ref-type="bibr" rid="B27">27</xref>].</p>
</sec>
<sec id="s2-5">
<title>Manual Validation</title>
<p>To determine the accuracy of the unsupervised LDA topic modelling and sentiment analysis, three researchers&#x2014;S-FT, HC, and ZB&#x2014;conducted inter-rater manual validations for 3% of random tweets from each topic and their sentiment. S-FT was the primary rater, and HC and ZB served as secondary raters. The 3% random sample was calculated according to Krippendorff&#x2019;s sampling method with 10% probability of the rarest relevant instances and 95% desired significance level of the answers to our research question [<xref ref-type="bibr" rid="B28">28</xref>]. Inter-rater agreement percentage and validation results were reported in Supplement&#x20;A.</p>
</sec>
</sec>
<sec sec-type="results" id="s3">
<title>Results</title>
<p>
<xref ref-type="table" rid="T1">Table&#x20;1</xref> shows the topics given by the unsupervised LDA topic modelling. These topics were chosen based on the research questions, i.e. public sentiment with regard to lockdown policies and researchers&#x2019; interpretations with corresponding keywords and synonyms from each topic&#x2019;s keyword outputs generated by the unsupervised LDA topic modelling and manual validation.</p>
<table-wrap id="T1" position="float">
<label>TABLE 1</label>
<caption>
<p>Topics, keywords, and synonyms generated from the unsupervised LDA [Public Attitudes during the Second Lockdown: Sentiment and Topic Analyses using Tweets from Ontario, Canada, Canada, 2020].</p>
</caption>
<table>
<thead valign="top">
<tr>
<th align="left">Topics</th>
<th align="center">Human interpretations</th>
<th align="center">Keywords and synonyms</th>
<th align="center">Number of tweets included</th>
</tr>
</thead>
<tbody valign="top">
<tr>
<td align="left">Vaccine</td>
<td align="left">Opinions toward COVID-19 vaccine approval, access, availability, etc.</td>
<td align="left">vaccine, vaccinations, vaccination, vaccines, vaccinated, immunization</td>
<td align="center">6,932</td>
</tr>
<tr>
<td align="left">Pandemic</td>
<td align="left">Impacts of the COVID-19 on life</td>
<td align="left">pandemic, covid-19, covid19, covid 19, covid_19, covid, sars, coronavirus, corona virus, corona, sars-cov-2, outbreak, cases</td>
<td align="center">17,285</td>
</tr>
<tr>
<td align="left">Business</td>
<td align="left">Reviews, supports, and impacts of the COVID-19 pandemic on businesses, markets, and economics</td>
<td align="left">business, binesses, biness, businesses, biz</td>
<td align="center">5,148</td>
</tr>
<tr>
<td align="left">Lockdown</td>
<td align="left">Opinions toward the second lockdown</td>
<td align="left">lockdown, lockdowns, lock down, shutdown, shut down, shutdowns, grey zone</td>
<td align="center">4,884</td>
</tr>
<tr>
<td align="left">Mask</td>
<td align="left">Opinions toward wearing masks</td>
<td align="left">mask, wearing, wear, face cover, facial cover, facemasking, face mask, masks, maskwearing</td>
<td align="center">6,893</td>
</tr>
<tr>
<td align="left">Ontario</td>
<td align="left">Things that happened in Ontario</td>
<td align="left">fordnation, ford, ontario</td>
<td align="center">25,401</td>
</tr>
</tbody>
</table>
</table-wrap>
<p>The numbers of active COVID-19 cases and deaths between December 5, 2020, and March 6, 2021, in Toronto and Ottawa, Ontario, are shown in <xref ref-type="fig" rid="F2">Figure&#x20;2</xref>. <xref ref-type="fig" rid="F3">Figure&#x20;3</xref> demonstrates the sentiment score for each identified topic altogether. Compound sentiment scores for each topic in Ontario are shown in <xref ref-type="sec" rid="s9">Supplementary Figures S4&#x2013;S9</xref> in Supplement B, with purple lines representing vaccine events, orange lines indicating policy change events, and red lines demonstrating extended lockdown in Toronto and Peel regions. The light green line shows the mean compound sentiment score for that topic on a particular day, while the dark green line shows the sentiment score smoothed by averaging using an 11-day rolling window. Examples of positive and negative tweets for each topic are shown in <xref ref-type="sec" rid="s9">Supplementary Tables S2&#x2013;S7</xref> in Supplement&#x20;C.</p>
<fig id="F2" position="float">
<label>FIGURE 2</label>
<caption>
<p>COVID-19 cases in Toronto and Ottawa [Public Attitudes during the Second Lockdown: Sentiment and Topic Analyses using Tweets from Ontario, Canada, Canada, 2020].</p>
</caption>
<graphic xlink:href="ijph-67-1604658-g002.tif"/>
</fig>
<fig id="F3" position="float">
<label>FIGURE 3</label>
<caption>
<p>The overall sentiment compound score [Public Attitudes during the Second Lockdown: Sentiment and Topic Analyses using Tweets from Ontario, Canada, Canada, 2020].</p>
</caption>
<graphic xlink:href="ijph-67-1604658-g003.tif"/>
</fig>
<p>The average sentiment compound score for the topic &#x201c;lockdown&#x201d; (in Supplement B <xref ref-type="sec" rid="s9">Supplementary Figure S4</xref>) started neutral but remained slightly positive afterwards. It went up during the Christmas 2020 break and went down after the second provincial emergency was declared.</p>
<p>The average sentiment compound score for the topic &#x201c;mask&#x201d; (in Supplement B <xref ref-type="sec" rid="s9">Supplementary Figure S5</xref>) has remained slightly positive during the study period. Similar to the previous topic, the score went up during the Christmas 2020 break and also spiked after the AstraZeneca vaccine was approved in Canada, but it went down shortly afterwards.</p>
<p>The average sentiment compound score for the topic &#x201c;Ontario&#x201d; (in Supplement B <xref ref-type="sec" rid="s9">Supplementary Figure S6</xref>) has overall remained slightly positive during the study period, while it consistently declined and plateaued until the second state of emergency&#x20;ended.</p>
<p>The average sentiment compound score for the topic &#x201c;pandemic&#x201d; (in Supplement B <xref ref-type="sec" rid="s9">Supplementary Figure S7</xref>) has been almost neutral over time. However, the score especially decreased after the Pfizer vaccines were delayed and toward the end of the study period.</p>
<p>The average sentiment compound score for the topic &#x201c;vaccine&#x201d; (in Supplement B <xref ref-type="sec" rid="s9">Supplementary Figure S8</xref>) began relatively more positive but went down quickly afterwards. It went up shortly before the Christmas 2020 break but declined and plateaued after&#x20;that.</p>
<p>Like the &#x201c;vaccine&#x201d; topic, the average sentiment compound score for the topic &#x201c;business&#x201d; (in Supplement B <xref ref-type="sec" rid="s9">Supplementary Figure S9</xref>) started positively but stably dropped afterwards until around January 24, 2021, when the COVID-19 case counts were relatively lower (<xref ref-type="fig" rid="F2">Figure&#x20;2</xref>). Interestingly, the average sentiment compound score of the topic &#x201c;business&#x201d; was slightly more positive than all the other topics. However, businesses should have been negatively impacted by the lockdown.</p>
</sec>
<sec sec-type="discussion" id="s4">
<title>Discussion</title>
<p>Surprisingly, though understandably, there was no obvious correlation between sentiments and cases or key events on average; the pandemic had already lasted over 6&#xa0;months when Ontario, Canada, declared its second provincial emergency and lockdown. Sentiments were more related to holidays as positivity was higher from Christmas 2020 to New Year&#x2019;s Day 2021, although the second provincial shutdown kicked in on December 26, 2020. As <xref ref-type="table" rid="T1">Table&#x20;1</xref> shows, the &#x201c;Ontario&#x201d; topic includes the highest number of tweets, followed by the &#x201c;pandemic&#x201d; topic. Regardless of vaccine or policy events, the average sentiment compound score during the studied period appeared to be slightly positive across all topics of interest, with daily sentiment compound scores varying greatly between positive and negative emotions (<xref ref-type="sec" rid="s9">Supplementary Figures S4&#x2013;S9</xref>). Positive sentiments spiked on December 25, 2020 (Christmas). However, when the second province-wide lockdown began on December 26, 2020, the sentiment scores went downward regardless of topics. In other words, during the second provincial lockdown, there were weak correlations between sentiment scores and vaccine or policy events.</p>
<p>Positive sentiments across topics are mainly associated with holidays and support for the recommended public health practices such as wearing masks and vaccinations. In contrast, negative sentiment across topics largely reflected frustrations and blame on incompetent political leadership. It is also interesting to observe that Greg Abbott, Texas Governor in the United&#x20;States, was negatively discussed on Twitter among Canadian users when he lifted the mask mandate in Texas on March 2, 2021 [<xref ref-type="bibr" rid="B29">29</xref>]. He was a major subject for several days for &#x201c;business&#x201d; and &#x201c;mask&#x201d; topics.</p>
<p>We did not expect the unsupervised LDA approach for topic modelling to show very limited interpretability in our study. In <xref ref-type="table" rid="T1">Table&#x20;1</xref>, we identified just 66,543 out of 710,936 (9.36%) tweets that can be understood and grouped into six meaningful topics related to our research questions. While we anticipated that the unsupervised ML approach would not generate results as meaningful as supervised ML techniques in previous studies [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>], we did not foresee such restricted interpretability. Therefore, for future studies, we recommend collecting more data and more thorough data preprocessing to achieve higher data quality to train the unsupervised algorithm and avoid &#x201c;garbage in, garbage out.&#x201d; Additionally, for future sentiment analysis, it would be better if emojis could be included to further improve the sentiment scores with a caution that emoji usage can be culturally sensitive in a multicultural country like Canada.</p>
<p>Most existing studies used tweets no later than August 2020, when the first wave of the COVID-19 pandemic was over. In addition, most countries had several lockdowns during the first wave [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>]. However, in contrast to previous studies showing consistently negative sentiments during the first wave [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>], our tweets showed that Ontarians had a slightly positive sentiment on average during the second wave in Canada. Unlike previous studies [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>], symptoms, severity, and/or spread of COVID-19 pandemic are no longer major topics in our sample, demonstrating that Twitter users might have accepted and adjusted daily life under the ongoing pandemic. Similar to existing research showing negative emotions toward government responses [<xref ref-type="bibr" rid="B30">30</xref>], especially shutdowns during the first wave, negative tweets in our sample also called political leaders &#x201c;incompetent&#x201d; or &#x201c;failure&#x201d; across all topics during the second wave, but the average sentiment compound score remains slightly positive, although the daily sentiment compound scores vary a&#x20;lot.</p>
<p>In addition, our study collected and analyzed tweets over 3&#xa0;months, which is very different from existing research that rarely collected and analyzed data for more than a month [<xref ref-type="bibr" rid="B3">3</xref>&#x2013;<xref ref-type="bibr" rid="B6">6</xref>]. Although we did not collect all the possible data given our geolocation restrictions, our research has provided local evidence solely from the perspective of Ontario, Canada, because each country and sub-national entity is unique. This is different from current global sentiment studies that combine and compare different countries [<xref ref-type="bibr" rid="B30">30</xref>&#x2013;<xref ref-type="bibr" rid="B32">32</xref>]. Furthermore, our research is one of a few studies [<xref ref-type="bibr" rid="B19">19</xref>] that demonstrated a combination of unsupervised topic modelling and qualitative checks, which can generate human-interpretable and meaningful topics or insights from large amounts of data in time-sensitive situations without an extremely time-consuming process. However, to avoid &#x201c;garbage in, garbage out&#x201d; resulting from the unsupervised ML approach, it remains an important issue to properly specify inclusion and exclusion criteria for data collection, such as keywords or geolocation, to achieve optimized data quality by filtering out meaningless data as much as possible without introducing selection bias in the&#x20;data.</p>
<p>However, our study has several limitations. First of all, due to Twitter&#x2019;s geolocation query methods, only a subset of tweets has geotags identified. It has been estimated that only about 2.31% of tweets have locations attached, and an even smaller number of those have precise locations [<xref ref-type="bibr" rid="B33">33</xref>]. As such, the tweets we were able to identify and use in our analysis represent only a small portion of the actual discourse occurring within the defined temporal and geographical parameters. Additionally, we limited our search to two very specific municipalities&#x2014;Toronto and Ottawa in Ontario, Canada&#x2014;because, during the data collection period, we realized that, without specifying cities, it was difficult to distinguish &#x201c;Ontario, Canada&#x201d; from &#x201c;Ontario, California&#x201d; given that their common abbreviation is &#x201c;Ontario, CA.&#x201d; We also did not collect data from other social media platforms, such as Facebook and Reddit, which limits the generalizability of our findings.</p>
<p>Furthermore, our manual quality validation found that there is a chance, albeit small, that VADER misclassifies sentiments. For instance, a sarcastic tweet was regarded as positive when in fact it should have been considered negative. On the other hand, a tweet with a &#x201c;surprised&#x201d; mood was regarded as negative because the word &#x201c;shocking&#x201d; was repeated many times. Therefore, it is possible that our sentiment analysis is not as accurate as it should be. Moreover, the topics were not mutually exclusive. If a user mentioned several topics within a tweet, the tweet would be assigned to multiple topics, as in the case of Greg Abbott, who showed up in both &#x201c;Ontario&#x201d; and &#x201c;business&#x201d; topics. However, we decided to leave them as they were because it would be inappropriate to assign only one topic to tweets with multiple topics as they naturally occurred. This observation actually showed that some topics could be highly correlated. Accordingly, how to properly choose keywords and their synonyms as filters remains an important challenge to be addressed.</p>
<p>In conclusion, our results have shown that Ontarians in Toronto and Ottawa maintained a slightly positive sentiment during the second wave of the COVID-19 pandemic regardless of topic. We also identified six topics that emerged from data over time, and these topics have been highly correlated with the ongoing pandemic, although the average positive sentiment could be driven by the Christmas-New Year holiday break amid the second wave rather than by the public health interventions. Compared with prior studies conducted during the first wave [<xref ref-type="bibr" rid="B19">19</xref>], our study has shown different narratives from public discourse during the second wave. That is, people have shifted their focus from COVID-19 related symptoms, transmissions, risk factors, and origin of the virus to how the pandemic has influenced their daily life without specifically mentioning COVID-19. Our research also demonstrated that a mixed approach of unsupervised topic modelling and manual validation could generate timely evidence when experienced experts get involved. However, data quality and limited utility from unsupervised LDA modelling remain critical issues for future research, and the possibility of misclassification is acknowledged. Therefore, our results show that it is feasible to use social media data to practice social listening as recommended by the World Health Organization (WHO) to understand narratives from the general public [<xref ref-type="bibr" rid="B9">9</xref>] to make informed decisions.</p>
</sec>
</body>
<back>
<sec id="s5">
<title>Author Contributions</title>
<p>S-FT and ZB conceived of the presented idea. AM and LL performed the computations and verified the analytical methods with S-FT, ZB, HC, and YY. ZB and HC supervised the findings of this work. All authors discussed the results and contributed to the final manuscript.</p>
</sec>
<sec sec-type="COI-statement" id="s7">
<title>Conflict of Interest</title>
<p>The authors declare that the research was conducted in the absence of any commercial or financial relationships that could be construed as a potential conflict of interest.</p>
</sec>
<ack>
<p>We are thankful to Therese Tisseverasinghe for her continuous support and help with the review.</p>
</ack>
<sec id="s8">
<title>Supplementary Material</title>
<p>The Supplementary Material for this article can be found online at: <ext-link ext-link-type="uri" xlink:href="https://www.ssph-journal.org/articles/10.3389/ijph.2022.1604658/full#supplementary-material">https://www.ssph-journal.org/articles/10.3389/ijph.2022.1604658/full&#x23;supplementary-material</ext-link>
</p>
<supplementary-material xlink:href="DataSheet3.docx" id="SM1" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet2.docx" id="SM2" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
<supplementary-material xlink:href="DataSheet1.docx" id="SM3" mimetype="application/docx" xmlns:xlink="http://www.w3.org/1999/xlink"/>
</sec>
<sec id="s9">
<title>Abbreviations</title>
<p>COVID-19, coronavirus disease 2019; LDA, latent Dirichlet&#x20;allocation; ML, machine learning; VADER, Valence Aware Dictionary and sEntiment Reasoner.</p>
</sec>
<ref-list>
<title>References</title>
<ref id="B1">
<label>1.</label>
<citation citation-type="journal">
<collab>WHO</collab>. (<year>2021</year>) <article-title>WHO Coronavirus (COVID-19) Dashboard</article-title>. <source>Who.int</source>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://covid19.who.int/">https://covid19.who.int/</ext-link>
</comment>. (<comment>Accessed April 20, 2021)</comment>. </citation>
</ref>
<ref id="B2">
<label>2.</label>
<citation citation-type="journal">
<collab>Canada</collab>.(<year>2021</year>) <article-title>WHO Coronavirus Disease (COVID-19) Dashboard with Vaccination Data</article-title>. <source>Who.int</source>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://covid19.who.int/region/amro/country/ca">https://covid19.who.int/region/amro/country/ca</ext-link>
</comment>. (<comment>Accessed April 20, 2021)</comment>. </citation>
</ref>
<ref id="B3">
<label>3.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Abd-Alrazaq</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Alhuwail</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Househ</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Hamdi</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Shah</surname>
<given-names>Z</given-names>
</name>
</person-group>. <article-title>Top Concerns of Tweeters during the COVID-19 Pandemic: Infoveillance Study</article-title>. <source>J&#x20;Med Internet Res</source> (<year>2020</year>) <volume>22</volume>(<issue>4</issue>):<fpage>e19016</fpage>. <pub-id pub-id-type="doi">10.2196/19016</pub-id> </citation>
</ref>
<ref id="B4">
<label>4.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Boon-Itt</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Skunkan</surname>
<given-names>Y</given-names>
</name>
</person-group>. <article-title>Public Perception of the COVID-19 Pandemic on Twitter: Sentiment Analysis and Topic Modeling Study</article-title>. <source>JMIR Public Health Surveill</source> (<year>2020</year>) <volume>6</volume>(<issue>4</issue>):<fpage>e21978</fpage>. <pub-id pub-id-type="doi">10.2196/21978</pub-id> </citation>
</ref>
<ref id="B5">
<label>5.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chandrasekaran</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Mehta</surname>
<given-names>V</given-names>
</name>
<name>
<surname>Valkunde</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Moustakas</surname>
<given-names>E</given-names>
</name>
</person-group>. <article-title>Topics, Trends, and Sentiments of Tweets about the COVID-19 Pandemic: Temporal Infoveillance Study</article-title>. <source>J&#x20;Med Internet Res</source> (<year>2020</year>) <volume>22</volume>(<issue>10</issue>):<fpage>e22624</fpage>. <pub-id pub-id-type="doi">10.2196/22624</pub-id> </citation>
</ref>
<ref id="B6">
<label>6.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Valdez</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Ten Thij</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Bathina</surname>
<given-names>K</given-names>
</name>
<name>
<surname>Rutter</surname>
<given-names>LA</given-names>
</name>
<name>
<surname>Bollen</surname>
<given-names>J</given-names>
</name>
</person-group>. <article-title>Social media Insights into US Mental Health during the COVID-19 Pandemic: Longitudinal Analysis of Twitter Data</article-title>. <source>J&#x20;Med Internet Res</source> (<year>2020</year>) <volume>22</volume>(<issue>12</issue>):<fpage>e21418</fpage>. <pub-id pub-id-type="doi">10.2196/21418</pub-id> </citation>
</ref>
<ref id="B7">
<label>7.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Blei</surname>
<given-names>DM</given-names>
</name>
<name>
<surname>Ng</surname>
<given-names>AY</given-names>
</name>
<name>
<surname>Jordan</surname>
<given-names>MI</given-names>
</name>
</person-group>. <article-title>Latent Dirichlet Allocation</article-title>. <source>J&#x20;Mach Learn Res</source> (<year>2003</year>) <volume>3</volume>:<fpage>993</fpage>&#x2013;<lpage>1022</lpage>. <pub-id pub-id-type="doi">10.5555/944919.944937</pub-id> </citation>
</ref>
<ref id="B8">
<label>8.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Hutto</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Gilbert</surname>
<given-names>E</given-names>
</name>
</person-group>. <article-title>VADER: A Parsimonious Rule-Based Model for Sentiment Analysis of Social media Text</article-title>. <source>ICWSM</source> (<year>2014</year>) <volume>8</volume>(<issue>1</issue>):<fpage>216</fpage>&#x2013;<lpage>25</lpage>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://ojs.aaai.org/index.php/ICWSM/article/view/14550">https://ojs.aaai.org/index.php/ICWSM/article/view/14550</ext-link>
</comment>. </citation>
</ref>
<ref id="B9">
<label>9.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Purnat</surname>
<given-names>TD</given-names>
</name>
<name>
<surname>Wilson</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Nguyen</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Briand</surname>
<given-names>S</given-names>
</name>
</person-group>. <article-title>EARS - A WHO Platform for AI-Supported Real-Time Online Social Listening of COVID-19 Conversations</article-title>. <source>Stud Health Technol Inform</source> (<year>2021</year>) <volume>281</volume>:<fpage>1009</fpage>&#x2013;<lpage>10</lpage>. <pub-id pub-id-type="doi">10.3233/SHTI210330</pub-id> </citation>
</ref>
<ref id="B10">
<label>10.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>LJ</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Pang</surname>
<given-names>CP</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>H</given-names>
</name>
</person-group>. <article-title>Retrospective Analysis of the Possibility of Predicting the COVID-19 Outbreak from Internet Searches and Social media Data, China, 2020</article-title>. <source>Euro Surveill</source> (<year>2020</year>) <volume>25</volume>(<issue>10</issue>). <pub-id pub-id-type="doi">10.2807/1560-7917.ES.2020.25.10.2000199</pub-id> </citation>
</ref>
<ref id="B11">
<label>11.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Qin</surname>
<given-names>L</given-names>
</name>
<name>
<surname>Sun</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Wang</surname>
<given-names>Y</given-names>
</name>
<name>
<surname>Wu</surname>
<given-names>K-F</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Shia</surname>
<given-names>B-C</given-names>
</name>
<etal/>
</person-group> <article-title>Prediction of&#x20;Number of Cases of 2019 Novel Coronavirus (COVID-19) Using Social&#x20;media Search index</article-title>. <source>Int J Environ Res Public Health</source> (<year>2020</year>) <volume>17</volume>(<issue>7</issue>):<fpage>2365</fpage>. <pub-id pub-id-type="doi">10.3390/ijerph17072365</pub-id> </citation>
</ref>
<ref id="B12">
<label>12.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shen</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Chen</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Luo</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Zhang</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Feng</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Liao</surname>
<given-names>W</given-names>
</name>
</person-group>. <article-title>Using Reports of Symptoms and Diagnoses on Social media to Predict COVID-19 Case Counts in mainland China: Observational Infoveillance Study</article-title>. <source>J&#x20;Med Internet Res</source> (<year>2020</year>) <volume>22</volume>(<issue>5</issue>):<fpage>e19421</fpage>. <pub-id pub-id-type="doi">10.2196/19421</pub-id> </citation>
</ref>
<ref id="B13">
<label>13.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Li</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Xu</surname>
<given-names>Q</given-names>
</name>
<name>
<surname>Cuomo</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Purushothaman</surname>
<given-names>V</given-names>
</name>
<name>
<surname>Mackey</surname>
<given-names>T</given-names>
</name>
</person-group>. <article-title>Data Mining and Content Analysis of the Chinese Social media Platform Weibo during the Early COVID-19 Outbreak: Retrospective Observational Infoveillance Study</article-title>. <source>JMIR Public Health Surveill</source> (<year>2020</year>) <volume>6</volume>(<issue>2</issue>):<fpage>e18700</fpage>. <pub-id pub-id-type="doi">10.2196/18700</pub-id> </citation>
</ref>
<ref id="B14">
<label>14.</label>
<citation citation-type="web">
<collab>China: number of social media users 2017-2025</collab>.(<year>2021</year>) <article-title>Statista.com</article-title>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://www.statista.com/statistics/277586/number-of-social-network-users-in-china/">https://www.statista.com/statistics/277586/number-of-social-network-users-in-china/</ext-link>
</comment>. (<comment>Accessed July 24, 2021)</comment>. </citation>
</ref>
<ref id="B15">
<label>15.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Younis</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Freitag</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Ruthberg</surname>
<given-names>JS</given-names>
</name>
<name>
<surname>Romanes</surname>
<given-names>JP</given-names>
</name>
<name>
<surname>Nielsen</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Mehta</surname>
<given-names>N</given-names>
</name>
</person-group>. <article-title>Social media as an Early Proxy for Social Distancing Indicated by the COVID-19 Reproduction Number: Observational Study</article-title>. <source>JMIR Public Health Surveill</source> (<year>2020</year>) <volume>6</volume>(<issue>4</issue>):<fpage>e21340</fpage>. <pub-id pub-id-type="doi">10.2196/21340</pub-id> </citation>
</ref>
<ref id="B16">
<label>16.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Xu</surname>
<given-names>P</given-names>
</name>
<name>
<surname>Dredze</surname>
<given-names>M</given-names>
</name>
<name>
<surname>Broniatowski</surname>
<given-names>DA</given-names>
</name>
</person-group>. <article-title>The Twitter Social Mobility Index: Measuring Social Distancing Practices with Geolocated Tweets</article-title>. <source>J&#x20;Med Internet Res</source> (<year>2020</year>) <volume>22</volume>(<issue>12</issue>):<fpage>e21499</fpage>. <pub-id pub-id-type="doi">10.2196/21499</pub-id> </citation>
</ref>
<ref id="B17">
<label>17.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bisanzio</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Kraemer</surname>
<given-names>MUG</given-names>
</name>
<name>
<surname>Brewer</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Brownstein</surname>
<given-names>JS</given-names>
</name>
<name>
<surname>Reithinger</surname>
<given-names>R</given-names>
</name>
</person-group>. <article-title>Geolocated Twitter Social media Data to Describe the Geographic Spread of SARS-CoV-2</article-title>. <source>J&#x20;Trav Med</source> (<year>2020</year>) <volume>27</volume>(<issue>5</issue>). <pub-id pub-id-type="doi">10.1093/jtm/taaa120</pub-id> </citation>
</ref>
<ref id="B18">
<label>18.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Bisanzio</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Kraemer</surname>
<given-names>MUG</given-names>
</name>
<name>
<surname>Bogoch</surname>
<given-names>II</given-names>
</name>
<name>
<surname>Brewer</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Brownstein</surname>
<given-names>JS</given-names>
</name>
<name>
<surname>Reithinger</surname>
<given-names>R</given-names>
</name>
</person-group>. <article-title>Use of Twitter Social media Activity as a Proxy for Human Mobility to Predict the Spatiotemporal Spread of COVID-19 at Global Scale</article-title>. <source>Geospat Health</source> (<year>2020</year>) <volume>15</volume>(<issue>1</issue>):<fpage>19</fpage>&#x2013;<lpage>24</lpage>. <pub-id pub-id-type="doi">10.4081/gh.2020.882</pub-id> </citation>
</ref>
<ref id="B19">
<label>19.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Jang</surname>
<given-names>H</given-names>
</name>
<name>
<surname>Rempel</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Roth</surname>
<given-names>D</given-names>
</name>
<name>
<surname>Carenini</surname>
<given-names>G</given-names>
</name>
<name>
<surname>Janjua</surname>
<given-names>NZ</given-names>
</name>
</person-group>. <article-title>Tracking COVID-19 Discourse on Twitter in North America: Infodemiology Study Using Topic Modeling and Aspect-Based Sentiment Analysis</article-title>. <source>J&#x20;Med Internet Res</source> (<year>2021</year>) <volume>23</volume>(<issue>2</issue>):<fpage>e25431</fpage>. <pub-id pub-id-type="doi">10.2196/25431</pub-id> </citation>
</ref>
<ref id="B20">
<label>20.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Zhao</surname>
<given-names>X</given-names>
</name>
<name>
<surname>Knobel</surname>
<given-names>P</given-names>
</name>
</person-group>. <article-title>Face Mask Wearing during the COVID-19 Pandemic: Comparing Perceptions in China and Three European Countries</article-title>. <source>Transl Behav Med</source> (<year>2021</year>) <volume>11</volume>(<issue>6</issue>):<fpage>1199</fpage>&#x2013;<lpage>204</lpage>. <pub-id pub-id-type="doi">10.1093/tbm/ibab043</pub-id> </citation>
</ref>
<ref id="B21">
<label>21.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chandra</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Krishna</surname>
<given-names>A</given-names>
</name>
</person-group>. <article-title>COVID-19 Sentiment Analysis via Deep Learning during the Rise of Novel Cases</article-title>. <source>PLoS ONE</source> (<year>2021</year>) <volume>16</volume>(<issue>8</issue>):<fpage>e0255615</fpage>. <pub-id pub-id-type="doi">10.1371/journal.pone.0255615</pub-id> </citation>
</ref>
<ref id="B22">
<label>22.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Imran</surname>
<given-names>AS</given-names>
</name>
<name>
<surname>Daudpota</surname>
<given-names>SM</given-names>
</name>
<name>
<surname>Kastrati</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Batra</surname>
<given-names>R</given-names>
</name>
</person-group>. <article-title>Cross-Cultural Polarity and Emotion Detection Using Sentiment Analysis and Deep Learning on COVID-19 Related Tweets</article-title>. <source>IEEE Access</source> (<year>2020</year>) <volume>8</volume>:<fpage>181074</fpage>&#x2013;<lpage>90</lpage>. <pub-id pub-id-type="doi">10.1109/ACCESS.2020.3027350</pub-id> </citation>
</ref>
<ref id="B23">
<label>23.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Das</surname>
<given-names>S</given-names>
</name>
<name>
<surname>Kolya</surname>
<given-names>AK</given-names>
</name>
</person-group>. <article-title>Predicting the Pandemic: Sentiment Evaluation and Predictive Analysis from Large-Scale Tweets on Covid-19 by Deep Convolutional Neural Network</article-title>. <source>Evol Intel</source> (<year>2021</year>) <fpage>1</fpage>&#x2013;<lpage>22</lpage>. <pub-id pub-id-type="doi">10.1007/s12065-021-00598-7</pub-id> </citation>
</ref>
<ref id="B24">
<label>24.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Shorten</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Khoshgoftaar</surname>
<given-names>TM</given-names>
</name>
<name>
<surname>Furht</surname>
<given-names>B</given-names>
</name>
</person-group>. <article-title>Deep Learning Applications for COVID-19</article-title>. <source>J&#x20;Big Data</source> (<year>2021</year>) <volume>8</volume>(<issue>1</issue>):<fpage>18</fpage>. <pub-id pub-id-type="doi">10.1186/s40537-020-00392-9</pub-id> </citation>
</ref>
<ref id="B25">
<label>25.</label>
<citation citation-type="book">
<collab>Twitter</collab>. <article-title>Twitter Research for Academics and Marketers</article-title>. <publisher-name>Twitter</publisher-name> (<year>2021</year>). <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://developer.twitter.com/en/use-cases/do-research">https://developer.twitter.com/en/use-cases/do-research</ext-link>
</comment>. (<comment>Accessed May 3, 2021)</comment>. </citation>
</ref>
<ref id="B26">
<label>26.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Slavik</surname>
<given-names>CE</given-names>
</name>
<name>
<surname>Buttle</surname>
<given-names>C</given-names>
</name>
<name>
<surname>Sturrock</surname>
<given-names>SL</given-names>
</name>
<name>
<surname>Darlington</surname>
<given-names>JC</given-names>
</name>
<name>
<surname>Yiannakoulias</surname>
<given-names>N</given-names>
</name>
</person-group>. <article-title>Examining Tweet Content and Engagement of Canadian Public Health Agencies and Decision Makers during COVID-19: Mixed Methods Analysis</article-title>. <source>J&#x20;Med Internet Res</source> (<year>2021</year>) <volume>23</volume>(<issue>3</issue>):<fpage>e24883</fpage>. <pub-id pub-id-type="doi">10.2196/24883</pub-id> </citation>
</ref>
<ref id="B27">
<label>27.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chum</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Nielsen</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Bellows</surname>
<given-names>Z</given-names>
</name>
<name>
<surname>Farrell</surname>
<given-names>E</given-names>
</name>
<name>
<surname>Durette</surname>
<given-names>P-N</given-names>
</name>
<name>
<surname>Banda</surname>
<given-names>JM</given-names>
</name>
<etal/>
</person-group> <article-title>Changes in Public Response Associated with Various COVID-19 Restrictions in Ontario, Canada: Observational Infoveillance Study Using Social media Time Series Data</article-title>. <source>J&#x20;Med Internet Res</source> (<year>2021</year>) <volume>23</volume>(<issue>8</issue>):<fpage>e28716</fpage>. <pub-id pub-id-type="doi">10.2196/28716</pub-id> </citation>
</ref>
<ref id="B28">
<label>28.</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Krippendorff</surname>
<given-names>K</given-names>
</name>
</person-group>. <source>Content Analysis: An Introduction to its Methodology</source>. <edition>4th Edn</edition>. <publisher-loc>Thousand Oaks, CA</publisher-loc>: <publisher-name>SAGE Publications</publisher-name> (<year>2018</year>). </citation>
</ref>
<ref id="B29">
<label>29.</label>
<citation citation-type="book">
<collab>Governor Abbott Lifts Mask Mandate</collab>.(<year>2021</year>) <source>Opens Texas 100 Percent. Texas.Gov</source>. <comment>Available at: <ext-link ext-link-type="uri" xlink:href="https://gov.texas.gov/news/post/governor-abbott-lifts-mask-mandate-opens-texas-100-percent">https://gov.texas.gov/news/post/governor-abbott-lifts-mask-mandate-opens-texas-100-percent</ext-link>
</comment>. (<comment>Accessed May 4, 2021)</comment>. </citation>
</ref>
<ref id="B30">
<label>30.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Chandrasekaran</surname>
<given-names>R</given-names>
</name>
<name>
<surname>Mehta</surname>
<given-names>V</given-names>
</name>
<name>
<surname>Valkunde</surname>
<given-names>T</given-names>
</name>
<name>
<surname>Moustakas</surname>
<given-names>E</given-names>
</name>
</person-group>. <article-title>Topics, Trends, and Sentiments of Tweets about the COVID-19 Pandemic: Temporal Infoveillance Study</article-title>. <source>J&#x20;Med Internet Res</source> (<year>2020</year>) <volume>22</volume>(<issue>10</issue>):<fpage>e22624</fpage>. <pub-id pub-id-type="doi">10.2196/22624</pub-id> </citation>
</ref>
<ref id="B31">
<label>31.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Lwin</surname>
<given-names>MO</given-names>
</name>
<name>
<surname>Lu</surname>
<given-names>J</given-names>
</name>
<name>
<surname>Sheldenkar</surname>
<given-names>A</given-names>
</name>
<name>
<surname>Schulz</surname>
<given-names>PJ</given-names>
</name>
<name>
<surname>Shin</surname>
<given-names>W</given-names>
</name>
<name>
<surname>Gupta</surname>
<given-names>R</given-names>
</name>
<etal/>
</person-group> <article-title>Global Sentiments Surrounding the COVID-19 Pandemic on Twitter: Analysis of Twitter Trends</article-title>. <source>JMIR Public Health Surveill</source> (<year>2020</year>) <volume>6</volume>(<issue>2</issue>):<fpage>e19447</fpage>. <pub-id pub-id-type="doi">10.2196/19447</pub-id> </citation>
</ref>
<ref id="B32">
<label>32.</label>
<citation citation-type="journal">
<person-group person-group-type="author">
<name>
<surname>Garcia</surname>
<given-names>K</given-names>
</name>
<name>
<surname>Berton</surname>
<given-names>L</given-names>
</name>
</person-group>. <article-title>Topic Detection and Sentiment Analysis in Twitter Content Related to COVID-19 from Brazil and the USA</article-title>. <source>Appl Soft Comput</source> (<year>2021</year>) <volume>101</volume>:<fpage>107057</fpage>. <pub-id pub-id-type="doi">10.1016/j.asoc.2020.107057</pub-id> </citation>
</ref>
<ref id="B33">
<label>33.</label>
<citation citation-type="book">
<person-group person-group-type="author">
<name>
<surname>Huang</surname>
<given-names>B</given-names>
</name>
<name>
<surname>Carley</surname>
<given-names>KM</given-names>
</name>
</person-group>. <article-title>A Large-Scale Empirical Study of Geotagging Behavior on Twitter</article-title>. In: <source>Proceedings of the 2019 IEEE/ACM International Conference on Advances in Social Networks Analysis and Mining</source>. <publisher-loc>New York, NY</publisher-loc>: <publisher-name>ACM</publisher-name> (<year>2019</year>). <pub-id pub-id-type="doi">10.1145/3341161.3342870</pub-id> </citation>
</ref>
</ref-list>
</back>
</article>