<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMIR</journal-id>
      <journal-id journal-id-type="nlm-ta">J Med Internet Res</journal-id>
      <journal-title>Journal of Medical Internet Research</journal-title>
      <issn pub-type="epub">1438-8871</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v23i9e27314</article-id>
      <article-id pub-id-type="pmid">34524095</article-id>
      <article-id pub-id-type="doi">10.2196/27314</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Deep Learning for Identification of Alcohol-Related Content on Social Media (Reddit and Twitter): Exploratory Analysis of Alcohol-Related Outcomes</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Mao</surname>
            <given-names>Yuqing</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Ricard</surname>
            <given-names>Benjamin Joseph</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0003-1576-8920</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Hassanpour</surname>
            <given-names>Saeed</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <address>
            <institution>Department of Biomedical Data Science</institution>
            <institution>Dartmouth College</institution>
            <addr-line>Williamson Translational Research Building</addr-line>
            <addr-line>One Medical Center Drive HB 7261</addr-line>
            <addr-line>Lebanon, NH, 03756</addr-line>
            <country>United States</country>
            <phone>1 603 650 1983</phone>
            <email>saeed.hassanpour@dartmouth.edu</email>
          </address>
          <xref rid="aff2" ref-type="aff">2</xref>
          <xref rid="aff3" ref-type="aff">3</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9460-6414</ext-link>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Department of Biomedical Data Science</institution>
        <institution>Dartmouth College</institution>
        <addr-line>Lebanon, NH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Epidemiology</institution>
        <institution>Dartmouth College</institution>
        <addr-line>Hanover, NH</addr-line>
        <country>United States</country>
      </aff>
      <aff id="aff3">
        <label>3</label>
        <institution>Department of Computer Science</institution>
        <institution>Dartmouth College</institution>
        <addr-line>Hanover, NH</addr-line>
        <country>United States</country>
      </aff>
      <author-notes>
        <corresp>Corresponding Author: Saeed Hassanpour <email>saeed.hassanpour@dartmouth.edu</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <month>9</month>
        <year>2021</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>15</day>
        <month>9</month>
        <year>2021</year>
      </pub-date>
      <volume>23</volume>
      <issue>9</issue>
      <elocation-id>e27314</elocation-id>
      <history>
        <date date-type="received">
          <day>21</day>
          <month>1</month>
          <year>2021</year>
        </date>
        <date date-type="rev-request">
          <day>11</day>
          <month>2</month>
          <year>2021</year>
        </date>
        <date date-type="rev-recd">
          <day>30</day>
          <month>3</month>
          <year>2021</year>
        </date>
        <date date-type="accepted">
          <day>1</day>
          <month>8</month>
          <year>2021</year>
        </date>
      </history>
      <copyright-statement>©Benjamin Joseph Ricard, Saeed Hassanpour. Originally published in the Journal of Medical Internet Research (https://www.jmir.org), 15.09.2021.</copyright-statement>
      <copyright-year>2021</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in the Journal of Medical Internet Research, is properly cited. The complete bibliographic information, a link to the original publication on https://www.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://www.jmir.org/2021/9/e27314" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Many social media studies have explored the ability of thematic structures, such as hashtags and subreddits, to identify information related to a wide variety of mental health disorders. However, studies and models trained on specific themed communities are often difficult to apply to different social media platforms and related outcomes. A deep learning framework using thematic structures from Reddit and Twitter can have distinct advantages for studying alcohol abuse, particularly among the youth in the United States.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study proposes a new deep learning pipeline that uses thematic structures to identify alcohol-related content across different platforms. We apply our method on Twitter to determine the association of the prevalence of alcohol-related tweets with alcohol-related outcomes reported from the National Institute of Alcoholism and Alcohol Abuse, Centers for Disease Control Behavioral Risk Factor Surveillance System, county health rankings, and the National Industry Classification System.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>The Bidirectional Encoder Representations From Transformers neural network learned to classify 1,302,524 Reddit posts as either alcohol-related or control subreddits. The trained model identified 24 alcohol-related hashtags from an unlabeled data set of 843,769 random tweets. Querying alcohol-related hashtags identified 25,558,846 alcohol-related tweets, including 790,544 location-specific (geotagged) tweets. We calculated the correlation between the prevalence of alcohol-related tweets and alcohol-related outcomes, controlling for confounding effects of age, sex, income, education, and self-reported race, as recorded by the 2013-2018 American Community Survey.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>Significant associations were observed: between alcohol-hashtagged tweets and alcohol consumption (<italic>P</italic>=.01) and heavy drinking (<italic>P</italic>=.005) but not binge drinking (<italic>P</italic>=.37), self-reported at the metropolitan-micropolitan statistical area level; between alcohol-hashtagged tweets and self-reported excessive drinking behavior (<italic>P</italic>=.03) but not motor vehicle fatalities involving alcohol (<italic>P</italic>=.21); between alcohol-hashtagged tweets and the number of breweries (<italic>P</italic>&#60;.001), wineries (<italic>P</italic>&#60;.001), and beer, wine, and liquor stores (<italic>P</italic>&#60;.001) but not drinking places (<italic>P</italic>=.23), per capita at the US county and county-equivalent level; and between alcohol-hashtagged tweets and all gallons of ethanol consumed (<italic>P</italic>&#60;.001), as well as ethanol consumed from wine (<italic>P</italic>&#60;.001) and liquor (<italic>P</italic>=.01) sources but not beer (<italic>P</italic>=.63), at the US state level.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>Here, we present a novel natural language processing pipeline developed using Reddit’s alcohol-related subreddits that identify highly specific alcohol-related Twitter hashtags. The prevalence of identified hashtags contains interpretable information about alcohol consumption at both coarse (eg, US state) and fine-grained (eg, metropolitan-micropolitan statistical area level and county) geographical designations. This approach can expand research and deep learning interventions on alcohol abuse and other behavioral health outcomes.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>social media</kwd>
        <kwd>natural language processing</kwd>
        <kwd>alcohol abuse</kwd>
        <kwd>machine learning</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Alcohol-related causes are the third leading preventable cause of death in the United States, and alcohol abuse contributes to many adverse health outcomes, particularly on the developing brain [<xref ref-type="bibr" rid="ref1">1</xref>-<xref ref-type="bibr" rid="ref4">4</xref>]. The rise of alcohol-related content on Twitter is alarming, with over half of young adults participating in a study [<xref ref-type="bibr" rid="ref5">5</xref>] posting alcohol-related content. Social media use and alcohol consumption are common behaviors; the prevalence rates of Twitter, Reddit, and annual alcohol use for US adults are 22%, 11%, and 70%, respectively [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref7">7</xref>]. Internet- and social media–based interventions are scalable and efficient approaches for developing practical tools for treating and monitoring alcohol abuse, especially for at-risk adolescents and young adults [<xref ref-type="bibr" rid="ref8">8</xref>-<xref ref-type="bibr" rid="ref14">14</xref>]. However, identifying high-risk areas for efficient and helpful monitoring along with population-level interventions remains a difficult task, in part because of survey bias [<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref17">17</xref>].</p>
        <p>Text-based <italic>hashtags</italic> are common among many popular social media platforms such as Twitter, Instagram, and TikTok. Individuals use hashtags to categorize, label, organize, and discover posts and content [<xref ref-type="bibr" rid="ref18">18</xref>]. Previous studies have indicated that study-specific hashtags are useful for mental health research [<xref ref-type="bibr" rid="ref19">19</xref>]. For example, sexual abuse and harassment (#MeToo), breast cancer (#breastcancer), HIV (#HIV), miscarriages (#ihadamiscarriage), tobacco use (#Vapelife), and viral pandemics (#COVID-19) are some of the many important health outcomes that have been previously studied using hashtags on Twitter [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref28">28</xref>]. Other social media platforms such as Reddit contain specific <italic>themed</italic> communities where interested users discuss a particular topic. In contrast to hashtags, themed communities on websites such as Reddit represent posts related to exactly 1 topic of interest. Like hashtags, these communities, such as <italic>r/cripplingalcoholism</italic>, <italic>r/depression</italic>, or <italic>r/opiates</italic> Reddit subreddits and <italic>HIV</italic> Baidu Tieba bar, contain information that can target and understand behavioral health and disease [<xref ref-type="bibr" rid="ref29">29</xref>-<xref ref-type="bibr" rid="ref33">33</xref>]. In addition to hashtags and subreddits, some social media platforms allow for <italic>geotagging</italic> or sharing a user's geographical latitude and longitude coordinates in a post. Geotags have been used in social media research to identify geographically relevant information from social media data [<xref ref-type="bibr" rid="ref34">34</xref>-<xref ref-type="bibr" rid="ref36">36</xref>].</p>
      </sec>
      <sec>
        <title>Previous Work</title>
        <p>Although prior studies have identified specific hashtags or themed communities for studying behavioral health outcomes, many insights are platform-specific. Although helpful information regarding a behavior of interest or themed community may be available on one platform, there may not be such knowledge available on a different platform. Many previous methods examining alcohol content on social media use data from a single platform [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref37">37</xref>-<xref ref-type="bibr" rid="ref42">42</xref>]. Single-platform analyses may limit discoveries and interventions to only a fraction of the population at risk. There is a growing need for behavioral health researchers working with social media data to incorporate analyses from many sources [<xref ref-type="bibr" rid="ref43">43</xref>,<xref ref-type="bibr" rid="ref44">44</xref>]. Although some studies have examined alcohol content on multiple platforms, many methods need survey data from known active users from each source or additional manual annotation [<xref ref-type="bibr" rid="ref45">45</xref>-<xref ref-type="bibr" rid="ref47">47</xref>]. The ability and insights gained from using deep learning methods to learn from a large number of posts from specific communities (ie, Reddit subreddits) to predict alcohol-related content on a different platform (ie, Twitter) remain unclear.</p>
        <p>Many previous studies that identified alcohol-related language on social media platforms relied on training on extrinsic labels, such as survey responses. Reliance on self-report data is problematic as alcohol consumption is subject to bias, particularly among the youth [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>,<xref ref-type="bibr" rid="ref48">48</xref>]. In addition, approaches that use an outcome of interest to both train and evaluate a model (eg, identifying and evaluating alcohol-related hashtags or keywords based on enrichment in regions with higher self-reported alcohol content) may not be generalizable to other related outcomes [<xref ref-type="bibr" rid="ref49">49</xref>].</p>
        <p>Other approaches for studying alcohol content involve identifying a sample as being alcohol-related based on the identification of keywords. Keyword approaches have distinct benefits, such as interpretability. However, identifying text from keywords may rely on standard and predefined terms (eg, searching <italic>drunk</italic>), training on self-report data, or manual review [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref49">49</xref>-<xref ref-type="bibr" rid="ref51">51</xref>]. Classification of social media posts based on previously defined keywords or vector representations (eg, Word2vec) is not as useful when the average length of sequences is small and has out-of-training vocabulary [<xref ref-type="bibr" rid="ref52">52</xref>-<xref ref-type="bibr" rid="ref54">54</xref>]. Training on nonspecific platform information alone may fail to capture relevant keywords, especially for rarer outcomes not prominent in the heterogeneity of random and unlabeled social media chatter [<xref ref-type="bibr" rid="ref55">55</xref>]. In addition, predefined keywords or word vectors may fail to capture slang or the different language structures between Reddit and Twitter [<xref ref-type="bibr" rid="ref56">56</xref>].</p>
        <p>One recent contribution in natural language processing (NLP) is the Bidirectional Encoder Representations From Transformers (BERT) neural network, which has demonstrated superior performance on a wide variety of social media NLP tasks [<xref ref-type="bibr" rid="ref57">57</xref>-<xref ref-type="bibr" rid="ref61">61</xref>]. BERT focuses on learning by analyzing sentences with randomly masked words. This masked language model deconstructs larger strings into smaller tokens and is ideal for dealing with hashtags and other platform-unique token structures [<xref ref-type="bibr" rid="ref57">57</xref>]. Before developing BERT, previous models, such as long-short–term memory networks, logistic regression, Word2vec similarity, and latent Dirichlet allocation, were not well suited to process unknown words and hashtag structures. For example, some previous NLP studies on social media either removed hashtags, represented them as universal tokens, or removed <italic>#</italic> from strings, with no importance given to hashtags (eg, <italic>#ilovebeer</italic> represented as “ ” (space), <italic>HASHTAG</italic>, or <italic>ilovebeer</italic>, respectively) [<xref ref-type="bibr" rid="ref62">62</xref>-<xref ref-type="bibr" rid="ref64">64</xref>]. In contrast, using hashtags and themed communities as explicit labels in a deep learning architecture allows for identifying relevant, platform-specific hashtags that can identify posts that indicate the behavior of interest. In addition, the use of these structures adds a layer of interpretability to our trained neural networks, which are commonly criticized as noninterpretable black boxes [<xref ref-type="bibr" rid="ref65">65</xref>].</p>
        <p>Other previous social media text mining methods implementing deep learning often involve training platform-specific models. One issue with this approach is that each platform’s training models require an extensive amount of usually labeled data from that platform [<xref ref-type="bibr" rid="ref66">66</xref>-<xref ref-type="bibr" rid="ref72">72</xref>]. In addition, although deep learning models have been successful at many tasks, training platform-specific deep networks such as BERT (containing &#62;100 million parameters) is extremely energy- and cost-intensive, and CO<sub>2</sub> emissions from training BERT models have raised concerns about their environmental impact [<xref ref-type="bibr" rid="ref73">73</xref>]. Optimal methods for translating information from previously trained social media deep learning models to discern insights from separate social media platforms remain a relatively unexplored research area.</p>
      </sec>
      <sec>
        <title>The Goal of This Study</title>
        <p>We aim to examine the effectiveness of using thematic structures in a deep learning framework to identify alcohol-related behaviors across different social media platforms. First, we trained on Reddit subreddits to identify alcohol-related targets on another social media platform (Twitter) with a different thematic structure (hashtags). Next, we determined whether the hashtags predicted by the model correlate to known alcohol-related outcomes, including self-reported drinking status, alcohol outlet density, and estimated gallons of ethanol consumed, after controlling for confounding effects of age, sex, income, education, and self-reported race. We show that these data-driven hashtags contain interpretable information about alcohol consumption in the United States. Finally, we present validated and queryable hashtags from our model that behavioral health researchers can use as a starting point for the identification of alcohol-related content on Twitter, Reddit, and other social media platforms.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Overview of the NLP Pipeline</title>
        <p>This study fine-tuned a BERT neural network as a binary classifier to predict Reddit post titles as belonging to either alcohol-related communities or a random subreddit. Next, we applied the Reddit-trained network to a smaller set of random, unlabeled Twitter posts to identify 24 hashtags that were significantly associated with alcohol content. We identified 25,558,846 tweets that contained at least one alcohol-related hashtag for the period between 2010 and 2019. A total of 1,412,041 alcohol-related tweets included latitude and longitude data from <italic>geotagging</italic>. The locations of 790,544 geotagged tweets from 2929 US counties and county equivalents were identified using data from the 2017 US Census Shapefiles database [<xref ref-type="bibr" rid="ref74">74</xref>,<xref ref-type="bibr" rid="ref75">75</xref>]. Finally, we examined the relationship between the prevalence of alcohol-related tweets per population and various outcome measures related to alcohol consumption, including self-reported alcohol consumption and alcohol outlet density. <xref rid="figure1" ref-type="fig">Figure 1</xref> demonstrates an overview of our NLP pipeline. <xref rid="figure2" ref-type="fig">Figure 2</xref> illustrates the choropleth of population-normalized alcohol-hashtagged tweets for US states and Washington, DC.</p>
        <fig id="figure1" position="float">
          <label>Figure 1</label>
          <caption>
            <p>Overview of the methodological pipeline. A bidirectional encoder representation from transformers model trained to classify posts as either 18 alcohol-related or control subreddits. The bidirectional encoder representations from transformers model was applied to a set of tweets containing at least one hashtag. The prediction results were analyzed to find 24 significantly enriched hashtags as positive predictions (ie, prediction probability ≥0.5). Tweets posted between 2010 and 2020 with an alcohol-related hashtag were collected and filtered on geotagged location. BERT: Bidirectional Encoder Representations From Transformers.</p>
          </caption>
          <graphic xlink:href="jmir_v23i9e27314_fig1.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
        <fig id="figure2" position="float">
          <label>Figure 2</label>
          <caption>
            <p>Choropleth of the US state and Washington, DC tweets with alcohol-related hashtags per 10,000 persons.</p>
          </caption>
          <graphic xlink:href="jmir_v23i9e27314_fig2.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Reddit Data Set and BERT Training</title>
        <p>A large amount of alcohol-related training data were extracted from Reddit subreddits with the pushshift application programming interface (API) previously used in social media research [<xref ref-type="bibr" rid="ref63">63</xref>,<xref ref-type="bibr" rid="ref76">76</xref>]. On a subreddit, community moderators create description texts that contain links to other, usually related, subreddits. Scraping the description pages for all subreddits containing at least 1000 posts for any links to <italic>r/drunk</italic>, one of the most popular alcohol-related subreddits, and all links from <italic>r/drunk</italic> to other subreddits yielded 17 alcohol-related subreddits. A total of 651,271 post titles from the following 18 subreddits were used as positive alcohol labels for model training: <italic>r/cripplingalcoholism</italic>, <italic>r/vodka</italic>, <italic>r/oldtimehockey</italic>, <italic>r/alcohol</italic>, <italic>r/beer</italic>, <italic>r/bourbon</italic>, <italic>r/homebrewing</italic>, <italic>r/drinkinggames</italic>, <italic>r/wine</italic>, <italic>r/beercirclejerk</italic>, <italic>r/gin</italic>, <italic>r/scotch</italic>, <italic>r/liquor</italic>, <italic>r/showerbeer</italic>, <italic>r/absinthe</italic>, <italic>r/firewater</italic>, <italic>r/beercanada</italic>, and <italic>r/drunk</italic>.</p>
        <p>Negative alcohol (control) posts were gathered by querying 651,271 random posts posted in all other subreddits, excluding the 18 alcohol-related subreddits. Training 79.99% (521,016/651,271), validation 9.99% (65,127/651,271), and testing 9.99% (65,127/651,271), data sets were generated for developing and evaluating the model—a binary classifier trained for posts belonging to either alcohol-related subreddits or other random subreddits. The model fine-tuned a pretrained BERT model with 12 layers and 768 hidden units in PyTorch on an NVIDIA TITAN Xp graphics processing unit using a batch size of 64 for approximately 5 weeks [<xref ref-type="bibr" rid="ref77">77</xref>].</p>
      </sec>
      <sec>
        <title>Twitter Data Set and Identification of Hashtags</title>
        <p>The Twitter API provides tweet information from 7 days before a query. Randomly selected tokens in the Twitter GLoVE word embedding dictionary and their respective hashtags (ie, a string that starts with <italic>#</italic>) were queried using the Twitter API to identify recently posted tweets containing that word or hashtag [<xref ref-type="bibr" rid="ref78">78</xref>]. Each identified hashtag in the data set was requeried to ensure that it was monitored for at least 2 weeks. The initial <italic>random</italic> Twitter data set comprised 843,769 random hashtag-containing tweets posted between January 2019 and October 2019. The Reddit-trained BERT model was applied to this data set to obtain binary predictions for each tweet. A chi-square test identified 24 significant alcohol-related hashtags from posts predicted to be alcohol-positive (ie, final softmax layer prediction <italic>P</italic> value of ≥0.5) relative to posts predicted as negative (ie, final softmax prediction <italic>P</italic> value of &#60;0.5) using a one-tailed <italic>greater</italic> test. We included only hashtags with 5 or more occurrences and applied the Benjamini-Hochberg algorithm for multiple hypothesis correction using a 0.05 false discovery rate, a common approach for multiple hypothesis corrections in social media data analyses [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref42">42</xref>,<xref ref-type="bibr" rid="ref79">79</xref>-<xref ref-type="bibr" rid="ref85">85</xref>]. The analysis resulted in 24 hashtags, as indicated in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>. GetOldTweets, a Python package widely used in social media research, was used to identify 25,558,846 alcohol-hashtagged tweets posted throughout 10 years (between 2010 and 2020) containing at least one significant alcohol-related hashtag [<xref ref-type="bibr" rid="ref55">55</xref>,<xref ref-type="bibr" rid="ref86">86</xref>,<xref ref-type="bibr" rid="ref87">87</xref>].</p>
        <boxed-text id="box1" position="float">
          <title>Alcohol-related hashtags extracted by our Reddit-trained classifier according to alcohol category.</title>
          <p>
            <bold>Beer hashtags</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p><italic>craftbeer</italic>, <italic>beer</italic>, <italic>ncbeer</italic>, <italic>brewery</italic>, <italic>stout</italic>, <italic>beeroclock</italic>, <italic>beergeek</italic>, <italic>beerporn</italic>, <italic>beers</italic>, <italic>instabeer</italic>, <italic>beertime</italic>, <italic>beerstagram</italic>, <italic>beerlover</italic>, <italic>beersnob</italic></p>
            </list-item>
          </list>
          <p>
            <bold>Wine hashtags</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p><italic>winetasting</italic>, <italic>wine</italic>, <italic>winelover</italic>, <italic>wines</italic>, <italic>redwine</italic></p>
            </list-item>
          </list>
          <p>
            <bold>Liquor hashtags</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p><italic>bourbon</italic>, <italic>whiskey</italic>, <italic>whisky</italic></p>
            </list-item>
          </list>
          <p>
            <bold>Multiple or ambiguous hashtags</bold>
          </p>
          <list list-type="bullet">
            <list-item>
              <p><italic>drinklocal</italic>, <italic>drunktwitter</italic></p>
            </list-item>
          </list>
        </boxed-text>
      </sec>
      <sec>
        <title>Geographical Identification of the Prevalence of Alcohol-Related Hashtags</title>
        <p>Next, we tested whether the knowledge of 24 significant alcohol hashtags could uncover information on alcohol-related outcomes in the United States. Alcohol-hashtagged tweets were filtered to 790,544 <italic>geotagged</italic> tweets containing longitude and latitude coordinate locations and mapped to metropolitan-micropolitan statistical areas (MMSAs), US county and county equivalents, and US states and Washington, DC. The total number of alcohol-hashtagged tweets in an area divided by the mean of the population estimates from the 2013-2018 American Community Survey yielded population-normalized alcohol-related hashtag prevalence.</p>
        <p>We then tested the association between geographical prevalence of alcohol-related hashtags and alcohol outcomes. Spearman rho, a ranked nonparametric measure that is more robust to outliers than Pearson correlation, is used to report crude (nonadjusted) correlations [<xref ref-type="bibr" rid="ref88">88</xref>]. Potential confounding variables previously studied in alcohol and social media use include race and sex distribution, median age, education, and income [<xref ref-type="bibr" rid="ref37">37</xref>,<xref ref-type="bibr" rid="ref89">89</xref>]. A linear regression analysis evaluated the relationship between the number of tweets per population and alcohol-related outcomes after including terms to control for confounding effects. Specific confounding variables from the 2013-2018 5-year American Community Survey report included <italic>Percent Reporting White</italic>, <italic>Percent Reporting Black</italic>, <italic>Percent Reporting Hispanic</italic>, <italic>Median Income</italic>, <italic>Percent High School Education</italic>, <italic>Percent Bachelor's Degree Education</italic>, and <italic>Males/100 Females</italic> [<xref ref-type="bibr" rid="ref90">90</xref>]. All alcohol outcomes and confounding variables represented the most recent estimation of alcohol consumption and related behavior at the time of this study.</p>
      </sec>
      <sec>
        <title>Metropolitan-Micropolitan Statistical Areas</title>
        <p>MMSAs are US Census Bureau designations of concentrated urban centers that may be the integrated areas of multiple cities and states (eg, the single <italic>Washington-Arlington-Alexandria, DC-VA-MD-WV MSA</italic> contains 3 US states and Washington, DC) [<xref ref-type="bibr" rid="ref74">74</xref>]. The Behavioral Risk Factor Surveillance System publishes reports of survey responses at selected MMSAs for the following categories [<xref ref-type="bibr" rid="ref91">91</xref>]:</p>
        <list list-type="bullet">
          <list-item>
            <p>any alcohol consumption, defined as at least one alcoholic drink in the last 30 days;</p>
          </list-item>
          <list-item>
            <p>binge drinking behavior, defined as drinking &#62;5 drinks in 1 event for men or &#62;4 drinks in 1 event for women;</p>
          </list-item>
          <list-item>
            <p>heavy drinking, defined as drinking &#62;1 drink per day for women or &#62;2 drinks per day per man;</p>
          </list-item>
        </list>
        <p>All yearly records from 2010-2019 for each MMSA were averaged to obtain a single number for outcome measurements.</p>
      </sec>
      <sec>
        <title>US County and County Equivalent</title>
        <p>Primary US county outcomes were gathered from the University of Wisconsin Population Health Institute County Health Rankings and Roadmaps 2020 data, which included the estimates of excessive drinking, defined as the percentage reporting either binge or heavy drinking behavior as well as measurements of the percentage of motor vehicle fatalities that involved alcohol for the period between 2013 and 2018 [<xref ref-type="bibr" rid="ref92">92</xref>]. In addition, data from the North American Industry Classification System provided by 2017 County Business Patterns (US Census) was used for the number of <italic>Drinking Places (Alcohol Beverages)</italic>; <italic>Wineries</italic>; <italic>Breweries</italic>; and <italic>Beer</italic>, <italic>Wine</italic>, <italic>and Liquor stores</italic> (North American Industry Classification System codes 722410, 312130, 312120, 445310, respectively) present in each county [<xref ref-type="bibr" rid="ref93">93</xref>]. Counties were included if they contained at least one tweet and an average reported population &#62;1000 between 2013 and 2018.</p>
      </sec>
      <sec>
        <title>US States and Washington DC</title>
        <p>Twitter posts containing alcohol-related hashtags were aggregated by state and compared with the National Institute on Alcohol Abuse and Alcoholism's 2018 report, <italic>Apparent Per Capita Alcohol Consumption: National, State, and Regional Trends</italic>. This report predicts gallons of ethanol consumption based on alcohol sales and taxation data, separated for the consumption of wine, beer, or liquor products [<xref ref-type="bibr" rid="ref94">94</xref>]. To determine which hashtags may be useful for detecting individual preferences of alcohol consumption, we calculated the correlation between the consumption of alcohol from different sources of alcoholic drinks (beer, wine, and liquor) and the prevalence of 19 beer, 5 wine, and 3 liquor-specific hashtags, as indicated in <xref ref-type="boxed-text" rid="box1">Textbox 1</xref>.</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <p><xref ref-type="table" rid="table1">Table 1</xref> demonstrates the results from the analysis of alcohol-related hashtags and alcohol-related outcomes. The number of geotagged and alcohol-hashtagged tweets per population significantly correlated with many alcohol-related outcomes, including self-reported measures of individuals (1) reporting any alcohol consumption within 30 days (<italic>P</italic>&#60;.001), (2) meeting the criteria for heavy drinking (<italic>P</italic>&#60;.001), and (3) meeting the criteria for binge drinking (<italic>P</italic>&#60;.001) at the MMSA level (<xref rid="figure3" ref-type="fig">Figure 3</xref>). However, the relationship between MMSA tweets and binge drinking level was not significant after adjusting for confounding effects (<italic>P</italic>=.37).</p>
      <table-wrap position="float" id="table1">
        <label>Table 1</label>
        <caption>
          <p>Spearman correlation and linear regression results between the number of tweets per population and alcohol-related behavior and health indicators.</p>
        </caption>
        <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
          <col width="30"/>
          <col width="430"/>
          <col width="110"/>
          <col width="100"/>
          <col width="0"/>
          <col width="120"/>
          <col width="100"/>
          <col width="0"/>
          <col width="110"/>
          <thead>
            <tr valign="top">
              <td colspan="2">Outcome</td>
              <td colspan="3">Spearman correlation</td>
              <td colspan="3">Adjusted regression</td>
              <td>Sample size, n</td>
            </tr>
            <tr valign="top">
              <td colspan="2">
                <break/>
              </td>
              <td>ρ</td>
              <td><italic>P</italic> value</td>
              <td colspan="2">Coefficient β</td>
              <td><italic>P</italic> value</td>
              <td colspan="2">
                <break/>
              </td>
            </tr>
          </thead>
          <tbody>
            <tr valign="top">
              <td colspan="9">
                <bold>Metropolitan-micropolitan statistical area</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Alcohol consumption</td>
              <td>0.526</td>
              <td>&#60;.001</td>
              <td colspan="2">1038</td>
              <td>.01</td>
              <td colspan="2">179</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Binge drinking</td>
              <td>0.355</td>
              <td>&#60;.001</td>
              <td colspan="2">184.0</td>
              <td>.37</td>
              <td colspan="2">179</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Heavy drinking</td>
              <td>0.387</td>
              <td>&#60;.001</td>
              <td colspan="2">244.8</td>
              <td>.005</td>
              <td colspan="2">179</td>
            </tr>
            <tr valign="top">
              <td colspan="9">
                <bold>County and equivalent</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Excessive drinking</td>
              <td>0.377</td>
              <td>&#60;.001</td>
              <td colspan="2">32.8</td>
              <td>.03</td>
              <td colspan="2">2641</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Percentage of alcohol motor vehicle fatality</td>
              <td>0.063</td>
              <td>.002</td>
              <td colspan="2">110.0</td>
              <td>.21</td>
              <td colspan="2">2641</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Drinking places (alcoholic beverages) per capita</td>
              <td>−0.177</td>
              <td>&#60;.001</td>
              <td colspan="2">−2.18e–03</td>
              <td>.23</td>
              <td colspan="2">1479</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Breweries per capita</td>
              <td>0.263</td>
              <td>&#60;.001</td>
              <td colspan="2">1.86e–03</td>
              <td>&#60;.001</td>
              <td colspan="2">334</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Wineries per capita</td>
              <td>0.130</td>
              <td>.05</td>
              <td colspan="2">2.73e–02</td>
              <td>&#60;.001</td>
              <td colspan="2">228</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Beer, wine, and liquor stores per capita</td>
              <td>−0.043</td>
              <td>.11</td>
              <td colspan="2">0.0039</td>
              <td>&#60;.001</td>
              <td colspan="2">1444</td>
            </tr>
            <tr valign="top">
              <td colspan="9">
                <bold>US states and Washington, DC, all hashtags</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Wine, gallons of ethanol per capita</td>
              <td>0.756</td>
              <td>&#60;.001</td>
              <td colspan="2">74.11</td>
              <td>&#60;.001</td>
              <td colspan="2">51</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Beer, gallons of ethanol per capita</td>
              <td>−0.050</td>
              <td>.73</td>
              <td colspan="2">9.911</td>
              <td>.63</td>
              <td colspan="2">51</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Liquor, gallons of ethanol per capita</td>
              <td>0.320</td>
              <td>.01</td>
              <td colspan="2">62.54</td>
              <td>.03</td>
              <td colspan="2">51</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>All sources, gallons of ethanol per capita</td>
              <td>0.437</td>
              <td>&#60;.001</td>
              <td colspan="2">146.6</td>
              <td>&#60;.001</td>
              <td colspan="2">51</td>
            </tr>
            <tr valign="top">
              <td colspan="9">
                <bold>US states and Washington, DC, hashtags stratified by alcohol category</bold>
              </td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Wine, gallons of ethanol per capita (5 hashtags)</td>
              <td>0.754</td>
              <td>&#60;.001</td>
              <td colspan="2">214.6</td>
              <td>&#60;.001</td>
              <td colspan="2">51</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Beer, gallons of ethanol per capita (19 hashtags)</td>
              <td>−0.001</td>
              <td>.99</td>
              <td colspan="2">16.05</td>
              <td>.63</td>
              <td colspan="2">51</td>
            </tr>
            <tr valign="top">
              <td>
                <break/>
              </td>
              <td>Liquor, gallons of ethanol per capita (3 hashtags)</td>
              <td>0.140</td>
              <td>.33</td>
              <td colspan="2">338.0</td>
              <td>.01</td>
              <td colspan="2"> 51</td>
            </tr>
          </tbody>
        </table>
      </table-wrap>
      <fig id="figure3" position="float">
        <label>Figure 3</label>
        <caption>
          <p>Metropolitan-micropolitan statistical area correlations for alcohol-hashtagged tweets and percent self-reported alcohol consumption. (A) Number of alcohol-hashtagged tweets and self-reported alcohol consumption within 30 days (N=179); (B) number of alcohol-hashtagged tweets and self-reported binge drinking within 30 days (N=179); (C) number of alcohol-hashtagged tweets and self-reported heavy drinking within 30 days (N=179).</p>
        </caption>
        <graphic xlink:href="jmir_v23i9e27314_fig3.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>There was a significant correlation between the percentage of motor vehicle deaths reported as involving alcohol (<italic>P</italic>&#60;.001) and aggregated measures of excessive drinking behavior (<italic>P</italic>&#60;.001) at the county level (<xref rid="figure4" ref-type="fig">Figure 4</xref>). However, the relationship between alcohol-related motor vehicle fatalities and county tweets per population was not significant after adjusting for confounding effects (<italic>P</italic>=.21).</p>
      <fig id="figure4" position="float">
        <label>Figure 4</label>
        <caption>
          <p>County- and county-equivalent–level correlations for alcohol-hashtagged tweets, alcohol motor vehicle fatalities, and self-reported excessive alcohol consumption. Counties are included if they contain at least one tweet and 1000 people (N=2641). (A) County-level correlations for alcohol-hashtagged tweets per population and percentage of motor vehicle fatalities involving alcohol. (B) County-level correlations for alcohol-hashtagged tweets per population and percent self-reporting excessive drinking (reporting either more than five alcoholic drinks on a single occasion for men or more than four alcoholic drinks on a single occasion for women, or more than two drinks per day for men or more than one drink per day for women).</p>
        </caption>
        <graphic xlink:href="jmir_v23i9e27314_fig4.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>There was a significant correlation between the number of alcohol-hashtagged tweets and wineries (<italic>P=</italic>.05), breweries (<italic>P</italic>&#60;.001), and drinking places (alcoholic beverages; <italic>P</italic>&#60;.001) but not beer, wine, and liquor stores (<italic>P</italic>=.11) per capita at the county level (<xref rid="figure5" ref-type="fig">Figure 5</xref>). However, after adjusting for confounding effects, there was a significant association between alcohol-related tweets per population and beer, wine, and liquor stores (<italic>P</italic>&#60;.001) but not drinking places (<italic>P</italic>=.23) per capita.</p>
      <fig id="figure5" position="float">
        <label>Figure 5</label>
        <caption>
          <p>County- and county-equivalent–level correlations for alcohol-hashtagged tweets per person and alcohol-serving outlets, as reported by the North American Industry Classification System. Counties are included if they have at least one (1) tweet in our data set, one (1) alcohol outlet, and contain a population of 1000. (A) Wineries per 10,000 people (n=228 counties); (B) breweries per 10,000 people (n=334); (C) liquor stores per 10,000 people (n=1444); (D) drinking places (alcoholic beverages) per 10,000 people (n=1479).</p>
        </caption>
        <graphic xlink:href="jmir_v23i9e27314_fig5.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
      <p>There was a significant correlation between the prevalence of alcohol-hashtagged tweets and gallons of wine (<italic>P</italic>&#60;.001), liquor (<italic>P</italic>=.01), and overall gallons of consumption (<italic>P</italic>&#60;.001) at the state level (<xref rid="figure6" ref-type="fig">Figure 6</xref>). However, the association with all alcohol-hashtagged tweets and gallons of beer consumed was not significant (<italic>P</italic>=.63).</p>
      <p>The prevalence of five wine hashtags had a significant association with wine consumption at the state level (<italic>P</italic>&#60;.001), but 3 liquor hashtags and 19 beer hashtags did not have a significant relationship with liquor (<italic>P</italic>=.33) and beer (<italic>P</italic>=.99) consumption at the state level. However, there was a significant relationship between gallons of liquor consumed and the prevalence of 3 liquor hashtags (<italic>P=</italic>.01) after controlling for confounding effects (<xref rid="figure6" ref-type="fig">Figure 6</xref>).</p>
      <fig id="figure6" position="float">
        <label>Figure 6</label>
        <caption>
          <p>Gallons of ethanol consumed for US states and alcohol-hashtagged tweets. Population normalization was performed using the average reported population between 2010 and 2018, as reported by the National Institute of Alcohol Abuse and Alcoholism. Top, all 24 hashtags used; gallons of ethanol consumed from (A) wine; (B) beer; (C) liquor; and (D) all alcohol sources and Twitter posts per population. Bottom, only specific hashtags, gallons of ethanol from wine, beer, and liquor, and Twitter posts per population from specific hashtags: (E) wine (5 wine hashtags); (F) beer (14 beer hashtags); (G) liquor (3 liquor hashtags).</p>
        </caption>
        <graphic xlink:href="jmir_v23i9e27314_fig6.png" alt-version="no" mimetype="image" position="float" xlink:type="simple"/>
      </fig>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>We demonstrated that information from alcohol-related subreddits could identify alcohol-related hashtags that correlated with multiple alcohol-related outcomes. The prevalence of geotagged tweets containing these significantly alcohol-related hashtags correlates with alcohol-related behaviors and alcohol outlet density, which are associated with adverse outcomes, including deaths from motor vehicle crashes and excessive drinking [<xref ref-type="bibr" rid="ref95">95</xref>-<xref ref-type="bibr" rid="ref97">97</xref>]. This approach has distinct benefits for studying alcohol-related outcomes. Compared with other approaches to detect alcohol consumption on Twitter, the pipeline presented here is trained using relatively few interpretable input and output parameters, specifically, 18 subreddits and 24 hashtags. The NLP pipeline identified language associated with alcohol abuse on Twitter without manual annotation or predefined keywords and with only the knowledge of relevant subreddits. These results indicate that alcohol-related language, when defined by inclusion into the themed communities of subreddits or containing alcohol-related hashtags, can be used to understand population-level behavior in multiple geographic areas with different population granularity.</p>
        <p>Qualitatively, the model presented here detects a wide variety of different alcohol-related hashtags, including slang. Tweets containing these hashtags capture a large amount of information regarding alcohol consumption behavior at a broad population level. The set of hashtags resulting from this study is useful for future alcohol-related research on Twitter and identifying relevant hashtags or community forum labels on other platforms.</p>
        <p>A notable benefit of using hashtags and subreddits as platform-specific labels for studying alcohol-related outcomes is interpretability. Although deep learning models excel at understanding massive quantities of data, many NLP and deep learning models rely on complex feature representations to classify or characterize text. However, this approach is not easily interpretable [<xref ref-type="bibr" rid="ref65">65</xref>,<xref ref-type="bibr" rid="ref98">98</xref>]. We have demonstrated that by treating subreddits and hashtags as learnable labels, it is possible to directly use hashtags as interpretable features in our NLP pipeline for social media data to understand alcoholic beverage preferences while still learning from a large amount of data.</p>
        <p>Consumption of different alcohol types is associated with a variety of both beneficial and detrimental outcomes [<xref ref-type="bibr" rid="ref99">99</xref>-<xref ref-type="bibr" rid="ref101">101</xref>]. For example, wine consumption is associated with protection from cardiovascular diseases; however, the cause of this effect may be dietary factors and other lifestyle choices [<xref ref-type="bibr" rid="ref99">99</xref>,<xref ref-type="bibr" rid="ref102">102</xref>]. Other studies have associated preferential beer and liquor consumption with adverse outcomes, such as dangerous drinking and other risky behaviors [<xref ref-type="bibr" rid="ref101">101</xref>,<xref ref-type="bibr" rid="ref103">103</xref>,<xref ref-type="bibr" rid="ref104">104</xref>]. Notably, although many studies have examined overall alcohol mentions on Twitter, few models created have been explicitly examined in terms of differences in the types of alcoholic beverages mentioned.</p>
        <p>Our study indicates that information capturing consumption of wine and liquor is directly observable using social media data, as shown by the significant associations between the prevalence of 5 wine-related hashtags and the amount of wine consumed, as well as the number of posts containing at least 1 of the 3 liquor-related hashtags and liquor consumed. However, there was no significant relationship between beer consumption per capita and the number of alcohol-hashtagged Twitter posts in an area. The results here indicate that our model can detect certain types of alcohol consumption behavior (wine and liquor consumption) on Twitter using the interpretability of hashtags but not others (beer consumption). It remains unclear whether our results indicate a bias in our model’s methodological choice (eg, use of hashtags or training procedure) or a difference in social media populations that prefer different alcohol beverages. The difference in correlations might be because of several variables, including the existence of confounding factors related to the prevalence of social media use in the underlying populations that preferentially consume beer over other alcohol types, differences in perceived acceptance of beer consumption behavior, or because of other factors that may confound alcohol and social media posting [<xref ref-type="bibr" rid="ref89">89</xref>]. Alcohol preference is an example of having interpretable hashtag representations for a given model that may help identify behavioral differences associated with an outcome of interest. This evidence suggests that similar models trained on Twitter may detect alcohol wine and liquor consumption but not beer.</p>
      </sec>
      <sec>
        <title>Comparison With Previous Works</title>
        <p>Many previous studies have used hashtags as target labels. However, they mostly rely on a predefined set of hashtags that may not be data-driven or require extensive expert annotation instead of taking advantage of topic-specific sources and social media content on other public social media platforms [<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref105">105</xref>-<xref ref-type="bibr" rid="ref107">107</xref>]. Notably, using a predefined number of hashtags could be biased and too narrow for capturing relevant information, potentially missing informative hashtags for exposure or outcome. Traditional keyword approaches may fail to capture various pieces of information from slang and novel hashtags from platform-specific languages as they are created and popularized. In addition, keyword databases may not exist for all outcomes of interest. Semantic similarity measures, such as Word2vec, may identify hashtags with similar contexts; however, integrating vector representations may lose valuable information relative to training over individual samples, and prediction probabilities or certainty are not readily observable. In contrast, this study indicates that a model trained on a large set of data relevant to the behavior of interest and its application to an unlabeled data set from a different platform can identify data-driven hashtags related to that behavior. This ability to learn hashtags from data is critical, as new hashtags are created every day and may differ substantially between platforms.</p>
        <p>Many social media platforms are directly searchable using hashtags, allowing the ability to gather many highly specific posts instead of gathering a large number of nonspecific posts to identify relevant hashtags, keywords, or alcohol content based on available prevalence data. Although the latter approach has shown success in studying alcohol-related behavior previously, methods to extend the analysis to alternative but potentially related outcomes, platforms, or different geographical designations remain unclear [<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref108">108</xref>]. The generalization of such models necessitates the creation of individual models for each particular outcome and geographic area. Finally, these models may fail to take advantage of extensive research on themed communities to understand alcohol use and other outcomes of interest [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref39">39</xref>,<xref ref-type="bibr" rid="ref40">40</xref>,<xref ref-type="bibr" rid="ref76">76</xref>,<xref ref-type="bibr" rid="ref106">106</xref>,<xref ref-type="bibr" rid="ref109">109</xref>,<xref ref-type="bibr" rid="ref110">110</xref>]. In contrast, the method outlined here may help create more efficient public health interventions to analyze the alcohol consumption behavior for a given geographic area of interest, such as a city or hospital catchment area. This approach is particularly useful when the relevant language is dynamic or contains area-specific slang, making previously established dictionary-based methods incomplete or impractical. In particular, our proposed methodology for identifying hashtags using a previously trained deep learning model can be useful for detecting alcohol consumption behavior on various social media platforms.</p>
      </sec>
      <sec>
        <title>Limitations and Future Work</title>
        <p>There are some limitations to the model and approach proposed in this study. Other health-related behaviors that are not discussed frequently on social media may be more difficult to ascertain and translate between platforms using hashtags. Any model trained on a limited number of social media platforms may be confounded by differences in user preferences, such as age or socioeconomic status. Furthermore, this method relies on identifying known or previously studied subreddits, which may not be suitable for outcomes without known relevant subreddits. Furthermore, we did not compare our models’ performance with the BERT large model or other deep learning alternatives, which can have a different performance for our task. In addition, including additional social media data in model development and using domain knowledge from ontologies, controlled vocabularies, lexicons, and relevant rules and regular expressions can further improve the presented results.</p>
        <p>As future work, we plan to extend this study to other mental and behavioral health topics, such as depression and substance use, and other social media platforms that use hashtags, such as Facebook and Instagram. Deep learning has previously been used to combine the analysis of images and texts from social media users [<xref ref-type="bibr" rid="ref38">38</xref>]. In our future work, we will expand the presented architecture to include other data modalities, such as images and videos, to increase screening capabilities.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>These results indicate that using alcohol-related subreddits as learnable labels to train a BERT neural network can capture interpretable, alcohol-related language on Twitter. Our study suggests a significant correlation between the prevalence of alcohol-related geotagged Twitter hashtags and alcohol-related behaviors as measured by self-reported alcohol consumption, alcohol preferences, and alcohol outlet prevalence. This method has the unique advantages of previous methods, including allowing examination at the MMSA, US county, and US state level for different alcohol-related outcomes. These results suggest that using previously studied hashtags and subreddits as learnable targets in a machine learning framework could expand public health outreach efforts and epidemiology research, particularly for monitoring behavior related to alcohol consumption.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">API</term>
          <def>
            <p>application programming interface</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">BERT</term>
          <def>
            <p>Bidirectional Encoder Representations From Transformers</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">MMSA</term>
          <def>
            <p>metropolitan-micropolitan statistical area</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">NLP</term>
          <def>
            <p>natural language processing</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>Financial support for this work was provided by a National Library of Medicine of the National Institutes of Health T32 training grant through the award number T32LM012204. The authors would like to thank Lamar Moss, Natasha de la Rosa-Rivera, and Richard Ricard for their help and suggestions for improving the manuscript.</p>
    </ack>
    <fn-group>
      <fn fn-type="con">
        <p>Study concept and design: BJR and SH; analysis and interpretation of data: BJR and SH; collection or assembly of data: BJR; drafting of the manuscript: BJR and SH; critical revision of the manuscript for important intellectual content: BJR and SH; funding: BJR and SH; administrative, technical, and logistic support: SH; and study supervision: SH.</p>
      </fn>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Osna</surname>
              <given-names>NA</given-names>
            </name>
            <name name-style="western">
              <surname>Donohue</surname>
              <given-names>TM</given-names>
            </name>
            <name name-style="western">
              <surname>Kharbanda</surname>
              <given-names>KK</given-names>
            </name>
          </person-group>
          <article-title>Alcoholic liver disease: pathogenesis and current management</article-title>
          <source>Alcohol Res</source>
          <year>2017</year>
          <volume>38</volume>
          <issue>2</issue>
          <fpage>147</fpage>
          <lpage>61</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28988570"/>
          </comment>
          <pub-id pub-id-type="medline">28988570</pub-id>
          <pub-id pub-id-type="pmcid">PMC5513682</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Keefe</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Bhatti</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Bajwa</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>DiNicolantonio</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Lavie</surname>
              <given-names>CJ</given-names>
            </name>
          </person-group>
          <article-title>Alcohol and cardiovascular health: the dose makes the poison…or the remedy</article-title>
          <source>Mayo Clin Proc</source>
          <year>2014</year>
          <month>03</month>
          <volume>89</volume>
          <issue>3</issue>
          <fpage>382</fpage>
          <lpage>93</lpage>
          <pub-id pub-id-type="doi">10.1016/j.mayocp.2013.11.005</pub-id>
          <pub-id pub-id-type="medline">24582196</pub-id>
          <pub-id pub-id-type="pii">S0025-6196(13)01002-1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <article-title>Alcohol and public health: Alcohol-Related Disease Impact (ARDI)</article-title>
          <source>Centers for Disease Control and Prevention (CDC)</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://nccd.cdc.gov/DPH_ARDI/default/default.aspx">https://nccd.cdc.gov/DPH_ARDI/default/default.aspx</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Sullivan</surname>
              <given-names>EV</given-names>
            </name>
            <name name-style="western">
              <surname>Honnorat</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Adeli</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Podhajsky</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>De Bellis</surname>
              <given-names>MD</given-names>
            </name>
            <name name-style="western">
              <surname>Voyvodic</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Nooner</surname>
              <given-names>KB</given-names>
            </name>
            <name name-style="western">
              <surname>Baker</surname>
              <given-names>FC</given-names>
            </name>
            <name name-style="western">
              <surname>Colrain</surname>
              <given-names>IM</given-names>
            </name>
            <name name-style="western">
              <surname>Tapert</surname>
              <given-names>SF</given-names>
            </name>
            <name name-style="western">
              <surname>Brown</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Thompson</surname>
              <given-names>WK</given-names>
            </name>
            <name name-style="western">
              <surname>Nagel</surname>
              <given-names>BJ</given-names>
            </name>
            <name name-style="western">
              <surname>Clark</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Pfefferbaum</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Pohl</surname>
              <given-names>KM</given-names>
            </name>
          </person-group>
          <article-title>Association of heavy drinking with deviant fiber tract development in frontal brain systems in adolescents</article-title>
          <source>JAMA Psychiatry</source>
          <year>2021</year>
          <month>04</month>
          <day>01</day>
          <volume>78</volume>
          <issue>4</issue>
          <fpage>407</fpage>
          <lpage>15</lpage>
          <pub-id pub-id-type="doi">10.1001/jamapsychiatry.2020.4064</pub-id>
          <pub-id pub-id-type="medline">33377940</pub-id>
          <pub-id pub-id-type="pii">2774515</pub-id>
          <pub-id pub-id-type="pmcid">PMC7774050</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Litt</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Lewis</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Spiro</surname>
              <given-names>ES</given-names>
            </name>
            <name name-style="western">
              <surname>Aulck</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Waldron</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Head-Corliss</surname>
              <given-names>MK</given-names>
            </name>
            <name name-style="western">
              <surname>Swanson</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>#drunktwitter: examining the relations between alcohol-related Twitter content and alcohol willingness and use among underage young adults</article-title>
          <source>Drug Alcohol Depend</source>
          <year>2018</year>
          <month>12</month>
          <day>01</day>
          <volume>193</volume>
          <fpage>75</fpage>
          <lpage>82</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30343237"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.drugalcdep.2018.08.021</pub-id>
          <pub-id pub-id-type="medline">30343237</pub-id>
          <pub-id pub-id-type="pii">S0376-8716(18)30668-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC6239902</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Perrin</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Anderson</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Share of U.S. adults using social media, including Facebook, is mostly unchanged since 2018</article-title>
          <source>Pew Research Center</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.pewresearch.org/fact-tank/2019/04/10/share-of-u-s-adults-using-social-media-including-facebook-is-mostly-unchanged-since-2018/">https://www.pewresearch.org/fact-tank/2019/04/10/share-of-u-s-adults-using-social-media-including-facebook-is-mostly-unchanged-since-2018/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="web">
          <article-title>2018 National Survey of Drug Use and Health (NSDUH) releases</article-title>
          <source>SAMHSA</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.samhsa.gov/data/release/2018-national-survey-drug-use-and-health-nsduh-releases">https://www.samhsa.gov/data/release/2018-national-survey-drug-use-and-health-nsduh-releases</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bonar</surname>
              <given-names>EE</given-names>
            </name>
            <name name-style="western">
              <surname>Schneeberger</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Bourque</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bauermeister</surname>
              <given-names>JA</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>SD</given-names>
            </name>
            <name name-style="western">
              <surname>Blow</surname>
              <given-names>FC</given-names>
            </name>
            <name name-style="western">
              <surname>Cunningham</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Bohnert</surname>
              <given-names>AS</given-names>
            </name>
            <name name-style="western">
              <surname>Zimmerman</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Walton</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Social media interventions for risky drinking among adolescents and emerging adults: protocol for a randomized controlled trial</article-title>
          <source>JMIR Res Protoc</source>
          <year>2020</year>
          <month>05</month>
          <day>13</day>
          <volume>9</volume>
          <issue>5</issue>
          <fpage>e16688</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.researchprotocols.org/2020/5/e16688/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/16688</pub-id>
          <pub-id pub-id-type="medline">32401225</pub-id>
          <pub-id pub-id-type="pii">v9i5e16688</pub-id>
          <pub-id pub-id-type="pmcid">PMC7254293</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Arigo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Pagoto</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Carter-Harris</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Lillie</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Nebeker</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Using social media for health research: methodological and ethical considerations for recruitment and intervention delivery</article-title>
          <source>Digit Health</source>
          <year>2018</year>
          <month>5</month>
          <day>7</day>
          <volume>4</volume>
          <fpage>2055207618771757</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/2055207618771757?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/2055207618771757</pub-id>
          <pub-id pub-id-type="medline">29942634</pub-id>
          <pub-id pub-id-type="pii">10.1177_2055207618771757</pub-id>
          <pub-id pub-id-type="pmcid">PMC6016568</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Infodemiology: the epidemiology of (mis)information</article-title>
          <source>Am J Med</source>
          <year>2002</year>
          <month>12</month>
          <day>15</day>
          <volume>113</volume>
          <issue>9</issue>
          <fpage>763</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1016/s0002-9343(02)01473-0</pub-id>
          <pub-id pub-id-type="medline">12517369</pub-id>
          <pub-id pub-id-type="pii">S0002934302014730</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mavragani</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Infodemiology and infoveillance: scoping review</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>04</month>
          <day>28</day>
          <volume>22</volume>
          <issue>4</issue>
          <fpage>e16206</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/4/e16206/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/16206</pub-id>
          <pub-id pub-id-type="medline">32310818</pub-id>
          <pub-id pub-id-type="pii">v22i4e16206</pub-id>
          <pub-id pub-id-type="pmcid">PMC7189791</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eysenbach</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Infodemiology and infoveillance: framework for an emerging set of public health informatics methods to analyze search, communication and publication behavior on the internet</article-title>
          <source>J Med Internet Res</source>
          <year>2009</year>
          <month>03</month>
          <day>27</day>
          <volume>11</volume>
          <issue>1</issue>
          <fpage>e11</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2009/1/e11/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.1157</pub-id>
          <pub-id pub-id-type="medline">19329408</pub-id>
          <pub-id pub-id-type="pii">v11i1e11</pub-id>
          <pub-id pub-id-type="pmcid">PMC2762766</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Martino</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Brooks</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Browne</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Carah</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Zorbas</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Corben</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Saleeba</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Martin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Peeters</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Backholer</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>The nature and extent of online marketing by big food and big alcohol during the COVID-19 pandemic in Australia: content analysis study</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <month>03</month>
          <day>12</day>
          <volume>7</volume>
          <issue>3</issue>
          <fpage>e25202</fpage>
          <pub-id pub-id-type="doi">10.2196/25202</pub-id>
          <pub-id pub-id-type="medline">33709935</pub-id>
          <pub-id pub-id-type="pii">v7i3e25202</pub-id>
          <pub-id pub-id-type="pmcid">PMC7958974</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Song</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Qian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yu</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Mobile health interventions for self-control of unhealthy alcohol use: systematic review</article-title>
          <source>JMIR Mhealth Uhealth</source>
          <year>2019</year>
          <month>01</month>
          <day>29</day>
          <volume>7</volume>
          <issue>1</issue>
          <fpage>e10899</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mhealth.jmir.org/2019/1/e10899/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/10899</pub-id>
          <pub-id pub-id-type="medline">30694200</pub-id>
          <pub-id pub-id-type="pii">v7i1e10899</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371076</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dawson</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Goldstein</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Pickering</surname>
              <given-names>RP</given-names>
            </name>
            <name name-style="western">
              <surname>Grant</surname>
              <given-names>BF</given-names>
            </name>
          </person-group>
          <article-title>Nonresponse bias in survey estimates of alcohol consumption and its association with harm</article-title>
          <source>J Stud Alcohol Drugs</source>
          <year>2014</year>
          <month>07</month>
          <volume>75</volume>
          <issue>4</issue>
          <fpage>695</fpage>
          <lpage>703</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/24988268"/>
          </comment>
          <pub-id pub-id-type="doi">10.15288/jsad.2014.75.695</pub-id>
          <pub-id pub-id-type="medline">24988268</pub-id>
          <pub-id pub-id-type="pmcid">PMC4108608</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sartor</surname>
              <given-names>CE</given-names>
            </name>
            <name name-style="western">
              <surname>Bucholz</surname>
              <given-names>KK</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>EC</given-names>
            </name>
            <name name-style="western">
              <surname>Madden</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Lynskey</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Heath</surname>
              <given-names>AC</given-names>
            </name>
          </person-group>
          <article-title>Reporting bias in the association between age at first alcohol use and heavy episodic drinking</article-title>
          <source>Alcohol Clin Exp Res</source>
          <year>2011</year>
          <month>08</month>
          <volume>35</volume>
          <issue>8</issue>
          <fpage>1418</fpage>
          <lpage>25</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/21438885"/>
          </comment>
          <pub-id pub-id-type="doi">10.1111/j.1530-0277.2011.01477.x</pub-id>
          <pub-id pub-id-type="medline">21438885</pub-id>
          <pub-id pub-id-type="pmcid">PMC3128178</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Davis</surname>
              <given-names>CG</given-names>
            </name>
            <name name-style="western">
              <surname>Thake</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Vilhena</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Social desirability biases in self-reported alcohol consumption and harms</article-title>
          <source>Addict Behav</source>
          <year>2010</year>
          <month>04</month>
          <volume>35</volume>
          <issue>4</issue>
          <fpage>302</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1016/j.addbeh.2009.11.001</pub-id>
          <pub-id pub-id-type="medline">19932936</pub-id>
          <pub-id pub-id-type="pii">S0306-4603(09)00307-4</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zappavigna</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Searchable talk: the linguistic functions of hashtags</article-title>
          <source>Soc Semiot</source>
          <year>2015</year>
          <month>01</month>
          <day>09</day>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>274</fpage>
          <lpage>91</lpage>
          <pub-id pub-id-type="doi">10.1080/10350330.2014.996948</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref19">
        <label>19</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Berry</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Lobban</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Belousov</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Emsley</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Nenadic</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bucci</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>#WhyWeTweetMH: understanding why people use twitter to discuss mental health problems</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>04</month>
          <day>05</day>
          <volume>19</volume>
          <issue>4</issue>
          <fpage>e107</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/4/e107/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.6173</pub-id>
          <pub-id pub-id-type="medline">28381392</pub-id>
          <pub-id pub-id-type="pii">v19i4e107</pub-id>
          <pub-id pub-id-type="pmcid">PMC5399219</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref20">
        <label>20</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Modrek</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chakalov</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>The #MeToo Movement in the United States: text analysis of early Twitter conversations</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>09</month>
          <day>03</day>
          <volume>21</volume>
          <issue>9</issue>
          <fpage>e13837</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/9/e13837/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13837</pub-id>
          <pub-id pub-id-type="medline">31482849</pub-id>
          <pub-id pub-id-type="pii">v21i9e13837</pub-id>
          <pub-id pub-id-type="pmcid">PMC6751092</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref21">
        <label>21</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>O'Neil</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sojo</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Fileborn</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Scovelle</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Milner</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>The #MeToo movement: an opportunity in public health?</article-title>
          <source>Lancet</source>
          <year>2018</year>
          <month>06</month>
          <day>30</day>
          <volume>391</volume>
          <issue>10140</issue>
          <fpage>2587</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1016/S0140-6736(18)30991-7</pub-id>
          <pub-id pub-id-type="medline">30070210</pub-id>
          <pub-id pub-id-type="pii">S0140-6736(18)30991-7</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref22">
        <label>22</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kero</surname>
              <given-names>KM</given-names>
            </name>
            <name name-style="western">
              <surname>Puuronen</surname>
              <given-names>AH</given-names>
            </name>
            <name name-style="western">
              <surname>Nyqvist</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Langén</surname>
              <given-names>VL</given-names>
            </name>
          </person-group>
          <article-title>Usability of two brief questions as a screening tool for domestic violence and effect of #MeToo on prevalence of self-reported violence</article-title>
          <source>Eur J Obstet Gynecol Reprod Biol</source>
          <year>2020</year>
          <month>12</month>
          <volume>255</volume>
          <fpage>92</fpage>
          <lpage>7</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/33113404"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.ejogrb.2020.10.024</pub-id>
          <pub-id pub-id-type="medline">33113404</pub-id>
          <pub-id pub-id-type="pii">S0301-2115(20)30662-X</pub-id>
          <pub-id pub-id-type="pmcid">PMC7566797</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref23">
        <label>23</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Platt</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>Brady</surname>
              <given-names>RR</given-names>
            </name>
          </person-group>
          <article-title>#BCSM and #breastcancer: contemporary cancer-specific online social media communities</article-title>
          <source>Breast J</source>
          <year>2020</year>
          <month>04</month>
          <volume>26</volume>
          <issue>4</issue>
          <fpage>729</fpage>
          <lpage>33</lpage>
          <pub-id pub-id-type="doi">10.1111/tbj.13576</pub-id>
          <pub-id pub-id-type="medline">31493301</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref24">
        <label>24</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Basch</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>MacLean</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Breast cancer on Instagram: a descriptive study</article-title>
          <source>Int J Prev Med</source>
          <year>2019</year>
          <month>10</month>
          <day>9</day>
          <volume>10</volume>
          <fpage>166</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32133084"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/ijpvm.IJPVM_36_19</pub-id>
          <pub-id pub-id-type="medline">32133084</pub-id>
          <pub-id pub-id-type="pii">IJPVM-10-166</pub-id>
          <pub-id pub-id-type="pmcid">PMC6826772</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref25">
        <label>25</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>George</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Britto</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Krishnan</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Dass</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Prasant</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Aravindhan</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>Assessment of hashtag (#) campaigns aimed at health awareness in social media</article-title>
          <source>J Educ Health Promot</source>
          <year>2018</year>
          <month>9</month>
          <day>14</day>
          <volume>7</volume>
          <fpage>114</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jehp.net/article.asp?issn=2277-9531;year=2018;volume=7;issue=1;spage=114;epage=114;aulast=George"/>
          </comment>
          <pub-id pub-id-type="doi">10.4103/jehp.jehp_37_18</pub-id>
          <pub-id pub-id-type="medline">30271799</pub-id>
          <pub-id pub-id-type="pii">JEHP-7-114</pub-id>
          <pub-id pub-id-type="pmcid">PMC6149119</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref26">
        <label>26</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mercier</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Senter</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Webster</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Henderson Riley</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Instagram users' experiences of miscarriage</article-title>
          <source>Obstet Gynecol</source>
          <year>2020</year>
          <month>01</month>
          <volume>135</volume>
          <issue>1</issue>
          <fpage>166</fpage>
          <lpage>73</lpage>
          <pub-id pub-id-type="doi">10.1097/AOG.0000000000003621</pub-id>
          <pub-id pub-id-type="medline">31809440</pub-id>
          <pub-id pub-id-type="pii">00006250-202001000-00022</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref27">
        <label>27</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Laestadius</surname>
              <given-names>LI</given-names>
            </name>
            <name name-style="western">
              <surname>Wahl</surname>
              <given-names>MM</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>YI</given-names>
            </name>
          </person-group>
          <article-title>#Vapelife: an exploratory study of electronic cigarette use and promotion on instagram</article-title>
          <source>Subst Use Misuse</source>
          <year>2016</year>
          <month>10</month>
          <day>14</day>
          <volume>51</volume>
          <issue>12</issue>
          <fpage>1669</fpage>
          <lpage>73</lpage>
          <pub-id pub-id-type="doi">10.1080/10826084.2016.1188958</pub-id>
          <pub-id pub-id-type="medline">27484191</pub-id>
          <pub-id pub-id-type="pii">10.1080/10826084.2016.1188958</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref28">
        <label>28</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kudchadkar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Carroll</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>Using social media for rapid information dissemination in a pandemic: #PedsICU and coronavirus disease 2019</article-title>
          <source>Pediatr Crit Care Med</source>
          <year>2020</year>
          <month>08</month>
          <volume>21</volume>
          <issue>8</issue>
          <fpage>538</fpage>
          <lpage>46</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32459792"/>
          </comment>
          <pub-id pub-id-type="doi">10.1097/PCC.0000000000002474</pub-id>
          <pub-id pub-id-type="medline">32459792</pub-id>
          <pub-id pub-id-type="pii">00130478-202008000-00030</pub-id>
          <pub-id pub-id-type="pmcid">PMC7255404</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref29">
        <label>29</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gkotsis</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Oellrich</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Velupillai</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Liakata</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hubbard</surname>
              <given-names>TJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dobson</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Dutta</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Characterisation of mental health conditions in social media using informed deep learning</article-title>
          <source>Sci Rep</source>
          <year>2017</year>
          <month>03</month>
          <day>22</day>
          <volume>7</volume>
          <fpage>45141</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/srep45141"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/srep45141</pub-id>
          <pub-id pub-id-type="medline">28327593</pub-id>
          <pub-id pub-id-type="pii">srep45141</pub-id>
          <pub-id pub-id-type="pmcid">PMC5361083</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref30">
        <label>30</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Tamersoy</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>De Choudhury</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chau</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Characterizing smoking and drinking abstinence from social media</article-title>
          <source>HT ACM Conf Hypertext Soc Media</source>
          <year>2015</year>
          <month>09</month>
          <volume>2015</volume>
          <fpage>139</fpage>
          <lpage>48</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26640831"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2700171.2791247</pub-id>
          <pub-id pub-id-type="medline">26640831</pub-id>
          <pub-id pub-id-type="pmcid">PMC4668115</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref31">
        <label>31</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Lu</surname>
              <given-names>X</given-names>
            </name>
          </person-group>
          <article-title>Analyzing hidden populations online: topic, emotion, and social network of HIV-related users in the largest Chinese online community</article-title>
          <source>BMC Med Inform Decis Mak</source>
          <year>2018</year>
          <month>01</month>
          <day>05</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>2</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcmedinformdecismak.biomedcentral.com/articles/10.1186/s12911-017-0579-1"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12911-017-0579-1</pub-id>
          <pub-id pub-id-type="medline">29304788</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12911-017-0579-1</pub-id>
          <pub-id pub-id-type="pmcid">PMC5755307</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref32">
        <label>32</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pandrekar</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Gopalkrishna</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Saltz</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Saltz</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Social media based analysis of opioid epidemic using Reddit</article-title>
          <source>AMIA Annu Symp Proc</source>
          <year>2018</year>
          <month>12</month>
          <day>5</day>
          <volume>2018</volume>
          <fpage>867</fpage>
          <lpage>76</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30815129"/>
          </comment>
          <pub-id pub-id-type="medline">30815129</pub-id>
          <pub-id pub-id-type="pmcid">PMC6371364</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref33">
        <label>33</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kochan</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ong</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Guler</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Johannson</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Ryerson</surname>
              <given-names>CJ</given-names>
            </name>
            <name name-style="western">
              <surname>Goobie</surname>
              <given-names>GC</given-names>
            </name>
          </person-group>
          <article-title>Social media content of idiopathic pulmonary fibrosis groups and pages on Facebook: cross-sectional analysis</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2021</year>
          <month>05</month>
          <day>31</day>
          <volume>7</volume>
          <issue>5</issue>
          <fpage>e24199</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2021/5/e24199/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/24199</pub-id>
          <pub-id pub-id-type="medline">34057425</pub-id>
          <pub-id pub-id-type="pii">v7i5e24199</pub-id>
          <pub-id pub-id-type="pmcid">PMC8204239</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref34">
        <label>34</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gruebner</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Lowe</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Sykora</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shankardass</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Subramanian</surname>
              <given-names>SV</given-names>
            </name>
            <name name-style="western">
              <surname>Galea</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>A novel surveillance approach for disaster mental health</article-title>
          <source>PLoS One</source>
          <year>2017</year>
          <month>7</month>
          <day>19</day>
          <volume>12</volume>
          <issue>7</issue>
          <fpage>e0181233</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0181233"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0181233</pub-id>
          <pub-id pub-id-type="medline">28723959</pub-id>
          <pub-id pub-id-type="pii">PONE-D-16-19119</pub-id>
          <pub-id pub-id-type="pmcid">PMC5516998</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref35">
        <label>35</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Jurdak</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>AbouJaoude</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cameron</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Newth</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Understanding human mobility from Twitter</article-title>
          <source>PLoS One</source>
          <year>2015</year>
          <month>7</month>
          <day>8</day>
          <volume>10</volume>
          <issue>7</issue>
          <fpage>e0131469</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0131469"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0131469</pub-id>
          <pub-id pub-id-type="medline">26154597</pub-id>
          <pub-id pub-id-type="pii">PONE-D-15-02120</pub-id>
          <pub-id pub-id-type="pmcid">PMC4496063</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref36">
        <label>36</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Tahir</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Hussain</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gogate</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Dashtipour</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ali</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sheikh</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Artificial intelligence-enabled analysis of public attitudes on Facebook and Twitter toward COVID-19 vaccines in the united kingdom and the United States: observational study</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>04</month>
          <day>05</day>
          <volume>23</volume>
          <issue>4</issue>
          <fpage>e26627</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/4/e26627/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26627</pub-id>
          <pub-id pub-id-type="medline">33724919</pub-id>
          <pub-id pub-id-type="pii">v23i4e26627</pub-id>
          <pub-id pub-id-type="pmcid">PMC8023383</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref37">
        <label>37</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Curtis</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Giorgi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Buffone</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Ashford</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Hemmons</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Summers</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hamilton</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>Can Twitter be used to predict county excessive alcohol consumption rates?</article-title>
          <source>PLoS One</source>
          <year>2018</year>
          <month>4</month>
          <day>4</day>
          <volume>13</volume>
          <issue>4</issue>
          <fpage>e0194290</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0194290"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0194290</pub-id>
          <pub-id pub-id-type="medline">29617408</pub-id>
          <pub-id pub-id-type="pii">PONE-D-17-28471</pub-id>
          <pub-id pub-id-type="pmcid">PMC5884504</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref38">
        <label>38</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hassanpour</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tomita</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>DeLise</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Crosier</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Marsch</surname>
              <given-names>LA</given-names>
            </name>
          </person-group>
          <article-title>Identifying substance use risk based on deep neural networks and Instagram social media data</article-title>
          <source>Neuropsychopharmacology</source>
          <year>2019</year>
          <month>02</month>
          <volume>44</volume>
          <issue>3</issue>
          <fpage>487</fpage>
          <lpage>94</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30356094"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41386-018-0247-x</pub-id>
          <pub-id pub-id-type="medline">30356094</pub-id>
          <pub-id pub-id-type="pii">10.1038/s41386-018-0247-x</pub-id>
          <pub-id pub-id-type="pmcid">PMC6333814</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref39">
        <label>39</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Marengo</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Azucar</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Giannotta</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Basile</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Settanni</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Exploring the association between problem drinking and language use on Facebook in young adults</article-title>
          <source>Heliyon</source>
          <year>2019</year>
          <month>10</month>
          <day>9</day>
          <volume>5</volume>
          <issue>10</issue>
          <fpage>e02523</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://linkinghub.elsevier.com/retrieve/pii/S2405-8440(19)36183-3"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.heliyon.2019.e02523</pub-id>
          <pub-id pub-id-type="medline">31667380</pub-id>
          <pub-id pub-id-type="pii">S2405-8440(19)36183-3</pub-id>
          <pub-id pub-id-type="pmcid">PMC6812202</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref40">
        <label>40</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Crocamo</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Viviani</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Bartoli</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Carrà</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Pasi</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Detecting binge drinking and alcohol-related risky behaviours from Twitter's users: an exploratory content- and topology-based analysis</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>02</month>
          <day>26</day>
          <volume>17</volume>
          <issue>5</issue>
          <fpage>1510</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17051510"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17051510</pub-id>
          <pub-id pub-id-type="medline">32111047</pub-id>
          <pub-id pub-id-type="pii">ijerph17051510</pub-id>
          <pub-id pub-id-type="pmcid">PMC7084454</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref41">
        <label>41</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cavazos-Rehg</surname>
              <given-names>PA</given-names>
            </name>
            <name name-style="western">
              <surname>Krauss</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Sowles</surname>
              <given-names>SJ</given-names>
            </name>
            <name name-style="western">
              <surname>Bierut</surname>
              <given-names>LJ</given-names>
            </name>
          </person-group>
          <article-title>"Hey Everyone, I'm Drunk." An evaluation of drinking-related Twitter chatter</article-title>
          <source>J Stud Alcohol Drugs</source>
          <year>2015</year>
          <month>07</month>
          <volume>76</volume>
          <issue>4</issue>
          <fpage>635</fpage>
          <lpage>43</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26098041"/>
          </comment>
          <pub-id pub-id-type="doi">10.15288/jsad.2015.76.635</pub-id>
          <pub-id pub-id-type="medline">26098041</pub-id>
          <pub-id pub-id-type="pmcid">PMC4495081</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref42">
        <label>42</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Giorgi</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Yaden</surname>
              <given-names>DB</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Ashford</surname>
              <given-names>RD</given-names>
            </name>
            <name name-style="western">
              <surname>Buffone</surname>
              <given-names>AE</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Curtis</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Cultural differences in Tweeting about drinking across the US</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>02</month>
          <day>11</day>
          <volume>17</volume>
          <issue>4</issue>
          <fpage>1125</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17041125"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17041125</pub-id>
          <pub-id pub-id-type="medline">32053866</pub-id>
          <pub-id pub-id-type="pii">ijerph17041125</pub-id>
          <pub-id pub-id-type="pmcid">PMC7068559</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref43">
        <label>43</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Stellefson</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Paige</surname>
              <given-names>SR</given-names>
            </name>
            <name name-style="western">
              <surname>Chaney</surname>
              <given-names>BH</given-names>
            </name>
            <name name-style="western">
              <surname>Chaney</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Social media and health promotion</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2020</year>
          <month>05</month>
          <day>11</day>
          <volume>17</volume>
          <issue>9</issue>
          <fpage>3323</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph17093323"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph17093323</pub-id>
          <pub-id pub-id-type="medline">32403215</pub-id>
          <pub-id pub-id-type="pii">ijerph17093323</pub-id>
          <pub-id pub-id-type="pmcid">PMC7246655</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref44">
        <label>44</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sadah</surname>
              <given-names>SA</given-names>
            </name>
            <name name-style="western">
              <surname>Shahbazi</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Wiley</surname>
              <given-names>MT</given-names>
            </name>
            <name name-style="western">
              <surname>Hristidis</surname>
              <given-names>V</given-names>
            </name>
          </person-group>
          <article-title>A study of the demographics of web-based health-related social media users</article-title>
          <source>J Med Internet Res</source>
          <year>2015</year>
          <month>08</month>
          <day>06</day>
          <volume>17</volume>
          <issue>8</issue>
          <fpage>e194</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2015/8/e194/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.4308</pub-id>
          <pub-id pub-id-type="medline">26250986</pub-id>
          <pub-id pub-id-type="pii">v17i8e194</pub-id>
          <pub-id pub-id-type="pmcid">PMC4705027</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref45">
        <label>45</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hendriks</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Van den Putte</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Gebhardt</surname>
              <given-names>WA</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Social drinking on social media: content analysis of the social aspects of alcohol-related posts on Facebook and Instagram</article-title>
          <source>J Med Internet Res</source>
          <year>2018</year>
          <month>06</month>
          <day>22</day>
          <volume>20</volume>
          <issue>6</issue>
          <fpage>e226</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2018/6/e226/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.9355</pub-id>
          <pub-id pub-id-type="medline">29934290</pub-id>
          <pub-id pub-id-type="pii">v20i6e226</pub-id>
          <pub-id pub-id-type="pmcid">PMC6035352</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref46">
        <label>46</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Laws</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Hunt</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Antin</surname>
              <given-names>TM</given-names>
            </name>
          </person-group>
          <article-title>Social media platforms as a photo-elicitation tool in research on alcohol intoxication and gender</article-title>
          <source>Nordisk Alkohol Nark</source>
          <year>2018</year>
          <month>08</month>
          <volume>35</volume>
          <issue>4</issue>
          <fpage>288</fpage>
          <lpage>303</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://journals.sagepub.com/doi/10.1177/1455072518781998?url_ver=Z39.88-2003&#38;rfr_id=ori:rid:crossref.org&#38;rfr_dat=cr_pub%3dpubmed"/>
          </comment>
          <pub-id pub-id-type="doi">10.1177/1455072518781998</pub-id>
          <pub-id pub-id-type="medline">30245584</pub-id>
          <pub-id pub-id-type="pmcid">PMC6146389</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref47">
        <label>47</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Gupta</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Lam</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Pettigrew</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tait</surname>
              <given-names>RJ</given-names>
            </name>
          </person-group>
          <article-title>The association between exposure to social media alcohol marketing and youth alcohol use behaviors in India and Australia</article-title>
          <source>BMC Public Health</source>
          <year>2018</year>
          <month>06</month>
          <day>13</day>
          <volume>18</volume>
          <issue>1</issue>
          <fpage>726</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpublichealth.biomedcentral.com/articles/10.1186/s12889-018-5645-9"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12889-018-5645-9</pub-id>
          <pub-id pub-id-type="medline">29895264</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12889-018-5645-9</pub-id>
          <pub-id pub-id-type="pmcid">PMC5998576</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref48">
        <label>48</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rehm</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kilian</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Rovira</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Shield</surname>
              <given-names>KD</given-names>
            </name>
            <name name-style="western">
              <surname>Manthey</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>The elusiveness of representativeness in general population surveys for alcohol</article-title>
          <source>Drug Alcohol Rev</source>
          <year>2021</year>
          <month>02</month>
          <volume>40</volume>
          <issue>2</issue>
          <fpage>161</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.1111/dar.13148</pub-id>
          <pub-id pub-id-type="medline">32830351</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref49">
        <label>49</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nguyen</surname>
              <given-names>QC</given-names>
            </name>
            <name name-style="western">
              <surname>McCullough</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Meng</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Paul</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Kath</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Loomis</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Nsoesie</surname>
              <given-names>EO</given-names>
            </name>
            <name name-style="western">
              <surname>Wen</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>KR</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>F</given-names>
            </name>
          </person-group>
          <article-title>Geotagged US Tweets as predictors of county-level health outcomes, 2015-2016</article-title>
          <source>Am J Public Health</source>
          <year>2017</year>
          <month>11</month>
          <volume>107</volume>
          <issue>11</issue>
          <fpage>1776</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.2105/AJPH.2017.303993</pub-id>
          <pub-id pub-id-type="medline">28933925</pub-id>
          <pub-id pub-id-type="pmcid">PMC5637661</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref50">
        <label>50</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Krauss</surname>
              <given-names>MJ</given-names>
            </name>
            <name name-style="western">
              <surname>Grucza</surname>
              <given-names>RA</given-names>
            </name>
            <name name-style="western">
              <surname>Bierut</surname>
              <given-names>LJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cavazos-Rehg</surname>
              <given-names>PA</given-names>
            </name>
          </person-group>
          <article-title>"Get drunk. Smoke weed. Have fun.": a content analysis of tweets about marijuana and alcohol</article-title>
          <source>Am J Health Promot</source>
          <year>2017</year>
          <month>05</month>
          <volume>31</volume>
          <issue>3</issue>
          <fpage>200</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/26559715"/>
          </comment>
          <pub-id pub-id-type="doi">10.4278/ajhp.150205-QUAL-708</pub-id>
          <pub-id pub-id-type="medline">26559715</pub-id>
          <pub-id pub-id-type="pmcid">PMC4956592</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref51">
        <label>51</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Allem</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dormanesh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Majmundar</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Rivera</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Chu</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Unger</surname>
              <given-names>JB</given-names>
            </name>
            <name name-style="western">
              <surname>Cruz</surname>
              <given-names>TB</given-names>
            </name>
          </person-group>
          <article-title>Leading topics in Twitter discourse on JUUL and Puff Bar products: content analysis</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>07</month>
          <day>19</day>
          <volume>23</volume>
          <issue>7</issue>
          <fpage>e26510</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/7/e26510/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/26510</pub-id>
          <pub-id pub-id-type="medline">34279236</pub-id>
          <pub-id pub-id-type="pii">v23i7e26510</pub-id>
          <pub-id pub-id-type="pmcid">PMC8329759</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref52">
        <label>52</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lorentzen</surname>
              <given-names>DG</given-names>
            </name>
            <name name-style="western">
              <surname>Nolin</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Approaching completeness: capturing a hashtagged Twitter conversation and its follow-on conversation</article-title>
          <source>Soc Sci Comput Rev</source>
          <year>2015</year>
          <month>09</month>
          <day>29</day>
          <volume>35</volume>
          <issue>2</issue>
          <fpage>277</fpage>
          <lpage>86</lpage>
          <pub-id pub-id-type="doi">10.1177/0894439315607018</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref53">
        <label>53</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Le</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
          </person-group>
          <article-title>Distributed representations of sentences and documents</article-title>
          <source>Proceedings of the 31st International Conference on Machine Learning</source>
          <year>2014</year>
          <conf-name>31st International Conference on Machine Learning</conf-name>
          <conf-date>Jun 21-26, 2014</conf-date>
          <conf-loc>Beijing China</conf-loc>
          <fpage>1188</fpage>
          <lpage>96</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://proceedings.mlr.press/v32/le14.html"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref54">
        <label>54</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mikolov</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Corrado</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Dean</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Efficient estimation of word representations in vector space</article-title>
          <source>arXiv: Computer Science, Computation and Language</source>
          <year>2013</year>
          <month>1</month>
          <access-date>2021-09-02</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1301.3781">https://arxiv.org/abs/1301.3781</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref55">
        <label>55</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Saha</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Torous</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ernala</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rizuto</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Stafford</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>De Choudhury</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>A computational study of mental health awareness campaigns on social media</article-title>
          <source>Transl Behav Med</source>
          <year>2019</year>
          <month>11</month>
          <day>25</day>
          <volume>9</volume>
          <issue>6</issue>
          <fpage>1197</fpage>
          <lpage>207</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30834942"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/tbm/ibz028</pub-id>
          <pub-id pub-id-type="medline">30834942</pub-id>
          <pub-id pub-id-type="pii">5369573</pub-id>
          <pub-id pub-id-type="pmcid">PMC6875652</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref56">
        <label>56</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zomick</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Levitan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Serper</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Linguistic analysis of schizophrenia in Reddit posts</article-title>
          <source>Proceedings of the Sixth Workshop on Computational Linguistics and Clinical Psychology</source>
          <year>2019</year>
          <conf-name>Sixth Workshop on Computational Linguistics and Clinical Psychology</conf-name>
          <conf-date>Jun 2019</conf-date>
          <conf-loc>Minneapolis, Minnesota</conf-loc>
          <fpage>74</fpage>
          <lpage>83</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/w19-3009</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref57">
        <label>57</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Devlin</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Toutanova</surname>
              <given-names>K</given-names>
            </name>
          </person-group>
          <article-title>BERT: pre-training of deep bidirectional transformers for language understanding</article-title>
          <source>Assoc Comput Linguist</source>
          <year>2019</year>
          <month>6</month>
          <fpage>4171</fpage>
          <lpage>86</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/N19-1423</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref58">
        <label>58</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rogers</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kovaleva</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Rumshisky</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>A primer in BERTology: what we know about how BERT works</article-title>
          <source>Trans Assoc Comput Linguist</source>
          <year>2020</year>
          <month>12</month>
          <volume>8</volume>
          <fpage>842</fpage>
          <lpage>66</lpage>
          <pub-id pub-id-type="doi">10.1162/tacl_a_00349</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref59">
        <label>59</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mozafari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Farahbakhsh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Crespi</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>A BERT-based transfer learning approach for hate speech detection in online social media</article-title>
          <source>Complex Networks and Their Applications VIII</source>
          <year>2019</year>
          <month>11</month>
          <day>26</day>
          <publisher-loc>Basel, Switzerland</publisher-loc>
          <publisher-name>Springer International Publishing</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref60">
        <label>60</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Heidari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Jones</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using BERT to extract topic-independent sentiment features for social media bot detection</article-title>
          <source>Proceedings of the 11th IEEE Annual Ubiquitous Computing, Electronics &#38; Mobile Communication Conference (UEMCON)</source>
          <year>2020</year>
          <conf-name>11th IEEE Annual Ubiquitous Computing, Electronics &#38; Mobile Communication Conference (UEMCON)</conf-name>
          <conf-date>Oct 28-31, 2020</conf-date>
          <conf-loc>New York, NY, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/uemcon51285.2020.9298158</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref61">
        <label>61</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Mozafari</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Farahbakhsh</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Crespi</surname>
              <given-names>N</given-names>
            </name>
          </person-group>
          <article-title>Hate speech detection and racial bias mitigation in social media based on BERT model</article-title>
          <source>PLoS One</source>
          <year>2020</year>
          <month>8</month>
          <day>27</day>
          <volume>15</volume>
          <issue>8</issue>
          <fpage>e0237861</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0237861"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0237861</pub-id>
          <pub-id pub-id-type="medline">32853205</pub-id>
          <pub-id pub-id-type="pii">PONE-D-20-06639</pub-id>
          <pub-id pub-id-type="pmcid">PMC7451563</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref62">
        <label>62</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pérez-Pérez</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Pérez-Rodríguez</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Fdez-Riverola</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lourenço</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Using Twitter to understand the human bowel disease community: exploratory analysis of key topics</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>08</month>
          <day>15</day>
          <volume>21</volume>
          <issue>8</issue>
          <fpage>e12610</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/8/e12610/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/12610</pub-id>
          <pub-id pub-id-type="medline">31411142</pub-id>
          <pub-id pub-id-type="pii">v21i8e12610</pub-id>
          <pub-id pub-id-type="pmcid">PMC6711036</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref63">
        <label>63</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Li</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Xu</surname>
              <given-names>Q</given-names>
            </name>
            <name name-style="western">
              <surname>Shah</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Mackey</surname>
              <given-names>TK</given-names>
            </name>
          </person-group>
          <article-title>A machine learning approach for the detection and characterization of illicit drug dealers on instagram: model evaluation study</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>06</month>
          <day>15</day>
          <volume>21</volume>
          <issue>6</issue>
          <fpage>e13803</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/6/e13803/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13803</pub-id>
          <pub-id pub-id-type="medline">31199298</pub-id>
          <pub-id pub-id-type="pii">v21i6e13803</pub-id>
          <pub-id pub-id-type="pmcid">PMC6598421</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref64">
        <label>64</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pereira-Kohatsu</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Quijano-Sánchez</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Liberatore</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Camacho-Collados</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Detecting and monitoring hate speech in Twitter</article-title>
          <source>Sensors (Basel)</source>
          <year>2019</year>
          <month>10</month>
          <day>26</day>
          <volume>19</volume>
          <issue>21</issue>
          <fpage>4654</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=s19214654"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/s19214654</pub-id>
          <pub-id pub-id-type="medline">31717760</pub-id>
          <pub-id pub-id-type="pii">s19214654</pub-id>
          <pub-id pub-id-type="pmcid">PMC6864473</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref65">
        <label>65</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chakraborty</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Tomsett</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Raghavendra</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Harborne</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Alzantot</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Cerutti</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Srivastava</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Preece</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Julier</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Rao</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Kelley</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Braines</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Sensoy</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Willis</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Gurram</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>Interpretability of deep learning models: a survey of results</article-title>
          <source>Proceedings of the IEEE SmartWorld, Ubiquitous Intelligence &#38; Computing, Advanced &#38; Trusted Computed, Scalable Computing &#38; Communications, Cloud &#38; Big Data Computing, Internet of People and Smart City Innovation (SmartWorld/SCALCOM/UIC/ATC/CBDCom/IOP/SCI)</source>
          <year>2017</year>
          <conf-name>IEEE SmartWorld, Ubiquitous Intelligence &#38; Computing, Advanced &#38; Trusted Computed, Scalable Computing &#38; Communications, Cloud &#38; Big Data Computing, Internet of People and Smart City Innovation (SmartWorld/SCALCOM/UIC/ATC/CBDCom/IOP/SCI)</conf-name>
          <conf-date>Aug 4-8, 2017</conf-date>
          <conf-loc>San Francisco, CA, USA</conf-loc>
          <pub-id pub-id-type="doi">10.1109/uic-atc.2017.8397411</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref66">
        <label>66</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Singh</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Roberts</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Cohen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cobb</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Fujimoto</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Myneni</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Social Media as a Research Tool (SMaaRT) for risky behavior analytics: methodological review</article-title>
          <source>JMIR Public Health Surveill</source>
          <year>2020</year>
          <month>11</month>
          <day>30</day>
          <volume>6</volume>
          <issue>4</issue>
          <fpage>e21660</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://publichealth.jmir.org/2020/4/e21660/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21660</pub-id>
          <pub-id pub-id-type="medline">33252345</pub-id>
          <pub-id pub-id-type="pii">v6i4e21660</pub-id>
          <pub-id pub-id-type="pmcid">PMC7735906</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref67">
        <label>67</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Wang</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Kou</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Sugumaran</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Luo</surname>
              <given-names>X</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>H</given-names>
            </name>
          </person-group>
          <article-title>Emotion correlation mining through deep learning models on natural language text</article-title>
          <source>IEEE Trans Cybern</source>
          <year>2020</year>
          <month>05</month>
          <day>12</day>
          <fpage>2987064</fpage>
          <comment>(forthcoming)</comment>
          <pub-id pub-id-type="doi">10.1109/TCYB.2020.2987064</pub-id>
          <pub-id pub-id-type="medline">32413938</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref68">
        <label>68</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Weissenbacher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez-Hernandez</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Towards scaling Twitter for digital epidemiology of birth defects</article-title>
          <source>NPJ Digit Med</source>
          <year>2019</year>
          <month>10</month>
          <day>1</day>
          <volume>2</volume>
          <fpage>96</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://doi.org/10.1038/s41746-019-0170-5"/>
          </comment>
          <pub-id pub-id-type="doi">10.1038/s41746-019-0170-5</pub-id>
          <pub-id pub-id-type="medline">31583284</pub-id>
          <pub-id pub-id-type="pii">170</pub-id>
          <pub-id pub-id-type="pmcid">PMC6773753</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref69">
        <label>69</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Klein</surname>
              <given-names>AZ</given-names>
            </name>
            <name name-style="western">
              <surname>Magge</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Amaro</surname>
              <given-names>JF</given-names>
            </name>
            <name name-style="western">
              <surname>Weissenbacher</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hernandez</surname>
              <given-names>GG</given-names>
            </name>
          </person-group>
          <article-title>Toward using Twitter for tracking COVID-19: a natural language processing pipeline and exploratory data set</article-title>
          <source>J Med Internet Res</source>
          <year>2021</year>
          <month>01</month>
          <day>22</day>
          <volume>23</volume>
          <issue>1</issue>
          <fpage>e25314</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2021/1/e25314/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/25314</pub-id>
          <pub-id pub-id-type="medline">33449904</pub-id>
          <pub-id pub-id-type="pii">v23i1e25314</pub-id>
          <pub-id pub-id-type="pmcid">PMC7834613</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref70">
        <label>70</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Edo-Osagie</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Lake</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Edeghere</surname>
              <given-names>O</given-names>
            </name>
            <name name-style="western">
              <surname>De La Iglesia</surname>
              <given-names>B</given-names>
            </name>
          </person-group>
          <article-title>Twitter mining using semi-supervised classification for relevance filtering in syndromic surveillance</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <month>7</month>
          <day>18</day>
          <volume>14</volume>
          <issue>7</issue>
          <fpage>e0210689</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://dx.plos.org/10.1371/journal.pone.0210689"/>
          </comment>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0210689</pub-id>
          <pub-id pub-id-type="medline">31318885</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-34849</pub-id>
          <pub-id pub-id-type="pmcid">PMC6638773</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref71">
        <label>71</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Ru</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Li</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Hu</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Yao</surname>
              <given-names>L</given-names>
            </name>
          </person-group>
          <article-title>Serendipity-a machine-learning application for mining serendipitous drug usage from social media</article-title>
          <source>IEEE Trans Nanobioscience</source>
          <year>2019</year>
          <month>07</month>
          <volume>18</volume>
          <issue>3</issue>
          <fpage>324</fpage>
          <lpage>34</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/30951476"/>
          </comment>
          <pub-id pub-id-type="doi">10.1109/TNB.2019.2909094</pub-id>
          <pub-id pub-id-type="medline">30951476</pub-id>
          <pub-id pub-id-type="pmcid">PMC6650153</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref72">
        <label>72</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Nikfarjam</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sarker</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>O'Connor</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Ginn</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Gonzalez</surname>
              <given-names>G</given-names>
            </name>
          </person-group>
          <article-title>Pharmacovigilance from social media: mining adverse drug reaction mentions using sequence labeling with word embedding cluster features</article-title>
          <source>J Am Med Inform Assoc</source>
          <year>2015</year>
          <month>05</month>
          <volume>22</volume>
          <issue>3</issue>
          <fpage>671</fpage>
          <lpage>81</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/25755127"/>
          </comment>
          <pub-id pub-id-type="doi">10.1093/jamia/ocu041</pub-id>
          <pub-id pub-id-type="medline">25755127</pub-id>
          <pub-id pub-id-type="pii">ocu041</pub-id>
          <pub-id pub-id-type="pmcid">PMC4457113</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref73">
        <label>73</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Strubell</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>Ganesh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>McCallum</surname>
              <given-names>A</given-names>
            </name>
          </person-group>
          <article-title>Energy and policy considerations for modern deep learning research</article-title>
          <source>AAAI</source>
          <year>2020</year>
          <month>04</month>
          <day>03</day>
          <volume>34</volume>
          <issue>09</issue>
          <fpage>13693</fpage>
          <lpage>6</lpage>
          <pub-id pub-id-type="doi">10.1609/aaai.v34i09.7123</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref74">
        <label>74</label>
        <nlm-citation citation-type="web">
          <article-title>Metropolitan and micropolitan statistical areas population totals and components of change: 2010-2019</article-title>
          <source>United States Census Bureau</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.census.gov/data/tables/time-series/demo/popest/2010s-total-metro-and-micro-statistical-areas.html">https://www.census.gov/data/tables/time-series/demo/popest/2010s-total-metro-and-micro-statistical-areas.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref75">
        <label>75</label>
        <nlm-citation citation-type="web">
          <article-title>Population, population change, and estimated components of population change: April 1, 2010 to July 1, 2019 (NST-EST2019-alldata)</article-title>
          <source>United States Census Bureau</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.census.gov/data/tables/time-series/demo/popest/2010s-national-total.html">https://www.census.gov/data/tables/time-series/demo/popest/2010s-national-total.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref76">
        <label>76</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhan</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zhang</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Okamoto</surname>
              <given-names>JM</given-names>
            </name>
            <name name-style="western">
              <surname>Zeng</surname>
              <given-names>DD</given-names>
            </name>
            <name name-style="western">
              <surname>Leischow</surname>
              <given-names>SJ</given-names>
            </name>
          </person-group>
          <article-title>Underage JUUL use patterns: content analysis of Reddit messages</article-title>
          <source>J Med Internet Res</source>
          <year>2019</year>
          <month>09</month>
          <day>09</day>
          <volume>21</volume>
          <issue>9</issue>
          <fpage>e13038</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2019/9/e13038/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/13038</pub-id>
          <pub-id pub-id-type="medline">31502542</pub-id>
          <pub-id pub-id-type="pii">v21i9e13038</pub-id>
          <pub-id pub-id-type="pmcid">PMC6786857</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref77">
        <label>77</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Paszke</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Gross</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Massa</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Lerer</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Bradbury</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chanan</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Killeen</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Lin</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Gimelshein</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Antiga</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Desmaison</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kopf</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Yang</surname>
              <given-names>E</given-names>
            </name>
            <name name-style="western">
              <surname>DeVito</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Raison</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Tejani</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Chilamkurthy</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Steiner</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Fang</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Bai</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Chintala</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>PyTorch: an imperative style, high-performance deep learning library</article-title>
          <source>arXiv: Computer Science, Machine Learning</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://arxiv.org/abs/1912.01703">https://arxiv.org/abs/1912.01703</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref78">
        <label>78</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Pennington</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Socher</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>GloVe: global vectors for word representation</article-title>
          <source>Proceedings of the Conference on Empirical Methods in Natural Language Processing (EMNLP)</source>
          <year>2014</year>
          <conf-name>Conference on Empirical Methods in Natural Language Processing (EMNLP)</conf-name>
          <conf-date>Oct 2014</conf-date>
          <conf-loc>Doha, Qatar</conf-loc>
          <fpage>1532</fpage>
          <lpage>43</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.aclweb.org/anthology/D14-1162"/>
          </comment>
          <pub-id pub-id-type="doi">10.3115/v1/d14-1162</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref79">
        <label>79</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Benjamini</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Hochberg</surname>
              <given-names>Y</given-names>
            </name>
          </person-group>
          <article-title>Controlling the false discovery rate: a practical and powerful approach to multiple testing</article-title>
          <source>J R Stat Soc Series B Stat Methodol</source>
          <year>1995</year>
          <volume>57</volume>
          <issue>1</issue>
          <fpage>289</fpage>
          <lpage>300</lpage>
          <pub-id pub-id-type="doi">10.1111/j.2517-6161.1995.tb02031.x</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref80">
        <label>80</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hopkins</surname>
              <given-names>ZH</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Secrest</surname>
              <given-names>AM</given-names>
            </name>
          </person-group>
          <article-title>Influence of social media on cosmetic procedure interest</article-title>
          <source>J Clin Aesthet Dermatol</source>
          <year>2020</year>
          <month>01</month>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>28</fpage>
          <lpage>31</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32082468"/>
          </comment>
          <pub-id pub-id-type="medline">32082468</pub-id>
          <pub-id pub-id-type="pmcid">PMC7028372</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref81">
        <label>81</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Crutchley</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Hill</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Padrez</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>Evaluating the predictability of medical conditions from social media posts</article-title>
          <source>PLoS One</source>
          <year>2019</year>
          <month>6</month>
          <day>17</day>
          <volume>14</volume>
          <issue>6</issue>
          <fpage>e0215476</fpage>
          <pub-id pub-id-type="doi">10.1371/journal.pone.0215476</pub-id>
          <pub-id pub-id-type="medline">31206534</pub-id>
          <pub-id pub-id-type="pii">PONE-D-18-34864</pub-id>
          <pub-id pub-id-type="pmcid">PMC6576767</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref82">
        <label>82</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Eichstaedt</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>LH</given-names>
            </name>
            <name name-style="western">
              <surname>Crutchley</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Preoţiuc-Pietro</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>DA</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
          </person-group>
          <article-title>Facebook language predicts depression in medical records</article-title>
          <source>Proc Natl Acad Sci U S A</source>
          <year>2018</year>
          <month>10</month>
          <day>30</day>
          <volume>115</volume>
          <issue>44</issue>
          <fpage>11203</fpage>
          <lpage>8</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.pnas.org/cgi/pmidlookup?view=long&#38;pmid=30322910"/>
          </comment>
          <pub-id pub-id-type="doi">10.1073/pnas.1802331115</pub-id>
          <pub-id pub-id-type="medline">30322910</pub-id>
          <pub-id pub-id-type="pii">1802331115</pub-id>
          <pub-id pub-id-type="pmcid">PMC6217418</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref83">
        <label>83</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Griffis</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Asch</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>H</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Buttenheim</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Barg</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Mitra</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Using social media to track geographic variability in language about diabetes: analysis of diabetes-related tweets across the United States</article-title>
          <source>JMIR Diabetes</source>
          <year>2020</year>
          <month>01</month>
          <day>26</day>
          <volume>5</volume>
          <issue>1</issue>
          <fpage>e14431</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://diabetes.jmir.org/2020/1/e14431/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/14431</pub-id>
          <pub-id pub-id-type="medline">32044757</pub-id>
          <pub-id pub-id-type="pii">v5i1e14431</pub-id>
          <pub-id pub-id-type="pmcid">PMC7055793</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref84">
        <label>84</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Smith</surname>
              <given-names>RJ</given-names>
            </name>
            <name name-style="western">
              <surname>Crutchley</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Schwartz</surname>
              <given-names>HA</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Shofer</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Padrez</surname>
              <given-names>KA</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>RM</given-names>
            </name>
          </person-group>
          <article-title>Variations in Facebook posting patterns across validated patient health conditions: a prospective cohort study</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>01</month>
          <day>06</day>
          <volume>19</volume>
          <issue>1</issue>
          <fpage>e7</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/1/e7/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.6486</pub-id>
          <pub-id pub-id-type="medline">28062392</pub-id>
          <pub-id pub-id-type="pii">v19i1e7</pub-id>
          <pub-id pub-id-type="pmcid">PMC5251170</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref85">
        <label>85</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Guntuku</surname>
              <given-names>SC</given-names>
            </name>
            <name name-style="western">
              <surname>Schneider</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Pelullo</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Young</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Wong</surname>
              <given-names>V</given-names>
            </name>
            <name name-style="western">
              <surname>Ungar</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Polsky</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Volpp</surname>
              <given-names>KG</given-names>
            </name>
            <name name-style="western">
              <surname>Merchant</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Studying expressions of loneliness in individuals using twitter: an observational study</article-title>
          <source>BMJ Open</source>
          <year>2019</year>
          <month>11</month>
          <day>04</day>
          <volume>9</volume>
          <issue>11</issue>
          <fpage>e030355</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmjopen.bmj.com/lookup/pmidlookup?view=long&#38;pmid=31685502"/>
          </comment>
          <pub-id pub-id-type="doi">10.1136/bmjopen-2019-030355</pub-id>
          <pub-id pub-id-type="medline">31685502</pub-id>
          <pub-id pub-id-type="pii">bmjopen-2019-030355</pub-id>
          <pub-id pub-id-type="pmcid">PMC6830671</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref86">
        <label>86</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Cecinati</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Matthews</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Natarajan</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>McCullen</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Coley</surname>
              <given-names>D</given-names>
            </name>
          </person-group>
          <article-title>Mining social media to identify heat waves</article-title>
          <source>Int J Environ Res Public Health</source>
          <year>2019</year>
          <month>03</month>
          <day>02</day>
          <volume>16</volume>
          <issue>5</issue>
          <fpage>762</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mdpi.com/resolver?pii=ijerph16050762"/>
          </comment>
          <pub-id pub-id-type="doi">10.3390/ijerph16050762</pub-id>
          <pub-id pub-id-type="medline">30832387</pub-id>
          <pub-id pub-id-type="pii">ijerph16050762</pub-id>
          <pub-id pub-id-type="pmcid">PMC6427652</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref87">
        <label>87</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Birnbaum</surname>
              <given-names>ML</given-names>
            </name>
            <name name-style="western">
              <surname>Ernala</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Rizvi</surname>
              <given-names>AF</given-names>
            </name>
            <name name-style="western">
              <surname>De Choudhury</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Kane</surname>
              <given-names>JM</given-names>
            </name>
          </person-group>
          <article-title>A collaborative approach to identifying social media markers of schizophrenia by employing machine learning and clinical appraisals</article-title>
          <source>J Med Internet Res</source>
          <year>2017</year>
          <month>08</month>
          <day>14</day>
          <volume>19</volume>
          <issue>8</issue>
          <fpage>e289</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2017/8/e289/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/jmir.7956</pub-id>
          <pub-id pub-id-type="medline">28807891</pub-id>
          <pub-id pub-id-type="pii">v19i8e289</pub-id>
          <pub-id pub-id-type="pmcid">PMC5575421</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref88">
        <label>88</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Spearman</surname>
              <given-names>C</given-names>
            </name>
          </person-group>
          <article-title>The proof and measurement of association between two things</article-title>
          <source>Am J Psychol</source>
          <year>1904</year>
          <volume>15</volume>
          <issue>1</issue>
          <fpage>72</fpage>
          <lpage>101</lpage>
          <pub-id pub-id-type="doi">10.2307/1412159</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref89">
        <label>89</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Bergman</surname>
              <given-names>BG</given-names>
            </name>
            <name name-style="western">
              <surname>Wu</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Marsch</surname>
              <given-names>LA</given-names>
            </name>
            <name name-style="western">
              <surname>Crosier</surname>
              <given-names>BS</given-names>
            </name>
            <name name-style="western">
              <surname>DeLise</surname>
              <given-names>TC</given-names>
            </name>
            <name name-style="western">
              <surname>Hassanpour</surname>
              <given-names>S</given-names>
            </name>
          </person-group>
          <article-title>Associations between substance use and Instagram participation to inform social network-based screening models: multimodal cross-sectional study</article-title>
          <source>J Med Internet Res</source>
          <year>2020</year>
          <month>09</month>
          <day>16</day>
          <volume>22</volume>
          <issue>9</issue>
          <fpage>e21916</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.jmir.org/2020/9/e21916/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/21916</pub-id>
          <pub-id pub-id-type="medline">32936081</pub-id>
          <pub-id pub-id-type="pii">v22i9e21916</pub-id>
          <pub-id pub-id-type="pmcid">PMC7527914</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref90">
        <label>90</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <collab>United States Census Bureau</collab>
          </person-group>
          <article-title>Educational Attainment, Income in the Past 12 Months (In 2018 inflation-adjusted dollars), ACS Demographic and Housing Estimates</article-title>
          <source>American Community Survey</source>
          <year>2018</year>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.census.gov/acs/www/data/data-tables-and-tools/subject-tables/">https://www.census.gov/acs/www/data/data-tables-and-tools/subject-tables/</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref91">
        <label>91</label>
        <nlm-citation citation-type="web">
          <article-title>Behavioral risk factor surveillance system</article-title>
          <source>Centers for Disease Control and Prevention</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.cdc.gov/brfss/index.html">https://www.cdc.gov/brfss/index.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref92">
        <label>92</label>
        <nlm-citation citation-type="web">
          <article-title>2019 County Health Rankings Key Findings Report</article-title>
          <source>University of Wisconsin Population Health Institute</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.countyhealthrankings.org/reports/2019-county-health-rankings-key-findings-report">https://www.countyhealthrankings.org/reports/2019-county-health-rankings-key-findings-report</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref93">
        <label>93</label>
        <nlm-citation citation-type="web">
          <article-title>County business patterns: 2017</article-title>
          <source>United States Census Bureau</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.census.gov/data/datasets/2017/econ/cbp/2017-cbp.html">https://www.census.gov/data/datasets/2017/econ/cbp/2017-cbp.html</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref94">
        <label>94</label>
        <nlm-citation citation-type="web">
          <article-title>Apparent per capita alcohol consumption: national, state, and regional trends 1977-2018</article-title>
          <source>Open ICPSR</source>
          <access-date>2021-08-24</access-date>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.openicpsr.org/openicpsr/project/105583/version/V5/view;jsessionid=D71A8F94F8F63A42806C3C45BD042D9D">https://www.openicpsr.org/openicpsr/project/105583/version/V5/view;jsessionid=D71A8F94F8F63A42806C3C45BD042D9D</ext-link>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref95">
        <label>95</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kavanagh</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Kelly</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Krnjacki</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Thornton</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Jolley</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Subramanian</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Turrell</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Bentley</surname>
              <given-names>R</given-names>
            </name>
          </person-group>
          <article-title>Access to alcohol outlets and harmful alcohol consumption: a multi-level study in Melbourne, Australia</article-title>
          <source>Addiction</source>
          <year>2011</year>
          <month>10</month>
          <volume>106</volume>
          <issue>10</issue>
          <fpage>1772</fpage>
          <lpage>9</lpage>
          <pub-id pub-id-type="doi">10.1111/j.1360-0443.2011.03510.x</pub-id>
          <pub-id pub-id-type="medline">21615583</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref96">
        <label>96</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Popova</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Giesbrecht</surname>
              <given-names>N</given-names>
            </name>
            <name name-style="western">
              <surname>Bekmuradov</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Patra</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Hours and days of sale and density of alcohol outlets: impacts on alcohol consumption and damage: a systematic review</article-title>
          <source>Alcohol Alcohol</source>
          <year>2009</year>
          <volume>44</volume>
          <issue>5</issue>
          <fpage>500</fpage>
          <lpage>16</lpage>
          <pub-id pub-id-type="doi">10.1093/alcalc/agp054</pub-id>
          <pub-id pub-id-type="medline">19734159</pub-id>
          <pub-id pub-id-type="pii">agp054</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref97">
        <label>97</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Treno</surname>
              <given-names>AJ</given-names>
            </name>
            <name name-style="western">
              <surname>Johnson</surname>
              <given-names>FW</given-names>
            </name>
            <name name-style="western">
              <surname>Remer</surname>
              <given-names>LG</given-names>
            </name>
            <name name-style="western">
              <surname>Gruenewald</surname>
              <given-names>PJ</given-names>
            </name>
          </person-group>
          <article-title>The impact of outlet densities on alcohol-related crashes: a spatial panel approach</article-title>
          <source>Accid Anal Prev</source>
          <year>2007</year>
          <month>09</month>
          <volume>39</volume>
          <issue>5</issue>
          <fpage>894</fpage>
          <lpage>901</lpage>
          <pub-id pub-id-type="doi">10.1016/j.aap.2006.12.011</pub-id>
          <pub-id pub-id-type="medline">17275773</pub-id>
          <pub-id pub-id-type="pii">S0001-4575(07)00004-8</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref98">
        <label>98</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Belinkov</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Gehrmann</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>Pavlick</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Interpretability and analysis in neural NLP</article-title>
          <source>Proceedings of the 58th Annual Meeting of the Association for Computational Linguistics: Tutorial Abstracts</source>
          <year>2020</year>
          <conf-name>58th Annual Meeting of the Association for Computational Linguistics: Tutorial Abstracts</conf-name>
          <conf-date>Jul, 2020</conf-date>
          <conf-loc>Online</conf-loc>
          <publisher-name>Association for Computational Linguistics</publisher-name>
          <fpage>1</fpage>
          <lpage>5</lpage>
          <pub-id pub-id-type="doi">10.18653/v1/2020.acl-tutorials.1</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref99">
        <label>99</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Barefoot</surname>
              <given-names>JC</given-names>
            </name>
            <name name-style="western">
              <surname>Grønbaek</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Feaganes</surname>
              <given-names>JR</given-names>
            </name>
            <name name-style="western">
              <surname>McPherson</surname>
              <given-names>RS</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>RB</given-names>
            </name>
            <name name-style="western">
              <surname>Siegler</surname>
              <given-names>IC</given-names>
            </name>
          </person-group>
          <article-title>Alcoholic beverage preference, diet, and health habits in the UNC Alumni Heart Study</article-title>
          <source>Am J Clin Nutr</source>
          <year>2002</year>
          <month>08</month>
          <volume>76</volume>
          <issue>2</issue>
          <fpage>466</fpage>
          <lpage>72</lpage>
          <pub-id pub-id-type="doi">10.1093/ajcn/76.2.466</pub-id>
          <pub-id pub-id-type="medline">12145024</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref100">
        <label>100</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Sluik</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Bezemer</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Sierksma</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Feskens</surname>
              <given-names>E</given-names>
            </name>
          </person-group>
          <article-title>Alcoholic beverage preference and dietary habits: a systematic literature review</article-title>
          <source>Crit Rev Food Sci Nutr</source>
          <year>2016</year>
          <month>10</month>
          <day>25</day>
          <volume>56</volume>
          <issue>14</issue>
          <fpage>2370</fpage>
          <lpage>82</lpage>
          <pub-id pub-id-type="doi">10.1080/10408398.2013.841118</pub-id>
          <pub-id pub-id-type="medline">25674684</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref101">
        <label>101</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Dey</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Gmel</surname>
              <given-names>G</given-names>
            </name>
            <name name-style="western">
              <surname>Studer</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Dermota</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Mohler-Kuo</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Beverage preferences and associated drinking patterns, consequences and other substance use behaviours</article-title>
          <source>Eur J Public Health</source>
          <year>2014</year>
          <month>06</month>
          <volume>24</volume>
          <issue>3</issue>
          <fpage>496</fpage>
          <lpage>501</lpage>
          <pub-id pub-id-type="doi">10.1093/eurpub/ckt109</pub-id>
          <pub-id pub-id-type="medline">23940073</pub-id>
          <pub-id pub-id-type="pii">ckt109</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref102">
        <label>102</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alcácera</surname>
              <given-names>MA</given-names>
            </name>
            <name name-style="western">
              <surname>Marques-Lopes</surname>
              <given-names>I</given-names>
            </name>
            <name name-style="western">
              <surname>Fajó-Pascual</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Foncillas</surname>
              <given-names>JP</given-names>
            </name>
            <name name-style="western">
              <surname>Carmona-Torre</surname>
              <given-names>F</given-names>
            </name>
            <name name-style="western">
              <surname>Martínez-González</surname>
              <given-names>MA</given-names>
            </name>
          </person-group>
          <article-title>Alcoholic beverage preference and dietary pattern in Spanish university graduates: the SUN cohort study</article-title>
          <source>Eur J Clin Nutr</source>
          <year>2008</year>
          <month>10</month>
          <volume>62</volume>
          <issue>10</issue>
          <fpage>1178</fpage>
          <lpage>86</lpage>
          <pub-id pub-id-type="doi">10.1038/sj.ejcn.1602833</pub-id>
          <pub-id pub-id-type="medline">17609695</pub-id>
          <pub-id pub-id-type="pii">1602833</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref103">
        <label>103</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Siegel</surname>
              <given-names>MB</given-names>
            </name>
            <name name-style="western">
              <surname>Naimi</surname>
              <given-names>TS</given-names>
            </name>
            <name name-style="western">
              <surname>Cremeens</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Nelson</surname>
              <given-names>DE</given-names>
            </name>
          </person-group>
          <article-title>Alcoholic beverage preferences and associated drinking patterns and risk behaviors among high school youth</article-title>
          <source>Am J Prev Med</source>
          <year>2011</year>
          <month>04</month>
          <volume>40</volume>
          <issue>4</issue>
          <fpage>419</fpage>
          <lpage>26</lpage>
          <pub-id pub-id-type="doi">10.1016/j.amepre.2010.12.011</pub-id>
          <pub-id pub-id-type="medline">21406275</pub-id>
          <pub-id pub-id-type="pii">S0749-3797(10)00797-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref104">
        <label>104</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>McCann</surname>
              <given-names>SE</given-names>
            </name>
            <name name-style="western">
              <surname>Sempos</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Freudenheim</surname>
              <given-names>JL</given-names>
            </name>
            <name name-style="western">
              <surname>Muti</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Russell</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Nochajski</surname>
              <given-names>TH</given-names>
            </name>
            <name name-style="western">
              <surname>Ram</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Hovey</surname>
              <given-names>K</given-names>
            </name>
            <name name-style="western">
              <surname>Trevisan</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Alcoholic beverage preference and characteristics of drinkers and nondrinkers in western New York (United States)</article-title>
          <source>Nutr Metab Cardiovasc Dis</source>
          <year>2003</year>
          <month>02</month>
          <volume>13</volume>
          <issue>1</issue>
          <fpage>2</fpage>
          <lpage>11</lpage>
          <pub-id pub-id-type="doi">10.1016/s0939-4753(03)80162-x</pub-id>
          <pub-id pub-id-type="medline">12772432</pub-id>
          <pub-id pub-id-type="pii">S0939-4753(03)80162-X</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref105">
        <label>105</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lachmar</surname>
              <given-names>EM</given-names>
            </name>
            <name name-style="western">
              <surname>Wittenborn</surname>
              <given-names>AK</given-names>
            </name>
            <name name-style="western">
              <surname>Bogen</surname>
              <given-names>KW</given-names>
            </name>
            <name name-style="western">
              <surname>McCauley</surname>
              <given-names>HL</given-names>
            </name>
          </person-group>
          <article-title>#MyDepressionLooksLike: examining public discourse about depression on Twitter</article-title>
          <source>JMIR Ment Health</source>
          <year>2017</year>
          <month>10</month>
          <day>18</day>
          <volume>4</volume>
          <issue>4</issue>
          <fpage>e43</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://mental.jmir.org/2017/4/e43/"/>
          </comment>
          <pub-id pub-id-type="doi">10.2196/mental.8141</pub-id>
          <pub-id pub-id-type="medline">29046270</pub-id>
          <pub-id pub-id-type="pii">v4i4e43</pub-id>
          <pub-id pub-id-type="pmcid">PMC5666224</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref106">
        <label>106</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Alberga</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Withnell</surname>
              <given-names>S</given-names>
            </name>
            <name name-style="western">
              <surname>von Ranson</surname>
              <given-names>KM</given-names>
            </name>
          </person-group>
          <article-title>Fitspiration and thinspiration: a comparison across three social networking sites</article-title>
          <source>J Eat Disord</source>
          <year>2018</year>
          <month>11</month>
          <day>26</day>
          <volume>6</volume>
          <fpage>39</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jeatdisord.biomedcentral.com/articles/10.1186/s40337-018-0227-x"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s40337-018-0227-x</pub-id>
          <pub-id pub-id-type="medline">30534376</pub-id>
          <pub-id pub-id-type="pii">227</pub-id>
          <pub-id pub-id-type="pmcid">PMC6260773</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref107">
        <label>107</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shepherd</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Sanders</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Doyle</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Shaw</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Using social media for support and feedback by mental health service users: thematic analysis of a twitter conversation</article-title>
          <source>BMC Psychiatry</source>
          <year>2015</year>
          <month>02</month>
          <day>19</day>
          <volume>15</volume>
          <fpage>29</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcpsychiatry.biomedcentral.com/articles/10.1186/s12888-015-0408-y"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/s12888-015-0408-y</pub-id>
          <pub-id pub-id-type="medline">25881089</pub-id>
          <pub-id pub-id-type="pii">10.1186/s12888-015-0408-y</pub-id>
          <pub-id pub-id-type="pmcid">PMC4337200</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref108">
        <label>108</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>van Swol</surname>
              <given-names>LM</given-names>
            </name>
            <name name-style="western">
              <surname>Chang</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Kerr</surname>
              <given-names>B</given-names>
            </name>
            <name name-style="western">
              <surname>Moreno</surname>
              <given-names>M</given-names>
            </name>
          </person-group>
          <article-title>Linguistic predictors of problematic drinking in alcohol-related Facebook posts</article-title>
          <source>J Health Commun</source>
          <year>2020</year>
          <month>03</month>
          <day>03</day>
          <volume>25</volume>
          <issue>3</issue>
          <fpage>214</fpage>
          <lpage>22</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/32096449"/>
          </comment>
          <pub-id pub-id-type="doi">10.1080/10810730.2020.1731632</pub-id>
          <pub-id pub-id-type="medline">32096449</pub-id>
          <pub-id pub-id-type="pmcid">PMC7654720</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref109">
        <label>109</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Conway</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>AT</given-names>
            </name>
          </person-group>
          <article-title>Examining thematic similarity, difference, and membership in three online mental health communities from reddit: a text mining and visualization approach</article-title>
          <source>Comput Hum Behav</source>
          <year>2018</year>
          <month>01</month>
          <volume>78</volume>
          <fpage>98</fpage>
          <lpage>112</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/29456286"/>
          </comment>
          <pub-id pub-id-type="doi">10.1016/j.chb.2017.09.001</pub-id>
          <pub-id pub-id-type="medline">29456286</pub-id>
          <pub-id pub-id-type="pmcid">PMC5810583</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref110">
        <label>110</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kavuluru</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Williams</surname>
              <given-names>AG</given-names>
            </name>
            <name name-style="western">
              <surname>Ramos-Morales</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Haye</surname>
              <given-names>L</given-names>
            </name>
            <name name-style="western">
              <surname>Holaday</surname>
              <given-names>T</given-names>
            </name>
            <name name-style="western">
              <surname>Cerel</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Classification of helpful comments on online suicide watch forums</article-title>
          <source>ACM BCB</source>
          <year>2016</year>
          <month>10</month>
          <volume>2016</volume>
          <fpage>32</fpage>
          <lpage>40</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/28736770"/>
          </comment>
          <pub-id pub-id-type="doi">10.1145/2975167.2975170</pub-id>
          <pub-id pub-id-type="medline">28736770</pub-id>
          <pub-id pub-id-type="pmcid">PMC5521987</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
