<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
    <front>
        <journal-meta>
            <journal-id journal-id-type="publisher-id">ResProt</journal-id>
            <journal-id journal-id-type="nlm-ta">JMIR Res Protoc</journal-id>
            <journal-title>JMIR Research Protocols</journal-title>
            <issn pub-type="epub">1929-0748</issn>
            <publisher>
                <publisher-name>JMIR Publications Inc.</publisher-name>
                <publisher-loc>Toronto, Canada</publisher-loc>
            </publisher>
        </journal-meta>
        <article-meta>
            <article-id pub-id-type="publisher-id">v4i3e78</article-id>
            <article-id pub-id-type="pmid">26137885</article-id>
            <article-id pub-id-type="doi">10.2196/resprot.3433</article-id>
            <article-categories>
                <subj-group subj-group-type="heading">
                    <subject>Original Paper</subject>
                </subj-group>
                <subj-group subj-group-type="article-type">
                    <subject>Original Paper</subject>
                </subj-group>
            </article-categories>
            <title-group>
                <article-title>Collecting and Analyzing Patient Experiences of Health Care From Social Media</article-title>
            </title-group>
            <contrib-group>
                <contrib contrib-type="editor">
                    <name>
                        <surname>Eysenbach</surname>
                        <given-names>Gunther</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Bardach</surname>
                        <given-names>Naomi</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Greaves</surname>
                        <given-names>Felix</given-names>
                    </name>
                </contrib>
                <contrib contrib-type="reviewer">
                    <name>
                        <surname>Wallace</surname>
                        <given-names>Byron</given-names>
                    </name>
                </contrib>
            </contrib-group>
            <contrib-group>
                <contrib contrib-type="author" id="contrib1">
                    <name name-style="western">
                        <surname>Rastegar-Mojarad</surname>
                        <given-names>Majid</given-names>
                    </name>
                    <degrees>MSc</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0001-6962-3554</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib2">
                    <name name-style="western">
                        <surname>Ye</surname>
                        <given-names>Zhan</given-names>
                    </name>
                    <degrees>PhD</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-0426-0382</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib3">
                    <name name-style="western">
                        <surname>Wall</surname>
                        <given-names>Daniel</given-names>
                    </name>
                    <degrees>BSc</degrees>
                    <xref rid="aff1" ref-type="aff">1</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-2005-7819</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib4" equal-contrib="yes">
                    <name name-style="western">
                        <surname>Murali</surname>
                        <given-names>Narayana</given-names>
                    </name>
                    <degrees>MD</degrees>
                    <xref rid="aff2" ref-type="aff">2</xref>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0002-0099-5330</ext-link>
                </contrib>
                <contrib contrib-type="author" id="contrib5" corresp="yes">
                    <name name-style="western">
                        <surname>Lin</surname>
                        <given-names>Simon</given-names>
                    </name>
                    <degrees>MD, MBA</degrees>
                    <xref rid="aff3" ref-type="aff">3</xref>
                    <address>
                        <institution>The Research Institute at Nationwide Children's Hospital</institution>
                        <addr-line>575 Children&#8217;s Crossroad</addr-line>
                        <addr-line>Columbus, OH, 43017</addr-line>
                        <country>United States</country>
                        <phone>1 614 355 6629</phone>
                        <fax>1 614 355 6629</fax>
                        <email>Simon.Lin@NationwideChildrens.org</email>
                    </address>
                    <ext-link ext-link-type="orcid">http://orcid.org/0000-0003-2876-2042</ext-link>
                </contrib>
            </contrib-group>
            <aff id="aff1">
                <sup>1</sup>
                <institution>Marshfield Clinic Research Foundation</institution>
                <institution>Biomedical Informatics Research Center</institution>
                <addr-line>Marshfield, WI</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff2">
                <sup>2</sup>
                <institution>Marshfield Clinic</institution>
                <institution>Nephrology</institution>
                <addr-line>Marshfield, WI</addr-line>
                <country>United States</country>
            </aff>
            <aff id="aff3">
                <sup>3</sup>
                <institution>The Research Institute at Nationwide Children's Hospital</institution>
                <addr-line>Columbus, OH</addr-line>
                <country>United States</country>
            </aff>
            <author-notes>
                <corresp>Corresponding Author: Simon Lin <email>Simon.Lin@NationwideChildrens.org</email>
                </corresp>
            </author-notes>
            <pub-date pub-type="collection">
                <season>Jul-Sep</season>
                <year>2015</year>
            </pub-date>
            <pub-date pub-type="epub">
                <day>02</day>
                <month>07</month>
                <year>2015</year>
            </pub-date>
            <volume>4</volume>
            <issue>3</issue>
            <elocation-id>e78</elocation-id>
            <!--history from ojs - api-xml-->
            <history>
                <date date-type="received">
                    <day>31</day>
                    <month>3</month>
                    <year>2014</year>
                </date>
                <date date-type="rev-request">
                    <day>7</day>
                    <month>11</month>
                    <year>2014</year>
                </date>
                <date date-type="rev-recd">
                    <day>15</day>
                    <month>12</month>
                    <year>2014</year>
                </date>
                <date date-type="accepted">
                    <day>14</day>
                    <month>2</month>
                    <year>2015</year>
                </date>
            </history>
            <!--(c) the authors - correct author names and publication date here if necessary. Date in form ', dd.mm.yyyy' after jmir.org-->
            <copyright-statement>&#169;Majid Rastegar-Mojarad, Zhan Ye, Daniel Wall, Narayana Murali, Simon Lin. Originally published in JMIR Research Protocols (http://www.researchprotocols.org), 02.07.2015. </copyright-statement>
            <copyright-year>2015</copyright-year>
            <license license-type="open-access" xlink:href="http://creativecommons.org/licenses/by/2.0/">
                <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (http://creativecommons.org/licenses/by/2.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Research Protocols, is properly cited. The complete bibliographic information, a link to the original publication on http://www.researchprotocols.org, as well as this copyright and license information must be included.</p>
            </license>
            <self-uri xlink:href="http://www.researchprotocols.org/2015/3/e78/" xlink:type="simple" />
            <abstract>
                <sec sec-type="background">
                    <title>Background</title>
                    <p>Social media, such as Yelp, provides rich information about consumer experience. Previous studies suggest that Yelp can serve as a new source to study patient experience. However, the lack of a corpus of patient reviews causes a major bottleneck for applying computational techniques.</p>
                </sec>
                <sec sec-type="objective">
                    <title>Objective</title>
                    <p>The objective of this study is to create a corpus of patient experience (COPE) and report descriptive statistics to characterize COPE.</p>
                </sec>
                <sec sec-type="methods">
                    <title>Methods</title>
                    <p>Yelp reviews about health care-related businesses were extracted from the Yelp Academic Dataset. Natural language processing (NLP) tools were used to split reviews into sentences, extract noun phrases and adjectives from each sentence, and generate parse trees and dependency trees for each sentence. Sentiment analysis techniques and Hadoop were used to calculate a sentiment score of each sentence and for parallel processing, respectively.</p>
                </sec>
                <sec sec-type="results">
                    <title>Results</title>
                    <p>COPE contains 79,173 sentences from 6914 patient reviews of 985 health care facilities near 30 universities in the United States. We found that patients wrote longer reviews when they rated the facility poorly (1 or 2 stars). We demonstrated that the computed sentiment scores correlated well with consumer-generated ratings. A consumer vocabulary to describe their health care experience was constructed by a statistical analysis of word counts and co-occurrences in COPE.</p>
                </sec>
                <sec sec-type="conclusions">
                    <title>Conclusions</title>
                    <p>A corpus called COPE was built as an initial step to utilize social media to understand patient experiences at health care facilities. The corpus is available to download and COPE can be used in future studies to extract knowledge of patients&#8217; experiences from their perspectives. Such information can subsequently inform and provide opportunity to improve the quality of health care.</p>
                </sec>
            </abstract>
            <kwd-group>
                <kwd>patient satisfaction</kwd>
                <kwd>social media</kwd>
                <kwd>health care</kwd>
                <kwd>natural language processing</kwd>
                <kwd>consumer health information</kwd>
            </kwd-group>
        </article-meta>
    </front>
    <body>
        <sec sec-type="introduction">
            <title>Introduction</title>
            <p>In the current era of information technology, patients often post their experiences with health care providers to social media websites, similar to reviews of restaurants or hotels. A 2012 survey by the University of Michigan found 65% of the US population was aware of online physician ratings [<xref ref-type="bibr" rid="ref1">1</xref>]. Another survey by PwC Health Research Institute in 2013 [<xref ref-type="bibr" rid="ref2">2</xref>] suggested nearly half of all consumers had read health care reviews online and, of those, 68% utilized the information within the review to assist with the selection of their health care provider. The same survey cited 24% of consumers have written a health care review, up from the 7% estimate in a 2011 survey [<xref ref-type="bibr" rid="ref3">3</xref>].</p>
            <p>Besides numerical ratings, the textual content in patient reviews can be a valuable resource for health care providers to improve their services. Data on patient experience is becoming a critical component in the value-based purchasing program proposed by the Center for Medicare and Medicaid Services (CMS) [<xref ref-type="bibr" rid="ref4">4</xref>]. In contrast to Press Ganey or Hospital Consumer Assessment of Healthcare Providers and Systems (HCAHPS) [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>], the peer-to-peer nature of patient reviews on social media websites provides a unique perspective for health care providers to understand patient satisfaction. This study is one of a few which focuses on utilizing online peer-to-peer communications to learn about patient experiences and concerns about health care providers [<xref ref-type="bibr" rid="ref7">7</xref>,<xref ref-type="bibr" rid="ref8">8</xref>].</p>
            <p>Several researchers have studied online patient reviews [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref20">20</xref>], but most of them analyzed doctor rating websites [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref20">20</xref>]. Greaves et al [<xref ref-type="bibr" rid="ref7">7</xref>] conducted a sentiment analysis study on 6412 online comments about hospitals on the English National Health Service (NHS) website in 2010. They applied a machine learning approach to classify reviews into positive and negative classes. In addition, Alemi et al [<xref ref-type="bibr" rid="ref9">9</xref>] studied 995 online comments at the RateMDs website [<xref ref-type="bibr" rid="ref21">21</xref>] and showed that real-time satisfaction surveys were possible.</p>
            <p>Yelp is a popular social media website that allows customers to share their business experiences with other customers. Previous studies suggest that Yelp can be a reliable source to study patient experiences with health care providers [<xref ref-type="bibr" rid="ref22">22</xref>]. Yelp has made available an Academic Dataset of the 13,490 closest businesses to 30 universities for researchers to explore [<xref ref-type="bibr" rid="ref23">23</xref>]. Many methodological papers have been published on analyzing restaurants [<xref ref-type="bibr" rid="ref24">24</xref>-<xref ref-type="bibr" rid="ref26">26</xref>] using this data set. However, this data set has yet to be studied in the context of health care.</p>
            <p>A PubMed search of &#8220;Yelp&#8221; resulted in only 3 papers. Kadry et al [<xref ref-type="bibr" rid="ref17">17</xref>] conducted a study to analyze 4999 physicians&#8217; ratings in the 10 most visited websites including Yelp. They found that most patients gave physicians favorable ratings: the average rating was 77 out of 100. Bardach et al [<xref ref-type="bibr" rid="ref22">22</xref>] found the Yelp ratings correlate well (<italic>P</italic>&#60;.001) with traditional measures of hospital quality (HCAHPS) and suggested that Yelp can be a reliable source to study patient experience. Recently, Butcher [<xref ref-type="bibr" rid="ref27">27</xref>] reported that health care providers are starting to pay attention to the Yelp ratings. All 3 papers analyzed Yelp ratings but did not utilize the wealth of information contained in the corpus of Yelp reviews.</p>
            <p>We addressed this gap by using a corpus of Yelp reviews to characterize patient experience. A &#34;corpus&#34; is a collection of texts presented in electronic form. In this study, we used the Yelp Academic Dataset to construct a corpus of patient experiences. Several natural language processing (NLP) methods and tools were utilized to clean the data and tag the parts-of-speech such as noun phrases and adjectives, and to create parse and dependency trees. A sentiment score for each sentence was also projected and insights from summary statistics of the corpus are presented here.</p>
        </sec>
        <sec sec-type="methods">
            <title>Methods</title>
            <p>We used 26 health care-related categories (examples include hospitals, urgent care facilities, and medical centers) to extract health care related businesses (a list of categories is provided in <xref ref-type="app" rid="app1">Multimedia Appendix 1</xref>) from the Yelp Academic Dataset. After identifying 6914 reviews, Stanford Core NLP [<xref ref-type="bibr" rid="ref28">28</xref>] was used to split reviews into sentences. Porter Stemmer [<xref ref-type="bibr" rid="ref29">29</xref>] was applied to stem each sentence. Stanford Core NLP was further used to produce parse trees and dependency trees for the sentences and part-of-speech tags for each word. Hadoop was used to run the NLP in parallel to create the corpus. Dragoon Tool was used to extract nouns and adjectival phrases [<xref ref-type="bibr" rid="ref30">30</xref>]. Sentiment scores for each sentence were derived using SentiWordNet [<xref ref-type="bibr" rid="ref31">31</xref>]. In addition, each sentence was tagged to classify whether or not it was negated. The Hidden Markov Model was used in our negation detection tool [<xref ref-type="bibr" rid="ref32">32</xref>]. By filtering out terms that appeared &#60;5 times, 7612 words were selected to form a COPE vocabulary list. The COPE vocabulary list was compared with the consumer health vocabulary (CHV) [<xref ref-type="bibr" rid="ref33">33</xref>] which is the gold standard in this domain. The CHV covers all health topics. The latest CHV of 2011 contains 158,519 words. To identify co-occurring pairs of terms in each review, we tokenized words and then removed stop words. A Chi-square test was conducted and the odds ratio for each pair for each term which appeared &#8805;25 times (empirical cutoff) in the corpus was calculated. Finally, a network of the pairs with high Chi-square (&#62;100), significant <italic>P</italic> values (<italic>P</italic>&#60;.05) and odds ratios &#62;1 was built.</p>
        </sec>
        <sec sec-type="results">
            <title>Results</title>
            <sec>
                <title>Overview</title>
                <p>The first observational study of how patients communicate with their peers regarding their health care experiences using the social media website Yelp is presented here. To analyze these communications, a corpus was established and characterized with descriptive statistics.</p>
            </sec>
            <sec>
                <title>Corpus of Patient Experience (COPE)</title>
                <p>The COPE contains 79,173 sentences from 6914 patient reviews of 985 health care facilities near 30 universities in the United States. The top 10 cities with the most reviews incorporated into COPE are summarized in <xref ref-type="table" rid="table1">Table 1</xref>. For each sentence in COPE, a part-of-speech analysis was conducted (<xref ref-type="fig" rid="figure1">Figure 1</xref>) and made available for future research.</p>
                <p>The list of the most commonly encountered nouns, adjectives, and verbs in the corpus and rates of frequency are shown in <xref ref-type="table" rid="table2">Table 2</xref>.</p>
                <table-wrap position="float" id="table1">
                    <label>Table 1</label>
                    <caption>
                        <p>The number of health care facilities and reviews from the top 10 cities covered by the COPE.</p>
                    </caption>
                    <table width="491" border="0" cellpadding="1" cellspacing="0" rules="groups" frame="hsides">
                        <col width="159" />
                        <col width="187" />
                        <col width="140" />
                        <thead>
                            <tr valign="top">
                                <td>City</td>
                                <td>Health care facilities, n</td>
                                <td>Reviews, n</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Palo Alto, CA</td>
                                <td>123</td>
                                <td>988</td>
                            </tr>
                            <tr valign="top">
                                <td>La Jolla, CA</td>
                                <td>122</td>
                                <td>872</td>
                            </tr>
                            <tr valign="top">
                                <td>Pasadena, CA</td>
                                <td>76</td>
                                <td>831</td>
                            </tr>
                            <tr valign="top">
                                <td>Cambridge, MA</td>
                                <td>50</td>
                                <td>611</td>
                            </tr>
                            <tr valign="top">
                                <td>Los Angeles, CA</td>
                                <td>75</td>
                                <td>541</td>
                            </tr>
                            <tr valign="top">
                                <td>Austin, TX</td>
                                <td>31</td>
                                <td>239</td>
                            </tr>
                            <tr valign="top">
                                <td>San Diego, CA</td>
                                <td>31</td>
                                <td>252</td>
                            </tr>
                            <tr valign="top">
                                <td>Houston, TX</td>
                                <td>58</td>
                                <td>261</td>
                            </tr>
                            <tr valign="top">
                                <td>San Luis Obispo, CA</td>
                                <td>56</td>
                                <td>235</td>
                            </tr>
                            <tr valign="top">
                                <td>Seattle, WA</td>
                                <td>28</td>
                                <td>255</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <table-wrap position="float" id="table2">
                    <label>Table 2</label>
                    <caption>
                        <p>The top 20 noun phrases, adjectives, and verbs in COPE (after lemmatization).</p>
                    </caption>
                    <table width="561" border="0" cellpadding="1" cellspacing="0" rules="groups" frame="hsides">
                        <col width="100" />
                        <col width="83" />
                        <col width="100" />
                        <col width="83" />
                        <col width="100" />
                        <col width="83" />
                        <thead>
                            <tr valign="top">
                                <td>Noun phrase</td>
                                <td>Frequency (per 1000 sentences)</td>
                                <td>Adjectives</td>
                                <td>Frequency (per 1000 sentences)</td>
                                <td>Verbs</td>
                                <td>Frequency (per 1000 sentences)</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Time</td>
                                <td>52.24</td>
                                <td>Good</td>
                                <td>52.90</td>
                                <td>Be</td>
                                <td>381.42</td>
                            </tr>
                            <tr valign="top">
                                <td>Doctor</td>
                                <td>38.20</td>
                                <td>Great</td>
                                <td>35.51</td>
                                <td>Have</td>
                                <td>197.99</td>
                            </tr>
                            <tr valign="top">
                                <td>Massage</td>
                                <td>32.43</td>
                                <td>Nice</td>
                                <td>19.89</td>
                                <td>Go</td>
                                <td>83.18</td>
                            </tr>
                            <tr valign="top">
                                <td>Place</td>
                                <td>31.08</td>
                                <td>First</td>
                                <td>17.78</td>
                                <td>Get</td>
                                <td>80.35</td>
                            </tr>
                            <tr valign="top">
                                <td>Staff</td>
                                <td>30.11</td>
                                <td>New</td>
                                <td>16.09</td>
                                <td>Do</td>
                                <td>68.72</td>
                            </tr>
                            <tr valign="top">
                                <td>Office</td>
                                <td>28.97</td>
                                <td>Friendly</td>
                                <td>16.01</td>
                                <td>Make</td>
                                <td>40.97</td>
                            </tr>
                            <tr valign="top">
                                <td>Care</td>
                                <td>28.68</td>
                                <td>Few</td>
                                <td>13.08</td>
                                <td>See</td>
                                <td>39.87</td>
                            </tr>
                            <tr valign="top">
                                <td>Appointment</td>
                                <td>25.96</td>
                                <td>Bad</td>
                                <td>13.02</td>
                                <td>Take</td>
                                <td>35.85</td>
                            </tr>
                            <tr valign="top">
                                <td>Experience</td>
                                <td>25.45</td>
                                <td>Sure</td>
                                <td>11.27</td>
                                <td>Feel</td>
                                <td>32.85</td>
                            </tr>
                            <tr valign="top">
                                <td>Dentist</td>
                                <td>21.39</td>
                                <td>Dental</td>
                                <td>11.24</td>
                                <td>Give</td>
                                <td>31.69</td>
                            </tr>
                            <tr valign="top">
                                <td>Eye</td>
                                <td>18.79</td>
                                <td>Little</td>
                                <td>11.08</td>
                                <td>Come</td>
                                <td>31.17</td>
                            </tr>
                            <tr valign="top">
                                <td>Patient</td>
                                <td>17.68</td>
                                <td>Clean</td>
                                <td>10.90</td>
                                <td>Say</td>
                                <td>31.08</td>
                            </tr>
                            <tr valign="top">
                                <td>Service</td>
                                <td>16.88</td>
                                <td>Many</td>
                                <td>10.82</td>
                                <td>Tell</td>
                                <td>30.59</td>
                            </tr>
                            <tr valign="top">
                                <td>Room</td>
                                <td>16.50</td>
                                <td>Professional</td>
                                <td>10.52</td>
                                <td>Know</td>
                                <td>28.49</td>
                            </tr>
                            <tr valign="top">
                                <td>Insurance</td>
                                <td>16.47</td>
                                <td>Last</td>
                                <td>10.18</td>
                                <td>Find</td>
                                <td>23.13</td>
                            </tr>
                            <tr valign="top">
                                <td>Hour</td>
                                <td>15.75</td>
                                <td>Live</td>
                                <td>9.97</td>
                                <td>Want</td>
                                <td>21.78</td>
                            </tr>
                            <tr valign="top">
                                <td>People</td>
                                <td>15.66</td>
                                <td>Medical</td>
                                <td>9.85</td>
                                <td>Think</td>
                                <td>20.36</td>
                            </tr>
                            <tr valign="top">
                                <td>Surgery</td>
                                <td>15.19</td>
                                <td>Next</td>
                                <td>9.66</td>
                                <td>Ask</td>
                                <td>20.25</td>
                            </tr>
                            <tr valign="top">
                                <td>Pain</td>
                                <td>14.77</td>
                                <td>Much</td>
                                <td>9.25</td>
                                <td>Recommend</td>
                                <td>18.99</td>
                            </tr>
                            <tr valign="top">
                                <td>Review</td>
                                <td>14.09</td>
                                <td>Same</td>
                                <td>8.94</td>
                                <td>Visit</td>
                                <td>15.88</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <fig id="figure1" position="float">
                    <label>Figure 1</label>
                    <caption>
                        <p>Part-of-speech analysis conducted on each sentence in COPE.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig1.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Descriptive Statistics of Reviews in COPE</title>
                <p>Over the years, there has been rapid growth in the number of COPE reviews posted on Yelp (<xref ref-type="fig" rid="figure2">Figure 2</xref>). The earliest COPE review was published in 2005, and the most recent was published in 2012. The earlier years, between 2005 and 2007, were associated with a very high year-over-year growth rate, with a doubling time every 6 months. From 2007-2012, growth stabilized at a rate of 1.5 times annually. Note that 2012 was only a partial year of data collection.</p>
                <p>Although most facilities (93.0%, 916/985) received &#60;20 reviews, 2 facilities (0.2%, 2/985) received &#62;100 reviews (<xref ref-type="fig" rid="figure3">Figure 3</xref>). The median length of each review was 635 characters (<xref ref-type="fig" rid="figure4">Figure 4</xref>) and the median number of sentences in each review was 9 (<xref ref-type="fig" rid="figure5">Figure 5</xref>).</p>
                <fig id="figure2" position="float">
                    <label>Figure 2</label>
                    <caption>
                        <p>Number of reviews per year.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig2.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure3" position="float">
                    <label>Figure 3</label>
                    <caption>
                        <p>Distribution of reviews.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig3.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure4" position="float">
                    <label>Figure 4</label>
                    <caption>
                        <p>Distribution of review length.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig4.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure5" position="float">
                    <label>Figure 5</label>
                    <caption>
                        <p>Number of sentences per review.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig5.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>Consumer Rating and Sentiment Analysis of COPE</title>
                <p>On a scale of 1-5 (with 5 being the best), 69.68% (4817/6914) of patients rated the facility favorably (&#8805;4 out of 5) (<xref ref-type="fig" rid="figure6">Figure 6</xref>). A trend was identified between length of patient reviews and perception of a negative experience (correlation=-.5829, <italic>P</italic>&#60;.001) (<xref ref-type="fig" rid="figure7">Figure 7</xref>). <xref ref-type="fig" rid="figure8">Figure 8</xref> illustrates the distribution of sentiment score per sentence. The computed sentiment score was compared with the consumer-generated rating (<italic>P</italic>&#60;.001, Pearson correlation test) (<xref ref-type="fig" rid="figure9">Figure 9</xref>). The sentiment score reflects the degree of accumulation of sentimental words in a sentence, which can be signified by <italic>positive</italic> words such as &#8220;pleasing&#8221; and &#8220;perfect,&#8221; and <italic>negative</italic> words such as &#8220;unhappy&#8221; and &#8220;disappointing.&#8221; Longer sentences tended to carry stronger sentiment scores (<xref ref-type="fig" rid="figure10">Figure 10</xref>).</p>
                <fig id="figure6" position="float">
                    <label>Figure 6</label>
                    <caption>
                        <p>Distribution of the rating scores per review.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig6.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure7" position="float">
                    <label>Figure 7</label>
                    <caption>
                        <p>Length of review versus rating score.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig7.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure8" position="float">
                    <label>Figure 8</label>
                    <caption>
                        <p>Distribution of the sentiment score per sentence.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig8.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure9" position="float">
                    <label>Figure 9</label>
                    <caption>
                        <p>Mean sentiment score of sentences in each review per patient-generated overall rating.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig9.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure10" position="float">
                    <label>Figure 10</label>
                    <caption>
                        <p>Sentiment score per length of sentence.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig10.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
            <sec>
                <title>A Consumer Vocabulary Derived From COPE to Describe Their Health Care Experience</title>
                <p>A total of 25,692 words were derived from COPE. Consistent with vocabulary used in other domains, the top 25% of the vocabulary covered 92% of the usage (<xref ref-type="fig" rid="figure11">Figure 11</xref>).</p>
                <p>COPE vocabulary was also compared to the CHV [<xref ref-type="bibr" rid="ref32">32</xref>]. Of all the words in the COPE vocabulary, 8136 (31.67%, 8136/25692) were found in the CHV. The top 20 overlapping and non-overlapping words within the CHV are shown in <xref ref-type="table" rid="table3">Table 3</xref>.</p>
                <table-wrap position="float" id="table3">
                    <label>Table 3</label>
                    <caption>
                        <p>The top 20 overlapping and non-overlapping words within the CHV.</p>
                    </caption>
                    <table width="570" border="0" cellpadding="1" cellspacing="0" rules="groups" frame="hsides">
                        <col width="104" />
                        <col width="171" />
                        <col width="134" />
                        <col width="153" />
                        <thead>
                            <tr valign="top">
                                <td colspan="2">Overlapping</td>
                                <td colspan="2">Non-overlapping</td>
                            </tr>
                            <tr valign="top">
                                <td>Word</td>
                                <td>Frequency (per 1000 sentences)</td>
                                <td>Word</td>
                                <td>Frequency (per 1000 sentences)</td>
                            </tr>
                        </thead>
                        <tbody>
                            <tr valign="top">
                                <td>Good</td>
                                <td>53.54</td>
                                <td>Take</td>
                                <td>36.43</td>
                            </tr>
                            <tr valign="top">
                                <td>Time</td>
                                <td>52.21</td>
                                <td>Give</td>
                                <td>31.69</td>
                            </tr>
                            <tr valign="top">
                                <td>Like</td>
                                <td>40.91</td>
                                <td>Tell</td>
                                <td>30.59</td>
                            </tr>
                            <tr valign="top">
                                <td>See</td>
                                <td>39.87</td>
                                <td>Care</td>
                                <td>28.68</td>
                            </tr>
                            <tr valign="top">
                                <td>Doctor</td>
                                <td>38.20</td>
                                <td>Know</td>
                                <td>28.49</td>
                            </tr>
                            <tr valign="top">
                                <td>Back</td>
                                <td>35.85</td>
                                <td>Call</td>
                                <td>24.70</td>
                            </tr>
                            <tr valign="top">
                                <td>Great</td>
                                <td>35.84</td>
                                <td>Wait</td>
                                <td>23.98</td>
                            </tr>
                            <tr valign="top">
                                <td>Feel</td>
                                <td>35.06</td>
                                <td>Find</td>
                                <td>23.13</td>
                            </tr>
                            <tr valign="top">
                                <td>Massage</td>
                                <td>32.43</td>
                                <td>Ask</td>
                                <td>20.25</td>
                            </tr>
                            <tr valign="top">
                                <td>Come</td>
                                <td>31.17</td>
                                <td>Nice</td>
                                <td>19.99</td>
                            </tr>
                            <tr valign="top">
                                <td>Place</td>
                                <td>31.08</td>
                                <td>Room</td>
                                <td>16.50</td>
                            </tr>
                            <tr valign="top">
                                <td>Work</td>
                                <td>30.50</td>
                                <td>Friendly</td>
                                <td>16.16</td>
                            </tr>
                            <tr valign="top">
                                <td>Staff</td>
                                <td>30.11</td>
                                <td>Visit</td>
                                <td>15.88</td>
                            </tr>
                            <tr valign="top">
                                <td>Office</td>
                                <td>28.97</td>
                                <td>Help</td>
                                <td>15.72</td>
                            </tr>
                            <tr valign="top">
                                <td>Appointment</td>
                                <td>25.96</td>
                                <td>Use</td>
                                <td>14.22</td>
                            </tr>
                            <tr valign="top">
                                <td>Experience</td>
                                <td>25.45</td>
                                <td>Seem</td>
                                <td>11.74</td>
                            </tr>
                            <tr valign="top">
                                <td>Look</td>
                                <td>23.96</td>
                                <td>Clean</td>
                                <td>11.55</td>
                            </tr>
                            <tr valign="top">
                                <td>Dentist</td>
                                <td>21.39</td>
                                <td>Check</td>
                                <td>10.29</td>
                            </tr>
                            <tr valign="top">
                                <td>Think</td>
                                <td>20.96</td>
                                <td>Exam</td>
                                <td>10.21</td>
                            </tr>
                            <tr valign="top">
                                <td>Well</td>
                                <td>19.37</td>
                                <td>Explain</td>
                                <td>9.06</td>
                            </tr>
                        </tbody>
                    </table>
                </table-wrap>
                <p>A co-occurrence analysis [<xref ref-type="bibr" rid="ref34">34</xref>] revealed that these words formed a network. For example, the following words formed a tight cluster when patients described their experience with platelet donation (&#8220;blood&#8221;, &#8220;donor&#8221;, &#8220;platelets&#8221;), the snacks offered (&#8220;cookie&#8221; and &#8220;juice&#8221;), and the thank-you items given (&#8220;movie&#8221; and &#8220;ticket&#8221;) (<xref ref-type="fig" rid="figure12">Figure 12</xref>).</p>
                <fig id="figure11" position="float">
                    <label>Figure 11</label>
                    <caption>
                        <p>Cumulative usage of terms versus rank of terms.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig11.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
                <fig id="figure12" position="float">
                    <label>Figure 12</label>
                    <caption>
                        <p>A network of words used by customers to describe their experiences. The size of the node indicates the frequency of the word and the width of the lines indicates the number of co-occurrences of the word-pair in the same review. An example of usage of the word “platelet” is shown in the call-out box.</p>
                    </caption>
                    <graphic xlink:href="resprot_v4i3e78_fig12.jpg" alt-version="no" mimetype="image" position="float" xlink:type="simple" />
                </fig>
            </sec>
        </sec>
        <sec sec-type="discussion">
            <title>Discussion</title>
            <sec>
                <title>Principal Findings</title>
                <p>This study yields insightful results following a statistical analysis of 79,173 sentences from 6914 patient reviews of 985 health care facilities. The trend that we observed between length of patient reviews and perception of a negative experience is consistent with a previous study of consumer reviews [<xref ref-type="bibr" rid="ref35">35</xref>]. <xref ref-type="fig" rid="figure4">Figures 4</xref> and <xref ref-type="fig" rid="figure5">5</xref> suggest that the texts in COPE are much longer than Twitter posts (140 characters), which allows more sophisticated content analysis such as identifying the debates among different reviewers in future research studies.</p>
                <p>Findings in this study indicate that online reviews could be used to understand important aspects of business from the customers&#8217; point of view. Consistent with a previous report on CHV [<xref ref-type="bibr" rid="ref33">33</xref>], we also observed that a small vocabulary set (25%) covered a majority (92%) of the content (<xref ref-type="fig" rid="figure11">Figure 11</xref>). In examining <xref ref-type="table" rid="table2">Table 2</xref> and considering the most frequent noun phrases (ie, time, doctor, massage, place, staff, office, care, appointment) we can see important aspects of health care business as the most frequent terms used by patients. <xref ref-type="table" rid="table3">Table 3</xref> further suggests that the COPE vocabulary list covers more about the patient experience with health care providers, including sentiment words such as &#8220;nice&#8221; and &#8220;friendly&#8221; and experiential words such as &#8220;wait&#8221; and &#8220;visit&#8221;. Moreover, the co-occurrence analysis revealed a statistical &#8220;wordnet&#8221;, which can recover some interesting associations in the context of health care (<xref ref-type="fig" rid="figure12">Figure 12</xref>).</p>
                <p>Our comparison of the computed sentiment score with consumer-generated rating (<xref ref-type="fig" rid="figure9">Figure 9</xref>) showed good correlation between the mean sentiment score of sentences and the patient-generated rating. This result further validated our computational approach for sentiment analysis and the consistency of rating by the patients.</p>
            </sec>
            <sec>
                <title>Limitations</title>
                <p>The data source of the Yelp Academic Dataset used herein was associated with the following study limitations. First, it was geographically biased with businesses surrounding 30 universities in the United States. <xref ref-type="table" rid="table1">Table 1</xref> suggests that the data set is highly concentrated on the East and West Coasts, and in Texas. Second, the date range of the reviews was limited from 2005-2012. There were no updates available from the Yelp Academic Dataset. However, this dataset is the accessible Yelp data for academic research, since the Terms of Service by Yelp Inc prevents any automatic data retrieval of Yelp contents. In addition, there is an implicit selection bias toward &#8220;patients&#8221; (we cannot verify they are truly patients) who choose to write a review at Yelp. Moreover, the credibility and content of some reviews have been challenged by physicians and provider organizations on whether the review content truly reflects an unbiased patient experience or is representative of the actual quality of care [<xref ref-type="bibr" rid="ref27">27</xref>].</p>
            </sec>
            <sec>
                <title>Conclusions</title>
                <p>The created and characterized COPE corpus includes patient reviews, ratings, parse trees, dependency trees, and a vocabulary list. The COPE corpus further enables future policy studies, for example, using machine learning techniques such as unsupervised learning of topic analysis or supervised analysis of classifications [<xref ref-type="bibr" rid="ref7">7</xref>] to analyze the patient reviews in the context of six domains of quality established by the Institute of Medicine [<xref ref-type="bibr" rid="ref36">36</xref>]. COPE is available for academic use [<xref ref-type="bibr" rid="ref37">37</xref>].</p>
            </sec>
        </sec>
    </body>
    <back>
        <app-group>
            <app id="app1">
                <title>Multimedia Appendix 1</title>
                <p>List of the 26 Yelp health care categories in the study.</p>
                <media xlink:href="resprot_v4i3e78_app1.pdf" xlink:title="PDF File (Adobe PDF File), 99KB" />
            </app>
        </app-group>
        <glossary>
            <title>Abbreviations</title>
            <def-list>
                <def-item>
                    <term id="abb1">CHV</term>
                    <def>
                        <p>Consumer health vocabulary</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb2">COPE</term>
                    <def>
                        <p>Corpus of Patient Experience</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb3">HCAHPS</term>
                    <def>
                        <p>Hospital Consumer Assessment of Healthcare Providers and Systems</p>
                    </def>
                </def-item>
                <def-item>
                    <term id="abb4">NLP</term>
                    <def>
                        <p>Natural language processing</p>
                    </def>
                </def-item>
            </def-list>
        </glossary>
        <ack>
            <p>The authors would like to thank Dr Bob Greenlee for helpful discussions. Majid Rastegar-Mojarad was funded through philanthropic support of Marshfield Clinic Research Foundation&#8217;s &#8220;Dr John Melski Endowed Physician Scientist&#8221; Award to Dr Simon Lin. We thank Dr Ingrid Glurich for critical review, editing, and comments.</p>
        </ack>
        <fn-group>
            <fn fn-type="conflict">
                <p>None declared.</p>
            </fn>
        </fn-group>
        <ref-list>
            <ref id="ref1">
                <label>1</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hanauer</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zheng</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Singer</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gebremariam</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Davis</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>Public awareness, perception, and use of online physician rating sites</article-title>
                    <source>JAMA</source>
                    <year>2014</year>
                    <month>02</month>
                </nlm-citation>
            </ref>
            <ref id="ref2">
                <label>2</label>
                <nlm-citation citation-type="web">
                    <source>PwC Scoring healthcare: Navigating customer experience ratings</source>
                    <access-date>2014-03-07</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.pwc.com/us/en/health-industries/publications/scoring-patient-healthcare-experience.jhtml">http://www.pwc.com/us/en/health-industries/publications/scoring-patient-healthcare-experience.jhtml</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6NtsD1BBD</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref3">
                <label>3</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Keckley</surname>
                            <given-names>P</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Coughlin</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Eselius</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <source>2011 Survey of Health Care Consumers in the United States: Key Findings, Strategic Implications</source>
                    <year>2011</year>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <publisher-name>Deloitte Center for Health Solutions</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref4">
                <label>4</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Shoemaker</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>What value-based purchasing means to your hospital</article-title>
                    <source>Healthc Financ Manage</source>
                    <year>2011</year>
                    <month>08</month>
                    <volume>65</volume>
                    <issue>8</issue>
                    <fpage>60</fpage>
                    <lpage>8</lpage>
                    <pub-id pub-id-type="medline">21866722</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref5">
                <label>5</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zusman</surname>
                            <given-names>EE</given-names>
                        </name>
                    </person-group>
                    <article-title>HCAHPS replaces Press Ganey survey as quality measure for patient hospital experience</article-title>
                    <source>Neurosurgery</source>
                    <year>2012</year>
                    <month>08</month>
                    <volume>71</volume>
                    <issue>2</issue>
                    <fpage>N21</fpage>
                    <lpage>4</lpage>
                    <pub-id pub-id-type="doi">10.1227/01.neu.0000417536.07871.ed</pub-id>
                    <pub-id pub-id-type="medline">22811203</pub-id>
                    <pub-id pub-id-type="pii">00006123-201208000-00006</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref6">
                <label>6</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Long</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Impressing patients while improving HCAHPS</article-title>
                    <source>Nurs Manage</source>
                    <year>2012</year>
                    <month>12</month>
                    <volume>43</volume>
                    <issue>12</issue>
                    <fpage>32</fpage>
                    <lpage>7</lpage>
                    <pub-id pub-id-type="doi">10.1097/01.NUMA.0000422891.99334.68</pub-id>
                    <pub-id pub-id-type="medline">23183607</pub-id>
                    <pub-id pub-id-type="pii">00006247-201212000-00009</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref7">
                <label>7</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Greaves</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ramirez-Cano</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Millett</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Darzi</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Donaldson</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Use of sentiment analysis for capturing patient experience from free-text comments posted online</article-title>
                    <source>J Med Internet Res</source>
                    <year>2013</year>
                    <volume>15</volume>
                    <issue>11</issue>
                    <fpage>e239</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2013/11/e239/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.2721</pub-id>
                    <pub-id pub-id-type="medline">24184993</pub-id>
                    <pub-id pub-id-type="pii">v15i11e239</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3841376</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref8">
                <label>8</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Greaves</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ramirez-Cano</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Millett</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Darzi</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Donaldson</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Harnessing the cloud of patient experience: using social media to detect poor quality healthcare</article-title>
                    <source>BMJ Qual Saf</source>
                    <year>2013</year>
                    <month>03</month>
                    <volume>22</volume>
                    <issue>3</issue>
                    <fpage>251</fpage>
                    <lpage>5</lpage>
                    <pub-id pub-id-type="doi">10.1136/bmjqs-2012-001527</pub-id>
                    <pub-id pub-id-type="medline">23349387</pub-id>
                    <pub-id pub-id-type="pii">bmjqs-2012-001527</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref9">
                <label>9</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Alemi</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Torii</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Clementz</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Aron</surname>
                            <given-names>DC</given-names>
                        </name>
                    </person-group>
                    <article-title>Feasibility of real-time satisfaction surveys through automated analysis of patients' unstructured comments and sentiments</article-title>
                    <source>Qual Manag Health Care</source>
                    <year>2012</year>
                    <volume>21</volume>
                    <issue>1</issue>
                    <fpage>9</fpage>
                    <lpage>19</lpage>
                    <pub-id pub-id-type="doi">10.1097/QMH.0b013e3182417fc4</pub-id>
                    <pub-id pub-id-type="medline">22207014</pub-id>
                    <pub-id pub-id-type="pii">00019514-201201000-00004</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref10">
                <label>10</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cambria</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hussain</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Durrani</surname>
                            <given-names>T</given-names>
                        </name>
                    </person-group>
                    <article-title>Sentic computing for patient centered applications</article-title>
                    <year>2010</year>
                    <month>10</month>
                    <day>28</day>
                    <conf-name>IEEE 10th International Conference on Signal Processing</conf-name>
                    <conf-date>2010</conf-date>
                    <conf-loc>Beijing, China</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref11">
                <label>11</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Cambria</surname>
                            <given-names>E</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hussain</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Havasi</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>Towards the crowd validation of the British National Health Service</article-title>
                    <source>Extending the Frontiers of Society On-Line</source>
                    <year>2010</year>
                    <month>04</month>
                    <day>27</day>
                    <conf-name>WebSci10</conf-name>
                    <conf-date>2010</conf-date>
                    <conf-loc>Raleigh, NC</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref12">
                <label>12</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Van de Belt</surname>
                            <given-names>TH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Engelen</surname>
                            <given-names>LJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Verhoef</surname>
                            <given-names>LM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Van der Weide</surname>
                            <given-names>MJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schoonhoven</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kool</surname>
                            <given-names>RB</given-names>
                        </name>
                    </person-group>
                    <article-title>Using patient experiences on Dutch social media to supervise health care services: exploratory study</article-title>
                    <source>J Med Internet Res</source>
                    <year>2015</year>
                    <volume>17</volume>
                    <issue>1</issue>
                    <fpage>e7</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2015/1/e7/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.3906</pub-id>
                    <pub-id pub-id-type="medline">25592481</pub-id>
                    <pub-id pub-id-type="pii">v17i1e7</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4319082</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref13">
                <label>13</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>L&#243;pez</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Detz</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Ratanawongsa</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sarkar</surname>
                            <given-names>U</given-names>
                        </name>
                    </person-group>
                    <article-title>What patients say about their doctors online: a qualitative content analysis</article-title>
                    <source>J Gen Intern Med</source>
                    <year>2012</year>
                </nlm-citation>
            </ref>
            <ref id="ref14">
                <label>14</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Lagu</surname>
                            <given-names>T</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hannon</surname>
                            <given-names>N</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rothberg</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Lindenauer</surname>
                            <given-names>P</given-names>
                        </name>
                    </person-group>
                    <article-title>Patients&#8217; Evaluations of Health Care Providers in the Era of Social Networking: An Analysis of Physician-Rating Websites</article-title>
                    <source>J Gen Intern Med</source>
                    <year>2010</year>
                </nlm-citation>
            </ref>
            <ref id="ref15">
                <label>15</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Brody</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Elhadad</surname>
                            <given-names>N</given-names>
                        </name>
                    </person-group>
                    <article-title>Detecting Salient Aspects in Online Reviews of Health Providers</article-title>
                    <year>2010</year>
                    <conf-name>AMIA Annu Symp Proc</conf-name>
                    <conf-date>2010</conf-date>
                    <conf-loc>USA</conf-loc>
                    <fpage>202</fpage>
                    <lpage>206</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref16">
                <label>16</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Paul</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Wallace</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dredze</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>What Affects Patient (Dis)satisfaction? Analyzing Online Doctor Ratings with a Joint Topic-Sentiment Model</article-title>
                    <year>2013</year>
                    <conf-name>Workshops at the Twenty-Seventh AAAI Conference on Artificial Intelligence</conf-name>
                    <conf-date>2013</conf-date>
                    <conf-loc>Bellevue, Washington</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref17">
                <label>17</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Kadry</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Chu</surname>
                            <given-names>LF</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kadry</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Gammas</surname>
                            <given-names>D</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Macario</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>Analysis of 4999 online physician ratings indicates that most patients give physicians a favorable rating</article-title>
                    <source>J Med Internet Res</source>
                    <year>2011</year>
                    <volume>13</volume>
                    <issue>4</issue>
                    <fpage>e95</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2011/4/e95/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.1960</pub-id>
                    <pub-id pub-id-type="medline">22088924</pub-id>
                    <pub-id pub-id-type="pii">v13i4e95</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3222200</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref18">
                <label>18</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Terlutter</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Bidmon</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>R&#246;ttl</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Who uses physician-rating websites? Differences in sociodemographic variables, psychographic variables, and health status of users and nonusers of physician-rating websites</article-title>
                    <source>J Med Internet Res</source>
                    <year>2014</year>
                    <volume>16</volume>
                    <issue>3</issue>
                    <fpage>e97</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/3/e97/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.3145</pub-id>
                    <pub-id pub-id-type="medline">24686918</pub-id>
                    <pub-id pub-id-type="pii">v16i3e97</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4004145</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref19">
                <label>19</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Emmert</surname>
                            <given-names>M</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Halling</surname>
                            <given-names>F</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Meier</surname>
                            <given-names>F</given-names>
                        </name>
                    </person-group>
                    <article-title>Evaluations of dentists on a German physician rating Website: an analysis of the ratings</article-title>
                    <source>J Med Internet Res</source>
                    <year>2015</year>
                    <volume>17</volume>
                    <issue>1</issue>
                    <fpage>e15</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2015/1/e15/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.3830</pub-id>
                    <pub-id pub-id-type="medline">25582914</pub-id>
                    <pub-id pub-id-type="pii">v17i1e15</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4319074</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref20">
                <label>20</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Verhoef</surname>
                            <given-names>LM</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Van de Belt</surname>
                            <given-names>TH</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Engelen</surname>
                            <given-names>LJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Schoonhoven</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Kool</surname>
                            <given-names>RB</given-names>
                        </name>
                    </person-group>
                    <article-title>Social media and rating sites as tools to understanding quality of care: a scoping review</article-title>
                    <source>J Med Internet Res</source>
                    <year>2014</year>
                    <volume>16</volume>
                    <issue>2</issue>
                    <fpage>e56</fpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://www.jmir.org/2014/2/e56/" />
                    </comment>
                    <pub-id pub-id-type="doi">10.2196/jmir.3024</pub-id>
                    <pub-id pub-id-type="medline">24566844</pub-id>
                    <pub-id pub-id-type="pii">v16i2e56</pub-id>
                    <pub-id pub-id-type="pmcid">PMC3961699</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref21">
                <label>21</label>
                <nlm-citation citation-type="web">
                    <source>RateMDs</source>
                    <access-date>2015-06-11</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.ratemds.com/co/colorado-springs/">https://www.ratemds.com/co/colorado-springs/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6ZC3b4Qtu</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref22">
                <label>22</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Bardach</surname>
                            <given-names>NS</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Asteria-Pe&#241;aloza</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Boscardin</surname>
                            <given-names>WJ</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Dudley</surname>
                            <given-names>RA</given-names>
                        </name>
                    </person-group>
                    <article-title>The relationship between commercial website ratings and traditional hospital performance measures in the USA</article-title>
                    <source>BMJ Qual Saf</source>
                    <year>2013</year>
                    <month>03</month>
                    <volume>22</volume>
                    <issue>3</issue>
                    <fpage>194</fpage>
                    <lpage>202</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://europepmc.org/abstract/MED/23178860" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1136/bmjqs-2012-001360</pub-id>
                    <pub-id pub-id-type="medline">23178860</pub-id>
                    <pub-id pub-id-type="pii">bmjqs-2012-001360</pub-id>
                    <pub-id pub-id-type="pmcid">PMC4074426</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref23">
                <label>23</label>
                <nlm-citation citation-type="web">
                    <source>Yelp Academic Dataset</source>
                    <access-date>2014-03-07</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://www.yelp.com/academic_dataset">https://www.yelp.com/academic_dataset</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Ntnn0cmP</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref24">
                <label>24</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Wang</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhao</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Guo</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>North</surname>
                            <given-names>C</given-names>
                        </name>
                    </person-group>
                    <article-title>Clustered layout word cloud for user generated review</article-title>
                    <year>2013</year>
                    <conf-name>The Yelp Challenge, Virginia Polytechnic Institute and State University</conf-name>
                    <conf-date>2013</conf-date>
                    <conf-loc>Blacksburg, VA</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref25">
                <label>25</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Huang</surname>
                            <given-names>J</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Rogers</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Joo</surname>
                            <given-names>E</given-names>
                        </name>
                    </person-group>
                    <article-title>Improving restaurants by extracting subtopics from Yelp reviews</article-title>
                    <year>2013</year>
                    <conf-name>The Yelp Challenge, University of California at Berkeley</conf-name>
                    <conf-date>2013</conf-date>
                    <conf-loc>Berkeley, CA</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref26">
                <label>26</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Hood</surname>
                            <given-names>B</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hwang</surname>
                            <given-names>V</given-names>
                        </name>
                        <name name-style="western">
                            <surname>King</surname>
                            <given-names>J</given-names>
                        </name>
                    </person-group>
                    <article-title>Inferring future business attention</article-title>
                    <source>Presented at the Yelp Challenge, Carnegie Mellon University</source>
                    <year>2013</year>
                    <conf-name>The Yelp Challenge, Carnegie Mellon University</conf-name>
                    <conf-date>2013</conf-date>
                    <conf-loc>Pittsburgh, PA</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref27">
                <label>27</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Butcher</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>The ratings game: bracing for the Yelp effect</article-title>
                    <source>Hosp Health Netw</source>
                    <year>2013</year>
                    <month>06</month>
                    <volume>87</volume>
                    <issue>6</issue>
                    <fpage>17</fpage>
                    <lpage>18</lpage>
                    <pub-id pub-id-type="medline">23885475</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref28">
                <label>28</label>
                <nlm-citation citation-type="web">
                    <source>The Stanford Natural Language Processing Group</source>
                    <access-date>2014-03-07</access-date>
                    <comment>Stanford CoreNLP: A Suite of Core NLP Tools <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://nlp.stanford.edu/downloads/corenlp.shtml">http://nlp.stanford.edu/downloads/corenlp.shtml</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6Ntp1C8H0</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref29">
                <label>29</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Porter</surname>
                            <given-names>M</given-names>
                        </name>
                    </person-group>
                    <article-title>An algorithm for suffix stripping</article-title>
                    <source>Program</source>
                    <year>1980</year>
                    <volume>14</volume>
                    <issue>3</issue>
                    <fpage>130</fpage>
                    <lpage>137</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref30">
                <label>30</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zhou</surname>
                            <given-names>X</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Zhang</surname>
                            <given-names>X</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hu</surname>
                            <given-names>X</given-names>
                        </name>
                    </person-group>
                    <article-title>Dragon Toolkit: incorporating auto-learned semantic knowledge into large-scale text retrieval and mining</article-title>
                    <year>2007</year>
                    <conf-name>Proceedings of the 19th IEEE International Conference on Tools with Artificial Intelligence (ICTAI)</conf-name>
                    <conf-date>2007</conf-date>
                    <conf-loc>Patras, Greece</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref31">
                <label>31</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Baccianella</surname>
                            <given-names>S</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Esuli</surname>
                            <given-names>A</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Sebastiani</surname>
                            <given-names>F</given-names>
                        </name>
                    </person-group>
                    <article-title>SentiWordNet 3.0: An enhanced lexical resource for sentiment analysis and opinion mining</article-title>
                    <year>2010</year>
                    <conf-name>7th Conference on International Language Resources and Evaluation (LREC’10)</conf-name>
                    <conf-date>2010</conf-date>
                    <conf-loc>Malta</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref32">
                <label>32</label>
                <nlm-citation citation-type="web">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Rastegar-Mojarad</surname>
                            <given-names>Majid</given-names>
                        </name>
                    </person-group>
                    <source>Theses and Dissertations</source>
                    <year>2013</year>
                    <publisher-loc>Milwaukee, WI</publisher-loc>
                    <publisher-name>University of Wisconsin-Milwaukee</publisher-name>
                    <comment>Extraction and Classification of Drug-Drug Interaction from Biomedical Text Using a Two-Stage Classifier <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://dc.uwm.edu/cgi/viewcontent.cgi?article=1309&#38;context=etd">http://dc.uwm.edu/cgi/viewcontent.cgi?article=1309&#38;context=etd</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6ZR6wxPCo</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref33">
                <label>33</label>
                <nlm-citation citation-type="journal">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Zeng</surname>
                            <given-names>QT</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Tse</surname>
                            <given-names>T</given-names>
                        </name>
                    </person-group>
                    <article-title>Exploring and developing consumer health vocabularies</article-title>
                    <source>J Am Med Inform Assoc</source>
                    <year>2006</year>
                    <volume>13</volume>
                    <issue>1</issue>
                    <fpage>24</fpage>
                    <lpage>9</lpage>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="http://jamia.oxfordjournals.org/cgi/pmidlookup?view=long&#38;pmid=16221948" />
                    </comment>
                    <pub-id pub-id-type="doi">10.1197/jamia.M1761</pub-id>
                    <pub-id pub-id-type="medline">16221948</pub-id>
                    <pub-id pub-id-type="pii">M1761</pub-id>
                    <pub-id pub-id-type="pmcid">PMC1380193</pub-id>
                </nlm-citation>
            </ref>
            <ref id="ref34">
                <label>34</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Yang</surname>
                            <given-names>C</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Jiang</surname>
                            <given-names>L</given-names>
                        </name>
                    </person-group>
                    <article-title>Using co-occurrence analysis to expand consumer health vocabularies from social media data</article-title>
                    <year>2013</year>
                    <conf-name>Proceedings of IEEE International Conference on Healthcare Informatics</conf-name>
                    <conf-date>2013</conf-date>
                    <conf-loc>Philadelphia, PA</conf-loc>
                </nlm-citation>
            </ref>
            <ref id="ref35">
                <label>35</label>
                <nlm-citation citation-type="confproc">
                    <person-group person-group-type="author">
                        <name name-style="western">
                            <surname>Vasa</surname>
                            <given-names>R</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Hoon</surname>
                            <given-names>L</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Mouzakis</surname>
                            <given-names>K</given-names>
                        </name>
                        <name name-style="western">
                            <surname>Noguchi</surname>
                            <given-names>A</given-names>
                        </name>
                    </person-group>
                    <article-title>A preliminary analysis of mobile app user reviews</article-title>
                    <year>2012</year>
                    <conf-name>Proceedings of the 24th Australian Computer-Human Interaction Conference</conf-name>
                    <conf-date>2012</conf-date>
                    <conf-loc>New York, NY</conf-loc>
                    <fpage>241</fpage>
                    <lpage>244</lpage>
                </nlm-citation>
            </ref>
            <ref id="ref36">
                <label>36</label>
                <nlm-citation citation-type="book">
                    <person-group person-group-type="author">
                        <collab>Committee on Quality of Health Care in America; Institute of Medicine</collab>
                    </person-group>
                    <source>Crossing the Quality Chasm: A New Health System for the 21st Century</source>
                    <year>2001</year>
                    <publisher-loc>Washington, DC</publisher-loc>
                    <publisher-name>National Academy Press</publisher-name>
                </nlm-citation>
            </ref>
            <ref id="ref37">
                <label>37</label>
                <nlm-citation citation-type="web">
                    <source>Corpus of Patient Experience</source>
                    <access-date>2015-06-12</access-date>
                    <comment>
                        <ext-link xmlns:xlink="http://www.w3.org/1999/xlink" xlink:type="simple" xlink:href="https://cope.codeplex.com/">https://cope.codeplex.com/</ext-link>
                    </comment>
                    <pub-id pub-id-type="other">6ZDf75mfB</pub-id>
                </nlm-citation>
            </ref>
        </ref-list>
    </back>
</article>
