<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "http://dtd.nlm.nih.gov/publishing/2.0/journalpublishing.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" article-type="research-article" dtd-version="2.0">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">JMI</journal-id>
      <journal-id journal-id-type="nlm-ta">JMIR Med Inform</journal-id>
      <journal-title>JMIR Medical Informatics</journal-title>
      <issn pub-type="epub">2291-9694</issn>
      <publisher>
        <publisher-name>JMIR Publications</publisher-name>
        <publisher-loc>Toronto, Canada</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">v7i3e14763</article-id>
      <article-id pub-id-type="pmid">31573948</article-id>
      <article-id pub-id-type="doi">10.2196/14763</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Original Paper</subject>
        </subj-group>
        <subj-group subj-group-type="article-type">
          <subject>Original Paper</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>Mining Hidden Knowledge About Illegal Compensation for Occupational Injury: Topic Model Approach</article-title>
      </title-group>
      <contrib-group>
        <contrib contrib-type="editor">
          <name>
            <surname>Eysenbach</surname>
            <given-names>Gunther</given-names>
          </name>
        </contrib>
      </contrib-group>
      <aff id="aff1">
        <label>1</label>
        <institution>Institute of Health and Environment</institution>
        <institution>Seoul National University</institution>
        <addr-line>Seoul</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <aff id="aff2">
        <label>2</label>
        <institution>Department of Preventive Medicine</institution>
        <institution>Seoul National University College of Medicine</institution>
        <addr-line>Seoul</addr-line>
        <country>Republic of Korea</country>
      </aff>
      <contrib-group>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Carvalho</surname>
            <given-names>Darlinton</given-names>
          </name>
        </contrib>
        <contrib contrib-type="reviewer">
          <name>
            <surname>Laurent</surname>
            <given-names>Christophe</given-names>
          </name>
        </contrib>
      </contrib-group>
      <contrib-group>
        <contrib id="contrib1" contrib-type="author">
          <name name-style="western">
            <surname>Min</surname>
            <given-names>Jin-Young</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff1" ref-type="aff">1</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-6578-7348</ext-link>
        </contrib>
        <contrib id="contrib2" contrib-type="author">
          <name name-style="western">
            <surname>Song</surname>
            <given-names>Sung-Hee</given-names>
          </name>
          <degrees>BSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-6225-2412</ext-link>
        </contrib>
        <contrib id="contrib3" contrib-type="author">
          <name name-style="western">
            <surname>Kim</surname>
            <given-names>HyeJin</given-names>
          </name>
          <degrees>MSc</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0002-9377-7585</ext-link>
        </contrib>
        <contrib id="contrib4" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Min</surname>
            <given-names>Kyoung-Bok</given-names>
          </name>
          <degrees>PhD</degrees>
          <xref rid="aff2" ref-type="aff">2</xref>
          <address>
            <institution>Department of Preventive Medicine</institution>
            <institution>Seoul National University College of Medicine</institution>
            <addr-line>1 Daehak-ro, Jongro-gu</addr-line>
            <addr-line>Seoul</addr-line>
            <country>Republic of Korea</country>
            <phone>82 027408968</phone>
            <email>minkb@snu.ac.kr</email>
          </address>
          <ext-link ext-link-type="orcid">https://orcid.org/0000-0001-9576-0093</ext-link>
        </contrib>
      </contrib-group>
      <author-notes>
        <corresp>Corresponding Author: Kyoung-Bok Min <email>minkb@snu.ac.kr</email></corresp>
      </author-notes>
      <pub-date pub-type="collection">
        <season>Jul-Sep</season>
        <year>2019</year>
      </pub-date>
      <pub-date pub-type="epub">
        <day>26</day>
        <month>9</month>
        <year>2019</year>
      </pub-date>
      <volume>7</volume>
      <issue>3</issue>
      <elocation-id>e14763</elocation-id>
      <history>
        <date date-type="received">
          <day>19</day>
          <month>5</month>
          <year>2019</year>
        </date>
        <date date-type="rev-request">
          <day>9</day>
          <month>7</month>
          <year>2019</year>
        </date>
        <date date-type="rev-recd">
          <day>11</day>
          <month>8</month>
          <year>2019</year>
        </date>
        <date date-type="accepted">
          <day>30</day>
          <month>8</month>
          <year>2019</year>
        </date>
      </history>
      <copyright-statement>©Jin-Young Min, Sung-Hee Song, HyeJin Kim, Kyoung-Bok Min. Originally published in JMIR Medical Informatics (http://medinform.jmir.org), 26.09.2019</copyright-statement>
      <copyright-year>2019</copyright-year>
      <license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/">
        <p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (https://creativecommons.org/licenses/by/4.0/), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Medical Informatics, is properly cited. The complete bibliographic information, a link to the original publication on http://medinform.jmir.org/, as well as this copyright and license information must be included.</p>
      </license>
      <self-uri xlink:href="https://medinform.jmir.org/2019/3/e14763" xlink:type="simple"/>
      <abstract>
        <sec sec-type="background">
          <title>Background</title>
          <p>Although injured employees are legally covered by workers’ compensation insurance in South Korea, some employers make agreements to prevent the injured employees from claiming their compensation. This leads to underreporting in occupational injury statistics. Illegal compensation (called <italic>gong-sang</italic> in Korean) is a critical method used to underreport or cover up occupational injuries. However, <italic>gong-sang</italic> is not counted in the official occupational injury statistics; therefore, we cannot identify <italic>gong-sang</italic>–related issues.</p>
        </sec>
        <sec sec-type="objective">
          <title>Objective</title>
          <p>This study aimed to analyze social media data using topic modeling to explore hidden knowledge about illegal compensation—<italic>gong-sang</italic>—for occupational injury in South Korea.</p>
        </sec>
        <sec sec-type="methods">
          <title>Methods</title>
          <p>We collected 2210 documents from social media data by filtering the keyword, <italic>gong-sang</italic>. The study period was between January 1, 2006, and December 31, 2017. After natural language processing of the Korean-language text with a morphological analyzer, we performed topic modeling using latent Dirichlet allocation (LDA) in the Python library, Gensim. A 10-topic model was selected and run with 3000 Gibbs sampling iterations to fit the model.</p>
        </sec>
        <sec sec-type="results">
          <title>Results</title>
          <p>The LDA model was used to classify <italic>gong-sang</italic>–related documents into 4 categories from a total of 10 topics. Topic 1 was the greatest concern (60.5%). Workers who suffered from industrial accidents seemed to be worried about illegal compensation and legal insurance claims, wherein keywords on the choice between illegal compensation and legal insurance claims were included. In topic 2, keywords were associated with claims for industrial accident insurance benefits. Topics 3 and 4, as the second highest concern (19%), contained keywords implying the monetary compensation of <italic>gong-sang</italic>. Topics 5 to 10 included keywords on vulnerable jobs (ie, workers in the construction and defense industry, delivery riders, and foreign workers) and body parts (ie, injuries to the hands, face, teeth, lower limbs, and back) to <italic>gong-sang</italic>.</p>
        </sec>
        <sec sec-type="conclusions">
          <title>Conclusions</title>
          <p>We explored hidden knowledge to identify the salient issues surrounding <italic>gong-sang</italic> using the LDA model. These topics may provide valuable information to ensure the more efficient operation of South Korea’s occupational health and safety administration and protect vulnerable workers from illegal <italic>gong-sang</italic> compensation practices.</p>
        </sec>
      </abstract>
      <kwd-group>
        <kwd>occupational injuries</kwd>
        <kwd>workers’ compensation</kwd>
        <kwd>social media</kwd>
        <kwd>Korea</kwd>
      </kwd-group>
    </article-meta>
  </front>
  <body>
    <sec sec-type="introduction">
      <title>Introduction</title>
      <sec>
        <title>Background</title>
        <p>Occupational injuries, defined as work-related injuries, diseases, and death, are an important public health issue. They are one of the main causes of workers’ morbidity, disability, and mortality as well as substantial losses in social and economic activities. According to the International Labor Office (ILO), 2.3 million workers die from an occupational injury or a disease annually [<xref ref-type="bibr" rid="ref1">1</xref>]. The global burden of occupational injuries has reached 4% of the global gross domestic product (approximately US $3 trillion) [<xref ref-type="bibr" rid="ref1">1</xref>].</p>
        <p>Although it is difficult to compare national rates of occupational injuries because of variations in legal and compensation criteria, South Korea’s occupational injury statistics have certain unique features, including the lowest nonfatal occupational injury rate alongside the highest death rate [<xref ref-type="bibr" rid="ref2">2</xref>]. When compared with other Organization for Economic Co-operation and Development (OECD) member countries in 2014, South Korea’s nonfatal occupational injury rate of 0.53% was far below the OECD average of 2.7%, whereas fatal work-related deaths in the country were ranked the highest (ie, 10.8 per 100,000 people) [<xref ref-type="bibr" rid="ref3">3</xref>]. South Korea also reported lower numbers of nonfatal occupational injuries and higher rates of fatal occupational injuries than European countries [<xref ref-type="bibr" rid="ref2">2</xref>].</p>
        <p>Workers in Korea are legally covered by workers’ compensation insurance when they receive more than 3 days of medical treatment [<xref ref-type="bibr" rid="ref4">4</xref>]. However, some employers make agreements with workers to prevent them from applying for the compensation insurance benefit, even in cases requiring up to 4 days of treatment. Such an agreement, which gives way to illegal compensation (<italic>gong-sang</italic> in Korean), is considered a critical example of occupational injury cover-up. Literally, “<italic>gong-sang</italic>” means a wound caused while performing official duties; in practice, it means an agreement between an employer and employee not covered by workers’ compensation insurance where the employer pays directly for the worker’s compensation for medical treatment and suspension of employment when injured at work. It is unfortunate that illegal compensation or <italic>gong-sang</italic> rates are not captured by official occupational injury statistics, and, thus, it is impossible to monitor illegally compensated occupational injuries using the conventional system [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref6">6</xref>].</p>
        <p>In this era of digital information and communication technologies, many people post their reviews of products and services from restaurants, hotels, and hospitals on the Web. They also seek professional advice on health and legal issues through social media websites. In these circumstances, seeking advice about illegal compensation or <italic>gong-sang</italic> may be similar. Injured workers who are forced by employers to agree to illegal compensation may discuss it with experts, experienced people, and the public using social media. If this is the case, Web-based data may be useful for identifying the undisclosed contents of <italic>gong-sang</italic> provided for injured employees and the hidden administration of occupational health and safety.</p>
      </sec>
      <sec>
        <title>Objectives</title>
        <p>This study aimed to analyze social media data using topic modeling to explore issues surrounding <italic>gong-sang</italic>. Topic modeling is a widely used text mining approach for analyzing large volumes of unlabeled documents to discover hidden textual patterns [<xref ref-type="bibr" rid="ref7">7</xref>]. Specific concerns addressed when analyzing data about <italic>gong-sang</italic> included the key issues described by the victims: what type of worker is vulnerable, and what kind of injuries are subject to illegal compensation.</p>
      </sec>
    </sec>
    <sec sec-type="methods">
      <title>Methods</title>
      <sec>
        <title>Data Extraction and Processing</title>
        <p>We collected social media data from knowledge-sharing websites, such as Naver Knowledge In. Knowledge-sharing websites allow people to interact with each other and share their knowledge by asking and answering questions. These websites have an accumulated knowledge database through a question-answering system. From the database, this study focused on posts that pertained to occupational injury and were answered by a certified labor attorney as expert counseling. Web scraping was used to scrape 374,308 documents with the keyword, <italic>occupational injury</italic>. Using the keyword, <italic>gong-sang</italic>, the data were filtered, and 3692 documents were identified in the social media context. We further removed 1231 duplicated documents and applied a limited study period between January 1, 2006, and December 31, 2017. Finally, 2210 documents were included for further analysis. We analyzed Google Trends data to highlight public attention to <italic>gong-sang</italic> issues and displayed the trend for search queries on occupational accidents, <italic>gong-sang</italic> handling, and workers’ compensation. Google Trends provided a time series index of the number of queries entered into Google for a given topic in South Korea across 12 years (2006-2017). The value displayed in Google Trends is not based on the total number of searches but represents the search interest relative to the highest point on the chart for the given time and geographic region.</p>
        <p>Social media posts pertaining to occupational injury were processed to transform unstructured textual documents into structured data using the Python package. For natural language processing of the Korean language, KoNLPy, a relatively new open source morphological analyzer library, developed by Park and Cho [<xref ref-type="bibr" rid="ref8">8</xref>], was used. Thereafter, unnecessary sentence components (ie, special characters, numbers, and punctuation) and meaningless words (ie, <italic>a</italic>, <italic>the</italic>, and <italic>it</italic>) in the text file were removed, and nouns with more than 2 letters were extracted. Next, a term-document matrix was constructed, which used term frequency–inverse document frequency (TF-IDF) weights for information retrieval. A TF-IDF algorithm evaluates how important a word is in a document in a collection or corpus, with the value increasing proportionally to the number of times a word appears in a document [<xref ref-type="bibr" rid="ref9">9</xref>]. To provide relationships between the keywords in the <italic>gong-sang</italic>–related documents, we analyzed the co-occurrence network of high-frequency words using Gephi modules in Python.</p>
      </sec>
      <sec>
        <title>Applying Topic Modeling</title>
        <p>Topic modeling is an emerging field in machine learning that detects the hidden topics in large textual corpora. Latent Dirichlet allocation (LDA) is one of the most popular topic modeling techniques. LDA states that each document in a corpus is a mixture of latent topics and that each word’s presence is attributable to one of the document’s topics [<xref ref-type="bibr" rid="ref7">7</xref>]. In the LDA model, topic distribution over each document and word distribution over each topic share the common Dirichlet prior [<xref ref-type="bibr" rid="ref7">7</xref>]. We used LDA in Gensim, a Python library, for topic modeling. Perplexity was evaluated to determine the optimal number of topics and then computed to determine the difference in perplexity change. Perplexity is a common method to measure how well a probability distribution predicts a held-out sample [<xref ref-type="bibr" rid="ref7">7</xref>]. A lower value of the difference in perplexity change denotes a better probabilistic model. LDA defines a <italic>topic</italic> as a probability distribution over a fixed vocabulary in a given document [<xref ref-type="bibr" rid="ref7">7</xref>]. The parameter λ determines the weight given to the probability of a term within a topic relative to its lift. Setting λ=1 results in the familiar ranking of terms in decreasing order of their topic-specific probability, whereas setting λ=0 ranks terms solely by their lift. We set λ=1 and ran the LDA with 3000 Gibbs sampling iterations. A 10-topic model with the lowest difference in perplexity change was used, and topics were plotted using circles on a 2-dimensional plane along the transverse (PC1) and longitudinal (PC2) axes. In this visualization, each topic was presented as a circle, and the circle area represented the prevalence of each topic. The centers of each topic were determined by computing the distance between topics. Furthermore, we used multidimensional scaling to represent the intertopic distances in 2 dimensions [<xref ref-type="bibr" rid="ref10">10</xref>].</p>
      </sec>
    </sec>
    <sec sec-type="results">
      <title>Results</title>
      <sec>
        <title>Summary Statistics</title>
        <p><xref rid="figure1" ref-type="fig">Figure 1</xref> displays the trends on Google Trends for search queries on <italic>gong-sang</italic>–related topics, specifically occupational accidents, <italic>gong-sang</italic> handling, and workers’ compensation, over 12 years. Among them, occupational accidents was the most popular term. The popularity of occupational accidents nonlinearly decreased from 2006 until 2012; subsequently, it steadily increased. In the queries for <italic>gong-sang</italic> handling and workers’ compensation, although there was a wide fluctuation in their popularity between 2006 and 2010, the queries’ concern continued even when the popularity was low, relative to occupational accidents.</p>
        <p>The value is calculated relative to the highest point on the chart for 12 years in South Korea: a value of 100 is the highest popularity of each term, and a value of 50 means that these terms were searched as frequently as half of the highest popularity.</p>
        <p>We identified 2210 <italic>gong-sang</italic>–related documents from the expert counseling service between January 1, 2006, and December 31, 2017. <xref ref-type="table" rid="table1">Table 1</xref> shows the distribution of the number of documents during the study period. The number of documents was less than 100 in 2006 and 2007; however, over the years, there has been a gradual increase in the documents.</p>
        <p><xref rid="figure2" ref-type="fig">Figure 2</xref> shows a word cloud display, a visual representation of the word frequency within the <italic>gong-sang</italic>–related documentation. The clouds provide greater prominence to words that appear more frequently in the given text.</p>
        <p><xref rid="figure2" ref-type="fig">Figure 2</xref> shows the co-occurrence network of high-frequency words in the <italic>gong-sang</italic>–related documents. A node represents the co-occurrence relationship between two words appearing in the same article simultaneously. Nodes with a large degree are considered high-connectivity nodes or hub nodes.</p>
        <fig id="figure1" position="float">
          <caption>
            <p>The trend on Google Trends for search queries on gong-sang–related topics—occupational accident, gong-sang handling, and workers’ compensation—between 2006 and 2017.</p>
          </caption>
          <graphic xlink:href="medinform_v7i3e14763_fig1.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
        <table-wrap position="float" id="table1">
          <label>Table 1</label>
          <caption>
            <p>The number of gong-sang–related documents between 2006 and 2017 (N=2210).</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Year</td>
                <td>Number of documents, n (%)</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>2006</td>
                <td>49 (2.2)</td>
              </tr>
              <tr valign="top">
                <td>2007</td>
                <td>70 (3.2)</td>
              </tr>
              <tr valign="top">
                <td>2008</td>
                <td>110 (5.0)</td>
              </tr>
              <tr valign="top">
                <td>2009</td>
                <td>156 (7.1)</td>
              </tr>
              <tr valign="top">
                <td>2010</td>
                <td>111 (5.0)</td>
              </tr>
              <tr valign="top">
                <td>2011</td>
                <td>121 (5.5)</td>
              </tr>
              <tr valign="top">
                <td>2012</td>
                <td>156 (7.1)</td>
              </tr>
              <tr valign="top">
                <td>2013</td>
                <td>197 (8.9)</td>
              </tr>
              <tr valign="top">
                <td>2014</td>
                <td>236 (10.7)</td>
              </tr>
              <tr valign="top">
                <td>2015</td>
                <td>289 (13.1)</td>
              </tr>
              <tr valign="top">
                <td>2016</td>
                <td>329 (14.9)</td>
              </tr>
              <tr valign="top">
                <td>2017</td>
                <td>386 (17.5)</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure2" position="float">
          <caption>
            <p>Co-occurrence network of high-frequency words in the gong-sang–related documents.</p>
          </caption>
          <graphic xlink:href="medinform_v7i3e14763_fig2.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
      </sec>
      <sec>
        <title>Topic Modeling</title>
        <p>In <xref ref-type="table" rid="table2">Table 2</xref>, the top 20 most frequent words have been provided. Intuitive words about <italic>gong-sang</italic> (ie, handling, company, <italic>gong-sang</italic>, and occupational injury) were sorted into the upper half. Words such as hospital, treatment, level, surgical operation, hospitalization, accident, site, diagnosis, and back were associated with bodily injury.</p>
        <p>To classify the given documents on a particular topic, we determined the number of topics by calculating their perplexity. We adopted a 10-topic model with the lowest difference in perplexity changes and plotted the topics as seen in <xref rid="figure3" ref-type="fig">Figure 3</xref>. The overall view of topics is expressed as circles on the left panel, and the top 20 most useful terms for interpreting each topic are shown in a bar chart on the right panel.</p>
        <table-wrap position="float" id="table2">
          <label>Table 2</label>
          <caption>
            <p>Top 20 high-frequency words in the gong-sang–related documents.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="500"/>
            <col width="500"/>
            <thead>
              <tr valign="top">
                <td>Keywords</td>
                <td>Frequency</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td>handling</td>
                <td>6076</td>
              </tr>
              <tr valign="top">
                <td>company</td>
                <td>5251</td>
              </tr>
              <tr valign="top">
                <td>gong-sang</td>
                <td>4188</td>
              </tr>
              <tr valign="top">
                <td>occupational injury</td>
                <td>3682</td>
              </tr>
              <tr valign="top">
                <td>hospital</td>
                <td>3238</td>
              </tr>
              <tr valign="top">
                <td>treatment</td>
                <td>2371</td>
              </tr>
              <tr valign="top">
                <td>level</td>
                <td>1684</td>
              </tr>
              <tr valign="top">
                <td>surgical operation</td>
                <td>1501</td>
              </tr>
              <tr valign="top">
                <td>insurance</td>
                <td>1242</td>
              </tr>
              <tr valign="top">
                <td>hospitalization</td>
                <td>1239</td>
              </tr>
              <tr valign="top">
                <td>accident</td>
                <td>1032</td>
              </tr>
              <tr valign="top">
                <td>pay</td>
                <td>1022</td>
              </tr>
              <tr valign="top">
                <td>case</td>
                <td>970</td>
              </tr>
              <tr valign="top">
                <td>site</td>
                <td>929</td>
              </tr>
              <tr valign="top">
                <td>condition</td>
                <td>911</td>
              </tr>
              <tr valign="top">
                <td>agreement</td>
                <td>868</td>
              </tr>
              <tr valign="top">
                <td>re-treat</td>
                <td>837</td>
              </tr>
              <tr valign="top">
                <td>diagnosis</td>
                <td>822</td>
              </tr>
              <tr valign="top">
                <td>working</td>
                <td>791</td>
              </tr>
              <tr valign="top">
                <td>back</td>
                <td>750</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
        <fig id="figure3" position="float">
          <caption>
            <p>The layout of latent Dirichlet allocation of the gong-sang–related documents, with a global topic view on the left and the term bar charts on the right. PC1: transverse axis; PC2: longitudinal axis.</p>
          </caption>
          <graphic xlink:href="medinform_v7i3e14763_fig3.png" alt-version="no" position="float" xlink:type="simple"/>
        </fig>
        <p>Keywords on each topic with a percentage of the given documents are summarized in <xref ref-type="table" rid="table3">Table 3</xref>. Topic 1 was the most popular at 60.5%. We interpreted this topic as the choice between illegal compensation (<italic>gong-sang</italic>) and legal insurance claims (actual medical cost insurance as private insurance or industrial accident compensation insurance as social insurance). Topic 2 included keywords associated with claims for industrial accident insurance benefits. Topics 3 and 4 were classified as similar subjects: monetary compensation for subcontractors (topic 3) and daily workers (topic 4). Approximately 11% corresponded to topics 5 to 10. These 6 topics involved keywords relating to injured body parts and the employment status of <italic>gong-sang</italic>. The words included hand injury (topic 5), construction workers (topic 6), accidental injury to the body (topic 7), vulnerable job (topic 8), lower limb and back injury (topic 9), and foreign workers (topic 10).</p>
        <table-wrap position="float" id="table3">
          <label>Table 3</label>
          <caption>
            <p>Topic classification and keywords on gong-sang.</p>
          </caption>
          <table width="1000" cellpadding="5" cellspacing="0" border="1" rules="groups" frame="hsides">
            <col width="30"/>
            <col width="370"/>
            <col width="510"/>
            <col width="90"/>
            <thead>
              <tr valign="top">
                <td colspan="2">Classification and topic name</td>
                <td>Keywords</td>
                <td>Values, %</td>
              </tr>
            </thead>
            <tbody>
              <tr valign="top">
                <td colspan="4">
                  <bold>Choice between illegal compensation and legal insurance claims</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 1: Actual medical cost insurance or industrial accident compensation insurance</td>
                <td>insurance, hospital, company, pay, occupational accident, actual expense, retreat, diagnosis, agreement, treatment, hospitalization, indemnification, application, amount, claim</td>
                <td>60.5</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Claim for industrial accident insurance benefits</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 2: Industrial accident insurance benefits</td>
                <td>payment, surgical operation, medical expenses, fracture, burden, employee, medical treatment, allowance, receipt, disability, salary, bonus, guarantee, public corporation, business owner</td>
                <td>11.3</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Monetary compensation for subcontractors and daily workers</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 3: Money compensation for subcontractors</td>
                <td>salary, subcontract, hammering, claim, calculation, date, annual leave, medical expenses, scar, in-company, lumbar, basic pay, shipyard, money, industrial accident</td>
                <td>11.1</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 4: Money compensation for daily workers</td>
                <td>muscle, X-ray, daily pay, daily wage, action, total amount, loss, disability, injury, hospital charge, convalescence, work, business owner, refusal, exemption</td>
                <td>8.1</td>
              </tr>
              <tr valign="top">
                <td colspan="4">
                  <bold>Descriptions of illegal compensation: vulnerable body part and employment status</bold>
                </td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 5: Hand injuries</td>
                <td>finger, record, general practice, needle, suture, first medical examination, right hand, stitches, materials, operation, thumb, index finger, emergency department, centimeter, laceration</td>
                <td>2.9</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 6: Construction workers</td>
                <td>medical certificate, severance pay, progression, region, subcontract, last year, Saturday, duration, reason, disk, resign, one’s own expense, building completion, official vacation, flange</td>
                <td>2.0</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 7: Accidental injury to the body</td>
                <td>day labor, face, circumstance, acquaintance, tooth fracture, degeneration, traffic accident, cause, dental crown, exposure, nitric acid, breathing, right, chest, implant</td>
                <td>2.7</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 8: Vulnerable jobs</td>
                <td>metal pin, claim, construction, guard, carpenter, pickup, delivery, outskirts, penalty, defense industry, rider, memorandum, separate collection, defense personnel, McDonalds</td>
                <td>1.7</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 9: Lower limb and back injuries</td>
                <td>knee, cartilage, cast, cruciate ligaments, height, mediation, ligaments, rupture, compensation, coin patch, defeat, medicine, back, tarsal bone, technician</td>
                <td>0.9</td>
              </tr>
              <tr valign="top">
                <td>
                  <break/>
                </td>
                <td>Topic 10: Foreign workers</td>
                <td>outplacement, inflammation, evidence, patient, foreigner, recruitment, rotation, overwork, hospitalization, surgical operation, trauma, South Korea, Hangeul (Korean alphabet), reentry, false</td>
                <td>0.6</td>
              </tr>
            </tbody>
          </table>
        </table-wrap>
      </sec>
    </sec>
    <sec sec-type="discussion">
      <title>Discussion</title>
      <sec>
        <title>Principal Findings</title>
        <p>Illegal compensation (ie, <italic>gong-sang</italic>) because of occupational injury is a serious social problem in South Korea. At the company level, <italic>gong-sang</italic> entails a violation of an employer’s legal obligations, for example, the obligation to declare serious industrial accidents. However, as <italic>gong-sang</italic> is used to avoid penalties, including court proceedings under the Korean Industrial Safety and Health Act, avoid increases in insurance premiums, and, in case of construction companies, avoid restrictions in government-ordered construction projects, companies often force injured workers to agree to <italic>gong-sang</italic>. At the public level, <italic>gong-sang</italic> could be a financial burden for the National Health Insurance scheme, because workers’ injuries that are not officially reported as industrial accidents will be covered by the National Health Insurance and not the industrial accident compensation insurance. The practice of <italic>gong-sang</italic> in the workplace consequently leads to the distortion of official occupational accident statistics.</p>
        <p>Despite the significance of <italic>gong-sang</italic>, it is not formally declared. Some surveys have provided a limited understanding of <italic>gong-sang</italic> by focusing on workers in a certain job. Our study analyzed a Web-based knowledge search dataset from 2006 to 2017 and identified the major issues surrounding <italic>gong-sang</italic>. The results of topic modeling were classified into 4 categories from 10 topics. Topic 1 was of the greatest concern (60.5%). Workers who suffered from industrial accidents seemed to be worried about illegal compensation and legal insurance claims. There were words alluding to <italic>gong-sang</italic>, such as company, occupational accident, agreement, diagnosis, and indemnification. Some words implied legal compensation: actual medical cost insurance (ie, hospital, actual expense, hospitalization, treatment, and application) as personal insurance and workers’ compensation insurance (ie, insurance, pay, retreat, amount, and claim) as social insurance. According to a study of industrial accidents [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref11">11</xref>], injured workers (those requiring medical care for more than 3 days) often tacitly agreed to <italic>gong-sang</italic> with the employer. Workers compensated with <italic>gong-sang</italic> were often in trouble because of insufficient company payouts and the aftereffects of their occupational accident. Thereafter, the entire burden would be on the individual. Such circumstances may lead workers to be concerned about whether they were receiving illegal compensation (<italic>gong-sang</italic>) or legal insurance claims.</p>
        <p>The next highest concern (19.2%) was the <italic>gong-sang</italic> monetary compensation, and topics 3 and 4 corresponded to this. There were keywords estimating monetary rewards from occupational injuries (ie, salary, claim, calculation, date, annual leave, medical expense, scar, lumbar, basic pay, money, industrial accident, muscle, X-ray, total amount, disability, injury, hospital charge, and convalescence) and conjecturing the company’s attitude (ie, loss, business owners, action, refusal, and exemption). Vulnerable workers, such as subcontractors (ie, subcontract, hammering, shipyard, and in-company) and daily workers (ie, daily pay, daily wage, and work), seemed to be more involved in this issue. A subcontractor is hired by a general contractor to perform a specific task as part of an overall project. Subcontractors or daily workers, as a representative class excluded from social insurance, were often forced to accept <italic>gong-sang</italic> from company or business owners in the event of an occupational accident and were known to prefer it often [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref12">12</xref>].</p>
        <p>Another important classification was claiming for industrial accident insurance benefits. Industrial accident compensation benefit is a social insurance system administered by the state to promptly compensate workers who have suffered an industrial accident and to relieve the employer’s temporary economic burden. Topic 2 included keywords implying medical care benefits (ie, payment, surgical operation, medical expenses, fracture, medical treatment, and receipt), unemployment benefits (ie, allowance, salary, bonus, guarantee, and business owner), and disability benefits (ie, burden, employee, disability, and public corporation), which are components of industrial accident compensation benefits.</p>
        <p>The remaining topics (topics 5-10) were classified as descriptions of illegal compensation, focusing on vulnerable body parts and employment status. The main keywords of topic 5 referred to hand injuries (ie, finger, general practice, needle, suture, first medical examination, right hand, stitches, surgical operation, thumb, index finger, emergency department, centimeter, and laceration). Topic 9 suggested keywords corresponding to the lower limbs (ie, knee, cartilage, cast, cruciate ligaments, ligaments, rupture, and tarsal bone) and back injuries (ie, coin patch, medicine, and back). In topic 7, keywords also suggested bodily injuries (ie, face, tooth fracture, degeneration, dental crown, breathing, chest, and implant) because of occupational accidents (ie, day labor, traffic accident, cause, exposure, and nitric acid). Despite the lack of official statistics, it seemed that fatal industrial accidents were covered by workers’ compensation insurance, and <italic>gong-sang</italic> was taken for granted in nonfatal injury cases. Our data indicated that nonfatal injuries that occurred to the hands, face, teeth, lower limbs, and back were often associated with <italic>gong-sang</italic>.</p>
        <p>The employment status vulnerable to <italic>gong-sang</italic> seemed to be referenced most in topics 6, 8, and 10. There were keywords such as construction workers (ie, region, subcontract, Saturday, duration, building completion, and flange) in topic 6, vulnerable jobs (ie, construction, guard, carpenter, pickup, delivery, defense industry, rider, separate collection, defense personnel, and McDonalds) in topic 8, and foreign workers (ie, foreigner, recruitment, rotation, overwork, South Korea, Hangeul, and reentry) in topic 10. Additional words across these 3 topics were likely to refer to managing <italic>gong-sang</italic>. For example, the type of compensation (ie, medical certificate, severance pay, progression, last year, reason, disk, resign, one’s own expense, and official vacation in topic 6) and the consequences (ie, outplacement, inflammation, evidence, patient, hospitalization, surgical operation, trauma, and false in topic 10). Workers in precarious jobs, such as builders, guards, and delivery persons, lack occupational health and safety protection and social security coverage [<xref ref-type="bibr" rid="ref13">13</xref>]. Although they are covered by workers’ compensation insurance, workers in precarious jobs tend to prefer <italic>gong-sang</italic> because they are afraid of the disadvantages related to their work due to official insurance claims [<xref ref-type="bibr" rid="ref6">6</xref>,<xref ref-type="bibr" rid="ref12">12</xref>]. Our results indicated that workers in defense-related industries (or defense personnel) and foreign workers were particularly vulnerable. A worker in the defense industry refers to young men who are treated as an exception and have their military duties substituted within a fixed duration. 
Although workers in defense-related industries are treated unfairly and are offered <italic>gong-sang</italic> in the case of occupational injury, they tend to be overlooked because of the mandatory replacement period for military service [<xref ref-type="bibr" rid="ref14">14</xref>]. Meanwhile, foreign workers have the same basic labor rights as Korean nationals. Nonetheless, many foreign workers remain unaware of the industrial health and safety provisions in different countries, and their job stability tends to be poor because of their illegal immigration status [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>]; therefore, they are not offered appropriate compensation in the workplace.</p>
      </sec>
      <sec>
        <title>Implication</title>
        <p>This is the first study to use topic modeling to analyze unstructured Web-based text data about <italic>gong-sang</italic>–related topics. Our study provides important insights into the actual circumstances surrounding <italic>gong-sang</italic>, for example, injured workers’ concerns (as seen in topics 1-4) about <italic>gong-sang</italic> and the types of jobs and injuries associated with <italic>gong-sang</italic> (topics 5-10). However, illegal compensation or <italic>gong-sang</italic> is considered as a situation exclusive to South Korea. According to our observations, companies would like to limit their penalties (such as increases in insurance premiums and restrictions in government-ordered construction projects) derived from employees’ injury or illness and impose illegal compensations for injured workers. However, it is not known whether regulations and/or insurance in other countries obligate employers to compensate injured workers. For example, some international firms have arrangements wherein they offer a pickup and drop-off service for workers who cannot walk. Regulations in the West allow such services and companies to not register these people as temporarily unemployed when they conduct adapted tasks. Eventually, illegal workers’ compensation in South Korea may not be considered as a crime or fraud in the rest of the world. The interpretation and application of our results should be executed cautiously.</p>
      </sec>
      <sec>
        <title>Limitation</title>
        <p>This study needs to address the drawbacks of topic modeling. The topic modeling technique is highly effective for extracting knowledge from previously unknown information contained in unstructured big data [<xref ref-type="bibr" rid="ref17">17</xref>,<xref ref-type="bibr" rid="ref18">18</xref>] and has been widely used in the field of biological and medical document mining. Nonetheless, as is the case with all text mining approaches, difficulties arise when making interpretations and subjective validations, as the <italic>truth</italic> contained in the given documents and the number of relevant themes are not known <italic>a priori</italic> [<xref ref-type="bibr" rid="ref18">18</xref>]. We determined the best topic model by applying 3000 iterative processes and a perplexity-based method. However, the total number of topics remains unknown and depends on reasonable deductions. Future study is required to validate our perspective of <italic>gong-sang</italic>–related issues. A comparative study of another methodological approach (ie, grounded theory and deep learning) could be useful for knowledge discovery and comprehension.</p>
      </sec>
      <sec>
        <title>Conclusions</title>
        <p>In conclusion, we explored unstructured Web-based data and discovered hidden knowledge to identify the salient issues surrounding <italic>gong-sang</italic>. The topics formulated by LDA topic modeling included queries about legal insurance claims, such as private or social insurance (topics 1-2), monetary compensation (topics 3-4), injured body parts (topics 5, 7, and 9), and the type of jobs (topics 6, 8, and 10) vulnerable to <italic>gong-sang</italic>. These topics may provide valuable information to ensure further efficient operation of South Korea’s occupational health and safety administration and protect vulnerable workers from illegal <italic>gong-sang</italic> compensation practices.</p>
      </sec>
    </sec>
  </body>
  <back>
    <app-group/>
    <glossary>
      <title>Abbreviations</title>
      <def-list>
        <def-item>
          <term id="abb1">ILO</term>
          <def>
            <p>International Labor Office</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb2">LDA</term>
          <def>
            <p>latent Dirichlet allocation</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb3">OECD</term>
          <def>
            <p>Organization for Economic Co-operation and Development</p>
          </def>
        </def-item>
        <def-item>
          <term id="abb4">TF-IDF</term>
          <def>
            <p>term frequency-inverse document frequency</p>
          </def>
        </def-item>
      </def-list>
    </glossary>
    <ack>
      <p>This study was funded by the National Research Foundation of Korea grant funded by the Korean government (No. NRF-2017R1E1A1A01078235).</p>
    </ack>
    <fn-group>
      <fn fn-type="conflict">
        <p>None declared.</p>
      </fn>
    </fn-group>
    <ref-list>
      <ref id="ref1">
        <label>1</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hämäläinen</surname>
              <given-names>P</given-names>
            </name>
            <name name-style="western">
              <surname>Takala</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Kiat</surname>
              <given-names>TB</given-names>
            </name>
          </person-group>
          <source>Global Estimates of Occupational Accidents and Work-related Illnesses 2017</source>
          <year>2017</year>
          <publisher-loc>Singapore</publisher-loc>
          <publisher-name>Workplace Safety and Health Institute</publisher-name>
        </nlm-citation>
      </ref>
      <ref id="ref2">
        <label>2</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>SK</given-names>
            </name>
            <name name-style="western">
              <surname>Kwon</surname>
              <given-names>OJ</given-names>
            </name>
          </person-group>
          <article-title>Occupational injury statistics in Korea</article-title>
          <source>Saf Health Work</source>
          <year>2011</year>
          <month>03</month>
          <volume>2</volume>
          <issue>1</issue>
          <fpage>52</fpage>
          <lpage>6</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://linkinghub.elsevier.com/retrieve/pii/S2093-7911(11)21007-2"/>
          </comment>
          <pub-id pub-id-type="doi">10.5491/SHAW.2011.2.1.52</pub-id>
          <pub-id pub-id-type="medline">22953187</pub-id>
          <pub-id pub-id-type="pii">S2093-7911(11)21007-2</pub-id>
          <pub-id pub-id-type="pmcid">PMC3431889</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref3">
        <label>3</label>
        <nlm-citation citation-type="web">
          <source>Open Government Data Platform</source>
          <year>2013</year>
          <access-date>2019-09-12</access-date>
          <comment>Industrial Injuries in Factories<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://data.gov.in/catalog/industrial-injuries-factories?filters%5Bfield_catalog_reference%5D=88650&#38;format=json&#38;offset=0&#38;limit=6&#38;sort%5Bcreated%5D=desc">https://data.gov.in/catalog/industrial-injuries-factories?filters%5Bfield_catalog_reference%5D=88650&#38;format=json&#38;offset=0&#38;limit=6&#38;sort%5Bcreated%5D=desc</ext-link></comment>
        </nlm-citation>
      </ref>
      <ref id="ref4">
        <label>4</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rhee</surname>
              <given-names>KY</given-names>
            </name>
            <name name-style="western">
              <surname>Choe</surname>
              <given-names>SW</given-names>
            </name>
          </person-group>
          <article-title>Management system of occupational diseases in Korea: statistics, report and monitoring system</article-title>
          <source>J Korean Med Sci</source>
          <year>2010</year>
          <month>12</month>
          <volume>25</volume>
          <issue>Suppl</issue>
          <fpage>S119</fpage>
          <lpage>26</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://jkms.org/DOIx.php?id=10.3346/jkms.2010.25.S.S119"/>
          </comment>
          <pub-id pub-id-type="doi">10.3346/jkms.2010.25.S.S119</pub-id>
          <pub-id pub-id-type="medline">21258584</pub-id>
          <pub-id pub-id-type="pmcid">PMC3023350</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref5">
        <label>5</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Choi</surname>
              <given-names>U</given-names>
            </name>
          </person-group>
          <article-title>Survey on the Industrial Accident Insurance Act: suggestion of several points to be revised</article-title>
          <source>Labor Law Rev</source>
          <year>2009</year>
          <volume>26</volume>
          <fpage>317</fpage>
          <lpage>47</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://m.riss.kr/search/detail/DetailView.do?p_mat_type=1a0202e37d52c72d&#38;control_no=f9529104849e6109e9810257f7042666"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref6">
        <label>6</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>JS</given-names>
            </name>
          </person-group>
          <article-title>Risk-shifting and institutional lag: industrial accident statistics of regular workers and inside contract workers at the Hyundai motor Ulsan plant</article-title>
          <source>Korean J Labor Stud</source>
          <year>2007</year>
          <volume>13</volume>
          <issue>2</issue>
          <fpage>213</fpage>
          <lpage>48</lpage>
          <pub-id pub-id-type="doi">10.17005/kals.2007.13.2.213</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref7">
        <label>7</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Blei</surname>
              <given-names>DM</given-names>
            </name>
            <name name-style="western">
              <surname>Ng</surname>
              <given-names>AY</given-names>
            </name>
            <name name-style="western">
              <surname>Jordan</surname>
              <given-names>MI</given-names>
            </name>
          </person-group>
          <article-title>Latent Dirichlet allocation</article-title>
          <source>J Mach Learn Res</source>
          <year>2003</year>
          <month>01</month>
          <volume>3</volume>
          <fpage>993</fpage>
          <lpage>1022</lpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="http://www.jmlr.org/papers/volume3/blei03a/blei03a.pdf"/>
          </comment>
        </nlm-citation>
      </ref>
      <ref id="ref8">
        <label>8</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Park</surname>
              <given-names>EJ</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>SZ</given-names>
            </name>
          </person-group>
          <article-title>KoNLPy: Korean Natural Language Processing in Python</article-title>
          <source>Proceedings of the 26th Annual Conference on Human &#38; Cognitive Language Technology</source>
          <year>2014</year>
          <conf-name>HLTCon'14</conf-name>
          <conf-date>December, 2014</conf-date>
          <conf-loc>Chuncheon, Korea</conf-loc>
        </nlm-citation>
      </ref>
      <ref id="ref9">
        <label>9</label>
        <nlm-citation citation-type="book">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Rajaraman</surname>
              <given-names>A</given-names>
            </name>
            <name name-style="western">
              <surname>Ullman</surname>
              <given-names>JD</given-names>
            </name>
          </person-group>
          <article-title>Data mining</article-title>
          <source>Mining of Massive Datasets</source>
          <year>2011</year>
          <publisher-loc>Cambridge, United Kingdom</publisher-loc>
          <publisher-name>Cambridge University Press</publisher-name>
          <fpage>1</fpage>
          <lpage>17</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref10">
        <label>10</label>
        <nlm-citation citation-type="confproc">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Chuang</surname>
              <given-names>J</given-names>
            </name>
            <name name-style="western">
              <surname>Ramage</surname>
              <given-names>D</given-names>
            </name>
            <name name-style="western">
              <surname>Manning</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Heer</surname>
              <given-names>J</given-names>
            </name>
          </person-group>
          <article-title>Interpretation and Trust: Designing Model-Driven Visualizations for Text Analysis</article-title>
          <source>Proceedings of the SIGCHI Conference on Human Factors in Computing Systems</source>
          <year>2012</year>
          <conf-name>CHI’12</conf-name>
          <conf-date>May 5-10, 2012</conf-date>
          <conf-loc>Austin, Texas, USA</conf-loc>
          <fpage>443</fpage>
          <lpage>52</lpage>
          <pub-id pub-id-type="doi">10.1145/2207676.2207738</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref11">
        <label>11</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Nam</surname>
              <given-names>KS</given-names>
            </name>
          </person-group>
          <article-title>The state of unreported industrial accidents and its counter-measures in small and medium-sized manufacturing companies</article-title>
          <source>J Korea Saf Manag Sci</source>
          <year>2007</year>
          <volume>9</volume>
          <issue>3</issue>
          <fpage>29</fpage>
          <lpage>40</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref12">
        <label>12</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Shin</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>DH</given-names>
            </name>
            <name name-style="western">
              <surname>Ahn</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>HD</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>JH</given-names>
            </name>
            <name name-style="western">
              <surname>Kang</surname>
              <given-names>HM</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>JT</given-names>
            </name>
          </person-group>
          <article-title>Factors associated with occupational injuries of ship-building supply workers in Busan</article-title>
          <source>Korean J Occup Environ Med</source>
          <year>2008</year>
          <month>01</month>
          <volume>20</volume>
          <issue>1</issue>
          <fpage>15</fpage>
          <lpage>24</lpage>
          <pub-id pub-id-type="doi">10.35371/kjoem.2008.20.1.15</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref13">
        <label>13</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Quinlan</surname>
              <given-names>M</given-names>
            </name>
            <name name-style="western">
              <surname>Mayhew</surname>
              <given-names>C</given-names>
            </name>
            <name name-style="western">
              <surname>Bohle</surname>
              <given-names>P</given-names>
            </name>
          </person-group>
          <article-title>The global expansion of precarious employment, work disorganization, and consequences for occupational health: a review of recent research</article-title>
          <source>Int J Health Serv</source>
          <year>2001</year>
          <volume>31</volume>
          <issue>2</issue>
          <fpage>335</fpage>
          <lpage>414</lpage>
          <pub-id pub-id-type="doi">10.2190/607H-TTV0-QCN6-YLT4</pub-id>
          <pub-id pub-id-type="medline">11407174</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref14">
        <label>14</label>
        <nlm-citation citation-type="web">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>YS</given-names>
            </name>
          </person-group>
          <source>Maeil Business Newspaper</source>
          <access-date>2019-05-02</access-date>
          <comment>Occupational Injuries of Defense Personnel Doubled Over Two Years<ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://www.mk.co.kr/news/politics/view/2018/10/661495">https://www.mk.co.kr/news/politics/view/2018/10/661495</ext-link></comment>
        </nlm-citation>
      </ref>
      <ref id="ref15">
        <label>15</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Hwang</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Kim</surname>
              <given-names>HS</given-names>
            </name>
            <name name-style="western">
              <surname>Lee</surname>
              <given-names>SH</given-names>
            </name>
            <name name-style="western">
              <surname>Paik</surname>
              <given-names>NW</given-names>
            </name>
          </person-group>
          <article-title>A statistical study on industrial accidents in migrant workers in Seoul and Kyungin area</article-title>
          <source>J Korean Soc Occup Environ Hyg</source>
          <year>2006</year>
          <volume>16</volume>
          <issue>1</issue>
          <fpage>17</fpage>
          <lpage>26</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref16">
        <label>16</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Yi</surname>
              <given-names>KH</given-names>
            </name>
            <name name-style="western">
              <surname>Cho</surname>
              <given-names>HH</given-names>
            </name>
            <name name-style="western">
              <surname>You</surname>
              <given-names>KH</given-names>
            </name>
          </person-group>
          <article-title>The comparative study on the occupational injury rate and mortality rate of the total workers and foreign workers</article-title>
          <source>J Korean Soc Saf</source>
          <year>2012</year>
          <volume>27</volume>
          <issue>1</issue>
          <fpage>96</fpage>
          <lpage>104</lpage>
        </nlm-citation>
      </ref>
      <ref id="ref17">
        <label>17</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>JJ</given-names>
            </name>
            <name name-style="western">
              <surname>Perkins</surname>
              <given-names>R</given-names>
            </name>
            <name name-style="western">
              <surname>Liu</surname>
              <given-names>Z</given-names>
            </name>
            <name name-style="western">
              <surname>Ge</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Ding</surname>
              <given-names>Y</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>W</given-names>
            </name>
          </person-group>
          <article-title>A heuristic approach to determine an appropriate number of topics in topic modeling</article-title>
          <source>BMC Bioinformatics</source>
          <year>2015</year>
          <volume>16</volume>
          <issue>Suppl 13</issue>
          <fpage>S8</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-16-S13-S8"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-16-S13-S8</pub-id>
          <pub-id pub-id-type="medline">26424364</pub-id>
          <pub-id pub-id-type="pii">1471-2105-16-S13-S8</pub-id>
          <pub-id pub-id-type="pmcid">PMC4597325</pub-id>
        </nlm-citation>
      </ref>
      <ref id="ref18">
        <label>18</label>
        <nlm-citation citation-type="journal">
          <person-group person-group-type="author">
            <name name-style="western">
              <surname>Zhao</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Zou</surname>
              <given-names>W</given-names>
            </name>
            <name name-style="western">
              <surname>Chen</surname>
              <given-names>JJ</given-names>
            </name>
          </person-group>
          <article-title>Topic modeling for cluster analysis of large biological and medical datasets</article-title>
          <source>BMC Bioinformatics</source>
          <year>2014</year>
          <volume>15</volume>
          <issue>Suppl 11</issue>
          <fpage>S11</fpage>
          <comment>
            <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://bmcbioinformatics.biomedcentral.com/articles/10.1186/1471-2105-15-S11-S11"/>
          </comment>
          <pub-id pub-id-type="doi">10.1186/1471-2105-15-S11-S11</pub-id>
          <pub-id pub-id-type="medline">25350106</pub-id>
          <pub-id pub-id-type="pii">1471-2105-15-S11-S11</pub-id>
          <pub-id pub-id-type="pmcid">PMC4251039</pub-id>
        </nlm-citation>
      </ref>
    </ref-list>
  </back>
</article>
