@inproceedings{wang-etal-2019-bigodm,
title = "{BIGODM} System in the Social Media Mining for Health Applications Shared Task 2019",
author = "Wang, Chen-Kai and
Dai, Hong-Jie and
Wang, Bo-Hung",
editor = "Weissenbacher, Davy and
Gonzalez-Hernandez, Graciela",
booktitle = "Proceedings of the Fourth Social Media Mining for Health Applications ({\#}SMM4H) Workshop {\&} Shared Task",
month = aug,
year = "2019",
address = "Florence, Italy",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/W19-3220",
doi = "10.18653/v1/W19-3220",
pages = "117--119",
abstract = "In this study, we describe our methods to automatically classify Twitter posts conveying events of adverse drug reaction (ADR). Based on our previous experience in tackling the ADR classification task, we empirically applied the vote-based under-sampling ensemble approach along with linear support vector machine (SVM) to develop our classifiers as part of our participation in ACL 2019 Social Media Mining for Health Applications (SMM4H) shared task 1. The best-performed model on the test sets were trained on a merged corpus consisting of the datasets released by SMM4H 2017 and 2019. By using VUE, the corpus was randomly under-sampled with 2:1 ratio between the negative and positive classes to create an ensemble using the linear kernel trained with features including bag-of-word, domain knowledge, negation and word embedding. The best performing model achieved an F-measure of 0.551 which is about 5{\%} higher than the average F-scores of 16 teams.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="wang-etal-2019-bigodm">
<titleInfo>
<title>BIGODM System in the Social Media Mining for Health Applications Shared Task 2019</title>
</titleInfo>
<name type="personal">
<namePart type="given">Chen-Kai</namePart>
<namePart type="family">Wang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Hong-Jie</namePart>
<namePart type="family">Dai</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Bo-Hung</namePart>
<namePart type="family">Wang</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2019-08</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the Fourth Social Media Mining for Health Applications (#SMM4H) Workshop & Shared Task</title>
</titleInfo>
<name type="personal">
<namePart type="given">Davy</namePart>
<namePart type="family">Weissenbacher</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Graciela</namePart>
<namePart type="family">Gonzalez-Hernandez</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Florence, Italy</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>In this study, we describe our methods to automatically classify Twitter posts conveying events of adverse drug reaction (ADR). Based on our previous experience in tackling the ADR classification task, we empirically applied the vote-based under-sampling ensemble approach along with linear support vector machine (SVM) to develop our classifiers as part of our participation in ACL 2019 Social Media Mining for Health Applications (SMM4H) shared task 1. The best-performed model on the test sets were trained on a merged corpus consisting of the datasets released by SMM4H 2017 and 2019. By using VUE, the corpus was randomly under-sampled with 2:1 ratio between the negative and positive classes to create an ensemble using the linear kernel trained with features including bag-of-word, domain knowledge, negation and word embedding. The best performing model achieved an F-measure of 0.551 which is about 5% higher than the average F-scores of 16 teams.</abstract>
<identifier type="citekey">wang-etal-2019-bigodm</identifier>
<identifier type="doi">10.18653/v1/W19-3220</identifier>
<location>
<url>https://aclanthology.org/W19-3220</url>
</location>
<part>
<date>2019-08</date>
<extent unit="page">
<start>117</start>
<end>119</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T BIGODM System in the Social Media Mining for Health Applications Shared Task 2019
%A Wang, Chen-Kai
%A Dai, Hong-Jie
%A Wang, Bo-Hung
%Y Weissenbacher, Davy
%Y Gonzalez-Hernandez, Graciela
%S Proceedings of the Fourth Social Media Mining for Health Applications (#SMM4H) Workshop & Shared Task
%D 2019
%8 August
%I Association for Computational Linguistics
%C Florence, Italy
%F wang-etal-2019-bigodm
%X In this study, we describe our methods to automatically classify Twitter posts conveying events of adverse drug reaction (ADR). Based on our previous experience in tackling the ADR classification task, we empirically applied the vote-based under-sampling ensemble approach along with linear support vector machine (SVM) to develop our classifiers as part of our participation in ACL 2019 Social Media Mining for Health Applications (SMM4H) shared task 1. The best-performed model on the test sets were trained on a merged corpus consisting of the datasets released by SMM4H 2017 and 2019. By using VUE, the corpus was randomly under-sampled with 2:1 ratio between the negative and positive classes to create an ensemble using the linear kernel trained with features including bag-of-word, domain knowledge, negation and word embedding. The best performing model achieved an F-measure of 0.551 which is about 5% higher than the average F-scores of 16 teams.
%R 10.18653/v1/W19-3220
%U https://aclanthology.org/W19-3220
%U https://doi.org/10.18653/v1/W19-3220
%P 117-119
Markdown (Informal)
[BIGODM System in the Social Media Mining for Health Applications Shared Task 2019](https://aclanthology.org/W19-3220) (Wang et al., ACL 2019)
ACL