@inproceedings{gabud-etal-2023-hybrid,
title = "A Hybrid of Rule-based and Transformer-based Approaches for Relation Extraction in Biodiversity Literature",
author = "Gabud, Roselyn and
Lapitan, Portia and
Mariano, Vladimir and
Mendoza, Eduardo and
Pampolina, Nelson and
Clari{\~n}o, Maria Art Antonette and
Batista-Navarro, Riza",
editor = "Surdeanu, Mihai and
Riloff, Ellen and
Chiticariu, Laura and
Freitag, Dayne and
Hahn-Powell, Gus and
Morrison, Clayton T. and
Noriega-Atala, Enrique and
Sharp, Rebecca and
Valenzuela-Escarcega, Marco",
booktitle = "Proceedings of the 2nd Workshop on Pattern-based Approaches to NLP in the Age of Deep Learning",
month = dec,
year = "2023",
address = "Singapore",
publisher = "Association for Computational Linguistics",
url = "https://aclanthology.org/2023.pandl-1.10",
doi = "10.18653/v1/2023.pandl-1.10",
pages = "103--113",
abstract = "Relation extraction (RE) is one of the tasks behind many relevant natural language processing (NLP) applications. Exploiting the information hidden in millions of scholarly articles by leveraging NLP, specifically RE, systems could benefit studies in specialized domains, e.g. biomedicine and biodiversity. Although deep learning (DL)-based methods have shown state-of-the-art performance in many NLP tasks including RE, DL for domain-specific RE systems has been hindered by the lack of expert-labeled datasets which are typically required to train such methods. In this paper, we take advantage of the zero-shot (i.e., not requiring any labeled data) capability of pattern-based methods for RE using a rule-based approach, combined with templates for natural language inference (NLI) transformer models. We present our hybrid method for RE that exploits the advantages of both methods, i.e., interpretability of rules and transferability of transformers. Evaluated on a corpus of biodiversity literature with annotated relations, our hybrid method demonstrated an improvement of up to 15 percentage points in recall and best performance over solely rule-based and transformer-based methods with F1-scores ranging from 89.61{\%} to 96.75{\%} for reproductive condition - temporal expression relations, and ranging from 85.39{\%} to 89.90{\%} for habitat - geographic location relations.",
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="gabud-etal-2023-hybrid">
<titleInfo>
<title>A Hybrid of Rule-based and Transformer-based Approaches for Relation Extraction in Biodiversity Literature</title>
</titleInfo>
<name type="personal">
<namePart type="given">Roselyn</namePart>
<namePart type="family">Gabud</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Portia</namePart>
<namePart type="family">Lapitan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Vladimir</namePart>
<namePart type="family">Mariano</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Eduardo</namePart>
<namePart type="family">Mendoza</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Nelson</namePart>
<namePart type="family">Pampolina</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Maria</namePart>
<namePart type="given">Art</namePart>
<namePart type="given">Antonette</namePart>
<namePart type="family">Clariño</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Riza</namePart>
<namePart type="family">Batista-Navarro</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2023-12</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<relatedItem type="host">
<titleInfo>
<title>Proceedings of the 2nd Workshop on Pattern-based Approaches to NLP in the Age of Deep Learning</title>
</titleInfo>
<name type="personal">
<namePart type="given">Mihai</namePart>
<namePart type="family">Surdeanu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Ellen</namePart>
<namePart type="family">Riloff</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Laura</namePart>
<namePart type="family">Chiticariu</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Dayne</namePart>
<namePart type="family">Freitag</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Gus</namePart>
<namePart type="family">Hahn-Powell</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Clayton</namePart>
<namePart type="given">T</namePart>
<namePart type="family">Morrison</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Enrique</namePart>
<namePart type="family">Noriega-Atala</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Rebecca</namePart>
<namePart type="family">Sharp</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Marco</namePart>
<namePart type="family">Valenzuela-Escarcega</namePart>
<role>
<roleTerm authority="marcrelator" type="text">editor</roleTerm>
</role>
</name>
<originInfo>
<publisher>Association for Computational Linguistics</publisher>
<place>
<placeTerm type="text">Singapore</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">conference publication</genre>
</relatedItem>
<abstract>Relation extraction (RE) is one of the tasks behind many relevant natural language processing (NLP) applications. Exploiting the information hidden in millions of scholarly articles by leveraging NLP, specifically RE, systems could benefit studies in specialized domains, e.g. biomedicine and biodiversity. Although deep learning (DL)-based methods have shown state-of-the-art performance in many NLP tasks including RE, DL for domain-specific RE systems has been hindered by the lack of expert-labeled datasets which are typically required to train such methods. In this paper, we take advantage of the zero-shot (i.e., not requiring any labeled data) capability of pattern-based methods for RE using a rule-based approach, combined with templates for natural language inference (NLI) transformer models. We present our hybrid method for RE that exploits the advantages of both methods, i.e., interpretability of rules and transferability of transformers. Evaluated on a corpus of biodiversity literature with annotated relations, our hybrid method demonstrated an improvement of up to 15 percentage points in recall and best performance over solely rule-based and transformer-based methods with F1-scores ranging from 89.61% to 96.75% for reproductive condition - temporal expression relations, and ranging from 85.39% to 89.90% for habitat - geographic location relations.</abstract>
<identifier type="citekey">gabud-etal-2023-hybrid</identifier>
<identifier type="doi">10.18653/v1/2023.pandl-1.10</identifier>
<location>
<url>https://aclanthology.org/2023.pandl-1.10</url>
</location>
<part>
<date>2023-12</date>
<extent unit="page">
<start>103</start>
<end>113</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Conference Proceedings
%T A Hybrid of Rule-based and Transformer-based Approaches for Relation Extraction in Biodiversity Literature
%A Gabud, Roselyn
%A Lapitan, Portia
%A Mariano, Vladimir
%A Mendoza, Eduardo
%A Pampolina, Nelson
%A Clariño, Maria Art Antonette
%A Batista-Navarro, Riza
%Y Surdeanu, Mihai
%Y Riloff, Ellen
%Y Chiticariu, Laura
%Y Freitag, Dayne
%Y Hahn-Powell, Gus
%Y Morrison, Clayton T.
%Y Noriega-Atala, Enrique
%Y Sharp, Rebecca
%Y Valenzuela-Escarcega, Marco
%S Proceedings of the 2nd Workshop on Pattern-based Approaches to NLP in the Age of Deep Learning
%D 2023
%8 December
%I Association for Computational Linguistics
%C Singapore
%F gabud-etal-2023-hybrid
%X Relation extraction (RE) is one of the tasks behind many relevant natural language processing (NLP) applications. Exploiting the information hidden in millions of scholarly articles by leveraging NLP, specifically RE, systems could benefit studies in specialized domains, e.g. biomedicine and biodiversity. Although deep learning (DL)-based methods have shown state-of-the-art performance in many NLP tasks including RE, DL for domain-specific RE systems has been hindered by the lack of expert-labeled datasets which are typically required to train such methods. In this paper, we take advantage of the zero-shot (i.e., not requiring any labeled data) capability of pattern-based methods for RE using a rule-based approach, combined with templates for natural language inference (NLI) transformer models. We present our hybrid method for RE that exploits the advantages of both methods, i.e., interpretability of rules and transferability of transformers. Evaluated on a corpus of biodiversity literature with annotated relations, our hybrid method demonstrated an improvement of up to 15 percentage points in recall and best performance over solely rule-based and transformer-based methods with F1-scores ranging from 89.61% to 96.75% for reproductive condition - temporal expression relations, and ranging from 85.39% to 89.90% for habitat - geographic location relations.
%R 10.18653/v1/2023.pandl-1.10
%U https://aclanthology.org/2023.pandl-1.10
%U https://doi.org/10.18653/v1/2023.pandl-1.10
%P 103-113
Markdown (Informal)
[A Hybrid of Rule-based and Transformer-based Approaches for Relation Extraction in Biodiversity Literature](https://aclanthology.org/2023.pandl-1.10) (Gabud et al., PANDL-WS 2023)
ACL