@article{sachan-etal-2019-discourse,
title = "Discourse in Multimedia: A Case Study in Extracting Geometry Knowledge from Textbooks",
author = "Sachan, Mrinmaya and
Dubey, Avinava and
Hovy, Eduard H. and
Mitchell, Tom M. and
Roth, Dan and
Xing, Eric P.",
journal = "Computational Linguistics",
volume = "45",
number = "4",
month = dec,
year = "2019",
address = "Cambridge, MA",
publisher = "MIT Press",
url = "https://aclanthology.org/J19-4002/",
doi = "10.1162/coli_a_00360",
pages = "627--665",
abstract = "To ensure readability, text is often written and presented with due formatting. These text formatting devices help the writer to effectively convey the narrative. At the same time, these help the readers pick up the structure of the discourse and comprehend the conveyed information. There have been a number of linguistic theories on discourse structure of text. However, these theories only consider unformatted text. Multimedia text contains rich formatting features that can be leveraged for various NLP tasks. In this article, we study some of these discourse features in multimedia text and what communicative function they fulfill in the context. As a case study, we use these features to harvest structured subject knowledge of geometry from textbooks. We conclude that the discourse and text layout features provide information that is complementary to lexical semantic information. Finally, we show that the harvested structured knowledge can be used to improve an existing solver for geometry problems, making it more accurate as well as more explainable."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="sachan-etal-2019-discourse">
<titleInfo>
<title>Discourse in Multimedia: A Case Study in Extracting Geometry Knowledge from Textbooks</title>
</titleInfo>
<name type="personal">
<namePart type="given">Mrinmaya</namePart>
<namePart type="family">Sachan</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Avinava</namePart>
<namePart type="family">Dubey</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Eduard</namePart>
<namePart type="given">H</namePart>
<namePart type="family">Hovy</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Tom</namePart>
<namePart type="given">M</namePart>
<namePart type="family">Mitchell</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Dan</namePart>
<namePart type="family">Roth</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Eric</namePart>
<namePart type="given">P</namePart>
<namePart type="family">Xing</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2019-12</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<genre authority="bibutilsgt">journal article</genre>
<relatedItem type="host">
<titleInfo>
<title>Computational Linguistics</title>
</titleInfo>
<originInfo>
<issuance>continuing</issuance>
<publisher>MIT Press</publisher>
<place>
<placeTerm type="text">Cambridge, MA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">periodical</genre>
<genre authority="bibutilsgt">academic journal</genre>
</relatedItem>
<abstract>To ensure readability, text is often written and presented with due formatting. These text formatting devices help the writer to effectively convey the narrative. At the same time, these help the readers pick up the structure of the discourse and comprehend the conveyed information. There have been a number of linguistic theories on discourse structure of text. However, these theories only consider unformatted text. Multimedia text contains rich formatting features that can be leveraged for various NLP tasks. In this article, we study some of these discourse features in multimedia text and what communicative function they fulfill in the context. As a case study, we use these features to harvest structured subject knowledge of geometry from textbooks. We conclude that the discourse and text layout features provide information that is complementary to lexical semantic information. Finally, we show that the harvested structured knowledge can be used to improve an existing solver for geometry problems, making it more accurate as well as more explainable.</abstract>
<identifier type="citekey">sachan-etal-2019-discourse</identifier>
<identifier type="doi">10.1162/coli_a_00360</identifier>
<location>
<url>https://aclanthology.org/J19-4002/</url>
</location>
<part>
<date>2019-12</date>
<detail type="volume"><number>45</number></detail>
<detail type="issue"><number>4</number></detail>
<extent unit="page">
<start>627</start>
<end>665</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Journal Article
%T Discourse in Multimedia: A Case Study in Extracting Geometry Knowledge from Textbooks
%A Sachan, Mrinmaya
%A Dubey, Avinava
%A Hovy, Eduard H.
%A Mitchell, Tom M.
%A Roth, Dan
%A Xing, Eric P.
%J Computational Linguistics
%D 2019
%8 December
%V 45
%N 4
%I MIT Press
%C Cambridge, MA
%F sachan-etal-2019-discourse
%X To ensure readability, text is often written and presented with due formatting. These text formatting devices help the writer to effectively convey the narrative. At the same time, these help the readers pick up the structure of the discourse and comprehend the conveyed information. There have been a number of linguistic theories on discourse structure of text. However, these theories only consider unformatted text. Multimedia text contains rich formatting features that can be leveraged for various NLP tasks. In this article, we study some of these discourse features in multimedia text and what communicative function they fulfill in the context. As a case study, we use these features to harvest structured subject knowledge of geometry from textbooks. We conclude that the discourse and text layout features provide information that is complementary to lexical semantic information. Finally, we show that the harvested structured knowledge can be used to improve an existing solver for geometry problems, making it more accurate as well as more explainable.
%R 10.1162/coli_a_00360
%U https://aclanthology.org/J19-4002/
%U https://doi.org/10.1162/coli_a_00360
%P 627-665
Markdown (Informal)
[Discourse in Multimedia: A Case Study in Extracting Geometry Knowledge from Textbooks](https://aclanthology.org/J19-4002/) (Sachan et al., CL 2019)
ACL