@article{kuznetsova-etal-2014-treetalk,
title = "{T}ree{T}alk: Composition and Compression of Trees for Image Descriptions",
author = "Kuznetsova, Polina and
Ordonez, Vicente and
Berg, Tamara L. and
Choi, Yejin",
editor = "Lin, Dekang and
Collins, Michael and
Lee, Lillian",
journal = "Transactions of the Association for Computational Linguistics",
volume = "2",
year = "2014",
address = "Cambridge, MA",
publisher = "MIT Press",
url = "https://aclanthology.org/Q14-1028/",
doi = "10.1162/tacl_a_00188",
pages = "351--362",
abstract = "We present a new tree based approach to composing expressive image descriptions that makes use of naturally occuring web images with captions. We investigate two related tasks: image caption generalization and generation, where the former is an optional subtask of the latter. The high-level idea of our approach is to harvest expressive phrases (as tree fragments) from existing image descriptions, then to compose a new description by selectively combining the extracted (and optionally pruned) tree fragments. Key algorithmic components are tree composition and compression, both integrating tree structure with sequence structure. Our proposed system attains significantly better performance than previous approaches for both image caption generalization and generation. In addition, our work is the first to show the empirical benefit of automatically generalized captions for composing natural image descriptions."
}
<?xml version="1.0" encoding="UTF-8"?>
<modsCollection xmlns="http://www.loc.gov/mods/v3">
<mods ID="kuznetsova-etal-2014-treetalk">
<titleInfo>
<title>TreeTalk: Composition and Compression of Trees for Image Descriptions</title>
</titleInfo>
<name type="personal">
<namePart type="given">Polina</namePart>
<namePart type="family">Kuznetsova</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Vicente</namePart>
<namePart type="family">Ordonez</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Tamara</namePart>
<namePart type="given">L</namePart>
<namePart type="family">Berg</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<name type="personal">
<namePart type="given">Yejin</namePart>
<namePart type="family">Choi</namePart>
<role>
<roleTerm authority="marcrelator" type="text">author</roleTerm>
</role>
</name>
<originInfo>
<dateIssued>2014</dateIssued>
</originInfo>
<typeOfResource>text</typeOfResource>
<genre authority="bibutilsgt">journal article</genre>
<relatedItem type="host">
<titleInfo>
<title>Transactions of the Association for Computational Linguistics</title>
</titleInfo>
<originInfo>
<issuance>continuing</issuance>
<publisher>MIT Press</publisher>
<place>
<placeTerm type="text">Cambridge, MA</placeTerm>
</place>
</originInfo>
<genre authority="marcgt">periodical</genre>
<genre authority="bibutilsgt">academic journal</genre>
</relatedItem>
<abstract>We present a new tree based approach to composing expressive image descriptions that makes use of naturally occuring web images with captions. We investigate two related tasks: image caption generalization and generation, where the former is an optional subtask of the latter. The high-level idea of our approach is to harvest expressive phrases (as tree fragments) from existing image descriptions, then to compose a new description by selectively combining the extracted (and optionally pruned) tree fragments. Key algorithmic components are tree composition and compression, both integrating tree structure with sequence structure. Our proposed system attains significantly better performance than previous approaches for both image caption generalization and generation. In addition, our work is the first to show the empirical benefit of automatically generalized captions for composing natural image descriptions.</abstract>
<identifier type="citekey">kuznetsova-etal-2014-treetalk</identifier>
<identifier type="doi">10.1162/tacl_a_00188</identifier>
<location>
<url>https://aclanthology.org/Q14-1028/</url>
</location>
<part>
<date>2014</date>
<detail type="volume"><number>2</number></detail>
<extent unit="page">
<start>351</start>
<end>362</end>
</extent>
</part>
</mods>
</modsCollection>
%0 Journal Article
%T TreeTalk: Composition and Compression of Trees for Image Descriptions
%A Kuznetsova, Polina
%A Ordonez, Vicente
%A Berg, Tamara L.
%A Choi, Yejin
%J Transactions of the Association for Computational Linguistics
%D 2014
%V 2
%I MIT Press
%C Cambridge, MA
%F kuznetsova-etal-2014-treetalk
%X We present a new tree based approach to composing expressive image descriptions that makes use of naturally occuring web images with captions. We investigate two related tasks: image caption generalization and generation, where the former is an optional subtask of the latter. The high-level idea of our approach is to harvest expressive phrases (as tree fragments) from existing image descriptions, then to compose a new description by selectively combining the extracted (and optionally pruned) tree fragments. Key algorithmic components are tree composition and compression, both integrating tree structure with sequence structure. Our proposed system attains significantly better performance than previous approaches for both image caption generalization and generation. In addition, our work is the first to show the empirical benefit of automatically generalized captions for composing natural image descriptions.
%R 10.1162/tacl_a_00188
%U https://aclanthology.org/Q14-1028/
%U https://doi.org/10.1162/tacl_a_00188
%P 351-362
Markdown (Informal)
[TreeTalk: Composition and Compression of Trees for Image Descriptions](https://aclanthology.org/Q14-1028/) (Kuznetsova et al., TACL 2014)
ACL