<?xml version="1.0" encoding="UTF-8" ?>
<volume id="W14">
  <paper id="5400">
    <title>Proceedings of the Third Workshop on Vision and Language</title>
    <editor>Anja Belz</editor>
    <editor>Darren Cosker</editor>
    <editor>Frank Keller</editor>
    <editor>William Smith</editor>
    <editor>Kalina Bontcheva</editor>
    <editor>Sien Moens</editor>
    <editor>Alan Smeaton</editor>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <url>http://www.aclweb.org/anthology/W14-54</url>
    <bibtype>book</bibtype>
    <bibkey>VL:2014</bibkey>
  </paper>

  <paper id="5401">
    <title>The Effect of Sensor Errors in Situated Human-Computer Dialogue</title>
    <author><first>Niels</first><last>Sch&#252;tte</last></author>
    <author><first>John</first><last>Kelleher</last></author>
    <author><first>Brian</first><last>Mac Namee</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>1&#8211;8</pages>
    <url>http://www.aclweb.org/anthology/W14-5401</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>schutte-kelleher-macnamee:2014:VL</bibkey>
  </paper>

  <paper id="5402">
    <title>Joint Navigation in Commander/Robot Teams: Dialog &#38; Task Performance When Vision is Bandwidth-Limited</title>
    <author><first>Douglas</first><last>Summers-Stay</last></author>
    <author><first>Taylor</first><last>Cassidy</last></author>
    <author><first>Clare</first><last>Voss</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>9&#8211;16</pages>
    <url>http://www.aclweb.org/anthology/W14-5402</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>summersstay-cassidy-voss:2014:VL</bibkey>
  </paper>

  <paper id="5403">
    <title>TUHOI: Trento Universal Human Object Interaction Dataset</title>
    <author><first>Dieu-Thu</first><last>Le</last></author>
    <author><first>Jasper</first><last>Uijlings</last></author>
    <author><first>Raffaella</first><last>Bernardi</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>17&#8211;24</pages>
    <url>http://www.aclweb.org/anthology/W14-5403</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>le-uijlings-bernardi:2014:VL</bibkey>
  </paper>

  <paper id="5404">
    <title>Concept-oriented labelling of patent images based on Random Forests and proximity-driven generation of synthetic data</title>
    <author><first>Dimitris</first><last>Liparas</last></author>
    <author><first>Anastasia</first><last>Moumtzidou</last></author>
    <author><first>Stefanos</first><last>Vrochidis</last></author>
    <author><first>Ioannis</first><last>Kompatsiaris</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>25&#8211;32</pages>
    <url>http://www.aclweb.org/anthology/W14-5404</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>liparas-EtAl:2014:VL</bibkey>
  </paper>

  <paper id="5405">
    <title>Exploration of functional semantics of prepositions from corpora of descriptions of visual scenes</title>
    <author><first>Simon</first><last>Dobnik</last></author>
    <author><first>John</first><last>Kelleher</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>33&#8211;37</pages>
    <url>http://www.aclweb.org/anthology/W14-5405</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>dobnik-kelleher:2014:VL</bibkey>
  </paper>

  <paper id="5406">
    <title>A Poodle or a Dog? Evaluating Automatic Image Annotation Using Human Descriptions at Different Levels of Granularity</title>
    <author><first>Josiah</first><last>Wang</last></author>
    <author><first>Fei</first><last>Yan</last></author>
    <author><first>Ahmet</first><last>Aker</last></author>
    <author><first>Robert</first><last>Gaizauskas</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>38&#8211;45</pages>
    <url>http://www.aclweb.org/anthology/W14-5406</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>wang-EtAl:2014:VL</bibkey>
  </paper>

  <paper id="5407">
    <title>Key Event Detection in Video using ASR and Visual Data</title>
    <author><first>Niraj</first><last>Shrestha</last></author>
    <author><first>Aparna N.</first><last>Venkitasubramanian</last></author>
    <author><first>Marie-Francine</first><last>Moens</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>46&#8211;53</pages>
    <url>http://www.aclweb.org/anthology/W14-5407</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>shrestha-venkitasubramanian-moens:2014:VL</bibkey>
  </paper>

  <paper id="5408">
    <title>Twitter User Gender Inference Using Combined Analysis of Text and Image Processing</title>
    <author><first>Shigeyuki</first><last>Sakaki</last></author>
    <author><first>Yasuhide</first><last>Miura</last></author>
    <author><first>Xiaojun</first><last>Ma</last></author>
    <author><first>Keigo</first><last>Hattori</last></author>
    <author><first>Tomoko</first><last>Ohkuma</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>54&#8211;61</pages>
    <url>http://www.aclweb.org/anthology/W14-5408</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>sakaki-EtAl:2014:VL</bibkey>
  </paper>

  <paper id="5409">
    <title>Semantic and geometric enrichment of 3D geo-spatial models with captioned photos and labelled illustrations</title>
    <author><first>Chris</first><last>Jones</last></author>
    <author><first>Paul</first><last>Rosin</last></author>
    <author><first>Jonathan</first><last>Slade</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>62&#8211;67</pages>
    <url>http://www.aclweb.org/anthology/W14-5409</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>jones-rosin-slade:2014:VL</bibkey>
  </paper>

  <paper id="5410">
    <title>Weakly supervised construction of a repository of iconic images</title>
    <author><first>Lydia</first><last>Weiland</last></author>
    <author><first>Wolfgang</first><last>Effelsberg</last></author>
    <author><first>Simone Paolo</first><last>Ponzetto</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>68&#8211;73</pages>
    <url>http://www.aclweb.org/anthology/W14-5410</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>weiland-effelsberg-ponzetto:2014:VL</bibkey>
  </paper>

  <paper id="5411">
    <title>Cross-media Cross-genre Information Ranking based on Multi-media Information Networks</title>
    <author><first>Tongtao</first><last>Zhang</last></author>
    <author><first>Haibo</first><last>Li</last></author>
    <author><first>Hongzhao</first><last>Huang</last></author>
    <author><first>Heng</first><last>Ji</last></author>
    <author><first>Min-Hsuan</first><last>Tsai</last></author>
    <author><first>Shen-Fu</first><last>Tsai</last></author>
    <author><first>Thomas</first><last>Huang</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>74&#8211;81</pages>
    <url>http://www.aclweb.org/anthology/W14-5411</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>zhang-EtAl:2014:VL</bibkey>
  </paper>

  <paper id="5412">
    <title>Speech-accompanying gestures in Russian: functions and verbal context</title>
    <author><first>Yulia</first><last>Nikolaeva</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>82&#8211;86</pages>
    <url>http://www.aclweb.org/anthology/W14-5412</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>nikolaeva:2014:VL</bibkey>
  </paper>

  <paper id="5413">
    <title>DALES: Automated Tool for Detection, Annotation, Labelling, and Segmentation of Multiple Objects in Multi-Camera Video Streams</title>
    <author><first>Mohammad</first><last>Bhat</last></author>
    <author><first>Joanna Isabelle</first><last>Olszewska</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>87&#8211;94</pages>
    <url>http://www.aclweb.org/anthology/W14-5413</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>bhat-olszewska:2014:VL</bibkey>
  </paper>

  <paper id="5414">
    <title>A Hybrid Segmentation of Web Pages for Vibro-Tactile Access on Touch-Screen Devices</title>
    <author><first>Waseem</first><last>Safi</last></author>
    <author><first>Fabrice</first><last>Maurel</last></author>
    <author><first>Jean-Marc</first><last>Routoure</last></author>
    <author><first>Pierre</first><last>Beust</last></author>
    <author><first>Ga&#235;l</first><last>Dias</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>95&#8211;102</pages>
    <url>http://www.aclweb.org/anthology/W14-5414</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>safi-EtAl:2014:VL</bibkey>
  </paper>

  <paper id="5415">
    <title>Expression Recognition by Using Facial and Vocal Expressions</title>
    <author><first>Gholamreza</first><last>Anbarjafari</last></author>
    <author><first>Alvo</first><last>Aabloo</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>103&#8211;105</pages>
    <url>http://www.aclweb.org/anthology/W14-5415</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>anbarjafari-aabloo:2014:VL</bibkey>
  </paper>

  <paper id="5416">
    <title>Formulating Queries for Collecting Training Examples in Visual Concept Classification</title>
    <author><first>Kevin</first><last>McGuinness</last></author>
    <author><first>Feiyan</first><last>Hu</last></author>
    <author><first>Rami</first><last>Albatal</last></author>
    <author><first>Alan</first><last>Smeaton</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>106&#8211;108</pages>
    <url>http://www.aclweb.org/anthology/W14-5416</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>mcguinness-EtAl:2014:VL</bibkey>
  </paper>

  <paper id="5417">
    <title>Towards Succinct and Relevant Image Descriptions</title>
    <author><first>Desmond</first><last>Elliott</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>109&#8211;111</pages>
    <url>http://www.aclweb.org/anthology/W14-5417</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>elliott:2014:VL</bibkey>
  </paper>

  <paper id="5418">
    <title>Coloring Objects: Adjective-Noun Visual Semantic Compositionality</title>
    <author><first>Dat</first><last>Tien Nguyen</last></author>
    <author><first>Angeliki</first><last>Lazaridou</last></author>
    <author><first>Raffaella</first><last>Bernardi</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>112&#8211;114</pages>
    <url>http://www.aclweb.org/anthology/W14-5418</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>tiennguyen-lazaridou-bernardi:2014:VL</bibkey>
  </paper>

  <paper id="5419">
    <title>Multi-layered Image Representation for Image Interpretation</title>
    <author><first>Marina</first><last>Ivasic-Kos</last></author>
    <author><first>Miran</first><last>Pobar</last></author>
    <author><first>Ivo</first><last>Ipsic</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>115&#8211;117</pages>
    <url>http://www.aclweb.org/anthology/W14-5419</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>ivasickos-pobar-ipsic:2014:VL</bibkey>
  </paper>

  <paper id="5420">
    <title>The Last 10 Metres: Using Visual Analysis and Verbal Communication in Guiding Visually Impaired Smartphone Users to Entrances</title>
    <author><first>Anja</first><last>Belz</last></author>
    <author><first>Anil</first><last>Bharath</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>118&#8211;120</pages>
    <url>http://www.aclweb.org/anthology/W14-5420</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>belz-bharath:2014:VL</bibkey>
  </paper>

  <paper id="5421">
    <title>Keyphrase Extraction using Textual and Visual Features</title>
    <author><first>Yaakov</first><last>HaCohen-Kerner</last></author>
    <author><first>Stefanos</first><last>Vrochidis</last></author>
    <author><first>Dimitris</first><last>Liparas</last></author>
    <author><first>Anastasia</first><last>Moumtzidou</last></author>
    <author><first>Ioannis</first><last>Kompatsiaris</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>121&#8211;123</pages>
    <url>http://www.aclweb.org/anthology/W14-5421</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>hacohenkerner-EtAl:2014:VL</bibkey>
  </paper>

  <paper id="5422">
    <title>Towards automatic annotation of communicative gesturing</title>
    <author><first>Kristiina</first><last>Jokinen</last></author>
    <author><first>Graham</first><last>Wilcock</last></author>
    <booktitle>Proceedings of the Third Workshop on Vision and Language</booktitle>
    <month>August</month>
    <year>2014</year>
    <address>Dublin, Ireland</address>
    <publisher>Dublin City University and the Association for Computational Linguistics</publisher>
    <pages>124&#8211;125</pages>
    <url>http://www.aclweb.org/anthology/W14-5422</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>jokinen-wilcock:2014:VL</bibkey>
  </paper>

</volume>

