<?xml version="1.0" encoding="UTF-8" ?>
<volume id="W14">
  <!-- Volume-level record for the proceedings as a whole: bibtype "book",
       with editors listed in place of authors. Non-ASCII characters are
       written as numeric character references (&#228; = a-umlaut), the same
       form the second editor's surname takes in the author list of paper 0402. -->
  <paper id="0400">
    <title>Proceedings of the 9th Web as Corpus Workshop (WaC-9)</title>
    <editor><first>Felix</first><last>Bildhauer</last></editor>
    <editor><first>Roland</first><last>Sch&#228;fer</last></editor>
    <month>April</month>
    <year>2014</year>
    <address>Gothenburg, Sweden</address>
    <publisher>Association for Computational Linguistics</publisher>
    <url>http://www.aclweb.org/anthology/W14-04</url>
    <bibtype>book</bibtype>
    <bibkey>WaC9:2014</bibkey>
  </paper>

  <!-- W14-0401: single-author paper. In the pages element, &#8211; is an
       en dash (U+2013), so the range reads 1 to 8. -->
  <paper id="0401">
    <title>Finding Viable Seed URLs for Web Corpora: A Scouting Approach and Comparative Study of Available Sources</title>
    <author><first>Adrien</first><last>Barbaresi</last></author>
    <booktitle>Proceedings of the 9th Web as Corpus Workshop (WaC-9)</booktitle>
    <month>April</month>
    <year>2014</year>
    <address>Gothenburg, Sweden</address>
    <publisher>Association for Computational Linguistics</publisher>
    <pages>1&#8211;8</pages>
    <url>http://www.aclweb.org/anthology/W14-0401</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>barbaresi:2014:WaC9</bibkey>
  </paper>

  <!-- W14-0402: three authors. &#228; in the first author's surname is
       a-umlaut (Schäfer); the bibkey uses the ASCII spelling "schafer"
       and names all three authors. -->
  <paper id="0402">
    <title>Focused Web Corpus Crawling</title>
    <author><first>Roland</first><last>Sch&#228;fer</last></author>
    <author><first>Adrien</first><last>Barbaresi</last></author>
    <author><first>Felix</first><last>Bildhauer</last></author>
    <booktitle>Proceedings of the 9th Web as Corpus Workshop (WaC-9)</booktitle>
    <month>April</month>
    <year>2014</year>
    <address>Gothenburg, Sweden</address>
    <publisher>Association for Computational Linguistics</publisher>
    <pages>9&#8211;15</pages>
    <url>http://www.aclweb.org/anthology/W14-0402</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>schafer-barbaresi-bildhauer:2014:WaC9</bibkey>
  </paper>

  <!-- W14-0403: single-author paper. &#252; is u-umlaut (Stührenberg);
       the bibkey uses the ASCII spelling "stuhrenberg". -->
  <paper id="0403">
    <title>Less Destructive Cleaning of Web Documents by Using Standoff Annotation</title>
    <author><first>Maik</first><last>St&#252;hrenberg</last></author>
    <booktitle>Proceedings of the 9th Web as Corpus Workshop (WaC-9)</booktitle>
    <month>April</month>
    <year>2014</year>
    <address>Gothenburg, Sweden</address>
    <publisher>Association for Computational Linguistics</publisher>
    <pages>16&#8211;21</pages>
    <url>http://www.aclweb.org/anthology/W14-0403</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>stuhrenberg:2014:WaC9</bibkey>
  </paper>

  <!-- W14-0404: five authors. Character references decode as
       &#231; = ç (Avanço, Graça) and &#237; = í (Aluísio).
       The bibkey names only the first author, with the two-word surname
       joined as "sanchesduran", followed by "EtAl". -->
  <paper id="0404">
    <title>Some Issues on the Normalization of a Corpus of Products Reviews in Portuguese</title>
    <author><first>Magali</first><last>Sanches Duran</last></author>
    <author><first>Lucas</first><last>Avan&#231;o</last></author>
    <author><first>Sandra</first><last>Alu&#237;sio</last></author>
    <author><first>Thiago</first><last>Pardo</last></author>
    <author><first>Maria da Gra&#231;a</first><last>Volpe Nunes</last></author>
    <booktitle>Proceedings of the 9th Web as Corpus Workshop (WaC-9)</booktitle>
    <month>April</month>
    <year>2014</year>
    <address>Gothenburg, Sweden</address>
    <publisher>Association for Computational Linguistics</publisher>
    <pages>22&#8211;28</pages>
    <url>http://www.aclweb.org/anthology/W14-0404</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>sanchesduran-EtAl:2014:WaC9</bibkey>
  </paper>

  <!-- W14-0405: two authors. This record uses hexadecimal character
       references: &#x161; = š, &#x107; = ć, &#x10D; = č
       (Ljubešić, Klubička).
       NOTE(review): the bibkey spells the caron letters as "vs" and "vc";
       this looks like a LaTeX-style transliteration (TODO confirm). Treat
       the bibkey as an opaque identifier rather than correcting it. -->
  <paper id="0405">
    <title>{bs,hr,sr}WaC - Web Corpora of Bosnian, Croatian and Serbian</title>
    <author><first>Nikola</first><last>Ljube&#x161;i&#x107;</last></author>
    <author><first>Filip</first><last>Klubi&#x10D;ka</last></author>
    <booktitle>Proceedings of the 9th Web as Corpus Workshop (WaC-9)</booktitle>
    <month>April</month>
    <year>2014</year>
    <address>Gothenburg, Sweden</address>
    <publisher>Association for Computational Linguistics</publisher>
    <pages>29&#8211;35</pages>
    <url>http://www.aclweb.org/anthology/W14-0405</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>ljubevsic-klubivcka:2014:WaC9</bibkey>
  </paper>

  <!-- W14-0406: nine authors. &#192; in the title is A-grave (PAISÀ).
       The apostrophe in "Dell'Orletta" is legal unescaped in element text.
       The bibkey names only the first author, followed by "EtAl". -->
  <paper id="0406">
    <title>The PAIS&#192; Corpus of Italian Web Texts</title>
    <author><first>Verena</first><last>Lyding</last></author>
    <author><first>Egon</first><last>Stemle</last></author>
    <author><first>Claudia</first><last>Borghetti</last></author>
    <author><first>Marco</first><last>Brunello</last></author>
    <author><first>Sara</first><last>Castagnoli</last></author>
    <author><first>Felice</first><last>Dell'Orletta</last></author>
    <author><first>Henrik</first><last>Dittmann</last></author>
    <author><first>Alessandro</first><last>Lenci</last></author>
    <author><first>Vito</first><last>Pirrelli</last></author>
    <booktitle>Proceedings of the 9th Web as Corpus Workshop (WaC-9)</booktitle>
    <month>April</month>
    <year>2014</year>
    <address>Gothenburg, Sweden</address>
    <publisher>Association for Computational Linguistics</publisher>
    <pages>36&#8211;43</pages>
    <url>http://www.aclweb.org/anthology/W14-0406</url>
    <bibtype>inproceedings</bibtype>
    <bibkey>lyding-EtAl:2014:WaC9</bibkey>
  </paper>

</volume>

