% Barbaresi (2014), WaC-9 workshop paper on finding seed URLs for web corpora; ACL Anthology ID W14-0401.
@InProceedings{barbaresi:2014:WaC9,
  author    = {Barbaresi, Adrien},
  title     = {Finding Viable Seed {URLs} for Web Corpora: A Scouting Approach and Comparative Study of Available Sources},
  booktitle = {Proceedings of the 9th Web as Corpus Workshop ({WaC-9})},
  month     = apr,
  year      = {2014},
  address   = {Gothenburg, Sweden},
  publisher = {Association for Computational Linguistics},
  pages     = {1--8},
  url       = {http://www.aclweb.org/anthology/W14-0401},
}

