% LREC 2012 paper on RIDIRE-CPI (ACL Anthology identifier L12-1309).
@inproceedings{PANUNZI12.548.L12-1309,
    author    = {Panunzi, Alessandro and Fabbri, Marco and Moneglia, Massimo and Gregori, Lorenzo and Paladini, Samuele},
    title     = {{RIDIRE-CPI}: an Open Source Crawling and Processing Infrastructure for Supervised Web-Corpora Building},
    booktitle = {Proceedings of the Eighth International Conference on Language Resources and Evaluation ({LREC-2012})},
    editor    = {Calzolari, Nicoletta and Choukri, Khalid and Declerck, Thierry and Do{\u{g}}an, Mehmet U{\u{g}}ur and Maegaard, Bente and Mariani, Joseph and Odijk, Jan and Piperidis, Stelios},
    publisher = {European Language Resources Association (ELRA)},
    address   = {Istanbul, Turkey},
    year      = {2012},
    month     = may,
    pages     = {2274--2279},
    isbn      = {978-2-9517408-7-7},
    language  = {English},
    url       = {http://www.lrec-conf.org/proceedings/lrec2012/pdf/548_Paper.pdf},
    note      = {ACL Anthology Identifier: L12-1309},
}
