% Kaplan, Rubens, Teufel and Tokunaga (LREC 2016): model-free active learning
% for phenomena-driven corpus construction; introduces the MOVE tool.
% Acronyms are brace-protected so sentence-casing styles keep them uppercase;
% month uses the predefined macro so styles can abbreviate/localize it.
@inproceedings{L16-1697,
 abstract = {Active learning (AL) is often used in corpus construction (CC) for selecting ``informative'' documents for annotation. This is ideal for focusing annotation efforts when all documents cannot be annotated, but has the limitation that it is carried out in a closed-loop, selecting points that will improve an existing model. For phenomena-driven and exploratory CC, the lack of existing-models and specific task(s) for using it make traditional AL inapplicable. In this paper we propose a novel method for model-free AL utilising characteristics of phenomena for applying AL to select documents for annotation. The method can also supplement traditional closed-loop AL-based CC to extend the utility of the corpus created beyond a single task. We introduce our tool, MOVE, and show its potential with a real world case-study.},
 address = {Portorož, Slovenia},
 author = {Kaplan, Dain and Rubens, Neil and Teufel, Simone and Tokunaga, Takenobu},
 booktitle = {Proceedings of the Tenth International Conference on Language Resources and Evaluation ({LREC} 2016)},
 month = may,
 pages = {4402--4409},
 publisher = {European Language Resources Association (ELRA)},
 title = {Solving the {AL} Chicken-and-Egg Corpus and Model Problem: Model-free Active Learning for Phenomena-driven Corpus Construction},
 url = {https://www.aclweb.org/anthology/L16-1697},
 year = {2016}
}

