<?xml version="1.0" encoding="UTF-16"?>

<!--XML document generated using OCR technology from Nuance Communications, Inc.-->

<document xmlns="http://www.scansoft.com/omnipage/xml/ssdoc-schema3.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4314.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1433" marginTop="1240" marginRight="1378" marginBottom="358" offsetX="-26" offsetY="32" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1433" t="1240" r="10531" b="4092">

<column l="1433" t="1240" r="10531" b="4092">

<para l="1670" t="1306" r="10277" b="1886" alignment="centered" spaceBefore="17" lsp="exactly" lspExact="322" language="en">

<ln l="1670" t="1306" r="10277" b="1570" baseLine="1502" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1670" t="1306" r="3418" b="1517">DCU-ADAPT:</wd>

<space/>

<wd l="3518" t="1306" r="4637" b="1570">Learning</wd>

<space/>

<wd l="4714" t="1306" r="5237" b="1512">Edit</wd>

<space/>

<wd l="5318" t="1306" r="6677" b="1570">Operations</wd>

<space/>

<wd l="6754" t="1306" r="7109" b="1512">for</wd>

<space/>

<wd l="7186" t="1306" r="8448" b="1570">Microblog</wd>

<space/>

<wd l="8525" t="1306" r="10277" b="1517">Normalisation
</wd>

</ln>

<ln l="3998" t="1622" r="7954" b="1886" baseLine="1824" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3998" t="1622" r="4531" b="1829">with</wd>

<space/>

<wd l="4613" t="1627" r="4987" b="1829">the</wd>

<space/>

<wd l="5074" t="1622" r="6523" b="1834">Generalised</wd>

<space/>

<wd l="6600" t="1627" r="7954" b="1886">Perceptron</wd>

</ln>

</para>

<para l="3576" t="2117" r="8371" b="3739" alignment="centered" spaceBefore="179" spaceAfter="341" lsp="exactly" lspExact="278" language="en">

<ln l="4046" t="2117" r="7906" b="2338" baseLine="2280" forcedEOF="true">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4046" t="2117" r="4901" b="2309">Joachim</wd>

<space/>

<wd l="4963" t="2122" r="5770" b="2338">Wagner</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5894" t="2122" r="6235" b="2290">and</wd>

<space/>

</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6355" t="2117" r="7200" b="2309">Jennifer</wd>

<space/>

<wd l="7262" t="2122" r="7906" b="2290">Foster
</wd>

</run>

</ln>

<ln l="5232" t="2395" r="6715" b="2568" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="5232" t="2400" r="6019" b="2563">ADAPT</wd>

<space/>

<wd l="6086" t="2400" r="6715" b="2568">Centre
</wd>

</ln>

<ln l="4954" t="2674" r="6998" b="2894" baseLine="2837" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="4954" t="2678" r="5606" b="2846">School</wd>

<space/>

<wd l="5674" t="2678" r="5885" b="2846">of</wd>

<space/>

<wd l="5933" t="2678" r="6998" b="2894">Computing
</wd>

</ln>

<ln l="4877" t="2952" r="7070" b="3173" baseLine="3115" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="4877" t="2957" r="5544" b="3125">Dublin</wd>

<space/>

<wd l="5606" t="2957" r="6010" b="3173">City</wd>

<space/>

<wd l="6072" t="2957" r="7070" b="3173">University
</wd>

</ln>

<ln l="5246" t="3230" r="6706" b="3432" baseLine="3394" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="5246" t="3235" r="5957" b="3432">Dublin,</wd>

<space/>

<wd l="6029" t="3235" r="6706" b="3403">Ireland
</wd>

</ln>

<ln l="3576" t="3494" r="8371" b="3739" baseLine="3677" forcedEOF="true">

<wd l="3576" t="3494" r="8371" b="3739"><run underlined="none" subsuperscript="none" fontSize="1400" fontFace="Courier New" fontFamily="swiss" fontPitch="variable" spacing="0">{</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">jwagner|jfoster</run>

<run underlined="none" subsuperscript="none" fontSize="1400" fontFace="Courier New" fontFamily="swiss" fontPitch="variable" spacing="0">}</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">@computing.dcu.ie</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<section l="1433" t="4092" r="10531" b="15317">

<column l="1433" t="4092" r="5820" b="15317">

<para l="3178" t="4142" r="4070" b="4315" alignment="centered" spaceBefore="3" lsp="exactly" lspExact="273" language="en">

<ln l="3178" t="4142" r="4070" b="4315" baseLine="4306" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3178" t="4142" r="4070" b="4315">Abstract</wd>

</ln>

</para>

<para l="1781" t="4546" r="5467" b="10982" alignment="justified" li="288" ri="360" spaceBefore="116" lsp="exactly" lspExact="271" language="en">

<ln l="1781" t="4546" r="5462" b="4747" baseLine="4699" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="4550" r="2064" b="4704">We</wd>

<space/>

<wd l="2155" t="4546" r="2875" b="4704">describe</wd>

<space/>

<wd l="2962" t="4546" r="3226" b="4704">the</wd>

<space/>

<wd l="3312" t="4546" r="3758" b="4704">work</wd>

<space/>

<wd l="3850" t="4546" r="4450" b="4704">carried</wd>

<space/>

<wd l="4536" t="4570" r="4814" b="4704">out</wd>

<space/>

<wd l="4896" t="4546" r="5112" b="4747">by</wd>

<space/>

<wd l="5198" t="4546" r="5462" b="4704">the</wd>

<space/>

</ln>

<ln l="1781" t="4819" r="5453" b="4978" baseLine="4968" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="4824" r="3029" b="4978">DCU-ADAPT</wd>

<space/>

<wd l="3125" t="4843" r="3552" b="4978">team</wd>

<space/>

<wd l="3648" t="4872" r="3864" b="4978">on</wd>

<space/>

<wd l="3955" t="4819" r="4219" b="4978">the</wd>

<space/>

<wd l="4315" t="4819" r="4963" b="4978">Lexical</wd>

<space/>

<wd l="5059" t="4824" r="5453" b="4978">Nor-</wd>

</ln>

<ln l="1781" t="5088" r="5453" b="5246" baseLine="5242" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="5088" r="2693" b="5246">malisation</wd>

<space/>

<wd l="2798" t="5088" r="3360" b="5246">shared</wd>

<space/>

<wd l="3456" t="5088" r="3811" b="5246">task</wd>

<space/>

<wd l="3912" t="5112" r="4066" b="5246">at</wd>

<space/>

<wd l="4162" t="5093" r="4872" b="5246">W-NUT</wd>

<space/>

<wd l="4978" t="5088" r="5453" b="5246">2015.</wd>

<space/>

</ln>

<ln l="1781" t="5362" r="5453" b="5563" baseLine="5510" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="5366" r="2064" b="5520">We</wd>

<space/>

<wd l="2155" t="5362" r="2554" b="5520">train</wd>

<space/>

<wd l="2645" t="5414" r="2741" b="5520">a</wd>

<space/>

<wd l="2832" t="5362" r="3821" b="5563">generalised</wd>

<space/>

<wd l="3907" t="5386" r="4843" b="5563">perceptron</wd>

<space/>

<wd l="4930" t="5386" r="5093" b="5520">to</wd>

<space/>

<wd l="5194" t="5414" r="5453" b="5520">an-</wd>

</ln>

<ln l="1781" t="5630" r="5467" b="5832" baseLine="5784" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="5654" r="2314" b="5789">notate</wd>

<space/>

<wd l="2381" t="5630" r="2851" b="5832">noisy</wd>

<space/>

<wd l="2923" t="5654" r="3245" b="5789">text</wd>

<space/>

<wd l="3312" t="5630" r="3701" b="5789">with</wd>

<space/>

<wd l="3773" t="5630" r="4094" b="5789">edit</wd>

<space/>

<wd l="4166" t="5630" r="5064" b="5832">operations</wd>

<space/>

<wd l="5136" t="5630" r="5467" b="5789">that</wd>

<space/>

</ln>

<ln l="1781" t="5904" r="5453" b="6062" baseLine="6053" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="5904" r="2640" b="6062">normalise</wd>

<space/>

<wd l="2731" t="5904" r="3000" b="6062">the</wd>

<space/>

<wd l="3091" t="5928" r="3418" b="6062">text</wd>

<space/>

<wd l="3509" t="5904" r="3984" b="6062">when</wd>

<space/>

<wd l="4080" t="5904" r="4886" b="6062">executed.</wd>

<space/>

<wd l="5078" t="5909" r="5453" b="6062">Fea-</wd>

</ln>

<ln l="1781" t="6173" r="5453" b="6374" baseLine="6326">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1781" t="6197" r="2198" b="6331">tures</wd>

<space/>

<wd l="2256" t="6226" r="2515" b="6331">are</wd>

<space/>

<wd l="2568" t="6173" r="3365" b="6331">character</wd>

<space/>

</run>

<wd l="3413" t="6226" r="4186" b="6374"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-3">n</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">-grams,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="4243" t="6197" r="5035" b="6331">recurrent</wd>

<space/>

<wd l="5078" t="6226" r="5453" b="6331">neu-</wd>

</run>

</ln>

<ln l="1781" t="6446" r="5467" b="6648" baseLine="6595" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="6446" r="2006" b="6605">ral</wd>

<space/>

<wd l="2088" t="6446" r="2798" b="6605">network</wd>

<space/>

<wd l="2875" t="6446" r="3662" b="6648">language</wd>

<space/>

<wd l="3739" t="6446" r="4282" b="6605">model</wd>

<space/>

<wd l="4358" t="6446" r="4954" b="6605">hidden</wd>

<space/>

<wd l="5030" t="6446" r="5467" b="6648">layer</wd>

<space/>

</ln>

<ln l="1786" t="6715" r="5453" b="6917" baseLine="6864" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1786" t="6715" r="2760" b="6902">activations,</wd>

<space/>

<wd l="2904" t="6715" r="3701" b="6874">character</wd>

<space/>

<wd l="3816" t="6715" r="4224" b="6874">class</wd>

<space/>

<wd l="4349" t="6715" r="4661" b="6874">and</wd>

<space/>

<wd l="4781" t="6715" r="5453" b="6917">eligibil-</wd>

</ln>

<ln l="1781" t="6989" r="5453" b="7190" baseLine="7138" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="6989" r="2006" b="7190">ity</wd>

<space/>

<wd l="2078" t="6989" r="2338" b="7147">for</wd>

<space/>

<wd l="2405" t="6989" r="3000" b="7190">editing</wd>

<space/>

<wd l="3077" t="6989" r="3926" b="7190">according</wd>

<space/>

<wd l="3998" t="7013" r="4166" b="7147">to</wd>

<space/>

<wd l="4234" t="6989" r="4502" b="7147">the</wd>

<space/>

<wd l="4570" t="6989" r="4920" b="7147">task</wd>

<space/>

<wd l="4987" t="6989" r="5453" b="7147">rules.</wd>

<space/>

</ln>

<ln l="1781" t="7258" r="5458" b="7459" baseLine="7406" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="7262" r="2064" b="7416">We</wd>

<space/>

<wd l="2150" t="7258" r="2899" b="7416">combine</wd>

<space/>

<wd l="2981" t="7258" r="3941" b="7459">predictions</wd>

<space/>

<wd l="4032" t="7258" r="4459" b="7416">from</wd>

<space/>

<wd l="4541" t="7258" r="4742" b="7416">25</wd>

<space/>

<wd l="4834" t="7258" r="5458" b="7416">models</wd>

<space/>

</ln>

<ln l="1781" t="7526" r="5462" b="7728" baseLine="7680" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="7526" r="2386" b="7685">trained</wd>

<space/>

<wd l="2467" t="7579" r="2678" b="7685">on</wd>

<space/>

<wd l="2765" t="7526" r="3374" b="7685">subsets</wd>

<space/>

<wd l="3461" t="7526" r="3653" b="7685">of</wd>

<space/>

<wd l="3715" t="7526" r="3979" b="7685">the</wd>

<space/>

<wd l="4056" t="7526" r="4733" b="7728">training</wd>

<space/>

<wd l="4814" t="7526" r="5174" b="7685">data</wd>

<space/>

<wd l="5246" t="7526" r="5462" b="7728">by</wd>

<space/>

</ln>

<ln l="1790" t="7800" r="5453" b="8002" baseLine="7949" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1790" t="7800" r="2554" b="8002">selecting</wd>

<space/>

<wd l="2602" t="7800" r="2866" b="7958">the</wd>

<space/>

<wd l="2914" t="7800" r="3902" b="8002">most-likely</wd>

<space/>

<wd l="3950" t="7800" r="5155" b="7958">normalisation</wd>

<space/>

<wd l="5203" t="7853" r="5453" b="7958">ac-</wd>

</ln>

<ln l="1786" t="8069" r="5462" b="8270" baseLine="8222" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1786" t="8069" r="2443" b="8270">cording</wd>

<space/>

<wd l="2491" t="8093" r="2654" b="8227">to</wd>

<space/>

<wd l="2707" t="8122" r="2803" b="8227">a</wd>

<space/>

<wd l="2846" t="8069" r="3648" b="8227">character</wd>

<space/>

<wd l="3686" t="8069" r="4474" b="8270">language</wd>

<space/>

<wd l="4517" t="8069" r="5102" b="8227">model.</wd>

<space/>

<wd l="5179" t="8074" r="5462" b="8227">We</wd>

<space/>

</ln>

<ln l="1786" t="8342" r="5453" b="8544" baseLine="8491" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1786" t="8395" r="2530" b="8544">compare</wd>

<space/>

<wd l="2606" t="8342" r="2870" b="8501">the</wd>

<space/>

<wd l="2947" t="8395" r="3240" b="8501">use</wd>

<space/>

<wd l="3317" t="8342" r="3509" b="8501">of</wd>

<space/>

<wd l="3576" t="8395" r="3672" b="8501">a</wd>

<space/>

<wd l="3749" t="8342" r="4738" b="8544">generalised</wd>

<space/>

<wd l="4810" t="8395" r="5453" b="8544">percep-</wd>

</ln>

<ln l="1781" t="8611" r="5458" b="8770" baseLine="8765" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="8635" r="2131" b="8770">tron</wd>

<space/>

<wd l="2174" t="8635" r="2342" b="8770">to</wd>

<space/>

<wd l="2390" t="8611" r="2654" b="8770">the</wd>

<space/>

<wd l="2698" t="8664" r="2990" b="8770">use</wd>

<space/>

<wd l="3038" t="8611" r="3226" b="8770">of</wd>

<space/>

<wd l="3264" t="8611" r="4238" b="8770">conditional</wd>

<space/>

<wd l="4282" t="8611" r="4954" b="8770">random</wd>

<space/>

<wd l="4997" t="8611" r="5458" b="8770">fields</wd>

<space/>

</ln>

<ln l="1781" t="8885" r="5462" b="9086" baseLine="9034" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="8885" r="2592" b="9043">restricted</wd>

<space/>

<wd l="2683" t="8909" r="2851" b="9043">to</wd>

<space/>

<wd l="2957" t="8885" r="3590" b="9043">smaller</wd>

<space/>

<wd l="3686" t="8909" r="4411" b="9043">amounts</wd>

<space/>

<wd l="4517" t="8885" r="4709" b="9043">of</wd>

<space/>

<wd l="4786" t="8885" r="5462" b="9086">training</wd>

<space/>

</ln>

<ln l="1786" t="9154" r="5453" b="9355" baseLine="9307" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1786" t="9154" r="2146" b="9312">data</wd>

<space/>

<wd l="2266" t="9154" r="2578" b="9312">due</wd>

<space/>

<wd l="2698" t="9178" r="2866" b="9312">to</wd>

<space/>

<wd l="2986" t="9206" r="3710" b="9355">memory</wd>

<space/>

<wd l="3835" t="9154" r="4819" b="9312">constraints.</wd>

<space/>

<wd l="5093" t="9158" r="5453" b="9312">Fur-</wd>

</ln>

<ln l="1781" t="9427" r="5453" b="9629" baseLine="9576" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="9427" r="2611" b="9614">thermore,</wd>

<space/>

<wd l="2698" t="9480" r="2952" b="9586">we</wd>

<space/>

<wd l="3029" t="9427" r="3494" b="9586">make</wd>

<space/>

<wd l="3576" t="9480" r="3672" b="9586">a</wd>

<space/>

<wd l="3744" t="9427" r="4080" b="9586">first</wd>

<space/>

<wd l="4157" t="9451" r="4810" b="9629">attempt</wd>

<space/>

<wd l="4877" t="9451" r="5045" b="9586">to</wd>

<space/>

<wd l="5122" t="9480" r="5453" b="9586">ver-</wd>

</ln>

<ln l="1781" t="9696" r="5462" b="9898" baseLine="9845" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="9696" r="2021" b="9898">ify</wd>

<space/>

<wd l="2107" t="9696" r="2904" b="9898">Chrupała</wd>

<space/>

<wd l="2986" t="9701" r="3696" b="9893">(2014)’s</wd>

<space/>

<wd l="3782" t="9696" r="4709" b="9898">hypothesis</wd>

<space/>

<wd l="4795" t="9696" r="5122" b="9854">that</wd>

<space/>

<wd l="5198" t="9696" r="5462" b="9854">the</wd>

<space/>

</ln>

<ln l="1781" t="9970" r="5462" b="10171" baseLine="10118" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="9970" r="2251" b="10171">noisy</wd>

<space/>

<wd l="2328" t="9970" r="3000" b="10128">channel</wd>

<space/>

<wd l="3072" t="9970" r="3614" b="10128">model</wd>

<space/>

<wd l="3691" t="9970" r="4234" b="10128">would</wd>

<space/>

<wd l="4306" t="9994" r="4584" b="10128">not</wd>

<space/>

<wd l="4656" t="9970" r="4862" b="10128">be</wd>

<space/>

<wd l="4934" t="9970" r="5462" b="10128">useful</wd>

<space/>

</ln>

<ln l="1786" t="10238" r="5467" b="10440" baseLine="10387" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1786" t="10238" r="2093" b="10397">due</wd>

<space/>

<wd l="2160" t="10262" r="2323" b="10397">to</wd>

<space/>

<wd l="2390" t="10238" r="2654" b="10397">the</wd>

<space/>

<wd l="2717" t="10238" r="3341" b="10397">limited</wd>

<space/>

<wd l="3403" t="10262" r="4056" b="10397">amount</wd>

<space/>

<wd l="4123" t="10238" r="4310" b="10397">of</wd>

<space/>

<wd l="4358" t="10238" r="5035" b="10440">training</wd>

<space/>

<wd l="5107" t="10238" r="5467" b="10397">data</wd>

<space/>

</ln>

<ln l="1781" t="10507" r="5453" b="10709" baseLine="10661" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1781" t="10507" r="2040" b="10666">for</wd>

<space/>

<wd l="2083" t="10507" r="2347" b="10666">the</wd>

<space/>

<wd l="2405" t="10560" r="2966" b="10666">source</wd>

<space/>

<wd l="3014" t="10507" r="3802" b="10709">language</wd>

<space/>

<wd l="3850" t="10507" r="4435" b="10694">model,</wd>

<space/>

<wd l="4498" t="10507" r="4752" b="10666">i.e.</wd>

<space/>

<wd l="4810" t="10507" r="5078" b="10666">the</wd>

<space/>

<wd l="5126" t="10507" r="5453" b="10666">lan-</wd>

</ln>

<ln l="1786" t="10781" r="4618" b="10982" baseLine="10930" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1786" t="10834" r="2299" b="10982">guage</wd>

<space/>

<wd l="2357" t="10781" r="2899" b="10939">model</wd>

<space/>

<wd l="2962" t="10834" r="3178" b="10939">on</wd>

<space/>

<wd l="3230" t="10781" r="4200" b="10939">normalised</wd>

<space/>

<wd l="4253" t="10805" r="4618" b="10939">text.</wd>

</ln>

</para>

<para l="1454" t="11165" r="3091" b="11338" alignment="left" spaceBefore="129" lsp="exactly" lspExact="273" language="en">

<ln l="1454" t="11165" r="3091" b="11338" baseLine="11328" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="1454" t="11165" r="1550" b="11333">1</wd>

<space/>

<wd l="1805" t="11165" r="3091" b="11338">Introduction</wd>

</ln>

</para>

<para l="1440" t="11582" r="5808" b="14765" alignment="justified" spaceBefore="133" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="11582" r="5808" b="11784" baseLine="11736" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11582" r="1781" b="11741">The</wd>

<space/>

<wd l="1877" t="11587" r="2587" b="11741">W-NUT</wd>

<space/>

<wd l="2688" t="11582" r="3336" b="11741">Lexical</wd>

<space/>

<wd l="3437" t="11582" r="4690" b="11741">Normalisation</wd>

<space/>

<wd l="4786" t="11582" r="5045" b="11741">for</wd>

<space/>

<wd l="5141" t="11582" r="5808" b="11784">English</wd>

<space/>

</ln>

<ln l="1440" t="11856" r="5808" b="12058" baseLine="12005" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11861" r="2045" b="12014">Tweets</wd>

<space/>

<wd l="2155" t="11856" r="2717" b="12014">shared</wd>

<space/>

<wd l="2808" t="11856" r="3158" b="12014">task</wd>

<space/>

<wd l="3254" t="11856" r="3389" b="12014">is</wd>

<space/>

<wd l="3490" t="11880" r="3658" b="12014">to</wd>

<space/>

<wd l="3754" t="11856" r="4613" b="12014">normalise</wd>

<space/>

<wd l="4718" t="11856" r="5395" b="12058">spelling</wd>

<space/>

<wd l="5496" t="11856" r="5808" b="12014">and</wd>

<space/>

</ln>

<ln l="1440" t="12125" r="5794" b="12326" baseLine="12278" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12149" r="1608" b="12283">to</wd>

<space/>

<wd l="1670" t="12125" r="2294" b="12326">expand</wd>

<space/>

<wd l="2357" t="12125" r="3408" b="12283">contractions</wd>

<space/>

<wd l="3475" t="12125" r="3648" b="12278">in</wd>

<space/>

<wd l="3701" t="12125" r="4373" b="12326">English</wd>

<space/>

<wd l="4426" t="12125" r="5318" b="12326">microblog</wd>

<space/>

<wd l="5381" t="12178" r="5794" b="12283">mes-</wd>

</ln>

<ln l="1450" t="12398" r="5794" b="12600" baseLine="12547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="12451" r="1906" b="12600">sages</wd>

<space/>

<wd l="1968" t="12398" r="2774" b="12595">(Baldwin</wd>

<space/>

<wd l="2822" t="12422" r="2976" b="12557">et</wd>

<space/>

<wd l="3029" t="12398" r="3278" b="12586">al.,</wd>

<space/>

<wd l="3341" t="12398" r="3888" b="12595">2015).</wd>

<space/>

<wd l="3965" t="12398" r="4344" b="12557">This</wd>

<space/>

<wd l="4402" t="12398" r="5122" b="12557">includes</wd>

<space/>

<wd l="5179" t="12422" r="5794" b="12557">one-to-</wd>

</ln>

<ln l="1440" t="12667" r="5798" b="12869" baseLine="12816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12720" r="1920" b="12869">many</wd>

<space/>

<wd l="1973" t="12667" r="2285" b="12826">and</wd>

<space/>

<wd l="2328" t="12691" r="3437" b="12869">many-to-one</wd>

<space/>

<wd l="3485" t="12667" r="4627" b="12869">replacements</wd>

<space/>

<wd l="4690" t="12720" r="4858" b="12826">as</wd>

<space/>

<wd l="4910" t="12667" r="5083" b="12821">in</wd>

<space/>

<wd l="5131" t="12672" r="5798" b="12826">“we’re”</wd>

<space/>

</ln>

<ln l="1445" t="12941" r="5808" b="13142" baseLine="13090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="12941" r="1757" b="13099">and</wd>

<space/>

<wd l="1824" t="12941" r="1973" b="13094">“l</wd>

<space/>

<wd l="2045" t="12994" r="2146" b="13099">o</wd>

<space/>

<wd l="2218" t="12994" r="2323" b="13099">v</wd>

<space/>

<wd l="2395" t="12946" r="2626" b="13099">e”.</wd>

<space/>

<wd l="2736" t="12941" r="3350" b="13099">Tokens</wd>

<space/>

<wd l="3427" t="12941" r="4339" b="13142">containing</wd>

<space/>

<wd l="4411" t="12941" r="5285" b="13099">characters</wd>

<space/>

<wd l="5362" t="12941" r="5808" b="13099">other</wd>

<space/>

</ln>

<ln l="1440" t="13210" r="5803" b="13411" baseLine="13358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="13210" r="1819" b="13368">than</wd>

<space/>

<wd l="1896" t="13210" r="3072" b="13411">alphanumeric</wd>

<space/>

<wd l="3158" t="13210" r="4032" b="13368">characters</wd>

<space/>

<wd l="4118" t="13210" r="4430" b="13368">and</wd>

<space/>

<wd l="4507" t="13210" r="4771" b="13368">the</wd>

<space/>

<wd l="4853" t="13210" r="5803" b="13411">apostrophe</wd>

<space/>

</ln>

<ln l="1445" t="13478" r="5798" b="13680" baseLine="13632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="13531" r="1704" b="13637">are</wd>

<space/>

<wd l="1752" t="13478" r="2534" b="13637">excluded</wd>

<space/>

<wd l="2578" t="13478" r="3005" b="13637">from</wd>

<space/>

<wd l="3043" t="13478" r="3307" b="13637">the</wd>

<space/>

<wd l="3355" t="13478" r="3749" b="13666">task,</wd>

<space/>

<wd l="3811" t="13531" r="3979" b="13637">as</wd>

<space/>

<wd l="4027" t="13478" r="4402" b="13637">well</wd>

<space/>

<wd l="4454" t="13531" r="4622" b="13637">as</wd>

<space/>

<wd l="4670" t="13531" r="5246" b="13680">proper</wd>

<space/>

<wd l="5285" t="13531" r="5798" b="13637">nouns</wd>

<space/>

</ln>

<ln l="1445" t="13752" r="5794" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="13752" r="1757" b="13910">and</wd>

<space/>

<wd l="1843" t="13805" r="2678" b="13954">acronyms</wd>

<space/>

<wd l="2770" t="13752" r="3096" b="13910">that</wd>

<space/>

<wd l="3182" t="13752" r="3725" b="13910">would</wd>

<space/>

<wd l="3806" t="13752" r="4013" b="13910">be</wd>

<space/>

<wd l="4104" t="13752" r="5016" b="13954">acceptable</wd>

<space/>

<wd l="5102" t="13752" r="5275" b="13906">in</wd>

<space/>

<wd l="5357" t="13752" r="5794" b="13910">well-</wd>

</ln>

<ln l="1445" t="14021" r="5803" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="14021" r="1973" b="14179">edited</wd>

<space/>

<wd l="2030" t="14045" r="2395" b="14179">text.</wd>

<space/>

<wd l="2486" t="14021" r="2885" b="14218">(The</wd>

<space/>

<wd l="2942" t="14021" r="3432" b="14222">input,</wd>

<space/>

<wd l="3499" t="14021" r="4272" b="14208">however,</wd>

<space/>

<wd l="4344" t="14021" r="4728" b="14179">does</wd>

<space/>

<wd l="4795" t="14045" r="5074" b="14179">not</wd>

<space/>

<wd l="5126" t="14021" r="5803" b="14222">identify</wd>

<space/>

</ln>

<ln l="1450" t="14294" r="5798" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="14294" r="1843" b="14453">such</wd>

<space/>

<wd l="1906" t="14294" r="2467" b="14453">tokens</wd>

<space/>

<wd l="2549" t="14294" r="2861" b="14453">and</wd>

<space/>

<wd l="2923" t="14294" r="4109" b="14496">unnecessarily</wd>

<space/>

<wd l="4181" t="14294" r="5083" b="14496">modifying</wd>

<space/>

<wd l="5155" t="14294" r="5597" b="14453">them</wd>

<space/>

<wd l="5659" t="14294" r="5798" b="14453">is</wd>

<space/>

</ln>

<ln l="1440" t="14563" r="3878" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="14563" r="2266" b="14765">penalised</wd>

<space/>

<wd l="2318" t="14563" r="2491" b="14717">in</wd>

<space/>

<wd l="2544" t="14563" r="2808" b="14722">the</wd>

<space/>

<wd l="2870" t="14563" r="3878" b="14760">evaluation.)</wd>

</ln>

</para>

<para l="1440" t="14837" r="5794" b="15307" alignment="justified" fli="216" lsp="exactly" lspExact="266" language="en">

<ln l="1656" t="14837" r="5794" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="14842" r="1882" b="14995">To</wd>

<space/>

<wd l="1949" t="14837" r="2419" b="14995">make</wd>

<space/>

<wd l="2486" t="14837" r="3384" b="14995">evaluation</wd>

<space/>

<wd l="3451" t="14837" r="3989" b="15024">easier,</wd>

<space/>

<wd l="4070" t="14837" r="5078" b="15038">participants</wd>

<space/>

<wd l="5155" t="14890" r="5419" b="14995">are</wd>

<space/>

<wd l="5482" t="14837" r="5794" b="14995">fur-</wd>

</ln>

<ln l="1440" t="15106" r="5794" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="15106" r="1786" b="15264">ther</wd>

<space/>

<wd l="1867" t="15106" r="2597" b="15307">required</wd>

<space/>

<wd l="2683" t="15130" r="2851" b="15264">to</wd>

<space/>

<wd l="2947" t="15106" r="3379" b="15307">align</wd>

<space/>

<wd l="3470" t="15130" r="4027" b="15307">output</wd>

<space/>

<wd l="4114" t="15106" r="4670" b="15264">tokens</wd>

<space/>

<wd l="4766" t="15130" r="4934" b="15264">to</wd>

<space/>

<wd l="5026" t="15106" r="5477" b="15307">input</wd>

<space/>

<wd l="5563" t="15130" r="5794" b="15264">to-</wd>

</ln>

<ln l="0" t="0" r="0" b="0" baseLine="0" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<space/>

</ln>

</para>

</column>

<column l="6144" t="4092" r="10531" b="15317">

<para l="6144" t="4157" r="10512" b="5712" alignment="justified" spaceBefore="4" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="4157" r="10512" b="4358" baseLine="4306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4157" r="6586" b="4344">kens,</wd>

<space/>

<wd l="6677" t="4210" r="6974" b="4358">e.g.</wd>

<space/>

<wd l="7056" t="4157" r="7531" b="4315">when</wd>

<space/>

<wd l="7598" t="4157" r="7867" b="4315">the</wd>

<space/>

<wd l="7939" t="4157" r="8304" b="4315">four</wd>

<space/>

<wd l="8371" t="4157" r="8928" b="4315">tokens</wd>

<space/>

<wd l="9014" t="4157" r="9307" b="4344">“l”,</wd>

<space/>

<wd l="9398" t="4162" r="9739" b="4344">“o”,</wd>

<space/>

<wd l="9826" t="4162" r="10118" b="4315">“v”</wd>

<space/>

<wd l="10200" t="4157" r="10512" b="4315">and</wd>

<space/>

</ln>

<ln l="6149" t="4426" r="10498" b="4627" baseLine="4579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="4430" r="6432" b="4584">“e”</wd>

<space/>

<wd l="6523" t="4478" r="6787" b="4584">are</wd>

<space/>

<wd l="6874" t="4426" r="8035" b="4627">amalgamated</wd>

<space/>

<wd l="8117" t="4450" r="8285" b="4584">to</wd>

<space/>

<wd l="8371" t="4426" r="8635" b="4584">the</wd>

<space/>

<wd l="8731" t="4426" r="9240" b="4627">single</wd>

<space/>

<wd l="9326" t="4426" r="9811" b="4584">token</wd>

<space/>

<wd l="9898" t="4426" r="10498" b="4613">“love”,</wd>

<space/>

</ln>

<ln l="6144" t="4699" r="10502" b="4901" baseLine="4848" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4699" r="6581" b="4858">three</wd>

<space/>

<wd l="6634" t="4723" r="7171" b="4901">empty</wd>

<space/>

<wd l="7219" t="4699" r="7781" b="4858">tokens</wd>

<space/>

<wd l="7834" t="4723" r="8261" b="4858">must</wd>

<space/>

<wd l="8304" t="4699" r="8866" b="4858">follow</wd>

<space/>

<wd l="8918" t="4699" r="9086" b="4853">in</wd>

<space/>

<wd l="9134" t="4699" r="9398" b="4858">the</wd>

<space/>

<wd l="9451" t="4723" r="10046" b="4901">output.</wd>

<space/>

<wd l="10123" t="4699" r="10502" b="4858">This</wd>

<space/>

</ln>

<ln l="6144" t="4968" r="10512" b="5170" baseLine="5122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4968" r="6283" b="5126">is</wd>

<space/>

<wd l="6350" t="5021" r="6730" b="5170">easy</wd>

<space/>

<wd l="6782" t="4968" r="7042" b="5126">for</wd>

<space/>

<wd l="7094" t="4968" r="8064" b="5170">approaches</wd>

<space/>

<wd l="8122" t="4968" r="8453" b="5126">that</wd>

<space/>

<wd l="8501" t="5021" r="9149" b="5170">process</wd>

<space/>

<wd l="9211" t="4968" r="9475" b="5126">the</wd>

<space/>

<wd l="9528" t="4968" r="9979" b="5170">input</wd>

<space/>

<wd l="10027" t="4968" r="10512" b="5126">token</wd>

<space/>

</ln>

<ln l="6144" t="5242" r="10512" b="5443" baseLine="5390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5242" r="6360" b="5443">by</wd>

<space/>

<wd l="6437" t="5242" r="6922" b="5400">token</wd>

<space/>

<wd l="6994" t="5242" r="7272" b="5400">but</wd>

<space/>

<wd l="7344" t="5294" r="7718" b="5443">may</wd>

<space/>

<wd l="7795" t="5242" r="8410" b="5443">require</wd>

<space/>

<wd l="8491" t="5266" r="8923" b="5400">extra</wd>

<space/>

<wd l="8995" t="5242" r="9442" b="5400">work</wd>

<space/>

<wd l="9514" t="5242" r="9662" b="5395">if</wd>

<space/>

<wd l="9720" t="5242" r="9989" b="5400">the</wd>

<space/>

<wd l="10061" t="5242" r="10512" b="5443">input</wd>

<space/>

</ln>

<ln l="6154" t="5510" r="8755" b="5712" baseLine="5664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="5510" r="6638" b="5712">string</wd>

<space/>

<wd l="6696" t="5510" r="6835" b="5669">is</wd>

<space/>

<wd l="6898" t="5510" r="7757" b="5712">processed</wd>

<space/>

<wd l="7819" t="5510" r="8755" b="5712">differently.</wd>

</ln>

</para>

<para l="6144" t="5803" r="10512" b="7358" alignment="justified" spaceBefore="20" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="5803" r="10502" b="6005" baseLine="5952" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="5808" r="6648" b="5962">We</wd>

<space/>

<wd l="6715" t="5803" r="7637" b="6005">participate</wd>

<space/>

<wd l="7699" t="5803" r="7872" b="5957">in</wd>

<space/>

<wd l="7934" t="5803" r="8203" b="5962">the</wd>

<space/>

<wd l="8270" t="5803" r="9274" b="5962">constrained</wd>

<space/>

<wd l="9336" t="5803" r="9821" b="5962">mode</wd>

<space/>

<wd l="9888" t="5803" r="10219" b="5962">that</wd>

<space/>

<wd l="10286" t="5803" r="10502" b="5962">al-</wd>

</ln>

<ln l="6144" t="6072" r="10502" b="6230" baseLine="6226" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6072" r="6542" b="6230">lows</wd>

<space/>

<wd l="6619" t="6072" r="7709" b="6230">off-the-shelf</wd>

<space/>

<wd l="7757" t="6072" r="8174" b="6230">tools</wd>

<space/>

<wd l="8242" t="6072" r="8520" b="6230">but</wd>

<space/>

<wd l="8578" t="6125" r="8789" b="6230">no</wd>

<space/>

<wd l="8856" t="6072" r="10056" b="6230">normalisation</wd>

<space/>

<wd l="10114" t="6072" r="10502" b="6230">lexi-</wd>

</ln>

<ln l="6149" t="6346" r="10498" b="6533" baseLine="6494" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="6398" r="6538" b="6504">cons</wd>

<space/>

<wd l="6610" t="6346" r="6922" b="6504">and</wd>

<space/>

<wd l="6984" t="6346" r="7848" b="6504">additional</wd>

<space/>

<wd l="7915" t="6346" r="8280" b="6504">data</wd>

<space/>

<wd l="8333" t="6370" r="8501" b="6504">to</wd>

<space/>

<wd l="8563" t="6346" r="8770" b="6504">be</wd>

<space/>

<wd l="8827" t="6346" r="9274" b="6504">used.</wd>

<space/>

<wd l="9365" t="6346" r="10498" b="6533">Furthermore,</wd>

<space/>

</ln>

<ln l="6144" t="6614" r="10512" b="6816" baseLine="6768" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6667" r="6398" b="6773">we</wd>

<space/>

<wd l="6490" t="6614" r="6701" b="6773">do</wd>

<space/>

<wd l="6792" t="6638" r="7070" b="6773">not</wd>

<space/>

<wd l="7157" t="6667" r="7445" b="6773">use</wd>

<space/>

<wd l="7536" t="6667" r="7838" b="6816">any</wd>

<space/>

<wd l="7930" t="6614" r="8568" b="6773">lexicon</wd>

<space/>

<wd l="8659" t="6614" r="8851" b="6773">of</wd>

<space/>

<wd l="8928" t="6614" r="9754" b="6773">canonical</wd>

<space/>

<wd l="9845" t="6614" r="10512" b="6816">English</wd>

<space/>

</ln>

<ln l="6144" t="6888" r="10512" b="7090" baseLine="7037" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6888" r="6422" b="7046">but</wd>

<space/>

<wd l="6475" t="6888" r="6912" b="7046">learn</wd>

<space/>

<wd l="6965" t="6941" r="7258" b="7046">our</wd>

<space/>

<wd l="7306" t="6888" r="8506" b="7046">normalisation</wd>

<space/>

<wd l="8558" t="6888" r="9101" b="7046">model</wd>

<space/>

<wd l="9158" t="6888" r="9710" b="7090">purely</wd>

<space/>

<wd l="9768" t="6888" r="10195" b="7046">from</wd>

<space/>

<wd l="10243" t="6888" r="10512" b="7046">the</wd>

<space/>

</ln>

<ln l="6144" t="7157" r="8112" b="7358" baseLine="7310" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7157" r="6922" b="7358">provided</wd>

<space/>

<wd l="6974" t="7157" r="7646" b="7358">training</wd>

<space/>

<wd l="7709" t="7157" r="8112" b="7315">data.</wd>

</ln>

</para>

<para l="6144" t="7450" r="10517" b="11174" alignment="justified" spaceBefore="18" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6370" t="7450" r="10507" b="7651" baseLine="7598" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="7454" r="6706" b="7608">Our</wd>

<space/>

<wd l="6898" t="7450" r="7694" b="7651">approach</wd>

<space/>

<wd l="7882" t="7450" r="8525" b="7608">follows</wd>

<space/>

<wd l="8722" t="7450" r="9461" b="7651">previous</wd>

<space/>

<wd l="9658" t="7450" r="10104" b="7608">work</wd>

<space/>

<wd l="10291" t="7450" r="10507" b="7651">by</wd>

<space/>

</ln>

<ln l="6149" t="7718" r="10502" b="7920" baseLine="7872" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="7718" r="6950" b="7920">Chrupała</wd>

<space/>

<wd l="7042" t="7723" r="7603" b="7915">(2014)</wd>

<space/>

<wd l="7704" t="7718" r="7877" b="7872">in</wd>

<space/>

<wd l="7963" t="7718" r="8290" b="7877">that</wd>

<space/>

<wd l="8376" t="7771" r="8630" b="7877">we</wd>

<space/>

<wd l="8722" t="7718" r="9120" b="7877">train</wd>

<space/>

<wd l="9211" t="7771" r="9307" b="7877">a</wd>

<space/>

<wd l="9403" t="7771" r="10190" b="7920">sequence</wd>

<space/>

<wd l="10282" t="7718" r="10502" b="7877">la-</wd>

</ln>

<ln l="6144" t="7992" r="10512" b="8194" baseLine="8141" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7992" r="6648" b="8150">beller</wd>

<space/>

<wd l="6696" t="8016" r="6864" b="8150">to</wd>

<space/>

<wd l="6926" t="8016" r="7661" b="8150">annotate</wd>

<space/>

<wd l="7718" t="7992" r="8045" b="8150">edit</wd>

<space/>

<wd l="8098" t="7992" r="8995" b="8194">operations</wd>

<space/>

<wd l="9058" t="7992" r="9389" b="8150">that</wd>

<space/>

<wd l="9442" t="8045" r="9706" b="8150">are</wd>

<space/>

<wd l="9758" t="7992" r="10512" b="8150">intended</wd>

<space/>

</ln>

<ln l="6144" t="8261" r="10512" b="8462" baseLine="8414" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8285" r="6312" b="8419">to</wd>

<space/>

<wd l="6408" t="8261" r="7267" b="8419">normalise</wd>

<space/>

<wd l="7363" t="8261" r="7627" b="8419">the</wd>

<space/>

<wd l="7723" t="8285" r="8050" b="8419">text</wd>

<space/>

<wd l="8141" t="8261" r="8611" b="8419">when</wd>

<space/>

<wd l="8707" t="8261" r="9350" b="8462">applied</wd>

<space/>

<wd l="9442" t="8285" r="9605" b="8419">to</wd>

<space/>

<wd l="9701" t="8261" r="9970" b="8419">the</wd>

<space/>

<wd l="10061" t="8261" r="10512" b="8462">input</wd>

<space/>

</ln>

<ln l="6144" t="8534" r="10507" b="8736" baseLine="8683" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8558" r="6514" b="8693">text.</wd>

<space/>

<wd l="6686" t="8539" r="7507" b="8722">However,</wd>

<space/>

<wd l="7613" t="8534" r="8093" b="8693">while</wd>

<space/>

<wd l="8189" t="8534" r="8986" b="8736">Chrupała</wd>

<space/>

<wd l="9067" t="8587" r="9437" b="8693">uses</wd>

<space/>

<wd l="9533" t="8534" r="10507" b="8693">conditional</wd>

<space/>

</ln>

<ln l="6144" t="8803" r="10517" b="9005" baseLine="8957" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8803" r="6816" b="8962">random</wd>

<space/>

<wd l="6902" t="8803" r="7358" b="8962">fields</wd>

<space/>

<wd l="7450" t="8803" r="7709" b="8962">for</wd>

<space/>

<wd l="7800" t="8856" r="8587" b="9005">sequence</wd>

<space/>

<wd l="8674" t="8803" r="9480" b="9005">labelling,</wd>

<space/>

<wd l="9581" t="8856" r="9835" b="8962">we</wd>

<space/>

<wd l="9917" t="8803" r="10517" b="8962">further</wd>

<space/>

</ln>

<ln l="6149" t="9077" r="10512" b="9278" baseLine="9226" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="9077" r="7128" b="9278">experiment</wd>

<space/>

<wd l="7224" t="9077" r="7613" b="9235">with</wd>

<space/>

<wd l="7709" t="9077" r="8179" b="9278">using</wd>

<space/>

<wd l="8285" t="9130" r="8381" b="9235">a</wd>

<space/>

<wd l="8477" t="9077" r="9470" b="9278">generalised</wd>

<space/>

<wd l="9566" t="9082" r="10512" b="9278">Perceptron</wd>

<space/>

</ln>

<ln l="6149" t="9346" r="10512" b="9547" baseLine="9499" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="9346" r="6461" b="9504">and</wd>

<space/>

<wd l="6514" t="9346" r="6902" b="9504">with</wd>

<space/>

<wd l="6955" t="9346" r="7426" b="9547">using</wd>

<space/>

<wd l="7488" t="9398" r="7584" b="9504">a</wd>

<space/>

<wd l="7642" t="9346" r="8213" b="9547">simple</wd>

<space/>

<wd l="8266" t="9346" r="8736" b="9547">noisy</wd>

<space/>

<wd l="8798" t="9346" r="9470" b="9504">channel</wd>

<space/>

<wd l="9523" t="9346" r="10066" b="9504">model</wd>

<space/>

<wd l="10123" t="9346" r="10512" b="9504">with</wd>

<space/>

</ln>

<ln l="6149" t="9619" r="10512" b="9821" baseLine="9768">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="9619" r="6950" b="9778">character</wd>

<space/>

</run>

<wd l="7018" t="9672" r="7666" b="9821"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">n</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">-gram</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="7733" t="9619" r="8520" b="9821">language</wd>

<space/>

<wd l="8587" t="9619" r="9211" b="9778">models</wd>

<space/>

<wd l="9283" t="9619" r="9893" b="9778">trained</wd>

<space/>

<wd l="9965" t="9672" r="10176" b="9778">on</wd>

<space/>

<wd l="10243" t="9619" r="10512" b="9778">the</wd>

<space/>

</run>

</ln>

<ln l="6144" t="9888" r="10502" b="10090" baseLine="10037" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9888" r="7118" b="10046">normalised</wd>

<space/>

<wd l="7171" t="9888" r="7512" b="10046">side</wd>

<space/>

<wd l="7565" t="9888" r="7757" b="10046">of</wd>

<space/>

<wd l="7790" t="9888" r="8054" b="10046">the</wd>

<space/>

<wd l="8102" t="9888" r="8779" b="10090">training</wd>

<space/>

<wd l="8837" t="9888" r="9197" b="10046">data</wd>

<space/>

<wd l="9240" t="9912" r="9408" b="10046">to</wd>

<space/>

<wd l="9470" t="9888" r="9955" b="10046">select</wd>

<space/>

<wd l="10003" t="9888" r="10267" b="10046">the</wd>

<space/>

<wd l="10320" t="9888" r="10502" b="10042">fi-</wd>

</ln>

<ln l="6144" t="10157" r="10502" b="10315" baseLine="10310" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10157" r="6408" b="10315">nal</wd>

<space/>

<wd l="6466" t="10157" r="7666" b="10315">normalisation</wd>

<space/>

<wd l="7718" t="10157" r="8146" b="10315">from</wd>

<space/>

<wd l="8198" t="10210" r="8294" b="10315">a</wd>

<space/>

<wd l="8352" t="10181" r="8587" b="10315">set</wd>

<space/>

<wd l="8640" t="10157" r="8832" b="10315">of</wd>

<space/>

<wd l="8875" t="10157" r="9706" b="10315">candidate</wd>

<space/>

<wd l="9758" t="10157" r="10502" b="10315">normali-</wd>

</ln>

<ln l="6154" t="10430" r="10502" b="10632" baseLine="10579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="10430" r="6667" b="10589">sation</wd>

<space/>

<wd l="6720" t="10430" r="7565" b="10632">generated</wd>

<space/>

<wd l="7608" t="10430" r="8035" b="10589">from</wd>

<space/>

<wd l="8083" t="10483" r="8285" b="10589">an</wd>

<space/>

<wd l="8338" t="10430" r="9158" b="10589">ensemble</wd>

<space/>

<wd l="9211" t="10430" r="9398" b="10589">of</wd>

<space/>

<wd l="9442" t="10483" r="10234" b="10632">sequence</wd>

<space/>

<wd l="10282" t="10430" r="10502" b="10589">la-</wd>

</ln>

<ln l="6144" t="10699" r="10512" b="10901" baseLine="10853" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10699" r="6720" b="10858">bellers</wd>

<space/>

<wd l="6802" t="10699" r="7109" b="10858">and</wd>

<space/>

<wd l="7176" t="10699" r="7603" b="10858">from</wd>

<space/>

<wd l="7680" t="10699" r="8587" b="10901">selectively</wd>

<space/>

<wd l="8659" t="10699" r="9398" b="10901">ignoring</wd>

<space/>

<wd l="9475" t="10752" r="9926" b="10858">some</wd>

<space/>

<wd l="9998" t="10699" r="10190" b="10858">of</wd>

<space/>

<wd l="10243" t="10699" r="10512" b="10858">the</wd>

<space/>

</ln>

<ln l="6144" t="10973" r="8333" b="11174" baseLine="11122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10973" r="6946" b="11174">proposed</wd>

<space/>

<wd l="7003" t="10973" r="7330" b="11131">edit</wd>

<space/>

<wd l="7387" t="10973" r="8333" b="11174">operations.</wd>

</ln>

</para>

<para l="6144" t="11506" r="8539" b="11726" alignment="left" spaceBefore="278" lsp="exactly" lspExact="273" language="en">

<ln l="6144" t="11506" r="8539" b="11726" baseLine="11669" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">

<wd l="6144" t="11506" r="6259" b="11674">2</wd>

<space/>

<wd l="6504" t="11506" r="7896" b="11726">Experimental</wd>

<space/>

<wd l="7963" t="11506" r="8539" b="11726">Setup</wd>

</ln>

</para>

<para l="6144" t="11981" r="9422" b="12144" alignment="left" spaceBefore="214" lsp="exactly" lspExact="254" language="en">

<ln l="6144" t="11981" r="9422" b="12144" baseLine="12139" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11986" r="6408" b="12144">2.1</wd>

<space/>

<wd l="6638" t="11990" r="7085" b="12144">Data</wd>

<space/>

<wd l="7142" t="11986" r="7435" b="12144">Set</wd>

<space/>

<wd l="7488" t="11990" r="7834" b="12144">and</wd>

<space/>

<wd l="7901" t="11986" r="9422" b="12144">Cross-validation</wd>

</ln>

</para>

<para l="6144" t="12374" r="10502" b="13934" alignment="justified" spaceBefore="115" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="12374" r="10502" b="12576" baseLine="12528" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="12374" r="6485" b="12533">The</wd>

<space/>

<wd l="6538" t="12374" r="7430" b="12576">microblog</wd>

<space/>

<wd l="7493" t="12374" r="7858" b="12533">data</wd>

<space/>

<wd l="7915" t="12398" r="8150" b="12533">set</wd>

<space/>

<wd l="8208" t="12374" r="8395" b="12533">of</wd>

<space/>

<wd l="8438" t="12374" r="8702" b="12533">the</wd>

<space/>

<wd l="8765" t="12374" r="9326" b="12533">shared</wd>

<space/>

<wd l="9379" t="12374" r="9730" b="12533">task</wd>

<space/>

<wd l="9787" t="12374" r="10502" b="12533">contains</wd>

<space/>

</ln>

<ln l="6149" t="12648" r="10502" b="12850" baseLine="12797" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="12648" r="6634" b="12835">2,950</wd>

<space/>

<wd l="6710" t="12672" r="7258" b="12806">tweets</wd>

<space/>

<wd l="7339" t="12648" r="7594" b="12806">for</wd>

<space/>

<wd l="7661" t="12648" r="8338" b="12850">training</wd>

<space/>

<wd l="8419" t="12648" r="8731" b="12806">and</wd>

<space/>

<wd l="8822" t="12648" r="9283" b="12835">1,967</wd>

<space/>

<wd l="9360" t="12672" r="9912" b="12806">tweets</wd>

<space/>

<wd l="9989" t="12648" r="10248" b="12806">for</wd>

<space/>

<wd l="10320" t="12648" r="10502" b="12802">fi-</wd>

</ln>

<ln l="6144" t="12917" r="10502" b="13118" baseLine="13070" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="12917" r="6408" b="13075">nal</wd>

<space/>

<wd l="6466" t="12917" r="7090" b="13118">testing.</wd>

<space/>

<wd l="7166" t="12917" r="7603" b="13075">Each</wd>

<space/>

<wd l="7656" t="12941" r="8126" b="13075">tweet</wd>

<space/>

<wd l="8179" t="12917" r="8314" b="13075">is</wd>

<space/>

<wd l="8376" t="12917" r="9211" b="13075">tokenised</wd>

<space/>

<wd l="9264" t="12917" r="9576" b="13075">and</wd>

<space/>

<wd l="9624" t="12917" r="9893" b="13075">the</wd>

<space/>

<wd l="9946" t="12917" r="10502" b="13075">tokens</wd>

<space/>

</ln>

<ln l="6149" t="13190" r="10498" b="13392" baseLine="13339" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="13190" r="6341" b="13349">of</wd>

<space/>

<wd l="6394" t="13190" r="6662" b="13349">the</wd>

<space/>

<wd l="6730" t="13190" r="7699" b="13349">normalised</wd>

<space/>

<wd l="7766" t="13214" r="8318" b="13349">tweets</wd>

<space/>

<wd l="8395" t="13243" r="8659" b="13349">are</wd>

<space/>

<wd l="8731" t="13190" r="9370" b="13392">aligned</wd>

<space/>

<wd l="9437" t="13214" r="9600" b="13349">to</wd>

<space/>

<wd l="9672" t="13190" r="9941" b="13349">the</wd>

<space/>

<wd l="10008" t="13190" r="10498" b="13392">input,</wd>

<space/>

</ln>

<ln l="6149" t="13459" r="10502" b="13661" baseLine="13613" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="13459" r="6902" b="13661">allowing</wd>

<space/>

<wd l="6965" t="13459" r="7219" b="13618">for</wd>

<space/>

<wd l="7282" t="13483" r="8266" b="13646">one-to-one,</wd>

<space/>

<wd l="8338" t="13483" r="9446" b="13661">many-to-one</wd>

<space/>

<wd l="9514" t="13459" r="9821" b="13618">and</wd>

<space/>

<wd l="9888" t="13483" r="10502" b="13618">one-to-</wd>

</ln>

<ln l="6144" t="13733" r="7685" b="13934" baseLine="13882" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="13786" r="6624" b="13934">many</wd>

<space/>

<wd l="6686" t="13733" r="7685" b="13934">alignments.</wd>

</ln>

</para>

<para l="6144" t="14021" r="10526" b="15264" alignment="justified" spaceBefore="22" fli="216" lsp="exactly" lspExact="269" language="en">

<ln l="6365" t="14021" r="10502" b="14208" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6365" t="14026" r="6667" b="14179">For</wd>

<space/>

<wd l="6725" t="14021" r="7464" b="14179">five-fold</wd>

<space/>

<wd l="7526" t="14021" r="8952" b="14208">cross-validation,</wd>

<space/>

<wd l="9019" t="14074" r="9274" b="14179">we</wd>

<space/>

<wd l="9341" t="14045" r="9662" b="14179">sort</wd>

<space/>

<wd l="9715" t="14021" r="9979" b="14179">the</wd>

<space/>

<wd l="10037" t="14021" r="10502" b="14179">train-</wd>

</ln>

<ln l="6144" t="14294" r="10526" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="14294" r="6422" b="14496">ing</wd>

<space/>

<wd l="6523" t="14294" r="6888" b="14453">data</wd>

<space/>

<wd l="6974" t="14294" r="7190" b="14496">by</wd>

<space/>

<wd l="7286" t="14318" r="7762" b="14453">tweet</wd>

<space/>

<wd l="7853" t="14299" r="8078" b="14448">ID</wd>

<space/>

<wd l="8184" t="14294" r="8496" b="14453">and</wd>

<space/>

<wd l="8597" t="14294" r="8966" b="14496">split</wd>

<space/>

<wd l="9058" t="14294" r="9178" b="14453">it</wd>

<space/>

<wd l="9274" t="14294" r="9610" b="14453">into</wd>

<space/>

<wd l="9710" t="14294" r="9802" b="14453">5</wd>

<space/>

<wd l="9917" t="14318" r="10229" b="14453">sets</wd>

<space/>

<wd l="10334" t="14294" r="10526" b="14453">of</wd>

<space/>

</ln>

<ln l="6144" t="14563" r="10502" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="14563" r="6821" b="14765">roughly</wd>

<space/>

<wd l="6907" t="14563" r="7171" b="14722">the</wd>

<space/>

<wd l="7262" t="14616" r="7699" b="14722">same</wd>

<space/>

<wd l="7781" t="14563" r="8453" b="14722">number</wd>

<space/>

<wd l="8534" t="14563" r="8722" b="14722">of</wd>

<space/>

<wd l="8789" t="14563" r="9403" b="14722">tokens.</wd>

<space/>

<wd l="9566" t="14563" r="9970" b="14760">(The</wd>

<space/>

<wd l="10051" t="14616" r="10502" b="14722">num-</wd>

</ln>

<ln l="6144" t="14837" r="10502" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="14837" r="6427" b="14995">ber</wd>

<space/>

<wd l="6514" t="14837" r="6701" b="14995">of</wd>

<space/>

<wd l="6773" t="14861" r="7320" b="14995">tweets</wd>

<space/>

<wd l="7411" t="14837" r="7920" b="14995">varies</wd>

<space/>

<wd l="8011" t="14837" r="8438" b="14995">from</wd>

<space/>

<wd l="8520" t="14837" r="8837" b="14995">579</wd>

<space/>

<wd l="8923" t="14861" r="9091" b="14995">to</wd>

<space/>

<wd l="9182" t="14837" r="9624" b="15034">606.)</wd>

<space/>

<wd l="9787" t="14842" r="10502" b="15038">Systems</wd>

<space/>

</ln>

<ln l="6149" t="15106" r="10502" b="15264" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6149" t="15158" r="6413" b="15264">are</wd>

<space/>

<wd l="6480" t="15106" r="7085" b="15264">trained</wd>

<space/>

<wd l="7157" t="15158" r="7368" b="15264">on</wd>

<space/>

<wd l="7435" t="15106" r="7805" b="15264">four</wd>

<space/>

<wd l="7877" t="15130" r="8184" b="15264">sets</wd>

<space/>

<wd l="8261" t="15106" r="8573" b="15264">and</wd>

<space/>

<wd l="8640" t="15106" r="9149" b="15264">tested</wd>

<space/>

<wd l="9221" t="15158" r="9437" b="15264">on</wd>

<space/>

<wd l="9499" t="15106" r="9763" b="15264">the</wd>

<space/>

<wd l="9830" t="15106" r="10502" b="15264">remain-</wd>

</run>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<section l="1433" t="15317" r="10531" b="16480">

<column l="1433" t="15317" r="10531" b="16480">

<para l="5804" t="15792" r="6138" b="15946" alignment="centered" spaceBefore="406" lsp="exactly" lspExact="271" language="en">

<ln l="5870" t="15792" r="6072" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="37">

<wd l="5870" t="15792" r="6072" b="15946">93</wd>

</ln>

</para>

<para l="2918" t="16133" r="8981" b="16469" alignment="centered" spaceBefore="138" lsp="exactly" lspExact="170" language="en">

<ln l="2918" t="16133" r="8981" b="16301" baseLine="16253" forcedEOF="true">

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2918" t="16133" r="3802" b="16296">Proceedings</wd>

<space/>

<wd l="3854" t="16133" r="4018" b="16296">of</wd>

<space/>

<wd l="4037" t="16133" r="4248" b="16262">the</wd>

<space/>

<wd l="4286" t="16138" r="4622" b="16262">ACL</wd>

<space/>

<wd l="4666" t="16133" r="5026" b="16262">2015</wd>

<space/>

<wd l="5078" t="16133" r="5779" b="16296">Workshop</wd>

<space/>

<wd l="5832" t="16176" r="6000" b="16262">on</wd>

<space/>

<wd l="6043" t="16138" r="6456" b="16296">Noisy</wd>

<space/>

<wd l="6518" t="16133" r="7627" b="16296">User-generated</wd>

<space/>

</run>

<wd l="7675" t="16138" r="7992" b="16286"><run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Text</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8045" t="16171" r="8443" b="16301">pages</wd>

<space/>

<wd l="8501" t="16133" r="8981" b="16286">93–98,
</wd>

</run>

</ln>

<ln l="3029" t="16296" r="8870" b="16469" baseLine="16425" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3029" t="16301" r="3595" b="16469">Beijing,</wd>

<space/>

<wd l="3653" t="16301" r="4114" b="16454">China,</wd>

<space/>

<wd l="4166" t="16301" r="4459" b="16469">July</wd>

<space/>

<wd l="4512" t="16301" r="4723" b="16454">31,</wd>

<space/>

<wd l="4781" t="16301" r="5170" b="16430">2015.</wd>

<space/>

</run>

<wd l="5246" t="16296" r="5770" b="16469"><run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">c</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">�</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5822" t="16301" r="6672" b="16430">Association</wd>

<space/>

<wd l="6715" t="16301" r="6926" b="16430">for</wd>

<space/>

<wd l="6974" t="16301" r="8035" b="16469">Computational</wd>

<space/>

<wd l="8078" t="16301" r="8870" b="16469">Linguistics</wd>

</run>

</ln>

</para>

</column>

</section>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4314.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1260" marginRight="1388" marginBottom="1302" offsetX="-20" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1260" r="10521" b="15310">

<column l="1440" t="1260" r="5822" b="15310">

<para l="1440" t="1320" r="5808" b="2563" alignment="justified" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="1320" r="5808" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1320" r="1714" b="1522">ing</wd>

<space/>

<wd l="1824" t="1344" r="2102" b="1478">set.</wd>

<space/>

<wd l="2318" t="1320" r="2794" b="1478">Since</wd>

<space/>

<wd l="2894" t="1320" r="3158" b="1478">the</wd>

<space/>

<wd l="3269" t="1373" r="4056" b="1522">sequence</wd>

<space/>

<wd l="4157" t="1320" r="4886" b="1478">labellers</wd>

<space/>

<wd l="4992" t="1320" r="5611" b="1522">require</wd>

<space/>

<wd l="5712" t="1373" r="5808" b="1478">a</wd>

<space/>

</ln>

<ln l="1445" t="1594" r="5808" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="1594" r="2558" b="1795">development</wd>

<space/>

<wd l="2659" t="1618" r="2938" b="1781">set,</wd>

<space/>

<wd l="3048" t="1646" r="3302" b="1752">we</wd>

<space/>

<wd l="3403" t="1594" r="3773" b="1795">split</wd>

<space/>

<wd l="3864" t="1594" r="4128" b="1752">the</wd>

<space/>

<wd l="4219" t="1594" r="4718" b="1752">union</wd>

<space/>

<wd l="4814" t="1594" r="5006" b="1752">of</wd>

<space/>

<wd l="5083" t="1594" r="5347" b="1752">the</wd>

<space/>

<wd l="5443" t="1594" r="5808" b="1752">four</wd>

<space/>

</ln>

<ln l="1450" t="1862" r="5794" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="1886" r="1762" b="2021">sets</wd>

<space/>

<wd l="1862" t="1862" r="2333" b="2064">again</wd>

<space/>

<wd l="2419" t="1862" r="2755" b="2021">into</wd>

<space/>

<wd l="2856" t="1862" r="2947" b="2021">5</wd>

<space/>

<wd l="3058" t="1886" r="3370" b="2021">sets</wd>

<space/>

<wd l="3466" t="1886" r="3634" b="2021">to</wd>

<space/>

<wd l="3734" t="1915" r="4171" b="2064">carry</wd>

<space/>

<wd l="4272" t="1886" r="4546" b="2021">out</wd>

<space/>

<wd l="4637" t="1862" r="5194" b="2021">nested</wd>

<space/>

<wd l="5290" t="1915" r="5794" b="2021">cross-</wd>

</ln>

<ln l="1440" t="2136" r="5794" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2136" r="2352" b="2323">validation,</wd>

<space/>

<wd l="2410" t="2136" r="3082" b="2338">training</wd>

<space/>

<wd l="3134" t="2136" r="3336" b="2294">25</wd>

<space/>

<wd l="3394" t="2136" r="4013" b="2294">models</wd>

<space/>

<wd l="4066" t="2136" r="4238" b="2290">in</wd>

<space/>

<wd l="4282" t="2136" r="4666" b="2294">total</wd>

<space/>

<wd l="4714" t="2136" r="4973" b="2294">for</wd>

<space/>

<wd l="5016" t="2136" r="5410" b="2294">each</wd>

<space/>

<wd l="5462" t="2189" r="5794" b="2338">sys-</wd>

</ln>

<ln l="1440" t="2410" r="1810" b="2563" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2429" r="1810" b="2563">tem.</wd>

</ln>

</para>

<para l="1440" t="2842" r="3696" b="3000" alignment="left" spaceBefore="188" lsp="exactly" lspExact="251" language="en">

<ln l="1440" t="2842" r="3696" b="3000" baseLine="2995" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">

<wd l="1440" t="2842" r="1709" b="3000">2.2</wd>

<space/>

<wd l="1930" t="2846" r="2650" b="3000">Feature</wd>

<space/>

<wd l="2702" t="2842" r="3696" b="3000">Extraction</wd>

</ln>

</para>

<para l="1440" t="3192" r="5818" b="8002" alignment="justified" spaceBefore="106" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="3192" r="5803" b="3394" baseLine="3346" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="3197" r="1742" b="3350">For</wd>

<space/>

<wd l="1819" t="3192" r="2678" b="3394">extracting</wd>

<space/>

<wd l="2755" t="3216" r="3542" b="3350">recurrent</wd>

<space/>

<wd l="3614" t="3192" r="4157" b="3350">neural</wd>

<space/>

<wd l="4234" t="3192" r="4949" b="3350">network</wd>

<space/>

<wd l="5016" t="3192" r="5803" b="3394">language</wd>

<space/>

</ln>

<ln l="1440" t="3427" r="5794" b="3667" baseLine="3610">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1440" t="3466" r="1982" b="3624">model</wd>

<space/>

<wd l="2050" t="3466" r="2784" b="3653">features,</wd>

<space/>

<wd l="2856" t="3518" r="3110" b="3624">we</wd>

<space/>

<wd l="3173" t="3518" r="3466" b="3624">use</wd>

<space/>

</run>

<wd l="3528" t="3427" r="4166" b="3624"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">Elman</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="4258" t="3466" r="5165" b="3667">(Chrupała,</wd>

<space/>

<wd l="5246" t="3470" r="5794" b="3662">2014),</wd>

<space/>

</run>

</ln>

<ln l="1445" t="3701" r="5808" b="3931" baseLine="3884">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1445" t="3787" r="1541" b="3893">a</wd>

<space/>

<wd l="1579" t="3734" r="2683" b="3893">modification</wd>

<space/>

<wd l="2726" t="3734" r="2918" b="3893">of</wd>

<space/>

<wd l="2947" t="3734" r="3211" b="3893">the</wd>

<space/>

<wd l="3254" t="3739" r="4042" b="3893">RNNLM</wd>

<space/>

</run>

<wd l="4085" t="3701" r="4733" b="3893"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">toolkit</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="4795" t="3734" r="5602" b="3931">(Mikolov</wd>

<space/>

<wd l="5654" t="3758" r="5808" b="3893">et</wd>

<space/>

</run>

</ln>

<ln l="1445" t="4008" r="5808" b="4210" baseLine="4157" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="4008" r="1694" b="4195">al.,</wd>

<space/>

<wd l="1757" t="4013" r="2237" b="4195">2010;</wd>

<space/>

<wd l="2294" t="4008" r="3072" b="4195">Mikolov,</wd>

<space/>

<wd l="3130" t="4013" r="3624" b="4205">2012)</wd>

<space/>

<wd l="3677" t="4008" r="4008" b="4166">that</wd>

<space/>

<wd l="4051" t="4032" r="4680" b="4210">outputs</wd>

<space/>

<wd l="4733" t="4008" r="5328" b="4166">hidden</wd>

<space/>

<wd l="5371" t="4008" r="5808" b="4210">layer</wd>

<space/>

</ln>

<ln l="1445" t="4277" r="5808" b="4435" baseLine="4426" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="4277" r="2419" b="4435">activations.</wd>

<space/>

<wd l="2549" t="4282" r="2832" b="4435">We</wd>

<space/>

<wd l="2904" t="4330" r="3197" b="4435">use</wd>

<space/>

<wd l="3269" t="4277" r="3533" b="4435">the</wd>

<space/>

<wd l="3610" t="4277" r="4704" b="4435">off-the-shelf</wd>

<space/>

<wd l="4766" t="4277" r="5309" b="4435">model</wd>

<space/>

<wd l="5381" t="4277" r="5808" b="4435">from</wd>

<space/>

</ln>

<ln l="1445" t="4512" r="5818" b="4752" baseLine="4697">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1445" t="4550" r="2242" b="4752">Chrupała</wd>

<space/>

</run>

<wd l="2309" t="4512" r="3014" b="4747"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">(2014)</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">3</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="3115" t="4550" r="3451" b="4709">The</wd>

<space/>

<wd l="3514" t="4550" r="3965" b="4752">input</wd>

<space/>

<wd l="4027" t="4603" r="4291" b="4709">are</wd>

<space/>

<wd l="4349" t="4550" r="4618" b="4709">the</wd>

<space/>

<wd l="4685" t="4550" r="5554" b="4709">characters</wd>

<space/>

<wd l="5630" t="4550" r="5818" b="4709">of</wd>

<space/>

</run>

</ln>

<ln l="1440" t="4781" r="5808" b="5021" baseLine="4964">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1440" t="4819" r="1704" b="4978">the</wd>

<space/>

</run>

<wd l="1757" t="4781" r="2304" b="4978"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">tweet</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">4</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="2366" t="4819" r="2539" b="4973">in</wd>

<space/>

<wd l="2587" t="4819" r="3254" b="4978">one-hot</wd>

<space/>

<wd l="3302" t="4819" r="4142" b="5021">encoding.</wd>

<space/>

<wd l="4219" t="4819" r="4560" b="4978">The</wd>

<space/>

<wd l="4608" t="4819" r="5323" b="4978">network</wd>

<space/>

<wd l="5371" t="4819" r="5650" b="4978">has</wd>

<space/>

<wd l="5712" t="4872" r="5808" b="4978">a</wd>

<space/>

</run>

</ln>

<ln l="1440" t="5088" r="5803" b="5290" baseLine="5242" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5088" r="2035" b="5246">hidden</wd>

<space/>

<wd l="2102" t="5088" r="2539" b="5290">layer</wd>

<space/>

<wd l="2606" t="5088" r="2995" b="5246">with</wd>

<space/>

<wd l="3058" t="5093" r="3384" b="5246">400</wd>

<space/>

<wd l="3451" t="5141" r="4138" b="5246">neurons</wd>

<space/>

<wd l="4214" t="5088" r="4526" b="5246">and</wd>

<space/>

<wd l="4594" t="5088" r="4714" b="5246">it</wd>

<space/>

<wd l="4781" t="5088" r="5462" b="5290">predicts</wd>

<space/>

<wd l="5539" t="5088" r="5803" b="5246">the</wd>

<space/>

</ln>

<ln l="1440" t="5362" r="5803" b="5563" baseLine="5510" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5386" r="1814" b="5520">next</wd>

<space/>

<wd l="1877" t="5362" r="2294" b="5563">byte.</wd>

<space/>

<wd l="2395" t="5362" r="3278" b="5563">Following</wd>

<space/>

<wd l="3350" t="5362" r="4147" b="5563">Chrupała</wd>

<space/>

<wd l="4219" t="5366" r="4834" b="5558">(2014),</wd>

<space/>

<wd l="4906" t="5414" r="5160" b="5520">we</wd>

<space/>

<wd l="5222" t="5362" r="5803" b="5520">reduce</wd>

<space/>

</ln>

<ln l="1440" t="5630" r="5794" b="5832" baseLine="5784" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5630" r="1704" b="5789">the</wd>

<space/>

<wd l="1776" t="5635" r="2102" b="5789">400</wd>

<space/>

<wd l="2179" t="5630" r="3101" b="5789">activations</wd>

<space/>

<wd l="3182" t="5654" r="3350" b="5789">to</wd>

<space/>

<wd l="3446" t="5635" r="3638" b="5789">10</wd>

<space/>

<wd l="3715" t="5630" r="4267" b="5832">binary</wd>

<space/>

<wd l="4344" t="5630" r="5074" b="5789">features:</wd>

<space/>

<wd l="5194" t="5635" r="5477" b="5789">We</wd>

<space/>

<wd l="5558" t="5683" r="5794" b="5789">se-</wd>

</ln>

<ln l="1440" t="5904" r="5803" b="6106" baseLine="6053" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5904" r="1757" b="6062">lect</wd>

<space/>

<wd l="1810" t="5904" r="2078" b="6062">the</wd>

<space/>

<wd l="2160" t="5909" r="2347" b="6062">10</wd>

<space/>

<wd l="2410" t="5928" r="2837" b="6062">most</wd>

<space/>

<wd l="2894" t="5904" r="3403" b="6062">active</wd>

<space/>

<wd l="3461" t="5957" r="4142" b="6062">neurons</wd>

<space/>

<wd l="4205" t="5904" r="4378" b="6058">in</wd>

<space/>

<wd l="4435" t="5904" r="4896" b="6062">order</wd>

<space/>

<wd l="4954" t="5904" r="5266" b="6062">and</wd>

<space/>

<wd l="5323" t="5904" r="5803" b="6106">apply</wd>

<space/>

</ln>

<ln l="1445" t="6173" r="5803" b="6370" baseLine="6326" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="6226" r="1541" b="6331">a</wd>

<space/>

<wd l="1584" t="6173" r="2395" b="6331">threshold</wd>

<space/>

<wd l="2453" t="6173" r="2851" b="6370">(0.5)</wd>

<space/>

<wd l="2909" t="6197" r="3077" b="6331">to</wd>

<space/>

<wd l="3125" t="6173" r="3394" b="6331">the</wd>

<space/>

<wd l="3446" t="6173" r="4334" b="6331">activation.</wd>

<space/>

<wd l="4411" t="6173" r="4747" b="6331">The</wd>

<space/>

<wd l="4795" t="6173" r="5261" b="6331">value</wd>

<space/>

<wd l="5314" t="6173" r="5506" b="6331">of</wd>

<space/>

<wd l="5539" t="6173" r="5803" b="6331">the</wd>

<space/>

</ln>

<ln l="1445" t="6446" r="5803" b="6648" baseLine="6595" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="6446" r="1757" b="6605">i-th</wd>

<space/>

<wd l="1800" t="6446" r="2405" b="6605">feature</wd>

<space/>

<wd l="2453" t="6499" r="3274" b="6648">expresses</wd>

<space/>

<wd l="3326" t="6446" r="3859" b="6605">which</wd>

<space/>

<wd l="3902" t="6499" r="4512" b="6605">neuron</wd>

<space/>

<wd l="4550" t="6499" r="4882" b="6605">was</wd>

<space/>

<wd l="4939" t="6446" r="5251" b="6605">i-th</wd>

<space/>

<wd l="5299" t="6446" r="5803" b="6605">active</wd>

<space/>

</ln>

<ln l="1445" t="6715" r="5803" b="6917" baseLine="6869" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="6715" r="1757" b="6874">and</wd>

<space/>

<wd l="1819" t="6715" r="2525" b="6874">whether</wd>

<space/>

<wd l="2587" t="6715" r="2784" b="6874">its</wd>

<space/>

<wd l="2861" t="6715" r="3710" b="6874">activation</wd>

<space/>

<wd l="3773" t="6768" r="4099" b="6874">was</wd>

<space/>

<wd l="4171" t="6715" r="4699" b="6874">below</wd>

<space/>

<wd l="4771" t="6715" r="5083" b="6902">0.5,</wd>

<space/>

<wd l="5165" t="6768" r="5462" b="6917">e.g.</wd>

<space/>

<wd l="5539" t="6715" r="5803" b="6874">the</wd>

<space/>

</ln>

<ln l="1445" t="6989" r="5808" b="7147" baseLine="7138" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="6989" r="1781" b="7147">first</wd>

<space/>

<wd l="1829" t="6989" r="2434" b="7147">feature</wd>

<space/>

<wd l="2496" t="7013" r="2962" b="7147">states</wd>

<space/>

<wd l="3019" t="6989" r="3552" b="7147">which</wd>

<space/>

<wd l="3605" t="7042" r="4210" b="7147">neuron</wd>

<space/>

<wd l="4258" t="6989" r="4397" b="7147">is</wd>

<space/>

<wd l="4454" t="7013" r="4882" b="7147">most</wd>

<space/>

<wd l="4934" t="6989" r="5438" b="7147">active</wd>

<space/>

<wd l="5496" t="6989" r="5808" b="7147">and</wd>

<space/>

</ln>

<ln l="1440" t="7258" r="5803" b="7416" baseLine="7406" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="7258" r="2146" b="7416">whether</wd>

<space/>

<wd l="2198" t="7310" r="2381" b="7416">or</wd>

<space/>

<wd l="2424" t="7282" r="2707" b="7416">not</wd>

<space/>

<wd l="2755" t="7258" r="2952" b="7416">its</wd>

<space/>

<wd l="3014" t="7258" r="3859" b="7416">activation</wd>

<space/>

<wd l="3912" t="7258" r="4046" b="7416">is</wd>

<space/>

<wd l="4104" t="7258" r="4627" b="7416">below</wd>

<space/>

<wd l="4690" t="7258" r="5002" b="7416">0.5.</wd>

<space/>

<wd l="5078" t="7262" r="5309" b="7416">As</wd>

<space/>

<wd l="5371" t="7258" r="5803" b="7416">there</wd>

<space/>

</ln>

<ln l="1445" t="7531" r="5794" b="7733" baseLine="7680" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="7584" r="1704" b="7690">are</wd>

<space/>

<wd l="1786" t="7536" r="2112" b="7690">400</wd>

<space/>

<wd l="2194" t="7584" r="2875" b="7690">neurons</wd>

<space/>

<wd l="2971" t="7531" r="3278" b="7690">and</wd>

<space/>

<wd l="3365" t="7536" r="3466" b="7685">2</wd>

<space/>

<wd l="3547" t="7531" r="4262" b="7733">possible</wd>

<space/>

<wd l="4344" t="7531" r="5146" b="7690">binarised</wd>

<space/>

<wd l="5227" t="7531" r="5794" b="7690">activa-</wd>

</ln>

<ln l="1440" t="7762" r="4613" b="8002" baseLine="7945">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1440" t="7800" r="1906" b="7987">tions,</wd>

<space/>

<wd l="1973" t="7800" r="2410" b="7958">there</wd>

<space/>

<wd l="2467" t="7853" r="2731" b="7958">are</wd>

<space/>

<wd l="2794" t="7805" r="3110" b="7958">800</wd>

<space/>

<wd l="3168" t="7800" r="3883" b="8002">possible</wd>

<space/>

</run>

<wd l="3936" t="7762" r="4613" b="7958"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">values.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">5</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="8069" r="5808" b="10714" alignment="justified" fli="216" lsp="exactly" lspExact="269" language="en">

<ln l="1656" t="8069" r="5803" b="8270" baseLine="8222" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="8069" r="2026" b="8227">Edit</wd>

<space/>

<wd l="2102" t="8069" r="3000" b="8270">operations</wd>

<space/>

<wd l="3091" t="8122" r="3350" b="8227">are</wd>

<space/>

<wd l="3437" t="8069" r="4229" b="8227">extracted</wd>

<space/>

<wd l="4306" t="8069" r="4733" b="8227">from</wd>

<space/>

<wd l="4805" t="8069" r="5074" b="8227">the</wd>

<space/>

<wd l="5150" t="8069" r="5803" b="8270">parallel</wd>

<space/>

</ln>

<ln l="1440" t="8342" r="5803" b="8544" baseLine="8491" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8342" r="2117" b="8544">training</wd>

<space/>

<wd l="2174" t="8342" r="2539" b="8501">data</wd>

<space/>

<wd l="2597" t="8342" r="3418" b="8544">searching</wd>

<space/>

<wd l="3470" t="8342" r="3730" b="8501">for</wd>

<space/>

<wd l="3778" t="8342" r="4046" b="8501">the</wd>

<space/>

<wd l="4094" t="8342" r="4661" b="8501">lowest</wd>

<space/>

<wd l="4718" t="8342" r="5040" b="8501">edit</wd>

<space/>

<wd l="5098" t="8342" r="5803" b="8501">distance</wd>

<space/>

</ln>

<ln l="1445" t="8611" r="5798" b="8813" baseLine="8765" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="8611" r="1757" b="8770">and</wd>

<space/>

<wd l="1853" t="8611" r="2683" b="8813">recording</wd>

<space/>

<wd l="2784" t="8611" r="3048" b="8770">the</wd>

<space/>

<wd l="3149" t="8611" r="3475" b="8770">edit</wd>

<space/>

<wd l="3571" t="8611" r="4469" b="8813">operations</wd>

<space/>

<wd l="4570" t="8611" r="4958" b="8770">with</wd>

<space/>

<wd l="5059" t="8611" r="5798" b="8813">dynamic</wd>

<space/>

</ln>

<ln l="1440" t="8885" r="5794" b="9086" baseLine="9034" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8885" r="2669" b="9086">programming.</wd>

<space/>

<wd l="2798" t="8890" r="3086" b="9043">We</wd>

<space/>

<wd l="3163" t="8885" r="4027" b="9043">customise</wd>

<space/>

<wd l="4099" t="8885" r="4368" b="9043">the</wd>

<space/>

<wd l="4445" t="8885" r="4766" b="9043">edit</wd>

<space/>

<wd l="4843" t="8909" r="5266" b="9043">costs</wd>

<space/>

<wd l="5347" t="8885" r="5794" b="9043">func-</wd>

</ln>

<ln l="1440" t="9154" r="5794" b="9355" baseLine="9307" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9154" r="1781" b="9312">tion</wd>

<space/>

<wd l="1858" t="9178" r="2026" b="9312">to</wd>

<space/>

<wd l="2112" t="9154" r="2702" b="9355">always</wd>

<space/>

<wd l="2789" t="9178" r="3576" b="9355">postpone</wd>

<space/>

<wd l="3653" t="9154" r="4493" b="9312">insertions</wd>

<space/>

<wd l="4579" t="9178" r="4747" b="9312">to</wd>

<space/>

<wd l="4834" t="9154" r="5232" b="9312">after</wd>

<space/>

<wd l="5314" t="9154" r="5794" b="9312">delet-</wd>

</ln>

<ln l="1440" t="9427" r="5803" b="9629" baseLine="9576" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9427" r="1714" b="9629">ing</wd>

<space/>

<wd l="1790" t="9427" r="2659" b="9586">characters</wd>

<space/>

<wd l="2746" t="9480" r="2923" b="9586">so</wd>

<space/>

<wd l="2995" t="9427" r="3322" b="9586">that</wd>

<space/>

<wd l="3394" t="9427" r="3787" b="9586">each</wd>

<space/>

<wd l="3850" t="9427" r="4301" b="9629">input</wd>

<space/>

<wd l="4373" t="9427" r="5170" b="9586">character</wd>

<space/>

<wd l="5237" t="9480" r="5530" b="9586">can</wd>

<space/>

<wd l="5602" t="9427" r="5803" b="9586">be</wd>

<space/>

</ln>

<ln l="1445" t="9696" r="5808" b="9898" baseLine="9850" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="9696" r="2194" b="9898">assigned</wd>

<space/>

<wd l="2280" t="9696" r="2899" b="9898">exactly</wd>

<space/>

<wd l="2990" t="9749" r="3302" b="9854">one</wd>

<space/>

<wd l="3389" t="9696" r="3715" b="9854">edit</wd>

<space/>

<wd l="3802" t="9696" r="4622" b="9898">operation</wd>

<space/>

<wd l="4704" t="9696" r="5131" b="9854">from</wd>

<space/>

<wd l="5213" t="9696" r="5477" b="9854">the</wd>

<space/>

<wd l="5573" t="9720" r="5808" b="9854">set</wd>

<space/>

</ln>

<ln l="1454" t="9955" r="5803" b="10181" baseLine="10118">

<wd l="1454" t="9955" r="1762" b="10181"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-3">{</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">do</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="1834" t="9970" r="2544" b="10171">nothing,</wd>

<space/>

<wd l="2630" t="9970" r="3149" b="10128">delete</wd>

<space/>

<wd l="3221" t="9970" r="4051" b="10157">character,</wd>

<space/>

<wd l="4133" t="9970" r="4618" b="10128">insert</wd>

<space/>

<wd l="4694" t="9970" r="5179" b="10171">string</wd>

<space/>

<wd l="5246" t="9970" r="5803" b="10128">before</wd>

<space/>

</run>

</ln>

<ln l="1445" t="10224" r="5803" b="10450" baseLine="10387">

<wd l="1445" t="10224" r="2390" b="10450"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">character</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-3">}</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="2486" t="10243" r="2707" b="10397">To</wd>

<space/>

<wd l="2774" t="10262" r="3413" b="10440">capture</wd>

<space/>

<wd l="3470" t="10238" r="4310" b="10397">insertions</wd>

<space/>

<wd l="4382" t="10262" r="4541" b="10397">at</wd>

<space/>

<wd l="4598" t="10238" r="4862" b="10397">the</wd>

<space/>

<wd l="4930" t="10238" r="5242" b="10397">end</wd>

<space/>

<wd l="5304" t="10238" r="5491" b="10397">of</wd>

<space/>

<wd l="5539" t="10238" r="5803" b="10397">the</wd>

<space/>

</run>

</ln>

<ln l="1440" t="10512" r="5333" b="10714" baseLine="10661" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10536" r="1954" b="10699">tweet,</wd>

<space/>

<wd l="2021" t="10565" r="2275" b="10670">we</wd>

<space/>

<wd l="2338" t="10512" r="2962" b="10714">append</wd>

<space/>

<wd l="3019" t="10565" r="3115" b="10670">a</wd>

<space/>

<wd l="3168" t="10517" r="3749" b="10670">NULL</wd>

<space/>

<wd l="3802" t="10512" r="4176" b="10714">byte</wd>

<space/>

<wd l="4234" t="10536" r="4402" b="10670">to</wd>

<space/>

<wd l="4464" t="10512" r="4666" b="10670">all</wd>

<space/>

<wd l="4728" t="10536" r="5333" b="10670">tweets.</wd>

</ln>

</para>

<para l="1440" t="10781" r="5808" b="12878" alignment="justified" spaceBefore="1" spaceAfter="73" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="10781" r="5798" b="10982" baseLine="10930" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="10781" r="1997" b="10939">The</wd>

<space/>

<wd l="2088" t="10781" r="2597" b="10939">above</wd>

<space/>

<wd l="2698" t="10805" r="3192" b="10982">setup,</wd>

<space/>

<wd l="3298" t="10781" r="3984" b="10939">features</wd>

<space/>

<wd l="4085" t="10781" r="4397" b="10939">and</wd>

<space/>

<wd l="4488" t="10781" r="4810" b="10939">edit</wd>

<space/>

<wd l="4901" t="10781" r="5798" b="10982">operations</wd>

<space/>

</ln>

<ln l="1445" t="11050" r="5808" b="11251" baseLine="11203" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="11102" r="1704" b="11208">are</wd>

<space/>

<wd l="1766" t="11050" r="2515" b="11208">identical</wd>

<space/>

<wd l="2578" t="11074" r="2746" b="11208">to</wd>

<space/>

<wd l="2813" t="11050" r="3610" b="11251">Chrupała</wd>

<space/>

<wd l="3677" t="11054" r="4238" b="11246">(2014)</wd>

<space/>

<wd l="4306" t="11074" r="4474" b="11208">to</wd>

<space/>

<wd l="4536" t="11050" r="4800" b="11208">the</wd>

<space/>

<wd l="4862" t="11050" r="5218" b="11208">best</wd>

<space/>

<wd l="5280" t="11050" r="5467" b="11208">of</wd>

<space/>

<wd l="5520" t="11102" r="5808" b="11208">our</wd>

<space/>

</ln>

<ln l="1440" t="11323" r="5794" b="11525" baseLine="11472" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11323" r="2434" b="11525">knowledge.</wd>

<space/>

<wd l="2549" t="11328" r="2837" b="11482">We</wd>

<space/>

<wd l="2904" t="11323" r="3499" b="11482">further</wd>

<space/>

<wd l="3566" t="11323" r="3878" b="11482">add</wd>

<space/>

<wd l="3950" t="11376" r="4046" b="11482">a</wd>

<space/>

<wd l="4114" t="11323" r="4915" b="11482">character</wd>

<space/>

<wd l="4982" t="11323" r="5390" b="11482">class</wd>

<space/>

<wd l="5467" t="11323" r="5794" b="11482">fea-</wd>

</ln>

<ln l="1440" t="11578" r="5794" b="11803" baseLine="11746">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1440" t="11616" r="1781" b="11750">ture</wd>

<space/>

</run>

<wd l="1853" t="11578" r="2573" b="11803"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">{</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">NULL,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="2645" t="11592" r="3302" b="11779">control,</wd>

<space/>

<wd l="3384" t="11645" r="3902" b="11794">space,</wd>

<space/>

<wd l="3974" t="11592" r="4973" b="11794">apostrophe,</wd>

<space/>

<wd l="5040" t="11616" r="5794" b="11794">punctua-</wd>

</run>

</ln>

<ln l="1440" t="11866" r="5794" b="12067" baseLine="12014" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11866" r="1824" b="12053">tion,</wd>

<space/>

<wd l="1901" t="11866" r="2338" b="12067">digit,</wd>

<space/>

<wd l="2414" t="11890" r="2938" b="12067">quote,</wd>

<space/>

<wd l="3005" t="11866" r="3691" b="12053">bracket,</wd>

<space/>

<wd l="3763" t="11866" r="4627" b="12024">lowercase</wd>

<space/>

<wd l="4685" t="11866" r="5170" b="12053">letter,</wd>

<space/>

<wd l="5242" t="11918" r="5794" b="12067">upper-</wd>

</ln>

<ln l="1445" t="12120" r="5794" b="12346" baseLine="12288">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="12187" r="1814" b="12293">case</wd>

<space/>

<wd l="1886" t="12134" r="2366" b="12322">letter,</wd>

<space/>

<wd l="2453" t="12139" r="3466" b="12322">non-ASCII,</wd>

<space/>

</run>

<wd l="3547" t="12120" r="4090" b="12346"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">other</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">}</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="4176" t="12134" r="4488" b="12293">and</wd>

<space/>

<wd l="4560" t="12187" r="4656" b="12293">a</wd>

<space/>

<wd l="4718" t="12134" r="5323" b="12293">feature</wd>

<space/>

<wd l="5395" t="12134" r="5794" b="12293">indi-</wd>

</run>

</ln>

<ln l="1445" t="12408" r="5808" b="12610" baseLine="12557" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12408" r="1968" b="12610">cating</wd>

<space/>

<wd l="2026" t="12408" r="2736" b="12566">whether</wd>

<space/>

<wd l="2784" t="12408" r="3053" b="12566">the</wd>

<space/>

<wd l="3110" t="12408" r="3912" b="12566">character</wd>

<space/>

<wd l="3960" t="12408" r="4099" b="12566">is</wd>

<space/>

<wd l="4162" t="12437" r="4502" b="12610">part</wd>

<space/>

<wd l="4560" t="12408" r="4747" b="12566">of</wd>

<space/>

<wd l="4795" t="12461" r="4891" b="12566">a</wd>

<space/>

<wd l="4939" t="12408" r="5424" b="12566">token</wd>

<space/>

<wd l="5477" t="12408" r="5808" b="12566">that</wd>

<space/>

</ln>

<ln l="1440" t="12677" r="5808" b="12878" baseLine="12830" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="12677" r="1579" b="12835">is</wd>

<space/>

<wd l="1651" t="12677" r="2299" b="12878">eligible</wd>

<space/>

<wd l="2362" t="12677" r="2621" b="12835">for</wd>

<space/>

<wd l="2683" t="12677" r="3278" b="12878">editing</wd>

<space/>

<wd l="3350" t="12677" r="4200" b="12878">according</wd>

<space/>

<wd l="4267" t="12701" r="4430" b="12835">to</wd>

<space/>

<wd l="4498" t="12677" r="4762" b="12835">the</wd>

<space/>

<wd l="4834" t="12677" r="5395" b="12835">shared</wd>

<space/>

<wd l="5453" t="12677" r="5808" b="12835">task</wd>

</ln>

</para>

<rulerline l="1440" t="12979" r="2640" b="12979" type="single" width="10" color="000000"/>

<para l="1694" t="13037" r="5736" b="13445" alignment="left" li="216" ri="72" spaceBefore="37" lsp="exactly" lspExact="218" language="en">

<ln l="1704" t="13037" r="5736" b="13229" baseLine="13188">

<wd l="1704" t="13037" r="5736" b="13229"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-1">1</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1">https://bitbucket.org/gchrupala/elman</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1"><space/>

</run>

</ln>

<ln l="1694" t="13253" r="3576" b="13445" baseLine="13406">

<wd l="1694" t="13253" r="3576" b="13445"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-1">2</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1">http://rnnlm.org/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1699" t="13474" r="5189" b="13661" alignment="left" li="216" spaceBefore="19" lsp="exactly" lspExact="199" language="en">

<ln l="1699" t="13474" r="5189" b="13661" baseLine="13624">

<wd l="1699" t="13474" r="5189" b="13661"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">3</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">https://bitbucket.org/gchrupala/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1454" t="13709" r="3480" b="13843" alignment="left" spaceBefore="15" lsp="exactly" lspExact="180" language="en">

<ln l="1454" t="13709" r="3480" b="13843" baseLine="13824" underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1">

<wd l="1454" t="13709" r="3480" b="13843">codeswitch/overview</wd>

</ln>

</para>

<para l="1440" t="13886" r="5798" b="14486" alignment="justified" spaceBefore="39" fli="216" lsp="exactly" lspExact="198" language="en">

<ln l="1694" t="13886" r="5798" b="14088" baseLine="14043">

<wd l="1694" t="13886" r="2150" b="14050"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">4</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">More</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2203" t="13920" r="2880" b="14088">precisely,</wd>

<space/>

<wd l="2942" t="13958" r="3149" b="14050">we</wd>

<space/>

<wd l="3206" t="13958" r="3734" b="14088">process</wd>

<space/>

<wd l="3797" t="13920" r="4277" b="14050">UTF-8</wd>

<space/>

<wd l="4339" t="13920" r="4752" b="14088">bytes.</wd>

<space/>

<wd l="4843" t="13925" r="5093" b="14050">For</wd>

<space/>

<wd l="5146" t="13920" r="5362" b="14050">the</wd>

<space/>

<wd l="5419" t="13920" r="5798" b="14050">train-</wd>

</run>

</ln>

<ln l="1440" t="14122" r="5798" b="14290" baseLine="14242" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14122" r="1666" b="14290">ing</wd>

<space/>

<wd l="1714" t="14122" r="2050" b="14275">data,</wd>

<space/>

<wd l="2098" t="14122" r="2347" b="14251">this</wd>

<space/>

<wd l="2395" t="14122" r="2510" b="14251">is</wd>

<space/>

<wd l="2558" t="14122" r="2774" b="14251">the</wd>

<space/>

<wd l="2822" t="14160" r="3182" b="14251">same</wd>

<space/>

<wd l="3230" t="14160" r="3370" b="14251">as</wd>

<space/>

<wd l="3418" t="14122" r="4138" b="14251">characters</wd>

<space/>

<wd l="4190" t="14160" r="4330" b="14251">as</wd>

<space/>

<wd l="4378" t="14122" r="4594" b="14251">the</wd>

<space/>

<wd l="4637" t="14122" r="5194" b="14290">training</wd>

<space/>

<wd l="5242" t="14141" r="5438" b="14251">set</wd>

<space/>

<wd l="5482" t="14122" r="5798" b="14251">does</wd>

<space/>

</ln>

<ln l="1440" t="14318" r="4675" b="14486" baseLine="14443" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14338" r="1670" b="14448">not</wd>

<space/>

<wd l="1714" t="14318" r="2242" b="14448">contain</wd>

<space/>

<wd l="2290" t="14357" r="2539" b="14486">any</wd>

<space/>

<wd l="2587" t="14318" r="3331" b="14486">multi-byte</wd>

<space/>

<wd l="3379" t="14318" r="3859" b="14448">UTF-8</wd>

<space/>

<wd l="3912" t="14318" r="4675" b="14448">characters.</wd>

</ln>

</para>

<para l="1440" t="14501" r="5803" b="15293" alignment="justified" spaceBefore="24" fli="216" lsp="exactly" lspExact="197" language="en">

<ln l="1694" t="14501" r="5803" b="14707" baseLine="14657">

<wd l="1694" t="14501" r="2189" b="14669"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">5</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">These</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2270" t="14544" r="2976" b="14669">RNN-LM</wd>

<space/>

<wd l="3053" t="14539" r="3542" b="14669">hidden</wd>

<space/>

<wd l="3619" t="14539" r="3979" b="14707">layer</wd>

<space/>

<wd l="4056" t="14539" r="4752" b="14669">activation</wd>

<space/>

<wd l="4829" t="14539" r="5390" b="14669">features</wd>

<space/>

<wd l="5472" t="14539" r="5803" b="14669">have</wd>

<space/>

</run>

</ln>

<ln l="1440" t="14736" r="5803" b="14904" baseLine="14861" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14736" r="1781" b="14866">been</wd>

<space/>

<wd l="1843" t="14736" r="2170" b="14866">used</wd>

<space/>

<wd l="2237" t="14736" r="3106" b="14904">successfully</wd>

<space/>

<wd l="3168" t="14736" r="3312" b="14861">in</wd>

<space/>

<wd l="3374" t="14755" r="3643" b="14866">text</wd>

<space/>

<wd l="3706" t="14736" r="4656" b="14904">segmentation</wd>

<space/>

<wd l="4723" t="14736" r="4978" b="14866">and</wd>

<space/>

<wd l="5035" t="14736" r="5803" b="14866">word-level</wd>

<space/>

</ln>

<ln l="1440" t="14938" r="5798" b="15106" baseLine="15058" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14938" r="2083" b="15106">language</wd>

<space/>

<wd l="2194" t="14938" r="3144" b="15067">identification</wd>

<space/>

<wd l="3250" t="14938" r="4003" b="15106">(Chrupała,</wd>

<space/>

<wd l="4138" t="14938" r="4531" b="15091">2013;</wd>

<space/>

<wd l="4675" t="14942" r="5242" b="15067">Barman</wd>

<space/>

<wd l="5352" t="14957" r="5482" b="15067">et</wd>

<space/>

<wd l="5592" t="14938" r="5798" b="15091">al.,</wd>

<space/>

</ln>

<ln l="1445" t="15134" r="1891" b="15293" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="15134" r="1891" b="15293">2014).</wd>

</ln>

</para>

</column>

<column l="6139" t="1260" r="10521" b="15310">

<para l="6144" t="1320" r="10512" b="2064" alignment="justified" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="1320" r="10502" b="1507" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1320" r="6614" b="1507">rules,</wd>

<space/>

<wd l="6715" t="1320" r="6974" b="1478">i.e.</wd>

<space/>

<wd l="7070" t="1320" r="7776" b="1478">whether</wd>

<space/>

<wd l="7862" t="1373" r="8040" b="1478">or</wd>

<space/>

<wd l="8122" t="1344" r="8405" b="1478">not</wd>

<space/>

<wd l="8486" t="1320" r="8755" b="1478">the</wd>

<space/>

<wd l="8842" t="1320" r="9715" b="1478">characters</wd>

<space/>

<wd l="9811" t="1373" r="10502" b="1478">encoun-</wd>

</ln>

<ln l="6144" t="1594" r="10512" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1594" r="6581" b="1752">tered</wd>

<space/>

<wd l="6648" t="1594" r="7085" b="1752">since</wd>

<space/>

<wd l="7142" t="1594" r="7406" b="1752">the</wd>

<space/>

<wd l="7464" t="1594" r="7771" b="1752">last</wd>

<space/>

<wd l="7834" t="1646" r="8309" b="1795">space</wd>

<space/>

<wd l="8371" t="1646" r="8549" b="1752">or</wd>

<space/>

<wd l="8611" t="1618" r="8981" b="1752">start</wd>

<space/>

<wd l="9038" t="1594" r="9230" b="1752">of</wd>

<space/>

<wd l="9274" t="1618" r="9744" b="1752">tweet</wd>

<space/>

<wd l="9806" t="1594" r="10186" b="1795">only</wd>

<space/>

<wd l="10248" t="1646" r="10512" b="1752">are</wd>

<space/>

</ln>

<ln l="6144" t="1862" r="9461" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1862" r="6720" b="2050">letters,</wd>

<space/>

<wd l="6792" t="1862" r="7315" b="2064">digits,</wd>

<space/>

<wd l="7387" t="1862" r="8414" b="2064">apostrophes</wd>

<space/>

<wd l="8482" t="1862" r="8794" b="2021">and</wd>

<space/>

<wd l="8856" t="1915" r="9461" b="2064">spaces.</wd>

</ln>

</para>

<para l="6144" t="2333" r="8443" b="2534" alignment="left" spaceBefore="217" lsp="exactly" lspExact="251" language="en">

<ln l="6144" t="2333" r="8443" b="2534" baseLine="2482" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">

<wd l="6144" t="2333" r="6413" b="2491">2.3</wd>

<space/>

<wd l="6643" t="2333" r="7507" b="2534">Sequence</wd>

<space/>

<wd l="7565" t="2333" r="8443" b="2534">Labelling</wd>

</ln>

</para>

<para l="6144" t="2693" r="10512" b="6643" alignment="justified" spaceBefore="85" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="2693" r="10507" b="2894" baseLine="2842">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="2698" r="6451" b="2851">For</wd>

<space/>

<wd l="6518" t="2693" r="7795" b="2851">character-level</wd>

<space/>

<wd l="7877" t="2746" r="8664" b="2894">sequence</wd>

<space/>

<wd l="8731" t="2693" r="9538" b="2894">labelling,</wd>

<space/>

<wd l="9624" t="2746" r="9878" b="2851">we</wd>

<space/>

<wd l="9946" t="2717" r="10186" b="2894">try</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><wd l="10262" t="2698" r="10507" b="2890">(a)</wd>

<space/>

</run>

</ln>

<ln l="6149" t="2928" r="10502" b="3163" baseLine="3106">

<wd l="6149" t="2928" r="6840" b="3163"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Sequor</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">6</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="6931" t="2962" r="7795" b="3163">(Chrupała</wd>

<space/>

<wd l="7862" t="2962" r="8174" b="3120">and</wd>

<space/>

<wd l="8246" t="2962" r="8952" b="3149">Klakow,</wd>

<space/>

<wd l="9038" t="2966" r="9586" b="3158">2010),</wd>

<space/>

<wd l="9672" t="3014" r="9869" b="3120">an</wd>

<space/>

<wd l="9941" t="2962" r="10502" b="3163">imple-</wd>

</run>

</ln>

<ln l="6144" t="3230" r="10498" b="3432" baseLine="3384" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="3230" r="7018" b="3389">mentation</wd>

<space/>

<wd l="7094" t="3230" r="7286" b="3389">of</wd>

<space/>

<wd l="7344" t="3230" r="7608" b="3389">the</wd>

<space/>

<wd l="7690" t="3230" r="8678" b="3432">generalised</wd>

<space/>

<wd l="8750" t="3254" r="9682" b="3432">perceptron</wd>

<space/>

<wd l="9763" t="3230" r="10498" b="3427">(Collins,</wd>

<space/>

</ln>

<ln l="6149" t="3466" r="10493" b="3706" baseLine="3646">

<wd l="6149" t="3470" r="6782" b="3701"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">2002),</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">7</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="6984" t="3504" r="7373" b="3662">with</wd>

<space/>

<wd l="7555" t="3509" r="7742" b="3662">10</wd>

<space/>

<wd l="7906" t="3504" r="8760" b="3691">iterations,</wd>

<space/>

<wd l="8962" t="3504" r="9274" b="3662">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><wd l="9437" t="3504" r="9682" b="3701">(b)</wd>

<space/>

</run>

<wd l="9845" t="3466" r="10493" b="3706"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Wapiti</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">8</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

</ln>

<ln l="6154" t="3773" r="10502" b="3974" baseLine="3926" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="3778" r="7032" b="3974">(Lavergne</wd>

<space/>

<wd l="7114" t="3797" r="7267" b="3931">et</wd>

<space/>

<wd l="7344" t="3773" r="7594" b="3960">al.,</wd>

<space/>

<wd l="7694" t="3778" r="8333" b="3970">2010)’s</wd>

<space/>

<wd l="8419" t="3773" r="9792" b="3974">implementation</wd>

<space/>

<wd l="9869" t="3773" r="10061" b="3931">of</wd>

<space/>

<wd l="10128" t="3826" r="10502" b="3931">con-</wd>

</ln>

<ln l="6149" t="4046" r="10507" b="4248" baseLine="4195" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="4046" r="6811" b="4205">ditional</wd>

<space/>

<wd l="6864" t="4046" r="7536" b="4205">random</wd>

<space/>

<wd l="7589" t="4046" r="8050" b="4205">fields</wd>

<space/>

<wd l="8122" t="4046" r="8890" b="4248">(Lafferty</wd>

<space/>

<wd l="8952" t="4070" r="9106" b="4205">et</wd>

<space/>

<wd l="9163" t="4046" r="9413" b="4234">al.,</wd>

<space/>

<wd l="9480" t="4051" r="9974" b="4243">2001)</wd>

<space/>

<wd l="10037" t="4046" r="10507" b="4248">using</wd>

<space/>

</ln>

<ln l="6144" t="4315" r="10502" b="4517" baseLine="4469" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4315" r="6648" b="4517">l-bfgs</wd>

<space/>

<wd l="6720" t="4315" r="7805" b="4517">optimisation</wd>

<space/>

<wd l="7867" t="4315" r="8256" b="4474">with</wd>

<space/>

<wd l="8318" t="4368" r="8414" b="4474">a</wd>

<space/>

<wd l="8472" t="4315" r="9072" b="4517">history</wd>

<space/>

<wd l="9139" t="4315" r="9331" b="4474">of</wd>

<space/>

<wd l="9384" t="4315" r="9475" b="4474">5</wd>

<space/>

<wd l="9557" t="4339" r="10027" b="4517">steps,</wd>

<space/>

<wd l="10104" t="4315" r="10502" b="4474">elas-</wd>

</ln>

<ln l="6144" t="4589" r="10502" b="4790" baseLine="4740">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="4589" r="6360" b="4747">tic</wd>

<space/>

<wd l="6413" t="4613" r="6677" b="4747">net</wd>

<space/>

<wd l="6725" t="4589" r="7920" b="4790">regularisation</wd>

<space/>

</run>

<wd l="7978" t="4594" r="8222" b="4790"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">(p</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="8318" t="4661" r="8467" b="4714">=</wd>

<space/>

<wd l="8544" t="4594" r="9024" b="4747">0.333</wd>

<space/>

<wd l="9086" t="4589" r="9398" b="4747">and</wd>

<space/>

</run>

<wd l="9446" t="4642" r="9634" b="4790"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">p</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="9720" t="4661" r="9869" b="4714">=</wd>

<space/>

<wd l="9946" t="4594" r="10502" b="4786">0.001)</wd>

<space/>

</run>

</ln>

<ln l="6149" t="4858" r="10512" b="5016" baseLine="5011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="4858" r="6461" b="5016">and</wd>

<space/>

<wd l="6518" t="4910" r="6734" b="5016">no</wd>

<space/>

<wd l="6797" t="4858" r="7186" b="5016">hard</wd>

<space/>

<wd l="7243" t="4858" r="7656" b="5016">limit</wd>

<space/>

<wd l="7718" t="4910" r="7934" b="5016">on</wd>

<space/>

<wd l="7987" t="4858" r="8256" b="5016">the</wd>

<space/>

<wd l="8314" t="4858" r="8986" b="5016">number</wd>

<space/>

<wd l="9043" t="4858" r="9235" b="5016">of</wd>

<space/>

<wd l="9278" t="4858" r="10133" b="5016">iterations.</wd>

<space/>

<wd l="10224" t="4862" r="10512" b="5016">We</wd>

<space/>

</ln>

<ln l="6149" t="5093" r="10498" b="5333" baseLine="5276">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="5131" r="6725" b="5290">extend</wd>

<space/>

<wd l="6797" t="5131" r="7061" b="5290">the</wd>

<space/>

<wd l="7133" t="5131" r="7738" b="5290">feature</wd>

<space/>

<wd l="7810" t="5131" r="8635" b="5333">templates</wd>

<space/>

<wd l="8722" t="5131" r="8914" b="5290">of</wd>

<space/>

<wd l="8976" t="5131" r="9773" b="5333">Chrupała</wd>

<space/>

</run>

<wd l="9850" t="5093" r="10498" b="5328"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">(2014)</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">9</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

</ln>

<ln l="6144" t="5400" r="10502" b="5602" baseLine="5549" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5400" r="6360" b="5602">by</wd>

<space/>

<wd l="6413" t="5400" r="7234" b="5602">including</wd>

<space/>

<wd l="7286" t="5453" r="7579" b="5558">our</wd>

<space/>

<wd l="7627" t="5400" r="8491" b="5558">additional</wd>

<space/>

<wd l="8539" t="5424" r="8861" b="5558">two</wd>

<space/>

<wd l="8914" t="5400" r="9648" b="5558">features.</wd>

<space/>

<wd l="9725" t="5400" r="10061" b="5558">The</wd>

<space/>

<wd l="10109" t="5424" r="10502" b="5558">tem-</wd>

</ln>

<ln l="6144" t="5674" r="10502" b="5875" baseLine="5822" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5674" r="6571" b="5875">plate</wd>

<space/>

<wd l="6629" t="5698" r="7440" b="5875">generates</wd>

<space/>

<wd l="7498" t="5674" r="8270" b="5875">unigram,</wd>

<space/>

<wd l="8333" t="5674" r="8957" b="5875">bigram</wd>

<space/>

<wd l="9010" t="5674" r="9322" b="5832">and</wd>

<space/>

<wd l="9374" t="5674" r="10018" b="5875">trigram</wd>

<space/>

<wd l="10070" t="5674" r="10502" b="5832">char-</wd>

</ln>

<ln l="6149" t="5942" r="10502" b="6101" baseLine="6091" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="5966" r="6576" b="6101">acter</wd>

<space/>

<wd l="6634" t="5942" r="7315" b="6101">features</wd>

<space/>

<wd l="7387" t="5942" r="7944" b="6101">within</wd>

<space/>

<wd l="8011" t="5995" r="8107" b="6101">a</wd>

<space/>

<wd l="8174" t="5947" r="8414" b="6101">+/-</wd>

<space/>

<wd l="8491" t="5947" r="8592" b="6096">2</wd>

<space/>

<wd l="8659" t="5942" r="9384" b="6101">window.</wd>

<space/>

<wd l="9490" t="5942" r="9768" b="6096">All</wd>

<space/>

<wd l="9830" t="5942" r="10502" b="6101">remain-</wd>

</ln>

<ln l="6144" t="6211" r="10502" b="6413" baseLine="6365" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6211" r="6422" b="6413">ing</wd>

<space/>

<wd l="6499" t="6211" r="7181" b="6370">features</wd>

<space/>

<wd l="7267" t="6264" r="7526" b="6370">are</wd>

<space/>

<wd l="7603" t="6211" r="8357" b="6370">included</wd>

<space/>

<wd l="8434" t="6264" r="8602" b="6370">as</wd>

<space/>

<wd l="8683" t="6211" r="9485" b="6413">unigrams</wd>

<space/>

<wd l="9571" t="6211" r="9763" b="6370">of</wd>

<space/>

<wd l="9826" t="6211" r="10090" b="6370">the</wd>

<space/>

<wd l="10171" t="6264" r="10502" b="6370">cur-</wd>

</ln>

<ln l="6144" t="6485" r="7051" b="6643" baseLine="6634" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6509" r="6485" b="6643">rent</wd>

<space/>

<wd l="6538" t="6485" r="7051" b="6643">value.</wd>

</ln>

</para>

<para l="6144" t="6758" r="10512" b="8587" alignment="justified" spaceBefore="34" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="6758" r="10498" b="6955" baseLine="6912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="6763" r="6725" b="6917">Due</wd>

<space/>

<wd l="6797" t="6782" r="6960" b="6917">to</wd>

<space/>

<wd l="7032" t="6758" r="7301" b="6917">the</wd>

<space/>

<wd l="7368" t="6758" r="7925" b="6917">nested</wd>

<space/>

<wd l="7997" t="6758" r="9384" b="6917">cross-validation</wd>

<space/>

<wd l="9461" t="6763" r="9802" b="6955">(see</wd>

<space/>

<wd l="9874" t="6758" r="10498" b="6955">above),</wd>

<space/>

</ln>

<ln l="6149" t="6994" r="10507" b="7234" baseLine="7179">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="7037" r="6768" b="7234">Sequor</wd>

<space/>

<wd l="6854" t="7032" r="6994" b="7190">is</wd>

<space/>

<wd l="7094" t="7032" r="7699" b="7190">trained</wd>

<space/>

<wd l="7795" t="7085" r="8011" b="7190">on</wd>

<space/>

<wd l="8102" t="7032" r="8491" b="7190">64%</wd>

<space/>

</run>

<wd l="8602" t="6994" r="9101" b="7229"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(0.8</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9206" t="7032" r="9398" b="7190">of</wd>

<space/>

<wd l="9475" t="7032" r="9739" b="7190">the</wd>

<space/>

<wd l="9830" t="7032" r="10507" b="7234">training</wd>

<space/>

</run>

</ln>

<ln l="6149" t="7301" r="10512" b="7502" baseLine="7454">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="7301" r="6552" b="7488">data,</wd>

<space/>

<wd l="6658" t="7301" r="7022" b="7459">16%</wd>

<space/>

<wd l="7109" t="7306" r="7445" b="7498">(0.8</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="7536" t="7344" r="7646" b="7454">x</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7742" t="7306" r="8078" b="7498">0.2)</wd>

<space/>

<wd l="8155" t="7301" r="8294" b="7459">is</wd>

<space/>

<wd l="8366" t="7301" r="8770" b="7459">used</wd>

<space/>

<wd l="8842" t="7354" r="9010" b="7459">as</wd>

<space/>

<wd l="9086" t="7301" r="10205" b="7502">development</wd>

<space/>

<wd l="10277" t="7325" r="10512" b="7459">set</wd>

<space/>

</run>

</ln>

<ln l="6149" t="7574" r="10507" b="7776" baseLine="7723" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="7574" r="6461" b="7733">and</wd>

<space/>

<wd l="6518" t="7579" r="6902" b="7733">20%</wd>

<space/>

<wd l="6970" t="7574" r="7378" b="7771">(1/5)</wd>

<space/>

<wd l="7435" t="7574" r="7694" b="7733">for</wd>

<space/>

<wd l="7742" t="7574" r="8366" b="7776">testing.</wd>

<space/>

<wd l="8443" t="7579" r="8750" b="7733">For</wd>

<space/>

<wd l="8794" t="7574" r="9413" b="7776">Wapiti,</wd>

<space/>

<wd l="9475" t="7627" r="9730" b="7733">we</wd>

<space/>

<wd l="9782" t="7627" r="10070" b="7733">use</wd>

<space/>

<wd l="10128" t="7574" r="10507" b="7776">only</wd>

<space/>

</ln>

<ln l="6168" t="7843" r="10502" b="8045" baseLine="7997" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6168" t="7843" r="6538" b="8002">16%</wd>

<space/>

<wd l="6614" t="7843" r="6874" b="8002">for</wd>

<space/>

<wd l="6941" t="7843" r="7618" b="8045">training</wd>

<space/>

<wd l="7699" t="7843" r="8078" b="8040">(and</wd>

<space/>

<wd l="8146" t="7843" r="8414" b="8002">the</wd>

<space/>

<wd l="8482" t="7843" r="9365" b="8045">remaining</wd>

<space/>

<wd l="9442" t="7843" r="9830" b="8002">64%</wd>

<space/>

<wd l="9907" t="7843" r="10166" b="8002">for</wd>

<space/>

<wd l="10238" t="7843" r="10502" b="8002">de-</wd>

</ln>

<ln l="6144" t="8117" r="10507" b="8318" baseLine="8266" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8117" r="7066" b="8318">velopment</wd>

<space/>

<wd l="7123" t="8122" r="7416" b="8314">set)</wd>

<space/>

<wd l="7474" t="8117" r="7646" b="8270">in</wd>

<space/>

<wd l="7699" t="8117" r="8093" b="8275">each</wd>

<space/>

<wd l="8146" t="8117" r="9533" b="8275">cross-validation</wd>

<space/>

<wd l="9576" t="8117" r="9931" b="8275">fold</wd>

<space/>

<wd l="9984" t="8117" r="10291" b="8275">due</wd>

<space/>

<wd l="10339" t="8141" r="10507" b="8275">to</wd>

<space/>

</ln>

<ln l="6144" t="8314" r="8083" b="8587" baseLine="8527">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="8438" r="6869" b="8587">memory</wd>

<space/>

</run>

<wd l="6931" t="8352" r="8083" b="8544"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">constraints.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">10</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="8851" r="8798" b="9053" alignment="left" spaceBefore="191" lsp="exactly" lspExact="251" language="en">

<ln l="6144" t="8851" r="8798" b="9053" baseLine="9005" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">

<wd l="6144" t="8851" r="6413" b="9010">2.4</wd>

<space/>

<wd l="6643" t="8851" r="7690" b="9053">Generating</wd>

<space/>

<wd l="7757" t="8851" r="8798" b="9010">Candidates</wd>

</ln>

</para>

<para l="6144" t="9211" r="10512" b="12125" alignment="justified" spaceBefore="84" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="9211" r="10512" b="9413" baseLine="9365" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9216" r="6432" b="9370">We</wd>

<space/>

<wd l="6542" t="9211" r="7248" b="9413">produce</wd>

<space/>

<wd l="7363" t="9211" r="8194" b="9370">candidate</wd>

<space/>

<wd l="8309" t="9211" r="9586" b="9370">normalisations</wd>

<space/>

<wd l="9706" t="9211" r="10133" b="9370">from</wd>

<space/>

<wd l="10243" t="9211" r="10512" b="9370">the</wd>

<space/>

</ln>

<ln l="6149" t="9485" r="10498" b="9686" baseLine="9634" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="9485" r="6475" b="9643">edit</wd>

<space/>

<wd l="6552" t="9485" r="7450" b="9686">operations</wd>

<space/>

<wd l="7531" t="9485" r="8333" b="9686">proposed</wd>

<space/>

<wd l="8405" t="9485" r="8621" b="9686">by</wd>

<space/>

<wd l="8698" t="9485" r="8962" b="9643">the</wd>

<space/>

<wd l="9048" t="9538" r="9835" b="9686">sequence</wd>

<space/>

<wd l="9912" t="9485" r="10498" b="9643">model.</wd>

<space/>

</ln>

<ln l="6144" t="9754" r="10502" b="9955" baseLine="9907" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9758" r="6965" b="9941">However,</wd>

<space/>

<wd l="7032" t="9754" r="7181" b="9907">if</wd>

<space/>

<wd l="7224" t="9806" r="7478" b="9912">we</wd>

<space/>

<wd l="7536" t="9754" r="8222" b="9912">allowed</wd>

<space/>

<wd l="8280" t="9754" r="8674" b="9912">each</wd>

<space/>

<wd l="8731" t="9754" r="9216" b="9912">insert</wd>

<space/>

<wd l="9278" t="9754" r="9590" b="9912">and</wd>

<space/>

<wd l="9648" t="9754" r="10162" b="9912">delete</wd>

<space/>

<wd l="10224" t="9806" r="10502" b="9955">op-</wd>

</ln>

<ln l="6149" t="10027" r="10502" b="10229" baseLine="10176" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="10027" r="6754" b="10186">eration</wd>

<space/>

<wd l="6811" t="10051" r="6974" b="10186">to</wd>

<space/>

<wd l="7042" t="10027" r="7243" b="10186">be</wd>

<space/>

<wd l="7310" t="10027" r="7805" b="10186">either</wd>

<space/>

<wd l="7862" t="10027" r="8539" b="10186">realised</wd>

<space/>

<wd l="8602" t="10080" r="8784" b="10186">or</wd>

<space/>

<wd l="8837" t="10051" r="9158" b="10214">not,</wd>

<space/>

<wd l="9230" t="10080" r="9485" b="10186">we</wd>

<space/>

<wd l="9547" t="10027" r="10090" b="10186">would</wd>

<space/>

<wd l="10147" t="10080" r="10502" b="10229">pro-</wd>

</ln>

<ln l="6149" t="10262" r="10502" b="10498" baseLine="10446">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="10296" r="6557" b="10454">duce</wd>

<space/>

<wd l="6638" t="10349" r="6850" b="10498">up</wd>

<space/>

<wd l="6931" t="10320" r="7099" b="10454">to</wd>

<space/>

</run>

<wd l="7190" t="10262" r="7440" b="10450"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">2</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">N</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="7536" t="10296" r="8496" b="10483">candidates,</wd>

<space/>

<wd l="8592" t="10296" r="9125" b="10454">where</wd>

<space/>

<wd l="9206" t="10296" r="9398" b="10450">N</wd>

<space/>

<wd l="9480" t="10296" r="9619" b="10454">is</wd>

<space/>

<wd l="9706" t="10296" r="9970" b="10454">the</wd>

<space/>

<wd l="10051" t="10349" r="10502" b="10454">num-</wd>

</run>

</ln>

<ln l="6144" t="10570" r="10512" b="10771" baseLine="10718" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10570" r="6427" b="10728">ber</wd>

<space/>

<wd l="6490" t="10570" r="6682" b="10728">of</wd>

<space/>

<wd l="6734" t="10570" r="7056" b="10728">edit</wd>

<space/>

<wd l="7118" t="10570" r="8069" b="10771">operations.</wd>

<space/>

<wd l="8165" t="10570" r="8592" b="10728">With</wd>

<space/>

<wd l="8659" t="10570" r="8851" b="10723">N</wd>

<space/>

<wd l="8933" t="10642" r="9082" b="10694">=</wd>

<space/>

<wd l="9182" t="10574" r="9485" b="10728">140</wd>

<space/>

<wd l="9562" t="10570" r="10512" b="10766">(maximum</wd>

<space/>

</ln>

<ln l="6144" t="10838" r="10502" b="11040" baseLine="10987" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10838" r="6768" b="11040">lengths</wd>

<space/>

<wd l="6869" t="10838" r="7061" b="10997">of</wd>

<space/>

<wd l="7138" t="10891" r="7234" b="10997">a</wd>

<space/>

<wd l="7315" t="10843" r="7906" b="11035">tweet),</wd>

<space/>

<wd l="8011" t="10838" r="8770" b="11040">handling</wd>

<space/>

<wd l="8861" t="10838" r="9307" b="10997">these</wd>

<space/>

<wd l="9398" t="10891" r="9874" b="11040">many</wd>

<space/>

<wd l="9970" t="10838" r="10502" b="10997">candi-</wd>

</ln>

<ln l="6149" t="11112" r="10512" b="11314" baseLine="11261" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="11112" r="6586" b="11270">dates</wd>

<space/>

<wd l="6658" t="11112" r="6797" b="11270">is</wd>

<space/>

<wd l="6869" t="11136" r="7147" b="11270">not</wd>

<space/>

<wd l="7210" t="11112" r="7934" b="11270">feasible.</wd>

<space/>

<wd l="8040" t="11112" r="8712" b="11299">Instead,</wd>

<space/>

<wd l="8794" t="11165" r="9043" b="11270">we</wd>

<space/>

<wd l="9110" t="11112" r="10066" b="11314">recursively</wd>

<space/>

<wd l="10142" t="11112" r="10512" b="11314">split</wd>

<space/>

</ln>

<ln l="6144" t="11381" r="10512" b="11582" baseLine="11530" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="11381" r="6413" b="11539">the</wd>

<space/>

<wd l="6504" t="11434" r="7296" b="11582">sequence</wd>

<space/>

<wd l="7382" t="11381" r="7574" b="11539">of</wd>

<space/>

<wd l="7651" t="11381" r="7973" b="11539">edit</wd>

<space/>

<wd l="8059" t="11381" r="8957" b="11582">operations</wd>

<space/>

<wd l="9048" t="11381" r="9859" b="11582">produced</wd>

<space/>

<wd l="9941" t="11381" r="10157" b="11582">by</wd>

<space/>

<wd l="10243" t="11381" r="10512" b="11539">the</wd>

<space/>

</ln>

<ln l="6154" t="11650" r="10512" b="11851" baseLine="11803" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="11702" r="6946" b="11851">sequence</wd>

<space/>

<wd l="6998" t="11650" r="7656" b="11808">labeller</wd>

<space/>

<wd l="7704" t="11650" r="8040" b="11808">into</wd>

<space/>

<wd l="8093" t="11702" r="8309" b="11851">up</wd>

<space/>

<wd l="8362" t="11674" r="8530" b="11808">to</wd>

<space/>

<wd l="8587" t="11650" r="9024" b="11851">eight</wd>

<space/>

<wd l="9082" t="11650" r="9816" b="11808">sections.</wd>

<space/>

<wd l="9898" t="11654" r="10118" b="11808">To</wd>

<space/>

<wd l="10176" t="11650" r="10512" b="11808">find</wd>

<space/>

</ln>

<ln l="6149" t="11923" r="9802" b="12125" baseLine="12072" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="11923" r="6586" b="12125">good</wd>

<space/>

<wd l="6648" t="11923" r="7013" b="12125">split</wd>

<space/>

<wd l="7066" t="11923" r="7642" b="12125">points,</wd>

<space/>

<wd l="7709" t="11976" r="7963" b="12082">we</wd>

<space/>

<wd l="8021" t="11976" r="8707" b="12125">propose</wd>

<space/>

<wd l="8765" t="11947" r="8928" b="12082">to</wd>

<space/>

<wd l="8990" t="11923" r="9802" b="12082">minimise</wd>

</ln>

</para>

<para l="6778" t="12370" r="6979" b="12638" alignment="left" li="648" spaceBefore="22" lsp="exactly" lspExact="357" language="en">

<ln l="6778" t="12370" r="6979" b="12638" baseLine="12384">

<wd l="6778" t="12374" r="6979" b="12638" underlined="none" subsuperscript="subscript" fontSize="1200" fontFace="Symbol" fontFamily="swiss" fontPitch="variable" spacing="-16">11</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Symbol" fontFamily="swiss" fontPitch="variable" spacing="-16"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6998" t="12413" r="10502" b="12638" alignment="left" li="864" spaceAfter="122" lsp="exactly" lspExact="142" language="en">

<tabs position="6998"/>

<ln l="6998" t="12413" r="10502" b="12638" baseLine="12583">

<wd l="6998" t="12413" r="7248" b="12638"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">|</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">e</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">L</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="7325" t="12518" r="7464" b="12533">−</wd>

<space/>

</run>

<wd l="7536" t="12413" r="7805" b="12638"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">e</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">R</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">|</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7886" t="12451" r="8035" b="12600">+</wd>

<space/>

</run>

<wd l="8102" t="12413" r="9110" b="12638"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">max(</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">{</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">0,10</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="9182" t="12518" r="9322" b="12533">−</wd>

<space/>

</run>

<wd l="9394" t="12413" r="9893" b="12638"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">s</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">}</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)/2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><tab position="9893"/>

<wd l="10267" t="12432" r="10502" b="12624">(1)</wd>

</run>

</ln>

</para>

<rulerline l="6139" t="12782" r="7344" b="12782" type="single" width="10" color="000000"/>

<para l="6158" t="12835" r="9893" b="13229" alignment="left" spaceBefore="46" fli="216" lsp="exactly" lspExact="204" language="en">

<ln l="6398" t="12835" r="9893" b="13032" baseLine="12991">

<wd l="6398" t="12835" r="9893" b="13032"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">6</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">https://bitbucket.org/gchrupala/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><space/>

</run>

</ln>

<ln l="6158" t="13080" r="6782" b="13229" baseLine="13195" underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">

<wd l="6158" t="13114" r="6782" b="13229">sequor</wd>

</ln>

</para>

<para l="6144" t="13253" r="10502" b="14054" alignment="justified" spaceBefore="33" fli="216" lsp="exactly" lspExact="198" language="en">

<ln l="6398" t="13253" r="10502" b="13454" baseLine="13409">

<wd l="6398" t="13253" r="6744" b="13416"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">7</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">The</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="6787" t="13286" r="7598" b="13454">generalised</wd>

<space/>

<wd l="7632" t="13306" r="8400" b="13454">perceptron</wd>

<space/>

<wd l="8434" t="13286" r="8664" b="13416">has</wd>

<space/>

<wd l="8707" t="13286" r="9048" b="13416">been</wd>

<space/>

<wd l="9086" t="13286" r="9547" b="13416">shown</wd>

<space/>

<wd l="9581" t="13306" r="9715" b="13416">to</wd>

<space/>

<wd l="9754" t="13286" r="10195" b="13416">match</wd>

<space/>

<wd l="10224" t="13325" r="10502" b="13454">per-</wd>

</run>

</ln>

<ln l="6144" t="13483" r="10502" b="13656" baseLine="13608" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="13488" r="6821" b="13618">formance</wd>

<space/>

<wd l="6888" t="13488" r="7046" b="13618">of</wd>

<space/>

<wd l="7099" t="13488" r="8160" b="13618">state-of-the-art</wd>

<space/>

<wd l="8218" t="13488" r="8818" b="13618">methods</wd>

<space/>

<wd l="8885" t="13488" r="9029" b="13613">in</wd>

<space/>

<wd l="9086" t="13488" r="9456" b="13618">word</wd>

<space/>

<wd l="9518" t="13488" r="10502" b="13656">segmentation,</wd>

<space/>

</ln>

<ln l="6144" t="13680" r="10502" b="13853" baseLine="13810" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="13685" r="6466" b="13814">POS</wd>

<space/>

<wd l="6523" t="13685" r="7099" b="13853">tagging,</wd>

<space/>

<wd l="7162" t="13685" r="8006" b="13853">dependency</wd>

<space/>

<wd l="8059" t="13685" r="8587" b="13853">parsing</wd>

<space/>

<wd l="8645" t="13685" r="8899" b="13814">and</wd>

<space/>

<wd l="8947" t="13685" r="10099" b="13853">phrase-structure</wd>

<space/>

<wd l="10152" t="13723" r="10502" b="13853">pars-</wd>

</ln>

<ln l="6144" t="13882" r="8227" b="14054" baseLine="14006" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="13886" r="6370" b="14054">ing</wd>

<space/>

<wd l="6422" t="13886" r="6936" b="14054">(Zhang</wd>

<space/>

<wd l="6989" t="13886" r="7243" b="14016">and</wd>

<space/>

<wd l="7291" t="13886" r="7723" b="14040">Clark,</wd>

<space/>

<wd l="7781" t="13886" r="8227" b="14045">2011).</wd>

</ln>

</para>

<para l="6403" t="14069" r="9034" b="14261" alignment="left" li="216" spaceBefore="7" lsp="exactly" lspExact="199" language="en">

<ln l="6403" t="14069" r="9034" b="14261" baseLine="14219">

<wd l="6403" t="14069" r="9034" b="14261"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">8</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">https://wapiti.limsi.fr/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6149" t="14285" r="10507" b="14688" alignment="justified" spaceBefore="32" fli="216" lsp="exactly" lspExact="198" language="en">

<ln l="6398" t="14285" r="10507" b="14486" baseLine="14441">

<wd l="6398" t="14285" r="6701" b="14448"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">9</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">We</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6754" t="14318" r="7152" b="14448">thank</wd>

<space/>

<wd l="7210" t="14318" r="7867" b="14486">Grzegorz</wd>

<space/>

<wd l="7925" t="14318" r="8578" b="14486">Chrupała</wd>

<space/>

<wd l="8626" t="14318" r="8837" b="14448">for</wd>

<space/>

<wd l="8890" t="14318" r="9581" b="14486">providing</wd>

<space/>

<wd l="9634" t="14318" r="9835" b="14448">his</wd>

<space/>

<wd l="9893" t="14318" r="10507" b="14486">template</wd>

<space/>

</run>

</ln>

<ln l="6149" t="14515" r="9826" b="14688" baseLine="14640" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="14520" r="6408" b="14650">and</wd>

<space/>

<wd l="6451" t="14520" r="6662" b="14650">for</wd>

<space/>

<wd l="6706" t="14520" r="7459" b="14688">translating</wd>

<space/>

<wd l="7507" t="14520" r="7608" b="14650">it</wd>

<space/>

<wd l="7651" t="14539" r="7786" b="14650">to</wd>

<space/>

<wd l="7834" t="14520" r="8050" b="14650">the</wd>

<space/>

<wd l="8102" t="14520" r="8606" b="14688">Sequor</wd>

<space/>

<wd l="8650" t="14520" r="9264" b="14688">template</wd>

<space/>

<wd l="9312" t="14520" r="9826" b="14650">format.</wd>

</ln>

</para>

<para l="6144" t="14702" r="10512" b="15302" alignment="justified" spaceBefore="25" fli="216" lsp="exactly" lspExact="197" language="en">

<ln l="6350" t="14702" r="10512" b="14904" baseLine="14857">

<wd l="6350" t="14702" r="6821" b="14866"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">10</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">With</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6898" t="14736" r="7262" b="14890">64%,</wd>

<space/>

<wd l="7349" t="14774" r="7944" b="14904">memory</wd>

<space/>

<wd l="8021" t="14774" r="8424" b="14904">usage</wd>

<space/>

<wd l="8506" t="14774" r="8851" b="14904">grew</wd>

<space/>

<wd l="8933" t="14755" r="9067" b="14866">to</wd>

<space/>

<wd l="9149" t="14774" r="9461" b="14866">over</wd>

<space/>

<wd l="9533" t="14736" r="9797" b="14866">400</wd>

<space/>

<wd l="9878" t="14736" r="10114" b="14866">GB</wd>

<space/>

<wd l="10205" t="14774" r="10512" b="14866">over</wd>

<space/>

</run>

</ln>

<ln l="6144" t="14933" r="10507" b="15106" baseLine="15058" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14938" r="6552" b="15106">night,</wd>

<space/>

<wd l="6605" t="14938" r="7147" b="15106">causing</wd>

<space/>

<wd l="7195" t="14938" r="7618" b="15106">heavy</wd>

<space/>

<wd l="7670" t="14976" r="8026" b="15106">swap</wd>

<space/>

<wd l="8078" t="14938" r="8606" b="15106">activity</wd>

<space/>

<wd l="8654" t="14976" r="8832" b="15067">on</wd>

<space/>

<wd l="8880" t="14976" r="9115" b="15067">our</wd>

<space/>

<wd l="9158" t="14938" r="9826" b="15067">machines</wd>

<space/>

<wd l="9878" t="14938" r="10200" b="15067">with</wd>

<space/>

<wd l="10248" t="14938" r="10507" b="15067">256</wd>

<space/>

</ln>

<ln l="6149" t="15130" r="8770" b="15302" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="15134" r="6384" b="15264">GB</wd>

<space/>

<wd l="6442" t="15134" r="6845" b="15259">RAM</wd>

<space/>

<wd l="6898" t="15134" r="7214" b="15293">(and</wd>

<space/>

<wd l="7258" t="15134" r="7522" b="15264">410</wd>

<space/>

<wd l="7574" t="15134" r="7810" b="15264">GB</wd>

<space/>

<wd l="7867" t="15173" r="8227" b="15302">swap</wd>

<space/>

<wd l="8280" t="15134" r="8770" b="15302">space).</wd>

</ln>

</para>

</column>

</section>

<dd l="1440" t="15736" r="10521" b="15977">

<para l="5804" t="15787" r="6148" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5870" t="15787" r="6082" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="41">

<wd l="5870" t="15792" r="6082" b="15946">94</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4314.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1207" marginRight="1383" marginBottom="1302" offsetX="-24" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1207" r="10526" b="15308">

<column l="1440" t="1207" r="5822" b="15308">

<para l="1440" t="1320" r="5818" b="3149" alignment="justified" spaceBefore="56" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="1320" r="5803" b="1517" baseLine="1476">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1440" t="1320" r="1973" b="1478">where</wd>

<space/>

</run>

<wd l="2030" t="1373" r="2232" b="1512"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">e</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">L</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2299" t="1320" r="2611" b="1478">and</wd>

<space/>

</run>

<wd l="2669" t="1373" r="2890" b="1517"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">e</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">R</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2952" t="1373" r="3211" b="1478">are</wd>

<space/>

<wd l="3264" t="1320" r="3528" b="1478">the</wd>

<space/>

<wd l="3576" t="1320" r="4248" b="1478">number</wd>

<space/>

<wd l="4296" t="1320" r="4488" b="1478">of</wd>

<space/>

<wd l="4522" t="1320" r="5006" b="1478">insert</wd>

<space/>

<wd l="5059" t="1373" r="5242" b="1478">or</wd>

<space/>

<wd l="5290" t="1320" r="5803" b="1478">delete</wd>

<space/>

</run>

</ln>

<ln l="1445" t="1594" r="5798" b="1795" baseLine="1742">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="1594" r="2342" b="1795">operations</wd>

<space/>

<wd l="2410" t="1618" r="2578" b="1752">to</wd>

<space/>

<wd l="2645" t="1594" r="2909" b="1752">the</wd>

<space/>

<wd l="2971" t="1594" r="3264" b="1752">left</wd>

<space/>

<wd l="3331" t="1594" r="3643" b="1752">and</wd>

<space/>

<wd l="3701" t="1594" r="4114" b="1795">right</wd>

<space/>

<wd l="4176" t="1594" r="5251" b="1795">respectively,</wd>

<space/>

<wd l="5333" t="1594" r="5640" b="1752">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="5712" t="1646" r="5798" b="1752">s</wd>

<space/>

</run>

</ln>

<ln l="1440" t="1862" r="5803" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="1862" r="1579" b="2021">is</wd>

<space/>

<wd l="1651" t="1862" r="1915" b="2021">the</wd>

<space/>

<wd l="1982" t="1862" r="2650" b="2021">number</wd>

<space/>

<wd l="2717" t="1862" r="2904" b="2021">of</wd>

<space/>

<wd l="2962" t="1862" r="3974" b="2021">consecutive</wd>

<space/>

<wd l="4042" t="1862" r="5232" b="2064">no-operations</wd>

<space/>

<wd l="5304" t="1886" r="5472" b="2021">to</wd>

<space/>

<wd l="5539" t="1862" r="5803" b="2021">the</wd>

<space/>

</ln>

<ln l="1440" t="2136" r="5818" b="2294" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="2136" r="1776" b="2294">left.</wd>

<space/>

<wd l="1882" t="2136" r="2222" b="2294">The</wd>

<space/>

<wd l="2290" t="2136" r="2630" b="2294">first</wd>

<space/>

<wd l="2693" t="2160" r="3096" b="2294">term</wd>

<space/>

<wd l="3154" t="2136" r="3523" b="2294">tries</wd>

<space/>

<wd l="3595" t="2160" r="3763" b="2294">to</wd>

<space/>

<wd l="3830" t="2136" r="4498" b="2294">balance</wd>

<space/>

<wd l="4560" t="2136" r="4829" b="2294">the</wd>

<space/>

<wd l="4891" t="2136" r="5563" b="2294">number</wd>

<space/>

<wd l="5630" t="2136" r="5818" b="2294">of</wd>

<space/>

</ln>

<ln l="1445" t="2405" r="5808" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="2405" r="1771" b="2563">edit</wd>

<space/>

<wd l="1824" t="2405" r="2717" b="2606">operations</wd>

<space/>

<wd l="2784" t="2458" r="2995" b="2563">on</wd>

<space/>

<wd l="3048" t="2405" r="3446" b="2563">each</wd>

<space/>

<wd l="3504" t="2405" r="3845" b="2563">side</wd>

<space/>

<wd l="3898" t="2405" r="4382" b="2563">while</wd>

<space/>

<wd l="4430" t="2405" r="4699" b="2563">the</wd>

<space/>

<wd l="4757" t="2405" r="5357" b="2563">second</wd>

<space/>

<wd l="5405" t="2429" r="5808" b="2563">term</wd>

<space/>

</ln>

<ln l="1440" t="2678" r="5808" b="2880" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="2678" r="2342" b="2837">introduces</wd>

<space/>

<wd l="2410" t="2731" r="2506" b="2837">a</wd>

<space/>

<wd l="2554" t="2678" r="3475" b="2880">preference</wd>

<space/>

<wd l="3533" t="2702" r="3696" b="2837">to</wd>

<space/>

<wd l="3754" t="2702" r="4037" b="2837">not</wd>

<space/>

<wd l="4099" t="2678" r="4469" b="2880">split</wd>

<space/>

<wd l="4526" t="2678" r="5179" b="2837">clusters</wd>

<space/>

<wd l="5246" t="2678" r="5438" b="2837">of</wd>

<space/>

<wd l="5482" t="2678" r="5808" b="2837">edit</wd>

<space/>

</ln>

<ln l="1445" t="2947" r="2390" b="3149" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="2947" r="2390" b="3149">operations.</wd>

</ln>

</para>

<para l="1440" t="3221" r="5808" b="5544" alignment="justified" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="1656" t="3221" r="5794" b="3422" baseLine="3370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="3226" r="1963" b="3379">For</wd>

<space/>

<wd l="2035" t="3221" r="2434" b="3379">each</wd>

<space/>

<wd l="2510" t="3221" r="3163" b="3408">section,</wd>

<space/>

<wd l="3250" t="3274" r="3504" b="3379">we</wd>

<space/>

<wd l="3581" t="3221" r="4080" b="3379">either</wd>

<space/>

<wd l="4147" t="3274" r="4435" b="3379">use</wd>

<space/>

<wd l="4512" t="3221" r="4776" b="3379">the</wd>

<space/>

<wd l="4853" t="3221" r="5179" b="3379">edit</wd>

<space/>

<wd l="5251" t="3274" r="5794" b="3422">opera-</wd>

</ln>

<ln l="1440" t="3490" r="5808" b="3691" baseLine="3638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3490" r="1858" b="3648">tions</wd>

<space/>

<wd l="1930" t="3490" r="2741" b="3691">produced</wd>

<space/>

<wd l="2803" t="3490" r="3019" b="3691">by</wd>

<space/>

<wd l="3086" t="3490" r="3350" b="3648">the</wd>

<space/>

<wd l="3427" t="3542" r="4214" b="3691">sequence</wd>

<space/>

<wd l="4282" t="3490" r="4939" b="3648">labeller</wd>

<space/>

<wd l="5002" t="3542" r="5184" b="3648">or</wd>

<space/>

<wd l="5251" t="3490" r="5458" b="3648">do</wd>

<space/>

<wd l="5525" t="3514" r="5808" b="3648">not</wd>

<space/>

</ln>

<ln l="1445" t="3763" r="5803" b="3965" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="3763" r="1771" b="3922">edit</wd>

<space/>

<wd l="1848" t="3763" r="2112" b="3922">the</wd>

<space/>

<wd l="2198" t="3763" r="2851" b="3922">section.</wd>

<space/>

<wd l="3000" t="3768" r="3235" b="3922">As</wd>

<space/>

<wd l="3322" t="3816" r="3576" b="3922">we</wd>

<space/>

<wd l="3667" t="3763" r="4032" b="3965">split</wd>

<space/>

<wd l="4114" t="3763" r="4512" b="3922">each</wd>

<space/>

<wd l="4598" t="3816" r="5386" b="3965">sequence</wd>

<space/>

<wd l="5467" t="3763" r="5803" b="3922">into</wd>

<space/>

</ln>

<ln l="1440" t="4032" r="5803" b="4234" baseLine="4181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="4085" r="1656" b="4190">no</wd>

<space/>

<wd l="1757" t="4085" r="2203" b="4190">more</wd>

<space/>

<wd l="2299" t="4032" r="2674" b="4190">than</wd>

<space/>

<wd l="2779" t="4032" r="3211" b="4234">eight</wd>

<space/>

<wd l="3317" t="4032" r="4051" b="4219">sections,</wd>

<space/>

<wd l="4171" t="4085" r="4426" b="4190">we</wd>

<space/>

<wd l="4522" t="4032" r="5222" b="4234">produce</wd>

<space/>

<wd l="5323" t="4085" r="5534" b="4234">up</wd>

<space/>

<wd l="5635" t="4056" r="5803" b="4190">to</wd>

<space/>

</ln>

<ln l="1450" t="4267" r="5794" b="4502" baseLine="4445">

<wd l="1450" t="4267" r="1632" b="4454"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">8</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1718" t="4373" r="1867" b="4426">=</wd>

<space/>

<wd l="1954" t="4306" r="2261" b="4459">256</wd>

<space/>

</run>

<wd l="2333" t="4267" r="3446" b="4459"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">candidates.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">11</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3547" t="4301" r="3979" b="4502">Only</wd>

<space/>

<wd l="4042" t="4354" r="4354" b="4459">one</wd>

<space/>

<wd l="4416" t="4301" r="5290" b="4488">candidate,</wd>

<space/>

<wd l="5357" t="4301" r="5794" b="4459">iden-</wd>

</run>

</ln>

<ln l="1440" t="4574" r="5803" b="4776" baseLine="4723" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="4574" r="1814" b="4733">tical</wd>

<space/>

<wd l="1882" t="4598" r="2045" b="4733">to</wd>

<space/>

<wd l="2112" t="4574" r="2381" b="4733">the</wd>

<space/>

<wd l="2443" t="4574" r="2933" b="4776">input,</wd>

<space/>

<wd l="3014" t="4574" r="3350" b="4733">will</wd>

<space/>

<wd l="3418" t="4574" r="3619" b="4733">be</wd>

<space/>

<wd l="3686" t="4574" r="4498" b="4776">produced</wd>

<space/>

<wd l="4560" t="4574" r="4709" b="4728">if</wd>

<space/>

<wd l="4757" t="4574" r="5194" b="4733">there</wd>

<space/>

<wd l="5261" t="4627" r="5525" b="4733">are</wd>

<space/>

<wd l="5587" t="4627" r="5803" b="4733">no</wd>

<space/>

</ln>

<ln l="1445" t="4843" r="5803" b="5045" baseLine="4997" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="4843" r="1958" b="5002">delete</wd>

<space/>

<wd l="2021" t="4896" r="2198" b="5002">or</wd>

<space/>

<wd l="2246" t="4843" r="2736" b="5002">insert</wd>

<space/>

<wd l="2789" t="4843" r="3686" b="5045">operations</wd>

<space/>

<wd l="3754" t="4843" r="4066" b="5002">and</wd>

<space/>

<wd l="4114" t="4867" r="4435" b="5002">two</wd>

<space/>

<wd l="4498" t="4843" r="5405" b="5002">candidates</wd>

<space/>

<wd l="5467" t="4843" r="5803" b="5002">will</wd>

<space/>

</ln>

<ln l="1440" t="5117" r="5794" b="5318" baseLine="5266" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5117" r="1646" b="5275">be</wd>

<space/>

<wd l="1699" t="5117" r="2510" b="5318">produced</wd>

<space/>

<wd l="2563" t="5117" r="2712" b="5270">if</wd>

<space/>

<wd l="2750" t="5117" r="3182" b="5275">there</wd>

<space/>

<wd l="3235" t="5117" r="3374" b="5275">is</wd>

<space/>

<wd l="3418" t="5117" r="3754" b="5318">just</wd>

<space/>

<wd l="3806" t="5170" r="4118" b="5275">one</wd>

<space/>

<wd l="4176" t="5117" r="4690" b="5275">delete</wd>

<space/>

<wd l="4747" t="5170" r="4930" b="5275">or</wd>

<space/>

<wd l="4978" t="5117" r="5462" b="5275">insert</wd>

<space/>

<wd l="5520" t="5170" r="5794" b="5318">op-</wd>

</ln>

<ln l="1445" t="5386" r="2088" b="5544" baseLine="5539" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="5386" r="2088" b="5544">eration.</wd>

</ln>

</para>

<para l="1440" t="5659" r="5808" b="7752" alignment="justified" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="1656" t="5659" r="5803" b="5861" baseLine="5808" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="5664" r="1843" b="5813">In</wd>

<space/>

<wd l="1920" t="5659" r="2645" b="5861">training,</wd>

<space/>

<wd l="2746" t="5712" r="2995" b="5818">we</wd>

<space/>

<wd l="3082" t="5712" r="3451" b="5861">may</wd>

<space/>

<wd l="3538" t="5659" r="4469" b="5861">potentially</wd>

<space/>

<wd l="4550" t="5659" r="5251" b="5861">produce</wd>

<space/>

<wd l="5338" t="5712" r="5549" b="5861">up</wd>

<space/>

<wd l="5635" t="5683" r="5803" b="5818">to</wd>

<space/>

</ln>

<ln l="1450" t="5928" r="5808" b="6130" baseLine="6082">

<wd l="1450" t="5933" r="2074" b="6091"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">5</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">x</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">256</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2150" t="6000" r="2299" b="6053">=</wd>

<space/>

<wd l="2381" t="5933" r="2846" b="6115">1,280</wd>

<space/>

<wd l="2899" t="5928" r="3806" b="6086">candidates</wd>

<space/>

<wd l="3864" t="5981" r="4147" b="6130">per</wd>

<space/>

<wd l="4190" t="5952" r="4661" b="6086">tweet</wd>

<space/>

<wd l="4714" t="5981" r="4882" b="6086">as</wd>

<space/>

<wd l="4934" t="5928" r="5198" b="6086">the</wd>

<space/>

<wd l="5246" t="5928" r="5808" b="6086">nested</wd>

<space/>

</run>

</ln>

<ln l="1445" t="6202" r="5798" b="6403" baseLine="6350" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="6202" r="2832" b="6360">cross-validation</wd>

<space/>

<wd l="2928" t="6202" r="3365" b="6403">gives</wd>

<space/>

<wd l="3470" t="6254" r="3658" b="6360">us</wd>

<space/>

<wd l="3763" t="6202" r="4075" b="6360">five</wd>

<space/>

<wd l="4181" t="6254" r="4973" b="6403">sequence</wd>

<space/>

<wd l="5064" t="6202" r="5798" b="6360">labellers</wd>

<space/>

</ln>

<ln l="1440" t="6470" r="5803" b="6672" baseLine="6624" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6523" r="1723" b="6672">per</wd>

<space/>

<wd l="1824" t="6470" r="3206" b="6629">cross-validation</wd>

<space/>

<wd l="3307" t="6523" r="3638" b="6629">run.</wd>

<space/>

<wd l="3854" t="6470" r="4469" b="6672">During</wd>

<space/>

<wd l="4570" t="6470" r="5198" b="6672">testing,</wd>

<space/>

<wd l="5318" t="6523" r="5534" b="6672">up</wd>

<space/>

<wd l="5635" t="6494" r="5803" b="6629">to</wd>

<space/>

</ln>

<ln l="1450" t="6744" r="5794" b="6946" baseLine="6893">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="6749" r="1651" b="6902">25</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="1752" t="6787" r="1862" b="6898">x</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1968" t="6749" r="2280" b="6902">256</wd>

<space/>

<wd l="2400" t="6816" r="2549" b="6869">=</wd>

<space/>

<wd l="2640" t="6744" r="3125" b="6931">6,400</wd>

<space/>

<wd l="3211" t="6744" r="4118" b="6902">candidates</wd>

<space/>

<wd l="4205" t="6797" r="4574" b="6946">may</wd>

<space/>

<wd l="4656" t="6744" r="4862" b="6902">be</wd>

<space/>

<wd l="4939" t="6744" r="5794" b="6946">produced.</wd>

<space/>

</run>

</ln>

<ln l="1450" t="7013" r="5803" b="7214" baseLine="7162" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="7013" r="1853" b="7210">(The</wd>

<space/>

<wd l="1925" t="7013" r="2438" b="7171">actual</wd>

<space/>

<wd l="2506" t="7013" r="3394" b="7171">maximum</wd>

<space/>

<wd l="3461" t="7013" r="4128" b="7171">number</wd>

<space/>

<wd l="4200" t="7013" r="4387" b="7171">of</wd>

<space/>

<wd l="4445" t="7013" r="5357" b="7171">candidates</wd>

<space/>

<wd l="5429" t="7066" r="5803" b="7214">may</wd>

<space/>

</ln>

<ln l="1440" t="7282" r="5794" b="7483" baseLine="7435" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="7282" r="1646" b="7440">be</wd>

<space/>

<wd l="1723" t="7282" r="2218" b="7440">lower</wd>

<space/>

<wd l="2290" t="7282" r="2765" b="7440">when</wd>

<space/>

<wd l="2842" t="7282" r="3571" b="7440">labellers</wd>

<space/>

<wd l="3662" t="7334" r="4128" b="7483">agree</wd>

<space/>

<wd l="4210" t="7334" r="4426" b="7440">on</wd>

<space/>

<wd l="4502" t="7282" r="4766" b="7440">the</wd>

<space/>

<wd l="4848" t="7282" r="5174" b="7440">edit</wd>

<space/>

<wd l="5251" t="7334" r="5794" b="7483">opera-</wd>

</ln>

<ln l="1440" t="7555" r="1982" b="7752" baseLine="7704" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="7555" r="1982" b="7752">tions.)</wd>

</ln>

</para>

<para l="1440" t="7992" r="4334" b="8194" alignment="left" spaceBefore="186" lsp="exactly" lspExact="251" language="en">

<ln l="1440" t="7992" r="4334" b="8194" baseLine="8141" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="1440" t="7992" r="1709" b="8150">2.5</wd>

<space/>

<wd l="1930" t="7992" r="2784" b="8194">Applying</wd>

<space/>

<wd l="2842" t="7992" r="3245" b="8150">Edit</wd>

<space/>

<wd l="3302" t="7992" r="4334" b="8194">Operations</wd>

</ln>

</para>

<para l="1440" t="8342" r="5803" b="10440" alignment="justified" spaceBefore="78" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="8342" r="5794" b="8544" baseLine="8491" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="8342" r="1906" b="8501">After</wd>

<space/>

<wd l="2054" t="8342" r="2938" b="8544">producing</wd>

<space/>

<wd l="3101" t="8342" r="3931" b="8501">candidate</wd>

<space/>

<wd l="4094" t="8342" r="4416" b="8501">edit</wd>

<space/>

<wd l="4574" t="8342" r="5395" b="8544">operation</wd>

<space/>

<wd l="5558" t="8395" r="5794" b="8501">se-</wd>

</ln>

<ln l="1445" t="8611" r="5794" b="8813" baseLine="8765" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="8664" r="2136" b="8813">quences</wd>

<space/>

<wd l="2189" t="8611" r="2520" b="8770">that</wd>

<space/>

<wd l="2563" t="8664" r="2856" b="8770">use</wd>

<space/>

<wd l="2914" t="8611" r="3523" b="8770">subsets</wd>

<space/>

<wd l="3586" t="8611" r="3778" b="8770">of</wd>

<space/>

<wd l="3811" t="8611" r="4075" b="8770">the</wd>

<space/>

<wd l="4128" t="8611" r="4454" b="8770">edit</wd>

<space/>

<wd l="4502" t="8611" r="5400" b="8813">operations</wd>

<space/>

<wd l="5453" t="8664" r="5794" b="8813">pre-</wd>

</ln>

<ln l="1445" t="8885" r="5798" b="9086" baseLine="9034" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="8885" r="1973" b="9043">dicted</wd>

<space/>

<wd l="2059" t="8885" r="2275" b="9086">by</wd>

<space/>

<wd l="2371" t="8938" r="2467" b="9043">a</wd>

<space/>

<wd l="2558" t="8938" r="3346" b="9086">sequence</wd>

<space/>

<wd l="3437" t="8885" r="4022" b="9072">model,</wd>

<space/>

<wd l="4128" t="8885" r="4397" b="9043">the</wd>

<space/>

<wd l="4488" t="8885" r="4810" b="9043">edit</wd>

<space/>

<wd l="4901" t="8885" r="5798" b="9086">operations</wd>

<space/>

</ln>

<ln l="1445" t="9154" r="5803" b="9355" baseLine="9302" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="9206" r="1704" b="9312">are</wd>

<space/>

<wd l="1771" t="9154" r="2539" b="9312">executed</wd>

<space/>

<wd l="2602" t="9178" r="2765" b="9312">to</wd>

<space/>

<wd l="2832" t="9154" r="3533" b="9355">produce</wd>

<space/>

<wd l="3600" t="9154" r="4507" b="9312">candidates</wd>

<space/>

<wd l="4589" t="9154" r="5150" b="9355">strings</wd>

<space/>

<wd l="5222" t="9154" r="5482" b="9312">for</wd>

<space/>

<wd l="5539" t="9154" r="5803" b="9312">the</wd>

<space/>

</ln>

<ln l="1440" t="9427" r="5794" b="9586" baseLine="9576" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9427" r="2410" b="9586">normalised</wd>

<space/>

<wd l="2467" t="9451" r="3067" b="9586">tweets.</wd>

<space/>

<wd l="3158" t="9432" r="3389" b="9586">As</wd>

<space/>

<wd l="3456" t="9427" r="3725" b="9586">the</wd>

<space/>

<wd l="3792" t="9427" r="4354" b="9586">shared</wd>

<space/>

<wd l="4406" t="9427" r="4762" b="9586">task</wd>

<space/>

<wd l="4824" t="9427" r="5184" b="9586">asks</wd>

<space/>

<wd l="5251" t="9427" r="5510" b="9586">for</wd>

<space/>

<wd l="5563" t="9451" r="5794" b="9586">to-</wd>

</ln>

<ln l="1440" t="9696" r="5794" b="9898" baseLine="9845" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9696" r="2107" b="9854">kenised</wd>

<space/>

<wd l="2165" t="9720" r="2722" b="9898">output</wd>

<space/>

<wd l="2784" t="9696" r="3422" b="9898">aligned</wd>

<space/>

<wd l="3475" t="9720" r="3643" b="9854">to</wd>

<space/>

<wd l="3706" t="9696" r="3970" b="9854">the</wd>

<space/>

<wd l="4027" t="9696" r="4478" b="9898">input</wd>

<space/>

<wd l="4536" t="9696" r="5146" b="9883">tokens,</wd>

<space/>

<wd l="5213" t="9749" r="5467" b="9854">we</wd>

<space/>

<wd l="5530" t="9749" r="5794" b="9898">ap-</wd>

</ln>

<ln l="1440" t="9965" r="5794" b="10166" baseLine="10118" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9965" r="1714" b="10166">ply</wd>

<space/>

<wd l="1771" t="9965" r="2035" b="10123">the</wd>

<space/>

<wd l="2093" t="9965" r="2414" b="10123">edit</wd>

<space/>

<wd l="2472" t="9965" r="3365" b="10166">operations</wd>

<space/>

<wd l="3427" t="9989" r="3590" b="10123">to</wd>

<space/>

<wd l="3653" t="9965" r="4046" b="10123">each</wd>

<space/>

<wd l="4099" t="9965" r="4579" b="10123">token</wd>

<space/>

<wd l="4632" t="9965" r="4800" b="10118">in</wd>

<space/>

<wd l="4853" t="9965" r="5117" b="10123">the</wd>

<space/>

<wd l="5170" t="9965" r="5794" b="10123">follow-</wd>

</ln>

<ln l="1440" t="10238" r="2616" b="10440" baseLine="10387" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="10238" r="1714" b="10440">ing</wd>

<space/>

<wd l="1781" t="10291" r="2616" b="10440">sequence:</wd>

</ln>

</para>

<para l="1637" t="10632" r="5794" b="11102" alignment="justified" li="432" spaceBefore="125" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="ordered" numChars="3">

</bullet>

<ln l="1637" t="10632" r="5794" b="10834" baseLine="10781" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1637" t="10637" r="1877" b="10781">1.</wd>

<space/>

<wd l="1877" t="10632" r="2419" b="10834">Apply</wd>

<space/>

<wd l="2515" t="10632" r="2726" b="10790">all</wd>

<space/>

<wd l="2822" t="10632" r="3149" b="10790">edit</wd>

<space/>

<wd l="3240" t="10632" r="4138" b="10834">operations</wd>

<space/>

<wd l="4238" t="10656" r="4392" b="10790">at</wd>

<space/>

<wd l="4483" t="10632" r="5285" b="10790">character</wd>

<space/>

<wd l="5371" t="10632" r="5794" b="10834">posi-</wd>

</ln>

<ln l="1877" t="10901" r="5098" b="11102" baseLine="11054" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="10901" r="2294" b="11059">tions</wd>

<space/>

<wd l="2357" t="10901" r="2683" b="11059">that</wd>

<space/>

<wd l="2741" t="10901" r="3706" b="11102">correspond</wd>

<space/>

<wd l="3763" t="10925" r="3926" b="11059">to</wd>

<space/>

<wd l="3984" t="10901" r="4435" b="11102">input</wd>

<space/>

<wd l="4488" t="10901" r="5098" b="11059">tokens.</wd>

</ln>

</para>

<para l="1618" t="11328" r="5803" b="12072" alignment="justified" li="432" spaceBefore="157" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="ordered" numChars="3">

</bullet>

<ln l="1618" t="11328" r="5803" b="11530" baseLine="11482" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1618" t="11333" r="1877" b="11482">2.</wd>

<space/>

<wd l="1877" t="11328" r="2419" b="11530">Apply</wd>

<space/>

<wd l="2477" t="11328" r="2962" b="11486">insert</wd>

<space/>

<wd l="3019" t="11328" r="3912" b="11530">operations</wd>

<space/>

<wd l="3974" t="11328" r="4738" b="11486">recorded</wd>

<space/>

<wd l="4795" t="11352" r="4949" b="11486">at</wd>

<space/>

<wd l="5002" t="11328" r="5266" b="11486">the</wd>

<space/>

<wd l="5333" t="11381" r="5803" b="11530">space</wd>

<space/>

</ln>

<ln l="1877" t="11602" r="5803" b="11760" baseLine="11750" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="11602" r="2606" b="11760">between</wd>

<space/>

<wd l="2659" t="11602" r="3216" b="11760">tokens</wd>

<space/>

<wd l="3283" t="11602" r="3595" b="11760">and</wd>

<space/>

<wd l="3653" t="11626" r="3806" b="11760">at</wd>

<space/>

<wd l="3859" t="11602" r="4128" b="11760">the</wd>

<space/>

<wd l="4186" t="11602" r="4498" b="11760">end</wd>

<space/>

<wd l="4555" t="11602" r="4747" b="11760">of</wd>

<space/>

<wd l="4786" t="11602" r="5054" b="11760">the</wd>

<space/>

<wd l="5107" t="11626" r="5582" b="11760">tweet</wd>

<space/>

<wd l="5635" t="11626" r="5803" b="11760">to</wd>

<space/>

</ln>

<ln l="1877" t="11870" r="3638" b="12072" baseLine="12024" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="11870" r="2141" b="12029">the</wd>

<space/>

<wd l="2198" t="11870" r="3053" b="12072">preceding</wd>

<space/>

<wd l="3110" t="11870" r="3638" b="12029">token.</wd>

</ln>

</para>

<para l="1618" t="12298" r="5808" b="13853" alignment="justified" li="432" spaceBefore="155" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="ordered" numChars="3">

</bullet>

<ln l="1618" t="12298" r="5808" b="12499" baseLine="12451" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1618" t="12302" r="1877" b="12451">3.</wd>

<space/>

<wd l="1877" t="12298" r="2419" b="12499">Apply</wd>

<space/>

<wd l="2482" t="12298" r="2995" b="12456">delete</wd>

<space/>

<wd l="3053" t="12298" r="3950" b="12499">operations</wd>

<space/>

<wd l="4018" t="12322" r="4171" b="12456">at</wd>

<space/>

<wd l="4219" t="12298" r="4488" b="12456">the</wd>

<space/>

<wd l="4550" t="12350" r="5026" b="12499">space</wd>

<space/>

<wd l="5078" t="12298" r="5808" b="12456">between</wd>

<space/>

</ln>

<ln l="1877" t="12571" r="5803" b="12773" baseLine="12720" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1877" t="12571" r="2486" b="12758">tokens,</wd>

<space/>

<wd l="2582" t="12571" r="3240" b="12773">moving</wd>

<space/>

<wd l="3322" t="12571" r="3590" b="12730">the</wd>

<space/>

<wd l="3672" t="12595" r="4387" b="12730">contents</wd>

<space/>

<wd l="4478" t="12571" r="4666" b="12730">of</wd>

<space/>

<wd l="4733" t="12571" r="4997" b="12730">the</wd>

<space/>

<wd l="5074" t="12571" r="5558" b="12730">token</wd>

<space/>

<wd l="5635" t="12595" r="5803" b="12730">to</wd>

<space/>

</ln>

<ln l="1877" t="12840" r="5794" b="13042" baseLine="12994" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1877" t="12840" r="2141" b="12998">the</wd>

<space/>

<wd l="2222" t="12840" r="2635" b="13042">right</wd>

<space/>

<wd l="2712" t="12864" r="2880" b="12998">to</wd>

<space/>

<wd l="2962" t="12840" r="3226" b="12998">the</wd>

<space/>

<wd l="3312" t="12840" r="3624" b="12998">end</wd>

<space/>

<wd l="3706" t="12840" r="3893" b="12998">of</wd>

<space/>

<wd l="3960" t="12840" r="4224" b="12998">the</wd>

<space/>

<wd l="4306" t="12840" r="4790" b="12998">token</wd>

<space/>

<wd l="4867" t="12864" r="5030" b="12998">to</wd>

<space/>

<wd l="5117" t="12840" r="5381" b="12998">the</wd>

<space/>

<wd l="5462" t="12840" r="5794" b="13027">left,</wd>

<space/>

</ln>

<ln l="1877" t="13114" r="5794" b="13315" baseLine="13262" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1877" t="13114" r="2510" b="13315">leaving</wd>

<space/>

<wd l="2587" t="13114" r="3182" b="13272">behind</wd>

<space/>

<wd l="3254" t="13166" r="3456" b="13272">an</wd>

<space/>

<wd l="3533" t="13138" r="4070" b="13315">empty</wd>

<space/>

<wd l="4147" t="13114" r="4670" b="13272">token.</wd>

<space/>

<wd l="4810" t="13114" r="5443" b="13310">(Delete</wd>

<space/>

<wd l="5520" t="13166" r="5794" b="13315">op-</wd>

</ln>

<ln l="1882" t="13382" r="5794" b="13584" baseLine="13536" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1882" t="13382" r="2558" b="13541">erations</wd>

<space/>

<wd l="2669" t="13406" r="2822" b="13541">at</wd>

<space/>

<wd l="2918" t="13382" r="3182" b="13541">the</wd>

<space/>

<wd l="3283" t="13382" r="4397" b="13541">end-of-tweet</wd>

<space/>

<wd l="4488" t="13382" r="5107" b="13541">marker</wd>

<space/>

<wd l="5208" t="13435" r="5467" b="13541">are</wd>

<space/>

<wd l="5563" t="13382" r="5794" b="13584">ig-</wd>

</ln>

<ln l="1877" t="13656" r="2491" b="13853" baseLine="13805" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1877" t="13656" r="2491" b="13853">nored.)</wd>

</ln>

</para>

<para l="1440" t="14050" r="5808" b="14750" alignment="justified" spaceBefore="123" spaceAfter="32" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="14050" r="5803" b="14251" baseLine="14198" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="14054" r="2021" b="14208">Due</wd>

<space/>

<wd l="2102" t="14074" r="2270" b="14208">to</wd>

<space/>

<wd l="2352" t="14050" r="2741" b="14208">time</wd>

<space/>

<wd l="2827" t="14050" r="3811" b="14237">constraints,</wd>

<space/>

<wd l="3907" t="14102" r="4162" b="14208">we</wd>

<space/>

<wd l="4248" t="14050" r="4459" b="14208">do</wd>

<space/>

<wd l="4541" t="14074" r="4824" b="14208">not</wd>

<space/>

<wd l="4906" t="14074" r="5558" b="14251">attempt</wd>

<space/>

<wd l="5635" t="14074" r="5803" b="14208">to</wd>

<space/>

</ln>

<ln l="1440" t="14318" r="5808" b="14520" baseLine="14472" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14318" r="2160" b="14520">improve</wd>

<space/>

<wd l="2242" t="14318" r="2510" b="14477">the</wd>

<space/>

<wd l="2597" t="14318" r="3466" b="14520">alignment</wd>

<space/>

<wd l="3552" t="14318" r="3744" b="14477">of</wd>

<space/>

<wd l="3816" t="14342" r="4373" b="14520">output</wd>

<space/>

<wd l="4454" t="14318" r="5011" b="14477">tokens</wd>

<space/>

<wd l="5102" t="14342" r="5270" b="14477">to</wd>

<space/>

<wd l="5357" t="14318" r="5808" b="14520">input</wd>

<space/>

</ln>

<ln l="1440" t="14592" r="2050" b="14750" baseLine="14741" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14592" r="2050" b="14750">tokens.</wd>

</ln>

</para>

<rulerline l="1440" t="14846" r="2640" b="14846" type="single" width="10" color="000000"/>

<para l="1445" t="14899" r="5798" b="15288" alignment="justified" spaceBefore="52" fli="216" lsp="exactly" lspExact="207" language="en">

<ln l="1642" t="14899" r="5798" b="15106" baseLine="15051">

<wd l="1642" t="14904" r="2376" b="15106"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">11</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Splitting</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2438" t="14938" r="2654" b="15067">the</wd>

<space/>

<wd l="2712" t="14938" r="3072" b="15106">eight</wd>

<space/>

<wd l="3130" t="14938" r="3696" b="15067">sections</wd>

<space/>

<wd l="3768" t="14938" r="4152" b="15106">again</wd>

<space/>

<wd l="4205" t="14938" r="4651" b="15067">would</wd>

<space/>

<wd l="4709" t="14938" r="5280" b="15106">produce</wd>

<space/>

</run>

<wd l="5347" t="14904" r="5573" b="15062"><run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="superscript" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">16</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

<wd l="5674" t="14995" r="5798" b="15043">=</wd>

<space/>

</run>

</ln>

<ln l="1445" t="15134" r="2770" b="15288" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="15134" r="1930" b="15288">65,536</wd>

<space/>

<wd l="1978" t="15134" r="2770" b="15264">candidates.</wd>

</ln>

</para>

</column>

<column l="6144" t="1207" r="10526" b="15308">

<para l="6144" t="1315" r="8554" b="1522" alignment="left" spaceBefore="75" lsp="exactly" lspExact="251" language="en">

<ln l="6144" t="1315" r="8554" b="1522" baseLine="1474" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">

<wd l="6144" t="1320" r="6413" b="1478">2.6</wd>

<space/>

<wd l="6638" t="1325" r="7555" b="1522">Language</wd>

<space/>

<wd l="7613" t="1320" r="8554" b="1522">Modelling</wd>

</ln>

</para>

<para l="6144" t="1666" r="10512" b="3725" alignment="justified" spaceBefore="78" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="1666" r="10502" b="1872" baseLine="1824" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="1675" r="6451" b="1829">For</wd>

<space/>

<wd l="6533" t="1670" r="7320" b="1872">language</wd>

<space/>

<wd l="7402" t="1670" r="8333" b="1872">modelling,</wd>

<space/>

<wd l="8438" t="1723" r="8688" b="1829">we</wd>

<space/>

<wd l="8774" t="1670" r="9178" b="1829">train</wd>

<space/>

<wd l="9269" t="1675" r="9926" b="1829">SRILM</wd>

<space/>

<wd l="10022" t="1670" r="10502" b="1867">(Stol-</wd>

</ln>

<ln l="6149" t="1939" r="10507" b="2146" baseLine="2093" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="1944" r="6490" b="2131">cke,</wd>

<space/>

<wd l="6552" t="1949" r="7046" b="2141">2002)</wd>

<space/>

<wd l="7109" t="1997" r="7320" b="2102">on</wd>

<space/>

<wd l="7363" t="1944" r="7632" b="2102">the</wd>

<space/>

<wd l="7675" t="1944" r="8650" b="2102">normalised</wd>

<space/>

<wd l="8693" t="1968" r="9240" b="2102">tweets</wd>

<space/>

<wd l="9298" t="1944" r="9490" b="2102">of</wd>

<space/>

<wd l="9518" t="1944" r="9787" b="2102">the</wd>

<space/>

<wd l="9830" t="1944" r="10507" b="2146">training</wd>

<space/>

</ln>

<ln l="6149" t="2208" r="10502" b="2414" baseLine="2366">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6149" t="2213" r="6552" b="2371">data.</wd>

<space/>

<wd l="6648" t="2218" r="6883" b="2371">As</wd>

<space/>

<wd l="6950" t="2266" r="7205" b="2371">we</wd>

<space/>

<wd l="7262" t="2237" r="7690" b="2371">want</wd>

<space/>

<wd l="7747" t="2237" r="7910" b="2371">to</wd>

<space/>

<wd l="7978" t="2213" r="8419" b="2371">build</wd>

<space/>

<wd l="8486" t="2213" r="9283" b="2371">character</wd>

<space/>

</run>

<wd l="9346" t="2266" r="9994" b="2414"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">n</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">-gram</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="10051" t="2213" r="10502" b="2371">mod-</wd>

</run>

</ln>

<ln l="6149" t="2482" r="10512" b="2688" baseLine="2635" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="2486" r="6379" b="2645">els</wd>

<space/>

<wd l="6461" t="2486" r="6773" b="2645">and</wd>

<space/>

<wd l="6840" t="2491" r="7502" b="2645">SRILM</wd>

<space/>

<wd l="7570" t="2486" r="7853" b="2645">has</wd>

<space/>

<wd l="7925" t="2539" r="8141" b="2645">no</wd>

<space/>

<wd l="8218" t="2486" r="8712" b="2645">direct</wd>

<space/>

<wd l="8784" t="2515" r="9432" b="2688">support</wd>

<space/>

<wd l="9494" t="2486" r="9754" b="2645">for</wd>

<space/>

<wd l="9816" t="2486" r="10176" b="2674">this,</wd>

<space/>

<wd l="10258" t="2539" r="10512" b="2645">we</wd>

<space/>

</ln>

<ln l="6144" t="2750" r="10502" b="2957" baseLine="2904" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="2755" r="6970" b="2914">re-format</wd>

<space/>

<wd l="7022" t="2755" r="7286" b="2914">the</wd>

<space/>

<wd l="7349" t="2755" r="8179" b="2914">candidate</wd>

<space/>

<wd l="8242" t="2755" r="8808" b="2957">strings</wd>

<space/>

<wd l="8866" t="2779" r="9034" b="2914">to</wd>

<space/>

<wd l="9091" t="2755" r="9562" b="2914">make</wd>

<space/>

<wd l="9619" t="2755" r="10013" b="2914">each</wd>

<space/>

<wd l="10070" t="2755" r="10502" b="2914">char-</wd>

</ln>

<ln l="6149" t="3024" r="10512" b="3230" baseLine="3178" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="3053" r="6576" b="3187">acter</wd>

<space/>

<wd l="6619" t="3082" r="6715" b="3187">a</wd>

<space/>

<wd l="6754" t="3029" r="7282" b="3187">token.</wd>

<space/>

<wd l="7358" t="3034" r="7579" b="3187">To</wd>

<space/>

<wd l="7632" t="3029" r="8587" b="3230">distinguish</wd>

<space/>

<wd l="8640" t="3082" r="9110" b="3230">space</wd>

<space/>

<wd l="9163" t="3029" r="10032" b="3187">characters</wd>

<space/>

<wd l="10085" t="3029" r="10512" b="3187">from</wd>

<space/>

</ln>

<ln l="6144" t="3293" r="10512" b="3499" baseLine="3446" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="3298" r="6629" b="3456">token</wd>

<space/>

<wd l="6715" t="3322" r="7632" b="3499">separators,</wd>

<space/>

<wd l="7728" t="3350" r="7982" b="3456">we</wd>

<space/>

<wd l="8059" t="3322" r="8861" b="3499">represent</wd>

<space/>

<wd l="8938" t="3298" r="9379" b="3456">them</wd>

<space/>

<wd l="9451" t="3298" r="9840" b="3456">with</wd>

<space/>

<wd l="9922" t="3298" r="10512" b="3456">double</wd>

<space/>

</ln>

<ln l="6144" t="3566" r="7229" b="3725" baseLine="3720" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="3566" r="7229" b="3725">underscores.</wd>

</ln>

</para>

<para l="6144" t="4003" r="8496" b="4166" alignment="left" spaceBefore="191" lsp="exactly" lspExact="251" language="en">

<ln l="6144" t="4003" r="8496" b="4166" baseLine="4162" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">

<wd l="6144" t="4008" r="6413" b="4166">2.7</wd>

<space/>

<wd l="6648" t="4008" r="7603" b="4166">Candidate</wd>

<space/>

<wd l="7666" t="4008" r="8496" b="4166">Selection</wd>

</ln>

</para>

<para l="6144" t="4277" r="10512" b="5112" alignment="justified" spaceBefore="85" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="4277" r="10512" b="4560" baseLine="4506">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="4363" r="6432" b="4517">We</wd>

<space/>

<wd l="6523" t="4411" r="6811" b="4517">use</wd>

<space/>

<wd l="6902" t="4358" r="7166" b="4517">the</wd>

<space/>

<wd l="7258" t="4358" r="7728" b="4560">noisy</wd>

<space/>

<wd l="7829" t="4358" r="8496" b="4517">channel</wd>

<space/>

</run>

<wd l="8592" t="4325" r="9293" b="4517"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">model</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">12</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9398" t="4382" r="9562" b="4517">to</wd>

<space/>

<wd l="9667" t="4358" r="10157" b="4517">select</wd>

<space/>

<wd l="10243" t="4358" r="10512" b="4517">the</wd>

<space/>

</run>

</ln>

<ln l="6144" t="4627" r="10502" b="4834" baseLine="4781">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="4656" r="6571" b="4790">most</wd>

<space/>

<wd l="6643" t="4632" r="7430" b="4834">plausible</wd>

<space/>

<wd l="7517" t="4685" r="8078" b="4790">source</wd>

<space/>

</run>

<wd l="8165" t="4632" r="8251" b="4790"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">s</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ˆ</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8333" t="4632" r="8592" b="4790">for</wd>

<space/>

<wd l="8659" t="4632" r="8928" b="4790">the</wd>

<space/>

<wd l="9010" t="4632" r="9787" b="4790">observed</wd>

<space/>

<wd l="9864" t="4656" r="10358" b="4834">target</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10435" t="4646" r="10502" b="4790">t</wd>

<space/>

</run>

</ln>

<ln l="6144" t="4872" r="8894" b="5112" baseLine="5050">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="4901" r="6571" b="5059">from</wd>

<space/>

<wd l="6624" t="4901" r="6888" b="5059">the</wd>

<space/>

<wd l="6955" t="4925" r="7190" b="5059">set</wd>

<space/>

<wd l="7248" t="4901" r="7440" b="5059">of</wd>

<space/>

<wd l="7483" t="4901" r="8390" b="5059">candidates</wd>

<space/>

</run>

<wd l="8462" t="4886" r="8894" b="5112"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">S</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">t</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">):</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="7430" t="5333" r="10502" b="5558" alignment="left" li="1296" spaceBefore="180" lsp="exactly" lspExact="259" language="en">

<tabs position="7430"/>

<ln l="7430" t="5333" r="10502" b="5558" baseLine="5495">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7430" t="5400" r="7728" b="5549">arg</wd>

<space/>

<wd l="7771" t="5400" r="8174" b="5506">max</wd>

<space/>

</run>

<wd l="8213" t="5333" r="8539" b="5558"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

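<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">t</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">|</run>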

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="8611" t="5333" r="9216" b="5558"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">s</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">s</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><tab position="9216"/>

<wd l="10267" t="5352" r="10502" b="5544">(2)</wd>

</run>

</ln>

</para>

<para l="7555" t="5582" r="8035" b="5746" alignment="left" li="1296" lsp="exactly" lspExact="229" language="en">

<ln l="7555" t="5582" r="8035" b="5746" baseLine="5698">

<wd l="7555" t="5582" r="8035" b="5746"><run underlined="none" subsuperscript="none" fontSize="850" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="17">s</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="17">∈</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="17">S</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="17">(</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="17">t</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="17">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="17"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="5957" r="10517" b="7810" alignment="justified" spaceBefore="132" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="5957" r="10502" b="6182" baseLine="6120">

<wd l="6149" t="5957" r="6571" b="6182"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">s</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6691" t="5971" r="6830" b="6130">is</wd>

<space/>

<wd l="6941" t="5971" r="7714" b="6173">provided</wd>

<space/>

<wd l="7819" t="5971" r="8030" b="6173">by</wd>

<space/>

<wd l="8141" t="5971" r="8405" b="6130">the</wd>

<space/>

<wd l="8510" t="5971" r="9298" b="6173">language</wd>

<space/>

<wd l="9403" t="5971" r="9946" b="6130">model</wd>

<space/>

<wd l="10061" t="5976" r="10502" b="6168">(Sec-</wd>

</run>

</ln>

<ln l="6144" t="6240" r="10507" b="6442" baseLine="6394" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6240" r="6485" b="6398">tion</wd>

<space/>

<wd l="6566" t="6240" r="6950" b="6437">2.6).</wd>

<space/>

<wd l="7094" t="6240" r="7867" b="6398">Standard</wd>

<space/>

<wd l="7944" t="6240" r="8563" b="6398">models</wd>

<space/>

<wd l="8654" t="6240" r="9014" b="6442">give</wd>

<space/>

<wd l="9091" t="6240" r="9480" b="6442">high</wd>

<space/>

<wd l="9552" t="6240" r="10507" b="6442">probability</wd>

<space/>

</ln>

<ln l="6144" t="6514" r="10517" b="6715" baseLine="6662" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6538" r="6312" b="6672">to</wd>

<space/>

<wd l="6379" t="6514" r="7027" b="6715">making</wd>

<space/>

<wd l="7094" t="6514" r="7411" b="6672">few</wd>

<space/>

<wd l="7483" t="6566" r="7666" b="6672">or</wd>

<space/>

<wd l="7723" t="6566" r="7934" b="6672">no</wd>

<space/>

<wd l="8006" t="6514" r="8458" b="6672">edits.</wd>

<space/>

<wd l="8558" t="6518" r="9379" b="6701">However,</wd>

<space/>

<wd l="9456" t="6566" r="9706" b="6672">we</wd>

<space/>

<wd l="9768" t="6538" r="10162" b="6672">trust</wd>

<space/>

<wd l="10224" t="6566" r="10517" b="6672">our</wd>

<space/>

</ln>

<ln l="6154" t="6782" r="10502" b="6984" baseLine="6936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="6835" r="6946" b="6984">sequence</wd>

<space/>

<wd l="7008" t="6782" r="7627" b="6941">models</wd>

<space/>

<wd l="7704" t="6835" r="7872" b="6941">as</wd>

<space/>

<wd l="7944" t="6782" r="8746" b="6984">Chrupała</wd>

<space/>

<wd l="8813" t="6787" r="9374" b="6979">(2014)</wd>

<space/>

<wd l="9446" t="6782" r="10171" b="6984">reported</wd>

<space/>

<wd l="10238" t="6835" r="10502" b="6941">en-</wd>

</ln>

<ln l="6149" t="7056" r="10502" b="7258" baseLine="7205" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="7056" r="7013" b="7258">couraging</wd>

<space/>

<wd l="7090" t="7056" r="7699" b="7214">results.</wd>

<space/>

<wd l="7829" t="7056" r="8731" b="7243">Therefore,</wd>

<space/>

<wd l="8818" t="7109" r="9072" b="7214">we</wd>

<space/>

<wd l="9149" t="7056" r="9509" b="7258">give</wd>

<space/>

<wd l="9581" t="7056" r="9970" b="7258">high</wd>

<space/>

<wd l="10037" t="7056" r="10502" b="7258">prob-</wd>

</ln>

<ln l="6149" t="7325" r="10512" b="7526" baseLine="7474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="7325" r="6701" b="7526">ability</wd>

<space/>

<wd l="6773" t="7349" r="6936" b="7483">to</wd>

<space/>

<wd l="7008" t="7325" r="7478" b="7526">using</wd>

<space/>

<wd l="7550" t="7325" r="7814" b="7483">the</wd>

<space/>

<wd l="7882" t="7325" r="8693" b="7526">predicted</wd>

<space/>

<wd l="8765" t="7325" r="9091" b="7483">edit</wd>

<space/>

<wd l="9158" t="7325" r="10109" b="7526">operations.</wd>

<space/>

<wd l="10224" t="7330" r="10512" b="7483">We</wd>

<space/>

</ln>

<ln l="6149" t="7531" r="8938" b="7810" baseLine="7747">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="7598" r="6888" b="7757">consider</wd>

<space/>

<wd l="6941" t="7622" r="7262" b="7757">two</wd>

<space/>

<wd l="7320" t="7598" r="7939" b="7757">models</wd>

<space/>

<wd l="8002" t="7598" r="8261" b="7757">for</wd>

<space/>

</run>

<wd l="8318" t="7584" r="8645" b="7810"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

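<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">t</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">|</run>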

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="8717" t="7584" r="8938" b="7810"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">s</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">):</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="7057" t="8006" r="10522" b="8914" alignment="justified" li="144" spaceBefore="424" fli="-144" lsp="exactly" lspExact="270" language="en" id="_1_3_89">

<ln l="7123" t="8006" r="10522" b="8914" baseLine="8180">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="7123" t="8006" r="7238" b="8914">{</wd>

<space/>

</run>

<wd l="7282" t="8040" r="7766" b="8194"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">0</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">979</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7992" t="8035" r="8141" b="8189">if</wd>

<space/>

<wd l="8184" t="8035" r="8395" b="8194">all</wd>

<space/>

<wd l="8458" t="8035" r="8779" b="8194">edit</wd>

<space/>

<wd l="8837" t="8035" r="9734" b="8237">operations</wd>

<space/>

<wd l="9802" t="8088" r="10061" b="8194">are</wd>

<space/>

<wd l="10118" t="8035" r="10522" b="8194">used</wd>

<space/>

</run>

</ln>

<ln l="7282" t="8366" r="8808" b="8525" baseLine="8520">

<wd l="7282" t="8371" r="7766" b="8525"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">0</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">020</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7992" t="8366" r="8141" b="8520">if</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8352" t="8419" r="8438" b="8525">s</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8515" t="8438" r="8664" b="8491">=</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8741" t="8381" r="8808" b="8525">t</wd>

</run>

</ln>

</para>

<para l="7282" t="8698" r="8837" b="8856" alignment="left" li="144" lsp="exactly" lspExact="123" language="en">

<ln l="7282" t="8698" r="8837" b="8856" baseLine="8851">

<wd l="7282" t="8702" r="7762" b="8856"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">0</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">.</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">001</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8"><space/>

<wd l="7997" t="8698" r="8837" b="8856">otherwise</wd>

</run>

</ln>

</para>

<para l="10201" t="8952" r="10526" b="9144" alignment="left" spaceAfter="214" fli="3024" lsp="exactly" lspExact="256" language="en">

<bullet type="ordered" numChars="4">

</bullet>

<ln l="10267" t="8952" r="10502" b="9106" baseLine="9101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-81">

<nl orig="true"/>

</ln>

</para>

<para l="6336" t="9571" r="10301" b="10123" alignment="left" li="1296" ri="216" spaceBefore="185" fli="-1152" lsp="exactly" lspExact="302" language="en">

<ln l="6336" t="9571" r="10301" b="10013" baseLine="9817">

<wd l="6336" t="9802" r="6552" b="9989"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="6586" t="9787" r="6725" b="10013"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

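<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">t</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">|</run>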

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="6802" t="9787" r="6960" b="10013"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">s</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7051" t="9874" r="7200" b="9926">=</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="7344" t="9571" r="7421" b="9840">{</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7464" t="9638" r="7541" b="9787">1</wd>

<space/>

<wd l="7771" t="9634" r="7920" b="9787">if</wd>

<space/>

<wd l="7963" t="9634" r="8170" b="9792">all</wd>

<space/>

<wd l="8237" t="9634" r="8563" b="9792">edit</wd>

<space/>

<wd l="8621" t="9634" r="9518" b="9835">operations</wd>

<space/>

<wd l="9586" t="9686" r="9845" b="9792">are</wd>

<space/>

<wd l="9898" t="9634" r="10301" b="9792">used</wd>

<space/>

</run>

</ln>

<ln l="7450" t="9965" r="8621" b="10123" baseLine="10118" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="7450" t="9970" r="7546" b="10123">0</wd>

<space/>

<wd l="7776" t="9965" r="8621" b="10123">otherwise</wd>

</ln>

</para>

<para l="6144" t="10248" r="10517" b="13925" alignment="justified" spaceAfter="48" fli="3024" lsp="exactly" lspExact="270" language="en">

<bullet type="ordered" numChars="4">

</bullet>

<wd l="10267" t="10248" r="10502" b="10392">(4)</wd>

<space/>

<ln l="10502" t="10248" r="10502" b="10397" baseLine="10392" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<space/>

</ln>

<ln l="6144" t="10512" r="10502" b="10714" baseLine="10667">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="10517" r="6571" b="10670">Note</wd>

<space/>

<wd l="6638" t="10512" r="6965" b="10670">that</wd>

<space/>

</run>

<wd l="7037" t="10512" r="7243" b="10699"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7334" t="10512" r="7469" b="10670">is</wd>

<space/>

<wd l="7546" t="10536" r="7824" b="10670">not</wd>

<space/>

<wd l="7896" t="10565" r="7992" b="10670">a</wd>

<space/>

<wd l="8054" t="10565" r="8630" b="10714">proper</wd>

<space/>

<wd l="8693" t="10512" r="9648" b="10714">probability</wd>

<space/>

<wd l="9715" t="10512" r="10258" b="10670">model</wd>

<space/>

<wd l="10334" t="10565" r="10502" b="10670">as</wd>

<space/>

</run>

</ln>

<ln l="6144" t="10786" r="10512" b="10987" baseLine="10934" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10786" r="6581" b="10944">there</wd>

<space/>

<wd l="6677" t="10786" r="6816" b="10944">is</wd>

<space/>

<wd l="6922" t="10838" r="7402" b="10944">never</wd>

<space/>

<wd l="7498" t="10786" r="8117" b="10987">exactly</wd>

<space/>

<wd l="8218" t="10838" r="8530" b="10944">one</wd>

<space/>

<wd l="8630" t="10786" r="9662" b="10944">“otherwise”</wd>

<space/>

<wd l="9768" t="10838" r="10138" b="10944">case</wd>

<space/>

<wd l="10238" t="10786" r="10512" b="10944">but</wd>

<space/>

</ln>

<ln l="6154" t="11026" r="10502" b="11213" baseLine="11204">

<wd l="6154" t="11026" r="6307" b="11208"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="superscript" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">i</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="6365" t="11059" r="6648" b="11208"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">−</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6706" t="11107" r="7157" b="11213">cases</wd>

<space/>

<wd l="7210" t="11054" r="7742" b="11213">where</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7800" t="11059" r="7862" b="11213">i</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7915" t="11054" r="8054" b="11213">is</wd>

<space/>

<wd l="8112" t="11054" r="8376" b="11213">the</wd>

<space/>

<wd l="8424" t="11054" r="9096" b="11213">number</wd>

<space/>

<wd l="9144" t="11054" r="9336" b="11213">of</wd>

<space/>

<wd l="9379" t="11054" r="10066" b="11213">sections</wd>

<space/>

<wd l="10128" t="11107" r="10502" b="11213">con-</wd>

</run>

</ln>

<ln l="6154" t="11328" r="10507" b="11530" baseLine="11477" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="11328" r="6778" b="11486">sidered</wd>

<space/>

<wd l="6845" t="11328" r="7018" b="11482">in</wd>

<space/>

<wd l="7094" t="11328" r="7925" b="11486">candidate</wd>

<space/>

<wd l="8002" t="11328" r="8962" b="11530">generation,</wd>

<space/>

<wd l="9053" t="11328" r="9710" b="11530">causing</wd>

<space/>

<wd l="9787" t="11328" r="10051" b="11486">the</wd>

<space/>

<wd l="10123" t="11328" r="10507" b="11486">total</wd>

<space/>

</ln>

<ln l="6144" t="11597" r="10498" b="11770" baseLine="11750">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="11621" r="6312" b="11755">to</wd>

<space/>

<wd l="6384" t="11597" r="6590" b="11755">be</wd>

<space/>

<wd l="6667" t="11597" r="7162" b="11755">either</wd>

<space/>

<wd l="7234" t="11602" r="7709" b="11755">0.999</wd>

<space/>

<wd l="7795" t="11650" r="7978" b="11755">or</wd>

<space/>

<wd l="8040" t="11597" r="8770" b="11755">between</wd>

<space/>

<wd l="8861" t="11602" r="9307" b="11755">1.001</wd>

<space/>

<wd l="9403" t="11597" r="9715" b="11755">and</wd>

<space/>

</run>

<wd l="9787" t="11602" r="10272" b="11755"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">0</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">999</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="10349" t="11621" r="10498" b="11770">+</wd>

<space/>

</run>

</ln>

<ln l="6149" t="11832" r="10502" b="12082" baseLine="12017">

<wd l="6149" t="11875" r="6629" b="12029"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">0</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">001</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="6701" t="11914" r="6811" b="12024">×</wd>

<space/>

</run>

<wd l="6893" t="11832" r="7152" b="12082"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(2</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">8</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

<wd l="7210" t="11962" r="7349" b="11976">−</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7406" t="11856" r="7570" b="12082">2)</wd>

<space/>

<wd l="7661" t="11942" r="7810" b="11995">=</wd>

<space/>

</run>

<wd l="7901" t="11875" r="8419" b="12029"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">253.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="8501" t="11870" r="8717" b="12053"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8789" t="11870" r="9696" b="12072">effectively</wd>

<space/>

<wd l="9754" t="11870" r="10502" b="12029">excludes</wd>

<space/>

</run>

</ln>

<ln l="6144" t="12139" r="10507" b="12341" baseLine="12288" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12139" r="6413" b="12298">the</wd>

<space/>

<wd l="6480" t="12139" r="7152" b="12341">original</wd>

<space/>

<wd l="7219" t="12139" r="7670" b="12341">input</wd>

<space/>

<wd l="7738" t="12139" r="8050" b="12298">and</wd>

<space/>

<wd l="8117" t="12139" r="8318" b="12298">all</wd>

<space/>

<wd l="8395" t="12139" r="9307" b="12298">candidates</wd>

<space/>

<wd l="9379" t="12139" r="9706" b="12298">that</wd>

<space/>

<wd l="9768" t="12192" r="10056" b="12298">use</wd>

<space/>

<wd l="10128" t="12139" r="10507" b="12341">only</wd>

<space/>

</ln>

<ln l="6154" t="12413" r="10512" b="12614" baseLine="12562" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="12466" r="6605" b="12571">some</wd>

<space/>

<wd l="6682" t="12413" r="6955" b="12571">but</wd>

<space/>

<wd l="7027" t="12437" r="7310" b="12571">not</wd>

<space/>

<wd l="7387" t="12413" r="7589" b="12571">all</wd>

<space/>

<wd l="7675" t="12413" r="7867" b="12571">of</wd>

<space/>

<wd l="7925" t="12413" r="8194" b="12571">the</wd>

<space/>

<wd l="8270" t="12413" r="8597" b="12571">edit</wd>

<space/>

<wd l="8674" t="12413" r="9571" b="12614">operations</wd>

<space/>

<wd l="9662" t="12413" r="10512" b="12614">suggested</wd>

<space/>

</ln>

<ln l="6144" t="12682" r="10502" b="12883" baseLine="12830" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12682" r="6360" b="12883">by</wd>

<space/>

<wd l="6427" t="12682" r="6691" b="12840">the</wd>

<space/>

<wd l="6763" t="12734" r="7555" b="12883">sequence</wd>

<space/>

<wd l="7618" t="12682" r="8400" b="12840">labellers.</wd>

<space/>

<wd l="8506" t="12682" r="8986" b="12840">Since</wd>

<space/>

<wd l="9048" t="12682" r="9485" b="12840">there</wd>

<space/>

<wd l="9552" t="12734" r="9811" b="12840">are</wd>

<space/>

<wd l="9878" t="12682" r="10195" b="12840">five</wd>

<space/>

<wd l="10267" t="12734" r="10502" b="12840">se-</wd>

</ln>

<ln l="6149" t="12950" r="10507" b="13152" baseLine="13104" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13003" r="6763" b="13152">quence</wd>

<space/>

<wd l="6850" t="12950" r="7579" b="13109">labellers</wd>

<space/>

<wd l="7670" t="13003" r="7954" b="13152">per</wd>

<space/>

<wd l="8040" t="12950" r="9422" b="13109">cross-validation</wd>

<space/>

<wd l="9504" t="12950" r="9859" b="13109">fold</wd>

<space/>

<wd l="9946" t="12950" r="10258" b="13109">due</wd>

<space/>

<wd l="10339" t="12974" r="10507" b="13109">to</wd>

<space/>

</ln>

<ln l="6144" t="13224" r="10502" b="13426" baseLine="13373" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13224" r="6706" b="13382">nested</wd>

<space/>

<wd l="6778" t="13224" r="8160" b="13382">cross-validation</wd>

<space/>

<wd l="8237" t="13224" r="8549" b="13382">and</wd>

<space/>

<wd l="8621" t="13224" r="8822" b="13382">25</wd>

<space/>

<wd l="8914" t="13277" r="9701" b="13426">sequence</wd>

<space/>

<wd l="9773" t="13224" r="10502" b="13382">labellers</wd>

<space/>

</ln>

<ln l="6149" t="13493" r="10517" b="13694" baseLine="13647">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="13493" r="6710" b="13694">during</wd>

<space/>

<wd l="6773" t="13493" r="7397" b="13694">testing,</wd>

<space/>

</run>

<wd l="7474" t="13493" r="7685" b="13680"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7766" t="13493" r="8678" b="13694">effectively</wd>

<space/>

<wd l="8746" t="13493" r="9312" b="13651">selects</wd>

<space/>

<wd l="9379" t="13493" r="10104" b="13651">between</wd>

<space/>

<wd l="10166" t="13493" r="10258" b="13651">5</wd>

<space/>

<wd l="10334" t="13546" r="10517" b="13651">or</wd>

<space/>

</run>

</ln>

<ln l="6149" t="13694" r="7546" b="13925" baseLine="13901">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="13766" r="6350" b="13925">25</wd>

<space/>

</run>

<wd l="6422" t="13728" r="7546" b="13925"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">candidates.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">13</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<rulerline l="6144" t="14030" r="7344" b="14030" type="single" width="10" color="000000"/>

<para l="6144" t="14088" r="10502" b="14885" alignment="justified" spaceBefore="67" fli="144" lsp="exactly" lspExact="200" language="en">

<ln l="6350" t="14088" r="10502" b="14290" baseLine="14238">

<wd l="6350" t="14088" r="6744" b="14251"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">12</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">The</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6840" t="14122" r="7229" b="14290">noisy</wd>

<space/>

<wd l="7325" t="14122" r="7882" b="14251">channel</wd>

<space/>

<wd l="7978" t="14122" r="8424" b="14251">model</wd>

<space/>

<wd l="8520" t="14122" r="8755" b="14251">has</wd>

<space/>

<wd l="8856" t="14122" r="9197" b="14251">been</wd>

<space/>

<wd l="9293" t="14122" r="9821" b="14290">applied</wd>

<space/>

<wd l="9917" t="14160" r="10502" b="14251">success-</wd>

</run>

</ln>

<ln l="6144" t="14318" r="10502" b="14486" baseLine="14443" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14318" r="6480" b="14486">fully</wd>

<space/>

<wd l="6538" t="14338" r="6677" b="14448">to</wd>

<space/>

<wd l="6739" t="14318" r="7301" b="14486">spelling</wd>

<space/>

<wd l="7358" t="14318" r="8088" b="14448">correction</wd>

<space/>

<wd l="8146" t="14318" r="8938" b="14486">(Kernighan</wd>

<space/>

<wd l="9000" t="14338" r="9130" b="14448">et</wd>

<space/>

<wd l="9187" t="14318" r="9398" b="14472">al.,</wd>

<space/>

<wd l="9480" t="14318" r="9864" b="14472">1990;</wd>

<space/>

<wd l="9931" t="14318" r="10502" b="14448">Wilcox-</wd>

</ln>

<ln l="6149" t="14520" r="10502" b="14688" baseLine="14640" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="14520" r="6773" b="14650">O’Hearn</wd>

<space/>

<wd l="6830" t="14539" r="6965" b="14650">et</wd>

<space/>

<wd l="7022" t="14520" r="7229" b="14674">al.,</wd>

<space/>

<wd l="7301" t="14520" r="7709" b="14678">2008)</wd>

<space/>

<wd l="7776" t="14520" r="8035" b="14650">and</wd>

<space/>

<wd l="8088" t="14520" r="8693" b="14650">machine</wd>

<space/>

<wd l="8755" t="14520" r="9514" b="14650">translation</wd>

<space/>

<wd l="9576" t="14520" r="9979" b="14688">(Way,</wd>

<space/>

<wd l="10051" t="14520" r="10502" b="14678">2010),</wd>

<space/>

</ln>

<ln l="6149" t="14717" r="7493" b="14885" baseLine="14842" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="14755" r="6629" b="14885">among</wd>

<space/>

<wd l="6682" t="14717" r="7051" b="14846">other</wd>

<space/>

<wd l="7094" t="14755" r="7493" b="14846">areas.</wd>

</ln>

</para>

<para l="6144" t="14904" r="10512" b="15302" alignment="justified" spaceBefore="7" fli="144" lsp="exactly" lspExact="204" language="en">

<ln l="6350" t="14904" r="10512" b="15106" baseLine="15055">

<wd l="6350" t="14904" r="6768" b="15067"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">13</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">Han</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="6821" t="14957" r="6950" b="15067">et</wd>

<space/>

<wd l="7008" t="14938" r="7162" b="15067">al.</wd>

<space/>

<wd l="7234" t="14938" r="7699" b="15096">(2013)</wd>

<space/>

<wd l="7762" t="14938" r="8045" b="15067">also</wd>

<space/>

<wd l="8098" t="14976" r="8333" b="15067">use</wd>

<space/>

<wd l="8395" t="14976" r="8472" b="15067">a</wd>

<space/>

<wd l="8520" t="14938" r="9048" b="15106">trigram</wd>

<space/>

<wd l="9101" t="14938" r="9744" b="15106">language</wd>

<space/>

<wd l="9802" t="14938" r="10248" b="15067">model</wd>

<space/>

<wd l="10301" t="14938" r="10512" b="15067">for</wd>

<space/>

</run>

</ln>

<ln l="6144" t="15134" r="10507" b="15302" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="15134" r="7171" b="15288">normalisation,</wd>

<space/>

<wd l="7224" t="15134" r="7454" b="15264">but</wd>

<space/>

<wd l="7502" t="15134" r="7814" b="15302">only</wd>

<space/>

<wd l="7867" t="15154" r="8002" b="15264">to</wd>

<space/>

<wd l="8054" t="15134" r="8530" b="15264">reduce</wd>

<space/>

<wd l="8587" t="15173" r="8664" b="15264">a</wd>

<space/>

<wd l="8707" t="15134" r="9125" b="15302">larger</wd>

<space/>

<wd l="9173" t="15134" r="9854" b="15264">candidate</wd>

<space/>

<wd l="9912" t="15154" r="10109" b="15264">set</wd>

<space/>

<wd l="10152" t="15154" r="10291" b="15264">to</wd>

<space/>

<wd l="10349" t="15173" r="10507" b="15264">an</wd>

</ln>

</para>

</column>

</section>

<dd l="6144" t="7953" r="7123" b="9384" anchorTo="toPage" refTo="_1_3_89">

<shape>

<rect l="6144" t="7953" r="7123" b="9158"/>

<rect l="6144" t="9158" r="7123" b="9384"/>

</shape>

<para l="6149" t="8352" r="7013" b="8578" alignment="left" spaceBefore="369" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="8352" r="7013" b="8578" baseLine="8523">

<wd l="6149" t="8352" r="6542" b="8578"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="7">1</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">t</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7"><space/>

</run>

<wd l="6614" t="8352" r="6773" b="8578"><run italic="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">s</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7"><space/>

<wd l="6864" t="8438" r="7013" b="8491">=</wd>

</run>

</ln>

</para>

<para l="6144" t="9221" r="6527" b="9379" alignment="left" spaceBefore="585" lsp="exactly" lspExact="196" language="en">

<ln l="6149" t="9221" r="6461" b="9379" baseLine="9370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="16">

<wd l="6149" t="9221" r="6461" b="9379">and</wd>

</ln>

</para>

</dd>

<dd l="1440" t="15736" r="10526" b="15977">

<para l="5804" t="15787" r="6138" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5870" t="15787" r="6072" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="38">

<wd l="5870" t="15787" r="6072" b="15946">95</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4314.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1248" marginRight="1383" marginBottom="1302" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1248" r="10526" b="15317">

<column l="1440" t="1248" r="5822" b="15317">

<table l="1714" t="1258" r="5530" b="2390" alignment="left" li="274" ri="292" spaceBefore="10" spaceAfter="152">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>600</gridCol>

<gridCol>730</gridCol>

<gridCol>619</gridCol>

<gridCol>619</gridCol>

<gridCol>624</gridCol>

<gridCol>624</gridCol>

<gridRow>283</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>292</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="1714" t="1258" r="2314" b="1541" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="2626" t="1306" r="2726" b="1454" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="2626" t="1306" r="2726" b="1454" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2626" t="1306" r="2726" b="1454">2</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3302" t="1306" r="3394" b="1459" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="3302" t="1306" r="3394" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3302" t="1306" r="3394" b="1459">3</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3917" t="1306" r="4022" b="1454" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="3917" t="1306" r="4022" b="1454" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3917" t="1306" r="4022" b="1454">4</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4546" t="1301" r="4637" b="1459" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="4546" t="1301" r="4637" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4546" t="1301" r="4637" b="1459">5</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5165" t="1301" r="5266" b="1459" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="5165" t="1301" r="5266" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="5165" t="1301" r="5266" b="1459">6</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="1838" t="1584" r="2179" b="1738" alignment="centered" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<ln l="1838" t="1584" r="2179" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1838" t="1584" r="2179" b="1738">WB</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="2453" t="1584" r="2918" b="1738" alignment="left" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<tabs position="2453"/>

<ln l="2453" t="1584" r="2918" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="2453" t="1584" r="2918" b="1738">14.70</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3163" t="1584" r="3533" b="1738" alignment="left" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<tabs position="3163"/>

<ln l="3163" t="1584" r="3533" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3163" t="1584" r="3533" b="1738">9.97</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3782" t="1584" r="4142" b="1738" alignment="left" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<tabs position="3782"/>

<ln l="3782" t="1584" r="4142" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="3782" t="1584" r="4142" b="1738">7.91</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4402" t="1584" r="4762" b="1738" alignment="left" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<tabs position="4402"/>

<ln l="4402" t="1584" r="4762" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="4402" t="1584" r="4762" b="1738">7.31</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5026" t="1579" r="5400" b="1738" alignment="left" spaceAfter="26" lsp="exactly" lspExact="247" language="en">

<tabs position="5026"/>

<ln l="5026" t="1579" r="5400" b="1738" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="5026" t="1579" r="5400" b="1738">7.19</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="1862" t="1862" r="2174" b="2016" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="1862" t="1862" r="2174" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1862" t="1862" r="2174" b="2016">KN</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="2453" t="1862" r="2909" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="2453"/>

<ln l="2453" t="1862" r="2909" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="2453" t="1862" r="2909" b="2016">14.73</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3163" t="1862" r="3528" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="3163"/>

<ln l="3163" t="1862" r="3528" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="3163" t="1862" r="3528" b="2016">9.83</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3782" t="1862" r="4142" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="3782"/>

<ln l="3782" t="1862" r="4142" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="3782" t="1862" r="4142" b="2016">7.81</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4402" t="1862" r="4771" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="4402"/>

<ln l="4402" t="1862" r="4771" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4402" t="1862" r="4771" b="2016">7.33</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5026" t="1862" r="5390" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="5026"/>

<ln l="5026" t="1862" r="5390" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="5026" t="1862" r="5390" b="2016">7.43</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="1877" t="2141" r="2155" b="2294" alignment="centered" spaceAfter="28" lsp="exactly" lspExact="250" language="en">

<ln l="1877" t="2141" r="2155" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1877" t="2141" r="2155" b="2294">GT</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="2453" t="2136" r="2909" b="2294" alignment="left" spaceAfter="28" lsp="exactly" lspExact="250" language="en">

<tabs position="2453"/>

<ln l="2453" t="2136" r="2909" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="2453" t="2136" r="2909" b="2294">14.63</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3163" t="2141" r="3533" b="2294" alignment="left" spaceAfter="28" lsp="exactly" lspExact="250" language="en">

<tabs position="3163"/>

<ln l="3163" t="2141" r="3533" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3163" t="2141" r="3533" b="2294">9.88</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3782" t="2141" r="4142" b="2294" alignment="left" spaceAfter="28" lsp="exactly" lspExact="250" language="en">

<tabs position="3782"/>

<ln l="3782" t="2141" r="4142" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="3782" t="2141" r="4142" b="2294">7.91</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4402" t="2136" r="4771" b="2294" alignment="left" spaceAfter="28" lsp="exactly" lspExact="250" language="en">

<tabs position="4402"/>

<ln l="4402" t="2136" r="4771" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4402" t="2136" r="4771" b="2294">7.45</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5026" t="2141" r="5400" b="2294" alignment="left" spaceAfter="28" lsp="exactly" lspExact="250" language="en">

<tabs position="5026"/>

<ln l="5026" t="2141" r="5400" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5026" t="2141" r="5400" b="2294">7.44</wd>

</ln>

</para>

</cell>

</table>

<para l="1440" t="2602" r="5808" b="4118" alignment="justified" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="2602" r="5808" b="2803" baseLine="2755" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2602" r="1920" b="2760">Table</wd>

<space/>

<wd l="2006" t="2606" r="2136" b="2760">1:</wd>

<space/>

<wd l="2237" t="2606" r="2957" b="2803">Average</wd>

<space/>

<wd l="3019" t="2602" r="3806" b="2803">language</wd>

<space/>

<wd l="3869" t="2602" r="4411" b="2760">model</wd>

<space/>

<wd l="4478" t="2602" r="5357" b="2803">perplexity</wd>

<space/>

<wd l="5429" t="2654" r="5808" b="2760">over</wd>

<space/>

</ln>

<ln l="1440" t="2875" r="5794" b="3077" baseLine="3024" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2875" r="1704" b="3034">the</wd>

<space/>

<wd l="1757" t="2875" r="2069" b="3034">five</wd>

<space/>

<wd l="2122" t="2875" r="3509" b="3034">cross-validation</wd>

<space/>

<wd l="3552" t="2928" r="3922" b="3034">runs</wd>

<space/>

<wd l="3974" t="2875" r="4234" b="3034">for</wd>

<space/>

<wd l="4282" t="2928" r="4930" b="3077">n-gram</wd>

<space/>

<wd l="4982" t="2875" r="5390" b="3034">sizes</wd>

<space/>

<wd l="5448" t="2928" r="5568" b="3034">n</wd>

<space/>

<wd l="5645" t="2947" r="5794" b="3000">=</wd>

<space/>

</ln>

<ln l="1450" t="3144" r="5794" b="3346" baseLine="3298" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="3149" r="1877" b="3341">2,...,</wd>

<space/>

<wd l="1930" t="3149" r="2026" b="3302">6</wd>

<space/>

<wd l="2150" t="3144" r="2462" b="3302">and</wd>

<space/>

<wd l="2578" t="3144" r="3490" b="3346">smoothing</wd>

<space/>

<wd l="3600" t="3144" r="4334" b="3302">methods</wd>

<space/>

<wd l="4450" t="3149" r="4790" b="3302">WB</wd>

<space/>

<wd l="4920" t="3211" r="5035" b="3274">=</wd>

<space/>

<wd l="5146" t="3144" r="5794" b="3302">Witten-</wd>

</ln>

<ln l="1440" t="3418" r="5794" b="3619" baseLine="3566" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3418" r="1848" b="3605">Bell,</wd>

<space/>

<wd l="1944" t="3422" r="2256" b="3576">KN</wd>

<space/>

<wd l="2338" t="3485" r="2453" b="3547">=</wd>

<space/>

<wd l="2539" t="3422" r="3566" b="3619">Keyser-Ney</wd>

<space/>

<wd l="3653" t="3418" r="3965" b="3576">and</wd>

<space/>

<wd l="4046" t="3422" r="4330" b="3576">GT</wd>

<space/>

<wd l="4416" t="3485" r="4531" b="3547">=</wd>

<space/>

<wd l="4613" t="3418" r="5794" b="3619">Good-Turing.</wd>

<space/>

</ln>

<ln l="1445" t="3686" r="5794" b="3888" baseLine="3835">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="3686" r="2218" b="3845">Standard</wd>

<space/>

<wd l="2314" t="3686" r="3115" b="3845">deviation</wd>

<space/>

<wd l="3211" t="3744" r="3331" b="3845">Q</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="3485" t="3701" r="3624" b="3830">G</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3778" t="3691" r="4152" b="3845">0.23</wd>

<space/>

<wd l="4253" t="3686" r="4512" b="3845">for</wd>

<space/>

<wd l="4603" t="3686" r="4814" b="3845">all</wd>

<space/>

<wd l="4915" t="3686" r="5794" b="3888">configura-</wd>

</run>

</ln>

<ln l="1440" t="3960" r="1906" b="4118" baseLine="4109" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3960" r="1906" b="4118">tions.</wd>

</ln>

</para>

<para l="1440" t="4589" r="3893" b="4747" alignment="left" spaceBefore="377" lsp="exactly" lspExact="254" language="en">

<ln l="1440" t="4589" r="3893" b="4747" baseLine="4738" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1440" t="4589" r="1709" b="4747">2.8</wd>

<space/>

<wd l="1930" t="4589" r="2947" b="4747">Evaluation</wd>

<space/>

<wd l="3000" t="4594" r="3893" b="4747">Measures</wd>

</ln>

</para>

<para l="1440" t="4949" r="5808" b="5650" alignment="justified" spaceBefore="87" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="4949" r="5808" b="5150" baseLine="5098" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="4954" r="1723" b="5107">We</wd>

<space/>

<wd l="1800" t="4949" r="2510" b="5107">evaluate</wd>

<space/>

<wd l="2587" t="5002" r="2875" b="5107">our</wd>

<space/>

<wd l="2942" t="4949" r="3298" b="5107">best</wd>

<space/>

<wd l="3374" t="4973" r="4046" b="5150">systems</wd>

<space/>

<wd l="4123" t="4949" r="4594" b="5150">using</wd>

<space/>

<wd l="4666" t="4949" r="4934" b="5107">the</wd>

<space/>

<wd l="5011" t="4949" r="5808" b="5107">evalution</wd>

<space/>

</ln>

<ln l="1450" t="5218" r="5808" b="5419" baseLine="5371" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="5218" r="1925" b="5419">script</wd>

<space/>

<wd l="2006" t="5218" r="2779" b="5419">provided</wd>

<space/>

<wd l="2856" t="5218" r="3072" b="5419">by</wd>

<space/>

<wd l="3154" t="5218" r="3422" b="5376">the</wd>

<space/>

<wd l="3509" t="5218" r="4070" b="5376">shared</wd>

<space/>

<wd l="4152" t="5218" r="4502" b="5376">task</wd>

<space/>

<wd l="4589" t="5218" r="5515" b="5419">organisers.</wd>

<space/>

<wd l="5674" t="5222" r="5808" b="5376">It</wd>

<space/>

</ln>

<ln l="1445" t="5501" r="2054" b="5650" baseLine="5640" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="5515" r="2054" b="5650">counts:</wd>

</ln>

</para>

<para l="1675" t="5962" r="5794" b="6931" alignment="justified" li="432" spaceBefore="198" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="5962" r="5794" b="6163" baseLine="6110" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="5966" r="1877" b="6110">•</wd>

<tab position="1756"/>

<wd l="1877" t="5962" r="2213" b="6120">The</wd>

<space/>

<wd l="2266" t="5962" r="2938" b="6120">number</wd>

<space/>

<wd l="2986" t="5962" r="3178" b="6120">of</wd>

<space/>

<wd l="3221" t="5962" r="3984" b="6163">correctly</wd>

<space/>

<wd l="4042" t="5962" r="4819" b="6120">modified</wd>

<space/>

<wd l="4867" t="5962" r="5477" b="6149">tokens,</wd>

<space/>

<wd l="5539" t="5962" r="5794" b="6120">i.e.</wd>

<space/>

</ln>

<ln l="1877" t="6230" r="5794" b="6432" baseLine="6384" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="6230" r="2434" b="6389">tokens</wd>

<space/>

<wd l="2491" t="6230" r="2822" b="6389">that</wd>

<space/>

<wd l="2866" t="6230" r="3283" b="6389">need</wd>

<space/>

<wd l="3326" t="6254" r="3494" b="6389">to</wd>

<space/>

<wd l="3547" t="6230" r="3749" b="6389">be</wd>

<space/>

<wd l="3802" t="6230" r="4541" b="6432">replaced</wd>

<space/>

<wd l="4589" t="6230" r="4800" b="6432">by</wd>

<space/>

<wd l="4858" t="6283" r="4954" b="6389">a</wd>

<space/>

<wd l="5002" t="6283" r="5352" b="6389">new</wd>

<space/>

<wd l="5405" t="6283" r="5794" b="6389">non-</wd>

</ln>

<ln l="1882" t="6504" r="5794" b="6706" baseLine="6653" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="6528" r="2419" b="6706">empty</wd>

<space/>

<wd l="2520" t="6504" r="3005" b="6662">token</wd>

<space/>

<wd l="3106" t="6504" r="3418" b="6662">and</wd>

<space/>

<wd l="3514" t="6504" r="3778" b="6662">the</wd>

<space/>

<wd l="3888" t="6528" r="4488" b="6706">system</wd>

<space/>

<wd l="4584" t="6504" r="5352" b="6706">correctly</wd>

<space/>

<wd l="5453" t="6557" r="5794" b="6706">pre-</wd>

</ln>

<ln l="1882" t="6773" r="3240" b="6931" baseLine="6922" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="6773" r="2280" b="6931">dicts</wd>

<space/>

<wd l="2342" t="6773" r="2650" b="6931">this</wd>

<space/>

<wd l="2712" t="6773" r="3240" b="6931">token.</wd>

</ln>

</para>

<para l="1675" t="7243" r="5818" b="8798" alignment="justified" li="432" spaceBefore="202" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="7243" r="5794" b="7445" baseLine="7392" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1675" t="7248" r="1877" b="7392">•</wd>

<tab position="1756"/>

<wd l="1877" t="7243" r="2597" b="7402">Number</wd>

<space/>

<wd l="2645" t="7243" r="2837" b="7402">of</wd>

<space/>

<wd l="2875" t="7243" r="3432" b="7402">tokens</wd>

<space/>

<wd l="3490" t="7243" r="4181" b="7445">needing</wd>

<space/>

<wd l="4234" t="7243" r="5477" b="7430">normalisation,</wd>

<space/>

<wd l="5539" t="7243" r="5794" b="7402">i.e.</wd>

<space/>

</ln>

<ln l="1877" t="7517" r="5794" b="7718" baseLine="7666" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="7517" r="2434" b="7675">tokens</wd>

<space/>

<wd l="2525" t="7517" r="2851" b="7675">that</wd>

<space/>

<wd l="2933" t="7570" r="3197" b="7675">are</wd>

<space/>

<wd l="3274" t="7517" r="4051" b="7675">modified</wd>

<space/>

<wd l="4133" t="7517" r="4301" b="7670">in</wd>

<space/>

<wd l="4382" t="7517" r="4646" b="7675">the</wd>

<space/>

<wd l="4733" t="7517" r="5117" b="7718">gold</wd>

<space/>

<wd l="5198" t="7541" r="5794" b="7718">output.</wd>

<space/>

</ln>

<ln l="1877" t="7786" r="5808" b="7987" baseLine="7934" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="7790" r="2698" b="7973">However,</wd>

<space/>

<wd l="2770" t="7786" r="3283" b="7987">again,</wd>

<space/>

<wd l="3350" t="7786" r="3912" b="7944">tokens</wd>

<space/>

<wd l="3974" t="7786" r="4306" b="7944">that</wd>

<space/>

<wd l="4363" t="7838" r="4627" b="7944">are</wd>

<space/>

<wd l="4685" t="7810" r="4853" b="7944">to</wd>

<space/>

<wd l="4910" t="7786" r="5117" b="7944">be</wd>

<space/>

<wd l="5179" t="7786" r="5808" b="7944">deleted</wd>

<space/>

</ln>

<ln l="1882" t="8054" r="5798" b="8256" baseLine="8208" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="8107" r="2141" b="8213">are</wd>

<space/>

<wd l="2227" t="8054" r="2938" b="8256">ignored,</wd>

<space/>

<wd l="3043" t="8107" r="3341" b="8256">e.g.</wd>

<space/>

<wd l="3442" t="8054" r="3590" b="8208">“l</wd>

<space/>

<wd l="3682" t="8107" r="3782" b="8213">o</wd>

<space/>

<wd l="3869" t="8107" r="3974" b="8213">v</wd>

<space/>

<wd l="4066" t="8059" r="4248" b="8213">e”</wd>

<space/>

<wd l="4339" t="8078" r="4502" b="8213">to</wd>

<space/>

<wd l="4594" t="8054" r="5146" b="8213">“love”</wd>

<space/>

<wd l="5242" t="8078" r="5798" b="8213">counts</wd>

<space/>

</ln>

<ln l="1882" t="8328" r="5818" b="8530" baseLine="8477" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="8381" r="2050" b="8486">as</wd>

<space/>

<wd l="2126" t="8381" r="2438" b="8486">one</wd>

<space/>

<wd l="2506" t="8352" r="2966" b="8486">event</wd>

<space/>

<wd l="3034" t="8328" r="3413" b="8530">only</wd>

<space/>

<wd l="3485" t="8328" r="4099" b="8530">despite</wd>

<space/>

<wd l="4162" t="8328" r="4430" b="8486">the</wd>

<space/>

<wd l="4493" t="8328" r="5563" b="8530">replacement</wd>

<space/>

<wd l="5630" t="8328" r="5818" b="8486">of</wd>

<space/>

</ln>

<ln l="1877" t="8597" r="4642" b="8798" baseLine="8750" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="8597" r="2314" b="8755">three</wd>

<space/>

<wd l="2366" t="8597" r="2928" b="8755">tokens</wd>

<space/>

<wd l="2990" t="8597" r="3379" b="8755">with</wd>

<space/>

<wd l="3437" t="8621" r="3974" b="8798">empty</wd>

<space/>

<wd l="4032" t="8597" r="4642" b="8755">tokens.</wd>

</ln>

</para>

<para l="1675" t="9067" r="5808" b="9811" alignment="justified" li="432" spaceBefore="200" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="9067" r="5794" b="9269" baseLine="9221" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="9072" r="1877" b="9221">•</wd>

<tab position="1758"/>

<wd l="1877" t="9067" r="2213" b="9226">The</wd>

<space/>

<wd l="2304" t="9067" r="2971" b="9226">number</wd>

<space/>

<wd l="3062" t="9067" r="3250" b="9226">of</wd>

<space/>

<wd l="3322" t="9067" r="3883" b="9226">tokens</wd>

<space/>

<wd l="3979" t="9067" r="4757" b="9226">modified</wd>

<space/>

<wd l="4838" t="9067" r="5054" b="9269">by</wd>

<space/>

<wd l="5155" t="9091" r="5794" b="9269">system,</wd>

<space/>

</ln>

<ln l="1877" t="9341" r="5808" b="9499" baseLine="9490" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="9341" r="2131" b="9499">i.e.</wd>

<space/>

<wd l="2246" t="9341" r="2803" b="9499">tokens</wd>

<space/>

<wd l="2914" t="9341" r="3173" b="9499">for</wd>

<space/>

<wd l="3269" t="9341" r="3802" b="9499">which</wd>

<space/>

<wd l="3907" t="9394" r="4003" b="9499">a</wd>

<space/>

<wd l="4109" t="9341" r="5122" b="9499">substitution</wd>

<space/>

<wd l="5218" t="9341" r="5611" b="9499">with</wd>

<space/>

<wd l="5712" t="9394" r="5808" b="9499">a</wd>

<space/>

</ln>

<ln l="1877" t="9610" r="5712" b="9811" baseLine="9763" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="9634" r="2818" b="9811">non-empty</wd>

<space/>

<wd l="2875" t="9610" r="3360" b="9768">token</wd>

<space/>

<wd l="3413" t="9610" r="3552" b="9768">is</wd>

<space/>

<wd l="3614" t="9610" r="4416" b="9811">proposed</wd>

<space/>

<wd l="4469" t="9610" r="4685" b="9811">by</wd>

<space/>

<wd l="4742" t="9610" r="5006" b="9768">the</wd>

<space/>

<wd l="5074" t="9634" r="5712" b="9811">system.</wd>

</ln>

</para>

<para l="1440" t="10080" r="5808" b="11323" alignment="justified" spaceBefore="196" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="10080" r="5794" b="10282" baseLine="10234" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="10080" r="1973" b="10238">Based</wd>

<space/>

<wd l="2035" t="10133" r="2251" b="10238">on</wd>

<space/>

<wd l="2304" t="10080" r="2755" b="10238">these</wd>

<space/>

<wd l="2813" t="10080" r="3605" b="10267">numbers,</wd>

<space/>

<wd l="3677" t="10080" r="4517" b="10282">precision,</wd>

<space/>

<wd l="4589" t="10080" r="5064" b="10238">recall</wd>

<space/>

<wd l="5136" t="10080" r="5448" b="10238">and</wd>

<space/>

<wd l="5501" t="10085" r="5794" b="10234">F1-</wd>

<space/>

</ln>

<ln l="1450" t="10354" r="5808" b="10555" baseLine="10502" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="10406" r="1901" b="10512">score</wd>

<space/>

<wd l="1968" t="10406" r="2227" b="10512">are</wd>

<space/>

<wd l="2294" t="10354" r="3178" b="10512">calculated</wd>

<space/>

<wd l="3245" t="10354" r="3557" b="10512">and</wd>

<space/>

<wd l="3614" t="10406" r="3869" b="10512">we</wd>

<space/>

<wd l="3941" t="10354" r="4430" b="10512">select</wd>

<space/>

<wd l="4493" t="10354" r="4757" b="10512">the</wd>

<space/>

<wd l="4834" t="10378" r="5429" b="10555">system</wd>

<space/>

<wd l="5496" t="10354" r="5808" b="10512">and</wd>

<space/>

</ln>

<ln l="1445" t="10622" r="5808" b="10824" baseLine="10776" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="10622" r="2606" b="10824">configuration</wd>

<space/>

<wd l="2717" t="10646" r="2880" b="10781">to</wd>

<space/>

<wd l="3000" t="10622" r="3202" b="10781">be</wd>

<space/>

<wd l="3317" t="10622" r="3720" b="10781">used</wd>

<space/>

<wd l="3835" t="10675" r="4046" b="10781">on</wd>

<space/>

<wd l="4162" t="10622" r="4426" b="10781">the</wd>

<space/>

<wd l="4541" t="10646" r="4843" b="10781">test</wd>

<space/>

<wd l="4963" t="10646" r="5198" b="10781">set</wd>

<space/>

<wd l="5309" t="10622" r="5808" b="10781">based</wd>

<space/>

</ln>

<ln l="1445" t="10896" r="5794" b="11098" baseLine="11045" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="10949" r="1661" b="11054">on</wd>

<space/>

<wd l="1771" t="10896" r="2405" b="11098">highest</wd>

<space/>

<wd l="2525" t="10949" r="3187" b="11098">average</wd>

<space/>

<wd l="3302" t="10901" r="4066" b="11054">F1-score</wd>

<space/>

<wd l="4186" t="10949" r="4570" b="11054">over</wd>

<space/>

<wd l="4680" t="10896" r="4944" b="11054">the</wd>

<space/>

<wd l="5064" t="10896" r="5155" b="11054">5</wd>

<space/>

<wd l="5290" t="10949" r="5794" b="11054">cross-</wd>

</ln>

<ln l="1440" t="11165" r="2779" b="11323" baseLine="11314" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11165" r="2309" b="11323">validation</wd>

<space/>

<wd l="2362" t="11218" r="2779" b="11323">runs.</wd>

</ln>

</para>

<para l="1440" t="11645" r="2534" b="11818" alignment="left" spaceBefore="225" lsp="exactly" lspExact="273" language="en">

<ln l="1440" t="11645" r="2534" b="11818" baseLine="11808" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="16">

<wd l="1440" t="11645" r="1555" b="11818">3</wd>

<space/>

<wd l="1805" t="11650" r="2534" b="11818">Results</wd>

</ln>

</para>

<para l="1440" t="12091" r="5808" b="14731" alignment="justified" spaceBefore="156" spaceAfter="124" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="12091" r="5803" b="12293" baseLine="12240" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="12096" r="1723" b="12250">We</wd>

<space/>

<wd l="1795" t="12144" r="2083" b="12250">use</wd>

<space/>

<wd l="2160" t="12091" r="2957" b="12250">character</wd>

<space/>

<wd l="3029" t="12144" r="3677" b="12293">n-gram</wd>

<space/>

<wd l="3744" t="12091" r="4531" b="12293">language</wd>

<space/>

<wd l="4598" t="12091" r="5222" b="12250">models</wd>

<space/>

<wd l="5299" t="12091" r="5472" b="12245">in</wd>

<space/>

<wd l="5539" t="12091" r="5803" b="12250">the</wd>

<space/>

</ln>

<ln l="1440" t="12360" r="5803" b="12562" baseLine="12509" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="12360" r="1910" b="12562">noisy</wd>

<space/>

<wd l="1997" t="12360" r="2664" b="12518">channel</wd>

<space/>

<wd l="2746" t="12360" r="3288" b="12518">model</wd>

<space/>

<wd l="3370" t="12360" r="3629" b="12518">for</wd>

<space/>

<wd l="3706" t="12360" r="4536" b="12518">candidate</wd>

<space/>

<wd l="4622" t="12360" r="5434" b="12518">selection.</wd>

<space/>

<wd l="5582" t="12365" r="5803" b="12518">To</wd>

<space/>

</ln>

<ln l="1445" t="12629" r="5794" b="12830" baseLine="12782" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="12629" r="2088" b="12787">address</wd>

<space/>

<wd l="2170" t="12629" r="2837" b="12830">sparsity</wd>

<space/>

<wd l="2909" t="12629" r="3101" b="12787">of</wd>

<space/>

<wd l="3158" t="12629" r="3518" b="12787">data</wd>

<space/>

<wd l="3581" t="12629" r="3907" b="12787">that</wd>

<space/>

<wd l="3979" t="12629" r="4464" b="12787">arises</wd>

<space/>

<wd l="4536" t="12629" r="5011" b="12787">when</wd>

<space/>

<wd l="5074" t="12653" r="5376" b="12787">test</wd>

<space/>

<wd l="5453" t="12682" r="5794" b="12787">sen-</wd>

</ln>

<ln l="1440" t="12902" r="5808" b="13104" baseLine="13051" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="12926" r="1978" b="13061">tences</wd>

<space/>

<wd l="2059" t="12902" r="2698" b="13061">contain</wd>

<space/>

<wd l="2770" t="12955" r="3494" b="13104">n-grams</wd>

<space/>

<wd l="3571" t="12902" r="3902" b="13061">that</wd>

<space/>

<wd l="3970" t="12955" r="4234" b="13061">are</wd>

<space/>

<wd l="4301" t="12955" r="4642" b="13061">rare</wd>

<space/>

<wd l="4714" t="12955" r="4896" b="13061">or</wd>

<space/>

<wd l="4963" t="12955" r="5568" b="13061">unseen</wd>

<space/>

<wd l="5635" t="12902" r="5808" b="13056">in</wd>

<space/>

</ln>

<ln l="1440" t="13171" r="5803" b="13373" baseLine="13325" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="13171" r="1704" b="13330">the</wd>

<space/>

<wd l="1771" t="13171" r="2448" b="13373">training</wd>

<space/>

<wd l="2520" t="13171" r="2923" b="13358">data,</wd>

<space/>

<wd l="3000" t="13224" r="3254" b="13330">we</wd>

<space/>

<wd l="3317" t="13195" r="3557" b="13373">try</wd>

<space/>

<wd l="3624" t="13171" r="4690" b="13358">Witten-Bell,</wd>

<space/>

<wd l="4771" t="13176" r="5803" b="13373">Keyser-Ney</wd>

<space/>

</ln>

<ln l="1445" t="13445" r="5794" b="13646" baseLine="13594" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="13445" r="1757" b="13603">and</wd>

<space/>

<wd l="1838" t="13445" r="2971" b="13646">Good-Turing</wd>

<space/>

<wd l="3062" t="13445" r="4018" b="13646">smoothing.</wd>

<space/>

<wd l="4166" t="13445" r="4646" b="13603">Table</wd>

<space/>

<wd l="4747" t="13450" r="4810" b="13598">1</wd>

<space/>

<wd l="4925" t="13445" r="5443" b="13603">shows</wd>

<space/>

<wd l="5534" t="13498" r="5794" b="13603">av-</wd>

</ln>

<ln l="1445" t="13714" r="5803" b="13915" baseLine="13867" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="13766" r="1910" b="13915">erage</wd>

<space/>

<wd l="2016" t="13714" r="3398" b="13872">cross-validation</wd>

<space/>

<wd l="3494" t="13714" r="4373" b="13915">perplexity</wd>

<space/>

<wd l="4474" t="13714" r="4733" b="13872">for</wd>

<space/>

<wd l="4824" t="13714" r="5270" b="13872">these</wd>

<space/>

<wd l="5371" t="13714" r="5803" b="13872">three</wd>

<space/>

</ln>

<ln l="1450" t="13987" r="5803" b="14189" baseLine="14136" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1450" t="13987" r="2357" b="14189">smoothing</wd>

<space/>

<wd l="2453" t="13987" r="3182" b="14146">methods</wd>

<space/>

<wd l="3288" t="13987" r="3600" b="14146">and</wd>

<space/>

<wd l="3691" t="14040" r="3811" b="14146">n</wd>

<space/>

<wd l="3955" t="14059" r="4104" b="14112">=</wd>

<space/>

<wd l="4253" t="13992" r="4397" b="14184">2,</wd>

<space/>

<wd l="4459" t="14117" r="4675" b="14184">...,</wd>

<space/>

<wd l="4733" t="13992" r="4877" b="14146">6.</wd>

<space/>

<wd l="5069" t="13992" r="5501" b="14146">Over</wd>

<space/>

<wd l="5592" t="13987" r="5803" b="14146">all</wd>

<space/>

</ln>

<ln l="1445" t="14256" r="5803" b="14458" baseLine="14410" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="14256" r="1757" b="14414">five</wd>

<space/>

<wd l="1872" t="14256" r="3259" b="14414">cross-validation</wd>

<space/>

<wd l="3370" t="14256" r="3850" b="14443">folds,</wd>

<space/>

<wd l="3984" t="14256" r="4248" b="14414">the</wd>

<space/>

<wd l="4363" t="14256" r="5150" b="14458">language</wd>

<space/>

<wd l="5261" t="14256" r="5803" b="14414">model</wd>

<space/>

</ln>

<ln l="1440" t="14530" r="5808" b="14731" baseLine="14678" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="14530" r="1771" b="14688">that</wd>

<space/>

<wd l="1906" t="14530" r="2342" b="14731">gives</wd>

<space/>

<wd l="2486" t="14530" r="2750" b="14688">the</wd>

<space/>

<wd l="2885" t="14530" r="3451" b="14688">lowest</wd>

<space/>

<wd l="3581" t="14530" r="4459" b="14731">perplexity</wd>

<space/>

<wd l="4594" t="14530" r="5069" b="14688">when</wd>

<space/>

<wd l="5198" t="14530" r="5808" b="14688">trained</wd>

</ln>

</para>

<rulerline l="1440" t="14870" r="2640" b="14870" type="single" width="10" color="000000"/>

<para l="1440" t="14933" r="5798" b="15264" alignment="justified" spaceBefore="49" lsp="exactly" lspExact="197" language="en">

<ln l="1445" t="14933" r="5798" b="15106" baseLine="15058">

<wd l="1445" t="14938" r="1901" b="15067"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">n</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">-best</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="1963" t="14938" r="2184" b="15067">list</wd>

<space/>

<wd l="2246" t="14938" r="2702" b="15067">before</wd>

<space/>

<wd l="2770" t="14938" r="3389" b="15106">applying</wd>

<space/>

<wd l="3456" t="14976" r="3821" b="15067">more</wd>

<space/>

<wd l="3888" t="14938" r="4498" b="15106">complex</wd>

<space/>

<wd l="4565" t="14938" r="5078" b="15067">models</wd>

<space/>

<wd l="5146" t="14957" r="5285" b="15067">to</wd>

<space/>

<wd l="5347" t="14938" r="5798" b="15067">token-</wd>

</run>

</ln>

<ln l="1440" t="15130" r="3230" b="15264" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="15134" r="1781" b="15264">level</wd>

<space/>

<wd l="1824" t="15134" r="2510" b="15264">candidate</wd>

<space/>

<wd l="2563" t="15134" r="3230" b="15264">selection.</wd>

</ln>

</para>

</column>

<column l="6144" t="1248" r="10526" b="15317">

<table l="6605" t="1258" r="10051" b="2659" alignment="left" li="461" ri="475" spaceBefore="10" spaceAfter="33">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>480</gridCol>

<gridCol>446</gridCol>

<gridCol>836</gridCol>

<gridCol>840</gridCol>

<gridCol>844</gridCol>

<gridRow>283</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>278</gridRow>

<gridRow>283</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6605" t="1258" r="7085" b="1541" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7085" t="1258" r="7531" b="1541" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7886" t="1296" r="8006" b="1454" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="7886" t="1296" r="8006" b="1454" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="7886" t="1306" r="8006" b="1454">P</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8717" t="1296" r="8861" b="1454" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="8717" t="1296" r="8861" b="1454" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8717" t="1306" r="8861" b="1454">R</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9514" t="1296" r="9720" b="1454" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="9514" t="1296" r="9720" b="1454" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-9">

<wd l="9514" t="1306" r="9720" b="1454">F1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6734" t="1574" r="6941" b="1766" alignment="centered" spaceAfter="11" lsp="exactly" lspExact="262" language="en">

<ln l="6734" t="1574" r="6941" b="1766" baseLine="1750">

<wd l="6734" t="1579" r="6941" b="1766"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="-2">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-2">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-2"><nl orig="true"/>

</run>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7205" t="1579" r="7411" b="1738" alignment="centered" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<ln l="7205" t="1579" r="7411" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="7205" t="1584" r="7411" b="1738">W</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7675" t="1579" r="8222" b="1738" alignment="left" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<tabs position="7675"/>

<ln l="7675" t="1579" r="8222" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7675" t="1584" r="8222" b="1738">83.2%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8510" t="1579" r="9062" b="1738" alignment="left" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<tabs position="8510"/>

<ln l="8510" t="1579" r="9062" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="8510" t="1584" r="9062" b="1738">37.7%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9350" t="1579" r="9898" b="1738" alignment="left" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<tabs position="9350"/>

<ln l="9350" t="1579" r="9898" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="9350" t="1579" r="9898" b="1738">51.9%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6734" t="1853" r="6941" b="2045" alignment="centered" spaceAfter="5" lsp="exactly" lspExact="263" language="en">

<ln l="6734" t="1853" r="6941" b="2045" baseLine="2030">

<wd l="6734" t="1858" r="6941" b="2045"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="-2">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-2">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-2"><nl orig="true"/>

</run>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7253" t="1858" r="7358" b="2016" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="7253" t="1858" r="7358" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="7253" t="1862" r="7358" b="2016">S</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7675" t="1858" r="8222" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="7675"/>

<ln l="7675" t="1858" r="8222" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7675" t="1862" r="8222" b="2016">83.2%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8506" t="1858" r="9062" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="8506"/>

<ln l="8506" t="1858" r="9062" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="8506" t="1862" r="9062" b="2016">41.0%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9350" t="1858" r="9898" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="9350"/>

<ln l="9350" t="1858" r="9898" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="9350" t="1858" r="9898" b="2016">54.9%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6734" t="2131" r="6946" b="2323" alignment="centered" spaceAfter="12" lsp="exactly" lspExact="266" language="en">

<ln l="6734" t="2131" r="6946" b="2323" baseLine="2312">

<wd l="6734" t="2136" r="6946" b="2323"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7205" t="2136" r="7411" b="2294" alignment="centered" spaceAfter="28" lsp="exactly" lspExact="250" language="en">

<ln l="7205" t="2136" r="7411" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="7205" t="2141" r="7411" b="2294">W</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7651" t="2136" r="8222" b="2294" alignment="left" spaceAfter="26" lsp="exactly" lspExact="252" language="en">

<tabs position="7651"/>

<ln l="7651" t="2136" r="8222" b="2294" baseLine="2290" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-10">

<wd l="7651" t="2136" r="8222" b="2294">85.9%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8506" t="2136" r="9062" b="2294" alignment="left" spaceAfter="28" lsp="exactly" lspExact="250" language="en">

<tabs position="8506"/>

<ln l="8506" t="2136" r="9062" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="8506" t="2141" r="9062" b="2294">47.7%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9350" t="2136" r="9898" b="2294" alignment="left" spaceAfter="28" lsp="exactly" lspExact="250" language="en">

<tabs position="9350"/>

<ln l="9350" t="2136" r="9898" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="9350" t="2136" r="9898" b="2294">61.4%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6734" t="2410" r="6946" b="2602" alignment="centered" spaceAfter="6" lsp="exactly" lspExact="267" language="en">

<ln l="6734" t="2410" r="6946" b="2602" baseLine="2590">

<wd l="6734" t="2414" r="6946" b="2602"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7253" t="2414" r="7358" b="2573" alignment="centered" spaceAfter="23" lsp="exactly" lspExact="250" language="en">

<ln l="7253" t="2414" r="7358" b="2573" baseLine="2568" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="7253" t="2419" r="7358" b="2573">S</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7675" t="2414" r="8222" b="2573" alignment="left" spaceAfter="23" lsp="exactly" lspExact="250" language="en">

<tabs position="7675"/>

<ln l="7675" t="2414" r="8222" b="2573" baseLine="2568" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7675" t="2414" r="8222" b="2573">85.7%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8491" t="2414" r="9062" b="2573" alignment="left" spaceAfter="21" lsp="exactly" lspExact="252" language="en">

<tabs position="8491"/>

<ln l="8491" t="2414" r="9062" b="2573" baseLine="2568" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-10">

<wd l="8491" t="2414" r="9062" b="2573">56.1%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9331" t="2414" r="9902" b="2573" alignment="left" spaceAfter="21" lsp="exactly" lspExact="252" language="en">

<tabs position="9331"/>

<ln l="9331" t="2414" r="9902" b="2573" baseLine="2568" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-10">

<wd l="9331" t="2414" r="9902" b="2573">67.8%</wd>

</ln>

</para>

</cell>

</table>

<rulerline l="6610" t="2698" r="10051" b="2698" type="single" width="10" color="000000"/>

<para l="6144" t="2909" r="10517" b="4968" alignment="justified" spaceBefore="161" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="2909" r="10512" b="3115" baseLine="3062" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2914" r="6624" b="3072">Table</wd>

<space/>

<wd l="6691" t="2918" r="6840" b="3072">2:</wd>

<space/>

<wd l="6941" t="2918" r="7656" b="3115">Average</wd>

<space/>

<wd l="7723" t="2914" r="9110" b="3072">cross-validation</wd>

<space/>

<wd l="9168" t="2914" r="9730" b="3072">results</wd>

<space/>

<wd l="9806" t="2966" r="10186" b="3072">over</wd>

<space/>

<wd l="10243" t="2914" r="10512" b="3072">the</wd>

<space/>

</ln>

<ln l="6149" t="3178" r="10502" b="3341" baseLine="3336" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="3182" r="6466" b="3341">five</wd>

<space/>

<wd l="6586" t="3182" r="7968" b="3341">cross-validation</wd>

<space/>

<wd l="8083" t="3235" r="8448" b="3341">runs</wd>

<space/>

<wd l="8573" t="3182" r="8832" b="3341">for</wd>

<space/>

<wd l="8942" t="3182" r="9768" b="3341">transition</wd>

<space/>

<wd l="9878" t="3182" r="10502" b="3341">models</wd>

<space/>

</ln>

<ln l="6149" t="3451" r="10517" b="3658" baseLine="3607">

<wd l="6149" t="3456" r="6360" b="3643"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6480" t="3456" r="6792" b="3614">and</wd>

<space/>

</run>

<wd l="6888" t="3456" r="7162" b="3643"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">2</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="7272" t="3461" r="7478" b="3614">W</wd>

<space/>

<wd l="7579" t="3523" r="7694" b="3586">=</wd>

<space/>

<wd l="7790" t="3456" r="8362" b="3658">Wapiti</wd>

<space/>

<wd l="8462" t="3461" r="8870" b="3614">CRF</wd>

<space/>

<wd l="8971" t="3509" r="9763" b="3658">sequence</wd>

<space/>

<wd l="9854" t="3456" r="10517" b="3614">labeller</wd>

<space/>

</run>

</ln>

<ln l="6154" t="3725" r="10507" b="3926" baseLine="3878" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="3725" r="6826" b="3922">(trained</wd>

<space/>

<wd l="6917" t="3778" r="7133" b="3883">on</wd>

<space/>

<wd l="7229" t="3725" r="7608" b="3926">only</wd>

<space/>

<wd l="7723" t="3725" r="8093" b="3883">16%</wd>

<space/>

<wd l="8194" t="3725" r="8386" b="3883">of</wd>

<space/>

<wd l="8462" t="3725" r="8726" b="3883">the</wd>

<space/>

<wd l="8818" t="3725" r="9494" b="3926">training</wd>

<space/>

<wd l="9590" t="3725" r="10066" b="3922">data),</wd>

<space/>

<wd l="10181" t="3730" r="10286" b="3883">S</wd>

<space/>

<wd l="10392" t="3792" r="10507" b="3854">=</wd>

<space/>

</ln>

<ln l="6149" t="3998" r="10517" b="4200" baseLine="4147" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="4003" r="6768" b="4200">Sequor</wd>

<space/>

<wd l="6859" t="3998" r="7848" b="4200">generalised</wd>

<space/>

<wd l="7939" t="4022" r="8875" b="4200">perceptron</wd>

<space/>

<wd l="8976" t="4051" r="9763" b="4200">sequence</wd>

<space/>

<wd l="9854" t="3998" r="10517" b="4157">labeller</wd>

<space/>

</ln>

<ln l="6154" t="4267" r="10502" b="4469" baseLine="4421" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="4267" r="6826" b="4464">(trained</wd>

<space/>

<wd l="6907" t="4320" r="7118" b="4426">on</wd>

<space/>

<wd l="7200" t="4267" r="7589" b="4426">64%</wd>

<space/>

<wd l="7680" t="4267" r="7867" b="4426">of</wd>

<space/>

<wd l="7930" t="4267" r="8198" b="4426">the</wd>

<space/>

<wd l="8275" t="4267" r="8952" b="4469">training</wd>

<space/>

<wd l="9034" t="4267" r="9509" b="4464">data),</wd>

<space/>

<wd l="9605" t="4272" r="9725" b="4421">P</wd>

<space/>

<wd l="9806" t="4334" r="9922" b="4397">=</wd>

<space/>

<wd l="10003" t="4267" r="10502" b="4469">preci-</wd>

</ln>

<ln l="6154" t="4541" r="10502" b="4728" baseLine="4690" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="4541" r="6552" b="4728">sion,</wd>

<space/>

<wd l="6624" t="4546" r="6768" b="4694">R</wd>

<space/>

<wd l="6835" t="4608" r="6950" b="4670">=</wd>

<space/>

<wd l="7013" t="4541" r="7541" b="4728">recall,</wd>

<space/>

<wd l="7608" t="4546" r="7819" b="4694">F1</wd>

<space/>

<wd l="7906" t="4608" r="8021" b="4670">=</wd>

<space/>

<wd l="8083" t="4546" r="8290" b="4694">F1</wd>

<space/>

<wd l="8371" t="4594" r="9139" b="4699">measure.</wd>

<space/>

<wd l="9240" t="4541" r="10008" b="4699">Standard</wd>

<space/>

<wd l="10075" t="4541" r="10502" b="4699">devi-</wd>

</ln>

<ln l="6149" t="4810" r="8525" b="4968" baseLine="4963">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="4810" r="6586" b="4968">ation</wd>

<space/>

<wd l="6643" t="4867" r="6763" b="4968">σ</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><wd l="6845" t="4824" r="6984" b="4954">≤</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7066" t="4814" r="7440" b="4968">0.03</wd>

<space/>

<wd l="7502" t="4810" r="7762" b="4968">for</wd>

<space/>

<wd l="7814" t="4810" r="8021" b="4968">all</wd>

<space/>

<wd l="8088" t="4810" r="8525" b="4968">cells.</wd>

</run>

</ln>

</para>

<para l="6144" t="5472" r="10507" b="7032" alignment="justified" spaceBefore="390" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="5472" r="10507" b="5674" baseLine="5626" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="5525" r="6365" b="5630">on</wd>

<space/>

<wd l="6461" t="5472" r="6725" b="5630">the</wd>

<space/>

<wd l="6826" t="5472" r="7502" b="5674">training</wd>

<space/>

<wd l="7608" t="5472" r="7968" b="5630">data</wd>

<space/>

<wd l="8069" t="5472" r="8376" b="5630">and</wd>

<space/>

<wd l="8477" t="5472" r="9120" b="5674">applied</wd>

<space/>

<wd l="9211" t="5496" r="9379" b="5630">to</wd>

<space/>

<wd l="9480" t="5472" r="9744" b="5630">the</wd>

<space/>

<wd l="9845" t="5472" r="10507" b="5630">internal</wd>

<space/>

</ln>

<ln l="6144" t="5746" r="10502" b="5947" baseLine="5894" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5770" r="6451" b="5904">test</wd>

<space/>

<wd l="6576" t="5770" r="6811" b="5904">set</wd>

<space/>

<wd l="6926" t="5746" r="7066" b="5904">is</wd>

<space/>

<wd l="7190" t="5746" r="7454" b="5904">the</wd>

<space/>

<wd l="7579" t="5746" r="8208" b="5947">6-gram</wd>

<space/>

<wd l="8323" t="5746" r="8866" b="5904">model</wd>

<space/>

<wd l="8986" t="5746" r="9374" b="5904">with</wd>

<space/>

<wd l="9490" t="5746" r="10502" b="5904">Witten-Bell</wd>

<space/>

</ln>

<ln l="6154" t="6014" r="10502" b="6216" baseLine="6168" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="6014" r="7109" b="6216">smoothing.</wd>

<space/>

<wd l="7282" t="6014" r="7666" b="6173">This</wd>

<space/>

<wd l="7762" t="6014" r="8515" b="6173">confirms</wd>

<space/>

<wd l="8606" t="6014" r="8875" b="6173">the</wd>

<space/>

<wd l="8962" t="6014" r="10502" b="6173">recommendations</wd>

<space/>

</ln>

<ln l="6144" t="6288" r="10502" b="6446" baseLine="6437" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6288" r="6317" b="6442">in</wd>

<space/>

<wd l="6394" t="6288" r="6662" b="6446">the</wd>

<space/>

<wd l="6749" t="6293" r="7406" b="6446">SRILM</wd>

<space/>

<wd l="7493" t="6288" r="8789" b="6446">documentation</wd>

<space/>

<wd l="8866" t="6312" r="9034" b="6446">to</wd>

<space/>

<wd l="9120" t="6341" r="9408" b="6446">use</wd>

<space/>

<wd l="9490" t="6288" r="10502" b="6446">Witten-Bell</wd>

<space/>

</ln>

<ln l="6154" t="6557" r="10502" b="6758" baseLine="6706" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="6557" r="7066" b="6758">smoothing</wd>

<space/>

<wd l="7142" t="6557" r="7618" b="6715">when</wd>

<space/>

<wd l="7694" t="6557" r="7963" b="6715">the</wd>

<space/>

<wd l="8040" t="6557" r="8995" b="6758">vocabulary</wd>

<space/>

<wd l="9077" t="6557" r="9216" b="6715">is</wd>

<space/>

<wd l="9312" t="6557" r="9773" b="6715">small</wd>

<space/>

<wd l="9859" t="6557" r="10253" b="6715">such</wd>

<space/>

<wd l="10334" t="6610" r="10502" b="6715">as</wd>

<space/>

</ln>

<ln l="6144" t="6830" r="9888" b="7032" baseLine="6979" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6830" r="6619" b="6989">when</wd>

<space/>

<wd l="6672" t="6830" r="7392" b="7032">building</wd>

<space/>

<wd l="7454" t="6883" r="7550" b="6989">a</wd>

<space/>

<wd l="7608" t="6830" r="8405" b="6989">character</wd>

<space/>

<wd l="8458" t="6830" r="9245" b="7032">language</wd>

<space/>

<wd l="9298" t="6830" r="9888" b="6989">model.</wd>

</ln>

</para>

<para l="6144" t="7109" r="10512" b="10560" alignment="justified" spaceBefore="5" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="7109" r="10512" b="7267" baseLine="7258" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="7109" r="6840" b="7267">Table</wd>

<space/>

<wd l="6936" t="7114" r="7037" b="7262">2</wd>

<space/>

<wd l="7142" t="7109" r="7666" b="7267">shows</wd>

<space/>

<wd l="7766" t="7109" r="9154" b="7267">cross-validation</wd>

<space/>

<wd l="9240" t="7109" r="9802" b="7267">results</wd>

<space/>

<wd l="9902" t="7109" r="10157" b="7267">for</wd>

<space/>

<wd l="10243" t="7109" r="10512" b="7267">the</wd>

<space/>

</ln>

<ln l="6144" t="7378" r="10512" b="7579" baseLine="7526" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7378" r="6514" b="7536">four</wd>

<space/>

<wd l="6600" t="7402" r="7272" b="7579">systems</wd>

<space/>

<wd l="7358" t="7378" r="8117" b="7579">resulting</wd>

<space/>

<wd l="8203" t="7378" r="8630" b="7536">from</wd>

<space/>

<wd l="8702" t="7378" r="8971" b="7536">the</wd>

<space/>

<wd l="9058" t="7378" r="9696" b="7536">choices</wd>

<space/>

<wd l="9782" t="7378" r="10512" b="7536">between</wd>

<space/>

</ln>

<ln l="6144" t="7646" r="10507" b="7848" baseLine="7802">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="7646" r="6970" b="7805">transition</wd>

<space/>

<wd l="7032" t="7646" r="7656" b="7805">models</wd>

<space/>

</run>

<wd l="7728" t="7646" r="7934" b="7834"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="8026" t="7646" r="8338" b="7805">and</wd>

<space/>

</run>

<wd l="8400" t="7646" r="8616" b="7834"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="8698" t="7646" r="9010" b="7805">and</wd>

<space/>

<wd l="9072" t="7646" r="9542" b="7848">using</wd>

<space/>

<wd l="9605" t="7646" r="9874" b="7805">the</wd>

<space/>

<wd l="9936" t="7646" r="10507" b="7848">Wapiti</wd>

<space/>

</run>

</ln>

<ln l="6149" t="7920" r="10502" b="8122" baseLine="8069" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="7925" r="6557" b="8078">CRF</wd>

<space/>

<wd l="6682" t="7973" r="6859" b="8078">or</wd>

<space/>

<wd l="6974" t="7920" r="7238" b="8078">the</wd>

<space/>

<wd l="7363" t="7925" r="7982" b="8122">Sequor</wd>

<space/>

<wd l="8098" t="7920" r="9091" b="8122">generalised</wd>

<space/>

<wd l="9206" t="7944" r="10142" b="8122">perceptron</wd>

<space/>

<wd l="10267" t="7973" r="10502" b="8078">se-</wd>

</ln>

<ln l="6149" t="8189" r="10512" b="8390" baseLine="8342" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="8242" r="6763" b="8390">quence</wd>

<space/>

<wd l="6840" t="8189" r="7526" b="8347">labeller.</wd>

<space/>

<wd l="7675" t="8189" r="8011" b="8347">The</wd>

<space/>

<wd l="8098" t="8189" r="9048" b="8347">differences</wd>

<space/>

<wd l="9134" t="8242" r="9398" b="8347">are</wd>

<space/>

<wd l="9475" t="8213" r="9758" b="8347">not</wd>

<space/>

<wd l="9830" t="8189" r="10262" b="8390">large</wd>

<space/>

<wd l="10339" t="8189" r="10512" b="8342">in</wd>

<space/>

</ln>

<ln l="6144" t="8462" r="10502" b="8664" baseLine="8612">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="8462" r="6946" b="8664">precision</wd>

<space/>

<wd l="7037" t="8462" r="7315" b="8621">but</wd>

<space/>

<wd l="7406" t="8462" r="7666" b="8621">for</wd>

<space/>

<wd l="7752" t="8462" r="8280" b="8650">recall,</wd>

<space/>

<wd l="8395" t="8462" r="8664" b="8621">the</wd>

<space/>

<wd l="8755" t="8462" r="9298" b="8621">model</wd>

<space/>

</run>

<wd l="9398" t="8462" r="9610" b="8650"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="9725" t="8462" r="10502" b="8664">performs</wd>

<space/>

</run>

</ln>

<ln l="6144" t="8731" r="10502" b="8933" baseLine="8885" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8731" r="6744" b="8933">poorly.</wd>

<space/>

<wd l="6893" t="8731" r="7301" b="8890">Also</wd>

<space/>

<wd l="7378" t="8731" r="7646" b="8890">the</wd>

<space/>

<wd l="7728" t="8736" r="8136" b="8890">CRF</wd>

<space/>

<wd l="8218" t="8731" r="9254" b="8933">consistently</wd>

<space/>

<wd l="9331" t="8731" r="9614" b="8890">has</wd>

<space/>

<wd l="9701" t="8731" r="10195" b="8890">lower</wd>

<space/>

<wd l="10267" t="8784" r="10502" b="8890">re-</wd>

</ln>

<ln l="6149" t="9005" r="10502" b="9206" baseLine="9154" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="9005" r="6451" b="9163">call</wd>

<space/>

<wd l="6538" t="9005" r="6917" b="9163">than</wd>

<space/>

<wd l="6989" t="9005" r="7258" b="9163">the</wd>

<space/>

<wd l="7334" t="9005" r="8208" b="9206">respective</wd>

<space/>

<wd l="8285" t="9029" r="9221" b="9206">perceptron</wd>

<space/>

<wd l="9298" t="9005" r="9883" b="9163">model.</wd>

<space/>

<wd l="10032" t="9010" r="10502" b="9163">Inter-</wd>

</ln>

<ln l="6149" t="9274" r="10502" b="9475" baseLine="9427" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="9274" r="6864" b="9475">estingly,</wd>

<space/>

<wd l="6936" t="9274" r="7205" b="9432">the</wd>

<space/>

<wd l="7267" t="9278" r="7675" b="9432">CRF</wd>

<space/>

<wd l="7738" t="9274" r="8467" b="9432">achieves</wd>

<space/>

<wd l="8534" t="9274" r="8890" b="9432">best</wd>

<space/>

<wd l="8947" t="9274" r="9787" b="9475">precision.</wd>

<space/>

<wd l="9888" t="9278" r="10152" b="9432">On</wd>

<space/>

<wd l="10210" t="9278" r="10502" b="9427">F1-</wd>

<space/>

</ln>

<ln l="6154" t="9547" r="10498" b="9734" baseLine="9696">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6154" t="9600" r="6648" b="9734">score,</wd>

<space/>

<wd l="6744" t="9547" r="7008" b="9706">the</wd>

<space/>

<wd l="7090" t="9547" r="7440" b="9706">best</wd>

<space/>

<wd l="7517" t="9547" r="8006" b="9706">result</wd>

<space/>

<wd l="8078" t="9547" r="8218" b="9706">is</wd>

<space/>

<wd l="8309" t="9547" r="9058" b="9706">obtained</wd>

<space/>

<wd l="9134" t="9547" r="9523" b="9706">with</wd>

<space/>

<wd l="9600" t="9547" r="10142" b="9706">model</wd>

<space/>

</run>

<wd l="10229" t="9547" r="10498" b="9734"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">2</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

</ln>

<ln l="6144" t="9816" r="10502" b="10018" baseLine="9965" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9816" r="6682" b="9974">which</wd>

<space/>

<wd l="6754" t="9816" r="7411" b="9974">reduces</wd>

<space/>

<wd l="7493" t="9816" r="7762" b="9974">the</wd>

<space/>

<wd l="7838" t="9816" r="8304" b="10018">noisy</wd>

<space/>

<wd l="8390" t="9816" r="9058" b="9974">channel</wd>

<space/>

<wd l="9139" t="9816" r="9682" b="9974">model</wd>

<space/>

<wd l="9758" t="9840" r="9922" b="9974">to</wd>

<space/>

<wd l="10013" t="9816" r="10502" b="9974">selec-</wd>

</ln>

<ln l="6144" t="10090" r="10502" b="10291" baseLine="10238" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10090" r="6485" b="10248">tion</wd>

<space/>

<wd l="6576" t="10090" r="7306" b="10248">between</wd>

<space/>

<wd l="7402" t="10142" r="8189" b="10291">sequence</wd>

<space/>

<wd l="8280" t="10090" r="9062" b="10248">modeller</wd>

<space/>

<wd l="9149" t="10090" r="10157" b="10291">hypotheses,</wd>

<space/>

<wd l="10267" t="10114" r="10502" b="10248">to-</wd>

</ln>

<ln l="6149" t="10358" r="9845" b="10560" baseLine="10507" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="10358" r="6696" b="10560">gether</wd>

<space/>

<wd l="6744" t="10358" r="7133" b="10517">with</wd>

<space/>

<wd l="7186" t="10358" r="7454" b="10517">the</wd>

<space/>

<wd l="7512" t="10363" r="8131" b="10560">Sequor</wd>

<space/>

<wd l="8194" t="10411" r="8981" b="10560">sequence</wd>

<space/>

<wd l="9034" t="10358" r="9845" b="10517">modeller.</wd>

</ln>

</para>

<para l="6149" t="10637" r="10502" b="11650" alignment="justified" spaceBefore="11" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6370" t="10637" r="10493" b="10838" baseLine="10787">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="10642" r="6634" b="10795">On</wd>

<space/>

<wd l="6706" t="10637" r="6970" b="10795">the</wd>

<space/>

<wd l="7051" t="10637" r="7430" b="10795">final</wd>

<space/>

<wd l="7507" t="10661" r="7810" b="10795">test</wd>

<space/>

<wd l="7891" t="10661" r="8170" b="10824">set,</wd>

<space/>

<wd l="8266" t="10690" r="8554" b="10795">our</wd>

<space/>

<wd l="8626" t="10637" r="8976" b="10795">best</wd>

<space/>

<wd l="9058" t="10661" r="9658" b="10838">system</wd>

<space/>

<wd l="9730" t="10637" r="10200" b="10838">using</wd>

<space/>

</run>

<wd l="10282" t="10637" r="10493" b="10824"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="6149" t="10910" r="10502" b="11112" baseLine="11059" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="10910" r="6461" b="11069">and</wd>

<space/>

<wd l="6542" t="10915" r="7157" b="11112">Sequor</wd>

<space/>

<wd l="7229" t="10910" r="7512" b="11069">has</wd>

<space/>

<wd l="7594" t="10910" r="8395" b="11112">precision</wd>

<space/>

<wd l="8482" t="10915" r="9187" b="11098">81.90%,</wd>

<space/>

<wd l="9278" t="10910" r="9754" b="11069">recall</wd>

<space/>

<wd l="9845" t="10910" r="10502" b="11069">55.09%</wd>

<space/>

</ln>

<ln l="6149" t="11179" r="10502" b="11381" baseLine="11328" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="11179" r="6461" b="11338">and</wd>

<space/>

<wd l="6523" t="11184" r="6730" b="11333">F1</wd>

<space/>

<wd l="6821" t="11179" r="7531" b="11366">65.87%,</wd>

<space/>

<wd l="7608" t="11179" r="8246" b="11381">placing</wd>

<space/>

<wd l="8309" t="11179" r="8434" b="11338">it</wd>

<space/>

<wd l="8496" t="11179" r="8861" b="11338">fifth</wd>

<space/>

<wd l="8923" t="11203" r="9202" b="11338">out</wd>

<space/>

<wd l="9264" t="11179" r="9456" b="11338">of</wd>

<space/>

<wd l="9514" t="11179" r="9754" b="11338">six</wd>

<space/>

<wd l="9830" t="11179" r="10502" b="11338">submis-</wd>

</ln>

<ln l="6154" t="11448" r="9226" b="11650" baseLine="11602" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="11448" r="6586" b="11606">sions</wd>

<space/>

<wd l="6648" t="11448" r="6821" b="11602">in</wd>

<space/>

<wd l="6874" t="11448" r="7138" b="11606">the</wd>

<space/>

<wd l="7200" t="11448" r="8390" b="11606">“constrained”</wd>

<space/>

<wd l="8453" t="11472" r="9226" b="11650">category.</wd>

</ln>

</para>

<para l="6144" t="11938" r="7579" b="12110" alignment="left" spaceBefore="230" lsp="exactly" lspExact="273" language="en">

<ln l="6144" t="11938" r="7579" b="12110" baseLine="12101" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="13">

<wd l="6144" t="11938" r="6259" b="12106">4</wd>

<space/>

<wd l="6504" t="11938" r="7579" b="12110">Discussion</wd>

</ln>

</para>

<para l="6144" t="12389" r="10512" b="13901" alignment="justified" spaceBefore="165" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="12389" r="10512" b="12590" baseLine="12538" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="12394" r="6302" b="12542">A</wd>

<space/>

<wd l="6360" t="12389" r="7075" b="12590">possible</wd>

<space/>

<wd l="7138" t="12389" r="8150" b="12590">explanation</wd>

<space/>

<wd l="8203" t="12389" r="8462" b="12547">for</wd>

<space/>

<wd l="8515" t="12389" r="8779" b="12547">the</wd>

<space/>

<wd l="8837" t="12389" r="9158" b="12547">low</wd>

<space/>

<wd l="9216" t="12389" r="9701" b="12547">recall</wd>

<space/>

<wd l="9763" t="12389" r="10512" b="12547">obtained</wd>

<space/>

</ln>

<ln l="6144" t="12658" r="10512" b="12845" baseLine="12812">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="12658" r="6533" b="12816">with</wd>

<space/>

<wd l="6595" t="12658" r="6859" b="12816">the</wd>

<space/>

</run>

<wd l="6926" t="12658" r="7138" b="12845"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">P</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7219" t="12658" r="7762" b="12816">model</wd>

<space/>

<wd l="7829" t="12658" r="7963" b="12816">is</wd>

<space/>

<wd l="8035" t="12658" r="8362" b="12816">that</wd>

<space/>

<wd l="8424" t="12658" r="8731" b="12816">this</wd>

<space/>

<wd l="8798" t="12658" r="9259" b="12816">noise</wd>

<space/>

<wd l="9322" t="12658" r="9864" b="12816">model</wd>

<space/>

<wd l="9936" t="12682" r="10512" b="12816">cannot</wd>

<space/>

</run>

</ln>

<ln l="6149" t="12931" r="10507" b="13133" baseLine="13080" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="12955" r="6806" b="13090">counter</wd>

<space/>

<wd l="6864" t="12931" r="7128" b="13090">the</wd>

<space/>

<wd l="7195" t="12931" r="7685" b="13090">effect</wd>

<space/>

<wd l="7742" t="12931" r="8074" b="13090">that</wd>

<space/>

<wd l="8141" t="12931" r="8741" b="13090">shorter</wd>

<space/>

<wd l="8813" t="12955" r="9629" b="13090">sentences</wd>

<space/>

<wd l="9706" t="12931" r="10507" b="13133">generally</wd>

<space/>

</ln>

<ln l="6144" t="13200" r="10502" b="13402" baseLine="13354" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="13200" r="6768" b="13358">receive</wd>

<space/>

<wd l="6835" t="13200" r="7397" b="13402">higher</wd>

<space/>

<wd l="7464" t="13200" r="8251" b="13402">language</wd>

<space/>

<wd l="8323" t="13200" r="8866" b="13358">model</wd>

<space/>

<wd l="8938" t="13200" r="9893" b="13402">probability</wd>

<space/>

<wd l="9974" t="13253" r="10502" b="13358">scores</wd>

<space/>

</ln>

<ln l="6149" t="13474" r="10502" b="13675" baseLine="13622" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="13474" r="6461" b="13632">and</wd>

<space/>

<wd l="6518" t="13474" r="7306" b="13632">therefore</wd>

<space/>

<wd l="7363" t="13474" r="7800" b="13632">there</wd>

<space/>

<wd l="7862" t="13474" r="7997" b="13632">is</wd>

<space/>

<wd l="8069" t="13526" r="8165" b="13632">a</wd>

<space/>

<wd l="8218" t="13474" r="9000" b="13675">tendency</wd>

<space/>

<wd l="9062" t="13498" r="9230" b="13632">to</wd>

<space/>

<wd l="9293" t="13474" r="9778" b="13675">reject</wd>

<space/>

<wd l="9840" t="13474" r="10162" b="13632">edit</wd>

<space/>

<wd l="10224" t="13526" r="10502" b="13675">op-</wd>

</ln>

<ln l="6149" t="13742" r="9667" b="13901" baseLine="13896" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="13742" r="6830" b="13901">erations</wd>

<space/>

<wd l="6893" t="13742" r="7219" b="13901">that</wd>

<space/>

<wd l="7272" t="13742" r="7762" b="13901">insert</wd>

<space/>

<wd l="7819" t="13742" r="8683" b="13901">additional</wd>

<space/>

<wd l="8746" t="13742" r="9667" b="13901">characters.</wd>

</ln>

</para>

<para l="6149" t="14021" r="10512" b="15307" alignment="justified" spaceBefore="8" fli="216" lsp="exactly" lspExact="269" language="en">

<ln l="6365" t="14021" r="10512" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6365" t="14021" r="7498" b="14208">Furthermore,</wd>

<space/>

<wd l="7579" t="14074" r="7834" b="14179">we</wd>

<space/>

<wd l="7906" t="14021" r="8573" b="14179">observe</wd>

<space/>

<wd l="8640" t="14021" r="8971" b="14179">that</wd>

<space/>

<wd l="9038" t="14074" r="9326" b="14179">our</wd>

<space/>

<wd l="9398" t="14045" r="9998" b="14222">system</wd>

<space/>

<wd l="10066" t="14021" r="10512" b="14179">often</wd>

<space/>

</ln>

<ln l="6149" t="14294" r="10498" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="14294" r="6768" b="14496">assigns</wd>

<space/>

<wd l="6826" t="14294" r="7517" b="14453">inserted</wd>

<space/>

<wd l="7565" t="14318" r="7891" b="14453">text</wd>

<space/>

<wd l="7939" t="14318" r="8107" b="14453">to</wd>

<space/>

<wd l="8160" t="14294" r="8424" b="14453">the</wd>

<space/>

<wd l="8477" t="14347" r="9029" b="14496">wrong</wd>

<space/>

<wd l="9091" t="14294" r="9984" b="14453">evaluation</wd>

<space/>

<wd l="10032" t="14294" r="10498" b="14482">units,</wd>

<space/>

</ln>

<ln l="6149" t="14563" r="10512" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="14616" r="6451" b="14765">e.g.</wd>

<space/>

<wd l="6518" t="14563" r="7277" b="14765">inserting</wd>

<space/>

<wd l="7339" t="14563" r="7608" b="14722">the</wd>

<space/>

<wd l="7675" t="14563" r="8160" b="14765">string</wd>

<space/>

<wd l="8222" t="14568" r="8309" b="14626">“</wd>

<space/>

<wd l="8376" t="14563" r="9134" b="14765">laughing</wd>

<space/>

<wd l="9202" t="14568" r="9566" b="14722">out”</wd>

<space/>

<wd l="9629" t="14563" r="10186" b="14722">before</wd>

<space/>

<wd l="10243" t="14563" r="10512" b="14722">the</wd>

<space/>

</ln>

<ln l="6154" t="14837" r="10507" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6154" t="14890" r="6629" b="15038">space</wd>

<space/>

<wd l="6701" t="14837" r="7258" b="14995">before</wd>

<space/>

<wd l="7330" t="14837" r="7742" b="14995">“lol”</wd>

<space/>

<wd l="7824" t="14837" r="8136" b="14995">and</wd>

<space/>

<wd l="8203" t="14837" r="8582" b="14995">then</wd>

<space/>

<wd l="8650" t="14837" r="9456" b="15038">replacing</wd>

<space/>

<wd l="9538" t="14837" r="10138" b="14995">second</wd>

<space/>

<wd l="10210" t="14842" r="10507" b="14990">“L”</wd>

<space/>

</ln>

<ln l="6149" t="15106" r="10507" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="15106" r="6341" b="15264">of</wd>

<space/>

<wd l="6384" t="15106" r="6802" b="15264">“lol”</wd>

<space/>

<wd l="6859" t="15106" r="7248" b="15264">with</wd>

<space/>

<wd l="7306" t="15106" r="7757" b="15264">“ud”.</wd>

<space/>

<wd l="7834" t="15106" r="8218" b="15264">This</wd>

<space/>

<wd l="8275" t="15106" r="8414" b="15264">is</wd>

<space/>

<wd l="8477" t="15130" r="8755" b="15264">not</wd>

<space/>

<wd l="8808" t="15158" r="9365" b="15307">wrong</wd>

<space/>

<wd l="9427" t="15158" r="9638" b="15264">on</wd>

<space/>

<wd l="9691" t="15106" r="9960" b="15264">the</wd>

<space/>

<wd l="10022" t="15106" r="10507" b="15307">string</wd>

</ln>

</para>

</column>

</section>

<dd l="1440" t="15736" r="10526" b="15977">

<para l="5804" t="15787" r="6148" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5870" t="15787" r="6082" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="41">

<wd l="5870" t="15787" r="6082" b="15946">96</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4314.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1425" marginTop="1252" marginRight="1363" marginBottom="1302" offsetX="-34" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1425" t="1252" r="10546" b="15317">

<column l="1425" t="1252" r="5827" b="15317">

<para l="1440" t="1320" r="5803" b="2338" alignment="justified" spaceBefore="11" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="1320" r="5803" b="1507" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="1320" r="1901" b="1507">level,</wd>

<space/>

<wd l="1992" t="1320" r="2266" b="1478">but</wd>

<space/>

<wd l="2342" t="1320" r="2510" b="1474">in</wd>

<space/>

<wd l="2587" t="1320" r="2851" b="1478">the</wd>

<space/>

<wd l="2928" t="1320" r="3893" b="1478">token-level</wd>

<space/>

<wd l="3979" t="1320" r="4915" b="1507">evaluation,</wd>

<space/>

<wd l="5006" t="1373" r="5261" b="1478">we</wd>

<space/>

<wd l="5333" t="1320" r="5803" b="1478">make</wd>

<space/>

</ln>

<ln l="1440" t="1594" r="5803" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="1618" r="1762" b="1752">two</wd>

<space/>

<wd l="1829" t="1646" r="2376" b="1752">errors:</wd>

<space/>

<wd l="2467" t="1594" r="3192" b="1795">wrongly</wd>

<space/>

<wd l="3259" t="1594" r="4162" b="1795">appending</wd>

<space/>

<wd l="4229" t="1598" r="4315" b="1656">“</wd>

<space/>

<wd l="4378" t="1594" r="5141" b="1795">laughing</wd>

<space/>

<wd l="5208" t="1598" r="5573" b="1752">out”</wd>

<space/>

<wd l="5635" t="1618" r="5803" b="1752">to</wd>

<space/>

</ln>

<ln l="1440" t="1862" r="5798" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="1862" r="1704" b="2021">the</wd>

<space/>

<wd l="1766" t="1862" r="2506" b="2064">previous</wd>

<space/>

<wd l="2573" t="1862" r="3058" b="2021">token</wd>

<space/>

<wd l="3120" t="1862" r="3432" b="2021">and</wd>

<space/>

<wd l="3490" t="1862" r="4214" b="2064">wrongly</wd>

<space/>

<wd l="4277" t="1862" r="5318" b="2064">normalising</wd>

<space/>

<wd l="5386" t="1862" r="5798" b="2021">“lol”</wd>

<space/>

</ln>

<ln l="1440" t="2136" r="5357" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="2160" r="1608" b="2294">to</wd>

<space/>

<wd l="1646" t="2136" r="1982" b="2338">just</wd>

<space/>

<wd l="2040" t="2136" r="2611" b="2294">“loud”</wd>

<space/>

<wd l="2669" t="2136" r="3288" b="2294">instead</wd>

<space/>

<wd l="3346" t="2136" r="3538" b="2294">of</wd>

<space/>

<wd l="3586" t="2136" r="4435" b="2338">“laughing</wd>

<space/>

<wd l="4498" t="2160" r="4776" b="2294">out</wd>

<space/>

<wd l="4829" t="2136" r="5357" b="2294">loud”.</wd>

</ln>

</para>

<para l="1440" t="2405" r="5808" b="4502" alignment="justified" spaceBefore="9" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="1661" t="2405" r="5803" b="2592" baseLine="2559">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="2405" r="2141" b="2563">Since</wd>

<space/>

<wd l="2213" t="2405" r="2482" b="2563">the</wd>

<space/>

<wd l="2554" t="2405" r="3096" b="2563">model</wd>

<space/>

</run>

<wd l="3173" t="2405" r="3379" b="2592"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">P</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3480" t="2405" r="3754" b="2563">did</wd>

<space/>

<wd l="3826" t="2429" r="4104" b="2563">not</wd>

<space/>

<wd l="4181" t="2458" r="4646" b="2563">come</wd>

<space/>

<wd l="4723" t="2429" r="5002" b="2563">out</wd>

<space/>

<wd l="5069" t="2405" r="5462" b="2592">best,</wd>

<space/>

<wd l="5549" t="2458" r="5803" b="2563">we</wd>

<space/>

</run>

</ln>

<ln l="1445" t="2678" r="5808" b="2880" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="2702" r="2026" b="2837">cannot</wd>

<space/>

<wd l="2126" t="2678" r="2611" b="2880">reject</wd>

<space/>

<wd l="2717" t="2678" r="3514" b="2880">Chrupała</wd>

<space/>

<wd l="3624" t="2683" r="4334" b="2875">(2014)’s</wd>

<space/>

<wd l="4445" t="2678" r="5366" b="2880">hypothesis</wd>

<space/>

<wd l="5477" t="2678" r="5808" b="2837">that</wd>

<space/>

</ln>

<ln l="1440" t="2947" r="5794" b="3149" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2947" r="1704" b="3106">the</wd>

<space/>

<wd l="1819" t="2947" r="2290" b="3149">noisy</wd>

<space/>

<wd l="2410" t="2947" r="3082" b="3106">channel</wd>

<space/>

<wd l="3197" t="2947" r="3739" b="3106">model</wd>

<space/>

<wd l="3854" t="2947" r="4397" b="3106">would</wd>

<space/>

<wd l="4507" t="2971" r="4790" b="3106">not</wd>

<space/>

<wd l="4901" t="2947" r="5102" b="3106">be</wd>

<space/>

<wd l="5218" t="2947" r="5794" b="3106">useful.</wd>

<space/>

</ln>

<ln l="1440" t="3221" r="5803" b="3422" baseLine="3370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3226" r="2261" b="3408">However,</wd>

<space/>

<wd l="2390" t="3274" r="2683" b="3379">our</wd>

<space/>

<wd l="2789" t="3221" r="3869" b="3379">observations</wd>

<space/>

<wd l="3989" t="3221" r="4330" b="3379">also</wd>

<space/>

<wd l="4445" t="3221" r="4651" b="3379">do</wd>

<space/>

<wd l="4762" t="3245" r="5040" b="3379">not</wd>

<space/>

<wd l="5141" t="3221" r="5803" b="3422">provide</wd>

<space/>

</ln>

<ln l="1440" t="3490" r="5794" b="3691" baseLine="3638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3490" r="1925" b="3648">much</wd>

<space/>

<wd l="1987" t="3518" r="2635" b="3691">support</wd>

<space/>

<wd l="2688" t="3490" r="2947" b="3648">for</wd>

<space/>

<wd l="2995" t="3490" r="3302" b="3648">this</wd>

<space/>

<wd l="3365" t="3490" r="4291" b="3691">hypothesis</wd>

<space/>

<wd l="4358" t="3542" r="4526" b="3648">as</wd>

<space/>

<wd l="4589" t="3542" r="4843" b="3648">we</wd>

<space/>

<wd l="4901" t="3490" r="5179" b="3648">did</wd>

<space/>

<wd l="5232" t="3514" r="5510" b="3648">not</wd>

<space/>

<wd l="5563" t="3490" r="5794" b="3643">in-</wd>

</ln>

<ln l="1445" t="3763" r="5808" b="3965" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="3763" r="1910" b="3922">clude</wd>

<space/>

<wd l="1982" t="3763" r="2712" b="3922">standard</wd>

<space/>

<wd l="2774" t="3763" r="3394" b="3922">models</wd>

<space/>

<wd l="3461" t="3763" r="3888" b="3922">from</wd>

<space/>

<wd l="3946" t="3763" r="4685" b="3965">previous</wd>

<space/>

<wd l="4752" t="3763" r="5203" b="3922">work</wd>

<space/>

<wd l="5270" t="3763" r="5808" b="3960">(Cook</wd>

<space/>

</ln>

<ln l="1445" t="4032" r="5794" b="4229" baseLine="4181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="4032" r="1757" b="4190">and</wd>

<space/>

<wd l="1824" t="4037" r="2750" b="4219">Stevenson,</wd>

<space/>

<wd l="2832" t="4037" r="3312" b="4219">2009;</wd>

<space/>

<wd l="3394" t="4037" r="3754" b="4190">Han</wd>

<space/>

<wd l="3821" t="4056" r="3979" b="4190">et</wd>

<space/>

<wd l="4042" t="4032" r="4296" b="4219">al.,</wd>

<space/>

<wd l="4378" t="4037" r="4867" b="4229">2013)</wd>

<space/>

<wd l="4944" t="4032" r="5112" b="4186">in</wd>

<space/>

<wd l="5179" t="4085" r="5472" b="4190">our</wd>

<space/>

<wd l="5534" t="4085" r="5794" b="4190">ex-</wd>

</ln>

<ln l="1440" t="4301" r="2261" b="4502" baseLine="4454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="4301" r="2261" b="4502">periment.</wd>

</ln>

</para>

<para l="1445" t="4747" r="3029" b="4920" alignment="left" spaceBefore="192" lsp="exactly" lspExact="274" language="en">

<ln l="1445" t="4747" r="3029" b="4920" baseLine="4915" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">

<wd l="1445" t="4752" r="1555" b="4920">5</wd>

<space/>

<wd l="1810" t="4747" r="3029" b="4920">Conclusions</wd>

</ln>

</para>

<para l="1440" t="5165" r="5808" b="6451" alignment="justified" spaceBefore="133" lsp="exactly" lspExact="269" language="en">

<ln l="1440" t="5165" r="5808" b="5366" baseLine="5318" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="5170" r="1723" b="5323">We</wd>

<space/>

<wd l="1781" t="5165" r="2386" b="5323">trained</wd>

<space/>

<wd l="2443" t="5189" r="2765" b="5323">two</wd>

<space/>

<wd l="2832" t="5218" r="3619" b="5366">sequence</wd>

<space/>

<wd l="3677" t="5165" r="4531" b="5323">modellers</wd>

<space/>

<wd l="4594" t="5189" r="4757" b="5323">to</wd>

<space/>

<wd l="4819" t="5165" r="5424" b="5366">predict</wd>

<space/>

<wd l="5482" t="5165" r="5808" b="5323">edit</wd>

<space/>

</ln>

<ln l="1445" t="5438" r="5794" b="5640" baseLine="5587" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="5438" r="2342" b="5640">operations</wd>

<space/>

<wd l="2458" t="5438" r="2789" b="5597">that</wd>

<space/>

<wd l="2894" t="5438" r="3754" b="5597">normalise</wd>

<space/>

<wd l="3864" t="5438" r="4315" b="5640">input</wd>

<space/>

<wd l="4421" t="5462" r="4747" b="5597">text</wd>

<space/>

<wd l="4853" t="5438" r="5328" b="5597">when</wd>

<space/>

<wd l="5443" t="5491" r="5794" b="5597">exe-</wd>

</ln>

<ln l="1445" t="5707" r="5803" b="5909" baseLine="5861" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="5707" r="1915" b="5866">cuted</wd>

<space/>

<wd l="2002" t="5707" r="2314" b="5866">and</wd>

<space/>

<wd l="2400" t="5707" r="3581" b="5909">experimented</wd>

<space/>

<wd l="3662" t="5707" r="4051" b="5866">with</wd>

<space/>

<wd l="4138" t="5707" r="4896" b="5909">applying</wd>

<space/>

<wd l="4982" t="5707" r="5246" b="5866">the</wd>

<space/>

<wd l="5333" t="5707" r="5803" b="5909">noisy</wd>

<space/>

</ln>

<ln l="1445" t="5981" r="5794" b="6182" baseLine="6130" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="5981" r="2117" b="6139">channel</wd>

<space/>

<wd l="2203" t="5981" r="2746" b="6139">model</wd>

<space/>

<wd l="2837" t="6005" r="3000" b="6139">to</wd>

<space/>

<wd l="3101" t="5981" r="3864" b="6182">selecting</wd>

<space/>

<wd l="3955" t="5981" r="4786" b="6139">candidate</wd>

<space/>

<wd l="4872" t="5981" r="5794" b="6139">normalisa-</wd>

</ln>

<ln l="1440" t="6250" r="2458" b="6451" baseLine="6403" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="6250" r="1781" b="6408">tion</wd>

<space/>

<wd l="1843" t="6250" r="2458" b="6451">strings.</wd>

</ln>

</para>

<para l="1656" t="6523" r="3408" b="6682" alignment="justified" li="216" lsp="exactly" lspExact="270" language="en">

<ln l="1656" t="6523" r="3408" b="6682" baseLine="6672" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="6528" r="2227" b="6682">Future</wd>

<space/>

<wd l="2285" t="6523" r="2731" b="6682">work</wd>

<space/>

<wd l="2794" t="6523" r="3408" b="6682">should:</wd>

</ln>

</para>

<para l="1675" t="6898" r="5808" b="7910" alignment="justified" li="432" spaceBefore="106" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="6898" r="5808" b="7099" baseLine="7046" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1675" t="6902" r="1877" b="7046">•</wd>

<tab position="1756"/>

<wd l="1877" t="6898" r="2342" b="7056">Train</wd>

<space/>

<wd l="2390" t="6898" r="2659" b="7056">the</wd>

<space/>

<wd l="2712" t="6902" r="3120" b="7056">CRF</wd>

<space/>

<wd l="3178" t="6950" r="3389" b="7056">on</wd>

<space/>

<wd l="3442" t="6898" r="3706" b="7056">the</wd>

<space/>

<wd l="3758" t="6898" r="4051" b="7056">full</wd>

<space/>

<wd l="4109" t="6898" r="4786" b="7099">training</wd>

<space/>

<wd l="4843" t="6898" r="5246" b="7085">data,</wd>

<space/>

<wd l="5314" t="6898" r="5808" b="7056">either</wd>

<space/>

</ln>

<ln l="1877" t="7166" r="5803" b="7368" baseLine="7320" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="7166" r="2347" b="7368">using</wd>

<space/>

<wd l="2424" t="7219" r="2520" b="7325">a</wd>

<space/>

<wd l="2582" t="7219" r="3034" b="7325">more</wd>

<space/>

<wd l="3101" t="7166" r="4589" b="7368">memory-friendly</wd>

<space/>

<wd l="4670" t="7166" r="5011" b="7363">(but</wd>

<space/>

<wd l="5078" t="7166" r="5803" b="7368">possibly</wd>

<space/>

</ln>

<ln l="1886" t="7440" r="5808" b="7642" baseLine="7589" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1886" t="7440" r="2515" b="7637">slower)</wd>

<space/>

<wd l="2578" t="7440" r="3662" b="7642">optimisation</wd>

<space/>

<wd l="3706" t="7440" r="4363" b="7598">method</wd>

<space/>

<wd l="4411" t="7493" r="4594" b="7598">or</wd>

<space/>

<wd l="4632" t="7440" r="5102" b="7642">using</wd>

<space/>

<wd l="5155" t="7493" r="5352" b="7598">an</wd>

<space/>

<wd l="5405" t="7493" r="5808" b="7598">even</wd>

<space/>

</ln>

<ln l="1877" t="7709" r="3216" b="7910" baseLine="7858" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="7709" r="2386" b="7910">larger</wd>

<space/>

<wd l="2434" t="7709" r="3216" b="7867">machine.</wd>

</ln>

</para>

<para l="1675" t="8131" r="5803" b="9682" alignment="justified" li="432" spaceBefore="156" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="8131" r="5803" b="8333" baseLine="8280" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="8136" r="1877" b="8280">•</wd>

<tab position="1756"/>

<wd l="1877" t="8131" r="2894" b="8333">Experiment</wd>

<space/>

<wd l="2957" t="8131" r="3346" b="8290">with</wd>

<space/>

<wd l="3413" t="8136" r="3989" b="8290">LSTM</wd>

<space/>

<wd l="4066" t="8184" r="4858" b="8333">sequence</wd>

<space/>

<wd l="4920" t="8131" r="5803" b="8333">modelling</wd>

<space/>

</ln>

<ln l="1886" t="8400" r="5794" b="8597" baseLine="8549" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1886" t="8400" r="2885" b="8597">(Hochreiter</wd>

<space/>

<wd l="2986" t="8400" r="3298" b="8558">and</wd>

<space/>

<wd l="3403" t="8400" r="4594" b="8587">Schmidhuber,</wd>

<space/>

<wd l="4742" t="8405" r="5203" b="8587">1997;</wd>

<space/>

<wd l="5342" t="8405" r="5794" b="8587">Gers,</wd>

<space/>

</ln>

<ln l="1882" t="8669" r="5803" b="8870" baseLine="8822" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="8674" r="2429" b="8866">2001),</wd>

<space/>

<wd l="2530" t="8669" r="3062" b="8827">which</wd>

<space/>

<wd l="3144" t="8669" r="3427" b="8827">has</wd>

<space/>

<wd l="3518" t="8669" r="3931" b="8827">been</wd>

<space/>

<wd l="4018" t="8669" r="4656" b="8870">applied</wd>

<space/>

<wd l="4747" t="8669" r="5803" b="8870">successfully</wd>

<space/>

</ln>

<ln l="1877" t="8942" r="5794" b="9144" baseLine="9091" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="8966" r="2045" b="9101">to</wd>

<space/>

<wd l="2170" t="8942" r="2755" b="9144">speech</wd>

<space/>

<wd l="2866" t="8942" r="3859" b="9144">recognition</wd>

<space/>

<wd l="3974" t="8942" r="4286" b="9101">and</wd>

<space/>

<wd l="4402" t="8942" r="5040" b="9144">caption</wd>

<space/>

<wd l="5155" t="8995" r="5794" b="9144">genera-</wd>

</ln>

<ln l="1877" t="9211" r="5794" b="9413" baseLine="9365" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="9211" r="2218" b="9370">tion</wd>

<space/>

<wd l="2294" t="9216" r="2962" b="9408">(Graves</wd>

<space/>

<wd l="3043" t="9211" r="3355" b="9370">and</wd>

<space/>

<wd l="3422" t="9211" r="3922" b="9413">Jaitly,</wd>

<space/>

<wd l="4013" t="9216" r="4493" b="9398">2014;</wd>

<space/>

<wd l="4579" t="9211" r="5237" b="9413">Vinyals</wd>

<space/>

<wd l="5318" t="9235" r="5472" b="9370">et</wd>

<space/>

<wd l="5544" t="9211" r="5794" b="9398">al.,</wd>

<space/>

</ln>

<ln l="1882" t="9485" r="2429" b="9682" baseLine="9634" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="9485" r="2429" b="9682">2015).</wd>

</ln>

</para>

<para l="1675" t="9902" r="5794" b="10378" alignment="justified" li="432" spaceBefore="151" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="9902" r="5794" b="10104" baseLine="10056" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="9907" r="1882" b="10056">•</wd>

<tab position="1758"/>

<wd l="1882" t="9902" r="2674" b="10061">Combine</wd>

<space/>

<wd l="2731" t="9902" r="3355" b="10061">models</wd>

<space/>

<wd l="3418" t="9902" r="3806" b="10061">with</wd>

<space/>

<wd l="3859" t="9902" r="4411" b="10104">voting</wd>

<space/>

<wd l="4469" t="9902" r="4982" b="10061">rather</wd>

<space/>

<wd l="5035" t="9902" r="5410" b="10061">than</wd>

<space/>

<wd l="5467" t="9902" r="5794" b="10061">lan-</wd>

</ln>

<ln l="1882" t="10176" r="3557" b="10378" baseLine="10325" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="10229" r="2395" b="10378">guage</wd>

<space/>

<wd l="2453" t="10176" r="2995" b="10334">model</wd>

<space/>

<wd l="3062" t="10229" r="3557" b="10334">score.</wd>

</ln>

</para>

<para l="1675" t="10594" r="5808" b="11333" alignment="justified" li="432" spaceBefore="155" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="10594" r="5794" b="10795" baseLine="10747" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="10598" r="1877" b="10747">•</wd>

<tab position="1758"/>

<wd l="1877" t="10598" r="2179" b="10752">For</wd>

<space/>

<wd l="2328" t="10594" r="2597" b="10752">the</wd>

<space/>

<wd l="2750" t="10594" r="3221" b="10795">noisy</wd>

<space/>

<wd l="3379" t="10594" r="4051" b="10752">channel</wd>

<space/>

<wd l="4210" t="10594" r="4795" b="10781">model,</wd>

<space/>

<wd l="4987" t="10618" r="5222" b="10795">try</wd>

<space/>

<wd l="5390" t="10618" r="5794" b="10752">stan-</wd>

</ln>

<ln l="1882" t="10867" r="5808" b="11069" baseLine="11016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="10867" r="2266" b="11026">dard</wd>

<space/>

<wd l="2338" t="10867" r="2957" b="11026">models</wd>

<space/>

<wd l="3038" t="10867" r="3466" b="11026">from</wd>

<space/>

<wd l="3538" t="10867" r="4272" b="11069">previous</wd>

<space/>

<wd l="4354" t="10867" r="4800" b="11026">work</wd>

<space/>

<wd l="4882" t="10867" r="5419" b="11064">(Cook</wd>

<space/>

<wd l="5496" t="10867" r="5808" b="11026">and</wd>

<space/>

</ln>

<ln l="1882" t="11136" r="4930" b="11333" baseLine="11290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="11141" r="2808" b="11323">Stevenson,</wd>

<space/>

<wd l="2880" t="11141" r="3360" b="11323">2009;</wd>

<space/>

<wd l="3427" t="11141" r="3787" b="11294">Han</wd>

<space/>

<wd l="3850" t="11160" r="4003" b="11294">et</wd>

<space/>

<wd l="4061" t="11136" r="4310" b="11323">al.,</wd>

<space/>

<wd l="4382" t="11141" r="4930" b="11333">2013).</wd>

</ln>

</para>

<para l="1675" t="11558" r="5808" b="13382" alignment="justified" li="432" spaceBefore="154" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="11558" r="5794" b="11760" baseLine="11707" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1675" t="11563" r="1877" b="11707">•</wd>

<tab position="1756"/>

<wd l="1877" t="11563" r="2098" b="11717">To</wd>

<space/>

<wd l="2227" t="11558" r="2726" b="11717">better</wd>

<space/>

<wd l="2846" t="11558" r="3806" b="11717">understand</wd>

<space/>

<wd l="3926" t="11558" r="4190" b="11717">the</wd>

<space/>

<wd l="4325" t="11558" r="5093" b="11717">selection</wd>

<space/>

<wd l="5218" t="11558" r="5794" b="11760">prefer-</wd>

</ln>

<ln l="1882" t="11827" r="5794" b="12029" baseLine="11976" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="11880" r="2352" b="11986">ences</wd>

<space/>

<wd l="2496" t="11827" r="2688" b="11986">of</wd>

<space/>

<wd l="2803" t="11827" r="3067" b="11986">the</wd>

<space/>

<wd l="3197" t="11827" r="3667" b="12029">noisy</wd>

<space/>

<wd l="3806" t="11827" r="4478" b="11986">channel</wd>

<space/>

<wd l="4608" t="11827" r="5198" b="12014">model,</wd>

<space/>

<wd l="5362" t="11880" r="5794" b="11986">com-</wd>

</ln>

<ln l="1877" t="12101" r="5803" b="12302" baseLine="12250" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="12154" r="2251" b="12302">pare</wd>

<space/>

<wd l="2333" t="12101" r="2597" b="12259">the</wd>

<space/>

<wd l="2678" t="12106" r="3442" b="12259">F1-score</wd>

<space/>

<wd l="3528" t="12101" r="4277" b="12259">obtained</wd>

<space/>

<wd l="4354" t="12101" r="4829" b="12259">when</wd>

<space/>

<wd l="4910" t="12101" r="5803" b="12302">evaluating</wd>

<space/>

</ln>

<ln l="1882" t="12370" r="5808" b="12571" baseLine="12518" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="12370" r="2496" b="12571">against</wd>

<space/>

<wd l="2544" t="12370" r="2808" b="12528">the</wd>

<space/>

<wd l="2861" t="12370" r="3250" b="12571">gold</wd>

<space/>

<wd l="3298" t="12370" r="3662" b="12528">data</wd>

<space/>

<wd l="3706" t="12394" r="3874" b="12528">to</wd>

<space/>

<wd l="3926" t="12370" r="4190" b="12528">the</wd>

<space/>

<wd l="4243" t="12374" r="5006" b="12528">F1-score</wd>

<space/>

<wd l="5059" t="12370" r="5808" b="12528">obtained</wd>

<space/>

</ln>

<ln l="1877" t="12638" r="5798" b="12840" baseLine="12792" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="12638" r="2352" b="12797">when</wd>

<space/>

<wd l="2405" t="12638" r="3293" b="12840">evaluating</wd>

<space/>

<wd l="3350" t="12638" r="3614" b="12797">the</wd>

<space/>

<wd l="3677" t="12662" r="4277" b="12840">system</wd>

<space/>

<wd l="4330" t="12662" r="4882" b="12840">output</wd>

<space/>

<wd l="4934" t="12638" r="5549" b="12840">against</wd>

<space/>

<wd l="5602" t="12638" r="5798" b="12797">its</wd>

<space/>

</ln>

<ln l="1882" t="12912" r="5803" b="13114" baseLine="13061" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="12965" r="2246" b="13070">own</wd>

<space/>

<wd l="2323" t="12912" r="2813" b="13114">input,</wd>

<space/>

<wd l="2904" t="12912" r="3158" b="13070">i.e.</wd>

<space/>

<wd l="3250" t="12965" r="3514" b="13070">are</wd>

<space/>

<wd l="3590" t="12965" r="3840" b="13070">we</wd>

<space/>

<wd l="3917" t="12912" r="4478" b="13070">biased</wd>

<space/>

<wd l="4550" t="12912" r="5227" b="13070">towards</wd>

<space/>

<wd l="5314" t="12912" r="5803" b="13114">doing</wd>

<space/>

</ln>

<ln l="1877" t="13181" r="2635" b="13382" baseLine="13334" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="13181" r="2635" b="13382">nothing?</wd>

</ln>

</para>

<para l="1675" t="13603" r="5794" b="14347" alignment="justified" li="432" spaceBefore="150" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="13603" r="5794" b="13805" baseLine="13752" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="13608" r="1877" b="13752">•</wd>

<tab position="1756"/>

<wd l="1877" t="13603" r="2712" b="13762">Introduce</wd>

<space/>

<wd l="2774" t="13656" r="2870" b="13762">a</wd>

<space/>

<wd l="2928" t="13603" r="3538" b="13805">brevity</wd>

<space/>

<wd l="3595" t="13603" r="4234" b="13805">penalty</wd>

<space/>

<wd l="4296" t="13627" r="4464" b="13762">to</wd>

<space/>

<wd l="4531" t="13627" r="5184" b="13762">counter</wd>

<space/>

<wd l="5237" t="13603" r="5506" b="13762">the</wd>

<space/>

<wd l="5568" t="13603" r="5794" b="13762">ef-</wd>

</ln>

<ln l="1877" t="13872" r="5794" b="14074" baseLine="14026" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="13872" r="2203" b="14030">fect</wd>

<space/>

<wd l="2294" t="13872" r="2486" b="14030">of</wd>

<space/>

<wd l="2573" t="13872" r="3331" b="14074">selecting</wd>

<space/>

<wd l="3432" t="13872" r="3864" b="14030">short</wd>

<space/>

<wd l="3955" t="13872" r="4786" b="14030">candidate</wd>

<space/>

<wd l="4872" t="13872" r="5794" b="14030">normalisa-</wd>

</ln>

<ln l="1877" t="14146" r="4752" b="14347" baseLine="14294" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="14146" r="2294" b="14304">tions</wd>

<space/>

<wd l="2357" t="14146" r="2525" b="14299">in</wd>

<space/>

<wd l="2578" t="14146" r="2846" b="14304">the</wd>

<space/>

<wd l="2899" t="14146" r="3370" b="14347">noisy</wd>

<space/>

<wd l="3432" t="14146" r="4104" b="14304">channel</wd>

<space/>

<wd l="4162" t="14146" r="4752" b="14304">model.</wd>

</ln>

</para>

<para l="1675" t="14563" r="5803" b="15264" alignment="justified" li="432" spaceBefore="155" fli="-216" lsp="exactly" lspExact="266" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="14563" r="5794" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="14568" r="1877" b="14717">•</wd>

<tab position="1758"/>

<wd l="1877" t="14563" r="3120" b="14765">Automatically</wd>

<space/>

<wd l="3250" t="14563" r="3763" b="14722">revise</wd>

<space/>

<wd l="3888" t="14563" r="4152" b="14722">the</wd>

<space/>

<wd l="4282" t="14563" r="5150" b="14765">alignment</wd>

<space/>

<wd l="5270" t="14587" r="5438" b="14722">to</wd>

<space/>

<wd l="5563" t="14563" r="5794" b="14717">in-</wd>

</ln>

<ln l="1877" t="14837" r="5803" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="14861" r="2155" b="15038">put</wd>

<space/>

<wd l="2227" t="14837" r="2712" b="14995">token</wd>

<space/>

<wd l="2784" t="14837" r="3638" b="15038">according</wd>

<space/>

<wd l="3710" t="14861" r="3878" b="14995">to</wd>

<space/>

<wd l="3960" t="14837" r="4498" b="15038">global</wd>

<space/>

<wd l="4574" t="14890" r="5803" b="14995">co-occurrence</wd>

<space/>

</ln>

<ln l="1886" t="15106" r="2674" b="15264" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1886" t="15106" r="2674" b="15264">statistics.</wd>

</ln>

</para>

</column>

<column l="6144" t="1252" r="10546" b="15317">

<para l="6384" t="1320" r="10502" b="1752" alignment="justified" li="432" spaceBefore="8" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="1320" r="10502" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="1325" r="6586" b="1474">•</wd>

<tab position="6467"/>

<wd l="6586" t="1325" r="7075" b="1522">Carry</wd>

<space/>

<wd l="7128" t="1344" r="7406" b="1478">out</wd>

<space/>

<wd l="7450" t="1373" r="7546" b="1478">a</wd>

<space/>

<wd l="7589" t="1320" r="7882" b="1478">full</wd>

<space/>

<wd l="7939" t="1373" r="8366" b="1478">error</wd>

<space/>

<wd l="8410" t="1320" r="9101" b="1522">analysis</wd>

<space/>

<wd l="9158" t="1320" r="9350" b="1478">of</wd>

<space/>

<wd l="9379" t="1320" r="9806" b="1478">what</wd>

<space/>

<wd l="9850" t="1320" r="10114" b="1478">the</wd>

<space/>

<wd l="10171" t="1373" r="10502" b="1522">sys-</wd>

</ln>

<ln l="6581" t="1594" r="9398" b="1752" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="1618" r="6912" b="1752">tem</wd>

<space/>

<wd l="6970" t="1594" r="7354" b="1752">does</wd>

<space/>

<wd l="7416" t="1594" r="7790" b="1752">well</wd>

<space/>

<wd l="7853" t="1594" r="8165" b="1752">and</wd>

<space/>

<wd l="8218" t="1594" r="8750" b="1752">where</wd>

<space/>

<wd l="8808" t="1594" r="8928" b="1752">it</wd>

<space/>

<wd l="8981" t="1594" r="9398" b="1752">fails.</wd>

</ln>

</para>

<para l="6144" t="2035" r="8011" b="2256" alignment="left" spaceBefore="192" lsp="exactly" lspExact="274" language="en">

<ln l="6144" t="2035" r="8011" b="2256" baseLine="2203" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2035" r="8011" b="2256">Acknowledgments</wd>

</ln>

</para>

<para l="6144" t="2453" r="10512" b="4550" alignment="justified" spaceBefore="130" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="2453" r="10502" b="2654" baseLine="2602" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2453" r="6523" b="2611">This</wd>

<space/>

<wd l="6672" t="2453" r="7402" b="2611">research</wd>

<space/>

<wd l="7536" t="2453" r="7675" b="2611">is</wd>

<space/>

<wd l="7829" t="2453" r="8683" b="2654">supported</wd>

<space/>

<wd l="8818" t="2453" r="9034" b="2654">by</wd>

<space/>

<wd l="9182" t="2453" r="9854" b="2611">Science</wd>

<space/>

<wd l="9994" t="2458" r="10502" b="2611">Foun-</wd>

</ln>

<ln l="6149" t="2722" r="10512" b="2923" baseLine="2875" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="2722" r="6691" b="2880">dation</wd>

<space/>

<wd l="6821" t="2722" r="7440" b="2880">Ireland</wd>

<space/>

<wd l="7565" t="2722" r="8246" b="2923">through</wd>

<space/>

<wd l="8376" t="2722" r="8640" b="2880">the</wd>

<space/>

<wd l="8774" t="2726" r="9365" b="2880">CNGL</wd>

<space/>

<wd l="9494" t="2726" r="10512" b="2923">Programme</wd>

<space/>

</ln>

<ln l="6154" t="2995" r="10512" b="3192" baseLine="3144" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="3000" r="6715" b="3192">(Grant</wd>

<space/>

<wd l="6912" t="2995" r="8078" b="3192">12/CE/I2267)</wd>

<space/>

<wd l="8261" t="2995" r="8429" b="3149">in</wd>

<space/>

<wd l="8602" t="2995" r="8866" b="3154">the</wd>

<space/>

<wd l="9038" t="3000" r="9754" b="3149">ADAPT</wd>

<space/>

<wd l="9936" t="3000" r="10512" b="3154">Centre</wd>

<space/>

</ln>

<ln l="6154" t="3264" r="10498" b="3466" baseLine="3418" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="3264" r="8011" b="3466">(www.adaptcentre.ie)</wd>

<space/>

<wd l="8126" t="3288" r="8280" b="3422">at</wd>

<space/>

<wd l="8376" t="3264" r="8986" b="3422">Dublin</wd>

<space/>

<wd l="9086" t="3264" r="9456" b="3466">City</wd>

<space/>

<wd l="9557" t="3264" r="10498" b="3466">University.</wd>

<space/>

</ln>

<ln l="6144" t="3538" r="10502" b="3739" baseLine="3686" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="3542" r="6432" b="3696">We</wd>

<space/>

<wd l="6485" t="3538" r="6974" b="3696">thank</wd>

<space/>

<wd l="7027" t="3538" r="7291" b="3696">the</wd>

<space/>

<wd l="7354" t="3590" r="8342" b="3739">anonymous</wd>

<space/>

<wd l="8405" t="3538" r="9235" b="3696">reviewers</wd>

<space/>

<wd l="9298" t="3538" r="9557" b="3696">for</wd>

<space/>

<wd l="9610" t="3538" r="10013" b="3696">their</wd>

<space/>

<wd l="10066" t="3590" r="10502" b="3696">com-</wd>

</ln>

<ln l="6144" t="3806" r="10502" b="4008" baseLine="3955" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="3830" r="6658" b="3965">ments</wd>

<space/>

<wd l="6725" t="3859" r="6941" b="3965">on</wd>

<space/>

<wd l="6994" t="3806" r="7301" b="3965">this</wd>

<space/>

<wd l="7368" t="3859" r="7882" b="4008">paper.</wd>

<space/>

<wd l="7963" t="3806" r="9096" b="3994">Furthermore,</wd>

<space/>

<wd l="9163" t="3859" r="9418" b="3965">we</wd>

<space/>

<wd l="9475" t="3806" r="9960" b="3965">thank</wd>

<space/>

<wd l="10018" t="3811" r="10502" b="3965">Grze-</wd>

</ln>

<ln l="6149" t="4080" r="10502" b="4282" baseLine="4229" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="4133" r="6528" b="4282">gorz</wd>

<space/>

<wd l="6634" t="4080" r="7435" b="4282">Chrupała</wd>

<space/>

<wd l="7526" t="4080" r="7786" b="4238">for</wd>

<space/>

<wd l="7891" t="4080" r="8520" b="4282">sharing</wd>

<space/>

<wd l="8621" t="4080" r="8866" b="4238">his</wd>

<space/>

<wd l="8971" t="4080" r="9576" b="4238">feature</wd>

<space/>

<wd l="9677" t="4080" r="10502" b="4282">templates</wd>

<space/>

</ln>

<ln l="6149" t="4349" r="9293" b="4550" baseLine="4498" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="4349" r="6461" b="4507">and</wd>

<space/>

<wd l="6514" t="4349" r="6773" b="4507">for</wd>

<space/>

<wd l="6826" t="4349" r="7070" b="4507">his</wd>

<space/>

<wd l="7142" t="4349" r="8069" b="4550">suggestion</wd>

<space/>

<wd l="8122" t="4373" r="8290" b="4507">to</wd>

<space/>

<wd l="8347" t="4373" r="8582" b="4550">try</wd>

<space/>

<wd l="8650" t="4354" r="9293" b="4550">Sequor.</wd>

</ln>

</para>

<para l="6149" t="5050" r="7248" b="5222" alignment="left" spaceBefore="446" lsp="exactly" lspExact="274" language="en">

<ln l="6149" t="5050" r="7248" b="5222" baseLine="5213" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="5050" r="7248" b="5222">References</wd>

</ln>

</para>

<para l="6144" t="5414" r="10517" b="6917" alignment="justified" li="216" spaceBefore="108" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="5414" r="10502" b="5602" baseLine="5549" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5414" r="6821" b="5602">Timothy</wd>

<space/>

<wd l="6965" t="5414" r="7685" b="5582">Baldwin,</wd>

<space/>

<wd l="7858" t="5414" r="8333" b="5558">Marie</wd>

<space/>

<wd l="8482" t="5414" r="9250" b="5558">Catherine</wd>

<space/>

<wd l="9398" t="5414" r="9581" b="5558">de</wd>

<space/>

<wd l="9725" t="5414" r="10502" b="5582">Marneffe,</wd>

<space/>

</ln>

<ln l="6365" t="5635" r="10507" b="5822" baseLine="5770" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="5640" r="6590" b="5779">Bo</wd>

<space/>

<wd l="6686" t="5640" r="7061" b="5803">Han,</wd>

<space/>

<wd l="7171" t="5640" r="8150" b="5822">Young-Bum</wd>

<space/>

<wd l="8242" t="5635" r="8635" b="5803">Kim,</wd>

<space/>

<wd l="8741" t="5635" r="9125" b="5779">Alan</wd>

<space/>

<wd l="9221" t="5635" r="9710" b="5803">Ritter,</wd>

<space/>

<wd l="9821" t="5635" r="10104" b="5779">and</wd>

<space/>

<wd l="10195" t="5635" r="10507" b="5779">Wei</wd>

<space/>

</ln>

<ln l="6365" t="5851" r="10512" b="6034" baseLine="5990" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="5856" r="6648" b="5995">Xu.</wd>

<space/>

<wd l="6792" t="5851" r="7224" b="5995">2015.</wd>

<space/>

<wd l="7368" t="5851" r="7915" b="5995">Shared</wd>

<space/>

<wd l="7982" t="5851" r="8376" b="5995">tasks</wd>

<space/>

<wd l="8453" t="5851" r="8626" b="5995">of</wd>

<space/>

<wd l="8683" t="5851" r="8923" b="5995">the</wd>

<space/>

<wd l="9000" t="5851" r="9384" b="5995">2015</wd>

<space/>

<wd l="9461" t="5851" r="10238" b="6034">workshop</wd>

<space/>

<wd l="10315" t="5894" r="10512" b="5995">on</wd>

<space/>

</ln>

<ln l="6365" t="6072" r="10502" b="6259" baseLine="6206" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="6072" r="6792" b="6259">noisy</wd>

<space/>

<wd l="6878" t="6072" r="8050" b="6259">user-generated</wd>

<space/>

<wd l="8131" t="6091" r="8467" b="6216">text:</wd>

<space/>

<wd l="8611" t="6072" r="9182" b="6216">Twitter</wd>

<space/>

<wd l="9269" t="6072" r="9792" b="6216">lexical</wd>

<space/>

<wd l="9878" t="6072" r="10502" b="6216">normal-</wd>

</ln>

<ln l="6365" t="6293" r="10502" b="6480" baseLine="6427">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="6293" r="6907" b="6437">ization</wd>

<space/>

<wd l="6979" t="6293" r="7267" b="6437">and</wd>

<space/>

<wd l="7334" t="6293" r="7867" b="6437">named</wd>

<space/>

<wd l="7939" t="6293" r="8386" b="6480">entity</wd>

<space/>

<wd l="8458" t="6293" r="9403" b="6480">recognition.</wd>

<space/>

<wd l="9552" t="6298" r="9720" b="6432">In</wd>

<space/>

</run>

<wd l="9787" t="6293" r="10502" b="6437" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Proceed-</wd>

</ln>

<ln l="6374" t="6509" r="10517" b="6691" baseLine="6648" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="6514" r="6696" b="6691">ings</wd>

<space/>

<wd l="6758" t="6509" r="6941" b="6691">of</wd>

<space/>

<wd l="6974" t="6509" r="7210" b="6653">the</wd>

<space/>

<wd l="7282" t="6509" r="8054" b="6691">Workshop</wd>

<space/>

<wd l="8122" t="6557" r="8314" b="6653">on</wd>

<space/>

<wd l="8371" t="6514" r="8827" b="6691">Noisy</wd>

<space/>

<wd l="8909" t="6509" r="10138" b="6691">User-generated</wd>

<space/>

<wd l="10200" t="6514" r="10517" b="6653">Text</wd>

<space/>

</ln>

<ln l="6370" t="6730" r="8798" b="6917" baseLine="6864">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="6734" r="7003" b="6907">(WNUT</wd>

<space/>

</run>

<wd l="7032" t="6730" r="7541" b="6907"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7598" t="6730" r="8227" b="6917">Beijing,</wd>

<space/>

<wd l="8290" t="6730" r="8798" b="6874">China.</wd>

</run>

</ln>

</para>

<para l="6144" t="7094" r="10502" b="8813" alignment="justified" li="216" spaceBefore="148" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="7094" r="10502" b="7282" baseLine="7229" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7094" r="6605" b="7238">Utsab</wd>

<space/>

<wd l="6686" t="7099" r="7358" b="7262">Barman,</wd>

<space/>

<wd l="7445" t="7094" r="8112" b="7238">Joachim</wd>

<space/>

<wd l="8184" t="7099" r="8832" b="7282">Wagner,</wd>

<space/>

<wd l="8923" t="7094" r="9653" b="7282">Grzegorz</wd>

<space/>

<wd l="9734" t="7094" r="10502" b="7282">Chrupała,</wd>

<space/>

</ln>

<ln l="6370" t="7310" r="10502" b="7454" baseLine="7450" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="7310" r="6653" b="7454">and</wd>

<space/>

<wd l="6754" t="7310" r="7397" b="7454">Jennifer</wd>

<space/>

<wd l="7498" t="7315" r="8021" b="7454">Foster.</wd>

<space/>

<wd l="8270" t="7310" r="8702" b="7454">2014.</wd>

<space/>

<wd l="8952" t="7310" r="9888" b="7454">DCU-UVT:</wd>

<space/>

<wd l="10008" t="7310" r="10502" b="7454">Word-</wd>

</ln>

<ln l="6365" t="7531" r="10498" b="7718" baseLine="7666" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="7531" r="6739" b="7675">level</wd>

<space/>

<wd l="6811" t="7531" r="7526" b="7718">language</wd>

<space/>

<wd l="7603" t="7531" r="8640" b="7675">classification</wd>

<space/>

<wd l="8702" t="7531" r="9058" b="7675">with</wd>

<space/>

<wd l="9130" t="7531" r="10066" b="7675">code-mixed</wd>

<space/>

<wd l="10133" t="7531" r="10498" b="7675">data.</wd>

<space/>

</ln>

<ln l="6365" t="7752" r="10502" b="7934" baseLine="7886">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="7757" r="6533" b="7891">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6590" t="7752" r="7579" b="7934">Proceedings</wd>

<space/>

<wd l="7646" t="7752" r="7829" b="7934">of</wd>

<space/>

<wd l="7862" t="7752" r="8098" b="7896">the</wd>

<space/>

<wd l="8165" t="7757" r="8549" b="7896">First</wd>

<space/>

<wd l="8611" t="7752" r="9389" b="7934">Workshop</wd>

<space/>

<wd l="9456" t="7800" r="9648" b="7896">on</wd>

<space/>

<wd l="9725" t="7757" r="10502" b="7934">Computa-</wd>

</run>

</ln>

<ln l="6370" t="7968" r="10488" b="8150" baseLine="8107" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="7968" r="6830" b="8112">tional</wd>

<space/>

<wd l="6854" t="7968" r="7805" b="8150">Approaches</wd>

<space/>

<wd l="7853" t="7997" r="7997" b="8112">to</wd>

<space/>

<wd l="8050" t="7968" r="8458" b="8112">Code</wd>

<space/>

<wd l="8501" t="7968" r="9312" b="8150">Switching.</wd>

<space/>

<wd l="9365" t="7973" r="10027" b="8112">EMNLP</wd>

<space/>

<wd l="10061" t="7968" r="10488" b="8136">2014,</wd>

<space/>

</ln>

<ln l="6374" t="8189" r="10502" b="8371" baseLine="8323" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6374" t="8189" r="7272" b="8371">Conference</wd>

<space/>

<wd l="7349" t="8237" r="7536" b="8333">on</wd>

<space/>

<wd l="7603" t="8189" r="8410" b="8371">Empirical</wd>

<space/>

<wd l="8467" t="8189" r="9158" b="8333">Methods</wd>

<space/>

<wd l="9235" t="8194" r="9379" b="8333">in</wd>

<space/>

<wd l="9446" t="8189" r="10070" b="8333">Natural</wd>

<space/>

<wd l="10128" t="8194" r="10502" b="8333">Lan-</wd>

</ln>

<ln l="6365" t="8410" r="10502" b="8597" baseLine="8544">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="8458" r="6845" b="8592">guage</wd>

<space/>

</run>

<wd l="6893" t="8414" r="7810" b="8592"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Processing</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="7862" t="8453" r="8314" b="8597">pages</wd>

<space/>

<wd l="8381" t="8410" r="9101" b="8578">127–132,</wd>

<space/>

<wd l="9154" t="8410" r="9629" b="8578">Doha,</wd>

<space/>

<wd l="9686" t="8410" r="10162" b="8587">Qatar,</wd>

<space/>

<wd l="10219" t="8410" r="10502" b="8554">Oc-</wd>

</run>

</ln>

<ln l="6365" t="8626" r="10291" b="8813" baseLine="8765" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="8626" r="6802" b="8770">tober.</wd>

<space/>

<wd l="6864" t="8626" r="7805" b="8770">Association</wd>

<space/>

<wd l="7853" t="8626" r="8088" b="8770">for</wd>

<space/>

<wd l="8141" t="8626" r="9317" b="8808">Computational</wd>

<space/>

<wd l="9370" t="8626" r="10291" b="8813">Linguistics.</wd>

</ln>

</para>

<para l="6149" t="8990" r="10498" b="9178" alignment="justified" spaceBefore="141" lsp="exactly" lspExact="220" language="en">

<tabs position="6149"/>

<ln l="6149" t="8990" r="10498" b="9178" baseLine="9125" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="8990" r="6883" b="9178">Grzegorz</wd>

<space/>

<wd l="7018" t="8990" r="7747" b="9178">Chrupała</wd>

<space/>

<wd l="7877" t="8990" r="8165" b="9134">and</wd>

<space/>

<wd l="8290" t="8990" r="8947" b="9134">Dietrich</wd>

<space/>

<wd l="9077" t="8990" r="9725" b="9134">Klakow.</wd>

<tab position="9725"/>

<wd l="10066" t="8990" r="10498" b="9134">2010.</wd>

</ln>

</para>

<para l="6360" t="9211" r="10507" b="11150" alignment="justified" li="216" spaceBefore="1" lsp="exactly" lspExact="219" language="en">

<ln l="6365" t="9211" r="10507" b="9398" baseLine="9346" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="9216" r="6509" b="9350">A</wd>

<space/>

<wd l="6614" t="9211" r="7147" b="9355">named</wd>

<space/>

<wd l="7258" t="9211" r="7699" b="9398">entity</wd>

<space/>

<wd l="7810" t="9211" r="8352" b="9355">labeler</wd>

<space/>

<wd l="8458" t="9211" r="8693" b="9355">for</wd>

<space/>

<wd l="8803" t="9211" r="9480" b="9355">German:</wd>

<space/>

<wd l="9667" t="9211" r="10507" b="9398">Exploiting</wd>

<space/>

</ln>

<ln l="6365" t="9427" r="10502" b="9610" baseLine="9566" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="9427" r="7195" b="9610">Wikipedia</wd>

<space/>

<wd l="7306" t="9427" r="7589" b="9571">and</wd>

<space/>

<wd l="7704" t="9427" r="8755" b="9571">distributional</wd>

<space/>

<wd l="8870" t="9427" r="9514" b="9571">clusters.</wd>

<space/>

<wd l="9782" t="9432" r="9950" b="9566">In</wd>

<space/>

<wd l="10056" t="9427" r="10502" b="9571">Nico-</wd>

</ln>

<ln l="6365" t="9648" r="10502" b="9826" baseLine="9782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="9648" r="6710" b="9792">letta</wd>

<space/>

<wd l="6768" t="9648" r="7493" b="9792">Calzolari</wd>

<space/>

<wd l="7560" t="9648" r="8534" b="9826">(Conference</wd>

<space/>

<wd l="8597" t="9648" r="9144" b="9826">Chair),</wd>

<space/>

<wd l="9216" t="9648" r="9754" b="9792">Khalid</wd>

<space/>

<wd l="9811" t="9648" r="10502" b="9816">Choukri,</wd>

<space/>

</ln>

<ln l="6365" t="9869" r="10502" b="10056" baseLine="10003" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="9874" r="6826" b="10013">Bente</wd>

<space/>

<wd l="6912" t="9869" r="7747" b="10056">Maegaard,</wd>

<space/>

<wd l="7848" t="9869" r="8390" b="10051">Joseph</wd>

<space/>

<wd l="8472" t="9869" r="9149" b="10037">Mariani,</wd>

<space/>

<wd l="9245" t="9874" r="9509" b="10013">Jan</wd>

<space/>

<wd l="9600" t="9869" r="10090" b="10056">Odijk,</wd>

<space/>

<wd l="10195" t="9869" r="10502" b="10013">Ste-</wd>

</ln>

<ln l="6365" t="10085" r="10502" b="10267" baseLine="10224" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="10085" r="6648" b="10229">lios</wd>

<space/>

<wd l="6763" t="10085" r="7512" b="10267">Piperidis,</wd>

<space/>

<wd l="7646" t="10085" r="8064" b="10229">Mike</wd>

<space/>

<wd l="8174" t="10090" r="8774" b="10253">Rosner,</wd>

<space/>

<wd l="8909" t="10085" r="9197" b="10229">and</wd>

<space/>

<wd l="9302" t="10085" r="9835" b="10229">Daniel</wd>

<space/>

<wd l="9946" t="10085" r="10502" b="10267">Tapias,</wd>

<space/>

</ln>

<ln l="6370" t="10306" r="10507" b="10488" baseLine="10440">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="10306" r="6950" b="10474">editors,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7042" t="10306" r="8030" b="10488">Proceedings</wd>

<space/>

<wd l="8117" t="10306" r="8294" b="10488">of</wd>

<space/>

<wd l="8352" t="10306" r="8587" b="10450">the</wd>

<space/>

<wd l="8669" t="10306" r="9283" b="10450">Seventh</wd>

<space/>

<wd l="9370" t="10306" r="10229" b="10488">conference</wd>

<space/>

<wd l="10315" t="10354" r="10507" b="10450">on</wd>

<space/>

</run>

</ln>

<ln l="6360" t="10526" r="10507" b="10709" baseLine="10661" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6360" t="10526" r="7416" b="10670">International</wd>

<space/>

<wd l="7488" t="10531" r="8285" b="10709">Language</wd>

<space/>

<wd l="8362" t="10531" r="9178" b="10670">Resources</wd>

<space/>

<wd l="9259" t="10526" r="9562" b="10670">and</wd>

<space/>

<wd l="9634" t="10526" r="10507" b="10670">Evaluation</wd>

<space/>

</ln>

<ln l="6370" t="10742" r="10502" b="10930" baseLine="10882">

<wd l="6370" t="10742" r="7291" b="10920"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(LREC’10)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7402" t="10742" r="8054" b="10910">Valletta,</wd>

<space/>

<wd l="8165" t="10742" r="8674" b="10910">Malta,</wd>

<space/>

<wd l="8784" t="10747" r="9173" b="10930">May.</wd>

<space/>

<wd l="9278" t="10747" r="10037" b="10925">European</wd>

<space/>

<wd l="10133" t="10747" r="10502" b="10886">Lan-</wd>

</run>

</ln>

<ln l="6370" t="10963" r="9442" b="11150" baseLine="11098" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="11006" r="6835" b="11150">guage</wd>

<space/>

<wd l="6888" t="10968" r="7704" b="11107">Resources</wd>

<space/>

<wd l="7757" t="10963" r="8702" b="11107">Association</wd>

<space/>

<wd l="8760" t="10963" r="9442" b="11141">(ELRA).</wd>

</ln>

</para>

<para l="6149" t="11328" r="10541" b="12821" alignment="justified" li="216" spaceBefore="147" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6149" t="11328" r="10512" b="11515" baseLine="11462" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="11328" r="6883" b="11515">Grzegorz</wd>

<space/>

<wd l="6974" t="11328" r="7738" b="11515">Chrupała.</wd>

<space/>

<wd l="7944" t="11328" r="8376" b="11472">2013.</wd>

<space/>

<wd l="8578" t="11333" r="8928" b="11472">Text</wd>

<space/>

<wd l="9019" t="11328" r="10070" b="11515">segmentation</wd>

<space/>

<wd l="10157" t="11328" r="10512" b="11472">with</wd>

<space/>

</ln>

<ln l="6370" t="11544" r="10541" b="11731" baseLine="11683">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6370" t="11544" r="7531" b="11688">character-level</wd>

<space/>

<wd l="7598" t="11563" r="7896" b="11688">text</wd>

<space/>

<wd l="7958" t="11544" r="8957" b="11731">embeddings.</wd>

<space/>

<wd l="9077" t="11549" r="9245" b="11683">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="9307" t="11544" r="10291" b="11726">Proceedings</wd>

<space/>

<wd l="10358" t="11544" r="10541" b="11726">of</wd>

<space/>

</run>

</ln>

<ln l="6370" t="11765" r="10502" b="11947" baseLine="11899" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6370" t="11765" r="6605" b="11909">the</wd>

<space/>

<wd l="6648" t="11770" r="7133" b="11909">ICML</wd>

<space/>

<wd l="7176" t="11765" r="7570" b="11909">2013</wd>

<space/>

<wd l="7632" t="11765" r="8410" b="11947">Workshop</wd>

<space/>

<wd l="8462" t="11813" r="8654" b="11909">on</wd>

<space/>

<wd l="8698" t="11770" r="9120" b="11947">Deep</wd>

<space/>

<wd l="9168" t="11770" r="9898" b="11947">Learning</wd>

<space/>

<wd l="9917" t="11765" r="10502" b="11947">forAu-</wd>

</ln>

<ln l="6365" t="11986" r="10502" b="12168" baseLine="12120">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6365" t="11986" r="6648" b="12154">dio,</wd>

<space/>

<wd l="6715" t="11986" r="7272" b="12168">Speech</wd>

<space/>

<wd l="7325" t="11986" r="7632" b="12130">and</wd>

<space/>

<wd l="7670" t="11990" r="8462" b="12168">Language</wd>

<space/>

</run>

<wd l="8515" t="11990" r="9432" b="12168"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">Processing</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="9490" t="11986" r="10118" b="12154">Atlanta,</wd>

<space/>

<wd l="10176" t="11986" r="10502" b="12154">GA,</wd>

<space/>

</run>

</ln>

<ln l="6365" t="12202" r="10493" b="12379" baseLine="12341">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6365" t="12202" r="6802" b="12346">USA.</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-3"><wd l="6931" t="12206" r="10493" b="12379">https://sites.google.com/site/</wd>

<space/>

</run>

</ln>

<ln l="6374" t="12427" r="9955" b="12600" baseLine="12557" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-3">

<wd l="6374" t="12427" r="9955" b="12600">deeplearningicml2013/accepted_</wd>

<space/>

</ln>

<ln l="6365" t="12667" r="7118" b="12821" baseLine="12778">

<wd l="6365" t="12696" r="7118" b="12821"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-3">papers</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6149" t="13003" r="10512" b="14462" alignment="justified" li="216" spaceBefore="147" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6149" t="13003" r="10512" b="13190" baseLine="13142" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13003" r="6883" b="13190">Grzegorz</wd>

<space/>

<wd l="6965" t="13003" r="7728" b="13190">Chrupała.</wd>

<space/>

<wd l="7896" t="13003" r="8328" b="13147">2014.</wd>

<space/>

<wd l="8491" t="13003" r="9494" b="13190">Normalizing</wd>

<space/>

<wd l="9571" t="13022" r="10075" b="13147">tweets</wd>

<space/>

<wd l="10157" t="13003" r="10512" b="13147">with</wd>

<space/>

</ln>

<ln l="6370" t="13224" r="10512" b="13411" baseLine="13358" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="13224" r="6667" b="13368">edit</wd>

<space/>

<wd l="6763" t="13224" r="7267" b="13406">scripts</wd>

<space/>

<wd l="7368" t="13224" r="7651" b="13368">and</wd>

<space/>

<wd l="7738" t="13243" r="8458" b="13368">recurrent</wd>

<space/>

<wd l="8549" t="13224" r="9043" b="13368">neural</wd>

<space/>

<wd l="9139" t="13224" r="10138" b="13411">embeddings.</wd>

<space/>

<wd l="10344" t="13229" r="10512" b="13363">In</wd>

<space/>

</ln>

<ln l="6365" t="13445" r="10502" b="13627" baseLine="13579" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="13445" r="7349" b="13627">Proceedings</wd>

<space/>

<wd l="7416" t="13445" r="7594" b="13627">of</wd>

<space/>

<wd l="7627" t="13445" r="7867" b="13589">the</wd>

<space/>

<wd l="7925" t="13445" r="8328" b="13589">52nd</wd>

<space/>

<wd l="8366" t="13445" r="8962" b="13589">Annual</wd>

<space/>

<wd l="9014" t="13450" r="9667" b="13627">Meeting</wd>

<space/>

<wd l="9734" t="13445" r="9917" b="13627">of</wd>

<space/>

<wd l="9946" t="13445" r="10186" b="13589">the</wd>

<space/>

<wd l="10229" t="13450" r="10502" b="13589">As-</wd>

</ln>

<ln l="6365" t="13661" r="10502" b="13843" baseLine="13800" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="13666" r="7090" b="13805">sociation</wd>

<space/>

<wd l="7118" t="13661" r="7397" b="13843">for</wd>

<space/>

<wd l="7454" t="13661" r="8645" b="13843">Computational</wd>

<space/>

<wd l="8693" t="13666" r="9571" b="13843">Linguistics</wd>

<space/>

<wd l="9638" t="13661" r="10282" b="13838">(Volume</wd>

<space/>

<wd l="10344" t="13661" r="10502" b="13805">2:</wd>

<space/>

</ln>

<ln l="6365" t="13882" r="10502" b="14069" baseLine="14016">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="13882" r="6802" b="14026">Short</wd>

<space/>

</run>

<wd l="6888" t="13886" r="7546" b="14064"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Papers)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7661" t="13925" r="8107" b="14069">pages</wd>

<space/>

<wd l="8213" t="13882" r="8947" b="14050">680–686,</wd>

<space/>

<wd l="9062" t="13882" r="9902" b="14050">Baltimore,</wd>

<space/>

<wd l="10013" t="13886" r="10502" b="14069">Mary-</wd>

</run>

</ln>

<ln l="6365" t="14098" r="10502" b="14285" baseLine="14237" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="14098" r="6749" b="14266">land,</wd>

<space/>

<wd l="6821" t="14102" r="7224" b="14242">June.</wd>

<space/>

<wd l="7296" t="14098" r="8237" b="14242">Association</wd>

<space/>

<wd l="8299" t="14098" r="8530" b="14242">for</wd>

<space/>

<wd l="8597" t="14098" r="9773" b="14280">Computational</wd>

<space/>

<wd l="9835" t="14098" r="10502" b="14285">Linguis-</wd>

</ln>

<ln l="6365" t="14318" r="6677" b="14462" baseLine="14458" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="14318" r="6677" b="14462">tics.</wd>

</ln>

</para>

<para l="6144" t="14683" r="10512" b="15307" alignment="justified" li="216" spaceBefore="142" fli="-216" lsp="exactly" lspExact="218" language="en">

<ln l="6144" t="14683" r="10502" b="14870" baseLine="14818" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14683" r="6797" b="14827">Michael</wd>

<space/>

<wd l="6864" t="14683" r="7474" b="14827">Collins.</wd>

<space/>

<wd l="7589" t="14683" r="8021" b="14827">2002.</wd>

<space/>

<wd l="8131" t="14683" r="9307" b="14827">Discriminative</wd>

<space/>

<wd l="9370" t="14683" r="9984" b="14870">training</wd>

<space/>

<wd l="10046" t="14683" r="10502" b="14827">meth-</wd>

</ln>

<ln l="6370" t="14899" r="10502" b="15086" baseLine="15038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="14899" r="6634" b="15043">ods</wd>

<space/>

<wd l="6696" t="14899" r="6931" b="15043">for</wd>

<space/>

<wd l="6984" t="14899" r="7531" b="15043">hidden</wd>

<space/>

<wd l="7584" t="14899" r="8208" b="15043">Markov</wd>

<space/>

<wd l="8266" t="14899" r="8880" b="15043">models:</wd>

<space/>

<wd l="8971" t="14899" r="9547" b="15086">Theory</wd>

<space/>

<wd l="9610" t="14899" r="9893" b="15043">and</wd>

<space/>

<wd l="9955" t="14899" r="10502" b="15082">experi-</wd>

</ln>

<ln l="6365" t="15120" r="10512" b="15307" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="15139" r="6835" b="15264">ments</wd>

<space/>

<wd l="6907" t="15120" r="7262" b="15264">with</wd>

<space/>

<wd l="7334" t="15139" r="8184" b="15302">perceptron</wd>

<space/>

<wd l="8256" t="15120" r="9144" b="15307">algorithms.</wd>

<space/>

<wd l="9288" t="15125" r="9456" b="15259">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9523" t="15120" r="10512" b="15302">Proceedings</wd>

</run>

</ln>

</para>

</column>

</section>

<dd l="1425" t="15736" r="10546" b="15977">

<para l="5804" t="15792" r="6143" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5870" t="15792" r="6077" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="40">

<wd l="5870" t="15792" r="6077" b="15946">97</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4314.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1423" marginTop="1296" marginRight="1365" marginBottom="1292" offsetX="-24" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1423" t="1296" r="10544" b="15311">

<column l="1423" t="1296" r="5825" b="15311">

<para l="1651" t="1334" r="5808" b="2179" alignment="justified" li="216" spaceBefore="5" lsp="exactly" lspExact="220" language="en">

<ln l="1661" t="1334" r="5803" b="1517" baseLine="1474" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="1334" r="1843" b="1517">of</wd>

<space/>

<wd l="1906" t="1334" r="2141" b="1478">the</wd>

<space/>

<wd l="2227" t="1334" r="2621" b="1478">2002</wd>

<space/>

<wd l="2722" t="1334" r="3624" b="1517">Conference</wd>

<space/>

<wd l="3715" t="1382" r="3907" b="1478">on</wd>

<space/>

<wd l="3989" t="1334" r="4795" b="1517">Empirical</wd>

<space/>

<wd l="4872" t="1334" r="5563" b="1478">Methods</wd>

<space/>

<wd l="5659" t="1339" r="5803" b="1478">in</wd>

<space/>

</ln>

<ln l="1651" t="1555" r="5798" b="1742" baseLine="1694">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="1555" r="2275" b="1699">Natural</wd>

<space/>

<wd l="2347" t="1560" r="3139" b="1738">Language</wd>

<space/>

<wd l="3216" t="1560" r="4090" b="1738">Processing</wd>

<space/>

</run>

<wd l="4176" t="1555" r="5266" b="1733"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(EMNLP’02)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5352" t="1598" r="5798" b="1742">pages</wd>

<space/>

</run>

</ln>

<ln l="1675" t="1776" r="5808" b="1963" baseLine="1910" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="1776" r="2002" b="1944">1–8,</wd>

<space/>

<wd l="2107" t="1776" r="3086" b="1944">Morristown,</wd>

<space/>

<wd l="3187" t="1781" r="3456" b="1944">NJ,</wd>

<space/>

<wd l="3547" t="1776" r="3989" b="1944">USA,</wd>

<space/>

<wd l="4085" t="1776" r="4445" b="1963">July.</wd>

<space/>

<wd l="4546" t="1776" r="5486" b="1920">Association</wd>

<space/>

<wd l="5573" t="1776" r="5808" b="1920">for</wd>

<space/>

</ln>

<ln l="1661" t="1992" r="3816" b="2179" baseLine="2131" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="1992" r="2842" b="2174">Computational</wd>

<space/>

<wd l="2894" t="1992" r="3816" b="2179">Linguistics.</wd>

</ln>

</para>

<para l="1440" t="2400" r="5808" b="3682" alignment="justified" li="216" spaceBefore="183" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="2400" r="5798" b="2544" baseLine="2539" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2400" r="1790" b="2544">Paul</wd>

<space/>

<wd l="1882" t="2400" r="2309" b="2544">Cook</wd>

<space/>

<wd l="2400" t="2400" r="2683" b="2544">and</wd>

<space/>

<wd l="2774" t="2400" r="3442" b="2544">Suzanne</wd>

<space/>

<wd l="3533" t="2400" r="4378" b="2544">Stevenson.</wd>

<space/>

<wd l="4579" t="2400" r="5011" b="2544">2009.</wd>

<space/>

<wd l="5213" t="2405" r="5458" b="2539">An</wd>

<space/>

<wd l="5539" t="2443" r="5798" b="2544">un-</wd>

</ln>

<ln l="1666" t="2621" r="5794" b="2808" baseLine="2755" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1666" t="2621" r="2510" b="2803">supervised</wd>

<space/>

<wd l="2597" t="2621" r="3091" b="2765">model</wd>

<space/>

<wd l="3182" t="2621" r="3418" b="2765">for</wd>

<space/>

<wd l="3504" t="2640" r="3802" b="2765">text</wd>

<space/>

<wd l="3888" t="2664" r="4560" b="2808">message</wd>

<space/>

<wd l="4646" t="2621" r="5794" b="2765">normalization.</wd>

<space/>

</ln>

<ln l="1656" t="2837" r="5808" b="3019" baseLine="2976">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="2842" r="1824" b="2976">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1891" t="2837" r="2880" b="3019">Proceedings</wd>

<space/>

<wd l="2952" t="2837" r="3134" b="3019">of</wd>

<space/>

<wd l="3178" t="2837" r="3413" b="2981">the</wd>

<space/>

<wd l="3494" t="2837" r="4272" b="3019">Workshop</wd>

<space/>

<wd l="4349" t="2885" r="4536" b="2981">on</wd>

<space/>

<wd l="4618" t="2837" r="5808" b="3019">Computational</wd>

<space/>

</run>

</ln>

<ln l="1642" t="3058" r="5798" b="3245" baseLine="3192">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1642" t="3058" r="2597" b="3240">Approaches</wd>

<space/>

<wd l="2683" t="3086" r="2832" b="3202">to</wd>

<space/>

<wd l="2909" t="3062" r="3710" b="3240">Linguistic</wd>

<space/>

</run>

<wd l="3802" t="3062" r="4627" b="3240"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Creativity</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4723" t="3101" r="5170" b="3245">pages</wd>

<space/>

<wd l="5256" t="3058" r="5798" b="3226">71–78,</wd>

<space/>

</run>

</ln>

<ln l="1656" t="3278" r="5798" b="3461" baseLine="3413" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="3278" r="2338" b="3446">Boulder,</wd>

<space/>

<wd l="2405" t="3278" r="3187" b="3446">Colorado,</wd>

<space/>

<wd l="3250" t="3283" r="3653" b="3422">June.</wd>

<space/>

<wd l="3720" t="3278" r="4666" b="3422">Association</wd>

<space/>

<wd l="4718" t="3278" r="4954" b="3422">for</wd>

<space/>

<wd l="5011" t="3278" r="5798" b="3461">Computa-</wd>

</ln>

<ln l="1656" t="3494" r="3086" b="3682" baseLine="3634" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="3494" r="2107" b="3638">tional</wd>

<space/>

<wd l="2160" t="3494" r="3086" b="3682">Linguistics.</wd>

</ln>

</para>

<para l="1440" t="3902" r="5808" b="4978" alignment="justified" li="216" spaceBefore="180" fli="-216" lsp="exactly" lspExact="225" language="en">

<ln l="1440" t="3902" r="5803" b="4085" baseLine="4037">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1440" t="3902" r="1848" b="4046">Felix</wd>

<space/>

<wd l="1963" t="3902" r="2371" b="4046">Gers.</wd>

<space/>

<wd l="2650" t="3902" r="3082" b="4046">2001.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="3346" t="3907" r="3758" b="4085">Long</wd>

<space/>

<wd l="3869" t="3902" r="4771" b="4046">Short-Term</wd>

<space/>

<wd l="4872" t="3907" r="5539" b="4085">Memory</wd>

<space/>

<wd l="5659" t="3907" r="5803" b="4046">in</wd>

<space/>

</run>

</ln>

<ln l="1651" t="4099" r="5803" b="4310" baseLine="4281">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1651" t="4147" r="2453" b="4286">Recurrent</wd>

<space/>

<wd l="2534" t="4142" r="3091" b="4286">Neural</wd>

<space/>

</run>

<wd l="3178" t="4142" r="3974" b="4286"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">Networks</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="4195" t="4142" r="4642" b="4286">Ph.D.</wd>

<space/>

<wd l="4742" t="4142" r="5242" b="4310">thesis,</wd>

<space/>

<wd l="5352" t="4099" r="5803" b="4286">École</wd>

<space/>

</run>

</ln>

<ln l="1656" t="4363" r="5808" b="4550" baseLine="4498" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="4363" r="2798" b="4550">Polytechnique</wd>

<space/>

<wd l="2870" t="4363" r="3552" b="4507">Fédérale</wd>

<space/>

<wd l="3634" t="4363" r="3811" b="4507">de</wd>

<space/>

<wd l="3888" t="4368" r="4694" b="4531">Lausanne,</wd>

<space/>

<wd l="4776" t="4363" r="5808" b="4550">Département</wd>

<space/>

</ln>

<ln l="1661" t="4584" r="5789" b="4771" baseLine="4718">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1661" t="4584" r="2909" b="4771">d’Informatique,</wd>

<space/>

<wd l="2981" t="4589" r="3782" b="4728">Lausanne.</wd>

<space/>

<wd l="3859" t="4584" r="4843" b="4728">Switzerland.</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-3"><wd l="4973" t="4589" r="5789" b="4762">http://</wd>

<space/>

</run>

</ln>

<ln l="1661" t="4805" r="5405" b="4978" baseLine="4939">

<wd l="1661" t="4805" r="5405" b="4978"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-3">www.felixgers.de/papers/phd.pdf</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="5208" r="5803" b="6701" alignment="right" spaceBefore="186" lsp="exactly" lspExact="219" language="en">

<ln l="1440" t="5208" r="5798" b="5395" baseLine="5342" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5208" r="1819" b="5352">Alex</wd>

<space/>

<wd l="1925" t="5208" r="2472" b="5352">Graves</wd>

<space/>

<wd l="2582" t="5208" r="2866" b="5352">and</wd>

<space/>

<wd l="2962" t="5208" r="3662" b="5390">Navdeep</wd>

<space/>

<wd l="3763" t="5208" r="4219" b="5395">Jaitly.</wd>

<space/>

<wd l="4464" t="5208" r="4896" b="5352">2014.</wd>

<space/>

<wd l="5131" t="5208" r="5798" b="5352">Towards</wd>

<space/>

</ln>

<ln l="1661" t="5424" r="5798" b="5611" baseLine="5563" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="5424" r="2525" b="5568">end-to-end</wd>

<space/>

<wd l="2611" t="5424" r="3144" b="5606">speech</wd>

<space/>

<wd l="3226" t="5424" r="4133" b="5611">recognition</wd>

<space/>

<wd l="4214" t="5424" r="4570" b="5568">with</wd>

<space/>

<wd l="4651" t="5443" r="5371" b="5568">recurrent</wd>

<space/>

<wd l="5453" t="5467" r="5798" b="5568">neu-</wd>

</ln>

<ln l="1656" t="5645" r="5798" b="5832" baseLine="5784" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="5645" r="1867" b="5789">ral</wd>

<space/>

<wd l="1930" t="5645" r="2698" b="5789">networks.</wd>

<space/>

<wd l="2822" t="5650" r="2990" b="5784">In</wd>

<space/>

<wd l="3053" t="5645" r="3384" b="5789">Eric</wd>

<space/>

<wd l="3446" t="5650" r="3576" b="5789">P.</wd>

<space/>

<wd l="3648" t="5645" r="4042" b="5832">Xing</wd>

<space/>

<wd l="4114" t="5645" r="4402" b="5789">and</wd>

<space/>

<wd l="4459" t="5650" r="4858" b="5832">Tony</wd>

<space/>

<wd l="4925" t="5645" r="5477" b="5813">Jebara,</wd>

<space/>

<wd l="5554" t="5645" r="5798" b="5789">ed-</wd>

</ln>

<ln l="1656" t="5866" r="5798" b="6048" baseLine="6000">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="5866" r="2054" b="6034">itors,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2155" t="5866" r="3144" b="6048">Proceedings</wd>

<space/>

<wd l="3235" t="5866" r="3413" b="6048">of</wd>

<space/>

<wd l="3480" t="5866" r="3763" b="6010">The</wd>

<space/>

<wd l="3854" t="5866" r="4190" b="6010">31st</wd>

<space/>

<wd l="4267" t="5866" r="5323" b="6010">International</wd>

<space/>

<wd l="5414" t="5870" r="5798" b="6010">Con-</wd>

</run>

</ln>

<ln l="1622" t="6082" r="5803" b="6264" baseLine="6221">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1622" t="6082" r="2237" b="6264">ference</wd>

<space/>

<wd l="2304" t="6130" r="2496" b="6226">on</wd>

<space/>

<wd l="2558" t="6082" r="3254" b="6226">Machine</wd>

<space/>

</run>

<wd l="3317" t="6086" r="4094" b="6264"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Learning</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4166" t="6082" r="4762" b="6226">volume</wd>

<space/>

<wd l="4829" t="6082" r="5021" b="6226">32</wd>

<space/>

<wd l="5093" t="6082" r="5266" b="6226">of</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5314" t="6086" r="5803" b="6226">JMLR</wd>

<space/>

</run>

</ln>

<ln l="1666" t="6302" r="5765" b="6485" baseLine="6442">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1666" t="6302" r="2443" b="6485">Workshop</wd>

<space/>

<wd l="2544" t="6302" r="2851" b="6446">and</wd>

<space/>

<wd l="2952" t="6302" r="3850" b="6485">Conference</wd>

<space/>

</run>

<wd l="3950" t="6302" r="4973" b="6485"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Proceedings</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0"><wd l="5213" t="6317" r="5765" b="6480">http:</wd>

<space/>

</run>

</ln>

<ln l="1675" t="6528" r="5760" b="6701" baseLine="6658">

<wd l="1675" t="6528" r="5760" b="6701"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">//jmlr.org/proceedings/papers/v32/</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="6926" r="5818" b="8194" alignment="justified" li="216" spaceBefore="184" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="6926" r="5794" b="7114" baseLine="7066" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="1440" t="6931" r="1670" b="7070">Bo</wd>

<space/>

<wd l="1766" t="6931" r="2141" b="7094">Han,</wd>

<space/>

<wd l="2246" t="6926" r="2597" b="7070">Paul</wd>

<space/>

<wd l="2698" t="6926" r="3168" b="7094">Cook,</wd>

<space/>

<wd l="3278" t="6926" r="3566" b="7070">and</wd>

<space/>

<wd l="3658" t="6926" r="4330" b="7114">Timothy</wd>

<space/>

<wd l="4426" t="6926" r="5141" b="7070">Baldwin.</wd>

<space/>

<wd l="5362" t="6926" r="5794" b="7070">2013.</wd>

<space/>

</ln>

<ln l="1656" t="7147" r="5818" b="7291" baseLine="7286">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4"><wd l="1656" t="7147" r="2251" b="7291">Lexical</wd>

<space/>

<wd l="2323" t="7147" r="3432" b="7291">normalization</wd>

<space/>

<wd l="3504" t="7147" r="3734" b="7291">for</wd>

<space/>

<wd l="3816" t="7147" r="4267" b="7291">social</wd>

<space/>

<wd l="4344" t="7147" r="4834" b="7291">media</wd>

<space/>

<wd l="4901" t="7166" r="5237" b="7291">text.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4"><wd l="5376" t="7152" r="5818" b="7291">ACM</wd>

<space/>

</run>

</ln>

<ln l="1666" t="7368" r="5798" b="7550" baseLine="7502" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="1666" t="7373" r="2683" b="7512">Transactions</wd>

<space/>

<wd l="2789" t="7416" r="2976" b="7512">on</wd>

<space/>

<wd l="3072" t="7368" r="3902" b="7550">Intelligent</wd>

<space/>

<wd l="3994" t="7373" r="4622" b="7550">Systems</wd>

<space/>

<wd l="4723" t="7368" r="5026" b="7512">and</wd>

<space/>

<wd l="5126" t="7368" r="5798" b="7512">Technol-</wd>

</ln>

<ln l="1661" t="7584" r="5798" b="7766" baseLine="7723" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="1661" t="7632" r="1944" b="7766">ogy</wd>

<space/>

<wd l="2054" t="7589" r="2558" b="7762">(TIST)</wd>

<space/>

<wd l="2683" t="7670" r="2731" b="7685">-</wd>

<space/>

<wd l="2846" t="7584" r="3432" b="7766">Special</wd>

<space/>

<wd l="3538" t="7589" r="4099" b="7728">section</wd>

<space/>

<wd l="4210" t="7632" r="4402" b="7728">on</wd>

<space/>

<wd l="4517" t="7589" r="5040" b="7728">twitter</wd>

<space/>

<wd l="5136" t="7584" r="5438" b="7728">and</wd>

<space/>

<wd l="5539" t="7589" r="5798" b="7728">mi-</wd>

</ln>

<ln l="1661" t="7805" r="5798" b="7987" baseLine="7939" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="1661" t="7805" r="2616" b="7987">croblogging</wd>

<space/>

<wd l="2770" t="7810" r="3437" b="7973">services,</wd>

<space/>

<wd l="3634" t="7805" r="4114" b="7949">social</wd>

<space/>

<wd l="4262" t="7805" r="5357" b="7949">recommender</wd>

<space/>

<wd l="5496" t="7853" r="5798" b="7987">sys-</wd>

</ln>

<ln l="1661" t="8026" r="5798" b="8194" baseLine="8160">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4"><wd l="1661" t="8054" r="2054" b="8194">tems,</wd>

<space/>

<wd l="2251" t="8026" r="2554" b="8170">and</wd>

<space/>

<wd l="2707" t="8026" r="3797" b="8170">CAMRa2010:</wd>

<space/>

<wd l="4066" t="8030" r="4565" b="8170">Movie</wd>

<space/>

<wd l="4723" t="8026" r="5798" b="8170">recommenda-</wd>

</run>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1661" t="8242" r="5803" b="8419" alignment="left" li="216" spaceBefore="1" lsp="exactly" lspExact="215" language="en">

<tabs position="1661"/>

<ln l="1661" t="8242" r="5803" b="8419" baseLine="8381">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="8246" r="1963" b="8386">tion</wd>

<space/>

<wd l="2136" t="8246" r="2275" b="8386">in</wd>

<space/>

<wd l="2443" t="8270" r="3014" b="8386">context</wd>

<space/>

</run>

<wd l="3168" t="8242" r="3797" b="8410"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">archive</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3989" t="8242" r="5122" b="8419">4(1):5:1–5:27.</wd>

<tab position="5122"/>

<wd l="5554" t="8242" r="5803" b="8386">doi</wd>

</run>

</ln>

</para>

<para l="1675" t="8462" r="3845" b="8606" alignment="left" li="216" lsp="exactly" lspExact="219" language="en">

<ln l="1675" t="8462" r="3845" b="8606" baseLine="8597" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1675" t="8462" r="3845" b="8606">10.1145/2414425.2414430.</wd>

</ln>

</para>

<para l="1445" t="8870" r="5798" b="9485" alignment="justified" li="216" spaceBefore="185" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1445" t="8870" r="5794" b="9058" baseLine="9005" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="8870" r="1834" b="9053">Sepp</wd>

<space/>

<wd l="1954" t="8870" r="2808" b="9014">Hochreiter</wd>

<space/>

<wd l="2928" t="8870" r="3211" b="9014">and</wd>

<space/>

<wd l="3326" t="8875" r="3854" b="9058">Jürgen</wd>

<space/>

<wd l="3974" t="8870" r="5059" b="9014">Schmidhuber.</wd>

<space/>

<wd l="5376" t="8870" r="5794" b="9014">1997.</wd>

<space/>

</ln>

<ln l="1656" t="9086" r="5798" b="9274" baseLine="9226">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="9091" r="2074" b="9274">Long</wd>

<space/>

<wd l="2194" t="9086" r="3014" b="9230">short-term</wd>

<space/>

<wd l="3115" t="9130" r="3806" b="9274">memory.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4056" t="9086" r="4613" b="9230">Neural</wd>

<space/>

</run>

<wd l="4723" t="9091" r="5798" b="9269"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Computation</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="1661" t="9307" r="5688" b="9485" baseLine="9442" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="9307" r="2981" b="9485">9(8):1735–1780.</wd>

<space/>

<wd l="3067" t="9307" r="5688" b="9451">doi:10.1162/neco.1997.9.8.1735.</wd>

</ln>

</para>

<para l="1440" t="9715" r="5808" b="11645" alignment="justified" li="216" spaceBefore="189" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1440" t="9715" r="5808" b="9902" baseLine="9850" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9715" r="1872" b="9859">Mark</wd>

<space/>

<wd l="2035" t="9720" r="2218" b="9859">D.</wd>

<space/>

<wd l="2400" t="9715" r="3264" b="9902">Kernighan,</wd>

<space/>

<wd l="3470" t="9715" r="4138" b="9859">Kenneth</wd>

<space/>

<wd l="4301" t="9720" r="4512" b="9859">W.</wd>

<space/>

<wd l="4690" t="9715" r="5318" b="9883">Church,</wd>

<space/>

<wd l="5525" t="9715" r="5808" b="9859">and</wd>

<space/>

</ln>

<ln l="1656" t="9931" r="5798" b="10118" baseLine="10070" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="9931" r="2309" b="10075">William</wd>

<space/>

<wd l="2366" t="9936" r="2549" b="10075">A.</wd>

<space/>

<wd l="2626" t="9931" r="3034" b="10075">Gale.</wd>

<space/>

<wd l="3173" t="9931" r="3590" b="10075">1990.</wd>

<space/>

<wd l="3706" t="9936" r="3850" b="10070">A</wd>

<space/>

<wd l="3922" t="9931" r="4541" b="10118">spelling</wd>

<space/>

<wd l="4608" t="9931" r="5414" b="10075">correction</wd>

<space/>

<wd l="5472" t="9974" r="5798" b="10114">pro-</wd>

</ln>

<ln l="1661" t="10152" r="5798" b="10339" baseLine="10286" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1661" t="10195" r="2069" b="10339">gram</wd>

<space/>

<wd l="2155" t="10152" r="2611" b="10296">based</wd>

<space/>

<wd l="2702" t="10195" r="2899" b="10296">on</wd>

<space/>

<wd l="2995" t="10195" r="3082" b="10296">a</wd>

<space/>

<wd l="3163" t="10152" r="3595" b="10339">noisy</wd>

<space/>

<wd l="3691" t="10152" r="4306" b="10296">channel</wd>

<space/>

<wd l="4397" t="10152" r="4930" b="10296">model.</wd>

<space/>

<wd l="5141" t="10157" r="5309" b="10291">In</wd>

<space/>

<wd l="5395" t="10157" r="5798" b="10296">Hans</wd>

<space/>

</ln>

<ln l="1661" t="10373" r="5803" b="10560" baseLine="10507">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1661" t="10373" r="2410" b="10560">Karlgren,</wd>

<space/>

<wd l="2486" t="10373" r="2986" b="10541">editor,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="3067" t="10373" r="4109" b="10517">COLING-90:</wd>

<space/>

<wd l="4210" t="10378" r="4757" b="10555">Papers</wd>

<space/>

<wd l="4800" t="10373" r="5592" b="10555">presented</wd>

<space/>

<wd l="5654" t="10402" r="5803" b="10517">to</wd>

<space/>

</run>

</ln>

<ln l="1661" t="10589" r="5808" b="10771" baseLine="10728" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1661" t="10589" r="1901" b="10733">the</wd>

<space/>

<wd l="1949" t="10589" r="2290" b="10733">13th</wd>

<space/>

<wd l="2328" t="10589" r="3389" b="10733">International</wd>

<space/>

<wd l="3432" t="10589" r="4330" b="10771">Conference</wd>

<space/>

<wd l="4378" t="10637" r="4570" b="10733">on</wd>

<space/>

<wd l="4618" t="10589" r="5808" b="10771">Computational</wd>

<space/>

</ln>

<ln l="1651" t="10810" r="5803" b="10992" baseLine="10944" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1651" t="10814" r="2534" b="10992">Linguistics</wd>

<space/>

<wd l="2592" t="10858" r="2784" b="10954">on</wd>

<space/>

<wd l="2851" t="10810" r="3086" b="10954">the</wd>

<space/>

<wd l="3149" t="10814" r="3850" b="10954">occasion</wd>

<space/>

<wd l="3917" t="10810" r="4094" b="10992">of</wd>

<space/>

<wd l="4128" t="10810" r="4363" b="10954">the</wd>

<space/>

<wd l="4421" t="10810" r="4771" b="10954">25th</wd>

<space/>

<wd l="4819" t="10814" r="5803" b="10992">Anniversary</wd>

<space/>

</ln>

<ln l="1661" t="11030" r="5803" b="11213" baseLine="11165" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1661" t="11030" r="1843" b="11213">of</wd>

<space/>

<wd l="1891" t="11035" r="2616" b="11174">COLING</wd>

<space/>

<wd l="2678" t="11030" r="2986" b="11174">and</wd>

<space/>

<wd l="3053" t="11030" r="3288" b="11174">the</wd>

<space/>

<wd l="3355" t="11030" r="3806" b="11174">350th</wd>

<space/>

<wd l="3864" t="11035" r="4848" b="11213">Anniversary</wd>

<space/>

<wd l="4925" t="11030" r="5102" b="11213">of</wd>

<space/>

<wd l="5136" t="11030" r="5803" b="11174">Helsinki</wd>

<space/>

</ln>

<ln l="1675" t="11246" r="5765" b="11429" baseLine="11386">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1675" t="11251" r="2506" b="11429">University,</wd>

<space/>

<wd l="2640" t="11246" r="3211" b="11390">Volume</wd>

<space/>

</run>

<wd l="3302" t="11246" r="3442" b="11390"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">2</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-1"><wd l="3658" t="11251" r="5765" b="11424">http://www.aclweb.</wd>

<space/>

</run>

</ln>

<ln l="1670" t="11472" r="4090" b="11645" baseLine="11602">

<wd l="1670" t="11472" r="4090" b="11645"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-1">org/anthology/C/C90/</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="11875" r="5803" b="12720" alignment="justified" li="216" spaceBefore="192" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1440" t="11875" r="5803" b="12062" baseLine="12010" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11875" r="1819" b="12019">John</wd>

<space/>

<wd l="1891" t="11875" r="2568" b="12062">Lafferty,</wd>

<space/>

<wd l="2654" t="11875" r="3283" b="12019">Andrew</wd>

<space/>

<wd l="3360" t="11875" r="4258" b="12043">McCallum,</wd>

<space/>

<wd l="4349" t="11875" r="4632" b="12019">and</wd>

<space/>

<wd l="4704" t="11875" r="5453" b="12019">Fernando</wd>

<space/>

<wd l="5534" t="11875" r="5803" b="12019">CN</wd>

<space/>

</ln>

<ln l="1656" t="12091" r="5798" b="12235" baseLine="12230" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="12091" r="2261" b="12235">Pereira.</wd>

<space/>

<wd l="2443" t="12091" r="2875" b="12235">2001.</wd>

<space/>

<wd l="3053" t="12091" r="3989" b="12235">Conditional</wd>

<space/>

<wd l="4070" t="12091" r="4680" b="12235">random</wd>

<space/>

<wd l="4762" t="12091" r="5227" b="12235">fields:</wd>

<space/>

<wd l="5362" t="12091" r="5798" b="12235">Prob-</wd>

</ln>

<ln l="1661" t="12312" r="5798" b="12499" baseLine="12446" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="12312" r="2285" b="12456">abilistic</wd>

<space/>

<wd l="2395" t="12312" r="2966" b="12456">models</wd>

<space/>

<wd l="3077" t="12312" r="3307" b="12456">for</wd>

<space/>

<wd l="3422" t="12312" r="4325" b="12499">segmenting</wd>

<space/>

<wd l="4440" t="12312" r="4723" b="12456">and</wd>

<space/>

<wd l="4824" t="12312" r="5462" b="12499">labeling</wd>

<space/>

<wd l="5582" t="12355" r="5798" b="12456">se-</wd>

</ln>

<ln l="1661" t="12533" r="3965" b="12720" baseLine="12667" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="12576" r="2222" b="12715">quence</wd>

<space/>

<wd l="2275" t="12533" r="2645" b="12677">data.</wd>

<space/>

<wd l="2726" t="12576" r="3173" b="12720">pages</wd>

<space/>

<wd l="3235" t="12533" r="3965" b="12677">282–289.</wd>

</ln>

</para>

<para l="1440" t="12936" r="5803" b="14222" alignment="right" spaceBefore="182" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="12936" r="5794" b="13123" baseLine="13075">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="12936" r="2078" b="13080">Thomas</wd>

<space/>

<wd l="2141" t="12941" r="2923" b="13123">Lavergne,</wd>

<space/>

<wd l="2995" t="12936" r="3552" b="13080">Olivier</wd>

<space/>

<wd l="3614" t="12936" r="4162" b="13123">Cappé,</wd>

<space/>

<wd l="4234" t="12936" r="4517" b="13080">and</wd>

<space/>

</run>

<wd l="4574" t="12936" r="5251" b="13118"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">François</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="5318" t="12941" r="5794" b="13080">Yvon.</wd>

<space/>

</run>

</ln>

<ln l="1661" t="13157" r="5798" b="13344" baseLine="13291">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1661" t="13157" r="2093" b="13301">2010.</wd>

<space/>

<wd l="2242" t="13157" r="2938" b="13301">Practical</wd>

<space/>

<wd l="3010" t="13200" r="3355" b="13344">very</wd>

<space/>

<wd l="3432" t="13157" r="3826" b="13344">large</wd>

<space/>

<wd l="3907" t="13157" r="4291" b="13301">scale</wd>

<space/>

<wd l="4368" t="13157" r="4699" b="13301">crfs.</wd>

<space/>

<wd l="4848" t="13162" r="5016" b="13296">In</wd>

<space/>

</run>

<wd l="5083" t="13157" r="5798" b="13301" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">Proceed-</wd>

</ln>

<ln l="1666" t="13378" r="5803" b="13560" baseLine="13512" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1666" t="13382" r="1992" b="13560">ings</wd>

<space/>

<wd l="2059" t="13378" r="2242" b="13560">of</wd>

<space/>

<wd l="2275" t="13378" r="2515" b="13522">the</wd>

<space/>

<wd l="2578" t="13378" r="2928" b="13522">48th</wd>

<space/>

<wd l="2981" t="13378" r="3576" b="13522">Annual</wd>

<space/>

<wd l="3629" t="13382" r="4282" b="13560">Meeting</wd>

<space/>

<wd l="4354" t="13378" r="4536" b="13560">of</wd>

<space/>

<wd l="4574" t="13378" r="4810" b="13522">the</wd>

<space/>

<wd l="4862" t="13382" r="5803" b="13522">Association</wd>

<space/>

</ln>

<ln l="1622" t="13594" r="5798" b="13781" baseLine="13733">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1622" t="13594" r="1901" b="13776">for</wd>

<space/>

<wd l="1958" t="13594" r="3144" b="13776">Computational</wd>

<space/>

</run>

<wd l="3192" t="13598" r="4118" b="13776"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">Linguistics</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="4181" t="13637" r="4627" b="13781">pages</wd>

<space/>

<wd l="4694" t="13594" r="5434" b="13762">504–513,</wd>

<space/>

<wd l="5496" t="13598" r="5798" b="13776">Up-</wd>

</run>

</ln>

<ln l="1656" t="13814" r="5803" b="14002" baseLine="13949" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="13814" r="2112" b="13997">psala,</wd>

<space/>

<wd l="2179" t="13814" r="2846" b="13982">Sweden,</wd>

<space/>

<wd l="2914" t="13814" r="3269" b="14002">July.</wd>

<space/>

<wd l="3336" t="13814" r="4277" b="13958">Association</wd>

<space/>

<wd l="4334" t="13814" r="4565" b="13958">for</wd>

<space/>

<wd l="4627" t="13814" r="5803" b="13997">Computational</wd>

<space/>

</ln>

<ln l="1656" t="14035" r="2582" b="14222" baseLine="14170" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="14035" r="2582" b="14222">Linguistics.</wd>

</ln>

</para>

<para l="1440" t="14424" r="5808" b="15302" alignment="justified" li="216" spaceBefore="209" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1440" t="14424" r="5808" b="14650" baseLine="14600">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="14467" r="1584" b="14606">T.</wd>

<space/>

<wd l="1666" t="14462" r="2376" b="14630">Mikolov,</wd>

<space/>

<wd l="2458" t="14467" r="2674" b="14606">M.</wd>

<space/>

<wd l="2760" t="14462" r="3437" b="14630">Karafi´at,</wd>

<space/>

<wd l="3518" t="14467" r="3682" b="14606">L.</wd>

<space/>

<wd l="3758" t="14467" r="4344" b="14650">Burget,</wd>

<space/>

<wd l="4421" t="14467" r="4541" b="14606">J.</wd>

<space/>

</run>

<wd l="4622" t="14424" r="5438" b="14650"><run underlined="none" subsuperscript="superscript" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ˇ</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Cernock´y,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5525" t="14462" r="5808" b="14606">and</wd>

<space/>

</run>

</ln>

<ln l="1661" t="14683" r="5808" b="14866" baseLine="14818" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="14683" r="1810" b="14827">S.</wd>

<space/>

<wd l="1915" t="14683" r="2832" b="14866">Khudanpur.</wd>

<space/>

<wd l="3048" t="14683" r="3480" b="14827">2010.</wd>

<space/>

<wd l="3691" t="14688" r="4478" b="14827">Recurrent</wd>

<space/>

<wd l="4565" t="14683" r="5064" b="14827">neural</wd>

<space/>

<wd l="5155" t="14683" r="5808" b="14827">network</wd>

<space/>

</ln>

<ln l="1656" t="14899" r="5803" b="15086" baseLine="15038">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="14899" r="2112" b="15043">based</wd>

<space/>

<wd l="2179" t="14899" r="2894" b="15086">language</wd>

<space/>

<wd l="2962" t="14899" r="3499" b="15043">model.</wd>

<space/>

<wd l="3634" t="14904" r="3802" b="15038">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3869" t="14899" r="4853" b="15082">Proceedings</wd>

<space/>

<wd l="4925" t="14899" r="5107" b="15082">of</wd>

<space/>

<wd l="5146" t="14899" r="5381" b="15043">the</wd>

<space/>

<wd l="5462" t="14899" r="5803" b="15043">11th</wd>

<space/>

</run>

</ln>

<ln l="1642" t="15120" r="5803" b="15302" baseLine="15259" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="15120" r="2237" b="15264">Annual</wd>

<space/>

<wd l="2371" t="15120" r="3274" b="15302">Conference</wd>

<space/>

<wd l="3408" t="15120" r="3590" b="15302">of</wd>

<space/>

<wd l="3696" t="15120" r="3931" b="15264">the</wd>

<space/>

<wd l="4056" t="15120" r="5117" b="15264">International</wd>

<space/>

<wd l="5246" t="15120" r="5803" b="15302">Speech</wd>

</ln>

</para>

</column>

<column l="6142" t="1296" r="10544" b="12280">

<para l="6365" t="1339" r="10522" b="2611" alignment="left" li="216" spaceBefore="14" lsp="exactly" lspExact="218" language="en">

<ln l="6374" t="1339" r="10522" b="1512" baseLine="1474" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="1339" r="7632" b="1478">Communication</wd>

<space/>

<wd l="7915" t="1339" r="8856" b="1478">Association</wd>

<space/>

<wd l="9154" t="1339" r="10522" b="1512">(INTERSPEECH</wd>

<space/>

</ln>

<ln l="6365" t="1555" r="10507" b="1738" baseLine="1694">

<wd l="6365" t="1555" r="6874" b="1733"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2010)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7075" t="1555" r="7896" b="1723">Makuhari,</wd>

<space/>

<wd l="8102" t="1555" r="8616" b="1723">Chiba,</wd>

<space/>

<wd l="8822" t="1560" r="9312" b="1738">Japan.</wd>

<space/>

<wd l="9494" t="1555" r="10507" b="1699">International</wd>

<space/>

</run>

</ln>

<ln l="6370" t="1776" r="10498" b="1958" baseLine="1910" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="1776" r="6941" b="1958">Speech</wd>

<space/>

<wd l="7181" t="1776" r="8462" b="1920">Communication</wd>

<space/>

<wd l="8698" t="1776" r="9638" b="1920">Association</wd>

<space/>

<wd l="9883" t="1776" r="10498" b="1954">(ICSA).</wd>

<space/>

</ln>

<ln l="6370" t="1997" r="10291" b="2170" baseLine="2131" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">

<wd l="6370" t="1997" r="10291" b="2170">http://www.fit.vutbr.cz/research/</wd>

<space/>

</ln>

<ln l="6374" t="2218" r="10315" b="2390" baseLine="2352" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">

<wd l="6374" t="2218" r="10315" b="2390">groups/speech/publi/2010/mikolov_</wd>

<space/>

</ln>

<ln l="6379" t="2448" r="9749" b="2611" baseLine="2568">

<wd l="6379" t="2448" r="9749" b="2611"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">interspeech2010_IS100722.pdf</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="2832" r="10502" b="3014" alignment="left" spaceBefore="180" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="2832" r="10502" b="3014" baseLine="2966">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="6144" t="2832" r="6667" b="2976">Tom´aˇs</wd>

<space/>

<wd l="6758" t="2832" r="7469" b="2976">Mikolov.</wd>

<space/>

<wd l="7675" t="2832" r="8107" b="2976">2012.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="8314" t="2832" r="9110" b="2976">Statistical</wd>

<space/>

<wd l="9192" t="2837" r="9989" b="3014">Language</wd>

<space/>

<wd l="10075" t="2832" r="10502" b="2976">Mod-</wd>

</run>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6365" t="3048" r="10512" b="4325" alignment="justified" li="216" spaceBefore="6" lsp="exactly" lspExact="218" language="en">

<tabs position="6365"/>

<ln l="6370" t="3048" r="10502" b="3216" baseLine="3187" forcedEOF="true">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="3048" r="6586" b="3192">els</wd>

<space/>

<wd l="6710" t="3048" r="7181" b="3192">based</wd>

<space/>

<wd l="7306" t="3096" r="7498" b="3192">on</wd>

<space/>

<wd l="7622" t="3048" r="8184" b="3192">Neural</wd>

<space/>

</run>

<wd l="8304" t="3048" r="9096" b="3192"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Networks</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><tab position="9096"/>

<wd l="9427" t="3048" r="9869" b="3192">Ph.D.</wd>

<space/>

<wd l="10008" t="3048" r="10502" b="3216">thesis,
</wd>

</run>

</ln>

<ln l="6365" t="3269" r="10502" b="3456" baseLine="3408" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="6365" t="3274" r="6758" b="3413">Brno</wd>

<space/>

<wd l="6888" t="3269" r="7718" b="3456">University</wd>

<space/>

<wd l="7853" t="3269" r="8026" b="3413">of</wd>

<space/>

<wd l="8141" t="3269" r="9110" b="3456">Technology,</wd>

<space/>

<wd l="9264" t="3269" r="9854" b="3456">Faculty</wd>

<space/>

<wd l="9989" t="3269" r="10162" b="3413">of</wd>

<space/>

<wd l="10277" t="3274" r="10502" b="3408">In-</wd>

</ln>

<ln l="6365" t="3490" r="10512" b="3677" baseLine="3624" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="6365" t="3490" r="7152" b="3634">formation</wd>

<space/>

<wd l="7267" t="3490" r="8232" b="3677">Technology,</wd>

<space/>

<wd l="8376" t="3494" r="9317" b="3672">Department</wd>

<space/>

<wd l="9437" t="3490" r="9610" b="3634">of</wd>

<space/>

<wd l="9720" t="3490" r="10512" b="3672">Computer</wd>

<space/>

</ln>

<ln l="6370" t="3706" r="10498" b="3888" baseLine="3845" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="6370" t="3706" r="7075" b="3888">Graphics</wd>

<space/>

<wd l="7171" t="3706" r="7459" b="3850">and</wd>

<space/>

<wd l="7541" t="3706" r="8515" b="3874">Multimedia,</wd>

<space/>

<wd l="8616" t="3710" r="9058" b="3874">Brno,</wd>

<space/>

<wd l="9163" t="3706" r="9658" b="3850">Czech</wd>

<space/>

<wd l="9744" t="3706" r="10498" b="3888">Republic.</wd>

<space/>

</ln>

<ln l="6370" t="3931" r="10411" b="4104" baseLine="4066" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0" forcedEOF="true">

<wd l="6370" t="3931" r="10411" b="4104">http://www.fit.vutbr.cz/˜imikolov/</wd>

<space/>

</ln>

<ln l="6379" t="4152" r="8314" b="4325" baseLine="4282" forcedEOF="true">

<wd l="6379" t="4152" r="8314" b="4325"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">rnnlm/thesis.pdf</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="4546" r="10512" b="6038" alignment="justified" li="216" spaceBefore="173" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="4546" r="10502" b="4690" baseLine="4680" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4546" r="6802" b="4690">Andreas</wd>

<space/>

<wd l="6874" t="4546" r="7502" b="4690">Stolcke.</wd>

<space/>

<wd l="7618" t="4546" r="8050" b="4690">2002.</wd>

<space/>

<wd l="8170" t="4546" r="8770" b="4690">SRILM</wd>

<space/>

<wd l="8832" t="4632" r="9034" b="4646">—</wd>

<space/>

<wd l="9096" t="4589" r="9274" b="4690">an</wd>

<space/>

<wd l="9341" t="4546" r="10142" b="4690">extensible</wd>

<space/>

<wd l="10200" t="4546" r="10502" b="4690">lan-</wd>

</ln>

<ln l="6370" t="4762" r="10512" b="4949" baseLine="4901" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="4805" r="6835" b="4949">guage</wd>

<space/>

<wd l="6902" t="4762" r="7651" b="4949">modeling</wd>

<space/>

<wd l="7718" t="4762" r="8275" b="4906">toolkit.</wd>

<space/>

<wd l="8405" t="4766" r="8568" b="4901">In</wd>

<space/>

<wd l="8630" t="4762" r="9010" b="4906">John</wd>

<space/>

<wd l="9072" t="4766" r="9254" b="4906">H.</wd>

<space/>

<wd l="9326" t="4766" r="9490" b="4906">L.</wd>

<space/>

<wd l="9562" t="4766" r="10162" b="4906">Hansen</wd>

<space/>

<wd l="10229" t="4762" r="10512" b="4906">and</wd>

<space/>

</ln>

<ln l="6365" t="4982" r="10502" b="5170" baseLine="5122">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="4987" r="6845" b="5170">Bryan</wd>

<space/>

<wd l="6902" t="4982" r="7512" b="5150">Pellom,</wd>

<space/>

<wd l="7574" t="4982" r="8155" b="5150">editors,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="8213" t="4982" r="9202" b="5165">Proceedings</wd>

<space/>

<wd l="9259" t="4982" r="9437" b="5165">of</wd>

<space/>

<wd l="9466" t="4982" r="9701" b="5126">the</wd>

<space/>

<wd l="9768" t="4982" r="10008" b="5126">7th</wd>

<space/>

<wd l="10056" t="4987" r="10502" b="5126">Inter-</wd>

</run>

</ln>

<ln l="6365" t="5203" r="10502" b="5386" baseLine="5338" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="5203" r="7032" b="5347">national</wd>

<space/>

<wd l="7099" t="5203" r="8002" b="5386">Conference</wd>

<space/>

<wd l="8069" t="5251" r="8261" b="5347">on</wd>

<space/>

<wd l="8328" t="5203" r="8899" b="5386">Spoken</wd>

<space/>

<wd l="8962" t="5208" r="9758" b="5386">Language</wd>

<space/>

<wd l="9821" t="5208" r="10502" b="5347">Process-</wd>

</ln>

<ln l="6374" t="5419" r="10502" b="5606" baseLine="5558">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6374" t="5424" r="6614" b="5602">ing</wd>

<space/>

</run>

<wd l="6662" t="5419" r="7762" b="5597"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">(ICSLP2002)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="7814" t="5419" r="8405" b="5563">volume</wd>

<space/>

<wd l="8448" t="5419" r="8587" b="5587">2,</wd>

<space/>

<wd l="8635" t="5462" r="9086" b="5606">pages</wd>

<space/>

<wd l="9134" t="5419" r="9869" b="5587">901–904,</wd>

<space/>

<wd l="9917" t="5419" r="10502" b="5587">Baixas,</wd>

<space/>

</run>

</ln>

<ln l="6365" t="5640" r="10502" b="5822" baseLine="5774" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="5645" r="6946" b="5784">France.</wd>

<space/>

<wd l="7008" t="5640" r="8026" b="5784">International</wd>

<space/>

<wd l="8083" t="5640" r="8654" b="5822">Speech</wd>

<space/>

<wd l="8712" t="5640" r="9994" b="5784">Communication</wd>

<space/>

<wd l="10046" t="5645" r="10502" b="5784">Asso-</wd>

</ln>

<ln l="6370" t="5861" r="7579" b="6038" baseLine="5995" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="5861" r="6907" b="6005">ciation</wd>

<space/>

<wd l="6965" t="5861" r="7579" b="6038">(ISCA).</wd>

</ln>

</para>

<para l="6149" t="6259" r="10512" b="7320" alignment="justified" li="216" spaceBefore="192" fli="-216" lsp="exactly" lspExact="217" language="en">

<ln l="6149" t="6259" r="10512" b="6446" baseLine="6394" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="6259" r="6562" b="6403">Oriol</wd>

<space/>

<wd l="6643" t="6259" r="7291" b="6446">Vinyals,</wd>

<space/>

<wd l="7387" t="6259" r="8213" b="6403">Alexander</wd>

<space/>

<wd l="8290" t="6259" r="8885" b="6427">Toshev,</wd>

<space/>

<wd l="8986" t="6259" r="9427" b="6446">Samy</wd>

<space/>

<wd l="9514" t="6259" r="10133" b="6446">Bengio,</wd>

<space/>

<wd l="10229" t="6259" r="10512" b="6403">and</wd>

<space/>

</ln>

<ln l="6365" t="6475" r="10507" b="6619" baseLine="6614" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="6475" r="7037" b="6619">Dumitru</wd>

<space/>

<wd l="7123" t="6475" r="7637" b="6619">Erhan.</wd>

<space/>

<wd l="7829" t="6475" r="8261" b="6619">2015.</wd>

<space/>

<wd l="8453" t="6475" r="8894" b="6619">Show</wd>

<space/>

<wd l="8986" t="6475" r="9269" b="6619">and</wd>

<space/>

<wd l="9350" t="6475" r="9643" b="6619">tell:</wd>

<space/>

<wd l="9787" t="6480" r="9931" b="6614">A</wd>

<space/>

<wd l="10013" t="6475" r="10507" b="6619">neural</wd>

<space/>

</ln>

<ln l="6365" t="6696" r="10493" b="6883" baseLine="6835">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="6696" r="6850" b="6883">image</wd>

<space/>

<wd l="6922" t="6696" r="7502" b="6878">caption</wd>

<space/>

<wd l="7574" t="6715" r="8347" b="6883">generator.</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0"><wd l="8482" t="6701" r="10493" b="6874">http://arxiv.org/</wd>

<space/>

</run>

</ln>

<ln l="6374" t="6917" r="10512" b="7099" baseLine="7051">

<wd l="6374" t="6922" r="7963" b="7085"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">abs/1411.4555</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8050" t="6936" r="8203" b="7061">to</wd>

<space/>

<wd l="8285" t="6960" r="8813" b="7099">appear</wd>

<space/>

<wd l="8890" t="6917" r="9043" b="7056">in</wd>

<space/>

<wd l="9125" t="6917" r="9917" b="7099">Computer</wd>

<space/>

<wd l="9994" t="6917" r="10512" b="7061">Vision</wd>

<space/>

</run>

</ln>

<ln l="6370" t="7133" r="8323" b="7320" baseLine="7272" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="7133" r="6653" b="7277">and</wd>

<space/>

<wd l="6701" t="7138" r="7262" b="7277">Pattern</wd>

<space/>

<wd l="7310" t="7133" r="8323" b="7320">Recognition.</wd>

</ln>

</para>

<para l="6144" t="7531" r="10512" b="8597" alignment="justified" li="216" spaceBefore="175" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="7531" r="10512" b="7718" baseLine="7670" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7531" r="6586" b="7718">Andy</wd>

<space/>

<wd l="6648" t="7536" r="7032" b="7718">Way.</wd>

<space/>

<wd l="7157" t="7531" r="7589" b="7675">2010.</wd>

<space/>

<wd l="7704" t="7531" r="8400" b="7675">Machine</wd>

<space/>

<wd l="8462" t="7531" r="9341" b="7675">translation.</wd>

<space/>

<wd l="9456" t="7536" r="9624" b="7670">In</wd>

<space/>

<wd l="9686" t="7531" r="10512" b="7675">Alexander</wd>

<space/>

</ln>

<ln l="6370" t="7752" r="10507" b="7934" baseLine="7891">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="7752" r="6850" b="7920">Clark,</wd>

<space/>

<wd l="6931" t="7752" r="7349" b="7896">Chris</wd>

<space/>

<wd l="7421" t="7757" r="7771" b="7920">Fox,</wd>

<space/>

<wd l="7848" t="7752" r="8136" b="7896">and</wd>

<space/>

<wd l="8203" t="7752" r="8808" b="7896">Shalom</wd>

<space/>

<wd l="8870" t="7752" r="9475" b="7934">Lappin,</wd>

<space/>

<wd l="9557" t="7752" r="10138" b="7920">editors,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10219" t="7752" r="10507" b="7896">The</wd>

<space/>

</run>

</ln>

<ln l="6360" t="7973" r="10502" b="8155" baseLine="8107" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6360" t="7973" r="7200" b="8117">Handbook</wd>

<space/>

<wd l="7286" t="7973" r="7469" b="8155">of</wd>

<space/>

<wd l="7536" t="7973" r="8722" b="8155">Computational</wd>

<space/>

<wd l="8803" t="7978" r="9682" b="8155">Linguistics</wd>

<space/>

<wd l="9768" t="7973" r="10075" b="8117">and</wd>

<space/>

<wd l="10152" t="7978" r="10502" b="8117">Nat-</wd>

</ln>

<ln l="6370" t="8189" r="10507" b="8376" baseLine="8328">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="8189" r="6696" b="8333">ural</wd>

<space/>

<wd l="6773" t="8194" r="7565" b="8371">Language</wd>

<space/>

</run>

<wd l="7651" t="8194" r="8573" b="8371"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Processing</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8669" t="8232" r="9115" b="8376">pages</wd>

<space/>

<wd l="9211" t="8189" r="9941" b="8333">531–573.</wd>

<space/>

<wd l="10037" t="8189" r="10507" b="8376">Wiley</wd>

<space/>

</run>

</ln>

<ln l="6365" t="8410" r="8962" b="8597" baseLine="8544" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="8410" r="7214" b="8578">Blackwell,</wd>

<space/>

<wd l="7277" t="8410" r="8160" b="8578">Chichester,</wd>

<space/>

<wd l="8213" t="8414" r="8544" b="8578">UK,</wd>

<space/>

<wd l="8602" t="8410" r="8962" b="8597">July.</wd>

</ln>

</para>

<para l="6144" t="8808" r="10512" b="9432" alignment="justified" li="216" spaceBefore="183" fli="-216" lsp="exactly" lspExact="217" language="en">

<ln l="6144" t="8808" r="10512" b="8976" baseLine="8947" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8808" r="6701" b="8952">Amber</wd>

<space/>

<wd l="6744" t="8808" r="8131" b="8976">Wilcox-O’Hearn,</wd>

<space/>

<wd l="8184" t="8808" r="8808" b="8952">Graeme</wd>

<space/>

<wd l="8856" t="8808" r="9298" b="8976">Hirst,</wd>

<space/>

<wd l="9355" t="8808" r="9638" b="8952">and</wd>

<space/>

<wd l="9686" t="8808" r="10512" b="8952">Alexander</wd>

<space/>

</ln>

<ln l="6365" t="9029" r="10512" b="9216" baseLine="9163" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="9029" r="7296" b="9216">Budanitsky.</wd>

<space/>

<wd l="7474" t="9029" r="7906" b="9173">2008.</wd>

<space/>

<wd l="8078" t="9029" r="8918" b="9173">Real-word</wd>

<space/>

<wd l="9005" t="9029" r="9624" b="9216">spelling</wd>

<space/>

<wd l="9706" t="9029" r="10512" b="9173">correction</wd>

<space/>

</ln>

<ln l="6365" t="9245" r="10502" b="9432" baseLine="9384" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="9245" r="6720" b="9389">with</wd>

<space/>

<wd l="6835" t="9245" r="7541" b="9432">trigrams:</wd>

<space/>

<wd l="7757" t="9250" r="7901" b="9384">A</wd>

<space/>

<wd l="8021" t="9245" r="9250" b="9389">reconsideration</wd>

<space/>

<wd l="9374" t="9245" r="9547" b="9389">of</wd>

<space/>

<wd l="9658" t="9245" r="9898" b="9389">the</wd>

<space/>

<wd l="10018" t="9250" r="10502" b="9432">Mays,</wd>

</ln>

</para>

<para l="6331" t="9466" r="10517" b="10747" alignment="justified" li="216" lsp="exactly" lspExact="219" language="en">

<tabs position="6331"/>

<ln l="6365" t="9466" r="10512" b="9634" baseLine="9605" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1" forcedEOF="true">

<wd l="6365" t="9470" r="7138" b="9634">Damerau,</wd>

<space/>

<wd l="7315" t="9466" r="7598" b="9610">and</wd>

<space/>

<wd l="7742" t="9470" r="8318" b="9610">Mercer</wd>

<space/>

<wd l="8458" t="9466" r="8995" b="9610">model.</wd>

<tab position="8995"/>

<wd l="9374" t="9470" r="9542" b="9605">In</wd>

<space/>

<wd l="9686" t="9466" r="10512" b="9610">Alexander
</wd>

</ln>

<ln l="6370" t="9686" r="10517" b="9869" baseLine="9821" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6370" t="9686" r="7090" b="9854">Gelbukh,</wd>

<space/>

<wd l="7243" t="9686" r="7742" b="9854">editor,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7901" t="9686" r="9091" b="9869">Computational</wd>

<space/>

<wd l="9206" t="9691" r="10085" b="9869">Linguistics</wd>

<space/>

<wd l="10214" t="9686" r="10517" b="9830">and</wd>

<space/>

</run>

</ln>

<ln l="6360" t="9902" r="10502" b="10085" baseLine="10042" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1" forcedEOF="true">

<wd l="6360" t="9902" r="7186" b="10085">Intelligent</wd>

<space/>

<wd l="7253" t="9907" r="7570" b="10046">Text</wd>

<space/>

<wd l="7622" t="9907" r="8496" b="10085">Processing</wd>

<space/>

<wd l="8568" t="9989" r="8616" b="10003">-</wd>

<space/>

<wd l="8688" t="9902" r="8938" b="10046">9th</wd>

<space/>

<wd l="8995" t="9902" r="10056" b="10046">International</wd>

<space/>

<wd l="10123" t="9907" r="10502" b="10046">Con-</wd>

</ln>

<ln l="6331" t="10123" r="10507" b="10306" baseLine="10258" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1" forcedEOF="true">

<wd l="6331" t="10123" r="6970" b="10306">ference,</wd>

<space/>

<wd l="7109" t="10128" r="7790" b="10306">CICLing</wd>

<space/>

<wd l="7891" t="10123" r="8318" b="10291">2008,</wd>

<space/>

<wd l="8438" t="10123" r="8928" b="10306">Haifa,</wd>

<space/>

<wd l="9053" t="10123" r="9648" b="10291">Isarael,</wd>

<space/>

<wd l="9773" t="10123" r="10507" b="10306">February</wd>

<space/>

</ln>

<ln l="6374" t="10344" r="10502" b="10526" baseLine="10478" forcedEOF="true">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6374" t="10344" r="6893" b="10512">17–23,</wd>

<space/>

<wd l="7042" t="10344" r="7440" b="10488">2008</wd>

<space/>

<wd l="7565" t="10430" r="7613" b="10445">-</wd>

<space/>

</run>

<wd l="7733" t="10344" r="8765" b="10526"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">Proceedings</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="8899" t="10344" r="9494" b="10488">volume</wd>

<space/>

<wd l="9610" t="10344" r="10502" b="10512">4919/2008,</wd>

<space/>

</run>

</ln>

<ln l="6365" t="10560" r="10502" b="10747" baseLine="10699" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1" forcedEOF="true">

<wd l="6365" t="10603" r="6811" b="10747">pages</wd>

<space/>

<wd l="7080" t="10560" r="7810" b="10704">605–616.</wd>

<space/>

<wd l="8088" t="10560" r="8770" b="10747">Springer</wd>

<space/>

<wd l="9024" t="10560" r="10502" b="10747">Berlin/Heidelberg,</wd>

</ln>

</para>

<para l="6365" t="10781" r="10512" b="11405" alignment="left" li="216" lsp="exactly" lspExact="220" language="en">

<tabs position="6365"/>

<ln l="6370" t="10781" r="10512" b="10968" baseLine="10915" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="6370" t="10781" r="7128" b="10968">Germany.</wd>

<tab position="7128"/>

<wd l="7584" t="10781" r="7978" b="10925">2006</wd>

<space/>

<wd l="8150" t="10781" r="8525" b="10925">draft</wd>

<space/>

<wd l="8688" t="10781" r="9274" b="10925">version</wd>

<space/>

<wd l="9442" t="10781" r="10142" b="10925">available</wd>

<space/>

<wd l="10315" t="10824" r="10512" b="10925">on
</wd>

</ln>

<ln l="6365" t="11002" r="10171" b="11189" baseLine="11136" forcedEOF="true">

<wd l="6365" t="11002" r="10171" b="11189">http://ftp.cs.toronto.edu/pub/gh/WilcoxOHearn-</wd>

</ln>

<ln l="6370" t="11218" r="7469" b="11405" baseLine="11357" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="6370" t="11218" r="7469" b="11405">etal-2006.pdf.</wd>

</ln>

</para>

<para l="6144" t="11616" r="10512" b="12240" alignment="justified" li="216" spaceBefore="177" spaceAfter="24" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="11616" r="10502" b="11803" baseLine="11755" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11621" r="6451" b="11760">Yue</wd>

<space/>

<wd l="6523" t="11616" r="7027" b="11803">Zhang</wd>

<space/>

<wd l="7104" t="11616" r="7392" b="11760">and</wd>

<space/>

<wd l="7464" t="11616" r="8098" b="11798">Stephen</wd>

<space/>

<wd l="8170" t="11616" r="8650" b="11760">Clark.</wd>

<space/>

<wd l="8794" t="11616" r="9226" b="11760">2011.</wd>

<space/>

<wd l="9374" t="11616" r="10109" b="11803">Syntactic</wd>

<space/>

<wd l="10181" t="11659" r="10502" b="11798">pro-</wd>

</ln>

<ln l="6370" t="11837" r="10512" b="12024" baseLine="11971" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="11837" r="6946" b="12024">cessing</wd>

<space/>

<wd l="7018" t="11837" r="7445" b="12024">using</wd>

<space/>

<wd l="7512" t="11837" r="7757" b="11981">the</wd>

<space/>

<wd l="7829" t="11837" r="8741" b="12024">generalized</wd>

<space/>

<wd l="8808" t="11856" r="9662" b="12019">perceptron</wd>

<space/>

<wd l="9730" t="11837" r="10013" b="11981">and</wd>

<space/>

<wd l="10080" t="11837" r="10512" b="11981">beam</wd>

<space/>

</ln>

<ln l="6374" t="12058" r="10435" b="12240" baseLine="12192">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="12058" r="6912" b="12202">search.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7003" t="12058" r="8194" b="12240">Computational</wd>

<space/>

</run>

<wd l="8237" t="12062" r="9158" b="12240"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Linguistics</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9221" t="12058" r="10435" b="12235">37(1):105–151.</wd>

</run>

</ln>

</para>

</column>

</section>

<dd l="1423" t="15746" r="10544" b="15975">

<para l="5804" t="15792" r="6143" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5870" t="15792" r="6077" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="43">

<wd l="5870" t="15792" r="6077" b="15946">98</wd>

</ln>

</para>

</dd>

</body>

</page>

</document>

