<?xml version="1.0" encoding="UTF-16"?>

<!--XML document generated using OCR technology from Nuance Communications, Inc.-->

<document xmlns="http://www.scansoft.com/omnipage/xml/ssdoc-schema3.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4315.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1360" marginRight="1385" marginBottom="358" offsetX="-22" offsetY="-12" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1360" r="10524" b="4083">

<column l="1440" t="1360" r="10524" b="4083">

<para l="5155" t="1430" r="6778" b="1646" alignment="centered" spaceBefore="19" lsp="exactly" lspExact="324" language="en">

<ln l="5155" t="1430" r="6778" b="1646" baseLine="1632" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-8">

<wd l="5155" t="1435" r="6778" b="1646">LYSGROUP:</wd>

</ln>

</para>

<para l="2112" t="1742" r="9830" b="2016" alignment="centered" lsp="exactly" lspExact="325" language="en">

<ln l="2112" t="1742" r="9830" b="2016" baseLine="1949" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2112" t="1752" r="3254" b="2016">Adapting</wd>

<space/>

<wd l="3336" t="1814" r="3475" b="1958">a</wd>

<space/>

<wd l="3557" t="1752" r="4512" b="2016">Spanish</wd>

<space/>

<wd l="4594" t="1752" r="5765" b="1958">microtext</wd>

<space/>

<wd l="5842" t="1752" r="7560" b="1958">normalization</wd>

<space/>

<wd l="7637" t="1771" r="8458" b="2016">system</wd>

<space/>

<wd l="8534" t="1771" r="8765" b="1958">to</wd>

<space/>

<wd l="8842" t="1752" r="9830" b="2016">English.</wd>

</ln>

</para>

<para l="1949" t="2414" r="10008" b="3485" alignment="centered" spaceBefore="348" spaceAfter="579" lsp="exactly" lspExact="280" language="en">

<ln l="3302" t="2414" r="8645" b="2640" baseLine="2582" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29" forcedEOF="true">

<wd l="3302" t="2419" r="3840" b="2592">Yerai</wd>

<space/>

<wd l="3902" t="2424" r="4555" b="2630">Doval,</wd>

<space/>

<wd l="4618" t="2414" r="5150" b="2611">Jesús</wd>

<space/>

<wd l="5218" t="2419" r="5990" b="2630">Vilares,</wd>

<space/>

<wd l="6062" t="2419" r="6725" b="2592">Carlos</wd>

<space/>

<wd l="6797" t="2414" r="8645" b="2640">Gómez-Rodriguez
</wd>

</ln>

<ln l="2616" t="2698" r="9322" b="2918" baseLine="2865" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29" forcedEOF="true">

<wd l="2616" t="2702" r="3029" b="2870">LYS</wd>

<space/>

<wd l="3110" t="2755" r="3710" b="2918">group,</wd>

<space/>

<wd l="3782" t="2707" r="5131" b="2918">Departamento</wd>

<space/>

<wd l="5198" t="2702" r="5419" b="2870">de</wd>

<space/>

<wd l="5486" t="2698" r="6816" b="2918">Computación,</wd>

<space/>

<wd l="6888" t="2702" r="7814" b="2870">Facultade</wd>

<space/>

<wd l="7882" t="2702" r="8098" b="2870">de</wd>

<space/>

<wd l="8160" t="2698" r="9322" b="2904">Informática,
</wd>

</ln>

<ln l="2664" t="2976" r="9288" b="3197" baseLine="3143" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29"><wd l="2664" t="2981" r="3926" b="3149">Universidade</wd>

<space/>

<wd l="3994" t="2981" r="4219" b="3149">da</wd>

<space/>

</run>

<wd l="4277" t="2981" r="5026" b="3182"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29">Coruña,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29"><space/>

<wd l="5102" t="2981" r="5875" b="3197">Campus</wd>

<space/>

<wd l="5947" t="2981" r="6168" b="3149">de</wd>

<space/>

</run>

<wd l="6226" t="2976" r="6898" b="3182"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29">Elviña,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29"><space/>

<wd l="6994" t="2976" r="7546" b="3149">15071</wd>

<space/>

<wd l="7690" t="2981" r="7862" b="3144">A</wd>

<space/>

</run>

<wd l="7925" t="2981" r="8674" b="3182"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29">Coruña,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29"><space/>

<wd l="8750" t="2981" r="9288" b="3197">Spain
</wd>

</run>

</ln>

<ln l="1949" t="3240" r="10008" b="3485" baseLine="3422" forcedEOF="true">

<wd l="1949" t="3240" r="3715" b="3485"><run underlined="none" subsuperscript="none" fontSize="1400" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="29">{</run>

<run underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29">yerai.doval,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29"><space/>

<wd l="3950" t="3269" r="5150" b="3470">jvilares,</wd>

<space/>

</run>

<wd l="5371" t="3240" r="7459" b="3485"><run underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29">cgomezr</run>

<run underlined="none" subsuperscript="none" fontSize="1400" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="29">}</run>

<run underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29">@udc.es</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29"><wd l="7541" t="3360" r="7661" b="3374">–</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="29"><wd l="7728" t="3274" r="10008" b="3470">www.grupolys.org</wd>

</run>

</ln>

</para>

</column>

</section>

<section l="1440" t="4083" r="10524" b="15316">

<column l="1440" t="4083" r="5822" b="15316">

<para l="3178" t="4142" r="4070" b="4315" alignment="centered" spaceBefore="12" lsp="exactly" lspExact="266" language="en">

<ln l="3178" t="4142" r="4070" b="4315" baseLine="4306" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3178" t="4142" r="4070" b="4315">Abstract</wd>

</ln>

</para>

<para l="1781" t="4661" r="5467" b="8885" alignment="justified" li="288" ri="360" spaceBefore="240" lsp="exactly" lspExact="271" language="en">

<ln l="1781" t="4661" r="5467" b="4819" baseLine="4814" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="4666" r="1963" b="4814">In</wd>

<space/>

<wd l="2054" t="4661" r="2362" b="4819">this</wd>

<space/>

<wd l="2467" t="4661" r="3010" b="4819">article</wd>

<space/>

<wd l="3106" t="4714" r="3355" b="4819">we</wd>

<space/>

<wd l="3456" t="4661" r="4176" b="4819">describe</wd>

<space/>

<wd l="4272" t="4661" r="4536" b="4819">the</wd>

<space/>

<wd l="4632" t="4661" r="5467" b="4819">microtext</wd>

<space/>

</ln>

<ln l="1781" t="4934" r="5453" b="5136" baseLine="5083" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="4934" r="2995" b="5093">normalization</wd>

<space/>

<wd l="3053" t="4958" r="3648" b="5136">system</wd>

<space/>

<wd l="3696" t="4987" r="3950" b="5093">we</wd>

<space/>

<wd l="3998" t="4934" r="4402" b="5093">have</wd>

<space/>

<wd l="4450" t="4934" r="4853" b="5093">used</wd>

<space/>

<wd l="4901" t="4958" r="5064" b="5093">to</wd>

<space/>

<wd l="5117" t="4987" r="5453" b="5136">par-</wd>

</ln>

<ln l="1781" t="5203" r="5467" b="5405" baseLine="5357" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="5203" r="2424" b="5405">ticipate</wd>

<space/>

<wd l="2467" t="5203" r="2635" b="5357">in</wd>

<space/>

<wd l="2678" t="5203" r="2947" b="5362">the</wd>

<space/>

<wd l="2990" t="5203" r="4253" b="5362">Normalization</wd>

<space/>

<wd l="4301" t="5203" r="4488" b="5362">of</wd>

<space/>

<wd l="4517" t="5203" r="5035" b="5405">Noisy</wd>

<space/>

<wd l="5083" t="5208" r="5467" b="5362">Text</wd>

<space/>

</ln>

<ln l="1781" t="5477" r="5453" b="5678" baseLine="5626" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="5477" r="2189" b="5635">Task</wd>

<space/>

<wd l="2242" t="5477" r="2434" b="5635">of</wd>

<space/>

<wd l="2472" t="5477" r="2736" b="5635">the</wd>

<space/>

<wd l="2789" t="5482" r="3216" b="5635">ACL</wd>

<space/>

<wd l="3269" t="5482" r="3979" b="5635">W-NUT</wd>

<space/>

<wd l="4037" t="5477" r="4454" b="5635">2015</wd>

<space/>

<wd l="4522" t="5477" r="5453" b="5678">Workshop.</wd>

<space/>

</ln>

<ln l="1786" t="5746" r="5462" b="5947" baseLine="5899" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1786" t="5750" r="2122" b="5904">Our</wd>

<space/>

<wd l="2203" t="5746" r="3418" b="5904">normalization</wd>

<space/>

<wd l="3514" t="5770" r="4114" b="5947">system</wd>

<space/>

<wd l="4195" t="5798" r="4522" b="5904">was</wd>

<space/>

<wd l="4622" t="5746" r="5462" b="5947">originally</wd>

<space/>

</ln>

<ln l="1786" t="6019" r="5453" b="6221" baseLine="6168" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1786" t="6019" r="2669" b="6221">developed</wd>

<space/>

<wd l="2741" t="6019" r="3000" b="6178">for</wd>

<space/>

<wd l="3067" t="6043" r="3394" b="6178">text</wd>

<space/>

<wd l="3466" t="6019" r="4080" b="6221">mining</wd>

<space/>

<wd l="4157" t="6019" r="4584" b="6178">tasks</wd>

<space/>

<wd l="4670" t="6072" r="4886" b="6178">on</wd>

<space/>

<wd l="4963" t="6024" r="5453" b="6221">Span-</wd>

</ln>

<ln l="1781" t="6288" r="5453" b="6490" baseLine="6437" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="6288" r="2035" b="6446">ish</wd>

<space/>

<wd l="2102" t="6312" r="2707" b="6446">tweets.</wd>

<space/>

<wd l="2832" t="6293" r="3173" b="6446">Our</wd>

<space/>

<wd l="3235" t="6288" r="3672" b="6446">main</wd>

<space/>

<wd l="3749" t="6288" r="4195" b="6490">goals</wd>

<space/>

<wd l="4277" t="6288" r="4838" b="6490">during</wd>

<space/>

<wd l="4910" t="6288" r="5107" b="6446">its</wd>

<space/>

<wd l="5194" t="6288" r="5453" b="6446">de-</wd>

</ln>

<ln l="1781" t="6562" r="5467" b="6763" baseLine="6710" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="6562" r="2698" b="6763">velopment</wd>

<space/>

<wd l="2760" t="6614" r="3182" b="6720">were</wd>

<space/>

<wd l="3250" t="6562" r="4118" b="6763">flexibility,</wd>

<space/>

<wd l="4200" t="6562" r="5088" b="6763">scalability</wd>

<space/>

<wd l="5155" t="6562" r="5467" b="6720">and</wd>

<space/>

</ln>

<ln l="1781" t="6830" r="5453" b="7032" baseLine="6979" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="6830" r="3130" b="7032">maintainability,</wd>

<space/>

<wd l="3206" t="6830" r="3374" b="6984">in</wd>

<space/>

<wd l="3442" t="6830" r="3898" b="6989">order</wd>

<space/>

<wd l="3955" t="6854" r="4123" b="6989">to</wd>

<space/>

<wd l="4186" t="6854" r="4493" b="6989">test</wd>

<space/>

<wd l="4555" t="6883" r="4651" b="6989">a</wd>

<space/>

<wd l="4709" t="6830" r="5131" b="6989">wide</wd>

<space/>

<wd l="5194" t="6883" r="5453" b="6989">va-</wd>

</ln>

<ln l="1781" t="7099" r="5467" b="7301" baseLine="7253" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="7099" r="2174" b="7301">riety</wd>

<space/>

<wd l="2256" t="7099" r="2448" b="7258">of</wd>

<space/>

<wd l="2510" t="7099" r="3854" b="7301">approximations</wd>

<space/>

<wd l="3931" t="7123" r="4099" b="7258">to</wd>

<space/>

<wd l="4171" t="7099" r="4440" b="7258">the</wd>

<space/>

<wd l="4512" t="7099" r="5242" b="7301">problem</wd>

<space/>

<wd l="5314" t="7123" r="5467" b="7258">at</wd>

<space/>

</ln>

<ln l="1781" t="7373" r="5462" b="7574" baseLine="7522" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="7373" r="2208" b="7531">hand</wd>

<space/>

<wd l="2285" t="7373" r="2674" b="7531">with</wd>

<space/>

<wd l="2755" t="7373" r="3605" b="7531">minimum</wd>

<space/>

<wd l="3686" t="7373" r="4205" b="7531">effort.</wd>

<space/>

<wd l="4363" t="7378" r="4646" b="7531">We</wd>

<space/>

<wd l="4728" t="7373" r="5059" b="7531">will</wd>

<space/>

<wd l="5150" t="7426" r="5462" b="7574">pay</wd>

<space/>

</ln>

<ln l="1790" t="7642" r="5462" b="7843" baseLine="7795" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1790" t="7642" r="2381" b="7843">special</wd>

<space/>

<wd l="2438" t="7642" r="3202" b="7800">attention</wd>

<space/>

<wd l="3245" t="7666" r="3413" b="7800">to</wd>

<space/>

<wd l="3466" t="7642" r="3730" b="7800">the</wd>

<space/>

<wd l="3782" t="7694" r="4426" b="7843">process</wd>

<space/>

<wd l="4488" t="7642" r="4680" b="7800">of</wd>

<space/>

<wd l="4718" t="7642" r="5462" b="7843">adapting</wd>

<space/>

</ln>

<ln l="1781" t="7915" r="5467" b="8117" baseLine="8064" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="7915" r="2045" b="8074">the</wd>

<space/>

<wd l="2102" t="7939" r="3144" b="8117">components</wd>

<space/>

<wd l="3211" t="7915" r="3403" b="8074">of</wd>

<space/>

<wd l="3442" t="7968" r="3734" b="8074">our</wd>

<space/>

<wd l="3792" t="7939" r="4392" b="8117">system</wd>

<space/>

<wd l="4440" t="7939" r="4608" b="8074">to</wd>

<space/>

<wd l="4666" t="7915" r="5021" b="8074">deal</wd>

<space/>

<wd l="5078" t="7915" r="5467" b="8074">with</wd>

<space/>

</ln>

<ln l="1781" t="8184" r="5453" b="8386" baseLine="8338" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="8184" r="2448" b="8386">English</wd>

<space/>

<wd l="2544" t="8208" r="3096" b="8342">tweets</wd>

<space/>

<wd l="3202" t="8184" r="3778" b="8371">which,</wd>

<space/>

<wd l="3902" t="8237" r="4070" b="8342">as</wd>

<space/>

<wd l="4181" t="8237" r="4430" b="8342">we</wd>

<space/>

<wd l="4531" t="8184" r="4862" b="8342">will</wd>

<space/>

<wd l="4978" t="8184" r="5453" b="8371">show,</wd>

<space/>

</ln>

<ln l="1781" t="8458" r="5458" b="8659" baseLine="8606" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1781" t="8510" r="2107" b="8616">was</wd>

<space/>

<wd l="2174" t="8458" r="2938" b="8616">achieved</wd>

<space/>

<wd l="2990" t="8458" r="3662" b="8616">without</wd>

<space/>

<wd l="3715" t="8458" r="4229" b="8659">major</wd>

<space/>

<wd l="4277" t="8458" r="5458" b="8616">modifications</wd>

<space/>

</ln>

<ln l="1786" t="8726" r="3528" b="8885" baseLine="8880" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1786" t="8726" r="1978" b="8885">of</wd>

<space/>

<wd l="2016" t="8726" r="2213" b="8885">its</wd>

<space/>

<wd l="2275" t="8726" r="2664" b="8885">base</wd>

<space/>

<wd l="2731" t="8750" r="3528" b="8885">structure.</wd>

</ln>

</para>

<para l="1454" t="9226" r="3091" b="9398" alignment="left" spaceBefore="246" lsp="exactly" lspExact="266" language="en">

<ln l="1454" t="9226" r="3091" b="9398" baseLine="9394" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="1454" t="9226" r="1550" b="9394">1</wd>

<space/>

<wd l="1805" t="9226" r="3091" b="9398">Introduction</wd>

</ln>

</para>

<para l="1440" t="9677" r="5818" b="11237" alignment="justified" spaceBefore="168" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="9677" r="5794" b="9878" baseLine="9830">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1440" t="9677" r="1781" b="9835">The</wd>

<space/>

<wd l="1834" t="9677" r="2304" b="9835">value</wd>

<space/>

<wd l="2366" t="9677" r="2554" b="9835">of</wd>

<space/>

<wd l="2597" t="9677" r="3226" b="9835">Twitter</wd>

<space/>

<wd l="3283" t="9677" r="3595" b="9835">and</wd>

<space/>

<wd l="3658" t="9677" r="4104" b="9835">other</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="4157" t="9677" r="5424" b="9878">microblogging</wd>

<space/>

</run>

<wd l="5491" t="9730" r="5794" b="9835" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">ser-</wd>

</ln>

<ln l="1440" t="9950" r="5794" b="10109" baseLine="10099" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="9950" r="1882" b="10109">vices</wd>

<space/>

<wd l="1954" t="10003" r="2122" b="10109">as</wd>

<space/>

<wd l="2189" t="9950" r="3221" b="10109">information</wd>

<space/>

<wd l="3283" t="10003" r="3922" b="10109">sources</wd>

<space/>

<wd l="3989" t="9950" r="4162" b="10104">in</wd>

<space/>

<wd l="4219" t="9950" r="4949" b="10109">domains</wd>

<space/>

<wd l="5016" t="9950" r="5338" b="10109">like</wd>

<space/>

<wd l="5400" t="10003" r="5794" b="10109">mar-</wd>

</ln>

<ln l="1440" t="10219" r="5798" b="10421" baseLine="10373" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10219" r="2026" b="10421">keting,</wd>

<space/>

<wd l="2131" t="10219" r="2856" b="10378">business</wd>

<space/>

<wd l="2947" t="10219" r="4013" b="10421">intelligence,</wd>

<space/>

<wd l="4094" t="10219" r="5088" b="10421">journalism,</wd>

<space/>

<wd l="5198" t="10243" r="5491" b="10378">etc.</wd>

<space/>

<wd l="5659" t="10219" r="5798" b="10378">is</wd>

<space/>

</ln>

<ln l="1445" t="10493" r="5818" b="10694" baseLine="10642" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="10493" r="2122" b="10651">obvious</wd>

<space/>

<wd l="2189" t="10493" r="3101" b="10694">nowadays.</wd>

<space/>

<wd l="3206" t="10493" r="4368" b="10680">Nevertheless,</wd>

<space/>

<wd l="4454" t="10493" r="4843" b="10651">such</wd>

<space/>

<wd l="4910" t="10517" r="5563" b="10651">amount</wd>

<space/>

<wd l="5630" t="10493" r="5818" b="10651">of</wd>

<space/>

</ln>

<ln l="1440" t="10762" r="5808" b="10963" baseLine="10915" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10762" r="2472" b="10920">information</wd>

<space/>

<wd l="2568" t="10814" r="2861" b="10920">can</wd>

<space/>

<wd l="2966" t="10762" r="3346" b="10963">only</wd>

<space/>

<wd l="3442" t="10762" r="3648" b="10920">be</wd>

<space/>

<wd l="3744" t="10762" r="4901" b="10963">appropriately</wd>

<space/>

<wd l="5002" t="10762" r="5808" b="10963">exploited</wd>

<space/>

</ln>

<ln l="1440" t="11035" r="4176" b="11237" baseLine="11184">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1440" t="11035" r="2122" b="11237">through</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2179" t="11069" r="2491" b="11194">text</wd>

<space/>

<wd l="2539" t="11045" r="3139" b="11237">mining</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="3197" t="11035" r="4176" b="11237">techniques.</wd>

</run>

</ln>

</para>

<para l="1440" t="11314" r="5818" b="15307" alignment="justified" spaceBefore="8" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="1656" t="11314" r="5808" b="11501" baseLine="11462" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1656" t="11318" r="2477" b="11501">However,</wd>

<space/>

<wd l="2544" t="11314" r="2981" b="11472">there</wd>

<space/>

<wd l="3043" t="11366" r="3302" b="11472">are</wd>

<space/>

<wd l="3360" t="11314" r="4003" b="11472">notable</wd>

<space/>

<wd l="4066" t="11314" r="5016" b="11472">differences</wd>

<space/>

<wd l="5078" t="11314" r="5808" b="11472">between</wd>

<space/>

</ln>

<ln l="1445" t="11582" r="5808" b="11784" baseLine="11736">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1445" t="11582" r="2366" b="11741">“standard”</wd>

<space/>

<wd l="2419" t="11582" r="3206" b="11784">language</wd>

<space/>

<wd l="3259" t="11582" r="3571" b="11741">and</wd>

<space/>

<wd l="3619" t="11582" r="3883" b="11741">the</wd>

<space/>

<wd l="3941" t="11582" r="4723" b="11741">so-called</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="4771" t="11592" r="5352" b="11784">texting</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="5405" t="11582" r="5808" b="11741">used</wd>

<space/>

</run>

</ln>

<ln l="1440" t="11856" r="5798" b="12058" baseLine="12005">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1440" t="11856" r="1613" b="12010">in</wd>

<space/>

<wd l="1680" t="11856" r="2141" b="12014">those</wd>

<space/>

</run>

<wd l="2213" t="11866" r="3149" b="12014"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">microtexts</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="3274" t="11861" r="3461" b="12010">In</wd>

<space/>

<wd l="3528" t="11856" r="3835" b="12014">this</wd>

<space/>

<wd l="3912" t="11856" r="4301" b="12014">kind</wd>

<space/>

<wd l="4378" t="11856" r="4570" b="12014">of</wd>

<space/>

<wd l="4622" t="11856" r="5381" b="12058">writings,</wd>

<space/>

<wd l="5467" t="11856" r="5592" b="12014">it</wd>

<space/>

<wd l="5659" t="11856" r="5798" b="12014">is</wd>

<space/>

</run>

</ln>

<ln l="1440" t="12125" r="5808" b="12326" baseLine="12278" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="12125" r="2290" b="12326">important</wd>

<space/>

<wd l="2342" t="12149" r="2506" b="12283">to</wd>

<space/>

<wd l="2563" t="12125" r="3144" b="12283">reduce</wd>

<space/>

<wd l="3197" t="12125" r="3461" b="12283">the</wd>

<space/>

<wd l="3514" t="12125" r="4186" b="12283">number</wd>

<space/>

<wd l="4238" t="12125" r="4430" b="12283">of</wd>

<space/>

<wd l="4474" t="12125" r="5347" b="12283">characters</wd>

<space/>

<wd l="5405" t="12125" r="5808" b="12283">used</wd>

<space/>

</ln>

<ln l="1440" t="12398" r="5803" b="12600" baseLine="12547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="12422" r="1608" b="12557">to</wd>

<space/>

<wd l="1709" t="12398" r="1891" b="12557">fit</wd>

<space/>

<wd l="1982" t="12398" r="2386" b="12557">their</wd>

<space/>

<wd l="2477" t="12398" r="3024" b="12600">length</wd>

<space/>

<wd l="3120" t="12398" r="4080" b="12557">restrictions</wd>

<space/>

<wd l="4181" t="12398" r="4666" b="12557">while</wd>

<space/>

<wd l="4762" t="12398" r="5803" b="12600">maintaining</wd>

<space/>

</ln>

<ln l="1440" t="12667" r="5803" b="12869" baseLine="12816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="12667" r="1704" b="12826">the</wd>

<space/>

<wd l="1771" t="12667" r="2698" b="12869">readability</wd>

<space/>

<wd l="2770" t="12667" r="2962" b="12826">of</wd>

<space/>

<wd l="3010" t="12667" r="3278" b="12826">the</wd>

<space/>

<wd l="3341" t="12720" r="4080" b="12869">message</wd>

<space/>

<wd l="4142" t="12691" r="4310" b="12826">to</wd>

<space/>

<wd l="4387" t="12720" r="4838" b="12826">some</wd>

<space/>

<wd l="4906" t="12691" r="5477" b="12826">extent.</wd>

<space/>

<wd l="5582" t="12672" r="5803" b="12826">To</wd>

<space/>

</ln>

<ln l="1445" t="12941" r="5803" b="13142" baseLine="13090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="12941" r="2098" b="13099">achieve</wd>

<space/>

<wd l="2174" t="12941" r="2534" b="13128">this,</wd>

<space/>

<wd l="2630" t="12965" r="3053" b="13099">most</wd>

<space/>

<wd l="3134" t="12941" r="3326" b="13099">of</wd>

<space/>

<wd l="3389" t="12941" r="3658" b="13099">the</wd>

<space/>

<wd l="3734" t="12941" r="4661" b="13142">techniques</wd>

<space/>

<wd l="4752" t="12941" r="5390" b="13142">applied</wd>

<space/>

<wd l="5467" t="12941" r="5803" b="13142">rely</wd>

<space/>

</ln>

<ln l="1445" t="13210" r="5803" b="13411" baseLine="13358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="13262" r="1661" b="13368">on</wd>

<space/>

<wd l="1709" t="13210" r="2592" b="13411">phonetics,</wd>

<space/>

<wd l="2654" t="13210" r="3010" b="13368">thus</wd>

<space/>

<wd l="3072" t="13210" r="3552" b="13411">being</wd>

<space/>

<wd l="3610" t="13210" r="5131" b="13411">language-specific</wd>

<space/>

<wd l="5198" t="13214" r="5803" b="13411">(López</wd>

<space/>

</ln>

<ln l="1440" t="13478" r="5803" b="13680" baseLine="13632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="13483" r="1834" b="13666">Rúa,</wd>

<space/>

<wd l="1930" t="13483" r="2477" b="13675">2007).</wd>

<space/>

<wd l="2611" t="13483" r="2918" b="13637">For</wd>

<space/>

<wd l="2990" t="13478" r="3768" b="13680">example:</wd>

<space/>

<wd l="3888" t="13478" r="4987" b="13680">intentionally</wd>

<space/>

<wd l="5064" t="13478" r="5803" b="13680">ignoring</wd>

<space/>

</ln>

<ln l="1445" t="13752" r="5808" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="13752" r="2549" b="13954">orthographic</wd>

<space/>

<wd l="2602" t="13752" r="2914" b="13910">and</wd>

<space/>

<wd l="2957" t="13805" r="3744" b="13954">grammar</wd>

<space/>

<wd l="3782" t="13752" r="4253" b="13939">rules,</wd>

<space/>

<wd l="4310" t="13805" r="4478" b="13910">as</wd>

<space/>

<wd l="4531" t="13752" r="4704" b="13906">in</wd>

<space/>

<wd l="4747" t="13752" r="5045" b="13910">“be</wd>

<space/>

<wd l="5088" t="13752" r="5506" b="13910">like”</wd>

<space/>

<wd l="5549" t="13752" r="5808" b="13910">for</wd>

<space/>

</ln>

<ln l="1445" t="14021" r="5808" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="14021" r="3216" b="14179">“am/is/are/was/were</wd>

<space/>

<wd l="3302" t="14021" r="3720" b="14179">like”</wd>

<space/>

<wd l="3811" t="14021" r="3979" b="14174">in</wd>

<space/>

<wd l="4061" t="14021" r="4330" b="14179">the</wd>

<space/>

<wd l="4416" t="14074" r="4790" b="14179">case</wd>

<space/>

<wd l="4877" t="14021" r="5069" b="14179">of</wd>

<space/>

<wd l="5141" t="14021" r="5808" b="14222">English</wd>

<space/>

</ln>

<ln l="1445" t="14294" r="5794" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="14347" r="1627" b="14453">or</wd>

<space/>

<wd l="1704" t="14294" r="2443" b="14496">“asique”</wd>

<space/>

<wd l="2525" t="14294" r="2784" b="14453">for</wd>

<space/>

<wd l="2861" t="14299" r="3677" b="14496">“así que”</wd>

<space/>

<wd l="3758" t="14294" r="3926" b="14448">in</wd>

<space/>

<wd l="4003" t="14294" r="4267" b="14453">the</wd>

<space/>

<wd l="4349" t="14347" r="4718" b="14453">case</wd>

<space/>

<wd l="4800" t="14294" r="4992" b="14453">of</wd>

<space/>

<wd l="5059" t="14294" r="5794" b="14496">Spanish;</wd>

<space/>

</ln>

<ln l="1440" t="14563" r="5794" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="14563" r="1704" b="14722">the</wd>

<space/>

<wd l="1776" t="14616" r="2270" b="14765">usage</wd>

<space/>

<wd l="2347" t="14563" r="2539" b="14722">of</wd>

<space/>

<wd l="2602" t="14563" r="3643" b="14765">shortenings,</wd>

<space/>

<wd l="3734" t="14563" r="4786" b="14722">contractions</wd>

<space/>

<wd l="4867" t="14563" r="5179" b="14722">and</wd>

<space/>

<wd l="5251" t="14563" r="5794" b="14722">abbre-</wd>

</ln>

<ln l="1440" t="14837" r="5808" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="14837" r="2122" b="14995">viations</wd>

<space/>

<wd l="2203" t="14837" r="2592" b="14995">such</wd>

<space/>

<wd l="2659" t="14890" r="2827" b="14995">as</wd>

<space/>

<wd l="2904" t="14842" r="3086" b="14995">“c</wd>

<space/>

<wd l="3154" t="14842" r="3355" b="14995">u”</wd>

<space/>

<wd l="3422" t="14837" r="3682" b="14995">for</wd>

<space/>

<wd l="3744" t="14842" r="4114" b="14995">“see</wd>

<space/>

<wd l="4176" t="14842" r="4594" b="15038">you”</wd>

<space/>

<wd l="4661" t="14837" r="4834" b="14990">in</wd>

<space/>

<wd l="4896" t="14837" r="5563" b="15038">English</wd>

<space/>

<wd l="5630" t="14890" r="5808" b="14995">or</wd>

<space/>

</ln>

<ln l="1445" t="15106" r="5818" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="15106" r="1920" b="15264">“ksa”</wd>

<space/>

<wd l="1978" t="15106" r="2237" b="15264">for</wd>

<space/>

<wd l="2290" t="15110" r="2846" b="15264">“casa”</wd>

<space/>

<wd l="2904" t="15106" r="3077" b="15259">in</wd>

<space/>

<wd l="3130" t="15106" r="3864" b="15307">Spanish;</wd>

<space/>

<wd l="3936" t="15158" r="4118" b="15264">or</wd>

<space/>

<wd l="4166" t="15106" r="4430" b="15264">the</wd>

<space/>

<wd l="4488" t="15106" r="5573" b="15307">employment</wd>

<space/>

<wd l="5630" t="15106" r="5818" b="15264">of</wd>

<space/>

</ln>

</para>

</column>

<column l="6142" t="4083" r="10524" b="15316">

<para l="6144" t="4157" r="10512" b="4896" alignment="justified" spaceBefore="11" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="4157" r="10502" b="4358" baseLine="4306">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="4157" r="6778" b="4358">smileys</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6826" t="4181" r="6994" b="4315">to</wd>

<space/>

<wd l="7046" t="4210" r="7685" b="4358">express</wd>

<space/>

<wd l="7742" t="4157" r="8578" b="4344">emotions,</wd>

<space/>

<wd l="8640" t="4157" r="8894" b="4315">for</wd>

<space/>

<wd l="8938" t="4157" r="9653" b="4315">instance</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9744" t="4176" r="9898" b="4339">:)</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10022" t="4181" r="10186" b="4315">to</wd>

<space/>

<wd l="10238" t="4210" r="10502" b="4315">ex-</wd>

</run>

</ln>

<ln l="6144" t="4426" r="10512" b="4627" baseLine="4579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4478" r="6586" b="4627">press</wd>

<space/>

<wd l="6662" t="4426" r="7565" b="4627">happiness.</wd>

<space/>

<wd l="7685" t="4426" r="8203" b="4584">These</wd>

<space/>

<wd l="8270" t="4426" r="9034" b="4627">resulting</wd>

<space/>

<wd l="9106" t="4450" r="9581" b="4584">terms</wd>

<space/>

<wd l="9662" t="4478" r="9922" b="4584">are</wd>

<space/>

<wd l="9994" t="4426" r="10512" b="4584">called</wd>

<space/>

</ln>

<ln l="6149" t="4699" r="9125" b="4896" baseLine="4848">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="4699" r="6725" b="4858">lexical</wd>

<space/>

<wd l="6778" t="4709" r="7488" b="4858">variants</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7555" t="4704" r="7978" b="4896">(Han</wd>

<space/>

<wd l="8045" t="4723" r="8198" b="4858">et</wd>

<space/>

<wd l="8256" t="4699" r="8506" b="4886">al.,</wd>

<space/>

<wd l="8578" t="4704" r="9125" b="4896">2013).</wd>

</run>

</ln>

</para>

<para l="6144" t="4982" r="10512" b="7349" alignment="justified" spaceBefore="12" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="4982" r="10507" b="5184" baseLine="5131" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="4982" r="6701" b="5141">The</wd>

<space/>

<wd l="6806" t="4982" r="7536" b="5184">problem</wd>

<space/>

<wd l="7637" t="4982" r="7771" b="5141">is</wd>

<space/>

<wd l="7886" t="4982" r="8256" b="5170">that,</wd>

<space/>

<wd l="8381" t="4982" r="8554" b="5136">in</wd>

<space/>

<wd l="8659" t="4982" r="9341" b="5184">general,</wd>

<space/>

<wd l="9466" t="5006" r="9792" b="5141">text</wd>

<space/>

<wd l="9893" t="4982" r="10507" b="5184">mining</wd>

<space/>

</ln>

<ln l="6144" t="5251" r="10502" b="5453" baseLine="5405" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5251" r="6562" b="5410">tools</wd>

<space/>

<wd l="6667" t="5304" r="6931" b="5410">are</wd>

<space/>

<wd l="7022" t="5304" r="7402" b="5453">very</wd>

<space/>

<wd l="7512" t="5251" r="8256" b="5410">sensitive</wd>

<space/>

<wd l="8347" t="5275" r="8515" b="5410">to</wd>

<space/>

<wd l="8611" t="5251" r="9072" b="5410">those</wd>

<space/>

<wd l="9168" t="5251" r="10214" b="5453">phenomena,</wd>

<space/>

<wd l="10334" t="5304" r="10502" b="5410">as</wd>

<space/>

</ln>

<ln l="6144" t="5525" r="10498" b="5726" baseLine="5674" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5525" r="6514" b="5726">they</wd>

<space/>

<wd l="6590" t="5578" r="6850" b="5683">are</wd>

<space/>

<wd l="6922" t="5525" r="7694" b="5726">designed</wd>

<space/>

<wd l="7757" t="5525" r="8016" b="5683">for</wd>

<space/>

<wd l="8083" t="5525" r="8717" b="5726">dealing</wd>

<space/>

<wd l="8789" t="5525" r="9178" b="5683">with</wd>

<space/>

<wd l="9250" t="5525" r="9984" b="5683">standard</wd>

<space/>

<wd l="10046" t="5549" r="10498" b="5683">texts.</wd>

<space/>

</ln>

<ln l="6144" t="5794" r="10502" b="5995" baseLine="5947">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="5794" r="7051" b="5981">Therefore,</wd>

<space/>

<wd l="7123" t="5794" r="7248" b="5952">it</wd>

<space/>

<wd l="7306" t="5794" r="7445" b="5952">is</wd>

<space/>

<wd l="7517" t="5846" r="8362" b="5995">necessary</wd>

<space/>

<wd l="8424" t="5818" r="8592" b="5952">to</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="8659" t="5794" r="9523" b="5966">normalize</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="9590" t="5794" r="10037" b="5952">these</wd>

<space/>

<wd l="10104" t="5818" r="10502" b="5952">texts</wd>

<space/>

</run>

</ln>

<ln l="6144" t="6067" r="10512" b="6269" baseLine="6216" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6067" r="6701" b="6226">before</wd>

<space/>

<wd l="6763" t="6067" r="7171" b="6226">their</wd>

<space/>

<wd l="7229" t="6067" r="8203" b="6269">processing,</wd>

<space/>

<wd l="8280" t="6067" r="8606" b="6226">that</wd>

<space/>

<wd l="8669" t="6067" r="8856" b="6254">is,</wd>

<space/>

<wd l="8933" t="6091" r="9101" b="6226">to</wd>

<space/>

<wd l="9163" t="6067" r="10018" b="6226">transform</wd>

<space/>

<wd l="10075" t="6067" r="10512" b="6226">them</wd>

<space/>

</ln>

<ln l="6144" t="6336" r="10498" b="6538" baseLine="6490" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6336" r="6480" b="6494">into</wd>

<space/>

<wd l="6557" t="6336" r="7286" b="6494">standard</wd>

<space/>

<wd l="7344" t="6336" r="8174" b="6538">language.</wd>

<space/>

<wd l="8270" t="6336" r="8650" b="6494">This</wd>

<space/>

<wd l="8717" t="6389" r="9077" b="6538">way</wd>

<space/>

<wd l="9144" t="6341" r="9326" b="6494">“c</wd>

<space/>

<wd l="9394" t="6389" r="9499" b="6494">u</wd>

<space/>

<wd l="9562" t="6360" r="9840" b="6494">nxt</wd>

<space/>

<wd l="9898" t="6336" r="10498" b="6523">week”,</wd>

<space/>

</ln>

<ln l="6144" t="6610" r="10507" b="6811" baseLine="6758" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6610" r="6403" b="6768">for</wd>

<space/>

<wd l="6470" t="6610" r="7248" b="6811">example,</wd>

<space/>

<wd l="7330" t="6610" r="7872" b="6768">would</wd>

<space/>

<wd l="7939" t="6610" r="8146" b="6768">be</wd>

<space/>

<wd l="8213" t="6610" r="9269" b="6768">transformed</wd>

<space/>

<wd l="9336" t="6610" r="9672" b="6768">into</wd>

<space/>

<wd l="9744" t="6614" r="10114" b="6768">“see</wd>

<space/>

<wd l="10186" t="6662" r="10507" b="6811">you</wd>

<space/>

</ln>

<ln l="6144" t="6878" r="10498" b="7080" baseLine="7032" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6902" r="6518" b="7037">next</wd>

<space/>

<wd l="6581" t="6878" r="7181" b="7037">week”.</wd>

<space/>

<wd l="7291" t="6878" r="7670" b="7037">This</wd>

<space/>

<wd l="7742" t="6878" r="7877" b="7037">is</wd>

<space/>

<wd l="7954" t="6878" r="8218" b="7037">the</wd>

<space/>

<wd l="8285" t="6878" r="8654" b="7080">goal</wd>

<space/>

<wd l="8726" t="6878" r="8918" b="7037">of</wd>

<space/>

<wd l="8966" t="6878" r="9235" b="7037">the</wd>

<space/>

<wd l="9298" t="6883" r="10008" b="7037">W-NUT</wd>

<space/>

<wd l="10080" t="6878" r="10498" b="7037">2015</wd>

<space/>

</ln>

<ln l="6144" t="7152" r="9874" b="7349" baseLine="7301" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7152" r="7406" b="7310">Normalization</wd>

<space/>

<wd l="7459" t="7152" r="7867" b="7310">Task</wd>

<space/>

<wd l="7930" t="7152" r="8736" b="7349">(Baldwin</wd>

<space/>

<wd l="8794" t="7176" r="8947" b="7310">et</wd>

<space/>

<wd l="9005" t="7152" r="9254" b="7339">al.,</wd>

<space/>

<wd l="9326" t="7152" r="9874" b="7349">2015).</wd>

</ln>

</para>

<para l="6144" t="7435" r="10517" b="9533" alignment="justified" spaceBefore="11" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="7435" r="10493" b="7637" baseLine="7584" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="7435" r="6701" b="7594">The</wd>

<space/>

<wd l="6782" t="7459" r="7099" b="7594">rest</wd>

<space/>

<wd l="7176" t="7435" r="7368" b="7594">of</wd>

<space/>

<wd l="7430" t="7435" r="7738" b="7594">this</wd>

<space/>

<wd l="7824" t="7488" r="8314" b="7637">paper</wd>

<space/>

<wd l="8386" t="7435" r="8525" b="7594">is</wd>

<space/>

<wd l="8616" t="7435" r="9466" b="7637">organized</wd>

<space/>

<wd l="9547" t="7488" r="9715" b="7594">as</wd>

<space/>

<wd l="9802" t="7435" r="10493" b="7594">follows:</wd>

<space/>

</ln>

<ln l="6149" t="7704" r="10517" b="7862" baseLine="7858" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="7704" r="6802" b="7862">Section</wd>

<space/>

<wd l="6898" t="7709" r="6998" b="7858">2</wd>

<space/>

<wd l="7099" t="7704" r="7896" b="7862">describes</wd>

<space/>

<wd l="7997" t="7704" r="8266" b="7862">the</wd>

<space/>

<wd l="8362" t="7757" r="8731" b="7862">core</wd>

<space/>

<wd l="8827" t="7704" r="9854" b="7862">architecture</wd>

<space/>

<wd l="9950" t="7704" r="10142" b="7862">of</wd>

<space/>

<wd l="10224" t="7757" r="10517" b="7862">our</wd>

<space/>

</ln>

<ln l="6154" t="7978" r="10512" b="8179" baseLine="8126" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="8002" r="6797" b="8179">system,</wd>

<space/>

<wd l="6888" t="7978" r="7200" b="8136">and</wd>

<space/>

<wd l="7267" t="7978" r="7637" b="8136">how</wd>

<space/>

<wd l="7709" t="7978" r="7834" b="8136">it</wd>

<space/>

<wd l="7901" t="8030" r="8232" b="8136">was</wd>

<space/>

<wd l="8314" t="7978" r="8990" b="8179">adapted</wd>

<space/>

<wd l="9062" t="8002" r="9226" b="8136">to</wd>

<space/>

<wd l="9307" t="7978" r="9485" b="8136">fit</wd>

<space/>

<wd l="9557" t="7978" r="9864" b="8136">this</wd>

<space/>

<wd l="9950" t="7978" r="10512" b="8136">shared</wd>

<space/>

</ln>

<ln l="6144" t="8246" r="10498" b="8448" baseLine="8395" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8246" r="6542" b="8434">task,</wd>

<space/>

<wd l="6653" t="8246" r="6965" b="8405">and</wd>

<space/>

<wd l="7056" t="8246" r="7704" b="8405">Section</wd>

<space/>

<wd l="7795" t="8251" r="7886" b="8405">3</wd>

<space/>

<wd l="7987" t="8270" r="8698" b="8448">presents</wd>

<space/>

<wd l="8789" t="8246" r="9058" b="8405">the</wd>

<space/>

<wd l="9144" t="8299" r="9960" b="8405">resources</wd>

<space/>

<wd l="10056" t="8246" r="10498" b="8405">used.</wd>

<space/>

</ln>

<ln l="6144" t="8520" r="10502" b="8722" baseLine="8669" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8525" r="6610" b="8707">Next,</wd>

<space/>

<wd l="6672" t="8520" r="7325" b="8678">Section</wd>

<space/>

<wd l="7368" t="8525" r="7474" b="8674">4</wd>

<space/>

<wd l="7531" t="8520" r="8318" b="8678">evaluates</wd>

<space/>

<wd l="8371" t="8520" r="8640" b="8678">the</wd>

<space/>

<wd l="8693" t="8544" r="9293" b="8722">system</wd>

<space/>

<wd l="9341" t="8520" r="9653" b="8678">and</wd>

<space/>

<wd l="9706" t="8520" r="10502" b="8678">discusses</wd>

<space/>

</ln>

<ln l="6144" t="8789" r="10502" b="8990" baseLine="8938" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8789" r="6413" b="8947">the</wd>

<space/>

<wd l="6494" t="8789" r="7056" b="8947">results</wd>

<space/>

<wd l="7157" t="8789" r="7944" b="8947">obtained.</wd>

<space/>

<wd l="8112" t="8789" r="8760" b="8990">Finally,</wd>

<space/>

<wd l="8870" t="8789" r="9518" b="8947">Section</wd>

<space/>

<wd l="9610" t="8789" r="9701" b="8947">5</wd>

<space/>

<wd l="9797" t="8813" r="10502" b="8990">presents</wd>

<space/>

</ln>

<ln l="6149" t="9058" r="10502" b="9259" baseLine="9211" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="9110" r="6442" b="9216">our</wd>

<space/>

<wd l="6518" t="9058" r="7536" b="9216">conclusions</wd>

<space/>

<wd l="7632" t="9058" r="7939" b="9216">and</wd>

<space/>

<wd l="8026" t="9058" r="8837" b="9216">considers</wd>

<space/>

<wd l="8933" t="9110" r="9384" b="9216">some</wd>

<space/>

<wd l="9461" t="9058" r="10176" b="9259">possible</wd>

<space/>

<wd l="10258" t="9058" r="10502" b="9216">fu-</wd>

</ln>

<ln l="6144" t="9331" r="9139" b="9533" baseLine="9480" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9355" r="6485" b="9490">ture</wd>

<space/>

<wd l="6538" t="9331" r="7771" b="9533">improvements</wd>

<space/>

<wd l="7834" t="9331" r="8093" b="9490">for</wd>

<space/>

<wd l="8150" t="9384" r="8438" b="9490">our</wd>

<space/>

<wd l="8501" t="9355" r="9139" b="9533">system.</wd>

</ln>

</para>

<para l="6144" t="9835" r="7790" b="10008" alignment="left" spaceBefore="250" lsp="exactly" lspExact="266" language="en">

<ln l="6144" t="9835" r="7790" b="10008" baseLine="9998" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="6144" t="9835" r="6259" b="10003">2</wd>

<space/>

<wd l="6504" t="9835" r="7790" b="10008">Architecture</wd>

</ln>

</para>

<para l="6144" t="10301" r="10512" b="13210" alignment="justified" spaceBefore="185" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="10301" r="10512" b="10502" baseLine="10450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="10306" r="6490" b="10459">Our</wd>

<space/>

<wd l="6586" t="10325" r="7061" b="10459">tweet</wd>

<space/>

<wd l="7162" t="10301" r="8376" b="10459">normalization</wd>

<space/>

<wd l="8486" t="10325" r="9086" b="10502">system</wd>

<space/>

<wd l="9182" t="10354" r="9514" b="10459">was</wd>

<space/>

<wd l="9629" t="10301" r="10512" b="10502">developed</wd>

<space/>

</ln>

<ln l="6144" t="10570" r="10502" b="10771" baseLine="10718" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10570" r="6686" b="10771">taking</wd>

<space/>

<wd l="6792" t="10622" r="6960" b="10728">as</wd>

<space/>

<wd l="7066" t="10570" r="7507" b="10728">basic</wd>

<space/>

<wd l="7608" t="10570" r="8376" b="10771">premises</wd>

<space/>

<wd l="8477" t="10570" r="8678" b="10728">its</wd>

<space/>

<wd l="8784" t="10570" r="9653" b="10771">flexibility,</wd>

<space/>

<wd l="9782" t="10570" r="10502" b="10728">scalabil-</wd>

</ln>

<ln l="6144" t="10843" r="10512" b="11045" baseLine="10992" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10843" r="6374" b="11045">ity</wd>

<space/>

<wd l="6470" t="10843" r="6782" b="11002">and</wd>

<space/>

<wd l="6869" t="10843" r="8218" b="11045">maintainability.</wd>

<space/>

<wd l="8400" t="10848" r="8630" b="11002">As</wd>

<space/>

<wd l="8731" t="10896" r="8827" b="11002">a</wd>

<space/>

<wd l="8923" t="10843" r="9566" b="11045">starting</wd>

<space/>

<wd l="9658" t="10843" r="10147" b="11045">point,</wd>

<space/>

<wd l="10258" t="10896" r="10512" b="11002">we</wd>

<space/>

</ln>

<ln l="6144" t="11112" r="10502" b="11314" baseLine="11261" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="11112" r="6533" b="11270">took</wd>

<space/>

<wd l="6614" t="11165" r="6710" b="11270">a</wd>

<space/>

<wd l="6778" t="11112" r="7517" b="11314">previous</wd>

<space/>

<wd l="7598" t="11136" r="8434" b="11314">prototype</wd>

<space/>

<wd l="8510" t="11112" r="8770" b="11270">for</wd>

<space/>

<wd l="8846" t="11112" r="9533" b="11314">Spanish</wd>

<space/>

<wd l="9605" t="11136" r="10080" b="11270">tweet</wd>

<space/>

<wd l="10152" t="11165" r="10502" b="11270">nor-</wd>

</ln>

<ln l="6144" t="11381" r="10512" b="11582" baseLine="11534" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="11381" r="7070" b="11539">malization</wd>

<space/>

<wd l="7152" t="11381" r="7824" b="11578">(Vilares</wd>

<space/>

<wd l="7915" t="11405" r="8069" b="11539">et</wd>

<space/>

<wd l="8150" t="11381" r="8400" b="11568">al.,</wd>

<space/>

<wd l="8496" t="11386" r="8990" b="11578">2013)</wd>

<space/>

<wd l="9077" t="11381" r="9653" b="11568">which,</wd>

<space/>

<wd l="9754" t="11381" r="10512" b="11582">although</wd>

<space/>

</ln>

<ln l="6144" t="11654" r="10502" b="11856" baseLine="11803" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="11654" r="6552" b="11856">fully</wd>

<space/>

<wd l="6648" t="11654" r="7574" b="11842">functional,</wd>

<space/>

<wd l="7690" t="11654" r="7963" b="11813">did</wd>

<space/>

<wd l="8054" t="11678" r="8333" b="11813">not</wd>

<space/>

<wd l="8419" t="11678" r="8774" b="11813">turn</wd>

<space/>

<wd l="8866" t="11678" r="9139" b="11813">out</wd>

<space/>

<wd l="9230" t="11678" r="9394" b="11813">to</wd>

<space/>

<wd l="9490" t="11654" r="9691" b="11813">be</wd>

<space/>

<wd l="9787" t="11707" r="9955" b="11813">as</wd>

<space/>

<wd l="10061" t="11654" r="10502" b="11813">flexi-</wd>

</ln>

<ln l="6144" t="11923" r="10512" b="12125" baseLine="12077" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="11923" r="6413" b="12082">ble</wd>

<space/>

<wd l="6466" t="11923" r="6778" b="12082">and</wd>

<space/>

<wd l="6830" t="11923" r="7954" b="12082">maintainable</wd>

<space/>

<wd l="8011" t="11976" r="8179" b="12082">as</wd>

<space/>

<wd l="8246" t="11923" r="9053" b="12125">expected.</wd>

<space/>

<wd l="9134" t="11923" r="9514" b="12082">This</wd>

<space/>

<wd l="9576" t="11923" r="10056" b="12082">could</wd>

<space/>

<wd l="10109" t="11923" r="10512" b="12082">have</wd>

<space/>

</ln>

<ln l="6144" t="12197" r="10512" b="12398" baseLine="12346" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="12197" r="6826" b="12355">become</wd>

<space/>

<wd l="6893" t="12250" r="6989" b="12355">a</wd>

<space/>

<wd l="7046" t="12197" r="7776" b="12398">problem</wd>

<space/>

<wd l="7838" t="12197" r="8098" b="12355">for</wd>

<space/>

<wd l="8155" t="12197" r="8674" b="12355">future</wd>

<space/>

<wd l="8746" t="12197" r="9984" b="12398">developments,</wd>

<space/>

<wd l="10070" t="12197" r="10512" b="12355">since</wd>

<space/>

</ln>

<ln l="6144" t="12466" r="10502" b="12667" baseLine="12619" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="12466" r="6413" b="12624">the</wd>

<space/>

<wd l="6470" t="12466" r="7373" b="12667">adaptation</wd>

<space/>

<wd l="7430" t="12466" r="7906" b="12624">effort</wd>

<space/>

<wd l="7958" t="12466" r="8578" b="12624">needed</wd>

<space/>

<wd l="8630" t="12490" r="8794" b="12624">to</wd>

<space/>

<wd l="8851" t="12466" r="9610" b="12667">integrate</wd>

<space/>

<wd l="9662" t="12518" r="10018" b="12624">new</wd>

<space/>

<wd l="10075" t="12466" r="10502" b="12624">tech-</wd>

</ln>

<ln l="6144" t="12739" r="10512" b="12941" baseLine="12888" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="12739" r="6706" b="12941">niques</wd>

<space/>

<wd l="6782" t="12739" r="7330" b="12898">would</wd>

<space/>

<wd l="7392" t="12739" r="7795" b="12898">have</wd>

<space/>

<wd l="7867" t="12739" r="8280" b="12898">been</wd>

<space/>

<wd l="8347" t="12763" r="8621" b="12898">too</wd>

<space/>

<wd l="8693" t="12739" r="9168" b="12941">large,</wd>

<space/>

<wd l="9259" t="12792" r="9442" b="12898">so</wd>

<space/>

<wd l="9509" t="12792" r="9763" b="12898">we</wd>

<space/>

<wd l="9835" t="12739" r="10512" b="12898">decided</wd>

<space/>

</ln>

<ln l="6144" t="13008" r="9763" b="13210" baseLine="13162" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="13032" r="6312" b="13166">to</wd>

<space/>

<wd l="6370" t="13008" r="7051" b="13166">refactor</wd>

<space/>

<wd l="7099" t="13008" r="7368" b="13166">the</wd>

<space/>

<wd l="7421" t="13008" r="7954" b="13166">whole</wd>

<space/>

<wd l="8021" t="13032" r="8621" b="13210">system</wd>

<space/>

<wd l="8669" t="13032" r="8837" b="13166">to</wd>

<space/>

<wd l="8904" t="13008" r="9350" b="13166">solve</wd>

<space/>

<wd l="9408" t="13008" r="9763" b="13166">this.</wd>

</ln>

</para>

<para l="6144" t="13291" r="10502" b="14035" alignment="justified" spaceBefore="12" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="13291" r="10502" b="13493" baseLine="13445" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6365" t="13291" r="6701" b="13450">The</wd>

<space/>

<wd l="6754" t="13291" r="7387" b="13493">general</wd>

<space/>

<wd l="7440" t="13291" r="8088" b="13450">scheme</wd>

<space/>

<wd l="8136" t="13291" r="8328" b="13450">of</wd>

<space/>

<wd l="8357" t="13291" r="8621" b="13450">the</wd>

<space/>

<wd l="8669" t="13291" r="9341" b="13493">original</wd>

<space/>

<wd l="9398" t="13315" r="9998" b="13493">system</wd>

<space/>

<wd l="10037" t="13291" r="10502" b="13445">mim-</wd>

</ln>

<ln l="6144" t="13565" r="10502" b="13766" baseLine="13714" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="13565" r="6379" b="13723">ics</wd>

<space/>

<wd l="6442" t="13565" r="6768" b="13723">that</wd>

<space/>

<wd l="6826" t="13565" r="7013" b="13723">of</wd>

<space/>

<wd l="7051" t="13570" r="7411" b="13723">Han</wd>

<space/>

<wd l="7474" t="13565" r="7786" b="13723">and</wd>

<space/>

<wd l="7834" t="13565" r="8578" b="13723">Baldwin</wd>

<space/>

<wd l="8635" t="13570" r="9197" b="13762">(2011)</wd>

<space/>

<wd l="9264" t="13565" r="9576" b="13723">and</wd>

<space/>

<wd l="9629" t="13565" r="10502" b="13766">comprises</wd>

<space/>

</ln>

<ln l="6144" t="13834" r="7214" b="14035" baseLine="13987" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="13834" r="6581" b="13992">three</wd>

<space/>

<wd l="6648" t="13858" r="7214" b="14035">stages:</wd>

</ln>

</para>

<para l="6341" t="14333" r="8419" b="14534" alignment="left" li="504" spaceBefore="228" fli="-288" lsp="exactly" lspExact="271" language="en">

<bullet type="ordered" numChars="3">

</bullet>

<ln l="6341" t="14333" r="8419" b="14534" baseLine="14486" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="6341" t="14338" r="6581" b="14486">1.</wd>

<space/>

<wd l="6581" t="14338" r="7114" b="14491">Tweet</wd>

<space/>

<wd l="7166" t="14333" r="8419" b="14534">preprocessing.</wd>

</ln>

</para>

<para l="6322" t="14832" r="10512" b="15307" alignment="justified" li="504" spaceBefore="231" fli="-288" lsp="exactly" lspExact="266" language="en">

<bullet type="ordered" numChars="3">

</bullet>

<ln l="6322" t="14832" r="10512" b="15038" baseLine="14986">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6322" t="14842" r="6581" b="14986">2.</wd>

<space/>

<wd l="6581" t="14837" r="7795" b="15038">In-vocabulary</wd>

<space/>

<wd l="7848" t="14837" r="8299" b="14995">word</wd>

<space/>

<wd l="8352" t="14837" r="9504" b="14995">identification</wd>

<space/>

</run>

<wd l="9566" t="14842" r="9950" b="15034"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">(</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">IV</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">),</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="10013" t="14837" r="10512" b="14995">based</wd>

<space/>

</run>

</ln>

<ln l="6586" t="15106" r="10502" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6586" t="15158" r="6802" b="15264">on</wd>

<space/>

<wd l="6898" t="15106" r="7162" b="15264">the</wd>

<space/>

<wd l="7262" t="15106" r="7901" b="15264">lexicon</wd>

<space/>

<wd l="8002" t="15106" r="8194" b="15264">of</wd>

<space/>

<wd l="8275" t="15106" r="8544" b="15264">the</wd>

<space/>

<wd l="8650" t="15130" r="9288" b="15307">system,</wd>

<space/>

<wd l="9413" t="15106" r="10229" b="15307">obtaining</wd>

<space/>

<wd l="10334" t="15158" r="10502" b="15264">as</wd>

</ln>

</para>

</column>

</section>

<section l="1440" t="15316" r="10524" b="16480">

<column l="1440" t="15316" r="10524" b="16480">

<para l="5804" t="15792" r="6143" b="15946" alignment="centered" spaceBefore="406" lsp="exactly" lspExact="271" language="en">

<ln l="5870" t="15792" r="6077" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="39">

<wd l="5870" t="15792" r="6077" b="15946">99</wd>

</ln>

</para>

<para l="2870" t="16128" r="9029" b="16469" alignment="centered" spaceBefore="139" lsp="exactly" lspExact="170" language="en">

<ln l="2870" t="16128" r="9029" b="16325" baseLine="16253" forcedEOF="true">

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2870" t="16133" r="3758" b="16296">Proceedings</wd>

<space/>

<wd l="3811" t="16133" r="3970" b="16296">of</wd>

<space/>

<wd l="3994" t="16133" r="4205" b="16262">the</wd>

<space/>

<wd l="4243" t="16138" r="4579" b="16262">ACL</wd>

<space/>

<wd l="4622" t="16133" r="4982" b="16262">2015</wd>

<space/>

<wd l="5035" t="16133" r="5731" b="16296">Workshop</wd>

<space/>

<wd l="5784" t="16176" r="5957" b="16262">on</wd>

<space/>

<wd l="6000" t="16138" r="6408" b="16296">Noisy</wd>

<space/>

<wd l="6470" t="16133" r="7579" b="16296">User-generated</wd>

<space/>

</run>

<wd l="7627" t="16138" r="7949" b="16286"><run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Text</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7997" t="16171" r="8400" b="16325">pages</wd>

<space/>

<wd l="8458" t="16133" r="9029" b="16286">99–105,
</wd>

</run>

</ln>

<ln l="3029" t="16296" r="8870" b="16469" baseLine="16425" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3029" t="16301" r="3595" b="16469">Beijing,</wd>

<space/>

<wd l="3653" t="16301" r="4114" b="16454">China,</wd>

<space/>

<wd l="4166" t="16301" r="4459" b="16469">July</wd>

<space/>

<wd l="4512" t="16301" r="4723" b="16454">31,</wd>

<space/>

<wd l="4781" t="16301" r="5170" b="16430">2015.</wd>

<space/>

</run>

<wd l="5246" t="16296" r="5770" b="16469"><run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">c</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">�</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5822" t="16301" r="6672" b="16430">Association</wd>

<space/>

<wd l="6715" t="16301" r="6926" b="16430">for</wd>

<space/>

<wd l="6974" t="16301" r="8035" b="16469">Computational</wd>

<space/>

<wd l="8078" t="16301" r="8870" b="16469">Linguistics</wd>

</run>

</ln>

</para>

</column>

</section>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4315.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1261" marginRight="1385" marginBottom="1292" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1261" r="10524" b="15317">

<column l="1440" t="1261" r="5822" b="15317">

<para l="1877" t="1320" r="5803" b="1790" alignment="justified" li="432" lsp="exactly" lspExact="269" language="en">

<ln l="1882" t="1320" r="5803" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="1373" r="1978" b="1478">a</wd>

<space/>

<wd l="2078" t="1320" r="2568" b="1478">result</wd>

<space/>

<wd l="2678" t="1373" r="2875" b="1478">an</wd>

<space/>

<wd l="2986" t="1320" r="3490" b="1478">initial</wd>

<space/>

<wd l="3610" t="1344" r="3845" b="1478">set</wd>

<space/>

<wd l="3955" t="1320" r="4147" b="1478">of</wd>

<space/>

<wd l="4243" t="1320" r="5803" b="1522">out-of-vocabulary</wd>

<space/>

</ln>

<ln l="1877" t="1594" r="3053" b="1790" baseLine="1742">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1877" t="1594" r="2400" b="1752">words</wd>

<space/>

</run>

<wd l="2472" t="1598" r="3053" b="1790"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">OOV</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1618" t="2088" r="5803" b="5270" alignment="justified" li="432" spaceBefore="224" fli="-216" lsp="exactly" lspExact="271" language="en">

<ln l="1618" t="2088" r="5794" b="2290" baseLine="2237">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1618" t="2093" r="1766" b="2246">3.</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1886" t="2122" r="2270" b="2246">OOV</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2333" t="2112" r="2568" b="2246">set</wd>

<space/>

<wd l="2611" t="2088" r="3542" b="2290">processing</wd>

<space/>

<wd l="3590" t="2088" r="3758" b="2242">in</wd>

<space/>

<wd l="3806" t="2088" r="4267" b="2246">order</wd>

<space/>

<wd l="4310" t="2112" r="4474" b="2246">to</wd>

<space/>

<wd l="4526" t="2088" r="5482" b="2290">distinguish</wd>

<space/>

<wd l="5525" t="2088" r="5794" b="2246">be-</wd>

</run>

</ln>

<ln l="1877" t="2357" r="5794" b="2558" baseLine="2506" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="2381" r="2400" b="2515">tween</wd>

<space/>

<wd l="2453" t="2381" r="3053" b="2515">correct</wd>

<space/>

<wd l="3101" t="2357" r="3624" b="2515">words</wd>

<space/>

<wd l="3682" t="2357" r="4214" b="2515">which</wd>

<space/>

<wd l="4267" t="2410" r="4531" b="2515">are</wd>

<space/>

<wd l="4584" t="2381" r="4862" b="2515">out</wd>

<space/>

<wd l="4910" t="2357" r="5102" b="2515">of</wd>

<space/>

<wd l="5136" t="2357" r="5405" b="2515">the</wd>

<space/>

<wd l="5462" t="2410" r="5794" b="2558">sys-</wd>

</ln>

<ln l="1877" t="2626" r="5794" b="2827" baseLine="2779">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1877" t="2650" r="2208" b="2784">tem</wd>

<space/>

<wd l="2275" t="2626" r="2918" b="2784">lexicon</wd>

<space/>

<wd l="2995" t="2626" r="3302" b="2784">and</wd>

<space/>

<wd l="3374" t="2678" r="3950" b="2827">proper</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="4022" t="2626" r="4598" b="2784">lexical</wd>

<space/>

</run>

<wd l="4666" t="2635" r="5424" b="2813"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">variants</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="5520" t="2626" r="5794" b="2784">ob-</wd>

</run>

</ln>

<ln l="1877" t="2899" r="5794" b="3101" baseLine="3048" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="2899" r="2477" b="3101">taining</wd>

<space/>

<wd l="2568" t="2899" r="2822" b="3058">for</wd>

<space/>

<wd l="2909" t="2899" r="3307" b="3058">each</wd>

<space/>

<wd l="3394" t="2952" r="3701" b="3058">one</wd>

<space/>

<wd l="3792" t="2899" r="3984" b="3058">of</wd>

<space/>

<wd l="4051" t="2899" r="4315" b="3058">the</wd>

<space/>

<wd l="4402" t="2899" r="4853" b="3058">latter</wd>

<space/>

<wd l="4939" t="2952" r="5035" b="3058">a</wd>

<space/>

<wd l="5117" t="2899" r="5794" b="3058">normal-</wd>

</ln>

<ln l="1877" t="3168" r="5794" b="3370" baseLine="3322" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="3168" r="2242" b="3326">ized</wd>

<space/>

<wd l="2314" t="3168" r="2784" b="3326">form.</wd>

<space/>

<wd l="2923" t="3168" r="3307" b="3326">This</wd>

<space/>

<wd l="3389" t="3168" r="3691" b="3326">last</wd>

<space/>

<wd l="3778" t="3192" r="4114" b="3370">step</wd>

<space/>

<wd l="4200" t="3221" r="4493" b="3326">can</wd>

<space/>

<wd l="4574" t="3168" r="4776" b="3326">be</wd>

<space/>

<wd l="4853" t="3168" r="5026" b="3322">in</wd>

<space/>

<wd l="5098" t="3192" r="5453" b="3326">turn</wd>

<space/>

<wd l="5530" t="3168" r="5794" b="3326">de-</wd>

</ln>

<ln l="1882" t="3442" r="5794" b="3643" baseLine="3590" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="3442" r="2765" b="3643">composed</wd>

<space/>

<wd l="2818" t="3442" r="3154" b="3600">into</wd>

<space/>

<wd l="3216" t="3466" r="3586" b="3600">two:</wd>

<space/>

<wd l="3677" t="3442" r="3941" b="3600">the</wd>

<space/>

<wd l="4008" t="3442" r="4344" b="3600">first</wd>

<space/>

<wd l="4402" t="3494" r="4757" b="3629">one,</wd>

<space/>

<wd l="4829" t="3442" r="5362" b="3600">which</wd>

<space/>

<wd l="5424" t="3494" r="5794" b="3643">gen-</wd>

</ln>

<ln l="1882" t="3710" r="5794" b="3912" baseLine="3864" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="3734" r="2376" b="3869">erates</wd>

<space/>

<wd l="2462" t="3763" r="2558" b="3869">a</wd>

<space/>

<wd l="2635" t="3734" r="2870" b="3869">set</wd>

<space/>

<wd l="2942" t="3710" r="3134" b="3869">of</wd>

<space/>

<wd l="3192" t="3710" r="3907" b="3912">possible</wd>

<space/>

<wd l="3979" t="3710" r="5189" b="3869">normalization</wd>

<space/>

<wd l="5266" t="3710" r="5794" b="3869">candi-</wd>

</ln>

<ln l="1882" t="3984" r="5794" b="4186" baseLine="4133" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="3984" r="2318" b="4142">dates</wd>

<space/>

<wd l="2381" t="3984" r="2880" b="4142">based</wd>

<space/>

<wd l="2938" t="4037" r="3154" b="4142">on</wd>

<space/>

<wd l="3211" t="3984" r="3475" b="4142">the</wd>

<space/>

<wd l="3538" t="3984" r="4502" b="4186">application</wd>

<space/>

<wd l="4565" t="3984" r="4752" b="4142">of</wd>

<space/>

<wd l="4800" t="3984" r="5390" b="4142">certain</wd>

<space/>

<wd l="5448" t="4037" r="5794" b="4142">nor-</wd>

</ln>

<ln l="1877" t="4253" r="5794" b="4454" baseLine="4406" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="4253" r="2798" b="4411">malization</wd>

<space/>

<wd l="2885" t="4253" r="3869" b="4454">techniques;</wd>

<space/>

<wd l="3989" t="4253" r="4301" b="4411">and</wd>

<space/>

<wd l="4387" t="4253" r="4651" b="4411">the</wd>

<space/>

<wd l="4752" t="4253" r="5347" b="4411">second</wd>

<space/>

<wd l="5438" t="4306" r="5794" b="4440">one,</wd>

<space/>

</ln>

<ln l="1877" t="4526" r="5803" b="4685" baseLine="4675" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="4526" r="2410" b="4685">which</wd>

<space/>

<wd l="2491" t="4526" r="3053" b="4685">selects</wd>

<space/>

<wd l="3139" t="4579" r="3446" b="4685">one</wd>

<space/>

<wd l="3523" t="4526" r="3715" b="4685">of</wd>

<space/>

<wd l="3773" t="4526" r="4219" b="4685">these</wd>

<space/>

<wd l="4296" t="4526" r="5208" b="4685">candidates</wd>

<space/>

<wd l="5290" t="4579" r="5458" b="4685">as</wd>

<space/>

<wd l="5539" t="4526" r="5803" b="4685">the</wd>

<space/>

</ln>

<ln l="1877" t="4795" r="5794" b="4992" baseLine="4944" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="4795" r="2861" b="4954">normalized</wd>

<space/>

<wd l="2966" t="4795" r="3394" b="4954">form</wd>

<space/>

<wd l="3504" t="4795" r="3739" b="4992">(in</wd>

<space/>

<wd l="3850" t="4848" r="4138" b="4954">our</wd>

<space/>

<wd l="4248" t="4848" r="4661" b="4982">case,</wd>

<space/>

<wd l="4790" t="4795" r="4963" b="4949">in</wd>

<space/>

<wd l="5074" t="4848" r="5170" b="4954">a</wd>

<space/>

<wd l="5280" t="4848" r="5794" b="4954">score-</wd>

</ln>

<ln l="1882" t="5069" r="3250" b="5270" baseLine="5218" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="5069" r="2429" b="5227">driven</wd>

<space/>

<wd l="2482" t="5074" r="3250" b="5270">process).</wd>

</ln>

</para>

<para l="1440" t="5558" r="5803" b="7114" alignment="justified" spaceBefore="222" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="5558" r="5794" b="5760" baseLine="5712" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5563" r="1675" b="5717">As</wd>

<space/>

<wd l="1728" t="5558" r="1987" b="5717">for</wd>

<space/>

<wd l="2030" t="5558" r="2294" b="5717">the</wd>

<space/>

<wd l="2342" t="5558" r="3182" b="5760">particular</wd>

<space/>

<wd l="3226" t="5558" r="4440" b="5717">normalization</wd>

<space/>

<wd l="4488" t="5558" r="5410" b="5760">techniques</wd>

<space/>

<wd l="5472" t="5611" r="5794" b="5717">em-</wd>

</ln>

<ln l="1440" t="5832" r="5803" b="6034" baseLine="5981" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5832" r="2035" b="6034">ployed</wd>

<space/>

<wd l="2107" t="5832" r="3062" b="6034">throughout</wd>

<space/>

<wd l="3139" t="5885" r="3432" b="5990">our</wd>

<space/>

<wd l="3509" t="5856" r="4152" b="6034">system,</wd>

<space/>

<wd l="4238" t="5885" r="4493" b="5990">we</wd>

<space/>

<wd l="4574" t="5832" r="5246" b="5990">decided</wd>

<space/>

<wd l="5318" t="5856" r="5486" b="5990">to</wd>

<space/>

<wd l="5563" t="5856" r="5803" b="6034">try</wd>

<space/>

</ln>

<ln l="1445" t="6101" r="5794" b="6302" baseLine="6250" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="6101" r="1781" b="6259">first</wd>

<space/>

<wd l="1872" t="6154" r="1968" b="6259">a</wd>

<space/>

<wd l="2059" t="6101" r="3144" b="6259">combination</wd>

<space/>

<wd l="3235" t="6101" r="3427" b="6259">of</wd>

<space/>

<wd l="3504" t="6125" r="3826" b="6259">two</wd>

<space/>

<wd l="3922" t="6101" r="4114" b="6259">of</wd>

<space/>

<wd l="4186" t="6101" r="4454" b="6259">the</wd>

<space/>

<wd l="4541" t="6101" r="5434" b="6259">traditional</wd>

<space/>

<wd l="5530" t="6154" r="5794" b="6302">ap-</wd>

</ln>

<ln l="1440" t="6374" r="5803" b="6576" baseLine="6523" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6374" r="2582" b="6576">proximations</wd>

<space/>

<wd l="2650" t="6398" r="2818" b="6533">to</wd>

<space/>

<wd l="2880" t="6374" r="3187" b="6533">this</wd>

<space/>

<wd l="3254" t="6374" r="3605" b="6533">task</wd>

<space/>

<wd l="3672" t="6374" r="4286" b="6571">(Kobus</wd>

<space/>

<wd l="4358" t="6398" r="4512" b="6533">et</wd>

<space/>

<wd l="4574" t="6374" r="4824" b="6562">al.,</wd>

<space/>

<wd l="4896" t="6379" r="5448" b="6571">2008):</wd>

<space/>

<wd l="5539" t="6374" r="5803" b="6533">the</wd>

<space/>

</ln>

<ln l="1450" t="6643" r="5794" b="6845" baseLine="6792" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="6643" r="1843" b="6845">spell</wd>

<space/>

<wd l="1925" t="6643" r="2702" b="6845">checking</wd>

<space/>

<wd l="2779" t="6643" r="3091" b="6802">and</wd>

<space/>

<wd l="3158" t="6643" r="3422" b="6802">the</wd>

<space/>

<wd l="3494" t="6643" r="4344" b="6802">automatic</wd>

<space/>

<wd l="4426" t="6643" r="5011" b="6845">speech</wd>

<space/>

<wd l="5078" t="6643" r="5794" b="6845">recogni-</wd>

</ln>

<ln l="1440" t="6912" r="2784" b="7114" baseLine="7066" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6912" r="1781" b="7070">tion</wd>

<space/>

<wd l="1834" t="6912" r="2784" b="7114">metaphors.</wd>

</ln>

</para>

<para l="1440" t="7397" r="3086" b="7598" alignment="left" spaceBefore="234" lsp="exactly" lspExact="249" language="en">

<ln l="1440" t="7397" r="3086" b="7598" baseLine="7550" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">

<wd l="1440" t="7397" r="1704" b="7555">2.1</wd>

<space/>

<wd l="1934" t="7402" r="2294" b="7555">The</wd>

<space/>

<wd l="2347" t="7397" r="3086" b="7598">pipeline</wd>

</ln>

</para>

<para l="1440" t="7766" r="5813" b="9869" alignment="justified" spaceBefore="99" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="7766" r="5813" b="7968" baseLine="7920">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="7771" r="1723" b="7925">We</wd>

<space/>

<wd l="1795" t="7766" r="2467" b="7925">decided</wd>

<space/>

<wd l="2530" t="7790" r="2698" b="7925">to</wd>

<space/>

<wd l="2765" t="7766" r="3130" b="7968">give</wd>

<space/>

<wd l="3197" t="7819" r="3485" b="7925">our</wd>

<space/>

<wd l="3557" t="7790" r="4152" b="7968">system</wd>

<space/>

<wd l="4219" t="7819" r="4416" b="7925">an</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="4488" t="7766" r="5021" b="7968">object</wd>

<space/>

<wd l="5083" t="7766" r="5813" b="7925">oriented</wd>

<space/>

</run>

</ln>

<ln l="1445" t="8040" r="5794" b="8242" baseLine="8189">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1445" t="8040" r="2242" b="8242">approach</wd>

<space/>

<wd l="2318" t="8040" r="2846" b="8242">(using</wd>

<space/>

</run>

<wd l="2923" t="8045" r="3427" b="8237"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">J</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">AVA</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="3509" t="8093" r="3677" b="8198">as</wd>

<space/>

<wd l="3758" t="8040" r="4483" b="8242">opposed</wd>

<space/>

<wd l="4546" t="8064" r="4714" b="8198">to</wd>

<space/>

<wd l="4786" t="8040" r="5050" b="8198">the</wd>

<space/>

</run>

<wd l="5126" t="8050" r="5794" b="8242" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">impera-</wd>

</ln>

<ln l="1445" t="8309" r="5794" b="8510" baseLine="8462">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1445" t="8318" r="1747" b="8467">tive</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1819" t="8309" r="2616" b="8510">approach</wd>

<space/>

<wd l="2678" t="8309" r="2870" b="8467">of</wd>

<space/>

<wd l="2918" t="8309" r="3182" b="8467">the</wd>

<space/>

<wd l="3250" t="8309" r="3922" b="8510">original</wd>

<space/>

<wd l="3984" t="8333" r="4819" b="8510">prototype</wd>

<space/>

<wd l="4891" t="8309" r="5126" b="8506">(in</wd>

<space/>

</run>

<wd l="5189" t="8314" r="5794" b="8506"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">P</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">ERL</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

</ln>

<ln l="1440" t="8582" r="5794" b="8784" baseLine="8731">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="8582" r="1781" b="8741">The</wd>

<space/>

<wd l="1858" t="8635" r="2213" b="8741">new</wd>

<space/>

<wd l="2304" t="8606" r="2904" b="8784">system</wd>

<space/>

<wd l="2981" t="8582" r="3120" b="8741">is</wd>

<space/>

<wd l="3216" t="8582" r="4080" b="8741">structured</wd>

<space/>

<wd l="4162" t="8582" r="4330" b="8736">in</wd>

<space/>

</run>

<wd l="4392" t="8635" r="5386" b="8784"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">processors</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="5482" t="8582" r="5794" b="8741">for-</wd>

</run>

</ln>

<ln l="1440" t="8851" r="5803" b="9053" baseLine="9005">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="8851" r="1944" b="9053">merly</wd>

<space/>

<wd l="2016" t="8851" r="2606" b="9010">known</wd>

<space/>

<wd l="2678" t="8904" r="2846" b="9010">as</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="2923" t="8851" r="3643" b="9010">modules</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="3715" t="8851" r="3888" b="9005">in</wd>

<space/>

<wd l="3950" t="8851" r="4219" b="9010">the</wd>

<space/>

<wd l="4286" t="8875" r="5165" b="9053">prototype,</wd>

<space/>

<wd l="5246" t="8851" r="5803" b="9010">whose</wd>

<space/>

</run>

</ln>

<ln l="1445" t="9125" r="5808" b="9326" baseLine="9274" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="9125" r="1814" b="9326">goal</wd>

<space/>

<wd l="1925" t="9125" r="2059" b="9283">is</wd>

<space/>

<wd l="2174" t="9149" r="2342" b="9283">to</wd>

<space/>

<wd l="2458" t="9125" r="2933" b="9326">apply</wd>

<space/>

<wd l="3048" t="9178" r="3144" b="9283">a</wd>

<space/>

<wd l="3250" t="9125" r="3840" b="9283">certain</wd>

<space/>

<wd l="3946" t="9178" r="4594" b="9326">process</wd>

<space/>

<wd l="4709" t="9149" r="4872" b="9283">to</wd>

<space/>

<wd l="4982" t="9125" r="5251" b="9283">the</wd>

<space/>

<wd l="5357" t="9125" r="5808" b="9326">input</wd>

<space/>

</ln>

<ln l="1440" t="9394" r="5808" b="9552" baseLine="9547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9418" r="1987" b="9552">tweets</wd>

<space/>

<wd l="2107" t="9446" r="2290" b="9552">so</wd>

<space/>

<wd l="2395" t="9394" r="2722" b="9552">that</wd>

<space/>

<wd l="2822" t="9446" r="3077" b="9552">we</wd>

<space/>

<wd l="3182" t="9446" r="3475" b="9552">can</wd>

<space/>

<wd l="3586" t="9394" r="4128" b="9552">obtain</wd>

<space/>

<wd l="4224" t="9394" r="4493" b="9552">the</wd>

<space/>

<wd l="4594" t="9394" r="5808" b="9552">normalization</wd>

<space/>

</ln>

<ln l="1445" t="9667" r="4718" b="9869" baseLine="9816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="9667" r="2352" b="9826">candidates</wd>

<space/>

<wd l="2419" t="9667" r="2611" b="9826">of</wd>

<space/>

<wd l="2650" t="9667" r="3058" b="9826">their</wd>

<space/>

<wd l="3106" t="9691" r="3581" b="9826">terms</wd>

<space/>

<wd l="3653" t="9691" r="3806" b="9826">at</wd>

<space/>

<wd l="3859" t="9667" r="4056" b="9826">its</wd>

<space/>

<wd l="4123" t="9691" r="4718" b="9869">output.</wd>

</ln>

</para>

<para l="1440" t="9946" r="5808" b="12859" alignment="justified" spaceBefore="9" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="9946" r="5803" b="10147" baseLine="10099" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1656" t="9946" r="1997" b="10104">The</wd>

<space/>

<wd l="2141" t="9998" r="2510" b="10104">core</wd>

<space/>

<wd l="2654" t="9970" r="3624" b="10147">component</wd>

<space/>

<wd l="3763" t="9946" r="3955" b="10104">of</wd>

<space/>

<wd l="4085" t="9998" r="4373" b="10104">our</wd>

<space/>

<wd l="4517" t="9970" r="5117" b="10147">system</wd>

<space/>

<wd l="5256" t="9946" r="5390" b="10104">is</wd>

<space/>

<wd l="5539" t="9946" r="5803" b="10104">the</wd>

<space/>

</ln>

<ln l="1440" t="10219" r="5803" b="10421" baseLine="10368" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="10219" r="2184" b="10421">pipeline,</wd>

<space/>

<wd l="2275" t="10219" r="3154" b="10421">consisting</wd>

<space/>

<wd l="3230" t="10219" r="3422" b="10378">of</wd>

<space/>

<wd l="3480" t="10272" r="3576" b="10378">a</wd>

<space/>

<wd l="3648" t="10219" r="4219" b="10378">classic</wd>

<space/>

<wd l="4301" t="10219" r="4973" b="10378">cascade</wd>

<space/>

<wd l="5050" t="10243" r="5803" b="10378">structure</wd>

<space/>

</ln>

<ln l="1440" t="10488" r="5794" b="10690" baseLine="10642" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="10488" r="1973" b="10646">where</wd>

<space/>

<wd l="2050" t="10541" r="2304" b="10646">we</wd>

<space/>

<wd l="2386" t="10541" r="2683" b="10646">can</wd>

<space/>

<wd l="2765" t="10488" r="3250" b="10646">insert</wd>

<space/>

<wd l="3331" t="10541" r="3528" b="10646">an</wd>

<space/>

<wd l="3614" t="10488" r="4358" b="10690">arbitrary</wd>

<space/>

<wd l="4440" t="10488" r="5107" b="10646">number</wd>

<space/>

<wd l="5189" t="10488" r="5376" b="10646">of</wd>

<space/>

<wd l="5443" t="10541" r="5794" b="10690">pro-</wd>

</ln>

<ln l="1445" t="10762" r="5794" b="10963" baseLine="10910" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="10814" r="2064" b="10920">cessors</wd>

<space/>

<wd l="2126" t="10762" r="2438" b="10920">and</wd>

<space/>

<wd l="2486" t="10762" r="2890" b="10920">have</wd>

<space/>

<wd l="2938" t="10762" r="3346" b="10920">their</wd>

<space/>

<wd l="3389" t="10762" r="3917" b="10963">inputs</wd>

<space/>

<wd l="3979" t="10762" r="4291" b="10920">and</wd>

<space/>

<wd l="4344" t="10786" r="4973" b="10963">outputs</wd>

<space/>

<wd l="5035" t="10786" r="5794" b="10920">automat-</wd>

</ln>

<ln l="1440" t="11030" r="5803" b="11232" baseLine="11179" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="11030" r="1920" b="11232">ically</wd>

<space/>

<wd l="1982" t="11030" r="2568" b="11189">linked.</wd>

<space/>

<wd l="2659" t="11035" r="2842" b="11184">In</wd>

<space/>

<wd l="2899" t="11030" r="3206" b="11189">this</wd>

<space/>

<wd l="3269" t="11083" r="3662" b="11232">way,</wd>

<space/>

<wd l="3730" t="11030" r="3998" b="11189">the</wd>

<space/>

<wd l="4061" t="11030" r="4733" b="11232">original</wd>

<space/>

<wd l="4790" t="11030" r="5242" b="11232">input</wd>

<space/>

<wd l="5304" t="11030" r="5496" b="11189">of</wd>

<space/>

<wd l="5539" t="11030" r="5803" b="11189">the</wd>

<space/>

</ln>

<ln l="1450" t="11304" r="5803" b="11506" baseLine="11453" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1450" t="11328" r="2050" b="11506">system</wd>

<space/>

<wd l="2088" t="11304" r="2846" b="11462">becomes</wd>

<space/>

<wd l="2894" t="11304" r="3163" b="11462">the</wd>

<space/>

<wd l="3206" t="11304" r="3653" b="11506">input</wd>

<space/>

<wd l="3701" t="11304" r="3893" b="11462">of</wd>

<space/>

<wd l="3922" t="11304" r="4186" b="11462">the</wd>

<space/>

<wd l="4234" t="11304" r="4570" b="11462">first</wd>

<space/>

<wd l="4613" t="11357" r="5482" b="11506">processor,</wd>

<space/>

<wd l="5539" t="11304" r="5803" b="11462">the</wd>

<space/>

</ln>

<ln l="1445" t="11573" r="5794" b="11774" baseLine="11722" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="11597" r="2002" b="11774">output</wd>

<space/>

<wd l="2054" t="11573" r="2246" b="11731">of</wd>

<space/>

<wd l="2285" t="11573" r="2549" b="11731">the</wd>

<space/>

<wd l="2606" t="11573" r="2942" b="11731">first</wd>

<space/>

<wd l="2995" t="11626" r="3835" b="11774">processor</wd>

<space/>

<wd l="3883" t="11573" r="4022" b="11731">is</wd>

<space/>

<wd l="4080" t="11573" r="4349" b="11731">the</wd>

<space/>

<wd l="4402" t="11573" r="4853" b="11774">input</wd>

<space/>

<wd l="4906" t="11573" r="5098" b="11731">of</wd>

<space/>

<wd l="5136" t="11573" r="5400" b="11731">the</wd>

<space/>

<wd l="5462" t="11626" r="5794" b="11731">sec-</wd>

</ln>

<ln l="1445" t="11842" r="5803" b="12043" baseLine="11995" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="11842" r="1766" b="12000">ond</wd>

<space/>

<wd l="1829" t="11894" r="2179" b="12029">one,</wd>

<space/>

<wd l="2246" t="11842" r="2510" b="12000">the</wd>

<space/>

<wd l="2573" t="11866" r="3130" b="12043">output</wd>

<space/>

<wd l="3187" t="11842" r="3374" b="12000">of</wd>

<space/>

<wd l="3418" t="11842" r="3725" b="12000">this</wd>

<space/>

<wd l="3797" t="11842" r="4392" b="12000">second</wd>

<space/>

<wd l="4450" t="11894" r="5290" b="12043">processor</wd>

<space/>

<wd l="5338" t="11842" r="5477" b="12000">is</wd>

<space/>

<wd l="5539" t="11842" r="5803" b="12000">the</wd>

<space/>

</ln>

<ln l="1440" t="12115" r="5803" b="12317" baseLine="12264" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="12115" r="1891" b="12317">input</wd>

<space/>

<wd l="1944" t="12115" r="2131" b="12274">of</wd>

<space/>

<wd l="2170" t="12115" r="2434" b="12274">the</wd>

<space/>

<wd l="2482" t="12115" r="2894" b="12274">third</wd>

<space/>

<wd l="2947" t="12168" r="3302" b="12302">one,</wd>

<space/>

<wd l="3365" t="12115" r="3677" b="12274">and</wd>

<space/>

<wd l="3734" t="12168" r="3917" b="12274">so</wd>

<space/>

<wd l="3974" t="12168" r="4229" b="12302">on,</wd>

<space/>

<wd l="4291" t="12115" r="4690" b="12274">until</wd>

<space/>

<wd l="4738" t="12115" r="5486" b="12317">reaching</wd>

<space/>

<wd l="5539" t="12115" r="5803" b="12274">the</wd>

<space/>

</ln>

<ln l="1440" t="12384" r="5808" b="12586" baseLine="12538" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="12384" r="1747" b="12542">last</wd>

<space/>

<wd l="1824" t="12437" r="2693" b="12586">processor,</wd>

<space/>

<wd l="2789" t="12384" r="3346" b="12542">whose</wd>

<space/>

<wd l="3427" t="12408" r="3984" b="12586">output</wd>

<space/>

<wd l="4061" t="12384" r="4814" b="12542">becomes</wd>

<space/>

<wd l="4901" t="12384" r="5170" b="12542">the</wd>

<space/>

<wd l="5251" t="12408" r="5808" b="12586">output</wd>

<space/>

</ln>

<ln l="1445" t="12658" r="2645" b="12859" baseLine="12806" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="12658" r="1637" b="12816">of</wd>

<space/>

<wd l="1675" t="12658" r="1944" b="12816">the</wd>

<space/>

<wd l="2006" t="12682" r="2645" b="12859">system.</wd>

</ln>

</para>

<para l="1440" t="12941" r="5818" b="15307" alignment="justified" spaceBefore="14" fli="216" lsp="exactly" lspExact="269" language="en">

<ln l="1656" t="12941" r="5808" b="13142" baseLine="13090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="12941" r="2558" b="13142">Regarding</wd>

<space/>

<wd l="2654" t="12941" r="2851" b="13099">its</wd>

<space/>

<wd l="2952" t="12941" r="3562" b="13142">design,</wd>

<space/>

<wd l="3672" t="12994" r="3926" b="13099">we</wd>

<space/>

<wd l="4018" t="12941" r="4421" b="13099">have</wd>

<space/>

<wd l="4507" t="12941" r="5280" b="13099">followed</wd>

<space/>

<wd l="5376" t="12941" r="5808" b="13142">good</wd>

<space/>

</ln>

<ln l="1445" t="13210" r="5818" b="13411" baseLine="13358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="13210" r="2467" b="13411">engineering</wd>

<space/>

<wd l="2554" t="13210" r="3317" b="13411">practices</wd>

<space/>

<wd l="3413" t="13210" r="3725" b="13368">and</wd>

<space/>

<wd l="3806" t="13210" r="4277" b="13368">made</wd>

<space/>

<wd l="4363" t="13210" r="5170" b="13368">extensive</wd>

<space/>

<wd l="5251" t="13262" r="5539" b="13368">use</wd>

<space/>

<wd l="5630" t="13210" r="5818" b="13368">of</wd>

<space/>

</ln>

<ln l="1440" t="13478" r="5808" b="13680" baseLine="13632">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1440" t="13478" r="2006" b="13680">design</wd>

<space/>

</run>

<wd l="2054" t="13512" r="2832" b="13680"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">patterns</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="2942" t="13483" r="3590" b="13680">Among</wd>

<space/>

<wd l="3662" t="13478" r="4138" b="13666">them,</wd>

<space/>

<wd l="4219" t="13478" r="4339" b="13637">it</wd>

<space/>

<wd l="4411" t="13478" r="4987" b="13637">should</wd>

<space/>

<wd l="5050" t="13478" r="5256" b="13637">be</wd>

<space/>

<wd l="5318" t="13478" r="5808" b="13637">noted</wd>

<space/>

</run>

</ln>

<ln l="1440" t="13752" r="5794" b="13954" baseLine="13901">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1440" t="13752" r="1704" b="13910">the</wd>

<space/>

<wd l="1757" t="13805" r="2045" b="13910">use</wd>

<space/>

<wd l="2102" t="13752" r="2294" b="13910">of</wd>

<space/>

<wd l="2333" t="13752" r="2597" b="13910">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="2650" t="13752" r="3514" b="13910">decorator</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="3562" t="13776" r="4166" b="13954">pattern</wd>

<space/>

<wd l="4219" t="13752" r="4795" b="13939">which,</wd>

<space/>

<wd l="4858" t="13752" r="5026" b="13906">in</wd>

<space/>

<wd l="5083" t="13805" r="5371" b="13910">our</wd>

<space/>

<wd l="5424" t="13805" r="5794" b="13910">con-</wd>

</run>

</ln>

<ln l="1440" t="14021" r="5803" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="14045" r="1810" b="14208">text,</wd>

<space/>

<wd l="1901" t="14045" r="2774" b="14222">represents</wd>

<space/>

<wd l="2866" t="14074" r="2962" b="14179">a</wd>

<space/>

<wd l="3043" t="14021" r="3614" b="14222">simple</wd>

<space/>

<wd l="3691" t="14021" r="4440" b="14222">pipeline,</wd>

<space/>

<wd l="4536" t="14021" r="5285" b="14222">allowing</wd>

<space/>

<wd l="5366" t="14074" r="5554" b="14179">us</wd>

<space/>

<wd l="5635" t="14045" r="5803" b="14179">to</wd>

<space/>

</ln>

<ln l="1445" t="14294" r="5794" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="14294" r="2515" b="14496">dynamically</wd>

<space/>

<wd l="2592" t="14294" r="3034" b="14453">stack</wd>

<space/>

<wd l="3101" t="14347" r="3298" b="14453">an</wd>

<space/>

<wd l="3374" t="14294" r="4118" b="14496">arbitrary</wd>

<space/>

<wd l="4186" t="14294" r="4858" b="14453">number</wd>

<space/>

<wd l="4920" t="14294" r="5112" b="14453">of</wd>

<space/>

<wd l="5165" t="14347" r="5794" b="14496">proces-</wd>

</ln>

<ln l="1450" t="14563" r="5808" b="14765" baseLine="14717">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1450" t="14616" r="1834" b="14722">sors.</wd>

<space/>

<wd l="1910" t="14568" r="2122" b="14722">Its</wd>

<space/>

<wd l="2189" t="14563" r="3274" b="14722">combination</wd>

<space/>

<wd l="3326" t="14563" r="3715" b="14722">with</wd>

<space/>

<wd l="3763" t="14563" r="4027" b="14722">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="4085" t="14573" r="5146" b="14765">composition</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="5198" t="14587" r="5808" b="14765">pattern</wd>

<space/>

</run>

</ln>

<ln l="1440" t="14837" r="5803" b="15038" baseLine="14986">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1440" t="14837" r="1733" b="14995">lets</wd>

<space/>

<wd l="1819" t="14890" r="2006" b="14995">us</wd>

<space/>

<wd l="2093" t="14890" r="2597" b="15038">group</wd>

<space/>

<wd l="2678" t="14837" r="3115" b="14995">them</wd>

<space/>

<wd l="3187" t="14837" r="3523" b="14995">into</wd>

<space/>

</run>

<wd l="3605" t="14870" r="4190" b="15038"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">stages</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="4282" t="14837" r="4819" b="14995">which</wd>

<space/>

<wd l="4896" t="14837" r="5462" b="14995">enable</wd>

<space/>

<wd l="5539" t="14837" r="5803" b="14995">the</wd>

<space/>

</run>

</ln>

<ln l="1445" t="15106" r="5803" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="15106" r="2280" b="15264">definition</wd>

<space/>

<wd l="2342" t="15106" r="2534" b="15264">of</wd>

<space/>

<wd l="2582" t="15106" r="3422" b="15307">particular</wd>

<space/>

<wd l="3480" t="15158" r="4320" b="15307">processor</wd>

<space/>

<wd l="4382" t="15158" r="5251" b="15307">sequences</wd>

<space/>

<wd l="5318" t="15106" r="5803" b="15264">while</wd>

<space/>

</ln>

</para>

</column>

<column l="6142" t="1261" r="10524" b="15317">

<para l="6144" t="1320" r="10507" b="3149" alignment="justified" spaceBefore="1" lsp="exactly" lspExact="271" language="en">

<ln l="6154" t="1320" r="10498" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="1320" r="6470" b="1478">still</wd>

<space/>

<wd l="6581" t="1320" r="7210" b="1522">sharing</wd>

<space/>

<wd l="7310" t="1320" r="7574" b="1478">the</wd>

<space/>

<wd l="7680" t="1373" r="8122" b="1478">same</wd>

<space/>

<wd l="8218" t="1320" r="8659" b="1478">basic</wd>

<space/>

<wd l="8765" t="1373" r="9605" b="1522">processor</wd>

<space/>

<wd l="9696" t="1320" r="10498" b="1507">interface,</wd>

<space/>

</ln>

<ln l="6144" t="1594" r="10498" b="1795" baseLine="1742">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="1594" r="6499" b="1752">thus</wd>

<space/>

<wd l="6610" t="1594" r="7526" b="1795">preserving</wd>

<space/>

<wd l="7632" t="1594" r="7901" b="1752">the</wd>

<space/>

<wd l="8006" t="1594" r="8842" b="1795">flexibility</wd>

<space/>

<wd l="8952" t="1594" r="9144" b="1752">of</wd>

<space/>

<wd l="9230" t="1594" r="9499" b="1752">the</wd>

<space/>

</run>

<wd l="9600" t="1594" r="10498" b="1752"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">decorator</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

</ln>

<ln l="6144" t="1862" r="10502" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="1862" r="6902" b="2064">Thereby,</wd>

<space/>

<wd l="6974" t="1862" r="7243" b="2021">the</wd>

<space/>

<wd l="7301" t="1862" r="8064" b="2064">resulting</wd>

<space/>

<wd l="8136" t="1886" r="8890" b="2021">structure</wd>

<space/>

<wd l="8957" t="1862" r="9509" b="2021">allows</wd>

<space/>

<wd l="9576" t="1862" r="9835" b="2021">for</wd>

<space/>

<wd l="9893" t="1862" r="10157" b="2021">the</wd>

<space/>

<wd l="10224" t="1862" r="10502" b="2064">dy-</wd>

</ln>

<ln l="6144" t="2136" r="10502" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2136" r="6672" b="2294">namic</wd>

<space/>

<wd l="6763" t="2136" r="7838" b="2294">construction</wd>

<space/>

<wd l="7920" t="2136" r="8112" b="2294">of</wd>

<space/>

<wd l="8179" t="2136" r="8923" b="2294">different</wd>

<space/>

<wd l="9000" t="2136" r="9706" b="2338">pipeline</wd>

<space/>

<wd l="9787" t="2136" r="10502" b="2338">configu-</wd>

</ln>

<ln l="6144" t="2405" r="10502" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2405" r="6730" b="2563">rations</wd>

<space/>

<wd l="6811" t="2405" r="6998" b="2563">of</wd>

<space/>

<wd l="7051" t="2405" r="7709" b="2606">varying</wd>

<space/>

<wd l="7781" t="2405" r="8750" b="2606">complexity</wd>

<space/>

<wd l="8827" t="2405" r="9134" b="2563">and</wd>

<space/>

<wd l="9206" t="2405" r="9946" b="2563">different</wd>

<space/>

<wd l="10013" t="2405" r="10502" b="2563">levels</wd>

<space/>

</ln>

<ln l="6149" t="2678" r="10507" b="2880" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="2678" r="6341" b="2837">of</wd>

<space/>

<wd l="6398" t="2678" r="7397" b="2866">abstraction,</wd>

<space/>

<wd l="7478" t="2702" r="7762" b="2837">not</wd>

<space/>

<wd l="7824" t="2678" r="8309" b="2880">being</wd>

<space/>

<wd l="8381" t="2678" r="9192" b="2837">restricted</wd>

<space/>

<wd l="9259" t="2702" r="9427" b="2837">to</wd>

<space/>

<wd l="9499" t="2678" r="9763" b="2837">the</wd>

<space/>

<wd l="9835" t="2678" r="10507" b="2880">original</wd>

<space/>

</ln>

<ln l="6154" t="2947" r="6854" b="3149" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="2947" r="6854" b="3149">settings.</wd>

</ln>

</para>

<para l="6144" t="3230" r="10512" b="5554" alignment="justified" spaceBefore="9" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="3230" r="10512" b="3432" baseLine="3379">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6365" t="3230" r="6701" b="3389">The</wd>

<space/>

<wd l="6768" t="3230" r="7733" b="3432">application</wd>

<space/>

<wd l="7795" t="3230" r="7982" b="3389">of</wd>

<space/>

<wd l="8030" t="3230" r="8294" b="3389">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8357" t="3230" r="9096" b="3432">template</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="9163" t="3254" r="9768" b="3432">pattern</wd>

<space/>

<wd l="9830" t="3230" r="10512" b="3389">allowed</wd>

<space/>

</run>

</ln>

<ln l="6144" t="3499" r="10502" b="3701" baseLine="3653" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="3552" r="6331" b="3658">us</wd>

<space/>

<wd l="6394" t="3523" r="6557" b="3658">to</wd>

<space/>

<wd l="6614" t="3499" r="7373" b="3658">factorize</wd>

<space/>

<wd l="7430" t="3523" r="7862" b="3701">great</wd>

<space/>

<wd l="7915" t="3528" r="8256" b="3701">part</wd>

<space/>

<wd l="8314" t="3499" r="8501" b="3658">of</wd>

<space/>

<wd l="8539" t="3499" r="8808" b="3658">the</wd>

<space/>

<wd l="8866" t="3552" r="9624" b="3658">common</wd>

<space/>

<wd l="9677" t="3552" r="10502" b="3701">processes</wd>

<space/>

</ln>

<ln l="6149" t="3773" r="10512" b="3974" baseLine="3922" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="3773" r="6341" b="3931">of</wd>

<space/>

<wd l="6379" t="3773" r="6643" b="3931">the</wd>

<space/>

<wd l="6696" t="3797" r="7790" b="3974">components,</wd>

<space/>

<wd l="7862" t="3773" r="8256" b="3931">such</wd>

<space/>

<wd l="8309" t="3826" r="8477" b="3931">as</wd>

<space/>

<wd l="8534" t="3773" r="8798" b="3931">the</wd>

<space/>

<wd l="8861" t="3773" r="9730" b="3974">sequential</wd>

<space/>

<wd l="9782" t="3773" r="10512" b="3931">iteration</wd>

<space/>

</ln>

<ln l="6144" t="4042" r="10512" b="4243" baseLine="4195" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="4042" r="6826" b="4243">through</wd>

<space/>

<wd l="6922" t="4042" r="7123" b="4200">all</wd>

<space/>

<wd l="7224" t="4042" r="7488" b="4200">the</wd>

<space/>

<wd l="7579" t="4042" r="8030" b="4243">input</wd>

<space/>

<wd l="8122" t="4066" r="8722" b="4229">tweets,</wd>

<space/>

<wd l="8832" t="4042" r="9370" b="4200">which</wd>

<space/>

<wd l="9456" t="4066" r="9883" b="4200">most</wd>

<space/>

<wd l="9974" t="4042" r="10166" b="4200">of</wd>

<space/>

<wd l="10243" t="4042" r="10512" b="4200">the</wd>

<space/>

</ln>

<ln l="6144" t="4315" r="10502" b="4517" baseLine="4464" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="4368" r="7061" b="4517">processors</wd>

<space/>

<wd l="7147" t="4315" r="7891" b="4517">perform.</wd>

<space/>

<wd l="8045" t="4315" r="8424" b="4474">This</wd>

<space/>

<wd l="8510" t="4315" r="9202" b="4474">resulted</wd>

<space/>

<wd l="9278" t="4315" r="9451" b="4469">in</wd>

<space/>

<wd l="9533" t="4368" r="9629" b="4474">a</wd>

<space/>

<wd l="9710" t="4339" r="10142" b="4517">great</wd>

<space/>

<wd l="10219" t="4315" r="10502" b="4474">ho-</wd>

</ln>

<ln l="6144" t="4584" r="10502" b="4786" baseLine="4733" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="4584" r="7334" b="4786">mogenization</wd>

<space/>

<wd l="7402" t="4584" r="7594" b="4742">of</wd>

<space/>

<wd l="7642" t="4584" r="7910" b="4742">the</wd>

<space/>

<wd l="7978" t="4584" r="8429" b="4771">code,</wd>

<space/>

<wd l="8506" t="4584" r="8861" b="4742">thus</wd>

<space/>

<wd l="8942" t="4584" r="9936" b="4786">simplifying</wd>

<space/>

<wd l="10003" t="4584" r="10502" b="4742">main-</wd>

</ln>

<ln l="6144" t="4858" r="10512" b="5059" baseLine="5006" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="4882" r="6811" b="5016">tenance</wd>

<space/>

<wd l="6869" t="4858" r="7176" b="5016">and</wd>

<space/>

<wd l="7234" t="4858" r="7982" b="5059">allowing</wd>

<space/>

<wd l="8035" t="4910" r="8222" b="5016">us</wd>

<space/>

<wd l="8280" t="4882" r="8443" b="5016">to</wd>

<space/>

<wd l="8501" t="4858" r="8962" b="5016">focus</wd>

<space/>

<wd l="9024" t="4910" r="9317" b="5016">our</wd>

<space/>

<wd l="9365" t="4858" r="9917" b="5016">efforts</wd>

<space/>

<wd l="9979" t="4910" r="10195" b="5016">on</wd>

<space/>

<wd l="10243" t="4858" r="10512" b="5016">the</wd>

<space/>

</ln>

<ln l="6154" t="5126" r="10502" b="5328" baseLine="5275" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6154" t="5126" r="6806" b="5328">specific</wd>

<space/>

<wd l="6854" t="5126" r="8227" b="5328">implementation</wd>

<space/>

<wd l="8270" t="5126" r="8462" b="5285">of</wd>

<space/>

<wd l="8486" t="5126" r="8755" b="5285">the</wd>

<space/>

<wd l="8798" t="5126" r="9725" b="5328">processing</wd>

<space/>

<wd l="9773" t="5126" r="10502" b="5285">methods</wd>

<space/>

</ln>

<ln l="6144" t="5395" r="7243" b="5554" baseLine="5549" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5395" r="6317" b="5549">in</wd>

<space/>

<wd l="6374" t="5395" r="6773" b="5554">each</wd>

<space/>

<wd l="6830" t="5448" r="7243" b="5554">case.</wd>

</ln>

</para>

<para l="6144" t="5678" r="10517" b="8318" alignment="justified" spaceBefore="9" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="5678" r="10502" b="5880" baseLine="5827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6365" t="5683" r="7253" b="5866">Moreover,</wd>

<space/>

<wd l="7349" t="5731" r="7795" b="5837">some</wd>

<space/>

<wd l="7867" t="5731" r="8779" b="5880">processors</wd>

<space/>

<wd l="8856" t="5678" r="9326" b="5837">make</wd>

<space/>

<wd l="9398" t="5731" r="9686" b="5837">use</wd>

<space/>

<wd l="9763" t="5678" r="9955" b="5837">of</wd>

<space/>

<wd l="10013" t="5702" r="10502" b="5837">exter-</wd>

</ln>

<ln l="6144" t="5947" r="10512" b="6149" baseLine="6101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5947" r="6408" b="6106">nal</wd>

<space/>

<wd l="6461" t="5947" r="6874" b="6106">tools</wd>

<space/>

<wd l="6936" t="5947" r="7594" b="6149">capable</wd>

<space/>

<wd l="7646" t="5947" r="7838" b="6106">of</wd>

<space/>

<wd l="7872" t="5947" r="8352" b="6149">being</wd>

<space/>

<wd l="8410" t="5947" r="9134" b="6149">changed</wd>

<space/>

<wd l="9182" t="6000" r="9581" b="6106">even</wd>

<space/>

<wd l="9634" t="5971" r="9787" b="6106">at</wd>

<space/>

<wd l="9830" t="5947" r="10512" b="6106">runtime</wd>

<space/>

</ln>

<ln l="6144" t="6221" r="10502" b="6422" baseLine="6370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="6317" r="6365" b="6331">—</wd>

<space/>

<wd l="6418" t="6221" r="7310" b="6422">something</wd>

<space/>

<wd l="7363" t="6221" r="7550" b="6379">of</wd>

<space/>

<wd l="7589" t="6221" r="8184" b="6422">special</wd>

<space/>

<wd l="8227" t="6221" r="8870" b="6379">interest</wd>

<space/>

<wd l="8914" t="6221" r="9082" b="6374">in</wd>

<space/>

<wd l="9125" t="6221" r="10186" b="6422">multilingual</wd>

<space/>

<wd l="10238" t="6274" r="10502" b="6379">en-</wd>

</ln>

<ln l="6144" t="6490" r="10512" b="6691" baseLine="6643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="6490" r="7171" b="6648">vironments.</wd>

<space/>

<wd l="7253" t="6494" r="7392" b="6648">It</wd>

<space/>

<wd l="7454" t="6490" r="8026" b="6648">should</wd>

<space/>

<wd l="8088" t="6490" r="8429" b="6648">also</wd>

<space/>

<wd l="8491" t="6490" r="8698" b="6648">be</wd>

<space/>

<wd l="8755" t="6490" r="9466" b="6691">possible</wd>

<space/>

<wd l="9523" t="6514" r="9691" b="6648">to</wd>

<space/>

<wd l="9749" t="6490" r="10512" b="6691">integrate</wd>

<space/>

</ln>

<ln l="6144" t="6763" r="10517" b="6965" baseLine="6912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="6763" r="6586" b="6922">them</wd>

<space/>

<wd l="6638" t="6763" r="6974" b="6922">into</wd>

<space/>

<wd l="7042" t="6763" r="7493" b="6922">other</wd>

<space/>

<wd l="7550" t="6763" r="8242" b="6922">external</wd>

<space/>

<wd l="8309" t="6787" r="9403" b="6965">components,</wd>

<space/>

<wd l="9480" t="6816" r="9662" b="6922">so</wd>

<space/>

<wd l="9725" t="6763" r="10056" b="6922">that</wd>

<space/>

<wd l="10109" t="6763" r="10517" b="6922">their</wd>

<space/>

</ln>

<ln l="6144" t="7032" r="10502" b="7234" baseLine="7186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="7032" r="6576" b="7234">logic</wd>

<space/>

<wd l="6667" t="7085" r="6965" b="7190">can</wd>

<space/>

<wd l="7051" t="7032" r="7253" b="7190">be</wd>

<space/>

<wd l="7339" t="7032" r="7910" b="7190">reused</wd>

<space/>

<wd l="7992" t="7032" r="8203" b="7234">by</wd>

<space/>

<wd l="8294" t="7032" r="8866" b="7190">others.</wd>

<space/>

<wd l="9029" t="7032" r="9307" b="7186">All</wd>

<space/>

<wd l="9389" t="7032" r="9696" b="7190">this</wd>

<space/>

<wd l="9787" t="7032" r="10502" b="7190">involves</wd>

<space/>

</ln>

<ln l="6149" t="7306" r="10502" b="7507" baseLine="7454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="7306" r="7114" b="7507">decoupling</wd>

<space/>

<wd l="7162" t="7306" r="7426" b="7464">the</wd>

<space/>

<wd l="7474" t="7358" r="8390" b="7507">processors</wd>

<space/>

<wd l="8443" t="7306" r="8870" b="7464">from</wd>

<space/>

<wd l="8914" t="7306" r="9182" b="7464">the</wd>

<space/>

<wd l="9235" t="7306" r="9888" b="7507">specific</wd>

<space/>

<wd l="9941" t="7306" r="10502" b="7507">imple-</wd>

</ln>

<ln l="6144" t="7574" r="10498" b="7776" baseLine="7728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="7574" r="7094" b="7733">mentations</wd>

<space/>

<wd l="7166" t="7574" r="7358" b="7733">of</wd>

<space/>

<wd l="7402" t="7574" r="7666" b="7733">the</wd>

<space/>

<wd l="7733" t="7574" r="8424" b="7733">external</wd>

<space/>

<wd l="8491" t="7598" r="9533" b="7776">components</wd>

<space/>

<wd l="9605" t="7574" r="10498" b="7776">employed,</wd>

<space/>

</ln>

<ln l="6144" t="7848" r="10502" b="8050" baseLine="7997">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="7848" r="6682" b="8006">which</wd>

<space/>

<wd l="6734" t="7901" r="6984" b="8006">we</wd>

<space/>

<wd l="7042" t="7848" r="7445" b="8006">have</wd>

<space/>

<wd l="7502" t="7848" r="8266" b="8006">achieved</wd>

<space/>

<wd l="8318" t="7848" r="8995" b="8050">through</wd>

<space/>

<wd l="9048" t="7848" r="9317" b="8006">the</wd>

<space/>

<wd l="9370" t="7901" r="9658" b="8006">use</wd>

<space/>

<wd l="9720" t="7848" r="9907" b="8006">of</wd>

<space/>

<wd l="9950" t="7848" r="10214" b="8006">the</wd>

<space/>

</run>

<wd l="10277" t="7858" r="10502" b="8006" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">in-</wd>

</ln>

<ln l="6144" t="8117" r="8390" b="8318" baseLine="8266">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="8126" r="6782" b="8275">version</wd>

<space/>

<wd l="6845" t="8122" r="7046" b="8318">of</wd>

<space/>

<wd l="7070" t="8117" r="7685" b="8275">control</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7738" t="8141" r="8390" b="8318">pattern.</wd>

</run>

</ln>

</para>

<para l="6144" t="8400" r="10512" b="11266" alignment="justified" spaceBefore="12" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="8400" r="10502" b="8587" baseLine="8549" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6365" t="8400" r="7498" b="8587">Furthermore,</wd>

<space/>

<wd l="7565" t="8400" r="8918" b="8558">communication</wd>

<space/>

<wd l="8966" t="8400" r="9696" b="8558">between</wd>

<space/>

<wd l="9744" t="8400" r="10013" b="8558">the</wd>

<space/>

<wd l="10066" t="8453" r="10502" b="8558">com-</wd>

</ln>

<ln l="6144" t="8669" r="10512" b="8870" baseLine="8818" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="8693" r="6816" b="8870">ponents</wd>

<space/>

<wd l="6888" t="8669" r="7080" b="8827">of</wd>

<space/>

<wd l="7123" t="8669" r="7392" b="8827">the</wd>

<space/>

<wd l="7450" t="8669" r="8150" b="8870">pipeline</wd>

<space/>

<wd l="8213" t="8669" r="8352" b="8827">is</wd>

<space/>

<wd l="8424" t="8669" r="8842" b="8827">done</wd>

<space/>

<wd l="8899" t="8669" r="9581" b="8870">through</wd>

<space/>

<wd l="9648" t="8669" r="10512" b="8827">structured</wd>

<space/>

</ln>

<ln l="6144" t="8942" r="10507" b="9144" baseLine="9091" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="8966" r="6470" b="9101">text</wd>

<space/>

<wd l="6533" t="8942" r="6936" b="9130">files,</wd>

<space/>

<wd l="7013" t="8942" r="7766" b="9144">allowing</wd>

<space/>

<wd l="7829" t="8995" r="8011" b="9101">us</wd>

<space/>

<wd l="8083" t="8966" r="8246" b="9101">to</wd>

<space/>

<wd l="8318" t="8942" r="8688" b="9144">gain</wd>

<space/>

<wd l="8750" t="8942" r="9590" b="9144">flexibility</wd>

<space/>

<wd l="9658" t="8995" r="9826" b="9101">as</wd>

<space/>

<wd l="9893" t="8995" r="10147" b="9101">we</wd>

<space/>

<wd l="10214" t="8995" r="10507" b="9101">can</wd>

<space/>

</ln>

<ln l="6144" t="9211" r="10507" b="9413" baseLine="9360" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="9211" r="6907" b="9413">integrate</wd>

<space/>

<wd l="6979" t="9211" r="7291" b="9370">and</wd>

<space/>

<wd l="7363" t="9211" r="8179" b="9413">exchange</wd>

<space/>

<wd l="8251" t="9211" r="8640" b="9370">with</wd>

<space/>

<wd l="8712" t="9264" r="9082" b="9370">ease</wd>

<space/>

<wd l="9149" t="9264" r="9504" b="9370">new</wd>

<space/>

<wd l="9576" t="9211" r="10507" b="9413">processing</wd>

<space/>

</ln>

<ln l="6144" t="9480" r="10502" b="9682" baseLine="9634" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="9480" r="6878" b="9638">modules</wd>

<space/>

<wd l="6960" t="9480" r="7834" b="9682">regardless</wd>

<space/>

<wd l="7925" t="9480" r="8112" b="9638">of</wd>

<space/>

<wd l="8174" t="9480" r="8582" b="9638">their</wd>

<space/>

<wd l="8654" t="9480" r="9494" b="9682">particular</wd>

<space/>

<wd l="9566" t="9480" r="10502" b="9682">implemen-</wd>

</ln>

<ln l="6144" t="9754" r="10512" b="9950" baseLine="9902" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="9754" r="6643" b="9912">tation</wd>

<space/>

<wd l="6720" t="9754" r="7392" b="9950">(Vilares</wd>

<space/>

<wd l="7474" t="9778" r="7627" b="9912">et</wd>

<space/>

<wd l="7699" t="9754" r="7949" b="9941">al.,</wd>

<space/>

<wd l="8040" t="9758" r="8587" b="9950">2013).</wd>

<space/>

<wd l="8707" t="9758" r="8890" b="9907">In</wd>

<space/>

<wd l="8957" t="9754" r="9264" b="9912">this</wd>

<space/>

<wd l="9346" t="9806" r="9715" b="9912">case</wd>

<space/>

<wd l="9782" t="9806" r="10037" b="9912">we</wd>

<space/>

<wd l="10109" t="9754" r="10512" b="9912">have</wd>

<space/>

</ln>

<ln l="6144" t="10008" r="10502" b="10224" baseLine="10176">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6144" t="10022" r="6547" b="10181">used</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6595" t="10056" r="7003" b="10176">XML</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7061" t="10022" r="7536" b="10224">along</wd>

<space/>

<wd l="7584" t="10022" r="7973" b="10181">with</wd>

<space/>

<wd l="8021" t="10075" r="8218" b="10181">an</wd>

<space/>

<wd l="8266" t="10022" r="9638" b="10224">implementation</wd>

<space/>

<wd l="9686" t="10022" r="9878" b="10181">of</wd>

<space/>

<wd l="9907" t="10022" r="10176" b="10181">the</wd>

<space/>

</run>

<wd l="10219" t="10022" r="10502" b="10181" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">ab-</wd>

</ln>

<ln l="6144" t="10296" r="10502" b="10498" baseLine="10445">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6144" t="10330" r="6648" b="10454">stract</wd>

<space/>

<wd l="6658" t="10301" r="7306" b="10498">factory</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7358" t="10320" r="7968" b="10498">pattern</wd>

<space/>

<wd l="8016" t="10296" r="8275" b="10454">for</wd>

<space/>

<wd l="8323" t="10296" r="8520" b="10454">its</wd>

<space/>

<wd l="8582" t="10296" r="9658" b="10454">construction</wd>

<space/>

<wd l="9715" t="10296" r="10027" b="10454">and</wd>

<space/>

<wd l="10075" t="10349" r="10502" b="10498">pars-</wd>

</run>

</ln>

<ln l="6144" t="10565" r="10502" b="10766" baseLine="10718" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="10565" r="6466" b="10766">ing.</wd>

<space/>

<wd l="6653" t="10565" r="7037" b="10723">This</wd>

<space/>

<wd l="7138" t="10565" r="7483" b="10723">also</wd>

<space/>

<wd l="7574" t="10565" r="8414" b="10723">facilitates</wd>

<space/>

<wd l="8510" t="10565" r="9226" b="10766">possible</wd>

<space/>

<wd l="9317" t="10565" r="9840" b="10723">future</wd>

<space/>

<wd l="9931" t="10565" r="10502" b="10766">migra-</wd>

</ln>

<ln l="6144" t="10838" r="10512" b="11040" baseLine="10987" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="10838" r="6562" b="10997">tions</wd>

<space/>

<wd l="6634" t="10862" r="6802" b="10997">to</wd>

<space/>

<wd l="6874" t="10838" r="7325" b="10997">other</wd>

<space/>

<wd l="7392" t="10838" r="7752" b="10997">data</wd>

<space/>

<wd l="7814" t="10838" r="9053" b="11040">representation</wd>

<space/>

<wd l="9115" t="10838" r="10032" b="11040">languages,</wd>

<space/>

<wd l="10118" t="10838" r="10512" b="10997">such</wd>

<space/>

</ln>

<ln l="6149" t="11141" r="6883" b="11266" baseLine="11261">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6149" t="11160" r="6322" b="11266">as</wd>

<space/>

</run>

<wd l="6389" t="11141" r="6883" b="11266"><run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">JSON</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="11390" r="10512" b="12946" alignment="justified" spaceBefore="6" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="11390" r="10502" b="11592" baseLine="11539">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6365" t="11390" r="7013" b="11592">Finally,</wd>

<space/>

<wd l="7104" t="11443" r="7358" b="11549">we</wd>

<space/>

<wd l="7435" t="11390" r="7838" b="11549">have</wd>

<space/>

<wd l="7920" t="11390" r="8544" b="11549">created</wd>

<space/>

<wd l="8621" t="11443" r="8717" b="11549">a</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8789" t="11390" r="9528" b="11592">dynamic</wd>

<space/>

<wd l="9610" t="11395" r="10502" b="11592">configura-</wd>

</run>

</ln>

<ln l="6149" t="11645" r="10507" b="11861" baseLine="11813">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6149" t="11669" r="6480" b="11818">tion</wd>

<space/>

<wd l="6528" t="11659" r="7411" b="11861">subsystem</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7454" t="11659" r="7954" b="11818">based</wd>

<space/>

<wd l="8002" t="11712" r="8213" b="11818">on</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8261" t="11693" r="8669" b="11813">XML</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8726" t="11659" r="9077" b="11818">files</wd>

<space/>

<wd l="9125" t="11659" r="9456" b="11818">that</wd>

<space/>

<wd l="9504" t="11659" r="10051" b="11818">allows</wd>

<space/>

<wd l="10104" t="11712" r="10291" b="11818">us</wd>

<space/>

<wd l="10339" t="11683" r="10507" b="11818">to</wd>

<space/>

</run>

</ln>

<ln l="6149" t="11933" r="10512" b="12134" baseLine="12082" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="11933" r="6677" b="12091">define</wd>

<space/>

<wd l="6730" t="11933" r="7037" b="12091">and</wd>

<space/>

<wd l="7080" t="11933" r="7978" b="12091">instantiate</wd>

<space/>

<wd l="8021" t="11933" r="8290" b="12091">the</wd>

<space/>

<wd l="8333" t="11933" r="9173" b="12134">particular</wd>

<space/>

<wd l="9221" t="11957" r="9974" b="12091">structure</wd>

<space/>

<wd l="10022" t="11933" r="10214" b="12091">of</wd>

<space/>

<wd l="10243" t="11933" r="10512" b="12091">the</wd>

<space/>

</ln>

<ln l="6144" t="12202" r="10498" b="12403" baseLine="12355" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="12202" r="6850" b="12403">pipeline</wd>

<space/>

<wd l="6922" t="12254" r="7133" b="12360">on</wd>

<space/>

<wd l="7200" t="12202" r="7733" b="12360">which</wd>

<space/>

<wd l="7800" t="12254" r="8054" b="12360">we</wd>

<space/>

<wd l="8122" t="12226" r="8544" b="12360">want</wd>

<space/>

<wd l="8611" t="12226" r="8774" b="12360">to</wd>

<space/>

<wd l="8846" t="12254" r="9490" b="12403">process</wd>

<space/>

<wd l="9566" t="12202" r="9830" b="12360">the</wd>

<space/>

<wd l="9898" t="12226" r="10498" b="12360">tweets.</wd>

<space/>

</ln>

<ln l="6144" t="12475" r="10512" b="12677" baseLine="12624" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="12475" r="6485" b="12634">The</wd>

<space/>

<wd l="6533" t="12475" r="7483" b="12677">advantages</wd>

<space/>

<wd l="7541" t="12475" r="7733" b="12634">of</wd>

<space/>

<wd l="7771" t="12475" r="8160" b="12634">such</wd>

<space/>

<wd l="8208" t="12528" r="8304" b="12634">a</wd>

<space/>

<wd l="8357" t="12475" r="9259" b="12677">subsystem</wd>

<space/>

<wd l="9302" t="12528" r="9562" b="12634">are</wd>

<space/>

<wd l="9614" t="12475" r="10066" b="12662">clear,</wd>

<space/>

<wd l="10123" t="12475" r="10512" b="12634">both</wd>

<space/>

</ln>

<ln l="6144" t="12744" r="9485" b="12946" baseLine="12893" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="12744" r="6403" b="12902">for</wd>

<space/>

<wd l="6466" t="12768" r="7066" b="12946">system</wd>

<space/>

<wd l="7114" t="12744" r="8434" b="12946">maintainability</wd>

<space/>

<wd l="8496" t="12744" r="8808" b="12902">and</wd>

<space/>

<wd l="8861" t="12744" r="9485" b="12946">testing:</wd>

</ln>

</para>

<para l="6341" t="13262" r="10512" b="14275" alignment="justified" li="504" spaceBefore="245" fli="-288" lsp="exactly" lspExact="271" language="en">

<bullet type="ordered" numChars="3">

</bullet>

<ln l="6341" t="13262" r="10512" b="13464" baseLine="13411" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6341" t="13267" r="6581" b="13411">1.</wd>

<space/>

<wd l="6581" t="13267" r="6715" b="13421">It</wd>

<space/>

<wd l="6806" t="13262" r="7603" b="13464">improves</wd>

<space/>

<wd l="7704" t="13262" r="7973" b="13421">the</wd>

<space/>

<wd l="8064" t="13262" r="9130" b="13464">multilingual</wd>

<space/>

<wd l="9235" t="13291" r="9878" b="13464">support</wd>

<space/>

<wd l="9974" t="13262" r="10166" b="13421">of</wd>

<space/>

<wd l="10243" t="13262" r="10512" b="13421">the</wd>

<space/>

</ln>

<ln l="6590" t="13531" r="10502" b="13733" baseLine="13680" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6590" t="13555" r="7190" b="13733">system</wd>

<space/>

<wd l="7243" t="13531" r="7459" b="13733">by</wd>

<space/>

<wd l="7526" t="13531" r="8266" b="13733">enabling</wd>

<space/>

<wd l="8328" t="13531" r="8592" b="13690">the</wd>

<space/>

<wd l="8654" t="13531" r="9490" b="13690">definition</wd>

<space/>

<wd l="9552" t="13531" r="9739" b="13690">of</wd>

<space/>

<wd l="9787" t="13531" r="10502" b="13733">configu-</wd>

</ln>

<ln l="6581" t="13800" r="10502" b="14002" baseLine="13954" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6581" t="13800" r="7166" b="13958">rations</wd>

<space/>

<wd l="7238" t="13800" r="7570" b="13958">that</wd>

<space/>

<wd l="7627" t="13853" r="7920" b="13958">use</wd>

<space/>

<wd l="7982" t="13853" r="8894" b="14002">processors</wd>

<space/>

<wd l="8971" t="13800" r="9283" b="13958">and</wd>

<space/>

<wd l="9346" t="13853" r="10162" b="13958">resources</wd>

<space/>

<wd l="10238" t="13800" r="10502" b="13958">de-</wd>

</ln>

<ln l="6590" t="14074" r="9389" b="14275" baseLine="14222" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6590" t="14074" r="7152" b="14275">signed</wd>

<space/>

<wd l="7205" t="14074" r="7464" b="14232">for</wd>

<space/>

<wd l="7522" t="14126" r="7618" b="14232">a</wd>

<space/>

<wd l="7666" t="14074" r="8506" b="14275">particular</wd>

<space/>

<wd l="8558" t="14074" r="9389" b="14275">language.</wd>

</ln>

</para>

<para l="6322" t="14563" r="10502" b="15302" alignment="justified" li="504" spaceBefore="224" fli="-288" lsp="exactly" lspExact="267" language="en">

<bullet type="ordered" numChars="3">

</bullet>

<ln l="6322" t="14563" r="10502" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6322" t="14568" r="6581" b="14717">2.</wd>

<space/>

<wd l="6581" t="14568" r="6715" b="14722">It</wd>

<space/>

<wd l="6773" t="14563" r="7325" b="14722">allows</wd>

<space/>

<wd l="7387" t="14563" r="7646" b="14722">for</wd>

<space/>

<wd l="7704" t="14563" r="9115" b="14765">experimentation</wd>

<space/>

<wd l="9168" t="14563" r="9336" b="14717">in</wd>

<space/>

<wd l="9394" t="14616" r="9490" b="14722">a</wd>

<space/>

<wd l="9552" t="14563" r="10166" b="14765">simple,</wd>

<space/>

<wd l="10238" t="14616" r="10502" b="14765">ag-</wd>

</ln>

<ln l="6581" t="14837" r="10502" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6581" t="14837" r="6802" b="14995">ile</wd>

<space/>

<wd l="6864" t="14837" r="7176" b="14995">and</wd>

<space/>

<wd l="7238" t="14837" r="8299" b="14995">documented</wd>

<space/>

<wd l="8366" t="14837" r="8698" b="15034">(the</wd>

<space/>

<wd l="8760" t="14837" r="9922" b="15038">configuration</wd>

<space/>

<wd l="9984" t="14837" r="10258" b="14995">file</wd>

<space/>

<wd l="10315" t="14837" r="10502" b="14995">it-</wd>

</ln>

<ln l="6590" t="15106" r="10301" b="15302" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6590" t="15106" r="6912" b="15264">self</wd>

<space/>

<wd l="6955" t="15106" r="7301" b="15264">also</wd>

<space/>

<wd l="7368" t="15158" r="7891" b="15264">serves</wd>

<space/>

<wd l="7958" t="15158" r="8126" b="15264">as</wd>

<space/>

<wd l="8194" t="15106" r="9552" b="15302">documentation)</wd>

<space/>

<wd l="9614" t="15158" r="10301" b="15264">manner.</wd>

</ln>

</para>

</column>

</section>

<dd l="1440" t="15746" r="10524" b="15975">

<para l="5771" t="15792" r="6200" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15792" r="6134" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="30">

<wd l="5837" t="15792" r="6134" b="15946">100</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4315.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1433" marginTop="2026" marginRight="1378" marginBottom="1292" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<dd l="6144" t="1261" r="10531" b="2072">

<para l="6581" t="1320" r="10512" b="2021" alignment="justified" li="432" spaceBefore="1" lsp="exactly" lspExact="265" language="en">

<ln l="6586" t="1320" r="10502" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="1373" r="6802" b="1478">on</wd>

<space/>

<wd l="6874" t="1320" r="7138" b="1478">the</wd>

<space/>

<wd l="7214" t="1320" r="8194" b="1522">Metaphone</wd>

<space/>

<wd l="8275" t="1320" r="9120" b="1522">algorithm</wd>

<space/>

<wd l="9202" t="1320" r="9912" b="1522">(Philips,</wd>

<space/>

<wd l="10027" t="1325" r="10502" b="1517">1990)</wd>

<space/>

</ln>

<ln l="6586" t="1594" r="10512" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="1594" r="6898" b="1752">and</wd>

<space/>

<wd l="6960" t="1646" r="7056" b="1752">a</wd>

<space/>

<wd l="7114" t="1646" r="7469" b="1752">new</wd>

<space/>

<wd l="7536" t="1594" r="8227" b="1795">Spanish</wd>

<space/>

<wd l="8290" t="1594" r="9168" b="1795">dictionary</wd>

<space/>

<wd l="9235" t="1594" r="10027" b="1752">extracted</wd>

<space/>

<wd l="10085" t="1594" r="10512" b="1752">from</wd>

<space/>

</ln>

<ln l="6581" t="1829" r="8554" b="2021" baseLine="2008">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6581" t="1862" r="7546" b="2021">Wikimedia</wd>

<space/>

</run>

<wd l="7598" t="1829" r="8554" b="2021"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">resources.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</dd>

<dd l="1618" t="1261" r="5798" b="1798">

<para l="1618" t="1320" r="5794" b="1752" alignment="left" li="216" fli="-216" lsp="exactly" lspExact="262" language="en">

<ln l="1618" t="1320" r="5794" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1618" t="1325" r="1766" b="1478">3.</wd>

<space/>

<wd l="1877" t="1325" r="2011" b="1478">It</wd>

<space/>

<wd l="2078" t="1320" r="2630" b="1478">avoids</wd>

<space/>

<wd l="2702" t="1320" r="2966" b="1478">the</wd>

<space/>

<wd l="3034" t="1320" r="3830" b="1522">necessity</wd>

<space/>

<wd l="3902" t="1320" r="4094" b="1478">of</wd>

<space/>

<wd l="4147" t="1320" r="5054" b="1522">modifying</wd>

<space/>

<wd l="5122" t="1320" r="5386" b="1478">the</wd>

<space/>

<wd l="5462" t="1373" r="5794" b="1522">sys-</wd>

</ln>

<ln l="1877" t="1594" r="3336" b="1752" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="1618" r="2208" b="1752">tem</wd>

<space/>

<wd l="2266" t="1646" r="2827" b="1752">source</wd>

<space/>

<wd l="2885" t="1594" r="3336" b="1752">code.</wd>

</ln>

</para>

</dd>

<section l="1433" t="2026" r="10531" b="15354">

<column l="1433" t="2026" r="5820" b="15354">

<para l="1440" t="2040" r="5165" b="2242" alignment="left" lsp="exactly" lspExact="225" language="en">

<ln l="1440" t="2040" r="5165" b="2242" baseLine="2189" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="1440" t="2040" r="1709" b="2198">2.2</wd>

<space/>

<wd l="1939" t="2040" r="3240" b="2242">Configuration</wd>

<space/>

<wd l="3293" t="2040" r="3878" b="2198">before</wd>

<space/>

<wd l="3936" t="2045" r="4670" b="2198">W-NUT</wd>

<space/>

<wd l="4733" t="2040" r="5165" b="2198">2015</wd>

</ln>

</para>

<para l="1440" t="2390" r="5808" b="6115" alignment="justified" spaceBefore="87" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="2390" r="5808" b="2592" baseLine="2539" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2390" r="1781" b="2549">The</wd>

<space/>

<wd l="1877" t="2414" r="2491" b="2549">current</wd>

<space/>

<wd l="2582" t="2443" r="3422" b="2592">processor</wd>

<space/>

<wd l="3518" t="2390" r="4675" b="2592">configuration</wd>

<space/>

<wd l="4766" t="2390" r="5026" b="2549">for</wd>

<space/>

<wd l="5122" t="2390" r="5808" b="2592">Spanish</wd>

<space/>

</ln>

<ln l="1440" t="2659" r="5808" b="2818" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2683" r="1915" b="2818">tweet</wd>

<space/>

<wd l="2011" t="2659" r="3226" b="2818">normalization</wd>

<space/>

<wd l="3326" t="2659" r="3936" b="2818">derives</wd>

<space/>

<wd l="4042" t="2659" r="4469" b="2818">from</wd>

<space/>

<wd l="4565" t="2659" r="4896" b="2818">that</wd>

<space/>

<wd l="4997" t="2712" r="5304" b="2818">one</wd>

<space/>

<wd l="5405" t="2659" r="5808" b="2818">used</wd>

<space/>

</ln>

<ln l="1440" t="2933" r="5803" b="3134" baseLine="3082" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2933" r="1656" b="3134">by</wd>

<space/>

<wd l="1723" t="2933" r="1992" b="3091">the</wd>

<space/>

<wd l="2059" t="2933" r="2563" b="3091">initial</wd>

<space/>

<wd l="2635" t="2957" r="3470" b="3134">prototype</wd>

<space/>

<wd l="3538" t="2933" r="3797" b="3091">for</wd>

<space/>

<wd l="3859" t="2933" r="4056" b="3091">its</wd>

<space/>

<wd l="4133" t="2933" r="5237" b="3134">participation</wd>

<space/>

<wd l="5304" t="2933" r="5472" b="3086">in</wd>

<space/>

<wd l="5539" t="2933" r="5803" b="3091">the</wd>

<space/>

</ln>

<ln l="1440" t="3202" r="5803" b="3403" baseLine="3354" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3206" r="2482" b="3360">TweetNorm</wd>

<space/>

<wd l="2549" t="3206" r="2966" b="3360">2013</wd>

<space/>

<wd l="3043" t="3202" r="3394" b="3360">task</wd>

<space/>

<wd l="3470" t="3202" r="4186" b="3403">(Alegria</wd>

<space/>

<wd l="4253" t="3226" r="4406" b="3360">et</wd>

<space/>

<wd l="4474" t="3202" r="4723" b="3389">al.,</wd>

<space/>

<wd l="4810" t="3206" r="5357" b="3398">2013).</wd>

<space/>

<wd l="5467" t="3202" r="5803" b="3360">The</wd>

<space/>

</ln>

<ln l="1445" t="3475" r="5803" b="3677" baseLine="3624" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="3475" r="2078" b="3677">general</wd>

<space/>

<wd l="2174" t="3475" r="3043" b="3677">procedure</wd>

<space/>

<wd l="3134" t="3475" r="3658" b="3634">works</wd>

<space/>

<wd l="3754" t="3475" r="4080" b="3634">like</wd>

<space/>

<wd l="4171" t="3475" r="4526" b="3634">this:</wd>

<space/>

<wd l="4690" t="3475" r="5222" b="3677">firstly,</wd>

<space/>

<wd l="5333" t="3475" r="5803" b="3677">using</wd>

<space/>

</ln>

<ln l="1440" t="3744" r="5794" b="3946" baseLine="3898" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3797" r="2352" b="3946">processors</wd>

<space/>

<wd l="2458" t="3768" r="2626" b="3902">to</wd>

<space/>

<wd l="2726" t="3797" r="3379" b="3946">prepare</wd>

<space/>

<wd l="3475" t="3744" r="3744" b="3902">the</wd>

<space/>

<wd l="3840" t="3744" r="4291" b="3946">input</wd>

<space/>

<wd l="4397" t="3744" r="5794" b="3946">(preprocessing);</wd>

<space/>

</ln>

<ln l="1450" t="4018" r="5803" b="4219" baseLine="4166" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="4018" r="2246" b="4219">secondly,</wd>

<space/>

<wd l="2371" t="4018" r="3293" b="4219">employing</wd>

<space/>

<wd l="3394" t="4018" r="3854" b="4176">those</wd>

<space/>

<wd l="3950" t="4018" r="4507" b="4176">whose</wd>

<space/>

<wd l="4603" t="4070" r="5294" b="4219">purpose</wd>

<space/>

<wd l="5395" t="4018" r="5530" b="4176">is</wd>

<space/>

<wd l="5635" t="4042" r="5803" b="4176">to</wd>

<space/>

</ln>

<ln l="1445" t="4286" r="5794" b="4488" baseLine="4435" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="4286" r="1987" b="4445">obtain</wd>

<space/>

<wd l="2059" t="4339" r="2410" b="4445">new</wd>

<space/>

<wd l="2486" t="4286" r="3701" b="4445">normalization</wd>

<space/>

<wd l="3773" t="4286" r="4272" b="4445">forms</wd>

<space/>

<wd l="4363" t="4286" r="5338" b="4483">(candidates</wd>

<space/>

<wd l="5424" t="4339" r="5794" b="4488">gen-</wd>

</ln>

<ln l="1445" t="4560" r="5794" b="4762" baseLine="4709" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="4560" r="2165" b="4757">eration);</wd>

<space/>

<wd l="2270" t="4560" r="2880" b="4762">thirdly,</wd>

<space/>

<wd l="2976" t="4560" r="3446" b="4762">using</wd>

<space/>

<wd l="3528" t="4560" r="3989" b="4718">those</wd>

<space/>

<wd l="4070" t="4560" r="4238" b="4714">in</wd>

<space/>

<wd l="4325" t="4560" r="4896" b="4762">charge</wd>

<space/>

<wd l="4978" t="4560" r="5170" b="4718">of</wd>

<space/>

<wd l="5246" t="4560" r="5794" b="4718">select-</wd>

</ln>

<ln l="1440" t="4829" r="5794" b="5030" baseLine="4978" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="4829" r="1714" b="5030">ing</wd>

<space/>

<wd l="1786" t="4882" r="1968" b="4987">or</wd>

<space/>

<wd l="2026" t="4829" r="2712" b="5030">filtering</wd>

<space/>

<wd l="2774" t="4829" r="3038" b="4987">the</wd>

<space/>

<wd l="3101" t="4829" r="3456" b="4987">best</wd>

<space/>

<wd l="3514" t="4829" r="4728" b="4987">normalization</wd>

<space/>

<wd l="4786" t="4829" r="5290" b="4987">forms</wd>

<space/>

<wd l="5366" t="4834" r="5794" b="5026">(can-</wd>

</ln>

<ln l="1445" t="5098" r="5803" b="5299" baseLine="5251" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="5098" r="1973" b="5256">didate</wd>

<space/>

<wd l="2074" t="5098" r="3715" b="5299">filtering/selection);</wd>

<space/>

<wd l="3850" t="5098" r="4162" b="5256">and</wd>

<space/>

<wd l="4258" t="5098" r="4757" b="5299">lastly,</wd>

<space/>

<wd l="4877" t="5098" r="5803" b="5299">employing</wd>

<space/>

</ln>

<ln l="1440" t="5371" r="5808" b="5573" baseLine="5520" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5371" r="1901" b="5530">those</wd>

<space/>

<wd l="1958" t="5371" r="2491" b="5530">which</wd>

<space/>

<wd l="2549" t="5424" r="3202" b="5573">prepare</wd>

<space/>

<wd l="3259" t="5371" r="3523" b="5530">the</wd>

<space/>

<wd l="3586" t="5371" r="3965" b="5530">final</wd>

<space/>

<wd l="4027" t="5395" r="4584" b="5573">output</wd>

<space/>

<wd l="4642" t="5371" r="4834" b="5530">of</wd>

<space/>

<wd l="4877" t="5371" r="5141" b="5530">the</wd>

<space/>

<wd l="5208" t="5395" r="5808" b="5573">system</wd>

<space/>

</ln>

<ln l="1450" t="5640" r="5794" b="5842" baseLine="5794" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="5640" r="2923" b="5842">(postprocessing).</wd>

<space/>

<wd l="3034" t="5640" r="3466" b="5798">Such</wd>

<space/>

<wd l="3538" t="5664" r="3984" b="5842">setup</wd>

<space/>

<wd l="4051" t="5640" r="4771" b="5798">includes</wd>

<space/>

<wd l="4838" t="5640" r="5107" b="5798">the</wd>

<space/>

<wd l="5170" t="5640" r="5794" b="5798">follow-</wd>

</ln>

<ln l="1440" t="5914" r="2736" b="6115" baseLine="6062" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5914" r="1714" b="6115">ing</wd>

<space/>

<wd l="1771" t="5966" r="2736" b="6115">processors:</wd>

</ln>

</para>

<para l="1675" t="6355" r="5808" b="8146" alignment="justified" li="432" spaceBefore="184" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="6360" r="5803" b="6557" baseLine="6509">

<wd l="1675" t="6389" r="1882" b="6509">•</wd>

<tab position="1742"/>

<wd l="1882" t="6374" r="4147" b="6557"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">FreelingProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><space/>

<wd l="4296" t="6360" r="4834" b="6518">which</wd>

<space/>

<wd l="4954" t="6360" r="5405" b="6518">reads</wd>

<space/>

<wd l="5539" t="6360" r="5803" b="6518">the</wd>

<space/>

</run>

</ln>

<ln l="1877" t="6629" r="5808" b="6830" baseLine="6782" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1877" t="6629" r="2328" b="6830">input</wd>

<space/>

<wd l="2434" t="6629" r="2798" b="6787">data</wd>

<space/>

<wd l="2899" t="6629" r="3067" b="6782">in</wd>

<space/>

<wd l="3173" t="6629" r="3437" b="6787">the</wd>

<space/>

<wd l="3542" t="6634" r="4584" b="6787">TweetNorm</wd>

<space/>

<wd l="4690" t="6634" r="5107" b="6787">2013</wd>

<space/>

<wd l="5222" t="6629" r="5808" b="6787">format</wd>

<space/>

</ln>

<ln l="1882" t="6902" r="5794" b="7104" baseLine="7051">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="1882" t="6902" r="2194" b="7061">and</wd>

<space/>

<wd l="2237" t="6955" r="2606" b="7061">uses</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="2664" t="6917" r="3701" b="7099">Freeling</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="3763" t="6902" r="4330" b="7099">(Padró</wd>

<space/>

<wd l="4382" t="6902" r="4694" b="7061">and</wd>

<space/>

<wd l="4747" t="6902" r="5794" b="7104">Stanilovsky,</wd>

<space/>

</run>

</ln>

<ln l="1882" t="7171" r="5794" b="7373" baseLine="7325" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1882" t="7176" r="2376" b="7368">2012)</wd>

<space/>

<wd l="2458" t="7195" r="2626" b="7330">to</wd>

<space/>

<wd l="2698" t="7171" r="3403" b="7373">perform</wd>

<space/>

<wd l="3470" t="7171" r="3739" b="7330">the</wd>

<space/>

<wd l="3811" t="7171" r="4930" b="7358">tokenization,</wd>

<space/>

<wd l="5016" t="7171" r="5794" b="7330">lemmati-</wd>

</ln>

<ln l="1882" t="7445" r="5798" b="7646" baseLine="7594" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1882" t="7445" r="2410" b="7603">zation</wd>

<space/>

<wd l="2482" t="7445" r="2789" b="7603">and</wd>

<space/>

<wd l="2856" t="7450" r="3245" b="7603">POS</wd>

<space/>

<wd l="3322" t="7445" r="3970" b="7646">tagging</wd>

<space/>

<wd l="4051" t="7445" r="4877" b="7646">(although</wd>

<space/>

<wd l="4939" t="7445" r="5390" b="7603">these</wd>

<space/>

<wd l="5453" t="7469" r="5798" b="7646">tags</wd>

<space/>

</ln>

<ln l="1882" t="7714" r="5803" b="7915" baseLine="7867" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1882" t="7766" r="2141" b="7872">are</wd>

<space/>

<wd l="2237" t="7738" r="2515" b="7872">not</wd>

<space/>

<wd l="2616" t="7714" r="3394" b="7915">currently</wd>

<space/>

<wd l="3490" t="7714" r="3662" b="7867">in</wd>

<space/>

<wd l="3754" t="7718" r="4109" b="7910">use)</wd>

<space/>

<wd l="4214" t="7714" r="4406" b="7872">of</wd>

<space/>

<wd l="4488" t="7714" r="4752" b="7872">the</wd>

<space/>

<wd l="4848" t="7738" r="5170" b="7872">text</wd>

<space/>

<wd l="5270" t="7714" r="5458" b="7872">of</wd>

<space/>

<wd l="5539" t="7714" r="5803" b="7872">the</wd>

<space/>

</ln>

<ln l="1877" t="7997" r="2390" b="8146" baseLine="8136" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1877" t="8011" r="2390" b="8146">tweet.</wd>

</ln>

</para>

<para l="1675" t="8443" r="4013" b="8616" alignment="justified" li="432" spaceBefore="174" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="8443" r="4013" b="8616" baseLine="8578">

<wd l="1675" t="8458" r="1877" b="8578">•</wd>

<tab position="1742"/>

<wd l="1877" t="8443" r="4013" b="8616"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="23">MentionProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="23">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="23"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1877" t="8717" r="5808" b="9672" alignment="justified" li="432" spaceBefore="2" lsp="exactly" lspExact="270" language="en">

<ln l="1886" t="8717" r="5794" b="8894" baseLine="8851">

<wd l="1886" t="8717" r="4013" b="8894"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">HashtagProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4238" t="8726" r="5794" b="8856">URLProcessor</wd>

<space/>

</run>

</ln>

<ln l="1882" t="8971" r="5798" b="9168" baseLine="9120">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1882" t="8971" r="2194" b="9130">and</wd>

<space/>

</run>

<wd l="2362" t="8986" r="4349" b="9168"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">SmileyProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4536" t="8971" r="5069" b="9130">which</wd>

<space/>

<wd l="5222" t="8995" r="5477" b="9130">act</wd>

<space/>

<wd l="5630" t="9024" r="5798" b="9130">as</wd>

<space/>

</run>

</ln>

<ln l="1882" t="9240" r="5808" b="9398" baseLine="9394">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1882" t="9240" r="2366" b="9398">filters</wd>

<space/>

<wd l="2448" t="9240" r="2707" b="9398">for</wd>

<space/>

</run>

<wd l="2789" t="9274" r="3259" b="9398"><run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">OOV</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">s</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3341" t="9293" r="3595" b="9398">we</wd>

<space/>

<wd l="3677" t="9240" r="3888" b="9398">do</wd>

<space/>

<wd l="3970" t="9264" r="4248" b="9398">not</wd>

<space/>

<wd l="4320" t="9264" r="4747" b="9398">want</wd>

<space/>

<wd l="4819" t="9264" r="4987" b="9398">to</wd>

<space/>

<wd l="5069" t="9240" r="5808" b="9398">consider</wd>

<space/>

</run>

</ln>

<ln l="1877" t="9514" r="3442" b="9672" baseLine="9662" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="9514" r="2136" b="9672">for</wd>

<space/>

<wd l="2184" t="9514" r="3442" b="9672">normalization.</wd>

</ln>

</para>

<para l="1675" t="9950" r="5808" b="10699" alignment="justified" li="432" spaceBefore="174" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="9955" r="5798" b="10152" baseLine="10104">

<wd l="1675" t="9984" r="1886" b="10104">•</wd>

<tab position="1742"/>

<wd l="1886" t="9974" r="4013" b="10152"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">LaughESProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><space/>

<wd l="4181" t="9955" r="4714" b="10114">which</wd>

<space/>

<wd l="4848" t="9955" r="5798" b="10114">normalizes</wd>

<space/>

</run>

</ln>

<ln l="1877" t="10224" r="5808" b="10426" baseLine="10373" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1877" t="10224" r="2362" b="10426">laugh</wd>

<space/>

<wd l="2472" t="10224" r="2957" b="10426">string</wd>

<space/>

<wd l="3058" t="10224" r="4426" b="10426">representations,</wd>

<space/>

<wd l="4550" t="10277" r="4718" b="10382">as</wd>

<space/>

<wd l="4829" t="10224" r="5002" b="10378">in</wd>

<space/>

<wd l="5102" t="10224" r="5443" b="10426">“ja”</wd>

<space/>

<wd l="5549" t="10224" r="5808" b="10382">for</wd>

<space/>

</ln>

<ln l="1882" t="10498" r="2587" b="10699" baseLine="10646" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1882" t="10498" r="2587" b="10699">“jajaja”.</wd>

</ln>

</para>

<para l="1675" t="10934" r="5798" b="11683" alignment="justified" li="432" spaceBefore="213" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="10939" r="5794" b="11141" baseLine="11088">

<wd l="1675" t="10968" r="1882" b="11088">•</wd>

<tab position="1742"/>

<wd l="1882" t="10954" r="4147" b="11126"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">PhoneticProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4219" t="10939" r="4752" b="11098">which</wd>

<space/>

<wd l="4814" t="10992" r="5179" b="11098">uses</wd>

<space/>

<wd l="5251" t="10992" r="5347" b="11098">a</wd>

<space/>

<wd l="5405" t="10939" r="5794" b="11141">pho-</wd>

</run>

</ln>

<ln l="1877" t="11208" r="5798" b="11410" baseLine="11357" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="11208" r="2294" b="11366">netic</wd>

<space/>

<wd l="2347" t="11208" r="2770" b="11366">table</wd>

<space/>

<wd l="2818" t="11232" r="2986" b="11366">to</wd>

<space/>

<wd l="3034" t="11261" r="3408" b="11410">map</wd>

<space/>

<wd l="3466" t="11208" r="4334" b="11366">characters</wd>

<space/>

<wd l="4392" t="11232" r="4555" b="11366">to</wd>

<space/>

<wd l="4608" t="11208" r="5011" b="11366">their</wd>

<space/>

<wd l="5054" t="11208" r="5798" b="11410">phonetic</wd>

<space/>

</ln>

<ln l="1882" t="11443" r="5400" b="11683" baseLine="11626">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1882" t="11482" r="2774" b="11683">equivalent</wd>

<space/>

<wd l="2837" t="11482" r="3456" b="11683">strings,</wd>

<space/>

<wd l="3528" t="11482" r="3922" b="11640">such</wd>

<space/>

<wd l="3979" t="11534" r="4147" b="11640">as</wd>

<space/>

<wd l="4214" t="11486" r="4507" b="11635">“x”</wd>

<space/>

<wd l="4570" t="11506" r="4733" b="11640">to</wd>

<space/>

</run>

<wd l="4795" t="11443" r="5400" b="11683"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">“por”.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1675" t="11923" r="5808" b="12893" alignment="justified" li="432" spaceBefore="134" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<tabs position="1675"/>

<ln l="1675" t="11923" r="5808" b="12120" baseLine="12072" forcedEOF="true">

<wd l="1675" t="11947" r="1896" b="12072">•</wd>

<tab position="1745"/>

<wd l="1896" t="11938" r="4800" b="12120"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">SMSDictionaryProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><tab position="4800"/>

<wd l="5270" t="11923" r="5808" b="12082">which</wd>

</run>

</ln>

<ln l="1877" t="12192" r="5789" b="12350" baseLine="12341" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1877" t="12192" r="2342" b="12350">looks</wd>

<space/>

<wd l="2400" t="12192" r="2659" b="12350">for</wd>

<space/>

<wd l="2707" t="12192" r="3922" b="12350">normalization</wd>

<space/>

<wd l="3974" t="12192" r="4886" b="12350">candidates</wd>

<space/>

<wd l="4944" t="12192" r="5117" b="12346">in</wd>

<space/>

<wd l="5170" t="12245" r="5366" b="12350">an</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="5434" t="12226" r="5789" b="12350">SMS</wd>

<space/>

</run>

</ln>

<ln l="1882" t="12466" r="5794" b="12667" baseLine="12614" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3" forcedEOF="true">

<wd l="1882" t="12466" r="2789" b="12667">dictionary,</wd>

<space/>

<wd l="2875" t="12466" r="3134" b="12624">for</wd>

<space/>

<wd l="3202" t="12466" r="3931" b="12667">example</wd>

<space/>

<wd l="4008" t="12466" r="4896" b="12624">“también”</wd>

<space/>

<wd l="4978" t="12466" r="5794" b="12662">(too/also)</wd>

<space/>

</ln>

<ln l="1877" t="12734" r="2592" b="12893" baseLine="12883" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3" forcedEOF="true">

<wd l="1877" t="12734" r="2136" b="12893">for</wd>

<space/>

<wd l="2189" t="12734" r="2592" b="12893">“tb”.</wd>

</ln>

</para>

<para l="1675" t="13171" r="5808" b="14731" alignment="justified" li="432" spaceBefore="180" spaceAfter="93" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="13176" r="5794" b="13373" baseLine="13325">

<wd l="1675" t="13205" r="1877" b="13325">•</wd>

<tab position="1742"/>

<wd l="1877" t="13195" r="3883" b="13373"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">AspellProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="4037" t="13176" r="4570" b="13334">which</wd>

<space/>

<wd l="4699" t="13176" r="5314" b="13334">obtains</wd>

<space/>

<wd l="5448" t="13229" r="5794" b="13334">nor-</wd>

</run>

</ln>

<ln l="1877" t="13450" r="5808" b="13651" baseLine="13598" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="13450" r="2798" b="13608">malization</wd>

<space/>

<wd l="2856" t="13450" r="3763" b="13608">candidates</wd>

<space/>

<wd l="3821" t="13450" r="4291" b="13651">using</wd>

<space/>

<wd l="4349" t="13450" r="4613" b="13608">the</wd>

<space/>

<wd l="4675" t="13450" r="5069" b="13651">spell</wd>

<space/>

<wd l="5136" t="13450" r="5808" b="13608">checker</wd>

<space/>

</ln>

<ln l="1891" t="13718" r="5798" b="13920" baseLine="13867">

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1891" t="13738" r="2645" b="13915">aspell</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2774" t="13718" r="3451" b="13920">(Aspell,</wd>

<space/>

<wd l="3581" t="13723" r="4128" b="13915">2011),</wd>

<space/>

<wd l="4258" t="13771" r="4430" b="13877">as</wd>

<space/>

<wd l="4541" t="13718" r="4709" b="13872">in</wd>

<space/>

<wd l="4814" t="13718" r="5798" b="13920">“polémica”</wd>

<space/>

</run>

</ln>

<ln l="1886" t="13987" r="5803" b="14189" baseLine="14141" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1886" t="13992" r="3034" b="14189">(controversy)</wd>

<space/>

<wd l="3149" t="13987" r="3408" b="14146">for</wd>

<space/>

<wd l="3509" t="13987" r="4454" b="14189">“polemik”.</wd>

<space/>

<wd l="4680" t="13992" r="4814" b="14146">It</wd>

<space/>

<wd l="4925" t="13987" r="5496" b="14146">should</wd>

<space/>

<wd l="5602" t="13987" r="5803" b="14146">be</wd>

<space/>

</ln>

<ln l="1877" t="14261" r="5808" b="14419" baseLine="14410" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="14261" r="2362" b="14419">noted</wd>

<space/>

<wd l="2491" t="14261" r="2818" b="14419">that</wd>

<space/>

<wd l="2947" t="14261" r="3254" b="14419">this</wd>

<space/>

<wd l="3394" t="14261" r="3730" b="14419">tool</wd>

<space/>

<wd l="3864" t="14261" r="4142" b="14419">has</wd>

<space/>

<wd l="4282" t="14261" r="4694" b="14419">been</wd>

<space/>

<wd l="4829" t="14261" r="5808" b="14419">customised</wd>

<space/>

</ln>

<ln l="1877" t="14530" r="5808" b="14731" baseLine="14683" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="14530" r="2266" b="14688">with</wd>

<space/>

<wd l="2328" t="14582" r="2424" b="14688">a</wd>

<space/>

<wd l="2482" t="14582" r="2832" b="14688">new</wd>

<space/>

<wd l="2894" t="14530" r="3643" b="14731">phonetic</wd>

<space/>

<wd l="3706" t="14530" r="4128" b="14688">table</wd>

<space/>

<wd l="4190" t="14530" r="4450" b="14688">for</wd>

<space/>

<wd l="4507" t="14530" r="5237" b="14731">Spanish,</wd>

<space/>

<wd l="5309" t="14530" r="5808" b="14688">based</wd>

</ln>

</para>

<rulerline l="1433" t="14846" r="2640" b="14846" type="single" width="10" color="000000"/>

<para l="1445" t="14904" r="5798" b="15302" alignment="justified" spaceBefore="66" spaceAfter="38" fli="216" lsp="exactly" lspExact="203" language="en">

<ln l="1704" t="14904" r="5798" b="15106" baseLine="15056">

<wd l="1704" t="14904" r="2040" b="15067"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">The</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2107" t="14938" r="2770" b="15067">character</wd>

<space/>

<wd l="2842" t="14938" r="3077" b="15062">“x”</wd>

<space/>

<wd l="3149" t="14938" r="3859" b="15067">resembles</wd>

<space/>

<wd l="3936" t="14938" r="4152" b="15067">the</wd>

<space/>

<wd l="4224" t="14938" r="5232" b="15106">multiplication</wd>

<space/>

<wd l="5304" t="14938" r="5798" b="15096">(times)</wd>

<space/>

</run>

</ln>

<ln l="1445" t="15134" r="4440" b="15302" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="15134" r="1742" b="15302">sign</wd>

<space/>

</run>

<wd l="1810" t="15168" r="1963" b="15288"><run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">×</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2016" t="15134" r="2458" b="15264">which</wd>

<space/>

<wd l="2501" t="15134" r="2640" b="15259">in</wd>

<space/>

<wd l="2688" t="15134" r="3254" b="15302">Spanish</wd>

<space/>

<wd l="3298" t="15134" r="3408" b="15264">is</wd>

<space/>

<wd l="3461" t="15134" r="3773" b="15264">read</wd>

<space/>

<wd l="3821" t="15173" r="3955" b="15264">as</wd>

<space/>

<wd l="4013" t="15134" r="4440" b="15302">“por”.</wd>

</run>

</ln>

</para>

</column>

<column l="6144" t="2072" r="10531" b="15354">

<para l="6581" t="2290" r="10526" b="3840" alignment="justified" li="432" spaceBefore="161" lsp="exactly" lspExact="270" language="en">

<ln l="6581" t="2290" r="10512" b="2477" baseLine="2443">

<wd l="6581" t="2304" r="8722" b="2477"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">AffixESProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="8774" t="2290" r="9312" b="2448">which</wd>

<space/>

<wd l="9350" t="2290" r="10142" b="2448">identifies</wd>

<space/>

<wd l="10200" t="2290" r="10512" b="2448">and</wd>

<space/>

</run>

</ln>

<ln l="6581" t="2563" r="10526" b="2765" baseLine="2712" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6581" t="2563" r="7531" b="2722">normalizes</wd>

<space/>

<wd l="7666" t="2563" r="8774" b="2722">affix-derived</wd>

<space/>

<wd l="8894" t="2563" r="9581" b="2765">Spanish</wd>

<space/>

<wd l="9701" t="2563" r="10200" b="2722">forms</wd>

<space/>

<wd l="10334" t="2563" r="10526" b="2722">of</wd>

<space/>

</ln>

<ln l="6581" t="2832" r="10502" b="3034" baseLine="2981" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6581" t="2832" r="6970" b="2990">base</wd>

<space/>

<wd l="7037" t="2832" r="7613" b="3019">words,</wd>

<space/>

<wd l="7699" t="2832" r="8040" b="2990">also</wd>

<space/>

<wd l="8122" t="2832" r="9038" b="3034">supporting</wd>

<space/>

<wd l="9110" t="2832" r="10018" b="3034">phonetical</wd>

<space/>

<wd l="10085" t="2832" r="10502" b="2990">writ-</wd>

</ln>

<ln l="6581" t="3106" r="10507" b="3307" baseLine="3254" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6581" t="3106" r="6902" b="3307">ing,</wd>

<space/>

<wd l="6965" t="3158" r="7133" b="3264">as</wd>

<space/>

<wd l="7186" t="3106" r="7358" b="3259">in</wd>

<space/>

<wd l="7397" t="3106" r="7666" b="3264">the</wd>

<space/>

<wd l="7714" t="3158" r="8083" b="3264">case</wd>

<space/>

<wd l="8131" t="3106" r="8323" b="3264">of</wd>

<space/>

<wd l="8357" t="3106" r="9197" b="3307">“chikiyo”</wd>

<space/>

<wd l="9245" t="3106" r="9504" b="3264">for</wd>

<space/>

<wd l="9547" t="3106" r="10507" b="3307">“chiquillo”</wd>

<space/>

</ln>

<ln l="6590" t="3374" r="10512" b="3576" baseLine="3523" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6590" t="3374" r="7056" b="3571">(little</wd>

<space/>

<wd l="7138" t="3374" r="7579" b="3576">boy),</wd>

<space/>

<wd l="7685" t="3374" r="8434" b="3533">obtained</wd>

<space/>

<wd l="8515" t="3374" r="8942" b="3533">from</wd>

<space/>

<wd l="9029" t="3374" r="9686" b="3533">“chico”</wd>

<space/>

<wd l="9773" t="3374" r="10162" b="3533">with</wd>

<space/>

<wd l="10243" t="3374" r="10512" b="3533">the</wd>

<space/>

</ln>

<ln l="6590" t="3643" r="8861" b="3840" baseLine="3797" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6590" t="3643" r="7070" b="3802">suffix</wd>

<space/>

<wd l="7133" t="3643" r="7680" b="3802">“-illo”</wd>

<space/>

<wd l="7752" t="3643" r="8861" b="3840">(little/small).</wd>

</ln>

</para>

<para l="6384" t="4070" r="10512" b="5899" alignment="justified" li="432" spaceBefore="159" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="4070" r="10512" b="4258" baseLine="4224">

<wd l="6384" t="4099" r="6586" b="4224">•</wd>

<tab position="6454"/>

<wd l="6586" t="4094" r="8458" b="4258"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">NGramProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4"><space/>

<wd l="8606" t="4070" r="9144" b="4229">which</wd>

<space/>

<wd l="9269" t="4070" r="10114" b="4229">calculates</wd>

<space/>

<wd l="10243" t="4070" r="10512" b="4229">the</wd>

<space/>

</run>

</ln>

<ln l="6590" t="4344" r="10512" b="4546" baseLine="4493" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="6590" t="4397" r="7118" b="4502">scores</wd>

<space/>

<wd l="7253" t="4344" r="7445" b="4502">of</wd>

<space/>

<wd l="7555" t="4344" r="8011" b="4502">those</wd>

<space/>

<wd l="8136" t="4368" r="8563" b="4502">most</wd>

<space/>

<wd l="8683" t="4344" r="9173" b="4546">likely</wd>

<space/>

<wd l="9298" t="4344" r="10512" b="4502">normalization</wd>

<space/>

</ln>

<ln l="6586" t="4613" r="10502" b="4814" baseLine="4762" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="6586" t="4613" r="7493" b="4771">candidates</wd>

<space/>

<wd l="7642" t="4613" r="8491" b="4814">according</wd>

<space/>

<wd l="8626" t="4637" r="8794" b="4771">to</wd>

<space/>

<wd l="8928" t="4613" r="9192" b="4771">the</wd>

<space/>

<wd l="9326" t="4613" r="9926" b="4771">Viterbi</wd>

<space/>

<wd l="10066" t="4613" r="10502" b="4814">algo-</wd>

</ln>

<ln l="6581" t="4886" r="10502" b="5088" baseLine="5035" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="6581" t="4886" r="7056" b="5045">rithm</wd>

<space/>

<wd l="7152" t="4886" r="8002" b="5088">(Manning</wd>

<space/>

<wd l="8098" t="4886" r="8410" b="5045">and</wd>

<space/>

<wd l="8506" t="4886" r="9230" b="5074">Schütze,</wd>

<space/>

<wd l="9365" t="4891" r="9821" b="5074">1999,</wd>

<space/>

<wd l="9936" t="4886" r="10229" b="5045">Ch.</wd>

<space/>

<wd l="10334" t="4891" r="10502" b="5083">9)</wd>

<space/>

</ln>

<ln l="6581" t="5155" r="10512" b="5357" baseLine="5304" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="6581" t="5155" r="7123" b="5357">taking</wd>

<space/>

<wd l="7277" t="5208" r="7445" b="5314">as</wd>

<space/>

<wd l="7594" t="5155" r="8405" b="5314">reference</wd>

<space/>

<wd l="8549" t="5155" r="8813" b="5314">the</wd>

<space/>

<wd l="8957" t="5155" r="9350" b="5314">Web</wd>

<space/>

<wd l="9518" t="5160" r="9734" b="5309">1T</wd>

<space/>

<wd l="9888" t="5155" r="10512" b="5357">5-gram</wd>

<space/>

</ln>

<ln l="6581" t="5424" r="10502" b="5626" baseLine="5578" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="6581" t="5429" r="6778" b="5582">v1</wd>

<space/>

<wd l="6917" t="5429" r="7541" b="5621">(Brants</wd>

<space/>

<wd l="7666" t="5424" r="7978" b="5582">and</wd>

<space/>

<wd l="8083" t="5429" r="8621" b="5611">Franz,</wd>

<space/>

<wd l="8760" t="5424" r="9254" b="5621">2006)</wd>

<space/>

<wd l="9379" t="5424" r="10066" b="5626">Spanish</wd>

<space/>

<wd l="10171" t="5424" r="10502" b="5582">lan-</wd>

</ln>

<ln l="6586" t="5698" r="7747" b="5899" baseLine="5846" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="6586" t="5750" r="7104" b="5899">guage</wd>

<space/>

<wd l="7157" t="5698" r="7747" b="5856">model.</wd>

</ln>

</para>

<para l="6384" t="6120" r="10512" b="6595" alignment="justified" li="432" spaceBefore="161" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="6125" r="10512" b="6312" baseLine="6274">

<wd l="6384" t="6149" r="6590" b="6274">•</wd>

<tab position="6454"/>

<wd l="6590" t="6139" r="8981" b="6312"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">CandidateProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9038" t="6125" r="9576" b="6283">which</wd>

<space/>

<wd l="9629" t="6125" r="10190" b="6283">selects</wd>

<space/>

<wd l="10243" t="6125" r="10512" b="6283">the</wd>

<space/>

</run>

</ln>

<ln l="6581" t="6394" r="9773" b="6595" baseLine="6547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="6394" r="7574" b="6595">top-scoring</wd>

<space/>

<wd l="7637" t="6394" r="8467" b="6552">candidate</wd>

<space/>

<wd l="8520" t="6394" r="8779" b="6552">for</wd>

<space/>

<wd l="8837" t="6394" r="9230" b="6552">each</wd>

<space/>

<wd l="9283" t="6394" r="9773" b="6552">word.</wd>

</ln>

</para>

<para l="6384" t="6816" r="10512" b="7565" alignment="justified" li="432" spaceBefore="155" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="6821" r="10512" b="7022" baseLine="6970">

<wd l="6384" t="6850" r="6586" b="6970">•</wd>

<tab position="6451"/>

<wd l="6586" t="6840" r="8587" b="7008"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ResultProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8794" t="6821" r="9331" b="6979">which</wd>

<space/>

<wd l="9499" t="6821" r="10070" b="7022">dumps</wd>

<space/>

<wd l="10243" t="6821" r="10512" b="6979">the</wd>

<space/>

</run>

</ln>

<ln l="6581" t="7090" r="10502" b="7291" baseLine="7243" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="7114" r="7056" b="7248">tweet</wd>

<space/>

<wd l="7109" t="7090" r="7469" b="7248">data</wd>

<space/>

<wd l="7522" t="7090" r="8270" b="7248">obtained</wd>

<space/>

<wd l="8314" t="7090" r="8530" b="7291">by</wd>

<space/>

<wd l="8582" t="7090" r="8846" b="7248">the</wd>

<space/>

<wd l="8909" t="7114" r="9509" b="7291">system</wd>

<space/>

<wd l="9552" t="7114" r="9720" b="7248">to</wd>

<space/>

<wd l="9778" t="7142" r="9874" b="7248">a</wd>

<space/>

<wd l="9922" t="7090" r="10195" b="7248">file</wd>

<space/>

<wd l="10243" t="7142" r="10502" b="7248">us-</wd>

</ln>

<ln l="6581" t="7363" r="8645" b="7565" baseLine="7512" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="7363" r="6859" b="7565">ing</wd>

<space/>

<wd l="6917" t="7363" r="7181" b="7522">the</wd>

<space/>

<wd l="7238" t="7363" r="7963" b="7565">required</wd>

<space/>

<wd l="8016" t="7363" r="8645" b="7522">format.</wd>

</ln>

</para>

<para l="6144" t="7766" r="9302" b="7968" alignment="left" spaceBefore="155" lsp="exactly" lspExact="254" language="en">

<ln l="6144" t="7766" r="9302" b="7968" baseLine="7915" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">

<wd l="6144" t="7766" r="6413" b="7925">2.3</wd>

<space/>

<wd l="6638" t="7766" r="7690" b="7968">Adaptation</wd>

<space/>

<wd l="7747" t="7766" r="8016" b="7925">for</wd>

<space/>

<wd l="8074" t="7771" r="8813" b="7925">W-NUT</wd>

<space/>

<wd l="8870" t="7766" r="9302" b="7925">2015</wd>

</ln>

</para>

<para l="6144" t="8117" r="10526" b="10214" alignment="justified" spaceBefore="81" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="8117" r="10512" b="8318" baseLine="8266" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="8122" r="6326" b="8270">In</wd>

<space/>

<wd l="6384" t="8117" r="7061" b="8318">general,</wd>

<space/>

<wd l="7123" t="8117" r="7392" b="8275">the</wd>

<space/>

<wd l="7445" t="8117" r="8352" b="8318">adaptation</wd>

<space/>

<wd l="8400" t="8170" r="9048" b="8318">process</wd>

<space/>

<wd l="9106" t="8117" r="9854" b="8275">revolved</wd>

<space/>

<wd l="9912" t="8117" r="10512" b="8275">around</wd>

<space/>

</ln>

<ln l="6144" t="8386" r="10507" b="8587" baseLine="8539" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="8386" r="7354" b="8587">implementing</wd>

<space/>

<wd l="7411" t="8438" r="7762" b="8544">new</wd>

<space/>

<wd l="7819" t="8438" r="8731" b="8587">processors</wd>

<space/>

<wd l="8798" t="8386" r="9110" b="8544">and</wd>

<space/>

<wd l="9158" t="8386" r="10099" b="8587">integrating</wd>

<space/>

<wd l="10152" t="8438" r="10507" b="8544">new</wd>

<space/>

</ln>

<ln l="6144" t="8659" r="10502" b="8861" baseLine="8808" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="8712" r="6960" b="8818">resources</wd>

<space/>

<wd l="7046" t="8683" r="7214" b="8818">to</wd>

<space/>

<wd l="7296" t="8683" r="7973" b="8818">account</wd>

<space/>

<wd l="8050" t="8659" r="8304" b="8818">for</wd>

<space/>

<wd l="8381" t="8659" r="8645" b="8818">the</wd>

<space/>

<wd l="8722" t="8659" r="9854" b="8861">requirements</wd>

<space/>

<wd l="9941" t="8659" r="10133" b="8818">of</wd>

<space/>

<wd l="10195" t="8659" r="10502" b="8818">this</wd>

<space/>

</ln>

<ln l="6144" t="8928" r="10526" b="9130" baseLine="9077" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="8981" r="6499" b="9086">new</wd>

<space/>

<wd l="6595" t="8928" r="6989" b="9115">task,</wd>

<space/>

<wd l="7109" t="8928" r="7498" b="9086">such</wd>

<space/>

<wd l="7594" t="8981" r="7762" b="9086">as</wd>

<space/>

<wd l="7858" t="8928" r="8122" b="9086">the</wd>

<space/>

<wd l="8213" t="8981" r="8506" b="9086">use</wd>

<space/>

<wd l="8597" t="8928" r="8789" b="9086">of</wd>

<space/>

<wd l="8866" t="8928" r="9533" b="9130">English</wd>

<space/>

<wd l="9624" t="8928" r="10243" b="9086">instead</wd>

<space/>

<wd l="10334" t="8928" r="10526" b="9086">of</wd>

<space/>

</ln>

<ln l="6149" t="9202" r="10507" b="9403" baseLine="9350" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="9202" r="6840" b="9403">Spanish</wd>

<space/>

<wd l="6893" t="9254" r="7109" b="9360">on</wd>

<space/>

<wd l="7162" t="9202" r="7426" b="9360">the</wd>

<space/>

<wd l="7478" t="9254" r="7834" b="9360">new</wd>

<space/>

<wd l="7886" t="9206" r="8174" b="9360">I/O</wd>

<space/>

<wd l="8237" t="9202" r="8597" b="9360">data</wd>

<space/>

<wd l="8645" t="9202" r="9274" b="9389">format,</wd>

<space/>

<wd l="9336" t="9202" r="9821" b="9360">while</wd>

<space/>

<wd l="9874" t="9202" r="10507" b="9403">leaving</wd>

<space/>

</ln>

<ln l="6144" t="9470" r="10502" b="9672" baseLine="9619" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="9470" r="6413" b="9629">the</wd>

<space/>

<wd l="6485" t="9470" r="6869" b="9629">base</wd>

<space/>

<wd l="6950" t="9494" r="7704" b="9629">structure</wd>

<space/>

<wd l="7781" t="9470" r="7973" b="9629">of</wd>

<space/>

<wd l="8030" t="9470" r="8294" b="9629">the</wd>

<space/>

<wd l="8376" t="9494" r="8976" b="9672">system</wd>

<space/>

<wd l="9043" t="9470" r="9994" b="9629">untouched.</wd>

<space/>

<wd l="10123" t="9470" r="10502" b="9629">This</wd>

<space/>

</ln>

<ln l="6144" t="9739" r="10507" b="9941" baseLine="9893" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="9792" r="6475" b="9898">was</wd>

<space/>

<wd l="6538" t="9739" r="7320" b="9941">precisely</wd>

<space/>

<wd l="7378" t="9739" r="7642" b="9898">the</wd>

<space/>

<wd l="7694" t="9739" r="8131" b="9898">main</wd>

<space/>

<wd l="8189" t="9739" r="8558" b="9941">goal</wd>

<space/>

<wd l="8621" t="9739" r="9178" b="9941">during</wd>

<space/>

<wd l="9235" t="9739" r="9504" b="9898">the</wd>

<space/>

<wd l="9557" t="9739" r="10507" b="9941">refactoring</wd>

<space/>

</ln>

<ln l="6144" t="10013" r="9566" b="10214" baseLine="10162" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="10066" r="6792" b="10214">process</wd>

<space/>

<wd l="6859" t="10037" r="7013" b="10171">at</wd>

<space/>

<wd l="7066" t="10013" r="7334" b="10171">the</wd>

<space/>

<wd l="7387" t="10013" r="8256" b="10214">beginning</wd>

<space/>

<wd l="8318" t="10013" r="8506" b="10171">of</wd>

<space/>

<wd l="8549" t="10013" r="8856" b="10171">this</wd>

<space/>

<wd l="8918" t="10013" r="9566" b="10214">project.</wd>

</ln>

</para>

<para l="6144" t="10282" r="10512" b="11026" alignment="justified" spaceBefore="6" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="6365" t="10282" r="10502" b="10483" baseLine="10435" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="10282" r="6701" b="10440">The</wd>

<space/>

<wd l="6754" t="10282" r="7512" b="10483">resulting</wd>

<space/>

<wd l="7570" t="10282" r="8731" b="10483">configuration</wd>

<space/>

<wd l="8779" t="10282" r="9499" b="10440">includes</wd>

<space/>

<wd l="9557" t="10282" r="9826" b="10440">the</wd>

<space/>

<wd l="9874" t="10282" r="10502" b="10440">follow-</wd>

</ln>

<ln l="6144" t="10555" r="10512" b="10757" baseLine="10704" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10555" r="6422" b="10757">ing</wd>

<space/>

<wd l="6470" t="10608" r="6826" b="10714">new</wd>

<space/>

<wd l="6874" t="10608" r="7790" b="10757">processors</wd>

<space/>

<wd l="7853" t="10560" r="8194" b="10752">(see</wd>

<space/>

<wd l="8246" t="10555" r="8894" b="10714">Section</wd>

<space/>

<wd l="8947" t="10560" r="9038" b="10714">3</wd>

<space/>

<wd l="9096" t="10555" r="9355" b="10714">for</wd>

<space/>

<wd l="9403" t="10608" r="9499" b="10714">a</wd>

<space/>

<wd l="9547" t="10555" r="10512" b="10757">description</wd>

<space/>

</ln>

<ln l="6149" t="10824" r="8414" b="11026" baseLine="10978" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="10824" r="6341" b="10982">of</wd>

<space/>

<wd l="6384" t="10824" r="6648" b="10982">the</wd>

<space/>

<wd l="6701" t="10877" r="7517" b="10982">resources</wd>

<space/>

<wd l="7579" t="10824" r="7949" b="11026">they</wd>

<space/>

<wd l="8006" t="10829" r="8414" b="11021">use):</wd>

</ln>

</para>

<para l="6384" t="11227" r="10512" b="12202" alignment="justified" li="432" spaceBefore="134" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="11227" r="10512" b="11429" baseLine="11381">

<wd l="6384" t="11256" r="6581" b="11381">•</wd>

<tab position="6454"/>

<wd l="6581" t="11256" r="8981" b="11414"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">WNUTTweetProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9053" t="11227" r="9586" b="11386">which</wd>

<space/>

<wd l="9643" t="11280" r="10181" b="11429">parses</wd>

<space/>

<wd l="10243" t="11227" r="10512" b="11386">the</wd>

<space/>

</run>

</ln>

<ln l="6590" t="11486" r="10512" b="11702" baseLine="11650">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6590" t="11501" r="7454" b="11659">structured</wd>

<space/>

<wd l="7512" t="11501" r="7958" b="11702">input</wd>

<space/>

<wd l="8026" t="11506" r="8453" b="11698">(now</wd>

<space/>

<wd l="8515" t="11501" r="8683" b="11654">in</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8746" t="11534" r="9192" b="11659">JSON</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9254" t="11501" r="9840" b="11659">format</wd>

<space/>

<wd l="9893" t="11501" r="10512" b="11659">instead</wd>

<space/>

</run>

</ln>

<ln l="6586" t="11770" r="10502" b="11971" baseLine="11923" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="11770" r="6778" b="11928">of</wd>

<space/>

<wd l="6845" t="11770" r="7282" b="11971">plain</wd>

<space/>

<wd l="7363" t="11774" r="7752" b="11966">text)</wd>

<space/>

<wd l="7848" t="11770" r="8160" b="11928">and</wd>

<space/>

<wd l="8246" t="11770" r="8861" b="11928">obtains</wd>

<space/>

<wd l="8952" t="11770" r="9221" b="11928">the</wd>

<space/>

<wd l="9312" t="11794" r="9912" b="11971">system</wd>

<space/>

<wd l="9989" t="11822" r="10502" b="11971">repre-</wd>

</ln>

<ln l="6590" t="12043" r="8582" b="12202" baseLine="12192" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6590" t="12043" r="7373" b="12202">sentation</wd>

<space/>

<wd l="7430" t="12043" r="7618" b="12202">of</wd>

<space/>

<wd l="7661" t="12043" r="7925" b="12202">the</wd>

<space/>

<wd l="7982" t="12067" r="8582" b="12202">tweets.</wd>

</ln>

</para>

<para l="6384" t="12461" r="10512" b="13440" alignment="justified" li="432" spaceBefore="158" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="12466" r="10512" b="12653" baseLine="12619">

<wd l="6384" t="12494" r="6581" b="12619">•</wd>

<tab position="6454"/>

<wd l="6581" t="12485" r="8851" b="12653"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ArkTweetProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9034" t="12466" r="9571" b="12624">which</wd>

<space/>

<wd l="9720" t="12518" r="10085" b="12624">uses</wd>

<space/>

<wd l="10243" t="12466" r="10512" b="12624">the</wd>

<space/>

</run>

</ln>

<ln l="6595" t="12739" r="10512" b="12941" baseLine="12888">

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6595" t="12758" r="8275" b="12936">ark-tweet-nlp</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8342" t="12744" r="8731" b="12898">POS</wd>

<space/>

<wd l="8803" t="12763" r="9355" b="12941">tagger</wd>

<space/>

<wd l="9408" t="12763" r="9576" b="12898">to</wd>

<space/>

<wd l="9643" t="12739" r="10186" b="12898">obtain</wd>

<space/>

<wd l="10243" t="12739" r="10512" b="12898">the</wd>

<space/>

</run>

</ln>

<ln l="6581" t="13008" r="10512" b="13210" baseLine="13162" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="13008" r="8030" b="13210">morphosyntactic</wd>

<space/>

<wd l="8174" t="13008" r="9206" b="13166">information</wd>

<space/>

<wd l="9346" t="13008" r="9538" b="13166">of</wd>

<space/>

<wd l="9658" t="13008" r="9926" b="13166">the</wd>

<space/>

<wd l="10061" t="13008" r="10512" b="13210">input</wd>

<space/>

</ln>

<ln l="6581" t="13282" r="7718" b="13440" baseLine="13430" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="13306" r="7056" b="13440">tweet</wd>

<space/>

<wd l="7109" t="13282" r="7718" b="13440">tokens.</wd>

</ln>

</para>

<para l="6384" t="13709" r="10502" b="14947" alignment="justified" li="432" spaceBefore="162" spaceAfter="35" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="13709" r="10502" b="13896" baseLine="13858">

<wd l="6384" t="13738" r="6581" b="13858">•</wd>

<tab position="6451"/>

<wd l="6581" t="13723" r="9110" b="13896"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">WNUTFilterProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9317" t="13709" r="9850" b="13867">which</wd>

<space/>

<wd l="10018" t="13709" r="10502" b="13867">filters</wd>

<space/>

</run>

</ln>

<ln l="6586" t="13978" r="10502" b="14136" baseLine="14126" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="14002" r="6864" b="14136">out</wd>

<space/>

<wd l="6917" t="13978" r="7128" b="14136">all</wd>

<space/>

<wd l="7181" t="13978" r="7637" b="14136">those</wd>

<space/>

<wd l="7690" t="14002" r="8165" b="14136">terms</wd>

<space/>

<wd l="8227" t="13978" r="8554" b="14136">that</wd>

<space/>

<wd l="8611" t="13978" r="9187" b="14136">should</wd>

<space/>

<wd l="9235" t="14002" r="9514" b="14136">not</wd>

<space/>

<wd l="9566" t="13978" r="9768" b="14136">be</wd>

<space/>

<wd l="9821" t="13978" r="10502" b="14136">normal-</wd>

</ln>

<ln l="6581" t="14251" r="10498" b="14453" baseLine="14400" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="14251" r="6946" b="14410">ized</wd>

<space/>

<wd l="7046" t="14251" r="7896" b="14453">according</wd>

<space/>

<wd l="7997" t="14275" r="8160" b="14410">to</wd>

<space/>

<wd l="8261" t="14251" r="8525" b="14410">the</wd>

<space/>

<wd l="8621" t="14251" r="8971" b="14410">task</wd>

<space/>

<wd l="9067" t="14251" r="9480" b="14410">rules</wd>

<space/>

<wd l="9595" t="14251" r="10498" b="14448">(mentions,</wd>

<space/>

</ln>

<ln l="6581" t="14520" r="10502" b="14722" baseLine="14669" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="14520" r="7378" b="14722">hashtags,</wd>

<space/>

<wd l="7469" t="14525" r="8030" b="14707">URLs,</wd>

<space/>

<wd l="8131" t="14525" r="8496" b="14717">etc.)</wd>

<space/>

<wd l="8635" t="14520" r="9106" b="14722">using</wd>

<space/>

<wd l="9182" t="14520" r="9802" b="14722">regular</wd>

<space/>

<wd l="9878" t="14573" r="10502" b="14722">expres-</wd>

</ln>

<ln l="6590" t="14789" r="7075" b="14947" baseLine="14942" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6590" t="14789" r="7075" b="14947">sions.</wd>

</ln>

</para>

<rulerline l="6144" t="15048" r="7344" b="15048" type="single" width="10" color="000000"/>

<para l="6384" t="15042" r="6475" b="2434" alignment="left" li="216" lsp="single" language="en">

<ln l="6384" t="1824" r="6475" b="2434" baseLine="2443" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="2342" r="6475" b="2434">•</wd>

</ln>

</para>

<para l="6398" t="15101" r="9691" b="15293" alignment="left" li="216" spaceBefore="12597" spaceAfter="52" lsp="exactly" lspExact="197" language="en">

<ln l="6398" t="15101" r="9691" b="15293" baseLine="15256">

<wd l="6398" t="15101" r="9691" b="15293"><run underlined="none" subsuperscript="none" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="22">2</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="22">http://wikimediafoundation.org</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="22"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<dd l="1433" t="15746" r="10531" b="15975">

<para l="5771" t="15792" r="6181" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15792" r="6115" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="25">

<wd l="5837" t="15792" r="6115" b="15946">101</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4315.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1430" marginTop="1097" marginRight="1381" marginBottom="1292" offsetX="-20" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1430" t="1097" r="10528" b="15316">

<column l="1430" t="1097" r="5817" b="15316">

<para l="1675" t="1320" r="5808" b="2875" alignment="justified" li="432" spaceBefore="167" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="1320" r="5798" b="1507" baseLine="1474">

<wd l="1675" t="1349" r="1886" b="1474">•</wd>

<tab position="1745"/>

<wd l="1886" t="1344" r="4277" b="1507"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">LowerCaseProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9"><space/>

<wd l="4579" t="1320" r="5117" b="1478">which</wd>

<space/>

<wd l="5362" t="1320" r="5798" b="1478">takes</wd>

<space/>

</run>

</ln>

<ln l="1882" t="1594" r="5808" b="1752" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">

<wd l="1882" t="1594" r="2093" b="1752">all</wd>

<space/>

<wd l="2242" t="1594" r="2506" b="1752">the</wd>

<space/>

<wd l="2659" t="1594" r="3490" b="1752">candidate</wd>

<space/>

<wd l="3634" t="1594" r="4138" b="1752">forms</wd>

<space/>

<wd l="4296" t="1594" r="4488" b="1752">of</wd>

<space/>

<wd l="4622" t="1646" r="4718" b="1752">a</wd>

<space/>

<wd l="4862" t="1594" r="5347" b="1752">token</wd>

<space/>

<wd l="5496" t="1594" r="5808" b="1752">and</wd>

<space/>

</ln>

<ln l="1877" t="1862" r="5794" b="2059" baseLine="2016">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9"><wd l="1877" t="1862" r="2822" b="2021">lowercases</wd>

<space/>

<wd l="2971" t="1862" r="3456" b="2050">them;</wd>

<space/>

</run>

<wd l="3658" t="1882" r="5794" b="2059"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">AspellCProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9"><space/>

</run>

</ln>

<ln l="1882" t="2136" r="5803" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">

<wd l="1882" t="2189" r="1978" b="2294">a</wd>

<space/>

<wd l="2189" t="2136" r="3192" b="2294">constrained</wd>

<space/>

<wd l="3403" t="2136" r="4042" b="2294">version</wd>

<space/>

<wd l="4258" t="2136" r="4450" b="2294">of</wd>

<space/>

<wd l="4646" t="2136" r="4915" b="2294">the</wd>

<space/>

<wd l="5131" t="2136" r="5803" b="2338">original</wd>

<space/>

</ln>

<ln l="1877" t="2405" r="5794" b="2602" baseLine="2558">

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9"><wd l="1877" t="2424" r="3830" b="2602">AspellProcessor</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9"><wd l="4037" t="2405" r="4867" b="2563">described</wd>

<space/>

<wd l="5059" t="2405" r="5227" b="2558">in</wd>

<space/>

<wd l="5424" t="2410" r="5794" b="2563">Sec-</wd>

</run>

</ln>

<ln l="1877" t="2678" r="5520" b="2875" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">

<wd l="1877" t="2678" r="2218" b="2837">tion</wd>

<space/>

<wd l="2275" t="2683" r="2539" b="2837">2.2</wd>

<space/>

<wd l="2606" t="2683" r="2947" b="2875">(see</wd>

<space/>

<wd l="3010" t="2678" r="3658" b="2837">Section</wd>

<space/>

<wd l="3715" t="2683" r="3806" b="2837">3</wd>

<space/>

<wd l="3878" t="2678" r="4133" b="2837">for</wd>

<space/>

<wd l="4186" t="2678" r="4781" b="2837">further</wd>

<space/>

<wd l="4838" t="2678" r="5520" b="2875">details).</wd>

</ln>

</para>

<para l="1675" t="3206" r="5808" b="4224" alignment="justified" li="432" spaceBefore="264" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="3206" r="5808" b="3403" baseLine="3360">

<wd l="1675" t="3235" r="1877" b="3360">•</wd>

<tab position="1745"/>

<wd l="1877" t="3235" r="4277" b="3403"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">WNUTNgramProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4368" t="3206" r="4906" b="3365">which</wd>

<space/>

<wd l="4978" t="3206" r="5117" b="3365">is</wd>

<space/>

<wd l="5208" t="3206" r="5808" b="3365">similar</wd>

<space/>

</run>

</ln>

<ln l="1877" t="3480" r="5808" b="3682" baseLine="3629">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1877" t="3504" r="2045" b="3638">to</wd>

<space/>

<wd l="2098" t="3480" r="2362" b="3638">the</wd>

<space/>

<wd l="2414" t="3480" r="3154" b="3682">previous</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3216" t="3504" r="5030" b="3638">NGramProcessor</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5093" t="3480" r="5371" b="3638">but</wd>

<space/>

<wd l="5419" t="3480" r="5808" b="3638">with</wd>

<space/>

</run>

</ln>

<ln l="1886" t="3749" r="5794" b="3950" baseLine="3902" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1886" t="3802" r="2338" b="3907">some</wd>

<space/>

<wd l="2419" t="3749" r="2938" b="3907">added</wd>

<space/>

<wd l="3014" t="3749" r="4190" b="3907">modifications</wd>

<space/>

<wd l="4277" t="3773" r="4445" b="3907">to</wd>

<space/>

<wd l="4531" t="3749" r="4709" b="3907">fit</wd>

<space/>

<wd l="4786" t="3749" r="5050" b="3907">the</wd>

<space/>

<wd l="5126" t="3749" r="5794" b="3950">particu-</wd>

</ln>

<ln l="1877" t="4022" r="5635" b="4224" baseLine="4171" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="4022" r="2462" b="4181">larities</wd>

<space/>

<wd l="2530" t="4022" r="2722" b="4181">of</wd>

<space/>

<wd l="2765" t="4075" r="3058" b="4181">our</wd>

<space/>

<wd l="3106" t="4075" r="3461" b="4181">new</wd>

<space/>

<wd l="3523" t="4046" r="4152" b="4181">custom</wd>

<space/>

<wd l="4205" t="4022" r="4992" b="4224">language</wd>

<space/>

<wd l="5045" t="4022" r="5635" b="4181">model.</wd>

</ln>

</para>

<para l="1675" t="4550" r="5803" b="5294" alignment="justified" li="432" spaceBefore="265" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="4550" r="5798" b="4752" baseLine="4704">

<wd l="1675" t="4579" r="1877" b="4704">•</wd>

<tab position="1745"/>

<wd l="1877" t="4570" r="4406" b="4738"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">WNUTResultProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4565" t="4550" r="5098" b="4709">which</wd>

<space/>

<wd l="5227" t="4550" r="5798" b="4752">dumps</wd>

<space/>

</run>

</ln>

<ln l="1882" t="4824" r="5803" b="5026" baseLine="4973" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="4824" r="2093" b="4982">all</wd>

<space/>

<wd l="2155" t="4848" r="2630" b="4982">tweet</wd>

<space/>

<wd l="2698" t="4824" r="3058" b="4982">data</wd>

<space/>

<wd l="3125" t="4824" r="3970" b="5026">generated</wd>

<space/>

<wd l="4027" t="4824" r="4243" b="5026">by</wd>

<space/>

<wd l="4310" t="4824" r="4574" b="4982">the</wd>

<space/>

<wd l="4646" t="4848" r="5246" b="5026">system</wd>

<space/>

<wd l="5309" t="4824" r="5477" b="4978">in</wd>

<space/>

<wd l="5539" t="4824" r="5803" b="4982">the</wd>

<space/>

</ln>

<ln l="1877" t="5093" r="4555" b="5294" baseLine="5246">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1877" t="5093" r="2606" b="5294">required</wd>

<space/>

<wd l="2664" t="5117" r="3216" b="5294">output</wd>

<space/>

<wd l="3269" t="5093" r="3854" b="5251">format</wd>

<space/>

</run>

<wd l="3917" t="5098" r="4555" b="5290"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">JSON</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="5654" r="5808" b="6398" alignment="justified" spaceBefore="290" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="5654" r="5808" b="5856" baseLine="5808" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5659" r="1723" b="5813">We</wd>

<space/>

<wd l="1824" t="5654" r="2266" b="5813">show</wd>

<space/>

<wd l="2362" t="5654" r="2534" b="5808">in</wd>

<space/>

<wd l="2621" t="5654" r="3192" b="5856">Figure</wd>

<space/>

<wd l="3307" t="5659" r="3370" b="5808">1</wd>

<space/>

<wd l="3485" t="5707" r="3581" b="5813">a</wd>

<space/>

<wd l="3672" t="5654" r="4478" b="5856">graphical</wd>

<space/>

<wd l="4570" t="5654" r="5808" b="5856">representation</wd>

<space/>

</ln>

<ln l="1445" t="5928" r="5808" b="6130" baseLine="6077" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="5928" r="1637" b="6086">of</wd>

<space/>

<wd l="1690" t="5928" r="1954" b="6086">the</wd>

<space/>

<wd l="2026" t="5928" r="3048" b="6086">architecture</wd>

<space/>

<wd l="3120" t="5928" r="3312" b="6086">of</wd>

<space/>

<wd l="3360" t="5928" r="3629" b="6086">the</wd>

<space/>

<wd l="3706" t="5952" r="4306" b="6130">system</wd>

<space/>

<wd l="4368" t="5928" r="4757" b="6086">both</wd>

<space/>

<wd l="4819" t="5928" r="5376" b="6086">before</wd>

<space/>

<wd l="5453" t="5928" r="5808" b="6125">(left</wd>

<space/>

</ln>

<ln l="1450" t="6197" r="5035" b="6398" baseLine="6346" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="6197" r="1853" b="6394">side)</wd>

<space/>

<wd l="1925" t="6197" r="2237" b="6355">and</wd>

<space/>

<wd l="2294" t="6197" r="2693" b="6355">after</wd>

<space/>

<wd l="2750" t="6197" r="3230" b="6398">(right</wd>

<space/>

<wd l="3293" t="6197" r="3696" b="6394">side)</wd>

<space/>

<wd l="3758" t="6197" r="4027" b="6355">the</wd>

<space/>

<wd l="4085" t="6197" r="5035" b="6398">adaptation.</wd>

</ln>

</para>

<para l="1440" t="6490" r="5808" b="8045" alignment="justified" spaceBefore="26" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="1656" t="6490" r="5798" b="6691" baseLine="6638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="6490" r="2914" b="6691">Unfortunately,</wd>

<space/>

<wd l="3062" t="6490" r="3451" b="6648">time</wd>

<space/>

<wd l="3576" t="6490" r="4502" b="6648">limitations</wd>

<space/>

<wd l="4637" t="6490" r="5486" b="6691">prevented</wd>

<space/>

<wd l="5611" t="6542" r="5798" b="6648">us</wd>

<space/>

</ln>

<ln l="1440" t="6758" r="5808" b="6960" baseLine="6912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6758" r="1867" b="6917">from</wd>

<space/>

<wd l="1934" t="6758" r="3144" b="6960">implementing</wd>

<space/>

<wd l="3226" t="6811" r="3422" b="6917">an</wd>

<space/>

<wd l="3494" t="6758" r="4162" b="6960">English</wd>

<space/>

<wd l="4234" t="6758" r="4978" b="6960">phonetic</wd>

<space/>

<wd l="5054" t="6758" r="5477" b="6917">table</wd>

<space/>

<wd l="5549" t="6758" r="5808" b="6917">for</wd>

<space/>

</ln>

<ln l="1440" t="7032" r="5803" b="7219" baseLine="7181">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="7032" r="1704" b="7190">the</wd>

<space/>

</run>

<wd l="1795" t="7046" r="4056" b="7219"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">PhoneticProcessor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4157" t="7032" r="4694" b="7190">which</wd>

<space/>

<wd l="4776" t="7032" r="5318" b="7190">would</wd>

<space/>

<wd l="5400" t="7032" r="5803" b="7190">have</wd>

<space/>

</run>

</ln>

<ln l="1440" t="7301" r="5798" b="7502" baseLine="7450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="7301" r="2213" b="7502">provided</wd>

<space/>

<wd l="2290" t="7354" r="2472" b="7459">us</wd>

<space/>

<wd l="2558" t="7301" r="2947" b="7459">with</wd>

<space/>

<wd l="3019" t="7301" r="3864" b="7502">mappings</wd>

<space/>

<wd l="3955" t="7301" r="4349" b="7459">such</wd>

<space/>

<wd l="4426" t="7354" r="4594" b="7459">as</wd>

<space/>

<wd l="4685" t="7306" r="5242" b="7488">“two”,</wd>

<space/>

<wd l="5338" t="7306" r="5798" b="7459">“too”</wd>

<space/>

</ln>

<ln l="1445" t="7574" r="5803" b="7762" baseLine="7723" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="7627" r="1627" b="7733">or</wd>

<space/>

<wd l="1675" t="7579" r="2026" b="7733">“to”</wd>

<space/>

<wd l="2083" t="7574" r="2342" b="7733">for</wd>

<space/>

<wd l="2390" t="7579" r="2731" b="7733">“2”.</wd>

<space/>

<wd l="2808" t="7579" r="3029" b="7733">To</wd>

<space/>

<wd l="3086" t="7574" r="3816" b="7733">alleviate</wd>

<space/>

<wd l="3864" t="7574" r="4219" b="7762">this,</wd>

<space/>

<wd l="4282" t="7627" r="4536" b="7733">we</wd>

<space/>

<wd l="4589" t="7574" r="4867" b="7733">did</wd>

<space/>

<wd l="4915" t="7574" r="5491" b="7733">extend</wd>

<space/>

<wd l="5539" t="7574" r="5803" b="7733">the</wd>

<space/>

</ln>

<ln l="1450" t="7829" r="5328" b="8045" baseLine="7992">

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="7877" r="1805" b="8002">SMS</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1882" t="7843" r="2755" b="8045">dictionary</wd>

<space/>

<wd l="2818" t="7867" r="2981" b="8002">to</wd>

<space/>

<wd l="3043" t="7896" r="3523" b="8002">cover</wd>

<space/>

<wd l="3581" t="7896" r="4032" b="8002">some</wd>

<space/>

<wd l="4094" t="7843" r="4282" b="8002">of</wd>

<space/>

<wd l="4325" t="7843" r="4771" b="8002">these</wd>

<space/>

<wd l="4834" t="7896" r="5328" b="8002">cases.</wd>

</run>

</ln>

</para>

<para l="1440" t="8136" r="5808" b="10502" alignment="justified" spaceBefore="32" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="1656" t="8136" r="5794" b="8294" baseLine="8285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="8141" r="1795" b="8294">It</wd>

<space/>

<wd l="1862" t="8136" r="2438" b="8294">should</wd>

<space/>

<wd l="2496" t="8136" r="2702" b="8294">be</wd>

<space/>

<wd l="2765" t="8136" r="3254" b="8294">noted</wd>

<space/>

<wd l="3312" t="8136" r="3643" b="8294">that</wd>

<space/>

<wd l="3706" t="8136" r="4392" b="8294">because</wd>

<space/>

<wd l="4459" t="8136" r="4651" b="8294">of</wd>

<space/>

<wd l="4699" t="8136" r="5160" b="8294">those</wd>

<space/>

<wd l="5222" t="8136" r="5794" b="8294">limita-</wd>

</ln>

<ln l="1440" t="8405" r="5794" b="8563" baseLine="8554" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8405" r="1858" b="8563">tions</wd>

<space/>

<wd l="1939" t="8458" r="2194" b="8563">we</wd>

<space/>

<wd l="2270" t="8405" r="2549" b="8563">did</wd>

<space/>

<wd l="2621" t="8429" r="2904" b="8563">not</wd>

<space/>

<wd l="2981" t="8405" r="3619" b="8563">address</wd>

<space/>

<wd l="3706" t="8405" r="4162" b="8563">those</wd>

<space/>

<wd l="4243" t="8458" r="4690" b="8563">cases</wd>

<space/>

<wd l="4771" t="8458" r="5198" b="8563">were</wd>

<space/>

<wd l="5270" t="8405" r="5794" b="8563">multi-</wd>

</ln>

<ln l="1440" t="8678" r="5803" b="8880" baseLine="8827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8678" r="1704" b="8880">ple</wd>

<space/>

<wd l="1762" t="8678" r="2707" b="8880">contiguous</wd>

<space/>

<wd l="2770" t="8678" r="3326" b="8837">tokens</wd>

<space/>

<wd l="3394" t="8678" r="3586" b="8837">of</wd>

<space/>

<wd l="3624" t="8678" r="3888" b="8837">the</wd>

<space/>

<wd l="3941" t="8678" r="4392" b="8880">input</wd>

<space/>

<wd l="4440" t="8702" r="4915" b="8837">tweet</wd>

<space/>

<wd l="4973" t="8678" r="5549" b="8837">should</wd>

<space/>

<wd l="5602" t="8678" r="5803" b="8837">be</wd>

<space/>

</ln>

<ln l="1440" t="8947" r="5803" b="9149" baseLine="9096" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8947" r="2424" b="9106">normalized</wd>

<space/>

<wd l="2491" t="8947" r="2827" b="9106">into</wd>

<space/>

<wd l="2904" t="9000" r="3000" b="9106">a</wd>

<space/>

<wd l="3072" t="8947" r="3581" b="9149">single</wd>

<space/>

<wd l="3658" t="8971" r="4210" b="9149">output</wd>

<space/>

<wd l="4277" t="8947" r="4762" b="9106">token</wd>

<space/>

<wd l="4838" t="8947" r="5155" b="9144">(i.e.</wd>

<space/>

<wd l="5275" t="8947" r="5544" b="9106">the</wd>

<space/>

<wd l="5621" t="9000" r="5803" b="9106">so</wd>

<space/>

</ln>

<ln l="1445" t="9216" r="5794" b="9418" baseLine="9370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="9216" r="1963" b="9374">called</wd>

<space/>

<wd l="2016" t="9221" r="2376" b="9370">“n-1</wd>

<space/>

<wd l="2453" t="9216" r="3514" b="9418">mappings”).</wd>

<space/>

<wd l="3590" t="9221" r="4478" b="9403">Moreover,</wd>

<space/>

<wd l="4550" t="9216" r="4987" b="9374">since</wd>

<space/>

<wd l="5040" t="9216" r="5366" b="9374">that</wd>

<space/>

<wd l="5419" t="9216" r="5794" b="9418">phe-</wd>

</ln>

<ln l="1440" t="9490" r="5798" b="9691" baseLine="9638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9542" r="2251" b="9648">nomenon</wd>

<space/>

<wd l="2333" t="9542" r="2659" b="9648">was</wd>

<space/>

<wd l="2750" t="9542" r="3086" b="9648">rare</wd>

<space/>

<wd l="3178" t="9490" r="3360" b="9686">(it</wd>

<space/>

<wd l="3446" t="9490" r="4229" b="9691">appeared</wd>

<space/>

<wd l="4306" t="9490" r="4478" b="9643">in</wd>

<space/>

<wd l="4536" t="9490" r="4872" b="9691">just</wd>

<space/>

<wd l="4973" t="9494" r="5146" b="9643">11</wd>

<space/>

<wd l="5246" t="9514" r="5798" b="9648">tweets</wd>

<space/>

</ln>

<ln l="1445" t="9758" r="5808" b="9960" baseLine="9912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="9782" r="1718" b="9917">out</wd>

<space/>

<wd l="1781" t="9758" r="1973" b="9917">of</wd>

<space/>

<wd l="2021" t="9758" r="2448" b="9917">2950</wd>

<space/>

<wd l="2515" t="9758" r="2707" b="9917">of</wd>

<space/>

<wd l="2750" t="9758" r="3014" b="9917">the</wd>

<space/>

<wd l="3077" t="9758" r="3749" b="9960">training</wd>

<space/>

<wd l="3816" t="9758" r="4478" b="9955">dataset)</wd>

<space/>

<wd l="4550" t="9811" r="4800" b="9917">we</wd>

<space/>

<wd l="4867" t="9758" r="5808" b="9917">considered</wd>

<space/>

</ln>

<ln l="1440" t="10032" r="5803" b="10234" baseLine="10181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10032" r="1771" b="10190">that</wd>

<space/>

<wd l="1843" t="10032" r="2477" b="10234">leaving</wd>

<space/>

<wd l="2558" t="10032" r="2866" b="10190">this</wd>

<space/>

<wd l="2952" t="10032" r="3557" b="10190">feature</wd>

<space/>

<wd l="3634" t="10032" r="4229" b="10190">behind</wd>

<space/>

<wd l="4306" t="10032" r="4848" b="10190">would</wd>

<space/>

<wd l="4925" t="10032" r="5328" b="10190">have</wd>

<space/>

<wd l="5405" t="10032" r="5803" b="10190">little</wd>

<space/>

</ln>

<ln l="1440" t="10301" r="5486" b="10502" baseLine="10454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10301" r="2035" b="10502">impact</wd>

<space/>

<wd l="2093" t="10354" r="2309" b="10459">on</wd>

<space/>

<wd l="2362" t="10301" r="2626" b="10459">the</wd>

<space/>

<wd l="2688" t="10301" r="3067" b="10459">final</wd>

<space/>

<wd l="3125" t="10301" r="4229" b="10502">performance</wd>

<space/>

<wd l="4286" t="10301" r="4478" b="10459">of</wd>

<space/>

<wd l="4517" t="10301" r="4786" b="10459">the</wd>

<space/>

<wd l="4848" t="10325" r="5486" b="10502">system.</wd>

</ln>

</para>

<para l="1440" t="10834" r="3888" b="11054" alignment="left" spaceBefore="275" lsp="exactly" lspExact="278" language="en">

<ln l="1440" t="10834" r="3888" b="11054" baseLine="10997" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">

<wd l="1440" t="10834" r="1555" b="11006">3</wd>

<space/>

<wd l="1805" t="10838" r="2870" b="11054">Integrated</wd>

<space/>

<wd l="2938" t="10886" r="3888" b="11006">resources</wd>

</ln>

</para>

<para l="1440" t="11314" r="5808" b="12058" alignment="justified" spaceBefore="193" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="11314" r="5808" b="11501" baseLine="11467" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11314" r="1781" b="11472">The</wd>

<space/>

<wd l="1829" t="11314" r="2218" b="11472">base</wd>

<space/>

<wd l="2270" t="11366" r="3086" b="11472">resources</wd>

<space/>

<wd l="3144" t="11366" r="3398" b="11472">we</wd>

<space/>

<wd l="3451" t="11314" r="3854" b="11472">have</wd>

<space/>

<wd l="3907" t="11314" r="4310" b="11472">used</wd>

<space/>

<wd l="4358" t="11314" r="4618" b="11472">for</wd>

<space/>

<wd l="4666" t="11314" r="4973" b="11472">this</wd>

<space/>

<wd l="5030" t="11314" r="5429" b="11501">task,</wd>

<space/>

<wd l="5496" t="11314" r="5808" b="11472">and</wd>

<space/>

</ln>

<ln l="1445" t="11587" r="5803" b="11789" baseLine="11736" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="11640" r="1661" b="11746">on</wd>

<space/>

<wd l="1728" t="11587" r="2266" b="11746">which</wd>

<space/>

<wd l="2333" t="11611" r="2760" b="11746">most</wd>

<space/>

<wd l="2832" t="11587" r="3024" b="11746">of</wd>

<space/>

<wd l="3082" t="11587" r="3346" b="11746">the</wd>

<space/>

<wd l="3427" t="11611" r="4027" b="11789">system</wd>

<space/>

<wd l="4094" t="11640" r="5006" b="11789">processors</wd>

<space/>

<wd l="5083" t="11587" r="5453" b="11789">rely,</wd>

<space/>

<wd l="5544" t="11640" r="5803" b="11746">are</wd>

<space/>

</ln>

<ln l="1440" t="11856" r="2650" b="12058" baseLine="12010" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11856" r="1704" b="12014">the</wd>

<space/>

<wd l="1762" t="11856" r="2650" b="12058">following:</wd>

</ln>

</para>

<para l="1675" t="12418" r="5808" b="13162" alignment="justified" li="432" spaceBefore="289" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="12418" r="5808" b="12619" baseLine="12571">

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1675" t="12470" r="1891" b="12571">•</wd>

<tab position="1732"/>

<wd l="1891" t="12437" r="2645" b="12614">aspell</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2808" t="12418" r="3480" b="12619">(Aspell,</wd>

<space/>

<wd l="3653" t="12422" r="4200" b="12614">2011),</wd>

<space/>

<wd l="4368" t="12418" r="4632" b="12576">the</wd>

<space/>

<wd l="4766" t="12418" r="5808" b="12576">well-known</wd>

<space/>

</run>

</ln>

<ln l="1886" t="12691" r="5794" b="12893" baseLine="12840" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1886" t="12691" r="3043" b="12893">spell-checker</wd>

<space/>

<wd l="3144" t="12691" r="3864" b="12893">together</wd>

<space/>

<wd l="3970" t="12691" r="4358" b="12850">with</wd>

<space/>

<wd l="4464" t="12691" r="4661" b="12850">its</wd>

<space/>

<wd l="4786" t="12691" r="5386" b="12850">default</wd>

<space/>

<wd l="5491" t="12696" r="5794" b="12845">En-</wd>

</ln>

<ln l="1882" t="12960" r="3269" b="13162" baseLine="13109" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="12960" r="2304" b="13162">glish</wd>

<space/>

<wd l="2362" t="12960" r="3269" b="13162">dictionary.</wd>

</ln>

</para>

<para l="1675" t="13493" r="5808" b="14237" alignment="justified" li="432" spaceBefore="265" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="13493" r="5808" b="13694" baseLine="13642">

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1675" t="13546" r="1891" b="13642">•</wd>

<tab position="1729"/>

<wd l="1891" t="13512" r="3566" b="13690">ark-tweet-nlp</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3648" t="13493" r="4469" b="13694">(Owoputi</wd>

<space/>

<wd l="4541" t="13517" r="4694" b="13651">et</wd>

<space/>

<wd l="4757" t="13493" r="5006" b="13680">al.,</wd>

<space/>

<wd l="5088" t="13498" r="5635" b="13690">2013),</wd>

<space/>

<wd l="5712" t="13546" r="5808" b="13651">a</wd>

<space/>

</run>

</ln>

<ln l="1877" t="13762" r="5803" b="13920" baseLine="13915" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="13762" r="3250" b="13920">Twitter-focused</wd>

<space/>

<wd l="3322" t="13766" r="3730" b="13920">NLP</wd>

<space/>

<wd l="3806" t="13762" r="4378" b="13920">toolkit</wd>

<space/>

<wd l="4450" t="13762" r="4877" b="13920">from</wd>

<space/>

<wd l="4944" t="13762" r="5482" b="13920">which</wd>

<space/>

<wd l="5549" t="13814" r="5803" b="13920">we</wd>

<space/>

</ln>

<ln l="1877" t="14035" r="4080" b="14237" baseLine="14184" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="14035" r="2280" b="14194">have</wd>

<space/>

<wd l="2338" t="14035" r="2736" b="14194">used</wd>

<space/>

<wd l="2789" t="14035" r="2986" b="14194">its</wd>

<space/>

<wd l="3053" t="14040" r="3442" b="14194">POS</wd>

<space/>

<wd l="3504" t="14059" r="4080" b="14237">tagger.</wd>

</ln>

</para>

<para l="1675" t="14558" r="5808" b="15307" alignment="justified" li="432" spaceBefore="265" fli="-216" lsp="exactly" lspExact="267" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="14563" r="5808" b="14760" baseLine="14717">

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1675" t="14592" r="1882" b="14717">•</wd>

<tab position="1745"/>

<wd l="1882" t="14582" r="3182" b="14760">BerkeleyLM</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3302" t="14563" r="3826" b="14760">(Pauls</wd>

<space/>

<wd l="3946" t="14563" r="4258" b="14722">and</wd>

<space/>

<wd l="4368" t="14563" r="4891" b="14750">Klein,</wd>

<space/>

<wd l="5030" t="14568" r="5578" b="14760">2011),</wd>

<space/>

<wd l="5712" t="14616" r="5808" b="14722">a</wd>

<space/>

</run>

</ln>

<ln l="1877" t="14837" r="5803" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="14842" r="2256" b="14995">Java</wd>

<space/>

<wd l="2318" t="14837" r="2899" b="15038">library</wd>

<space/>

<wd l="2971" t="14837" r="3283" b="14995">and</wd>

<space/>

<wd l="3346" t="14837" r="3926" b="14995">toolset</wd>

<space/>

<wd l="3994" t="14837" r="4670" b="14995">focused</wd>

<space/>

<wd l="4738" t="14890" r="4954" b="14995">on</wd>

<space/>

<wd l="5016" t="14837" r="5803" b="15038">language</wd>

<space/>

</ln>

<ln l="1877" t="15106" r="2746" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="15106" r="2746" b="15307">modeling.</wd>

</ln>

</para>

</column>

<column l="6141" t="1097" r="10528" b="15316">

<para l="6384" t="1286" r="10512" b="2338" alignment="justified" li="432" spaceBefore="165" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="1286" r="10512" b="1522" baseLine="1470">

<wd l="6384" t="1349" r="6586" b="1474">•</wd>

<tab position="6454"/>

<wd l="6586" t="1286" r="7363" b="1507"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Redis</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">3</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7464" t="1373" r="7560" b="1478">a</wd>

<space/>

<wd l="7632" t="1325" r="8266" b="1517">noSQL</wd>

<space/>

<wd l="8338" t="1320" r="9187" b="1522">key-value</wd>

<space/>

<wd l="9269" t="1320" r="10099" b="1507">datastore;</wd>

<space/>

<wd l="10200" t="1320" r="10512" b="1478">and</wd>

<space/>

</run>

</ln>

<ln l="6581" t="1579" r="10502" b="1781" baseLine="1742">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6581" t="1594" r="6850" b="1752">the</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6941" t="1627" r="7296" b="1752">SMS</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7397" t="1594" r="8611" b="1752">normalization</wd>

<space/>

<wd l="8698" t="1594" r="9754" b="1781">dictionaries,</wd>

<space/>

<wd l="9859" t="1594" r="10502" b="1752">canoni-</wd>

</run>

</ln>

<ln l="6586" t="1862" r="10507" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="1862" r="6835" b="2021">cal</wd>

<space/>

<wd l="6912" t="1862" r="7550" b="2021">lexicon</wd>

<space/>

<wd l="7627" t="1862" r="7939" b="2021">and</wd>

<space/>

<wd l="8011" t="1862" r="8688" b="2064">training</wd>

<space/>

<wd l="8770" t="1862" r="9374" b="2021">dataset</wd>

<space/>

<wd l="9446" t="1862" r="10219" b="2064">provided</wd>

<space/>

<wd l="10291" t="1862" r="10507" b="2064">by</wd>

<space/>

</ln>

<ln l="6581" t="2136" r="8813" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="2136" r="6850" b="2294">the</wd>

<space/>

<wd l="6907" t="2136" r="7800" b="2338">organizers</wd>

<space/>

<wd l="7867" t="2136" r="8059" b="2294">of</wd>

<space/>

<wd l="8098" t="2136" r="8362" b="2294">the</wd>

<space/>

<wd l="8419" t="2136" r="8813" b="2294">task.</wd>

</ln>

</para>

<para l="6144" t="2606" r="10498" b="3082" alignment="justified" spaceBefore="204" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="2606" r="10498" b="2808" baseLine="2760" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2611" r="6379" b="2765">As</wd>

<space/>

<wd l="6470" t="2659" r="6566" b="2765">a</wd>

<space/>

<wd l="6638" t="2606" r="7123" b="2765">result</wd>

<space/>

<wd l="7205" t="2606" r="7397" b="2765">of</wd>

<space/>

<wd l="7459" t="2606" r="8386" b="2808">processing</wd>

<space/>

<wd l="8467" t="2606" r="8731" b="2765">the</wd>

<space/>

<wd l="8808" t="2606" r="9547" b="2808">previous</wd>

<space/>

<wd l="9634" t="2659" r="10498" b="2794">resources,</wd>

<space/>

</ln>

<ln l="6144" t="2880" r="10310" b="3082" baseLine="3029" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2933" r="6398" b="3038">we</wd>

<space/>

<wd l="6456" t="2880" r="6859" b="3038">have</wd>

<space/>

<wd l="6917" t="2880" r="7666" b="3038">obtained</wd>

<space/>

<wd l="7718" t="2880" r="7987" b="3038">the</wd>

<space/>

<wd l="8040" t="2880" r="8880" b="3082">following</wd>

<space/>

<wd l="8942" t="2880" r="9806" b="3038">additional</wd>

<space/>

<wd l="9869" t="2933" r="10310" b="3038">ones:</wd>

</ln>

</para>

<para l="6384" t="3350" r="10502" b="4637" alignment="justified" li="432" spaceBefore="205" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="3350" r="10502" b="3552" baseLine="3499">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="3355" r="6581" b="3499">•</wd>

<tab position="6465"/>

<wd l="6581" t="3355" r="6739" b="3504">A</wd>

<space/>

<wd l="6835" t="3350" r="7373" b="3552">global</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7474" t="3384" r="7829" b="3509">SMS</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7934" t="3350" r="9149" b="3509">normalization</wd>

<space/>

<wd l="9240" t="3350" r="10114" b="3552">dictionary</wd>

<space/>

<wd l="10210" t="3350" r="10502" b="3504">im-</wd>

</run>

</ln>

<ln l="6581" t="3619" r="10502" b="3821" baseLine="3773">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6581" t="3619" r="7493" b="3821">plemented</wd>

<space/>

<wd l="7565" t="3672" r="7733" b="3778">as</wd>

<space/>

<wd l="7814" t="3672" r="7910" b="3778">a</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7978" t="3634" r="8606" b="3778">Redis</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8698" t="3619" r="9523" b="3806">datastore,</wd>

<space/>

<wd l="9610" t="3619" r="10162" b="3778">whose</wd>

<space/>

<wd l="10238" t="3672" r="10502" b="3778">en-</wd>

</run>

</ln>

<ln l="6581" t="3893" r="10502" b="4051" baseLine="4042" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="3893" r="6950" b="4051">tries</wd>

<space/>

<wd l="7018" t="3946" r="7445" b="4051">were</wd>

<space/>

<wd l="7512" t="3893" r="8304" b="4051">extracted</wd>

<space/>

<wd l="8362" t="3893" r="8789" b="4051">from</wd>

<space/>

<wd l="8851" t="3893" r="9115" b="4051">the</wd>

<space/>

<wd l="9178" t="3917" r="9499" b="4051">two</wd>

<space/>

<wd l="9566" t="3893" r="10502" b="4051">normaliza-</wd>

</ln>

<ln l="6581" t="4162" r="10502" b="4363" baseLine="4315" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="4162" r="6922" b="4320">tion</wd>

<space/>

<wd l="6984" t="4162" r="7987" b="4320">dictionaries</wd>

<space/>

<wd l="8059" t="4162" r="8371" b="4320">and</wd>

<space/>

<wd l="8424" t="4162" r="8693" b="4320">the</wd>

<space/>

<wd l="8750" t="4162" r="9422" b="4363">training</wd>

<space/>

<wd l="9490" t="4162" r="10094" b="4320">dataset</wd>

<space/>

<wd l="10147" t="4214" r="10502" b="4363">pro-</wd>

</ln>

<ln l="6581" t="4435" r="8664" b="4637" baseLine="4584" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="4435" r="7070" b="4594">vided</wd>

<space/>

<wd l="7123" t="4435" r="7334" b="4637">by</wd>

<space/>

<wd l="7392" t="4435" r="7661" b="4594">the</wd>

<space/>

<wd l="7718" t="4435" r="8664" b="4637">organizers.</wd>

</ln>

</para>

<para l="6384" t="4886" r="10512" b="6130" alignment="justified" li="432" spaceBefore="186" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="4886" r="10512" b="5088" baseLine="5035" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="4891" r="6581" b="5035">•</wd>

<tab position="6465"/>

<wd l="6581" t="4891" r="6739" b="5040">A</wd>

<space/>

<wd l="6821" t="4891" r="7858" b="5088">Kneser-Ney</wd>

<space/>

<wd l="7939" t="4886" r="8726" b="5088">language</wd>

<space/>

<wd l="8803" t="4886" r="9346" b="5045">model</wd>

<space/>

<wd l="9437" t="4891" r="10123" b="5083">(Kneser</wd>

<space/>

<wd l="10200" t="4886" r="10512" b="5045">and</wd>

<space/>

</ln>

<ln l="6581" t="5155" r="10512" b="5357" baseLine="5309" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="5160" r="6970" b="5357">Ney,</wd>

<space/>

<wd l="7118" t="5155" r="7594" b="5352">1995)</wd>

<space/>

<wd l="7709" t="5155" r="7901" b="5314">of</wd>

<space/>

<wd l="7987" t="5155" r="8251" b="5314">the</wd>

<space/>

<wd l="8352" t="5179" r="8846" b="5357">target</wd>

<space/>

<wd l="8947" t="5155" r="9600" b="5314">domain</wd>

<space/>

<wd l="9710" t="5155" r="10512" b="5352">(standard</wd>

<space/>

</ln>

<ln l="6581" t="5429" r="10507" b="5626" baseLine="5578">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6581" t="5453" r="7056" b="5587">tweet</wd>

<space/>

<wd l="7123" t="5434" r="7512" b="5626">text)</wd>

<space/>

<wd l="7594" t="5429" r="8342" b="5587">obtained</wd>

<space/>

<wd l="8410" t="5429" r="8798" b="5587">with</wd>

<space/>

<wd l="8866" t="5429" r="9134" b="5587">the</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9206" t="5448" r="10507" b="5626">BerkeleyLM</wd>

<space/>

</run>

</ln>

<ln l="6581" t="5698" r="10507" b="5899" baseLine="5851" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="5698" r="6998" b="5856">tools</wd>

<space/>

<wd l="7099" t="5698" r="7642" b="5899">taking</wd>

<space/>

<wd l="7742" t="5750" r="7910" b="5856">as</wd>

<space/>

<wd l="8011" t="5698" r="8462" b="5899">input</wd>

<space/>

<wd l="8549" t="5722" r="9101" b="5856">tweets</wd>

<space/>

<wd l="9206" t="5698" r="9394" b="5856">of</wd>

<space/>

<wd l="9475" t="5698" r="9739" b="5856">the</wd>

<space/>

<wd l="9830" t="5698" r="10507" b="5899">training</wd>

<space/>

</ln>

<ln l="6586" t="5971" r="7229" b="6130" baseLine="6120" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="5971" r="7229" b="6130">dataset.</wd>

</ln>

</para>

<para l="6384" t="6418" r="10512" b="6850" alignment="justified" li="432" spaceBefore="185" fli="-216" lsp="exactly" lspExact="270" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="6422" r="10512" b="6624" baseLine="6571">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="6427" r="6581" b="6571">•</wd>

<tab position="6465"/>

<wd l="6581" t="6427" r="6739" b="6576">A</wd>

<space/>

<wd l="6811" t="6475" r="7166" b="6581">new</wd>

<space/>

<wd l="7238" t="6422" r="7906" b="6624">English</wd>

<space/>

<wd l="7982" t="6422" r="8861" b="6624">dictionary</wd>

<space/>

<wd l="8933" t="6422" r="9192" b="6581">for</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9274" t="6442" r="10027" b="6619">aspell</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10114" t="6422" r="10512" b="6581">built</wd>

<space/>

</run>

</ln>

<ln l="6586" t="6691" r="8750" b="6850" baseLine="6845" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="6744" r="6802" b="6850">on</wd>

<space/>

<wd l="6854" t="6691" r="7118" b="6850">the</wd>

<space/>

<wd l="7181" t="6691" r="8011" b="6850">canonical</wd>

<space/>

<wd l="8069" t="6691" r="8750" b="6850">lexicon.</wd>

</ln>

</para>

<para l="6144" t="7166" r="10512" b="10891" alignment="justified" spaceBefore="213" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="7166" r="10512" b="7368" baseLine="7315" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7166" r="6576" b="7325">With</wd>

<space/>

<wd l="6658" t="7190" r="7277" b="7368">respect</wd>

<space/>

<wd l="7358" t="7190" r="7526" b="7325">to</wd>

<space/>

<wd l="7613" t="7166" r="7877" b="7325">the</wd>

<space/>

<wd l="7968" t="7166" r="8918" b="7325">differences</wd>

<space/>

<wd l="9019" t="7166" r="9696" b="7368">existing</wd>

<space/>

<wd l="9782" t="7166" r="10512" b="7325">between</wd>

<space/>

</ln>

<ln l="6144" t="7435" r="10512" b="7637" baseLine="7584" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7435" r="6413" b="7594">the</wd>

<space/>

<wd l="6504" t="7435" r="7742" b="7637">configurations</wd>

<space/>

<wd l="7843" t="7435" r="8035" b="7594">of</wd>

<space/>

<wd l="8112" t="7435" r="8376" b="7594">the</wd>

<space/>

<wd l="8477" t="7459" r="9077" b="7637">system</wd>

<space/>

<wd l="9163" t="7435" r="9422" b="7594">for</wd>

<space/>

<wd l="9509" t="7435" r="10512" b="7594">constrained</wd>

<space/>

</ln>

<ln l="6149" t="7709" r="10512" b="7910" baseLine="7858" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="7709" r="6461" b="7867">and</wd>

<space/>

<wd l="6566" t="7709" r="7790" b="7867">unconstrained</wd>

<space/>

<wd l="7896" t="7762" r="8318" b="7896">runs,</wd>

<space/>

<wd l="8448" t="7709" r="8885" b="7867">there</wd>

<space/>

<wd l="8990" t="7709" r="9130" b="7867">is</wd>

<space/>

<wd l="9245" t="7709" r="9624" b="7910">only</wd>

<space/>

<wd l="9739" t="7762" r="10094" b="7867">one.</wd>

<space/>

<wd l="10330" t="7714" r="10512" b="7862">In</wd>

<space/>

</ln>

<ln l="6144" t="7978" r="10502" b="8179" baseLine="8126">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="7978" r="6413" b="8136">the</wd>

<space/>

<wd l="6509" t="8030" r="6878" b="8136">case</wd>

<space/>

<wd l="6979" t="7978" r="7171" b="8136">of</wd>

<space/>

<wd l="7253" t="7978" r="7517" b="8136">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7618" t="7978" r="8645" b="8136">constrained</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8741" t="8030" r="9072" b="8165">run,</wd>

<space/>

<wd l="9197" t="7978" r="9634" b="8136">since</wd>

<space/>

<wd l="9734" t="7978" r="10114" b="8179">only</wd>

<space/>

</run>

<wd l="10214" t="7982" r="10502" b="8179" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">off-</wd>

</ln>

<ln l="6149" t="8246" r="10502" b="8448" baseLine="8400">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="8246" r="6931" b="8448">the-shelf</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7003" t="8246" r="7421" b="8405">tools</wd>

<space/>

<wd l="7512" t="8299" r="7771" b="8405">are</wd>

<space/>

<wd l="7848" t="8246" r="8726" b="8448">permitted,</wd>

<space/>

<wd l="8822" t="8246" r="9086" b="8405">the</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9178" t="8266" r="9936" b="8443">aspell</wd>

<space/>

</run>

<wd l="10037" t="8246" r="10502" b="8448" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">spell-</wd>

</ln>

<ln l="6149" t="8520" r="10507" b="8722" baseLine="8669" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="8520" r="6826" b="8678">checker</wd>

<space/>

<wd l="6878" t="8573" r="7205" b="8678">was</wd>

<space/>

<wd l="7272" t="8520" r="8126" b="8722">employed</wd>

<space/>

<wd l="8179" t="8520" r="8650" b="8722">using</wd>

<space/>

<wd l="8707" t="8520" r="8904" b="8678">its</wd>

<space/>

<wd l="8971" t="8520" r="9576" b="8678">default</wd>

<space/>

<wd l="9629" t="8520" r="10507" b="8722">dictionary</wd>

<space/>

</ln>

<ln l="6144" t="8789" r="10502" b="8990" baseLine="8942" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8789" r="6422" b="8947">but</wd>

<space/>

<wd l="6470" t="8789" r="7157" b="8990">filtering</wd>

<space/>

<wd l="7205" t="8789" r="7402" b="8947">its</wd>

<space/>

<wd l="7459" t="8789" r="8227" b="8947">retrieved</wd>

<space/>

<wd l="8275" t="8789" r="9106" b="8947">candidate</wd>

<space/>

<wd l="9158" t="8789" r="10118" b="8947">corrections</wd>

<space/>

<wd l="10171" t="8789" r="10502" b="8947">tak-</wd>

</ln>

<ln l="6144" t="9062" r="10507" b="9264" baseLine="9211" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="9062" r="6422" b="9264">ing</wd>

<space/>

<wd l="6509" t="9115" r="6677" b="9221">as</wd>

<space/>

<wd l="6768" t="9062" r="7574" b="9221">reference</wd>

<space/>

<wd l="7656" t="9062" r="7925" b="9221">the</wd>

<space/>

<wd l="8011" t="9062" r="8837" b="9221">canonical</wd>

<space/>

<wd l="8918" t="9062" r="9610" b="9250">lexicon;</wd>

<space/>

<wd l="9710" t="9062" r="9970" b="9221">i.e.</wd>

<space/>

<wd l="10128" t="9062" r="10507" b="9264">only</wd>

<space/>

</ln>

<ln l="6144" t="9331" r="10502" b="9490" baseLine="9485" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="9331" r="6605" b="9490">those</wd>

<space/>

<wd l="6677" t="9331" r="7584" b="9490">candidates</wd>

<space/>

<wd l="7661" t="9331" r="7987" b="9490">that</wd>

<space/>

<wd l="8054" t="9331" r="8539" b="9490">could</wd>

<space/>

<wd l="8602" t="9331" r="8808" b="9490">be</wd>

<space/>

<wd l="8875" t="9331" r="9384" b="9490">found</wd>

<space/>

<wd l="9456" t="9384" r="9667" b="9490">on</wd>

<space/>

<wd l="9734" t="9331" r="10042" b="9490">this</wd>

<space/>

<wd l="10114" t="9331" r="10502" b="9490">lexi-</wd>

</ln>

<ln l="6149" t="9605" r="10498" b="9792" baseLine="9754" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="9658" r="6461" b="9763">con</wd>

<space/>

<wd l="6533" t="9658" r="6955" b="9763">were</wd>

<space/>

<wd l="7027" t="9605" r="7502" b="9763">taken</wd>

<space/>

<wd l="7570" t="9605" r="7906" b="9763">into</wd>

<space/>

<wd l="7987" t="9629" r="8702" b="9763">account.</wd>

<space/>

<wd l="8842" t="9610" r="9101" b="9763">On</wd>

<space/>

<wd l="9173" t="9605" r="9442" b="9763">the</wd>

<space/>

<wd l="9518" t="9605" r="9965" b="9763">other</wd>

<space/>

<wd l="10032" t="9605" r="10498" b="9792">hand,</wd>

<space/>

</ln>

<ln l="6144" t="9874" r="10502" b="10070" baseLine="10027">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="9874" r="6317" b="10027">in</wd>

<space/>

<wd l="6365" t="9874" r="6629" b="10032">the</wd>

<space/>

<wd l="6682" t="9926" r="7051" b="10032">case</wd>

<space/>

<wd l="7109" t="9874" r="7296" b="10032">of</wd>

<space/>

<wd l="7330" t="9874" r="7598" b="10032">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7651" t="9874" r="8899" b="10032">unconstrained</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8947" t="9926" r="9278" b="10061">run,</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9355" t="9893" r="10109" b="10070">aspell</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10176" t="9926" r="10502" b="10032">was</wd>

<space/>

</run>

</ln>

<ln l="6144" t="10147" r="10512" b="10349" baseLine="10296" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10147" r="6547" b="10306">used</wd>

<space/>

<wd l="6600" t="10147" r="7219" b="10306">instead</wd>

<space/>

<wd l="7267" t="10147" r="7656" b="10306">with</wd>

<space/>

<wd l="7709" t="10147" r="7973" b="10306">the</wd>

<space/>

<wd l="8030" t="10147" r="8909" b="10349">dictionary</wd>

<space/>

<wd l="8971" t="10147" r="9715" b="10306">obtained</wd>

<space/>

<wd l="9768" t="10147" r="10195" b="10306">from</wd>

<space/>

<wd l="10243" t="10147" r="10512" b="10306">the</wd>

<space/>

</ln>

<ln l="6149" t="10416" r="10512" b="10618" baseLine="10565" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="10416" r="6979" b="10574">canonical</wd>

<space/>

<wd l="7046" t="10416" r="7728" b="10574">lexicon.</wd>

<space/>

<wd l="7843" t="10416" r="8179" b="10574">The</wd>

<space/>

<wd l="8246" t="10440" r="8563" b="10574">rest</wd>

<space/>

<wd l="8635" t="10416" r="8822" b="10574">of</wd>

<space/>

<wd l="8875" t="10416" r="9144" b="10574">the</wd>

<space/>

<wd l="9211" t="10469" r="10123" b="10618">processors</wd>

<space/>

<wd l="10200" t="10416" r="10512" b="10574">and</wd>

<space/>

</ln>

<ln l="6144" t="10690" r="9293" b="10891" baseLine="10838" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10690" r="6552" b="10848">their</wd>

<space/>

<wd l="6600" t="10714" r="7550" b="10891">parameters</wd>

<space/>

<wd l="7613" t="10690" r="8424" b="10848">remained</wd>

<space/>

<wd l="8477" t="10690" r="8746" b="10848">the</wd>

<space/>

<wd l="8808" t="10742" r="9293" b="10848">same.</wd>

</ln>

</para>

<para l="6144" t="10958" r="10512" b="12230" alignment="justified" spaceBefore="4" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="6365" t="10958" r="10512" b="11160" baseLine="11107" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="10963" r="7253" b="11146">Moreover,</wd>

<space/>

<wd l="7334" t="10958" r="8093" b="11160">although</wd>

<space/>

<wd l="8155" t="11011" r="8405" b="11117">we</wd>

<space/>

<wd l="8477" t="10958" r="8818" b="11117">also</wd>

<space/>

<wd l="8890" t="10958" r="9830" b="11117">considered</wd>

<space/>

<wd l="9893" t="10958" r="10157" b="11117">the</wd>

<space/>

<wd l="10219" t="11011" r="10512" b="11117">use</wd>

<space/>

</ln>

<ln l="6149" t="11232" r="10512" b="11434" baseLine="11381" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="11232" r="6341" b="11390">of</wd>

<space/>

<wd l="6403" t="11232" r="6667" b="11390">the</wd>

<space/>

<wd l="6739" t="11232" r="7133" b="11390">Web</wd>

<space/>

<wd l="7234" t="11237" r="7450" b="11386">1T</wd>

<space/>

<wd l="7531" t="11232" r="8160" b="11434">5-gram</wd>

<space/>

<wd l="8227" t="11237" r="8424" b="11390">v1</wd>

<space/>

<wd l="8520" t="11232" r="9307" b="11434">language</wd>

<space/>

<wd l="9384" t="11232" r="9926" b="11390">model</wd>

<space/>

<wd l="10003" t="11232" r="10171" b="11386">in</wd>

<space/>

<wd l="10243" t="11232" r="10512" b="11390">the</wd>

<space/>

</ln>

<ln l="6144" t="11501" r="10512" b="11702" baseLine="11650" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11501" r="7373" b="11659">unconstrained</wd>

<space/>

<wd l="7454" t="11554" r="7790" b="11688">run,</wd>

<space/>

<wd l="7901" t="11554" r="8189" b="11659">our</wd>

<space/>

<wd l="8270" t="11501" r="9288" b="11702">preliminary</wd>

<space/>

<wd l="9374" t="11525" r="9754" b="11659">tests</wd>

<space/>

<wd l="9859" t="11501" r="10512" b="11659">showed</wd>

<space/>

</ln>

<ln l="6144" t="11770" r="10502" b="11971" baseLine="11923" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11770" r="6475" b="11928">that</wd>

<space/>

<wd l="6566" t="11770" r="6835" b="11928">the</wd>

<space/>

<wd l="6926" t="11770" r="7488" b="11928">results</wd>

<space/>

<wd l="7598" t="11770" r="8347" b="11928">obtained</wd>

<space/>

<wd l="8438" t="11822" r="8861" b="11928">were</wd>

<space/>

<wd l="8957" t="11822" r="9341" b="11971">very</wd>

<space/>

<wd l="9437" t="11822" r="9840" b="11971">poor</wd>

<space/>

<wd l="9931" t="11770" r="10104" b="11923">in</wd>

<space/>

<wd l="10195" t="11770" r="10502" b="11928">this</wd>

<space/>

</ln>

<ln l="6149" t="12043" r="9778" b="12230" baseLine="12192" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="12096" r="6566" b="12230">case,</wd>

<space/>

<wd l="6634" t="12096" r="6802" b="12202">as</wd>

<space/>

<wd l="6869" t="12096" r="7118" b="12202">we</wd>

<space/>

<wd l="7176" t="12043" r="7771" b="12202">further</wd>

<space/>

<wd l="7829" t="12067" r="8635" b="12202">comment</wd>

<space/>

<wd l="8688" t="12043" r="8861" b="12197">in</wd>

<space/>

<wd l="8918" t="12043" r="9571" b="12202">Section</wd>

<space/>

<wd l="9624" t="12048" r="9778" b="12202">4.</wd>

</ln>

</para>

<para l="6144" t="12504" r="7613" b="12677" alignment="left" spaceBefore="212" lsp="exactly" lspExact="278" language="en">

<ln l="6144" t="12504" r="7613" b="12677" baseLine="12672" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="13">

<wd l="6144" t="12504" r="6259" b="12672">4</wd>

<space/>

<wd l="6504" t="12504" r="7613" b="12677">Evaluation</wd>

</ln>

</para>

<para l="6144" t="12941" r="10512" b="15264" alignment="justified" spaceBefore="147" lsp="exactly" lspExact="269" language="en">

<ln l="6144" t="12941" r="10502" b="13099" baseLine="13090">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6144" t="12941" r="6624" b="13099">Table</wd>

<space/>

<wd l="6730" t="12946" r="6792" b="13094">1</wd>

<space/>

<wd l="6902" t="12941" r="7426" b="13099">shows</wd>

<space/>

<wd l="7512" t="12941" r="7776" b="13099">the</wd>

<space/>

<wd l="7858" t="12941" r="8419" b="13099">results</wd>

<space/>

<wd l="8510" t="12941" r="9259" b="13099">obtained</wd>

<space/>

<wd l="9336" t="12941" r="9595" b="13099">for</wd>

<space/>

<wd l="9672" t="12941" r="9936" b="13099">the</wd>

<space/>

</run>

<wd l="10022" t="12950" r="10502" b="13099" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">train-</wd>

</ln>

<ln l="6154" t="13210" r="10502" b="13411" baseLine="13358">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6154" t="13219" r="6422" b="13411">ing</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6514" t="13262" r="7133" b="13411">corpus.</wd>

<space/>

<wd l="7301" t="13214" r="7435" b="13368">It</wd>

<space/>

<wd l="7531" t="13210" r="8102" b="13368">should</wd>

<space/>

<wd l="8184" t="13210" r="8390" b="13368">be</wd>

<space/>

<wd l="8477" t="13210" r="8962" b="13368">noted</wd>

<space/>

<wd l="9048" t="13210" r="9374" b="13368">that</wd>

<space/>

<wd l="9456" t="13210" r="9902" b="13368">these</wd>

<space/>

<wd l="9994" t="13262" r="10502" b="13368">corre-</wd>

</run>

</ln>

<ln l="6154" t="13478" r="10502" b="13680" baseLine="13632">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6154" t="13478" r="6667" b="13680">spond</wd>

<space/>

<wd l="6730" t="13502" r="6893" b="13637">to</wd>

<space/>

<wd l="6965" t="13531" r="7061" b="13637">a</wd>

<space/>

<wd l="7128" t="13478" r="7766" b="13680">slightly</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7838" t="13478" r="8659" b="13680">overfitted</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="8731" t="13502" r="9370" b="13680">system,</wd>

<space/>

<wd l="9451" t="13478" r="9893" b="13637">since</wd>

<space/>

<wd l="9955" t="13531" r="10205" b="13637">we</wd>

<space/>

<wd l="10267" t="13478" r="10502" b="13632">in-</wd>

</run>

</ln>

<ln l="6149" t="13752" r="10512" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="13752" r="7118" b="13954">advertently</wd>

<space/>

<wd l="7186" t="13752" r="7584" b="13910">used</wd>

<space/>

<wd l="7651" t="13805" r="7747" b="13910">a</wd>

<space/>

<wd l="7800" t="13752" r="8587" b="13954">language</wd>

<space/>

<wd l="8650" t="13752" r="9192" b="13910">model</wd>

<space/>

<wd l="9254" t="13752" r="9653" b="13910">built</wd>

<space/>

<wd l="9710" t="13752" r="10181" b="13954">using</wd>

<space/>

<wd l="10243" t="13752" r="10512" b="13910">the</wd>

<space/>

</ln>

<ln l="6144" t="14021" r="10512" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="14021" r="6677" b="14179">whole</wd>

<space/>

<wd l="6739" t="14021" r="7416" b="14222">training</wd>

<space/>

<wd l="7483" t="14021" r="8088" b="14179">dataset</wd>

<space/>

<wd l="8155" t="14021" r="8477" b="14218">(for</wd>

<space/>

<wd l="8539" t="14021" r="9370" b="14179">candidate</wd>

<space/>

<wd l="9442" t="14021" r="10272" b="14218">selection)</wd>

<space/>

<wd l="10339" t="14021" r="10512" b="14174">in</wd>

<space/>

</ln>

<ln l="6149" t="14294" r="10502" b="14453" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="14347" r="6442" b="14453">our</wd>

<space/>

<wd l="6552" t="14294" r="7171" b="14453">10-fold</wd>

<space/>

<wd l="7262" t="14294" r="8650" b="14453">cross-validation</wd>

<space/>

<wd l="8741" t="14294" r="9730" b="14453">framework.</wd>

<space/>

<wd l="9917" t="14299" r="10502" b="14453">Never-</wd>

</ln>

<ln l="6144" t="14563" r="10512" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="14563" r="6782" b="14750">theless,</wd>

<space/>

<wd l="6854" t="14563" r="7162" b="14722">this</wd>

<space/>

<wd l="7234" t="14563" r="7574" b="14722">also</wd>

<space/>

<wd l="7642" t="14616" r="8040" b="14765">gave</wd>

<space/>

<wd l="8098" t="14616" r="8285" b="14722">us</wd>

<space/>

<wd l="8357" t="14616" r="8554" b="14722">an</wd>

<space/>

<wd l="8616" t="14563" r="9533" b="14765">interesting</wd>

<space/>

<wd l="9600" t="14563" r="9955" b="14722">clue</wd>

<space/>

<wd l="10018" t="14587" r="10181" b="14722">to</wd>

<space/>

<wd l="10243" t="14563" r="10512" b="14722">the</wd>

<space/>

</ln>

<ln l="6144" t="14837" r="10512" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="14837" r="6586" b="14995">main</wd>

<space/>

<wd l="6634" t="14837" r="7733" b="15038">performance</wd>

<space/>

<wd l="7786" t="14837" r="8693" b="14995">bottleneck</wd>

<space/>

<wd l="8746" t="14837" r="8938" b="14995">of</wd>

<space/>

<wd l="8976" t="14890" r="9269" b="14995">our</wd>

<space/>

<wd l="9322" t="14861" r="9965" b="15038">system,</wd>

<space/>

<wd l="10032" t="14890" r="10200" b="14995">as</wd>

<space/>

<wd l="10258" t="14890" r="10512" b="14995">we</wd>

<space/>

</ln>

<ln l="6144" t="15106" r="7781" b="15264" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="15106" r="6475" b="15264">will</wd>

<space/>

<wd l="6542" t="15106" r="7162" b="15264">discuss</wd>

<space/>

<wd l="7224" t="15106" r="7781" b="15264">below.</wd>

</ln>

</para>

</column>

</section>

<dd l="1430" t="15746" r="10528" b="15975">

<para l="5771" t="15792" r="6200" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15792" r="6134" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="29">

<wd l="5837" t="15792" r="6134" b="15946">102</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4315.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1432" marginTop="1260" marginRight="1379" marginBottom="1292" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1432" t="1260" r="10520" b="10435">

<column l="1432" t="1260" r="10520" b="10435">

<picture l="1666" t="1262" r="10282" b="9259" alignment="left" li="234" ri="238" spaceBefore="2" spaceAfter="257">

</picture>

<para l="1440" t="9576" r="10502" b="10046" alignment="justified" spaceAfter="370" lsp="exactly" lspExact="269" language="en">

<ln l="1440" t="9576" r="10502" b="9778" baseLine="9725" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="9576" r="2011" b="9778">Figure</wd>

<space/>

<wd l="2088" t="9581" r="2218" b="9734">1:</wd>

<space/>

<wd l="2304" t="9576" r="3024" b="9778">Original</wd>

<space/>

<wd l="3082" t="9576" r="3782" b="9778">pipeline</wd>

<space/>

<wd l="3850" t="9576" r="4267" b="9773">(left)</wd>

<space/>

<wd l="4334" t="9576" r="4646" b="9734">and</wd>

<space/>

<wd l="4699" t="9576" r="5400" b="9778">pipeline</wd>

<space/>

<wd l="5462" t="9576" r="6134" b="9778">adapted</wd>

<space/>

<wd l="6187" t="9576" r="6446" b="9734">for</wd>

<space/>

<wd l="6494" t="9581" r="7205" b="9734">W-NUT</wd>

<space/>

<wd l="7267" t="9576" r="7685" b="9734">2015</wd>

<space/>

<wd l="7762" t="9576" r="8299" b="9778">(right)</wd>

<space/>

<wd l="8366" t="9576" r="9235" b="9778">integrated</wd>

<space/>

<wd l="9288" t="9576" r="9624" b="9734">into</wd>

<space/>

<wd l="9682" t="9576" r="9946" b="9734">the</wd>

<space/>

<wd l="10008" t="9576" r="10502" b="9734">archi-</wd>

</ln>

<ln l="1440" t="9845" r="3293" b="10046" baseLine="9998" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="9869" r="2035" b="10003">tecture</wd>

<space/>

<wd l="2093" t="9845" r="2285" b="10003">of</wd>

<space/>

<wd l="2323" t="9845" r="2592" b="10003">the</wd>

<space/>

<wd l="2654" t="9869" r="3293" b="10046">system.</wd>

</ln>

</para>

</column>

</section>

<section l="1432" t="10435" r="10530" b="15319">

<column l="1432" t="10435" r="5819" b="15319">

<table l="1507" t="10445" r="5741" b="11285" alignment="left" li="75" ri="78" spaceBefore="10" spaceAfter="251">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>1464</gridCol>

<gridCol>1085</gridCol>

<gridCol>840</gridCol>

<gridCol>845</gridCol>

<gridRow>283</gridRow>

<gridRow>255</gridRow>

<gridRow>302</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="1507" t="10445" r="2971" b="10728" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3091" t="10488" r="3936" b="10690" alignment="centered" spaceAfter="27" lsp="exactly" lspExact="251" language="en">

<ln l="3091" t="10488" r="3936" b="10690" baseLine="10642" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3091" t="10488" r="3936" b="10690">precision</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4224" t="10493" r="4733" b="10646" alignment="centered" spaceAfter="27" lsp="exactly" lspExact="251" language="en">

<ln l="4224" t="10493" r="4733" b="10646" baseLine="10642" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4224" t="10493" r="4733" b="10646">recall</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5194" t="10488" r="5429" b="10642" alignment="centered" spaceAfter="27" lsp="exactly" lspExact="251" language="en">

<ln l="5194" t="10488" r="5429" b="10642" baseLine="10642" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5194" t="10488" r="5429" b="10642">F1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="1637" t="10766" r="2635" b="10925" alignment="left" li="125" lsp="exactly" lspExact="244" language="en">

<ln l="1637" t="10766" r="2635" b="10925" baseLine="10920" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1637" t="10766" r="2635" b="10925">constrained</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<para l="3221" t="10766" r="3811" b="10925" alignment="centered" lsp="exactly" lspExact="244" language="en">

<ln l="3221" t="10766" r="3811" b="10925" baseLine="10920" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3221" t="10766" r="3811" b="10925">0.8956</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="4181" t="10766" r="4771" b="10925" alignment="centered" lsp="exactly" lspExact="244" language="en">

<ln l="4181" t="10766" r="4771" b="10925" baseLine="10920" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4181" t="10766" r="4771" b="10925">0.8746</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5021" t="10766" r="5611" b="10925" alignment="centered" lsp="exactly" lspExact="244" language="en">

<ln l="5021" t="10766" r="5611" b="10925" baseLine="10920" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5021" t="10766" r="5611" b="10925">0.8850</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="1632" t="11040" r="2856" b="11198" alignment="left" li="125" spaceAfter="29" lsp="exactly" lspExact="263" language="en">

<ln l="1632" t="11040" r="2856" b="11198" baseLine="11189" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1632" t="11040" r="2856" b="11198">unconstrained</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3221" t="11045" r="3811" b="11198" alignment="centered" spaceAfter="29" lsp="exactly" lspExact="263" language="en">

<ln l="3221" t="11045" r="3811" b="11198" baseLine="11189" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3221" t="11045" r="3811" b="11198">0.8914</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="4181" t="11045" r="4766" b="11198" alignment="centered" spaceAfter="29" lsp="exactly" lspExact="263" language="en">

<ln l="4181" t="11045" r="4766" b="11198" baseLine="11189" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4181" t="11045" r="4766" b="11198">0.8739</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5021" t="11040" r="5602" b="11198" alignment="centered" spaceAfter="29" lsp="exactly" lspExact="263" language="en">

<ln l="5021" t="11040" r="5602" b="11198" baseLine="11189" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5021" t="11040" r="5602" b="11198">0.8825</wd>

</ln>

</para>

</cell>

</table>

<para l="2525" t="11597" r="4709" b="11798" alignment="centered" spaceAfter="235" lsp="exactly" lspExact="267" language="en">

<ln l="2525" t="11597" r="4709" b="11798" baseLine="11746" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2525" t="11597" r="3005" b="11755">Table</wd>

<space/>

<wd l="3082" t="11602" r="3211" b="11755">1:</wd>

<space/>

<wd l="3298" t="11597" r="4037" b="11798">Training</wd>

<space/>

<wd l="4094" t="11597" r="4709" b="11755">results.</wd>

</ln>

</para>

<table l="1507" t="12048" r="5741" b="12883" alignment="left" li="75" ri="78" spaceBefore="5" spaceAfter="257">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<gridTable>

<gridCol>1464</gridCol>

<gridCol>1085</gridCol>

<gridCol>840</gridCol>

<gridCol>845</gridCol>

<gridRow>283</gridRow>

<gridRow>255</gridRow>

<gridRow>297</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1507" t="12048" r="2971" b="12331" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="3091" t="12096" r="3936" b="12298" alignment="centered" spaceAfter="22" lsp="exactly" lspExact="251" language="en">

<ln l="3091" t="12096" r="3936" b="12298" baseLine="12245" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3091" t="12096" r="3936" b="12298">precision</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4224" t="12101" r="4733" b="12254" alignment="centered" spaceAfter="22" lsp="exactly" lspExact="251" language="en">

<ln l="4224" t="12101" r="4733" b="12254" baseLine="12245" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4224" t="12101" r="4733" b="12254">recall</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5194" t="12096" r="5429" b="12250" alignment="centered" spaceAfter="22" lsp="exactly" lspExact="251" language="en">

<ln l="5194" t="12096" r="5429" b="12250" baseLine="12245" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5194" t="12096" r="5429" b="12250">F1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<para l="1637" t="12374" r="2635" b="12533" alignment="left" li="125" spaceAfter="5" lsp="exactly" lspExact="249" language="en">

<ln l="1637" t="12374" r="2635" b="12533" baseLine="12523" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1637" t="12374" r="2635" b="12533">constrained</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<para l="3221" t="12374" r="3811" b="12533" alignment="centered" spaceAfter="5" lsp="exactly" lspExact="249" language="en">

<ln l="3221" t="12374" r="3811" b="12533" baseLine="12523" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3221" t="12374" r="3811" b="12533">0.4646</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="5"/>

<para l="4181" t="12374" r="4752" b="12533" alignment="centered" spaceAfter="5" lsp="exactly" lspExact="249" language="en">

<ln l="4181" t="12374" r="4752" b="12533" baseLine="12523" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="4181" t="12374" r="4752" b="12533">0.6281</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<para l="5021" t="12374" r="5592" b="12533" alignment="centered" spaceAfter="5" lsp="exactly" lspExact="249" language="en">

<ln l="5021" t="12374" r="5592" b="12533" baseLine="12523" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="5021" t="12374" r="5592" b="12533">0.5341</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1632" t="12643" r="2856" b="12802" alignment="left" li="125" spaceAfter="19" lsp="exactly" lspExact="268" language="en">

<ln l="1632" t="12643" r="2856" b="12802" baseLine="12797" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1632" t="12643" r="2856" b="12802">unconstrained</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="3221" t="12643" r="3811" b="12802" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="268" language="en">

<ln l="3221" t="12643" r="3811" b="12802" baseLine="12797" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3221" t="12643" r="3811" b="12802">0.4592</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<bottomBorder type="single" width="5"/>

<para l="4181" t="12643" r="4771" b="12802" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="268" language="en">

<ln l="4181" t="12643" r="4771" b="12802" baseLine="12797" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4181" t="12643" r="4771" b="12802">0.6296</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5021" t="12643" r="5611" b="12802" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="268" language="en">

<ln l="5021" t="12643" r="5611" b="12802" baseLine="12797" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5021" t="12643" r="5611" b="12802">0.5310</wd>

</ln>

</para>

</cell>

</table>

<para l="2578" t="13200" r="4656" b="13402" alignment="centered" lsp="exactly" lspExact="271" language="en">

<ln l="2578" t="13200" r="4656" b="13402" baseLine="13354" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2578" t="13200" r="3058" b="13358">Table</wd>

<space/>

<wd l="3115" t="13205" r="3264" b="13358">2:</wd>

<space/>

<wd l="3350" t="13200" r="3984" b="13402">Testing</wd>

<space/>

<wd l="4042" t="13200" r="4656" b="13358">results.</wd>

</ln>

</para>

<para l="1440" t="13882" r="5813" b="14894" alignment="justified" spaceBefore="408" spaceAfter="130" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="13882" r="5813" b="14040" baseLine="14030">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1656" t="13882" r="2136" b="14040">Table</wd>

<space/>

<wd l="2218" t="13886" r="2318" b="14035">2</wd>

<space/>

<wd l="2410" t="13882" r="2933" b="14040">shows</wd>

<space/>

<wd l="3014" t="13882" r="3278" b="14040">the</wd>

<space/>

<wd l="3355" t="13882" r="3917" b="14040">results</wd>

<space/>

<wd l="4008" t="13882" r="4757" b="14040">obtained</wd>

<space/>

<wd l="4829" t="13882" r="5088" b="14040">for</wd>

<space/>

<wd l="5160" t="13882" r="5424" b="14040">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1"><wd l="5506" t="13915" r="5813" b="14040">test</wd>

<space/>

</run>

</ln>

<ln l="1445" t="14150" r="5808" b="14352" baseLine="14304" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="14203" r="2064" b="14352">corpus.</wd>

<space/>

<wd l="2170" t="14155" r="2386" b="14309">At</wd>

<space/>

<wd l="2448" t="14150" r="2712" b="14309">the</wd>

<space/>

<wd l="2784" t="14150" r="3202" b="14352">sight</wd>

<space/>

<wd l="3269" t="14150" r="3461" b="14309">of</wd>

<space/>

<wd l="3509" t="14150" r="3955" b="14309">these</wd>

<space/>

<wd l="4022" t="14150" r="4656" b="14352">figures,</wd>

<space/>

<wd l="4733" t="14150" r="5266" b="14309">which</wd>

<space/>

<wd l="5333" t="14150" r="5808" b="14309">differ</wd>

<space/>

</ln>

<ln l="1445" t="14424" r="5808" b="14626" baseLine="14573" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="14424" r="2554" b="14626">considerably</wd>

<space/>

<wd l="2626" t="14424" r="3053" b="14582">from</wd>

<space/>

<wd l="3120" t="14424" r="3384" b="14582">the</wd>

<space/>

<wd l="3456" t="14424" r="4195" b="14626">previous</wd>

<space/>

<wd l="4277" t="14477" r="4718" b="14611">ones,</wd>

<space/>

<wd l="4800" t="14477" r="5054" b="14582">we</wd>

<space/>

<wd l="5131" t="14424" r="5808" b="14582">decided</wd>

<space/>

</ln>

<ln l="1440" t="14693" r="5794" b="14894" baseLine="14846" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="14717" r="1608" b="14851">to</wd>

<space/>

<wd l="1685" t="14693" r="2333" b="14894">analyse</wd>

<space/>

<wd l="2400" t="14693" r="2842" b="14851">them</wd>

<space/>

<wd l="2904" t="14693" r="3077" b="14846">in</wd>

<space/>

<wd l="3144" t="14746" r="3590" b="14851">more</wd>

<space/>

<wd l="3667" t="14693" r="4190" b="14851">detail.</wd>

<space/>

<wd l="4310" t="14698" r="4613" b="14851">For</wd>

<space/>

<wd l="4675" t="14693" r="4982" b="14851">this</wd>

<space/>

<wd l="5059" t="14746" r="5794" b="14894">purpose,</wd>

</ln>

</para>

<rulerline l="1432" t="15048" r="2640" b="15048" type="single" width="10" color="000000"/>

<para l="1699" t="15101" r="3466" b="15293" alignment="left" li="216" spaceBefore="59" spaceAfter="14" lsp="exactly" lspExact="192" language="en">

<ln l="1699" t="15101" r="3466" b="15293" baseLine="15254">

<wd l="1699" t="15101" r="3466" b="15293"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-1">3</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1">http://redis.io/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1"><nl orig="true"/>

</run>

</ln>

</para>

</column>

<column l="6143" t="10435" r="10530" b="15057">

<para l="6144" t="10512" r="10517" b="15048" alignment="justified" spaceBefore="10" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="10512" r="10502" b="10714" baseLine="10661" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="10565" r="6398" b="10670">we</wd>

<space/>

<wd l="6446" t="10512" r="7195" b="10670">obtained</wd>

<space/>

<wd l="7238" t="10565" r="7334" b="10670">a</wd>

<space/>

<wd l="7373" t="10512" r="7848" b="10670">recall</wd>

<space/>

<wd l="7901" t="10512" r="8453" b="10670">metric</wd>

<space/>

<wd l="8501" t="10565" r="8717" b="10670">on</wd>

<space/>

<wd l="8760" t="10512" r="9024" b="10670">the</wd>

<space/>

<wd l="9077" t="10565" r="9562" b="10714">scope</wd>

<space/>

<wd l="9610" t="10512" r="9802" b="10670">of</wd>

<space/>

<wd l="9826" t="10512" r="10094" b="10670">the</wd>

<space/>

<wd l="10142" t="10565" r="10502" b="10670">can-</wd>

</ln>

<ln l="6149" t="10781" r="10498" b="10982" baseLine="10934" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="10781" r="6754" b="10939">didates</wd>

<space/>

<wd l="6845" t="10781" r="7646" b="10982">proposed</wd>

<space/>

<wd l="7728" t="10781" r="7944" b="10982">by</wd>

<space/>

<wd l="8030" t="10781" r="8294" b="10939">the</wd>

<space/>

<wd l="8390" t="10805" r="9034" b="10982">system;</wd>

<space/>

<wd l="9144" t="10781" r="9312" b="10934">in</wd>

<space/>

<wd l="9398" t="10781" r="9845" b="10939">other</wd>

<space/>

<wd l="9926" t="10781" r="10498" b="10968">words,</wd>

<space/>

</ln>

<ln l="6144" t="11054" r="10502" b="11256" baseLine="11203" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="11107" r="6398" b="11213">we</wd>

<space/>

<wd l="6451" t="11054" r="7080" b="11213">wanted</wd>

<space/>

<wd l="7133" t="11078" r="7296" b="11213">to</wd>

<space/>

<wd l="7363" t="11107" r="7627" b="11213">see</wd>

<space/>

<wd l="7680" t="11054" r="8050" b="11213">how</wd>

<space/>

<wd l="8102" t="11107" r="8582" b="11256">many</wd>

<space/>

<wd l="8635" t="11054" r="9101" b="11213">times</wd>

<space/>

<wd l="9158" t="11054" r="9427" b="11213">the</wd>

<space/>

<wd l="9485" t="11078" r="10085" b="11213">correct</wd>

<space/>

<wd l="10142" t="11107" r="10502" b="11213">can-</wd>

</ln>

<ln l="6149" t="11323" r="10502" b="11525" baseLine="11477" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="11323" r="6677" b="11482">didate</wd>

<space/>

<wd l="6739" t="11323" r="7978" b="11525">corresponding</wd>

<space/>

<wd l="8040" t="11347" r="8203" b="11482">to</wd>

<space/>

<wd l="8266" t="11376" r="8362" b="11482">a</wd>

<space/>

<wd l="8414" t="11323" r="8899" b="11482">token</wd>

<space/>

<wd l="8957" t="11323" r="9149" b="11482">of</wd>

<space/>

<wd l="9192" t="11323" r="9456" b="11482">the</wd>

<space/>

<wd l="9518" t="11323" r="10118" b="11482">dataset</wd>

<space/>

<wd l="10176" t="11376" r="10502" b="11482">was</wd>

<space/>

</ln>

<ln l="6149" t="11597" r="10512" b="11798" baseLine="11746" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="11650" r="6734" b="11798">among</wd>

<space/>

<wd l="6826" t="11597" r="7090" b="11755">the</wd>

<space/>

<wd l="7181" t="11650" r="7570" b="11755">ones</wd>

<space/>

<wd l="7666" t="11597" r="8611" b="11755">considered</wd>

<space/>

<wd l="8693" t="11597" r="8909" b="11798">by</wd>

<space/>

<wd l="9000" t="11597" r="9264" b="11755">the</wd>

<space/>

<wd l="9360" t="11621" r="9998" b="11798">system.</wd>

<space/>

<wd l="10171" t="11597" r="10512" b="11755">The</wd>

<space/>

</ln>

<ln l="6144" t="11866" r="10512" b="12067" baseLine="12014">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6144" t="11866" r="6907" b="12067">resulting</wd>

<space/>

<wd l="6989" t="11866" r="7387" b="12024">ratio</wd>

<space/>

<wd l="7478" t="11918" r="7930" b="12024">came</wd>

<space/>

<wd l="8011" t="11890" r="8179" b="12024">to</wd>

<space/>

</run>

<wd l="8290" t="11880" r="8832" b="12053"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-4">0.87</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="8928" t="11866" r="9466" b="12024">which</wd>

<space/>

<wd l="9547" t="11918" r="10094" b="12024">means</wd>

<space/>

<wd l="10186" t="11866" r="10512" b="12024">that</wd>

<space/>

</run>

</ln>

<ln l="6144" t="12139" r="10512" b="12298" baseLine="12288" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="12163" r="6571" b="12298">most</wd>

<space/>

<wd l="6634" t="12139" r="6826" b="12298">of</wd>

<space/>

<wd l="6869" t="12139" r="7138" b="12298">the</wd>

<space/>

<wd l="7195" t="12139" r="7661" b="12298">times</wd>

<space/>

<wd l="7728" t="12192" r="7982" b="12298">we</wd>

<space/>

<wd l="8045" t="12139" r="8362" b="12298">had</wd>

<space/>

<wd l="8419" t="12139" r="8736" b="12298">had</wd>

<space/>

<wd l="8794" t="12139" r="9058" b="12298">the</wd>

<space/>

<wd l="9125" t="12139" r="9725" b="12298">chance</wd>

<space/>

<wd l="9787" t="12163" r="9950" b="12298">to</wd>

<space/>

<wd l="10022" t="12139" r="10512" b="12298">select</wd>

<space/>

</ln>

<ln l="6144" t="12408" r="10502" b="12610" baseLine="12557" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="12408" r="6413" b="12566">the</wd>

<space/>

<wd l="6509" t="12432" r="7109" b="12566">correct</wd>

<space/>

<wd l="7200" t="12408" r="8410" b="12566">normalization</wd>

<space/>

<wd l="8501" t="12408" r="8928" b="12566">form</wd>

<space/>

<wd l="9014" t="12408" r="9274" b="12566">for</wd>

<space/>

<wd l="9365" t="12461" r="9461" b="12566">a</wd>

<space/>

<wd l="9552" t="12408" r="10022" b="12610">given</wd>

<space/>

<wd l="10109" t="12461" r="10502" b="12566">non-</wd>

</ln>

<ln l="6154" t="12677" r="10512" b="12878" baseLine="12830" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="12677" r="6888" b="12835">standard</wd>

<space/>

<wd l="6960" t="12677" r="7445" b="12835">token</wd>

<space/>

<wd l="7517" t="12677" r="7790" b="12835">but</wd>

<space/>

<wd l="7867" t="12677" r="8131" b="12835">the</wd>

<space/>

<wd l="8218" t="12701" r="8813" b="12878">system</wd>

<space/>

<wd l="8885" t="12677" r="9384" b="12835">failed</wd>

<space/>

<wd l="9456" t="12701" r="9624" b="12835">to</wd>

<space/>

<wd l="9701" t="12677" r="10171" b="12835">make</wd>

<space/>

<wd l="10243" t="12677" r="10512" b="12835">the</wd>

<space/>

</ln>

<ln l="6154" t="12950" r="10502" b="13152" baseLine="13099" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="12950" r="6965" b="13138">selection,</wd>

<space/>

<wd l="7061" t="12950" r="7373" b="13109">and</wd>

<space/>

<wd l="7450" t="12950" r="7584" b="13109">is</wd>

<space/>

<wd l="7675" t="12950" r="8016" b="13109">also</wd>

<space/>

<wd l="8102" t="13003" r="8198" b="13109">a</wd>

<space/>

<wd l="8275" t="12950" r="9144" b="13109">consistent</wd>

<space/>

<wd l="9226" t="12950" r="9730" b="13152">figure</wd>

<space/>

<wd l="9806" t="12950" r="10195" b="13109">with</wd>

<space/>

<wd l="10267" t="13003" r="10502" b="13109">re-</wd>

</ln>

<ln l="6154" t="13219" r="10517" b="13421" baseLine="13373" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="13243" r="6595" b="13421">spect</wd>

<space/>

<wd l="6667" t="13243" r="6830" b="13378">to</wd>

<space/>

<wd l="6907" t="13219" r="7368" b="13378">those</wd>

<space/>

<wd l="7450" t="13219" r="8002" b="13378">shown</wd>

<space/>

<wd l="8078" t="13272" r="8294" b="13378">on</wd>

<space/>

<wd l="8362" t="13219" r="8842" b="13378">Table</wd>

<space/>

<wd l="8938" t="13224" r="9067" b="13378">1.</wd>

<space/>

<wd l="9197" t="13219" r="9576" b="13378">This</wd>

<space/>

<wd l="9658" t="13272" r="9984" b="13378">was</wd>

<space/>

<wd l="10066" t="13243" r="10344" b="13378">not</wd>

<space/>

<wd l="10421" t="13272" r="10517" b="13378">a</wd>

<space/>

</ln>

<ln l="6144" t="13493" r="10502" b="13694" baseLine="13642" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="13493" r="6422" b="13694">big</wd>

<space/>

<wd l="6518" t="13493" r="7200" b="13694">surprise</wd>

<space/>

<wd l="7286" t="13493" r="7546" b="13651">for</wd>

<space/>

<wd l="7627" t="13546" r="7867" b="13680">us,</wd>

<space/>

<wd l="7973" t="13493" r="8573" b="13694">mainly</wd>

<space/>

<wd l="8664" t="13493" r="9355" b="13651">because</wd>

<space/>

<wd l="9442" t="13493" r="9562" b="13651">it</wd>

<space/>

<wd l="9648" t="13493" r="9787" b="13651">is</wd>

<space/>

<wd l="9883" t="13546" r="9979" b="13651">a</wd>

<space/>

<wd l="10061" t="13493" r="10502" b="13651">well-</wd>

</ln>

<ln l="6144" t="13762" r="10512" b="13963" baseLine="13915" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="13762" r="6734" b="13920">known</wd>

<space/>

<wd l="6806" t="13762" r="7536" b="13963">problem</wd>

<space/>

<wd l="7608" t="13814" r="7858" b="13920">we</wd>

<space/>

<wd l="7934" t="13762" r="8338" b="13920">have</wd>

<space/>

<wd l="8410" t="13762" r="8822" b="13920">been</wd>

<space/>

<wd l="8899" t="13814" r="9408" b="13920">aware</wd>

<space/>

<wd l="9485" t="13762" r="9677" b="13920">of</wd>

<space/>

<wd l="9744" t="13762" r="10186" b="13920">since</wd>

<space/>

<wd l="10258" t="13814" r="10512" b="13920">we</wd>

<space/>

</ln>

<ln l="6154" t="14035" r="10498" b="14237" baseLine="14184" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="14035" r="6730" b="14194">started</wd>

<space/>

<wd l="6782" t="14035" r="7502" b="14237">working</wd>

<space/>

<wd l="7565" t="14088" r="7776" b="14194">on</wd>

<space/>

<wd l="7838" t="14035" r="8654" b="14237">(Spanish)</wd>

<space/>

<wd l="8717" t="14059" r="9192" b="14194">tweet</wd>

<space/>

<wd l="9245" t="14035" r="10498" b="14194">normalization.</wd>

<space/>

</ln>

<ln l="6144" t="14304" r="10512" b="14506" baseLine="14458" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="14304" r="7051" b="14491">Therefore,</wd>

<space/>

<wd l="7133" t="14357" r="7382" b="14462">we</wd>

<space/>

<wd l="7459" t="14357" r="7752" b="14462">can</wd>

<space/>

<wd l="7829" t="14304" r="8611" b="14462">conclude</wd>

<space/>

<wd l="8678" t="14304" r="9010" b="14462">that</wd>

<space/>

<wd l="9072" t="14304" r="9341" b="14462">the</wd>

<space/>

<wd l="9408" t="14304" r="10512" b="14506">performance</wd>

<space/>

</ln>

<ln l="6144" t="14578" r="10502" b="14779" baseLine="14726" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="14578" r="7056" b="14736">bottleneck</wd>

<space/>

<wd l="7128" t="14578" r="7320" b="14736">of</wd>

<space/>

<wd l="7378" t="14630" r="7670" b="14736">our</wd>

<space/>

<wd l="7742" t="14602" r="8342" b="14779">system</wd>

<space/>

<wd l="8405" t="14578" r="8544" b="14736">is</wd>

<space/>

<wd l="8630" t="14578" r="8947" b="14736">still</wd>

<space/>

<wd l="9019" t="14578" r="9283" b="14736">the</wd>

<space/>

<wd l="9355" t="14578" r="10186" b="14736">candidate</wd>

<space/>

<wd l="10267" t="14630" r="10502" b="14736">se-</wd>

</ln>

<ln l="6144" t="14846" r="10512" b="15048" baseLine="14995" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="14846" r="6739" b="15005">lection</wd>

<space/>

<wd l="6792" t="14899" r="7488" b="15048">process,</wd>

<space/>

<wd l="7550" t="14846" r="8083" b="15005">which</wd>

<space/>

<wd l="8131" t="14846" r="8270" b="15005">is</wd>

<space/>

<wd l="8328" t="14846" r="8962" b="15048">heavily</wd>

<space/>

<wd l="9019" t="14846" r="9926" b="15005">influenced</wd>

<space/>

<wd l="9974" t="14846" r="10190" b="15048">by</wd>

<space/>

<wd l="10243" t="14846" r="10512" b="15005">the</wd>

</ln>

</para>

</column>

</section>

<dd l="1432" t="15746" r="10530" b="15975">

<para l="5771" t="15792" r="6191" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15792" r="6125" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="27">

<wd l="5837" t="15792" r="6125" b="15946">103</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4315.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1437" marginTop="1260" marginRight="1378" marginBottom="1292" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1437" t="1260" r="10531" b="15316">

<column l="1437" t="1260" r="5824" b="15316">

<para l="1440" t="1320" r="3442" b="1522" alignment="justified" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="1320" r="3442" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="1320" r="2227" b="1522">language</wd>

<space/>

<wd l="2280" t="1320" r="2822" b="1478">model</wd>

<space/>

<wd l="2880" t="1320" r="3053" b="1474">in</wd>

<space/>

<wd l="3106" t="1373" r="3442" b="1478">use.</wd>

</ln>

</para>

<para l="1440" t="1608" r="5818" b="7771" alignment="justified" spaceBefore="16" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="1608" r="5803" b="1810" baseLine="1762" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1656" t="1613" r="1843" b="1762">In</wd>

<space/>

<wd l="1934" t="1608" r="2242" b="1766">this</wd>

<space/>

<wd l="2347" t="1632" r="3005" b="1810">respect,</wd>

<space/>

<wd l="3125" t="1608" r="3677" b="1810">tuning</wd>

<space/>

<wd l="3782" t="1608" r="4834" b="1810">experiments</wd>

<space/>

<wd l="4934" t="1661" r="5357" b="1766">were</wd>

<space/>

<wd l="5458" t="1608" r="5803" b="1766">also</wd>

<space/>

</ln>

<ln l="1440" t="1882" r="5794" b="2083" baseLine="2030" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="1882" r="1910" b="2040">made</wd>

<space/>

<wd l="1992" t="1882" r="2208" b="2083">by</wd>

<space/>

<wd l="2299" t="1882" r="3149" b="2083">extending</wd>

<space/>

<wd l="3235" t="1934" r="3528" b="2040">our</wd>

<space/>

<wd l="3605" t="1882" r="4829" b="2040">unconstrained</wd>

<space/>

<wd l="4915" t="1882" r="5794" b="2083">configura-</wd>

</ln>

<ln l="1440" t="2150" r="5784" b="2352" baseLine="2299" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="2150" r="1781" b="2309">tion</wd>

<space/>

<wd l="1829" t="2150" r="2506" b="2352">through</wd>

<space/>

<wd l="2554" t="2150" r="2822" b="2309">the</wd>

<space/>

<wd l="2875" t="2150" r="3586" b="2309">addition</wd>

<space/>

<wd l="3638" t="2150" r="3826" b="2309">of</wd>

<space/>

<wd l="3864" t="2150" r="4128" b="2309">the</wd>

<space/>

<wd l="4176" t="2150" r="4570" b="2309">Web</wd>

<space/>

<wd l="4642" t="2155" r="4858" b="2304">1T</wd>

<space/>

<wd l="4915" t="2150" r="5544" b="2352">5-gram</wd>

<space/>

<wd l="5587" t="2155" r="5784" b="2309">v1</wd>

<space/>

</ln>

<ln l="1440" t="2424" r="5794" b="2626" baseLine="2573" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="2424" r="2107" b="2626">English</wd>

<space/>

<wd l="2194" t="2424" r="2981" b="2626">language</wd>

<space/>

<wd l="3067" t="2424" r="3610" b="2582">model</wd>

<space/>

<wd l="3701" t="2477" r="3869" b="2582">as</wd>

<space/>

<wd l="3965" t="2477" r="4061" b="2582">a</wd>

<space/>

<wd l="4142" t="2424" r="5098" b="2626">knowledge</wd>

<space/>

<wd l="5189" t="2477" r="5794" b="2582">source.</wd>

<space/>

</ln>

<ln l="1445" t="2693" r="5794" b="2894" baseLine="2842" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="2693" r="1872" b="2894">Only</wd>

<space/>

<wd l="1982" t="2693" r="2784" b="2894">unigrams</wd>

<space/>

<wd l="2904" t="2693" r="3211" b="2851">and</wd>

<space/>

<wd l="3317" t="2693" r="4013" b="2894">bigrams</wd>

<space/>

<wd l="4128" t="2693" r="4608" b="2851">could</wd>

<space/>

<wd l="4714" t="2693" r="4915" b="2851">be</wd>

<space/>

<wd l="5021" t="2693" r="5424" b="2851">used</wd>

<space/>

<wd l="5525" t="2693" r="5794" b="2851">be-</wd>

</ln>

<ln l="1445" t="2962" r="5794" b="3163" baseLine="3115" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="3014" r="1925" b="3120">cause</wd>

<space/>

<wd l="1997" t="2962" r="2189" b="3120">of</wd>

<space/>

<wd l="2237" t="2962" r="3024" b="3120">unsolved</wd>

<space/>

<wd l="3091" t="3014" r="3811" b="3163">memory</wd>

<space/>

<wd l="3883" t="2962" r="4862" b="3120">limitations.</wd>

<space/>

<wd l="4973" t="2966" r="5794" b="3149">However,</wd>

<space/>

</ln>

<ln l="1440" t="3235" r="5808" b="3437" baseLine="3384" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="3235" r="1613" b="3389">in</wd>

<space/>

<wd l="1694" t="3259" r="2381" b="3394">contrast</wd>

<space/>

<wd l="2462" t="3235" r="2851" b="3394">with</wd>

<space/>

<wd l="2928" t="3235" r="3667" b="3437">previous</wd>

<space/>

<wd l="3758" t="3235" r="4810" b="3437">experiments</wd>

<space/>

<wd l="4896" t="3235" r="5808" b="3437">performed</wd>

<space/>

</ln>

<ln l="1440" t="3504" r="5794" b="3706" baseLine="3658" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="3504" r="1699" b="3662">for</wd>

<space/>

<wd l="1762" t="3504" r="2491" b="3706">Spanish,</wd>

<space/>

<wd l="2563" t="3504" r="2827" b="3662">the</wd>

<space/>

<wd l="2890" t="3504" r="3648" b="3706">resulting</wd>

<space/>

<wd l="3710" t="3504" r="4814" b="3706">performance</wd>

<space/>

<wd l="4877" t="3557" r="5203" b="3662">was</wd>

<space/>

<wd l="5270" t="3528" r="5794" b="3662">unsat-</wd>

</ln>

<ln l="1440" t="3778" r="5794" b="3979" baseLine="3926" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="3778" r="2232" b="3979">isfactory.</wd>

<space/>

<wd l="2400" t="3782" r="3125" b="3936">Because</wd>

<space/>

<wd l="3216" t="3778" r="3408" b="3936">of</wd>

<space/>

<wd l="3480" t="3778" r="3835" b="3965">this,</wd>

<space/>

<wd l="3941" t="3778" r="4205" b="3936">the</wd>

<space/>

<wd l="4291" t="3830" r="4579" b="3936">use</wd>

<space/>

<wd l="4670" t="3778" r="4862" b="3936">of</wd>

<space/>

<wd l="4934" t="3778" r="5381" b="3936">these</wd>

<space/>

<wd l="5467" t="3778" r="5794" b="3936">lan-</wd>

</ln>

<ln l="1445" t="4046" r="5794" b="4248" baseLine="4200" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="4099" r="1958" b="4248">guage</wd>

<space/>

<wd l="2050" t="4046" r="2674" b="4205">models</wd>

<space/>

<wd l="2774" t="4046" r="3034" b="4205">for</wd>

<space/>

<wd l="3125" t="4099" r="3413" b="4205">our</wd>

<space/>

<wd l="3504" t="4046" r="3883" b="4205">final</wd>

<space/>

<wd l="3989" t="4046" r="4963" b="4205">submission</wd>

<space/>

<wd l="5050" t="4099" r="5381" b="4205">was</wd>

<space/>

<wd l="5482" t="4046" r="5794" b="4205">dis-</wd>

</ln>

<ln l="1440" t="4320" r="5808" b="4522" baseLine="4469" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="4320" r="2088" b="4478">missed.</wd>

<space/>

<wd l="2222" t="4320" r="3139" b="4522">According</wd>

<space/>

<wd l="3216" t="4344" r="3379" b="4478">to</wd>

<space/>

<wd l="3461" t="4373" r="3754" b="4478">our</wd>

<space/>

<wd l="3826" t="4320" r="4565" b="4522">analysis,</wd>

<space/>

<wd l="4656" t="4320" r="4920" b="4478">the</wd>

<space/>

<wd l="4997" t="4373" r="5477" b="4478">cause</wd>

<space/>

<wd l="5549" t="4320" r="5808" b="4478">for</wd>

<space/>

</ln>

<ln l="1440" t="4589" r="5803" b="4790" baseLine="4742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="4589" r="1747" b="4747">this</wd>

<space/>

<wd l="1834" t="4642" r="2347" b="4747">seems</wd>

<space/>

<wd l="2424" t="4613" r="2587" b="4747">to</wd>

<space/>

<wd l="2659" t="4589" r="2866" b="4747">be</wd>

<space/>

<wd l="2933" t="4589" r="3197" b="4747">the</wd>

<space/>

<wd l="3274" t="4613" r="3706" b="4790">great</wd>

<space/>

<wd l="3773" t="4589" r="4776" b="4776">differences,</wd>

<space/>

<wd l="4862" t="4613" r="5016" b="4747">at</wd>

<space/>

<wd l="5083" t="4589" r="5472" b="4747">both</wd>

<space/>

<wd l="5539" t="4589" r="5803" b="4747">the</wd>

<space/>

</ln>

<ln l="1440" t="4862" r="5798" b="5064" baseLine="5011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="4862" r="2016" b="5021">lexical</wd>

<space/>

<wd l="2117" t="4862" r="2429" b="5021">and</wd>

<space/>

<wd l="2534" t="4862" r="3456" b="5064">syntactical</wd>

<space/>

<wd l="3552" t="4862" r="4094" b="5050">levels,</wd>

<space/>

<wd l="4214" t="4862" r="4939" b="5021">between</wd>

<space/>

<wd l="5035" t="4862" r="5299" b="5021">the</wd>

<space/>

<wd l="5395" t="4886" r="5798" b="5021">texts</wd>

<space/>

</ln>

<ln l="1440" t="5131" r="5794" b="5318" baseLine="5280" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5131" r="1843" b="5290">used</wd>

<space/>

<wd l="1944" t="5155" r="2107" b="5290">to</wd>

<space/>

<wd l="2213" t="5131" r="2659" b="5290">build</wd>

<space/>

<wd l="2760" t="5131" r="3067" b="5290">this</wd>

<space/>

<wd l="3178" t="5131" r="3763" b="5318">model,</wd>

<space/>

<wd l="3888" t="5131" r="4426" b="5290">which</wd>

<space/>

<wd l="4526" t="5131" r="5011" b="5290">could</wd>

<space/>

<wd l="5112" t="5131" r="5314" b="5290">be</wd>

<space/>

<wd l="5424" t="5184" r="5794" b="5290">con-</wd>

</ln>

<ln l="1450" t="5405" r="5794" b="5606" baseLine="5554" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1450" t="5405" r="2074" b="5563">sidered</wd>

<space/>

<wd l="2150" t="5458" r="2318" b="5563">as</wd>

<space/>

<wd l="2410" t="5405" r="3206" b="5606">“regular”</wd>

<space/>

<wd l="3288" t="5429" r="3744" b="5592">texts,</wd>

<space/>

<wd l="3840" t="5405" r="4152" b="5563">and</wd>

<space/>

<wd l="4229" t="5405" r="4685" b="5563">those</wd>

<space/>

<wd l="4766" t="5405" r="5794" b="5606">correspond-</wd>

</ln>

<ln l="1440" t="5674" r="5798" b="5875" baseLine="5822" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5674" r="1714" b="5875">ing</wd>

<space/>

<wd l="1786" t="5698" r="1949" b="5832">to</wd>

<space/>

<wd l="2021" t="5698" r="2621" b="5861">tweets,</wd>

<space/>

<wd l="2702" t="5674" r="3235" b="5832">which</wd>

<space/>

<wd l="3302" t="5726" r="3850" b="5875">agrees</wd>

<space/>

<wd l="3922" t="5674" r="4310" b="5832">with</wd>

<space/>

<wd l="4378" t="5674" r="4642" b="5832">the</wd>

<space/>

<wd l="4714" t="5674" r="5798" b="5832">observations</wd>

<space/>

</ln>

<ln l="1445" t="5942" r="5818" b="6144" baseLine="6096" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="5942" r="1637" b="6101">of</wd>

<space/>

<wd l="1709" t="5942" r="2510" b="6144">Chrupała</wd>

<space/>

<wd l="2602" t="5947" r="3216" b="6139">(2014).</wd>

<space/>

<wd l="3384" t="5947" r="3619" b="6101">As</wd>

<space/>

<wd l="3710" t="5942" r="4632" b="6101">illustrative</wd>

<space/>

<wd l="4723" t="5942" r="5530" b="6144">examples</wd>

<space/>

<wd l="5630" t="5942" r="5818" b="6101">of</wd>

<space/>

</ln>

<ln l="1440" t="6216" r="5808" b="6418" baseLine="6365" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="6216" r="1747" b="6374">this</wd>

<space/>

<wd l="1824" t="6240" r="2198" b="6418">type</wd>

<space/>

<wd l="2275" t="6216" r="2467" b="6374">of</wd>

<space/>

<wd l="2525" t="6216" r="3528" b="6418">expressions</wd>

<space/>

<wd l="3605" t="6269" r="3859" b="6374">we</wd>

<space/>

<wd l="3936" t="6269" r="4229" b="6374">can</wd>

<space/>

<wd l="4306" t="6216" r="4666" b="6374">take</wd>

<space/>

<wd l="4738" t="6221" r="4906" b="6370">“I</wd>

<space/>

<wd l="4973" t="6216" r="5299" b="6374">like</wd>

<space/>

<wd l="5371" t="6216" r="5808" b="6374">them</wd>

<space/>

</ln>

<ln l="1445" t="6485" r="5794" b="6686" baseLine="6638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="6485" r="1920" b="6686">girls”</wd>

<space/>

<wd l="1992" t="6485" r="2304" b="6643">and</wd>

<space/>

<wd l="2371" t="6485" r="2885" b="6686">“Why</wd>

<space/>

<wd l="2947" t="6538" r="3274" b="6686">you</wd>

<space/>

<wd l="3341" t="6538" r="3557" b="6643">no</wd>

<space/>

<wd l="3624" t="6485" r="3835" b="6643">do</wd>

<space/>

<wd l="3902" t="6485" r="4469" b="6672">that?”,</wd>

<space/>

<wd l="4546" t="6485" r="5078" b="6643">which</wd>

<space/>

<wd l="5146" t="6538" r="5405" b="6643">are</wd>

<space/>

<wd l="5467" t="6485" r="5794" b="6643">lex-</wd>

</ln>

<ln l="1440" t="6758" r="5794" b="6960" baseLine="6907" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="6758" r="1920" b="6960">ically</wd>

<space/>

<wd l="2016" t="6782" r="2616" b="6917">correct</wd>

<space/>

<wd l="2698" t="6758" r="2976" b="6917">but</wd>

<space/>

<wd l="3058" t="6782" r="3341" b="6917">not</wd>

<space/>

<wd l="3432" t="6758" r="4522" b="6960">syntactically</wd>

<space/>

<wd l="4608" t="6758" r="5083" b="6946">valid,</wd>

<space/>

<wd l="5198" t="6811" r="5376" b="6917">so</wd>

<space/>

<wd l="5467" t="6758" r="5794" b="6917">lan-</wd>

</ln>

<ln l="1445" t="7027" r="5794" b="7229" baseLine="7181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="7080" r="1958" b="7229">guage</wd>

<space/>

<wd l="2006" t="7027" r="2630" b="7186">models</wd>

<space/>

<wd l="2683" t="7027" r="3082" b="7186">built</wd>

<space/>

<wd l="3125" t="7027" r="3595" b="7229">using</wd>

<space/>

<wd l="3643" t="7027" r="4262" b="7229">regular</wd>

<space/>

<wd l="4301" t="7051" r="4704" b="7186">texts</wd>

<space/>

<wd l="4757" t="7027" r="5093" b="7186">will</wd>

<space/>

<wd l="5141" t="7051" r="5424" b="7186">not</wd>

<space/>

<wd l="5467" t="7080" r="5794" b="7186">rec-</wd>

</ln>

<ln l="1445" t="7301" r="5794" b="7502" baseLine="7450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="7301" r="2021" b="7502">ognize</wd>

<space/>

<wd l="2093" t="7301" r="2573" b="7459">them.</wd>

<space/>

<wd l="2707" t="7306" r="2894" b="7454">In</wd>

<space/>

<wd l="2966" t="7301" r="3230" b="7459">the</wd>

<space/>

<wd l="3307" t="7354" r="3677" b="7459">case</wd>

<space/>

<wd l="3758" t="7301" r="3950" b="7459">of</wd>

<space/>

<wd l="4013" t="7354" r="4301" b="7459">our</wd>

<space/>

<wd l="4373" t="7301" r="5112" b="7502">previous</wd>

<space/>

<wd l="5194" t="7301" r="5794" b="7502">experi-</wd>

</ln>

<ln l="1440" t="7570" r="5794" b="7771" baseLine="7723" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="7594" r="1954" b="7728">ments</wd>

<space/>

<wd l="2016" t="7622" r="2232" b="7728">on</wd>

<space/>

<wd l="2285" t="7570" r="3014" b="7771">Spanish,</wd>

<space/>

<wd l="3082" t="7570" r="3389" b="7728">this</wd>

<space/>

<wd l="3451" t="7570" r="4325" b="7728">difference</wd>

<space/>

<wd l="4378" t="7622" r="4704" b="7728">was</wd>

<space/>

<wd l="4762" t="7594" r="5045" b="7728">not</wd>

<space/>

<wd l="5102" t="7622" r="5285" b="7728">so</wd>

<space/>

<wd l="5342" t="7570" r="5794" b="7728">clear.</wd>

</ln>

</para>

<para l="1445" t="8083" r="4829" b="8256" alignment="left" spaceBefore="260" lsp="exactly" lspExact="274" language="en">

<ln l="1445" t="8083" r="4829" b="8256" baseLine="8251" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">

<wd l="1445" t="8088" r="1555" b="8256">5</wd>

<space/>

<wd l="1810" t="8083" r="3029" b="8256">Conclusions</wd>

<space/>

<wd l="3101" t="8088" r="3475" b="8256">and</wd>

<space/>

<wd l="3538" t="8088" r="4234" b="8256">Future</wd>

<space/>

<wd l="4306" t="8088" r="4829" b="8256">work</wd>

</ln>

</para>

<para l="1440" t="8558" r="5808" b="9840" alignment="justified" spaceBefore="180" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="8558" r="5794" b="8760" baseLine="8707" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="8563" r="1723" b="8717">We</wd>

<space/>

<wd l="1786" t="8558" r="2189" b="8717">have</wd>

<space/>

<wd l="2251" t="8558" r="3086" b="8760">presented</wd>

<space/>

<wd l="3144" t="8558" r="3317" b="8712">in</wd>

<space/>

<wd l="3374" t="8558" r="3682" b="8717">this</wd>

<space/>

<wd l="3749" t="8558" r="4195" b="8717">work</wd>

<space/>

<wd l="4258" t="8558" r="4522" b="8717">the</wd>

<space/>

<wd l="4584" t="8582" r="5054" b="8717">tweet</wd>

<space/>

<wd l="5117" t="8558" r="5794" b="8717">normal-</wd>

</ln>

<ln l="1440" t="8827" r="5808" b="9029" baseLine="8976" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="8827" r="2035" b="8986">ization</wd>

<space/>

<wd l="2102" t="8851" r="2702" b="9029">system</wd>

<space/>

<wd l="2760" t="8827" r="3163" b="8986">used</wd>

<space/>

<wd l="3221" t="8827" r="3437" b="9029">by</wd>

<space/>

<wd l="3509" t="8880" r="3797" b="8986">our</wd>

<space/>

<wd l="3859" t="8880" r="4358" b="9029">group</wd>

<space/>

<wd l="4426" t="8851" r="4589" b="8986">to</wd>

<space/>

<wd l="4656" t="8827" r="5573" b="9029">participate</wd>

<space/>

<wd l="5635" t="8827" r="5808" b="8981">in</wd>

<space/>

</ln>

<ln l="1440" t="9096" r="5808" b="9283" baseLine="9250" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="9096" r="1704" b="9254">the</wd>

<space/>

<wd l="1795" t="9101" r="2501" b="9254">W-NUT</wd>

<space/>

<wd l="2597" t="9096" r="3014" b="9254">2015</wd>

<space/>

<wd l="3115" t="9096" r="4378" b="9254">Normalization</wd>

<space/>

<wd l="4459" t="9096" r="4867" b="9254">Task</wd>

<space/>

<wd l="4954" t="9096" r="5530" b="9283">which,</wd>

<space/>

<wd l="5635" t="9096" r="5808" b="9250">in</wd>

<space/>

</ln>

<ln l="1440" t="9370" r="5808" b="9571" baseLine="9518" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="9394" r="1834" b="9557">turn,</wd>

<space/>

<wd l="1920" t="9370" r="2054" b="9528">is</wd>

<space/>

<wd l="2136" t="9422" r="2333" b="9528">an</wd>

<space/>

<wd l="2410" t="9370" r="3317" b="9571">adaptation</wd>

<space/>

<wd l="3389" t="9370" r="3581" b="9528">of</wd>

<space/>

<wd l="3638" t="9370" r="4296" b="9528">another</wd>

<space/>

<wd l="4363" t="9370" r="5040" b="9571">existing</wd>

<space/>

<wd l="5122" t="9370" r="5808" b="9571">Spanish</wd>

<space/>

</ln>

<ln l="1440" t="9638" r="3883" b="9840" baseLine="9792" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="9662" r="1915" b="9797">tweet</wd>

<space/>

<wd l="1968" t="9638" r="3182" b="9797">normalization</wd>

<space/>

<wd l="3245" t="9662" r="3883" b="9840">system.</wd>

</ln>

</para>

<para l="1440" t="9926" r="5808" b="12566" alignment="justified" spaceBefore="16" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="9926" r="5808" b="10128" baseLine="10075" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="9926" r="2256" b="10085">Within</wd>

<space/>

<wd l="2338" t="9926" r="2606" b="10085">the</wd>

<space/>

<wd l="2698" t="9979" r="3182" b="10128">scope</wd>

<space/>

<wd l="3274" t="9926" r="3466" b="10085">of</wd>

<space/>

<wd l="3533" t="9926" r="3840" b="10085">this</wd>

<space/>

<wd l="3931" t="9926" r="4325" b="10114">task,</wd>

<space/>

<wd l="4426" t="9926" r="4550" b="10085">it</wd>

<space/>

<wd l="4632" t="9926" r="5299" b="10085">became</wd>

<space/>

<wd l="5386" t="9926" r="5808" b="10085">clear</wd>

<space/>

</ln>

<ln l="1440" t="10195" r="5803" b="10397" baseLine="10349" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10195" r="1771" b="10354">that</wd>

<space/>

<wd l="1838" t="10219" r="2266" b="10354">most</wd>

<space/>

<wd l="2338" t="10195" r="2530" b="10354">of</wd>

<space/>

<wd l="2587" t="10195" r="2856" b="10354">the</wd>

<space/>

<wd l="2928" t="10195" r="4138" b="10354">normalization</wd>

<space/>

<wd l="4210" t="10195" r="4963" b="10354">mistakes</wd>

<space/>

<wd l="5045" t="10195" r="5515" b="10354">made</wd>

<space/>

<wd l="5587" t="10195" r="5803" b="10397">by</wd>

<space/>

</ln>

<ln l="1445" t="10469" r="5794" b="10670" baseLine="10618" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="10522" r="1733" b="10627">our</wd>

<space/>

<wd l="1829" t="10493" r="2429" b="10670">system</wd>

<space/>

<wd l="2515" t="10469" r="3278" b="10627">occurred</wd>

<space/>

<wd l="3365" t="10469" r="3926" b="10670">during</wd>

<space/>

<wd l="4018" t="10469" r="4286" b="10627">the</wd>

<space/>

<wd l="4378" t="10469" r="5208" b="10627">candidate</wd>

<space/>

<wd l="5304" t="10469" r="5794" b="10627">selec-</wd>

</ln>

<ln l="1440" t="10738" r="5808" b="10939" baseLine="10891" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10738" r="1781" b="10896">tion</wd>

<space/>

<wd l="1834" t="10762" r="2314" b="10939">stage,</wd>

<space/>

<wd l="2376" t="10790" r="2544" b="10896">as</wd>

<space/>

<wd l="2597" t="10738" r="2717" b="10896">it</wd>

<space/>

<wd l="2760" t="10790" r="3086" b="10896">was</wd>

<space/>

<wd l="3139" t="10738" r="3720" b="10896">unable</wd>

<space/>

<wd l="3763" t="10762" r="3931" b="10896">to</wd>

<space/>

<wd l="3979" t="10738" r="4848" b="10896">determine</wd>

<space/>

<wd l="4891" t="10738" r="5155" b="10896">the</wd>

<space/>

<wd l="5203" t="10762" r="5808" b="10896">correct</wd>

<space/>

</ln>

<ln l="1440" t="11011" r="5798" b="11213" baseLine="11160" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11011" r="2654" b="11170">normalization</wd>

<space/>

<wd l="2765" t="11035" r="3168" b="11170">term</wd>

<space/>

<wd l="3278" t="11011" r="4027" b="11170">obtained</wd>

<space/>

<wd l="4138" t="11011" r="4306" b="11165">in</wd>

<space/>

<wd l="4416" t="11011" r="5155" b="11213">previous</wd>

<space/>

<wd l="5280" t="11035" r="5798" b="11213">stages</wd>

<space/>

</ln>

<ln l="1440" t="11280" r="5808" b="11438" baseLine="11434" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11280" r="1867" b="11438">from</wd>

<space/>

<wd l="1939" t="11280" r="2208" b="11438">the</wd>

<space/>

<wd l="2294" t="11304" r="2525" b="11438">set</wd>

<space/>

<wd l="2606" t="11280" r="2798" b="11438">of</wd>

<space/>

<wd l="2866" t="11280" r="3773" b="11438">candidates</wd>

<space/>

<wd l="3859" t="11280" r="4675" b="11438">available.</wd>

<space/>

<wd l="4819" t="11280" r="5160" b="11438">The</wd>

<space/>

<wd l="5237" t="11333" r="5808" b="11438">reason</wd>

<space/>

</ln>

<ln l="1440" t="11554" r="5808" b="11755" baseLine="11702" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11554" r="1699" b="11712">for</wd>

<space/>

<wd l="1766" t="11554" r="1891" b="11712">it</wd>

<space/>

<wd l="1958" t="11554" r="2098" b="11712">is</wd>

<space/>

<wd l="2174" t="11554" r="2506" b="11712">that</wd>

<space/>

<wd l="2578" t="11606" r="2827" b="11712">we</wd>

<space/>

<wd l="2904" t="11554" r="3115" b="11712">do</wd>

<space/>

<wd l="3192" t="11578" r="3470" b="11712">not</wd>

<space/>

<wd l="3542" t="11554" r="3946" b="11712">have</wd>

<space/>

<wd l="4022" t="11578" r="4176" b="11712">at</wd>

<space/>

<wd l="4248" t="11554" r="4555" b="11712">this</wd>

<space/>

<wd l="4632" t="11606" r="5016" b="11755">very</wd>

<space/>

<wd l="5088" t="11578" r="5808" b="11712">moment</wd>

<space/>

</ln>

<ln l="1445" t="11822" r="5794" b="12024" baseLine="11976" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="11822" r="2083" b="12024">enough</wd>

<space/>

<wd l="2141" t="11822" r="2818" b="12024">training</wd>

<space/>

<wd l="2885" t="11822" r="3250" b="11981">data</wd>

<space/>

<wd l="3302" t="11846" r="3470" b="11981">to</wd>

<space/>

<wd l="3533" t="11822" r="3979" b="11981">build</wd>

<space/>

<wd l="4042" t="11875" r="4138" b="11981">a</wd>

<space/>

<wd l="4190" t="11822" r="5405" b="12024">representative</wd>

<space/>

<wd l="5467" t="11822" r="5794" b="11981">lan-</wd>

</ln>

<ln l="1445" t="12096" r="5808" b="12298" baseLine="12245" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12149" r="1958" b="12298">guage</wd>

<space/>

<wd l="2006" t="12096" r="2549" b="12254">model</wd>

<space/>

<wd l="2606" t="12096" r="2794" b="12254">of</wd>

<space/>

<wd l="2827" t="12096" r="3091" b="12254">the</wd>

<space/>

<wd l="3139" t="12120" r="3634" b="12298">target</wd>

<space/>

<wd l="3686" t="12096" r="4334" b="12254">domain</wd>

<space/>

<wd l="4392" t="12096" r="5438" b="12293">(normalized</wd>

<space/>

<wd l="5482" t="12120" r="5808" b="12254">text</wd>

<space/>

</ln>

<ln l="1445" t="12365" r="3072" b="12566" baseLine="12518" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12365" r="1637" b="12523">of</wd>

<space/>

<wd l="1675" t="12365" r="2342" b="12566">English</wd>

<space/>

<wd l="2400" t="12370" r="3072" b="12562">tweets).</wd>

</ln>

</para>

<para l="1440" t="12653" r="5808" b="14438" alignment="justified" spaceBefore="14" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="12653" r="5794" b="12854" baseLine="12802" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="12653" r="2794" b="12840">Furthermore,</wd>

<space/>

<wd l="2894" t="12653" r="3331" b="12811">there</wd>

<space/>

<wd l="3418" t="12653" r="3557" b="12811">is</wd>

<space/>

<wd l="3653" t="12653" r="4306" b="12811">another</wd>

<space/>

<wd l="4387" t="12677" r="4762" b="12854">type</wd>

<space/>

<wd l="4853" t="12653" r="5045" b="12811">of</wd>

<space/>

<wd l="5117" t="12653" r="5794" b="12811">normal-</wd>

</ln>

<ln l="1440" t="12922" r="5794" b="13123" baseLine="13075" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12922" r="2035" b="13080">ization</wd>

<space/>

<wd l="2126" t="12922" r="3134" b="13123">phenomena</wd>

<space/>

<wd l="3221" t="12922" r="3797" b="13109">which,</wd>

<space/>

<wd l="3912" t="12946" r="4066" b="13080">at</wd>

<space/>

<wd l="4157" t="12922" r="4464" b="13080">this</wd>

<space/>

<wd l="4560" t="12946" r="5318" b="13109">moment,</wd>

<space/>

<wd l="5434" t="12974" r="5794" b="13080">can-</wd>

</ln>

<ln l="1440" t="13195" r="5794" b="13397" baseLine="13344" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13219" r="1718" b="13354">not</wd>

<space/>

<wd l="1781" t="13195" r="1982" b="13354">be</wd>

<space/>

<wd l="2050" t="13195" r="2818" b="13397">correctly</wd>

<space/>

<wd l="2880" t="13195" r="3571" b="13354">handled</wd>

<space/>

<wd l="3634" t="13195" r="3845" b="13397">by</wd>

<space/>

<wd l="3917" t="13248" r="4205" b="13354">our</wd>

<space/>

<wd l="4272" t="13219" r="4910" b="13397">system:</wd>

<space/>

<wd l="5006" t="13200" r="5275" b="13349">n-1</wd>

<space/>

<wd l="5357" t="13248" r="5794" b="13397">map-</wd>

</ln>

<ln l="1440" t="13464" r="5808" b="13666" baseLine="13618" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13464" r="1958" b="13666">pings.</wd>

<space/>

<wd l="2064" t="13464" r="2443" b="13622">This</wd>

<space/>

<wd l="2515" t="13464" r="2650" b="13622">is</wd>

<space/>

<wd l="2726" t="13464" r="3038" b="13622">due</wd>

<space/>

<wd l="3101" t="13488" r="3269" b="13622">to</wd>

<space/>

<wd l="3336" t="13464" r="3600" b="13622">the</wd>

<space/>

<wd l="3662" t="13464" r="4171" b="13622">initial</wd>

<space/>

<wd l="4243" t="13464" r="5035" b="13666">approach</wd>

<space/>

<wd l="5098" t="13517" r="5352" b="13622">we</wd>

<space/>

<wd l="5419" t="13464" r="5808" b="13622">took</wd>

<space/>

</ln>

<ln l="1440" t="13738" r="5794" b="13939" baseLine="13886" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13738" r="1699" b="13896">for</wd>

<space/>

<wd l="1757" t="13738" r="2064" b="13896">this</wd>

<space/>

<wd l="2141" t="13762" r="2779" b="13939">system,</wd>

<space/>

<wd l="2851" t="13738" r="3384" b="13896">which</wd>

<space/>

<wd l="3451" t="13738" r="3830" b="13939">only</wd>

<space/>

<wd l="3898" t="13738" r="4838" b="13896">considered</wd>

<space/>

<wd l="4920" t="13742" r="5165" b="13891">1-1</wd>

<space/>

<wd l="5251" t="13738" r="5563" b="13896">and</wd>

<space/>

<wd l="5650" t="13742" r="5794" b="13891">1-</wd>

<space/>

</ln>

<ln l="1440" t="14006" r="5808" b="14208" baseLine="14155" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14059" r="1550" b="14160">n</wd>

<space/>

<wd l="1618" t="14006" r="2510" b="14208">mappings,</wd>

<space/>

<wd l="2597" t="14006" r="2875" b="14165">but</wd>

<space/>

<wd l="2942" t="14030" r="3226" b="14165">not</wd>

<space/>

<wd l="3293" t="14011" r="3562" b="14160">n-1</wd>

<space/>

<wd l="3653" t="14006" r="4546" b="14208">mappings,</wd>

<space/>

<wd l="4632" t="14006" r="5352" b="14208">together</wd>

<space/>

<wd l="5419" t="14006" r="5808" b="14165">with</wd>

<space/>

</ln>

<ln l="1445" t="14280" r="3206" b="14438" baseLine="14429" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="14333" r="1733" b="14438">our</wd>

<space/>

<wd l="1786" t="14280" r="2174" b="14438">time</wd>

<space/>

<wd l="2227" t="14280" r="3206" b="14438">limitations.</wd>

</ln>

</para>

<para l="1445" t="14563" r="5808" b="15307" alignment="justified" spaceBefore="17" fli="216" lsp="exactly" lspExact="268" language="en">

<ln l="1656" t="14563" r="5803" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="14563" r="1934" b="14717">All</wd>

<space/>

<wd l="2011" t="14563" r="2338" b="14722">that</wd>

<space/>

<wd l="2410" t="14563" r="2890" b="14765">being</wd>

<space/>

<wd l="2976" t="14563" r="3360" b="14750">said,</wd>

<space/>

<wd l="3451" t="14616" r="3619" b="14722">as</wd>

<space/>

<wd l="3701" t="14563" r="4224" b="14722">future</wd>

<space/>

<wd l="4296" t="14563" r="4699" b="14722">lines</wd>

<space/>

<wd l="4786" t="14563" r="4973" b="14722">of</wd>

<space/>

<wd l="5035" t="14563" r="5482" b="14722">work</wd>

<space/>

<wd l="5549" t="14616" r="5803" b="14722">we</wd>

<space/>

</ln>

<ln l="1445" t="14837" r="5808" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="14890" r="1704" b="14995">are</wd>

<space/>

<wd l="1757" t="14837" r="2765" b="15038">considering</wd>

<space/>

<wd l="2813" t="14837" r="3082" b="14995">the</wd>

<space/>

<wd l="3125" t="14837" r="3965" b="15038">following</wd>

<space/>

<wd l="4013" t="14837" r="5246" b="15038">improvements</wd>

<space/>

<wd l="5299" t="14861" r="5467" b="14995">to</wd>

<space/>

<wd l="5520" t="14890" r="5808" b="14995">our</wd>

<space/>

</ln>

<ln l="1450" t="15110" r="2088" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="15130" r="2088" b="15307">system:</wd>

</ln>

</para>

</column>

<column l="6144" t="1260" r="10531" b="15316">

<para l="6384" t="1320" r="10526" b="3144" alignment="justified" li="432" spaceBefore="1" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="1320" r="10526" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6384" t="1325" r="6586" b="1474">•</wd>

<tab position="6467"/>

<wd l="6586" t="1320" r="7450" b="1522">Obtaining</wd>

<space/>

<wd l="7507" t="1373" r="7603" b="1478">a</wd>

<space/>

<wd l="7642" t="1320" r="8856" b="1522">representative</wd>

<space/>

<wd l="8904" t="1320" r="9691" b="1522">language</wd>

<space/>

<wd l="9739" t="1320" r="10282" b="1478">model</wd>

<space/>

<wd l="10334" t="1320" r="10526" b="1478">of</wd>

<space/>

</ln>

<ln l="6581" t="1594" r="10502" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="1594" r="6850" b="1752">the</wd>

<space/>

<wd l="6926" t="1618" r="7421" b="1795">target</wd>

<space/>

<wd l="7498" t="1594" r="8150" b="1752">domain</wd>

<space/>

<wd l="8222" t="1594" r="8438" b="1795">by</wd>

<space/>

<wd l="8520" t="1594" r="8986" b="1795">using</wd>

<space/>

<wd l="9072" t="1646" r="9168" b="1752">a</wd>

<space/>

<wd l="9240" t="1594" r="9749" b="1795">larger</wd>

<space/>

<wd l="9821" t="1594" r="10502" b="1752">normal-</wd>

</ln>

<ln l="6581" t="1862" r="10502" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="1862" r="6946" b="2021">ized</wd>

<space/>

<wd l="7013" t="1886" r="7483" b="2021">tweet</wd>

<space/>

<wd l="7555" t="1915" r="8174" b="2064">corpus.</wd>

<space/>

<wd l="8285" t="1862" r="8664" b="2021">This</wd>

<space/>

<wd l="8746" t="1915" r="9312" b="2064">corpus</wd>

<space/>

<wd l="9384" t="1862" r="9725" b="2021">will</wd>

<space/>

<wd l="9792" t="1862" r="9998" b="2021">be</wd>

<space/>

<wd l="10066" t="1915" r="10502" b="2021">com-</wd>

</ln>

<ln l="6581" t="2136" r="10498" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="2136" r="7118" b="2338">prised</wd>

<space/>

<wd l="7171" t="2136" r="7363" b="2294">of</wd>

<space/>

<wd l="7402" t="2160" r="7954" b="2294">tweets</wd>

<space/>

<wd l="8011" t="2136" r="8683" b="2294">without</wd>

<space/>

<wd l="8731" t="2136" r="9874" b="2294">non-standard</wd>

<space/>

<wd l="9926" t="2136" r="10498" b="2323">words,</wd>

<space/>

</ln>

<ln l="6590" t="2405" r="10507" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6590" t="2458" r="6773" b="2563">so</wd>

<space/>

<wd l="6859" t="2458" r="7109" b="2563">we</wd>

<space/>

<wd l="7195" t="2458" r="7493" b="2563">can</wd>

<space/>

<wd l="7589" t="2405" r="7901" b="2563">still</wd>

<space/>

<wd l="7992" t="2429" r="8626" b="2606">capture</wd>

<space/>

<wd l="8707" t="2405" r="8976" b="2563">the</wd>

<space/>

<wd l="9058" t="2405" r="10507" b="2606">morphosyntactic</wd>

<space/>

</ln>

<ln l="6590" t="2678" r="10498" b="2880" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6590" t="2702" r="7344" b="2837">structure</wd>

<space/>

<wd l="7406" t="2678" r="7598" b="2837">of</wd>

<space/>

<wd l="7642" t="2678" r="8088" b="2837">these</wd>

<space/>

<wd l="8146" t="2702" r="8544" b="2837">texts</wd>

<space/>

<wd l="8621" t="2683" r="9130" b="2880">(Yang</wd>

<space/>

<wd l="9192" t="2678" r="9504" b="2837">and</wd>

<space/>

<wd l="9562" t="2678" r="10498" b="2866">Eisenstein,</wd>

<space/>

</ln>

<ln l="6586" t="2952" r="7133" b="3144" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6586" t="2952" r="7133" b="3144">2013).</wd>

</ln>

</para>

<para l="6384" t="3394" r="10507" b="3864" alignment="justified" li="432" spaceBefore="173" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="3394" r="10507" b="3595" baseLine="3542" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="3398" r="6581" b="3542">•</wd>

<tab position="6465"/>

<wd l="6581" t="3394" r="7099" b="3595">Using</wd>

<space/>

<wd l="7166" t="3398" r="7555" b="3552">POS</wd>

<space/>

<wd l="7627" t="3418" r="7968" b="3595">tags</wd>

<space/>

<wd l="8040" t="3394" r="8352" b="3552">and</wd>

<space/>

<wd l="8424" t="3394" r="9182" b="3595">syntactic</wd>

<space/>

<wd l="9250" t="3394" r="10282" b="3552">information</wd>

<space/>

<wd l="10339" t="3418" r="10507" b="3552">to</wd>

<space/>

</ln>

<ln l="6581" t="3662" r="10094" b="3864" baseLine="3816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="3662" r="7301" b="3864">improve</wd>

<space/>

<wd l="7358" t="3662" r="7622" b="3821">the</wd>

<space/>

<wd l="7685" t="3662" r="8515" b="3821">candidate</wd>

<space/>

<wd l="8578" t="3662" r="9346" b="3821">selection</wd>

<space/>

<wd l="9398" t="3715" r="10094" b="3864">process.</wd>

</ln>

</para>

<para l="6384" t="4109" r="10517" b="6466" alignment="justified" li="432" spaceBefore="172" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="4109" r="10502" b="4310" baseLine="4262" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="4114" r="6581" b="4262">•</wd>

<tab position="6467"/>

<wd l="6581" t="4109" r="7531" b="4310">Integrating</wd>

<space/>

<wd l="7613" t="4162" r="7709" b="4267">a</wd>

<space/>

<wd l="7781" t="4109" r="8558" b="4267">classifier</wd>

<space/>

<wd l="8626" t="4109" r="8798" b="4262">in</wd>

<space/>

<wd l="8866" t="4109" r="9134" b="4267">the</wd>

<space/>

<wd l="9211" t="4109" r="10075" b="4267">extraction</wd>

<space/>

<wd l="10147" t="4162" r="10502" b="4310">pro-</wd>

</ln>

<ln l="6586" t="4382" r="10498" b="4570" baseLine="4531" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="4435" r="6936" b="4541">cess</wd>

<space/>

<wd l="7061" t="4382" r="7248" b="4541">of</wd>

<space/>

<wd l="7344" t="4382" r="7608" b="4541">the</wd>

<space/>

<wd l="7723" t="4382" r="8102" b="4541">final</wd>

<space/>

<wd l="8213" t="4382" r="9427" b="4541">normalization</wd>

<space/>

<wd l="9542" t="4382" r="10498" b="4570">candidates,</wd>

<space/>

</ln>

<ln l="6581" t="4651" r="10502" b="4853" baseLine="4805" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="4651" r="7123" b="4853">taking</wd>

<space/>

<wd l="7224" t="4704" r="7397" b="4810">as</wd>

<space/>

<wd l="7498" t="4651" r="8179" b="4810">features</wd>

<space/>

<wd l="8285" t="4675" r="8904" b="4853">aspects</wd>

<space/>

<wd l="9014" t="4651" r="9408" b="4810">such</wd>

<space/>

<wd l="9504" t="4704" r="9672" b="4810">as</wd>

<space/>

<wd l="9773" t="4651" r="10042" b="4810">the</wd>

<space/>

<wd l="10147" t="4704" r="10502" b="4853">syn-</wd>

</ln>

<ln l="6581" t="4925" r="10502" b="5126" baseLine="5074" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="4925" r="7051" b="5083">tactic</wd>

<space/>

<wd l="7152" t="4925" r="7464" b="5083">and</wd>

<space/>

<wd l="7550" t="4925" r="9000" b="5126">morphosyntactic</wd>

<space/>

<wd l="9101" t="4925" r="10128" b="5083">information</wd>

<space/>

<wd l="10224" t="4925" r="10502" b="5083">ob-</wd>

</ln>

<ln l="6581" t="5194" r="10502" b="5395" baseLine="5342" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="5194" r="7157" b="5381">tained,</wd>

<space/>

<wd l="7229" t="5194" r="7632" b="5352">their</wd>

<space/>

<wd l="7685" t="5194" r="8640" b="5395">probability</wd>

<space/>

<wd l="8707" t="5194" r="9557" b="5395">according</wd>

<space/>

<wd l="9619" t="5218" r="9787" b="5352">to</wd>

<space/>

<wd l="9850" t="5194" r="10114" b="5352">the</wd>

<space/>

<wd l="10171" t="5194" r="10502" b="5352">lan-</wd>

</ln>

<ln l="6586" t="5462" r="10517" b="5664" baseLine="5616" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="5515" r="7104" b="5664">guage</wd>

<space/>

<wd l="7171" t="5462" r="7762" b="5650">model,</wd>

<space/>

<wd l="7848" t="5462" r="8554" b="5621">whether</wd>

<space/>

<wd l="8621" t="5462" r="8990" b="5664">they</wd>

<space/>

<wd l="9062" t="5515" r="9485" b="5621">were</wd>

<space/>

<wd l="9566" t="5462" r="10262" b="5621">selected</wd>

<space/>

<wd l="10334" t="5515" r="10517" b="5621">or</wd>

<space/>

</ln>

<ln l="6581" t="5736" r="10512" b="5938" baseLine="5885" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="5760" r="6864" b="5894">not</wd>

<space/>

<wd l="6926" t="5736" r="7138" b="5938">by</wd>

<space/>

<wd l="7205" t="5736" r="7474" b="5894">the</wd>

<space/>

<wd l="7536" t="5736" r="8136" b="5894">Viterbi</wd>

<space/>

<wd l="8208" t="5736" r="9096" b="5938">algorithm,</wd>

<space/>

<wd l="9173" t="5736" r="9576" b="5894">their</wd>

<space/>

<wd l="9643" t="5736" r="10128" b="5938">string</wd>

<space/>

<wd l="10200" t="5736" r="10512" b="5894">and</wd>

<space/>

</ln>

<ln l="6581" t="6005" r="10502" b="6206" baseLine="6158" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="6005" r="7330" b="6206">phonetic</wd>

<space/>

<wd l="7397" t="6005" r="8347" b="6163">differences</wd>

<space/>

<wd l="8414" t="6005" r="8803" b="6163">with</wd>

<space/>

<wd l="8861" t="6029" r="9480" b="6206">respect</wd>

<space/>

<wd l="9533" t="6029" r="9701" b="6163">to</wd>

<space/>

<wd l="9763" t="6005" r="10027" b="6163">the</wd>

<space/>

<wd l="10090" t="6005" r="10502" b="6206">orig-</wd>

</ln>

<ln l="6581" t="6278" r="7795" b="6466" baseLine="6427" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="6278" r="6907" b="6437">inal</wd>

<space/>

<wd l="6965" t="6278" r="7430" b="6466">form,</wd>

<space/>

<wd l="7502" t="6302" r="7795" b="6437">etc.</wd>

</ln>

</para>

<para l="6384" t="6725" r="10512" b="8006" alignment="justified" li="432" spaceBefore="176" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="6725" r="10507" b="6926" baseLine="6874" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6384" t="6730" r="6586" b="6874">•</wd>

<tab position="6465"/>

<wd l="6586" t="6725" r="7310" b="6926">Keeping</wd>

<space/>

<wd l="7373" t="6725" r="7642" b="6883">the</wd>

<space/>

<wd l="7704" t="6725" r="8530" b="6883">canonical</wd>

<space/>

<wd l="8592" t="6725" r="9230" b="6883">lexicon</wd>

<space/>

<wd l="9288" t="6725" r="9979" b="6926">updated</wd>

<space/>

<wd l="10037" t="6725" r="10507" b="6926">using</wd>

<space/>

</ln>

<ln l="6581" t="6994" r="10512" b="7195" baseLine="7142" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="7046" r="7397" b="7152">resources</wd>

<space/>

<wd l="7469" t="6994" r="7795" b="7152">like</wd>

<space/>

<wd l="7858" t="6994" r="8803" b="7195">Wikipedia,</wd>

<space/>

<wd l="8890" t="6994" r="9326" b="7152">since</wd>

<space/>

<wd l="9394" t="6994" r="9658" b="7152">the</wd>

<space/>

<wd l="9725" t="6994" r="10512" b="7195">language</wd>

<space/>

</ln>

<ln l="6581" t="7267" r="10507" b="7469" baseLine="7416" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="7267" r="7123" b="7426">model</wd>

<space/>

<wd l="7267" t="7267" r="8342" b="7426">construction</wd>

<space/>

<wd l="8477" t="7320" r="9120" b="7469">process</wd>

<space/>

<wd l="9264" t="7267" r="9730" b="7426">relies</wd>

<space/>

<wd l="9874" t="7267" r="10507" b="7469">heavily</wd>

<space/>

</ln>

<ln l="6581" t="7536" r="10502" b="7738" baseLine="7685" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="7589" r="7018" b="7738">upon</wd>

<space/>

<wd l="7075" t="7589" r="7171" b="7694">a</wd>

<space/>

<wd l="7224" t="7536" r="7661" b="7738">good</wd>

<space/>

<wd l="7709" t="7536" r="8285" b="7694">lexical</wd>

<space/>

<wd l="8342" t="7536" r="9154" b="7694">reference</wd>

<space/>

<wd l="9206" t="7536" r="9374" b="7690">in</wd>

<space/>

<wd l="9432" t="7536" r="9893" b="7694">order</wd>

<space/>

<wd l="9941" t="7560" r="10109" b="7694">to</wd>

<space/>

<wd l="10171" t="7589" r="10502" b="7694">cor-</wd>

</ln>

<ln l="6581" t="7805" r="9586" b="8006" baseLine="7958" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="7805" r="7075" b="8006">rectly</wd>

<space/>

<wd l="7138" t="7805" r="7766" b="7963">discard</wd>

<space/>

<wd l="7819" t="7805" r="8957" b="7963">non-standard</wd>

<space/>

<wd l="9010" t="7805" r="9586" b="7963">words.</wd>

</ln>

</para>

<para l="6144" t="8266" r="10526" b="9274" alignment="justified" spaceBefore="184" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="8266" r="10526" b="8467" baseLine="8414" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8270" r="7032" b="8453">Moreover,</wd>

<space/>

<wd l="7138" t="8318" r="7392" b="8424">we</wd>

<space/>

<wd l="7478" t="8266" r="8026" b="8424">intend</wd>

<space/>

<wd l="8107" t="8290" r="8275" b="8424">to</wd>

<space/>

<wd l="8376" t="8266" r="8832" b="8467">study</wd>

<space/>

<wd l="8923" t="8266" r="9187" b="8424">the</wd>

<space/>

<wd l="9278" t="8266" r="10243" b="8467">application</wd>

<space/>

<wd l="10334" t="8266" r="10526" b="8424">of</wd>

<space/>

</ln>

<ln l="6144" t="8534" r="10512" b="8736" baseLine="8683" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8558" r="6619" b="8693">tweet</wd>

<space/>

<wd l="6672" t="8534" r="7925" b="8722">normalization,</wd>

<space/>

<wd l="7987" t="8534" r="8246" b="8693">for</wd>

<space/>

<wd l="8294" t="8534" r="8683" b="8693">both</wd>

<space/>

<wd l="8741" t="8534" r="9427" b="8736">Spanish</wd>

<space/>

<wd l="9480" t="8534" r="9792" b="8693">and</wd>

<space/>

<wd l="9845" t="8534" r="10512" b="8736">English</wd>

<space/>

</ln>

<ln l="6144" t="8803" r="10498" b="9005" baseLine="8957">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="8827" r="6744" b="8990">tweets,</wd>

<space/>

<wd l="6878" t="8803" r="7046" b="8957">in</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7157" t="8813" r="7819" b="9005">opinion</wd>

<space/>

<wd l="7930" t="8813" r="8530" b="9005">mining</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8640" t="8803" r="9067" b="8962">tasks</wd>

<space/>

<wd l="9192" t="8803" r="9864" b="9000">(Vilares</wd>

<space/>

<wd l="9984" t="8827" r="10138" b="8962">et</wd>

<space/>

<wd l="10248" t="8803" r="10498" b="8990">al.,</wd>

<space/>

</run>

</ln>

<ln l="6149" t="9077" r="6696" b="9274" baseLine="9226" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="9077" r="6696" b="9274">2015).</wd>

</ln>

</para>

<para l="6144" t="9533" r="8011" b="9754" alignment="left" spaceBefore="207" lsp="exactly" lspExact="274" language="en">

<ln l="6144" t="9533" r="8011" b="9754" baseLine="9701" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="9533" r="8011" b="9754">Acknowledgments</wd>

</ln>

</para>

<para l="6144" t="9965" r="10526" b="11251" alignment="justified" spaceBefore="136" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="9965" r="10512" b="10166" baseLine="10114" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="9965" r="6523" b="10123">This</wd>

<space/>

<wd l="6638" t="9965" r="7368" b="10123">research</wd>

<space/>

<wd l="7469" t="9965" r="7752" b="10123">has</wd>

<space/>

<wd l="7862" t="9965" r="8275" b="10123">been</wd>

<space/>

<wd l="8381" t="9965" r="9106" b="10166">partially</wd>

<space/>

<wd l="9211" t="9965" r="9821" b="10123">funded</wd>

<space/>

<wd l="9922" t="9965" r="10138" b="10166">by</wd>

<space/>

<wd l="10243" t="9965" r="10512" b="10123">the</wd>

<space/>

</ln>

<ln l="6149" t="10238" r="10502" b="10440" baseLine="10387" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="10238" r="6840" b="10440">Spanish</wd>

<space/>

<wd l="6926" t="10238" r="7675" b="10440">Ministry</wd>

<space/>

<wd l="7771" t="10238" r="7963" b="10397">of</wd>

<space/>

<wd l="8040" t="10243" r="8870" b="10440">Economy</wd>

<space/>

<wd l="8966" t="10238" r="9278" b="10397">and</wd>

<space/>

<wd l="9374" t="10238" r="10502" b="10440">Competitive-</wd>

</ln>

<ln l="6144" t="10507" r="10502" b="10709" baseLine="10656">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6144" t="10560" r="6514" b="10666">ness</wd>

<space/>

<wd l="6576" t="10507" r="6888" b="10666">and</wd>

<space/>

</run>

<wd l="6941" t="10512" r="7560" b="10661"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">F</run>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">EDER</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7622" t="10507" r="8366" b="10709">(through</wd>

<space/>

<wd l="8414" t="10507" r="9019" b="10709">project</wd>

<space/>

<wd l="9067" t="10507" r="10502" b="10666">FFI2014-51978-</wd>

<space/>

</run>

</ln>

<ln l="6149" t="10776" r="10526" b="10978" baseLine="10930" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="10781" r="6864" b="10973">C2-2-R)</wd>

<space/>

<wd l="6950" t="10776" r="7262" b="10934">and</wd>

<space/>

<wd l="7334" t="10776" r="7550" b="10978">by</wd>

<space/>

<wd l="7627" t="10776" r="7896" b="10934">the</wd>

<space/>

<wd l="7968" t="10781" r="9086" b="10934">Autonomous</wd>

<space/>

<wd l="9178" t="10781" r="10258" b="10934">Government</wd>

<space/>

<wd l="10334" t="10776" r="10526" b="10934">of</wd>

<space/>

</ln>

<ln l="6149" t="11050" r="9226" b="11251" baseLine="11198" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="11050" r="6778" b="11208">Galicia</wd>

<space/>

<wd l="6840" t="11050" r="7584" b="11251">(through</wd>

<space/>

<wd l="7642" t="11074" r="8088" b="11251">grant</wd>

<space/>

<wd l="8141" t="11054" r="9226" b="11246">R2014/034).</wd>

</ln>

</para>

<para l="6149" t="11760" r="7248" b="11933" alignment="left" spaceBefore="462" lsp="exactly" lspExact="274" language="en">

<ln l="6149" t="11760" r="7248" b="11933" baseLine="11928" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="11760" r="7248" b="11933">References</wd>

</ln>

</para>

<para l="6144" t="12139" r="10512" b="13862" alignment="justified" li="216" spaceBefore="114" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="12139" r="10507" b="12331" baseLine="12278">

<wd l="6144" t="12144" r="6552" b="12288"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Iñaki</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="6638" t="12139" r="7277" b="12331">Alegría,</wd>

<space/>

<wd l="7378" t="12149" r="7781" b="12288">Nora</wd>

<space/>

<wd l="7862" t="12144" r="8678" b="12312">Aranberri,</wd>

<space/>

<wd l="8779" t="12139" r="9288" b="12288">Víctor</wd>

<space/>

<wd l="9374" t="12149" r="9960" b="12312">Fresno,</wd>

<space/>

<wd l="10061" t="12144" r="10507" b="12288">Pablo</wd>

<space/>

</run>

</ln>

<ln l="6370" t="12360" r="10507" b="12528" baseLine="12498">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6370" t="12360" r="7094" b="12528">Gamallo,</wd>

<space/>

<wd l="7229" t="12360" r="7632" b="12504">Lluís</wd>

<space/>

<wd l="7752" t="12360" r="8256" b="12528">Padró,</wd>

<space/>

</run>

<wd l="8390" t="12360" r="8798" b="12504"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Iñaki</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="8918" t="12360" r="9211" b="12504">San</wd>

<space/>

<wd l="9326" t="12360" r="9979" b="12528">Vicente,</wd>

<space/>

<wd l="10114" t="12360" r="10507" b="12504">Jordi</wd>

<space/>

</run>

</ln>

<ln l="6365" t="12581" r="10512" b="12768" baseLine="12715" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="12586" r="6941" b="12749">Turmo,</wd>

<space/>

<wd l="7032" t="12581" r="7315" b="12725">and</wd>

<space/>

<wd l="7387" t="12581" r="7982" b="12725">Arkaitz</wd>

<space/>

<wd l="8054" t="12581" r="8746" b="12768">Zubiaga.</wd>

<space/>

<wd l="8904" t="12581" r="9336" b="12725">2013.</wd>

<space/>

<wd l="9494" t="12581" r="10512" b="12725">Introducción</wd>

<space/>

</ln>

<ln l="6370" t="12802" r="10502" b="12984" baseLine="12936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="12845" r="6456" b="12946">a</wd>

<space/>

<wd l="6523" t="12802" r="6672" b="12946">la</wd>

<space/>

<wd l="6744" t="12821" r="7133" b="12946">tarea</wd>

<space/>

<wd l="7205" t="12802" r="8102" b="12984">compartida</wd>

<space/>

<wd l="8170" t="12806" r="9206" b="12946">Tweet-Norm</wd>

<space/>

<wd l="9278" t="12802" r="9710" b="12946">2013:</wd>

<space/>

<wd l="9835" t="12802" r="10502" b="12946">Normal-</wd>

</ln>

<ln l="6365" t="12998" r="10512" b="13205" baseLine="13156">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="13018" r="6941" b="13162">ización</wd>

<space/>

<wd l="7013" t="13018" r="7488" b="13162">léxica</wd>

<space/>

<wd l="7565" t="13018" r="7742" b="13162">de</wd>

<space/>

<wd l="7819" t="13018" r="8155" b="13162">tuits</wd>

<space/>

<wd l="8237" t="13061" r="8424" b="13162">en</wd>

<space/>

</run>

<wd l="8496" t="13018" r="9139" b="13205"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">español.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="9293" t="13022" r="9461" b="13157">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="9538" t="13022" r="10512" b="13162">Tweet-Norm</wd>

<space/>

</run>

</ln>

<ln l="6365" t="13238" r="10507" b="13421" baseLine="13373">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="13238" r="6792" b="13382">2013.</wd>

<space/>

<wd l="6874" t="13243" r="7330" b="13382">Tweet</wd>

<space/>

<wd l="7368" t="13238" r="8525" b="13397">Normalization</wd>

<space/>

<wd l="8587" t="13238" r="9365" b="13421">Workshop</wd>

<space/>

</run>

<wd l="9418" t="13238" r="9859" b="13406"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">2013</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="9917" t="13238" r="10507" b="13382">volume</wd>

<space/>

</run>

</ln>

<ln l="6384" t="13459" r="10498" b="13646" baseLine="13594">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6384" t="13459" r="6758" b="13603">1086</wd>

<space/>

<wd l="6840" t="13459" r="7008" b="13603">of</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7080" t="13464" r="7589" b="13603">CEUR</wd>

<space/>

<wd l="7670" t="13459" r="8448" b="13642">Workshop</wd>

<space/>

</run>

<wd l="8525" t="13459" r="9552" b="13642"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Proceedings</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="9638" t="13502" r="10085" b="13646">pages</wd>

<space/>

<wd l="10181" t="13459" r="10498" b="13603">1–9.</wd>

<space/>

</run>

</ln>

<ln l="6370" t="13675" r="7613" b="13862" baseLine="13814" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="13675" r="7613" b="13862">CEUR-WS.org.</wd>

</ln>

</para>

<para l="6154" t="14069" r="10469" b="14477" alignment="justified" li="216" spaceBefore="187" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6154" t="14069" r="10469" b="14246" baseLine="14208">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6154" t="14069" r="6600" b="14213">GNU</wd>

<space/>

</run>

<wd l="6662" t="14074" r="7325" b="14213"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">A</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">SPELL</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7392" t="14069" r="7699" b="14246">(rel.</wd>

<space/>

<wd l="7766" t="14069" r="8218" b="14246">0.60).</wd>

<space/>

<wd l="8314" t="14069" r="8746" b="14213">2011.</wd>

<space/>

<wd l="8837" t="14069" r="9590" b="14213">Available</wd>

<space/>

<wd l="9653" t="14088" r="9830" b="14213">at:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0"><wd l="9917" t="14083" r="10469" b="14246">http:</wd>

<space/>

</run>

</ln>

<ln l="6384" t="14290" r="9662" b="14477" baseLine="14424">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0"><wd l="6384" t="14294" r="7781" b="14467">//aspell.net</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7858" t="14290" r="8448" b="14467">(visited</wd>

<space/>

<wd l="8501" t="14333" r="8698" b="14434">on</wd>

<space/>

<wd l="8746" t="14294" r="9106" b="14477">May</wd>

<space/>

<wd l="9163" t="14290" r="9662" b="14467">2015).</wd>

</run>

</ln>

</para>

<para l="6144" t="14683" r="10512" b="15302" alignment="justified" li="216" spaceBefore="158" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="14683" r="10502" b="14870" baseLine="14818" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14683" r="6821" b="14870">Timothy</wd>

<space/>

<wd l="6965" t="14683" r="7685" b="14851">Baldwin,</wd>

<space/>

<wd l="7858" t="14683" r="8333" b="14827">Marie</wd>

<space/>

<wd l="8482" t="14683" r="9250" b="14827">Catherine</wd>

<space/>

<wd l="9398" t="14683" r="9581" b="14827">de</wd>

<space/>

<wd l="9725" t="14683" r="10502" b="14851">Marneffe,</wd>

<space/>

</ln>

<ln l="6365" t="14899" r="10507" b="15086" baseLine="15038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="14904" r="6590" b="15043">Bo</wd>

<space/>

<wd l="6686" t="14904" r="7061" b="15067">Han,</wd>

<space/>

<wd l="7171" t="14904" r="8150" b="15086">Young-Bum</wd>

<space/>

<wd l="8242" t="14899" r="8635" b="15067">Kim,</wd>

<space/>

<wd l="8741" t="14899" r="9125" b="15043">Alan</wd>

<space/>

<wd l="9221" t="14899" r="9710" b="15067">Ritter,</wd>

<space/>

<wd l="9821" t="14899" r="10104" b="15043">and</wd>

<space/>

<wd l="10195" t="14899" r="10507" b="15043">Wei</wd>

<space/>

</ln>

<ln l="6365" t="15120" r="10512" b="15302" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="15125" r="6648" b="15264">Xu.</wd>

<space/>

<wd l="6792" t="15120" r="7224" b="15264">2015.</wd>

<space/>

<wd l="7368" t="15120" r="7915" b="15264">Shared</wd>

<space/>

<wd l="7982" t="15120" r="8376" b="15264">tasks</wd>

<space/>

<wd l="8453" t="15120" r="8626" b="15264">of</wd>

<space/>

<wd l="8683" t="15120" r="8923" b="15264">the</wd>

<space/>

<wd l="9000" t="15120" r="9384" b="15264">2015</wd>

<space/>

<wd l="9461" t="15120" r="10238" b="15302">workshop</wd>

<space/>

<wd l="10315" t="15163" r="10512" b="15264">on</wd>

</ln>

</para>

</column>

</section>

<dd l="1437" t="15746" r="10531" b="15975">

<para l="5771" t="15792" r="6200" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15792" r="6134" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="30">

<wd l="5837" t="15792" r="6134" b="15946">104</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4315.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1436" marginTop="1296" marginRight="1379" marginBottom="1292" offsetX="-24" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1436" t="1296" r="10530" b="15316">

<column l="1436" t="1296" r="5823" b="15316">

<para l="1656" t="1334" r="5813" b="2179" alignment="justified" li="216" spaceBefore="11" lsp="exactly" lspExact="219" language="en">

<ln l="1656" t="1334" r="5798" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="1334" r="2088" b="1522">noisy</wd>

<space/>

<wd l="2174" t="1334" r="3346" b="1522">user-generated</wd>

<space/>

<wd l="3427" t="1354" r="3763" b="1478">text:</wd>

<space/>

<wd l="3907" t="1334" r="4478" b="1478">Twitter</wd>

<space/>

<wd l="4565" t="1334" r="5088" b="1478">lexical</wd>

<space/>

<wd l="5174" t="1334" r="5798" b="1478">normal-</wd>

</ln>

<ln l="1656" t="1555" r="5798" b="1742" baseLine="1694">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="1555" r="2203" b="1699">ization</wd>

<space/>

<wd l="2275" t="1555" r="2558" b="1699">and</wd>

<space/>

<wd l="2630" t="1555" r="3163" b="1699">named</wd>

<space/>

<wd l="3235" t="1555" r="3682" b="1742">entity</wd>

<space/>

<wd l="3754" t="1555" r="4699" b="1742">recognition.</wd>

<space/>

<wd l="4848" t="1560" r="5016" b="1694">In</wd>

<space/>

</run>

<wd l="5083" t="1555" r="5798" b="1699" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Proceed-</wd>

</ln>

<ln l="1666" t="1776" r="5813" b="1958" baseLine="1910" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1666" t="1781" r="1992" b="1958">ings</wd>

<space/>

<wd l="2054" t="1776" r="2237" b="1958">of</wd>

<space/>

<wd l="2266" t="1776" r="2506" b="1920">the</wd>

<space/>

<wd l="2573" t="1776" r="3350" b="1958">Workshop</wd>

<space/>

<wd l="3418" t="1824" r="3610" b="1920">on</wd>

<space/>

<wd l="3667" t="1781" r="4123" b="1958">Noisy</wd>

<space/>

<wd l="4205" t="1776" r="5434" b="1958">User-generated</wd>

<space/>

<wd l="5496" t="1781" r="5813" b="1920">Text</wd>

<space/>

</ln>

<ln l="1661" t="1992" r="4094" b="2179" baseLine="2131">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="1997" r="2299" b="2170">(WNUT</wd>

<space/>

</run>

<wd l="2328" t="1992" r="2837" b="2170"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2894" t="1992" r="3523" b="2179">Beijing,</wd>

<space/>

<wd l="3586" t="1992" r="4094" b="2136">China.</wd>

</run>

</ln>

</para>

<para l="1440" t="2366" r="5798" b="2990" alignment="justified" li="216" spaceBefore="153" fli="-216" lsp="exactly" lspExact="218" language="en">

<ln l="1440" t="2366" r="5798" b="2510" baseLine="2501" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2366" r="2150" b="2510">Thorsten</wd>

<space/>

<wd l="2222" t="2371" r="2741" b="2510">Brants</wd>

<space/>

<wd l="2827" t="2366" r="3110" b="2510">and</wd>

<space/>

<wd l="3182" t="2366" r="3566" b="2510">Alex</wd>

<space/>

<wd l="3643" t="2371" r="4138" b="2510">Franz.</wd>

<space/>

<wd l="4306" t="2366" r="4738" b="2510">2006.</wd>

<space/>

<wd l="4906" t="2366" r="5261" b="2510">Web</wd>

<space/>

<wd l="5362" t="2366" r="5563" b="2506">1T</wd>

<space/>

<wd l="5645" t="2366" r="5798" b="2510">5-</wd>

<space/>

</ln>

<ln l="1661" t="2582" r="5798" b="2770" baseLine="2722" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="2626" r="2069" b="2770">gram</wd>

<space/>

<wd l="2146" t="2582" r="2755" b="2726">Version</wd>

<space/>

<wd l="2851" t="2582" r="2914" b="2722">1</wd>

<space/>

<wd l="3019" t="2582" r="3336" b="2760">(ref.</wd>

<space/>

<wd l="3427" t="2582" r="4651" b="2760">LDC2006T13).</wd>

<space/>

<wd l="4824" t="2587" r="5290" b="2726">DVD.</wd>

<space/>

<wd l="5462" t="2582" r="5798" b="2726">Dis-</wd>

</ln>

<ln l="1656" t="2803" r="4838" b="2990" baseLine="2938" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="2803" r="2275" b="2947">tributed</wd>

<space/>

<wd l="2323" t="2803" r="2520" b="2990">by</wd>

<space/>

<wd l="2573" t="2803" r="3379" b="2990">Linguistic</wd>

<space/>

<wd l="3432" t="2808" r="3811" b="2947">Data</wd>

<space/>

<wd l="3864" t="2803" r="4838" b="2947">Consortium.</wd>

</ln>

</para>

<para l="1445" t="3173" r="5813" b="4238" alignment="justified" li="216" spaceBefore="153" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1445" t="3173" r="5808" b="3360" baseLine="3307" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="3173" r="2174" b="3360">Grzegorz</wd>

<space/>

<wd l="2256" t="3173" r="3024" b="3360">Chrupała.</wd>

<space/>

<wd l="3192" t="3173" r="3624" b="3317">2014.</wd>

<space/>

<wd l="3787" t="3173" r="4790" b="3360">Normalizing</wd>

<space/>

<wd l="4867" t="3192" r="5371" b="3317">tweets</wd>

<space/>

<wd l="5453" t="3173" r="5808" b="3317">with</wd>

<space/>

</ln>

<ln l="1661" t="3394" r="5808" b="3581" baseLine="3528" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="3394" r="1958" b="3538">edit</wd>

<space/>

<wd l="2054" t="3394" r="2563" b="3576">scripts</wd>

<space/>

<wd l="2659" t="3394" r="2942" b="3538">and</wd>

<space/>

<wd l="3034" t="3413" r="3754" b="3538">recurrent</wd>

<space/>

<wd l="3840" t="3394" r="4334" b="3538">neural</wd>

<space/>

<wd l="4435" t="3394" r="5429" b="3581">embeddings.</wd>

<space/>

<wd l="5640" t="3398" r="5808" b="3533">In</wd>

<space/>

</ln>

<ln l="1656" t="3610" r="5798" b="3792" baseLine="3749" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="3614" r="2064" b="3754">Proc.</wd>

<space/>

<wd l="2170" t="3610" r="2347" b="3792">of</wd>

<space/>

<wd l="2400" t="3610" r="2635" b="3754">the</wd>

<space/>

<wd l="2712" t="3610" r="3120" b="3754">52nd</wd>

<space/>

<wd l="3173" t="3610" r="3763" b="3754">Annual</wd>

<space/>

<wd l="3835" t="3614" r="4488" b="3792">Meeting</wd>

<space/>

<wd l="4574" t="3610" r="4757" b="3792">of</wd>

<space/>

<wd l="4805" t="3610" r="5040" b="3754">the</wd>

<space/>

<wd l="5107" t="3614" r="5798" b="3754">Associa-</wd>

</ln>

<ln l="1661" t="3830" r="5813" b="4013" baseLine="3965" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="3835" r="1963" b="3974">tion</wd>

<space/>

<wd l="1978" t="3830" r="2256" b="4013">for</wd>

<space/>

<wd l="2299" t="3830" r="3490" b="4013">Computational</wd>

<space/>

<wd l="3528" t="3835" r="4406" b="4013">Linguistics</wd>

<space/>

<wd l="4454" t="3830" r="5102" b="4008">(Volume</wd>

<space/>

<wd l="5150" t="3830" r="5304" b="3974">2:</wd>

<space/>

<wd l="5376" t="3830" r="5813" b="3974">Short</wd>

<space/>

</ln>

<ln l="1656" t="4051" r="4099" b="4238" baseLine="4186">

<wd l="1656" t="4056" r="2314" b="4234"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Papers)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2371" t="4094" r="2818" b="4238">pages</wd>

<space/>

<wd l="2880" t="4051" r="3610" b="4195">680–686.</wd>

<space/>

<wd l="3672" t="4051" r="4099" b="4195">ACL.</wd>

</run>

</ln>

</para>

<para l="1440" t="4421" r="5798" b="5702" alignment="justified" li="216" spaceBefore="150" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1440" t="4421" r="5798" b="4608" baseLine="4555" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="4426" r="1670" b="4565">Bo</wd>

<space/>

<wd l="1728" t="4426" r="2054" b="4565">Han</wd>

<space/>

<wd l="2117" t="4421" r="2400" b="4565">and</wd>

<space/>

<wd l="2453" t="4421" r="3130" b="4608">Timothy</wd>

<space/>

<wd l="3187" t="4421" r="3898" b="4565">Baldwin.</wd>

<space/>

<wd l="3998" t="4421" r="4430" b="4565">2011.</wd>

<space/>

<wd l="4526" t="4421" r="5117" b="4565">Lexical</wd>

<space/>

<wd l="5174" t="4421" r="5798" b="4565">normal-</wd>

</ln>

<ln l="1656" t="4637" r="5794" b="4824" baseLine="4776" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="4637" r="2189" b="4781">isation</wd>

<space/>

<wd l="2246" t="4637" r="2414" b="4781">of</wd>

<space/>

<wd l="2467" t="4637" r="2856" b="4781">short</wd>

<space/>

<wd l="2904" t="4656" r="3202" b="4781">text</wd>

<space/>

<wd l="3250" t="4680" r="4042" b="4824">messages:</wd>

<space/>

<wd l="4123" t="4637" r="4565" b="4781">makn</wd>

<space/>

<wd l="4622" t="4680" r="4954" b="4781">sens</wd>

<space/>

<wd l="5011" t="4680" r="5098" b="4781">a</wd>

<space/>

<wd l="5146" t="4637" r="5794" b="4781">#twitter.</wd>

<space/>

</ln>

<ln l="1656" t="4858" r="5798" b="5040" baseLine="4997">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="4862" r="1824" b="4997">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1891" t="4862" r="2294" b="5002">Proc.</wd>

<space/>

<wd l="2386" t="4858" r="2568" b="5040">of</wd>

<space/>

<wd l="2606" t="4858" r="2846" b="5002">the</wd>

<space/>

<wd l="2914" t="4858" r="3264" b="5002">49th</wd>

<space/>

<wd l="3317" t="4858" r="3907" b="5002">Annual</wd>

<space/>

<wd l="3965" t="4862" r="4622" b="5040">Meeting</wd>

<space/>

<wd l="4694" t="4858" r="4877" b="5040">of</wd>

<space/>

<wd l="4915" t="4858" r="5150" b="5002">the</wd>

<space/>

<wd l="5203" t="4862" r="5798" b="5002">Associ-</wd>

</run>

</ln>

<ln l="1656" t="5078" r="5798" b="5261" baseLine="5213" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="5083" r="2064" b="5222">ation</wd>

<space/>

<wd l="2107" t="5078" r="2386" b="5261">for</wd>

<space/>

<wd l="2458" t="5078" r="3648" b="5261">Computational</wd>

<space/>

<wd l="3715" t="5083" r="4651" b="5261">Linguistics:</wd>

<space/>

<wd l="4762" t="5083" r="5352" b="5222">Human</wd>

<space/>

<wd l="5424" t="5083" r="5798" b="5222">Lan-</wd>

</ln>

<ln l="1656" t="5294" r="5798" b="5477" baseLine="5434">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="5342" r="2141" b="5477">guage</wd>

<space/>

<wd l="2237" t="5294" r="3264" b="5477">Technologies</wd>

<space/>

<wd l="3355" t="5299" r="4219" b="5472">(ACL-HLT</wd>

<space/>

<wd l="4286" t="5294" r="4742" b="5472">2011)</wd>

<space/>

<wd l="4843" t="5381" r="4891" b="5395">-</wd>

<space/>

<wd l="5002" t="5294" r="5568" b="5438">Volume</wd>

<space/>

</run>

<wd l="5664" t="5294" r="5798" b="5462"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="1656" t="5515" r="3389" b="5702" baseLine="5650" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="5558" r="2107" b="5702">pages</wd>

<space/>

<wd l="2165" t="5515" r="2899" b="5659">368–378.</wd>

<space/>

<wd l="2957" t="5515" r="3389" b="5659">ACL.</wd>

</ln>

</para>

<para l="1440" t="5885" r="5818" b="6720" alignment="justified" li="216" spaceBefore="156" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1440" t="5885" r="5794" b="6072" baseLine="6024" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="5890" r="1670" b="6029">Bo</wd>

<space/>

<wd l="1766" t="5890" r="2141" b="6053">Han,</wd>

<space/>

<wd l="2246" t="5885" r="2597" b="6029">Paul</wd>

<space/>

<wd l="2698" t="5885" r="3168" b="6053">Cook,</wd>

<space/>

<wd l="3278" t="5885" r="3566" b="6029">and</wd>

<space/>

<wd l="3658" t="5885" r="4330" b="6072">Timothy</wd>

<space/>

<wd l="4426" t="5885" r="5141" b="6029">Baldwin.</wd>

<space/>

<wd l="5362" t="5885" r="5794" b="6029">2013.</wd>

<space/>

</ln>

<ln l="1656" t="6106" r="5818" b="6250" baseLine="6240">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1656" t="6106" r="2251" b="6250">Lexical</wd>

<space/>

<wd l="2323" t="6106" r="3432" b="6250">normalization</wd>

<space/>

<wd l="3504" t="6106" r="3734" b="6250">for</wd>

<space/>

<wd l="3816" t="6106" r="4267" b="6250">social</wd>

<space/>

<wd l="4344" t="6106" r="4834" b="6250">media</wd>

<space/>

<wd l="4901" t="6125" r="5237" b="6250">text.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="5376" t="6110" r="5818" b="6250">ACM</wd>

<space/>

</run>

</ln>

<ln l="1666" t="6326" r="5803" b="6509" baseLine="6461" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1666" t="6331" r="2683" b="6470">Transactions</wd>

<space/>

<wd l="2746" t="6374" r="2933" b="6470">on</wd>

<space/>

<wd l="2986" t="6326" r="3816" b="6509">Intelligent</wd>

<space/>

<wd l="3864" t="6331" r="4493" b="6509">Systems</wd>

<space/>

<wd l="4546" t="6326" r="4853" b="6470">and</wd>

<space/>

<wd l="4910" t="6326" r="5803" b="6509">Technology</wd>

<space/>

</ln>

<ln l="1661" t="6542" r="3413" b="6720" baseLine="6682">

<wd l="1661" t="6547" r="2222" b="6720"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">(TIST)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="2280" t="6542" r="3413" b="6720">4(1):5:1–5:27.</wd>

</run>

</ln>

</para>

<para l="1440" t="6912" r="5803" b="7978" alignment="justified" li="216" spaceBefore="149" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1440" t="6912" r="5798" b="7099" baseLine="7051" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6912" r="2170" b="7056">Reinhard</wd>

<space/>

<wd l="2285" t="6917" r="2842" b="7056">Kneser</wd>

<space/>

<wd l="2952" t="6912" r="3240" b="7056">and</wd>

<space/>

<wd l="3346" t="6917" r="4085" b="7056">Hermann</wd>

<space/>

<wd l="4190" t="6917" r="4546" b="7099">Ney.</wd>

<space/>

<wd l="4834" t="6912" r="5251" b="7056">1995.</wd>

<space/>

<wd l="5520" t="6917" r="5798" b="7051">Im-</wd>

</ln>

<ln l="1656" t="7133" r="5794" b="7320" baseLine="7267" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="7133" r="2208" b="7315">proved</wd>

<space/>

<wd l="2261" t="7133" r="3192" b="7320">backing-off</wd>

<space/>

<wd l="3235" t="7133" r="3470" b="7277">for</wd>

<space/>

<wd l="3523" t="7138" r="4181" b="7320">M-gram</wd>

<space/>

<wd l="4229" t="7133" r="4949" b="7320">language</wd>

<space/>

<wd l="5002" t="7133" r="5794" b="7320">modeling.</wd>

<space/>

</ln>

<ln l="1656" t="7354" r="5803" b="7536" baseLine="7488">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="7358" r="1824" b="7493">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1906" t="7358" r="2314" b="7498">Proc.</wd>

<space/>

<wd l="2419" t="7354" r="2597" b="7536">of</wd>

<space/>

<wd l="2654" t="7354" r="2890" b="7498">the</wd>

<space/>

<wd l="2966" t="7358" r="3413" b="7493">IEEE</wd>

<space/>

<wd l="3480" t="7354" r="4536" b="7498">International</wd>

<space/>

<wd l="4622" t="7354" r="5525" b="7536">Conference</wd>

<space/>

<wd l="5611" t="7402" r="5803" b="7498">on</wd>

<space/>

</run>

</ln>

<ln l="1642" t="7570" r="5798" b="7752" baseLine="7709" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="7574" r="2453" b="7738">Acoustics,</wd>

<space/>

<wd l="2534" t="7570" r="3096" b="7752">Speech</wd>

<space/>

<wd l="3158" t="7570" r="3466" b="7714">and</wd>

<space/>

<wd l="3523" t="7570" r="4032" b="7752">Signal</wd>

<space/>

<wd l="4094" t="7574" r="4963" b="7752">Processing</wd>

<space/>

<wd l="5035" t="7574" r="5798" b="7747">(ICASSP-</wd>

</ln>

<ln l="1656" t="7790" r="4637" b="7978" baseLine="7925">

<wd l="1656" t="7790" r="1968" b="7968"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">95)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2026" t="7790" r="2616" b="7934">volume</wd>

<space/>

<wd l="2688" t="7790" r="2808" b="7958">1,</wd>

<space/>

<wd l="2866" t="7834" r="3317" b="7978">pages</wd>

<space/>

<wd l="3389" t="7790" r="4104" b="7934">181–184.</wd>

<space/>

<wd l="4166" t="7795" r="4637" b="7934">IEEE.</wd>

</run>

</ln>

</para>

<para l="1445" t="8160" r="5803" b="8568" alignment="justified" li="216" spaceBefore="148" fli="-216" lsp="exactly" lspExact="221" language="en">

<ln l="1445" t="8160" r="5803" b="8342" baseLine="8294">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="8160" r="2213" b="8304">Catherine</wd>

<space/>

<wd l="2366" t="8160" r="2914" b="8328">Kobus,</wd>

<space/>

</run>

<wd l="3091" t="8160" r="3773" b="8342"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">François</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3926" t="8165" r="4406" b="8328">Yvon,</wd>

<space/>

<wd l="4589" t="8160" r="4872" b="8304">and</wd>

<space/>

<wd l="5026" t="8160" r="5803" b="8304">Géraldine</wd>

<space/>

</run>

</ln>

<ln l="1656" t="8381" r="5803" b="8568" baseLine="8515" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="8381" r="2381" b="8525">Damnati.</wd>

<space/>

<wd l="2659" t="8381" r="3091" b="8525">2008.</wd>

<space/>

<wd l="3360" t="8381" r="4363" b="8568">Normalizing</wd>

<space/>

<wd l="4478" t="8381" r="4910" b="8525">SMS:</wd>

<space/>

<wd l="5035" t="8386" r="5333" b="8525">Are</wd>

<space/>

<wd l="5443" t="8386" r="5803" b="8525">Two</wd>

</ln>

</para>

<para l="1651" t="8597" r="5808" b="9398" alignment="justified" li="216" spaceBefore="2" lsp="exactly" lspExact="219" language="en">

<tabs position="1651"/>

<ln l="1656" t="8597" r="5803" b="8779" baseLine="8736" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="8597" r="2506" b="8779">Metaphors</wd>

<space/>

<wd l="2616" t="8602" r="3101" b="8741">Better</wd>

<space/>

<wd l="3206" t="8597" r="3610" b="8741">Than</wd>

<space/>

<wd l="3725" t="8597" r="4138" b="8741">One?</wd>

<tab position="4138"/>

<wd l="4502" t="8602" r="4670" b="8736">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4771" t="8602" r="5179" b="8741">Proc.</wd>

<space/>

<wd l="5309" t="8597" r="5491" b="8779">of</wd>

<space/>

<wd l="5568" t="8597" r="5803" b="8741">the</wd>

</run>

</ln>

<ln l="1656" t="8818" r="5808" b="9000" baseLine="8952" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1656" t="8818" r="2064" b="8962">22nd</wd>

<space/>

<wd l="2150" t="8818" r="3206" b="8962">International</wd>

<space/>

<wd l="3312" t="8818" r="4214" b="9000">Conference</wd>

<space/>

<wd l="4315" t="8866" r="4507" b="8962">on</wd>

<space/>

<wd l="4618" t="8818" r="5808" b="9000">Computational</wd>

<space/>

</ln>

<ln l="1651" t="9038" r="5808" b="9226" baseLine="9173" forcedEOF="true">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="9043" r="2534" b="9221">Linguistics</wd>

<space/>

<wd l="2616" t="9038" r="3734" b="9216">(COLING’08)</wd>

<space/>

<wd l="3830" t="9125" r="3878" b="9139">-</wd>

<space/>

<wd l="3984" t="9038" r="4555" b="9182">Volume</wd>

<space/>

</run>

<wd l="4646" t="9038" r="4781" b="9206"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4872" t="9082" r="5323" b="9226">pages</wd>

<space/>

<wd l="5405" t="9038" r="5808" b="9178">441–</wd>

<space/>

</run>

</ln>

<ln l="1656" t="9254" r="2486" b="9398" baseLine="9394" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1656" t="9254" r="1997" b="9398">448.</wd>

<space/>

<wd l="2054" t="9254" r="2486" b="9398">ACL.</wd>

</ln>

</para>

<para l="1440" t="9624" r="5803" b="10248" alignment="justified" li="216" spaceBefore="149" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1440" t="9624" r="5803" b="9816" baseLine="9763" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9629" r="1882" b="9773">Paula</wd>

<space/>

<wd l="1973" t="9624" r="2467" b="9816">López</wd>

<space/>

<wd l="2563" t="9624" r="2923" b="9773">Rúa.</wd>

<space/>

<wd l="3144" t="9629" r="3576" b="9773">2007.</wd>

<space/>

<wd l="3797" t="9629" r="4517" b="9816">Teaching</wd>

<space/>

<wd l="4613" t="9629" r="4834" b="9768">L2</wd>

<space/>

<wd l="4930" t="9629" r="5803" b="9816">vocabulary</wd>

<space/>

</ln>

<ln l="1656" t="9845" r="5794" b="10032" baseLine="9984" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="9845" r="2280" b="10032">through</wd>

<space/>

<wd l="2357" t="9845" r="2741" b="9989">SMS</wd>

<space/>

<wd l="2822" t="9845" r="3581" b="10032">language:</wd>

<space/>

<wd l="3710" t="9845" r="4157" b="9989">Some</wd>

<space/>

<wd l="4238" t="9845" r="4862" b="9989">didactic</wd>

<space/>

<wd l="4939" t="9845" r="5794" b="10032">guidelines.</wd>

<space/>

</ln>

<ln l="1651" t="10066" r="5794" b="10248" baseLine="10200">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1651" t="10066" r="2342" b="10210">Estudios</wd>

<space/>

<wd l="2386" t="10066" r="2573" b="10210">de</wd>

<space/>

<wd l="2621" t="10066" r="3451" b="10248">lingüistica</wd>

<space/>

<wd l="3504" t="10066" r="4070" b="10248">inglesa</wd>

<space/>

</run>

<wd l="4114" t="10066" r="4853" b="10248"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">aplicada</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="4901" t="10066" r="5794" b="10210">7:165–188.</wd>

</run>

</ln>

</para>

<para l="1445" t="10435" r="5798" b="10838" alignment="justified" li="216" spaceBefore="152" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1445" t="10435" r="5794" b="10622" baseLine="10570" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="10435" r="2381" b="10618">Christopher</wd>

<space/>

<wd l="2453" t="10440" r="2635" b="10579">D.</wd>

<space/>

<wd l="2717" t="10435" r="3432" b="10622">Manning</wd>

<space/>

<wd l="3509" t="10435" r="3792" b="10579">and</wd>

<space/>

<wd l="3859" t="10435" r="4474" b="10579">Hinrich</wd>

<space/>

<wd l="4546" t="10435" r="5208" b="10579">Schütze.</wd>

<space/>

<wd l="5376" t="10435" r="5794" b="10579">1999.</wd>

<space/>

</ln>

<ln l="1656" t="10656" r="5798" b="10838" baseLine="10790">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="10656" r="2645" b="10800">Foundations</wd>

<space/>

<wd l="2736" t="10656" r="2918" b="10838">of</wd>

<space/>

<wd l="2976" t="10656" r="3778" b="10800">Statistical</wd>

<space/>

<wd l="3859" t="10656" r="4483" b="10800">Natural</wd>

<space/>

<wd l="4565" t="10661" r="5357" b="10838">Language</wd>

<space/>

<wd l="5448" t="10661" r="5798" b="10800">Pro-</wd>

</run>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1661" t="10872" r="5798" b="11280" alignment="justified" li="216" lsp="exactly" lspExact="219" language="en">

<tabs position="1661"/>

<ln l="1661" t="10872" r="5798" b="11059" baseLine="11011" forcedEOF="true">

<wd l="1661" t="10877" r="2285" b="11054"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">cessing</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><tab position="2285"/>

<wd l="2683" t="10872" r="2990" b="11016">The</wd>

<space/>

<wd l="3139" t="10877" r="3504" b="11011">MIT</wd>

<space/>

<wd l="3653" t="10877" r="4118" b="11040">Press,</wd>

<space/>

<wd l="4301" t="10872" r="5179" b="11059">Cambridge</wd>

<space/>

</run>

<wd l="5338" t="10872" r="5798" b="11050"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(Mas-</run>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">
</run>

</wd>

</ln>

<ln l="1666" t="11093" r="4426" b="11280" baseLine="11227" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1666" t="11093" r="2525" b="11270">sachusetts)</wd>

<space/>

<wd l="2587" t="11093" r="2870" b="11237">and</wd>

<space/>

<wd l="2918" t="11093" r="3542" b="11237">London</wd>

<space/>

<wd l="3600" t="11093" r="4426" b="11280">(England).</wd>

</ln>

</para>

<para l="1445" t="11462" r="5808" b="13622" alignment="justified" li="216" spaceBefore="153" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1445" t="11462" r="5798" b="11650" baseLine="11597" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="11462" r="2045" b="11606">Olutobi</wd>

<space/>

<wd l="2170" t="11462" r="2904" b="11645">Owoputi,</wd>

<space/>

<wd l="3043" t="11462" r="3715" b="11606">Brendan</wd>

<space/>

<wd l="3840" t="11462" r="4680" b="11630">O’Connor,</wd>

<space/>

<wd l="4824" t="11462" r="5242" b="11606">Chris</wd>

<space/>

<wd l="5366" t="11467" r="5798" b="11650">Dyer,</wd>

<space/>

</ln>

<ln l="1661" t="11683" r="5794" b="11866" baseLine="11818" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="11683" r="2136" b="11827">Kevin</wd>

<space/>

<wd l="2251" t="11683" r="2885" b="11866">Gimpel,</wd>

<space/>

<wd l="3019" t="11683" r="3590" b="11827">Nathan</wd>

<space/>

<wd l="3710" t="11683" r="4536" b="11851">Schneider,</wd>

<space/>

<wd l="4675" t="11683" r="4958" b="11827">and</wd>

<space/>

<wd l="5069" t="11683" r="5501" b="11827">Noah</wd>

<space/>

<wd l="5611" t="11688" r="5794" b="11827">A.</wd>

<space/>

</ln>

<ln l="1661" t="11899" r="5803" b="12086" baseLine="12038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="11899" r="2174" b="12043">Smith.</wd>

<space/>

<wd l="2419" t="11899" r="2851" b="12043">2013.</wd>

<space/>

<wd l="3091" t="11899" r="3859" b="12082">Improved</wd>

<space/>

<wd l="3960" t="11899" r="5112" b="12082">part-of-speech</wd>

<space/>

<wd l="5208" t="11899" r="5803" b="12086">tagging</wd>

<space/>

</ln>

<ln l="1656" t="12120" r="5794" b="12264" baseLine="12254" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="12120" r="1891" b="12264">for</wd>

<space/>

<wd l="1987" t="12120" r="2477" b="12264">online</wd>

<space/>

<wd l="2578" t="12120" r="3720" b="12264">conversational</wd>

<space/>

<wd l="3816" t="12139" r="4114" b="12264">text</wd>

<space/>

<wd l="4200" t="12120" r="4555" b="12264">with</wd>

<space/>

<wd l="4646" t="12120" r="5054" b="12264">word</wd>

<space/>

<wd l="5150" t="12120" r="5794" b="12264">clusters.</wd>

<space/>

</ln>

<ln l="1656" t="12341" r="5803" b="12523" baseLine="12475">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="12346" r="1824" b="12480">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1949" t="12346" r="2352" b="12485">Proc.</wd>

<space/>

<wd l="2501" t="12341" r="2683" b="12523">of</wd>

<space/>

<wd l="2779" t="12341" r="3014" b="12485">the</wd>

<space/>

<wd l="3139" t="12341" r="3538" b="12485">2013</wd>

<space/>

<wd l="3672" t="12341" r="4570" b="12523">Conference</wd>

<space/>

<wd l="4699" t="12341" r="4882" b="12523">of</wd>

<space/>

<wd l="4978" t="12341" r="5218" b="12485">the</wd>

<space/>

<wd l="5338" t="12341" r="5803" b="12485">North</wd>

<space/>

</run>

</ln>

<ln l="1642" t="12557" r="5798" b="12739" baseLine="12696" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="12562" r="2429" b="12701">American</wd>

<space/>

<wd l="2501" t="12557" r="3154" b="12739">Chapter</wd>

<space/>

<wd l="3211" t="12557" r="3394" b="12739">of</wd>

<space/>

<wd l="3427" t="12557" r="3662" b="12701">the</wd>

<space/>

<wd l="3710" t="12562" r="4651" b="12701">Association</wd>

<space/>

<wd l="4680" t="12557" r="4958" b="12739">for</wd>

<space/>

<wd l="5016" t="12562" r="5798" b="12739">Computa-</wd>

</ln>

<ln l="1661" t="12778" r="5803" b="12960" baseLine="12912" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="12778" r="2126" b="12922">tional</wd>

<space/>

<wd l="2189" t="12782" r="3130" b="12960">Linguistics:</wd>

<space/>

<wd l="3240" t="12782" r="3826" b="12922">Human</wd>

<space/>

<wd l="3898" t="12782" r="4690" b="12960">Language</wd>

<space/>

<wd l="4776" t="12778" r="5803" b="12960">Technologies</wd>

<space/>

</ln>

<ln l="1661" t="12998" r="5808" b="13186" baseLine="13133">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="13003" r="2779" b="13176">(NAACL-HLT</wd>

<space/>

</run>

<wd l="2818" t="12998" r="3326" b="13176"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2013)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3389" t="13042" r="3835" b="13186">pages</wd>

<space/>

<wd l="3902" t="12998" r="4637" b="13142">380–390.</wd>

<space/>

<wd l="4704" t="12998" r="5131" b="13142">ACL.</wd>

<space/>

<wd l="5237" t="12998" r="5808" b="13142">Toolkit</wd>

<space/>

</run>

</ln>

<ln l="1661" t="13214" r="5789" b="13392" baseLine="13354">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="13214" r="2366" b="13358">available</wd>

<space/>

<wd l="2438" t="13234" r="2616" b="13358">at:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2702" t="13219" r="5789" b="13392">http://www.ark.cs.cmu.edu/</wd>

<space/>

</run>

</ln>

<ln l="1666" t="13435" r="4598" b="13622" baseLine="13570">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1666" t="13440" r="2717" b="13594">TweetNLP/</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2794" t="13435" r="3384" b="13613">(visited</wd>

<space/>

<wd l="3437" t="13478" r="3634" b="13579">on</wd>

<space/>

<wd l="3682" t="13440" r="4042" b="13622">May</wd>

<space/>

<wd l="4099" t="13435" r="4598" b="13613">2015).</wd>

</run>

</ln>

</para>

<para l="1440" t="13805" r="5803" b="15307" alignment="justified" li="216" spaceBefore="156" fli="-216" lsp="exactly" lspExact="218" language="en">

<ln l="1440" t="13805" r="5803" b="13992" baseLine="13943" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13805" r="1843" b="13949">Lluís</wd>

<space/>

<wd l="1915" t="13805" r="2376" b="13949">Padró</wd>

<space/>

<wd l="2448" t="13805" r="2731" b="13949">and</wd>

<space/>

<wd l="2798" t="13810" r="3398" b="13992">Evgeny</wd>

<space/>

<wd l="3475" t="13805" r="4430" b="13992">Stanilovsky.</wd>

<space/>

<wd l="4574" t="13805" r="5006" b="13949">2012.</wd>

<space/>

<wd l="5141" t="13805" r="5803" b="13992">Freeling</wd>

<space/>

</ln>

<ln l="1661" t="14026" r="5798" b="14213" baseLine="14160">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="14026" r="1944" b="14170">3.0:</wd>

<space/>

<wd l="2088" t="14026" r="2755" b="14170">Towards</wd>

<space/>

<wd l="2842" t="14026" r="3341" b="14170">Wider</wd>

<space/>

<wd l="3422" t="14026" r="4656" b="14213">Multilinguality.</wd>

<space/>

<wd l="4838" t="14030" r="5006" b="14165">In</wd>

<space/>

</run>

<wd l="5083" t="14026" r="5798" b="14170" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Proceed-</wd>

</ln>

<ln l="1666" t="14242" r="5798" b="14424" baseLine="14381" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1666" t="14246" r="1992" b="14424">ings</wd>

<space/>

<wd l="2059" t="14242" r="2242" b="14424">of</wd>

<space/>

<wd l="2280" t="14242" r="2515" b="14386">the</wd>

<space/>

<wd l="2578" t="14242" r="3019" b="14424">Eight</wd>

<space/>

<wd l="3072" t="14242" r="4128" b="14386">International</wd>

<space/>

<wd l="4200" t="14242" r="5102" b="14424">Conference</wd>

<space/>

<wd l="5170" t="14290" r="5362" b="14386">on</wd>

<space/>

<wd l="5424" t="14246" r="5798" b="14386">Lan-</wd>

</ln>

<ln l="1656" t="14462" r="5798" b="14645" baseLine="14602">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="14510" r="2141" b="14645">guage</wd>

<space/>

<wd l="2227" t="14467" r="3043" b="14606">Resources</wd>

<space/>

<wd l="3134" t="14462" r="3442" b="14606">and</wd>

<space/>

<wd l="3518" t="14462" r="4397" b="14606">Evaluation</wd>

<space/>

</run>

<wd l="4498" t="14462" r="5414" b="14640"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(LREC’12)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5520" t="14467" r="5798" b="14606">Eu-</wd>

</run>

</ln>

<ln l="1656" t="14683" r="5794" b="14870" baseLine="14818" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="14726" r="2198" b="14866">ropean</wd>

<space/>

<wd l="2290" t="14688" r="3072" b="14870">Language</wd>

<space/>

<wd l="3163" t="14688" r="3979" b="14827">Resources</wd>

<space/>

<wd l="4070" t="14683" r="5016" b="14827">Association</wd>

<space/>

<wd l="5112" t="14683" r="5794" b="14861">(ELRA).</wd>

<space/>

</ln>

<ln l="1656" t="14899" r="5765" b="15077" baseLine="15038">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="14899" r="2232" b="15043">Toolkit</wd>

<space/>

<wd l="2366" t="14899" r="3067" b="15043">available</wd>

<space/>

<wd l="3206" t="14918" r="3384" b="15043">at:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3538" t="14904" r="5765" b="15077">http://nlp.lsi.upc.</wd>

<space/>

</run>

</ln>

<ln l="1666" t="15120" r="5078" b="15307" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1666" t="15125" r="3192" b="15298">edu/freeling/</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3274" t="15120" r="3859" b="15298">(visited</wd>

<space/>

<wd l="3917" t="15163" r="4109" b="15264">on</wd>

<space/>

<wd l="4157" t="15125" r="4522" b="15307">May</wd>

<space/>

<wd l="4579" t="15120" r="5078" b="15298">2015).</wd>

</run>

</ln>

</para>

</column>

<column l="6143" t="1296" r="10530" b="7947">

<para l="6144" t="1334" r="10512" b="3058" alignment="justified" li="216" spaceBefore="10" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="1334" r="10512" b="1478" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1334" r="6634" b="1478">Adam</wd>

<space/>

<wd l="6686" t="1334" r="7109" b="1478">Pauls</wd>

<space/>

<wd l="7176" t="1334" r="7459" b="1478">and</wd>

<space/>

<wd l="7512" t="1339" r="7838" b="1478">Dan</wd>

<space/>

<wd l="7901" t="1334" r="8376" b="1478">Klein.</wd>

<space/>

<wd l="8482" t="1334" r="8914" b="1478">2011.</wd>

<space/>

<wd l="9010" t="1339" r="9494" b="1478">Faster</wd>

<space/>

<wd l="9552" t="1334" r="9840" b="1478">and</wd>

<space/>

<wd l="9898" t="1334" r="10512" b="1478">Smaller</wd>

<space/>

</ln>

<ln l="6365" t="1555" r="10507" b="1742" baseLine="1694">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="1560" r="6989" b="1742">N-gram</wd>

<space/>

<wd l="7075" t="1560" r="7858" b="1742">Language</wd>

<space/>

<wd l="7949" t="1555" r="8587" b="1699">Models.</wd>

<space/>

<wd l="8803" t="1560" r="8966" b="1694">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9058" t="1560" r="9466" b="1699">Proc.</wd>

<space/>

<wd l="9581" t="1555" r="9763" b="1738">of</wd>

<space/>

<wd l="9826" t="1555" r="10066" b="1699">the</wd>

<space/>

<wd l="10157" t="1555" r="10507" b="1699">49th</wd>

<space/>

</run>

</ln>

<ln l="6350" t="1776" r="10502" b="1958" baseLine="1910" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6350" t="1776" r="6941" b="1920">Annual</wd>

<space/>

<wd l="7027" t="1781" r="7680" b="1958">Meeting</wd>

<space/>

<wd l="7786" t="1776" r="7963" b="1958">of</wd>

<space/>

<wd l="8030" t="1776" r="8270" b="1920">the</wd>

<space/>

<wd l="8352" t="1781" r="9293" b="1920">Association</wd>

<space/>

<wd l="9355" t="1776" r="9629" b="1958">for</wd>

<space/>

<wd l="9725" t="1781" r="10502" b="1958">Computa-</wd>

</ln>

<ln l="6370" t="1992" r="10512" b="2174" baseLine="2131" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="1992" r="6830" b="2136">tional</wd>

<space/>

<wd l="6898" t="1997" r="7834" b="2174">Linguistics:</wd>

<space/>

<wd l="7944" t="1997" r="8530" b="2136">Human</wd>

<space/>

<wd l="8602" t="1997" r="9398" b="2174">Language</wd>

<space/>

<wd l="9480" t="1992" r="10512" b="2174">Technologies</wd>

<space/>

</ln>

<ln l="6370" t="2213" r="10498" b="2400" baseLine="2352">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="2218" r="7238" b="2390">(ACL-HLT</wd>

<space/>

<wd l="7272" t="2213" r="7728" b="2390">2011)</wd>

<space/>

<wd l="7800" t="2299" r="7848" b="2314">-</wd>

<space/>

<wd l="7930" t="2213" r="8496" b="2357">Volume</wd>

<space/>

</run>

<wd l="8563" t="2213" r="8698" b="2381"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8760" t="2256" r="9206" b="2400">pages</wd>

<space/>

<wd l="9274" t="2213" r="10003" b="2357">258–267.</wd>

<space/>

<wd l="10070" t="2213" r="10498" b="2357">ACL.</wd>

<space/>

</run>

</ln>

<ln l="6365" t="2434" r="10493" b="2621" baseLine="2568">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="2434" r="7373" b="2621">BerkeleyLM</wd>

<space/>

<wd l="7474" t="2477" r="7982" b="2578">source</wd>

<space/>

<wd l="8074" t="2434" r="8443" b="2578">code</wd>

<space/>

<wd l="8534" t="2434" r="9240" b="2578">available</wd>

<space/>

<wd l="9331" t="2453" r="9470" b="2578">at</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9562" t="2438" r="10493" b="2611">https://</wd>

<space/>

</run>

</ln>

<ln l="6379" t="2650" r="10512" b="2827" baseLine="2789">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6379" t="2654" r="9811" b="2827">code.google.com/p/berkeleylm/</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9922" t="2650" r="10512" b="2827">(visited</wd>

<space/>

</run>

</ln>

<ln l="6370" t="2870" r="7531" b="3058" baseLine="3005" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="2914" r="6566" b="3014">on</wd>

<space/>

<wd l="6614" t="2875" r="6974" b="3058">May</wd>

<space/>

<wd l="7032" t="2870" r="7531" b="3048">2015).</wd>

</ln>

</para>

<para l="6144" t="3269" r="10498" b="3672" alignment="justified" li="216" spaceBefore="180" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="3269" r="10498" b="3456" baseLine="3408" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3274" r="6926" b="3413">Lawrence</wd>

<space/>

<wd l="6989" t="3269" r="7584" b="3451">Philips.</wd>

<space/>

<wd l="7728" t="3269" r="8146" b="3413">1990.</wd>

<space/>

<wd l="8270" t="3269" r="8952" b="3456">Hanging</wd>

<space/>

<wd l="9024" t="3312" r="9221" b="3413">on</wd>

<space/>

<wd l="9278" t="3269" r="9523" b="3413">the</wd>

<space/>

<wd l="9586" t="3269" r="10498" b="3451">metaphone.</wd>

<space/>

</ln>

<ln l="6374" t="3490" r="9125" b="3672" baseLine="3624">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="3494" r="7171" b="3672">Computer</wd>

<space/>

</run>

<wd l="7205" t="3494" r="8045" b="3672"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Language</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8102" t="3490" r="9125" b="3667">7(12):39–43.</wd>

</run>

</ln>

</para>

<para l="6144" t="3888" r="10512" b="5170" alignment="justified" li="216" spaceBefore="184" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="3888" r="10498" b="4075" baseLine="4022" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3888" r="6562" b="4032">Jesús</wd>

<space/>

<wd l="6643" t="3888" r="7248" b="4056">Vilares,</wd>

<space/>

<wd l="7339" t="3888" r="7915" b="4075">Miguel</wd>

<space/>

<wd l="7992" t="3893" r="8174" b="4032">A.</wd>

<space/>

<wd l="8266" t="3888" r="8885" b="4056">Alonso,</wd>

<space/>

<wd l="8976" t="3888" r="9264" b="4032">and</wd>

<space/>

<wd l="9336" t="3888" r="9821" b="4032">David</wd>

<space/>

<wd l="9898" t="3888" r="10498" b="4032">Vilares.</wd>

<space/>

</ln>

<ln l="6370" t="4104" r="10502" b="4291" baseLine="4243" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="4104" r="6802" b="4248">2013.</wd>

<space/>

<wd l="7018" t="4104" r="7944" b="4286">Prototipado</wd>

<space/>

<wd l="8040" t="4104" r="8544" b="4291">rápido</wd>

<space/>

<wd l="8645" t="4104" r="8827" b="4248">de</wd>

<space/>

<wd l="8923" t="4147" r="9120" b="4248">un</wd>

<space/>

<wd l="9221" t="4104" r="9811" b="4248">sistema</wd>

<space/>

<wd l="9907" t="4104" r="10090" b="4248">de</wd>

<space/>

<wd l="10181" t="4147" r="10502" b="4248">nor-</wd>

</ln>

<ln l="6365" t="4325" r="10512" b="4512" baseLine="4463" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="4325" r="7238" b="4469">malización</wd>

<space/>

<wd l="7320" t="4325" r="7498" b="4469">de</wd>

<space/>

<wd l="7574" t="4325" r="7958" b="4469">tuits:</wd>

<space/>

<wd l="8088" t="4330" r="8424" b="4469">Una</wd>

<space/>

<wd l="8501" t="4325" r="9590" b="4512">aproximación</wd>

<space/>

<wd l="9667" t="4325" r="10181" b="4469">léxica.</wd>

<space/>

<wd l="10344" t="4330" r="10512" b="4464">In</wd>

<space/>

</ln>

<ln l="6374" t="4546" r="10507" b="4728" baseLine="4680" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="4550" r="7344" b="4690">Tweet-Norm</wd>

<space/>

<wd l="7426" t="4546" r="7853" b="4690">2013.</wd>

<space/>

<wd l="7958" t="4550" r="8419" b="4690">Tweet</wd>

<space/>

<wd l="8486" t="4546" r="9638" b="4704">Normalization</wd>

<space/>

<wd l="9730" t="4546" r="10507" b="4728">Workshop</wd>

<space/>

</ln>

<ln l="6365" t="4762" r="10502" b="4944" baseLine="4901">

<wd l="6365" t="4762" r="6806" b="4930"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2013</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6902" t="4762" r="7498" b="4906">volume</wd>

<space/>

<wd l="7598" t="4762" r="7978" b="4906">1086</wd>

<space/>

<wd l="8069" t="4762" r="8242" b="4906">of</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8323" t="4766" r="8832" b="4906">CEUR</wd>

<space/>

<wd l="8928" t="4762" r="9701" b="4944">Workshop</wd>

<space/>

<wd l="9787" t="4762" r="10502" b="4906">Proceed-</wd>

</run>

</ln>

<ln l="6374" t="4982" r="9144" b="5170" baseLine="5122">

<wd l="6374" t="4987" r="6739" b="5165"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ings</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6797" t="5026" r="7243" b="5170">pages</wd>

<space/>

<wd l="7306" t="4982" r="7834" b="5126">39–43.</wd>

<space/>

<wd l="7901" t="4982" r="9144" b="5170">CEUR-WS.org.</wd>

</run>

</ln>

</para>

<para l="6144" t="5381" r="10522" b="6658" alignment="justified" li="216" spaceBefore="178" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="5381" r="10502" b="5568" baseLine="5519" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5381" r="6629" b="5525">David</wd>

<space/>

<wd l="6686" t="5381" r="7296" b="5549">Vilares,</wd>

<space/>

<wd l="7363" t="5381" r="7939" b="5568">Miguel</wd>

<space/>

<wd l="8002" t="5386" r="8184" b="5525">A.</wd>

<space/>

<wd l="8251" t="5381" r="8870" b="5549">Alonso,</wd>

<space/>

<wd l="8947" t="5381" r="9230" b="5525">and</wd>

<space/>

<wd l="9293" t="5381" r="9802" b="5525">Carlos</wd>

<space/>

<wd l="9874" t="5381" r="10502" b="5525">Gómez-</wd>

<space/>

</ln>

<ln l="6365" t="5602" r="10507" b="5789" baseLine="5736" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="5602" r="7234" b="5789">Rodríguez.</wd>

<space/>

<wd l="7464" t="5602" r="7896" b="5746">2015.</wd>

<space/>

<wd l="8126" t="5602" r="8366" b="5746">On</wd>

<space/>

<wd l="8458" t="5602" r="8702" b="5746">the</wd>

<space/>

<wd l="8798" t="5602" r="9624" b="5746">usefulness</wd>

<space/>

<wd l="9725" t="5602" r="9898" b="5746">of</wd>

<space/>

<wd l="9984" t="5602" r="10507" b="5746">lexical</wd>

<space/>

</ln>

<ln l="6370" t="5818" r="10522" b="6005" baseLine="5957" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="5818" r="6653" b="5962">and</wd>

<space/>

<wd l="6715" t="5818" r="7411" b="6005">syntactic</wd>

<space/>

<wd l="7464" t="5818" r="8314" b="6005">processing</wd>

<space/>

<wd l="8371" t="5818" r="8525" b="5957">in</wd>

<space/>

<wd l="8578" t="5818" r="9197" b="6005">polarity</wd>

<space/>

<wd l="9254" t="5818" r="10291" b="5962">classification</wd>

<space/>

<wd l="10349" t="5818" r="10522" b="5962">of</wd>

<space/>

</ln>

<ln l="6365" t="6038" r="10502" b="6226" baseLine="6178">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="6038" r="6936" b="6182">Twitter</wd>

<space/>

<wd l="6984" t="6082" r="7776" b="6226">messages.</wd>

<space/>

<wd l="7858" t="6038" r="8611" b="6221">Accepted</wd>

<space/>

<wd l="8659" t="6038" r="8890" b="6182">for</wd>

<space/>

<wd l="8938" t="6038" r="9835" b="6221">publication</wd>

<space/>

<wd l="9883" t="6038" r="10042" b="6178">in</wd>

<space/>

</run>

<wd l="10085" t="6043" r="10502" b="6182" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Jour-</wd>

</ln>

<ln l="6365" t="6259" r="10517" b="6442" baseLine="6394" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="6259" r="6619" b="6403">nal</wd>

<space/>

<wd l="6691" t="6259" r="6874" b="6442">of</wd>

<space/>

<wd l="6912" t="6259" r="7152" b="6403">the</wd>

<space/>

<wd l="7205" t="6264" r="8146" b="6403">Association</wd>

<space/>

<wd l="8184" t="6259" r="8458" b="6442">for</wd>

<space/>

<wd l="8510" t="6259" r="9466" b="6442">Information</wd>

<space/>

<wd l="9538" t="6264" r="10142" b="6403">Science</wd>

<space/>

<wd l="10214" t="6259" r="10517" b="6403">and</wd>

<space/>

</ln>

<ln l="6374" t="6475" r="10066" b="6658" baseLine="6614">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6374" t="6475" r="7267" b="6658">Technology</wd>

<space/>

</run>

<wd l="7325" t="6480" r="8069" b="6653"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">(JASIST)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="8155" t="6475" r="8506" b="6619">DOI</wd>

<space/>

<wd l="8578" t="6475" r="10066" b="6619">10.1002/asi.23284.</wd>

</run>

</ln>

</para>

<para l="6144" t="6874" r="10512" b="7939" alignment="justified" li="216" spaceBefore="182" fli="-216" lsp="exactly" lspExact="217" language="en">

<ln l="6144" t="6874" r="10512" b="7061" baseLine="7013" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6874" r="6331" b="7013">Yi</wd>

<space/>

<wd l="6408" t="6878" r="6816" b="7061">Yang</wd>

<space/>

<wd l="6898" t="6874" r="7181" b="7018">and</wd>

<space/>

<wd l="7253" t="6874" r="7704" b="7018">Jacob</wd>

<space/>

<wd l="7781" t="6874" r="8635" b="7018">Eisenstein.</wd>

<space/>

<wd l="8798" t="6874" r="9230" b="7018">2013.</wd>

<space/>

<wd l="9389" t="6878" r="9533" b="7013">A</wd>

<space/>

<wd l="9605" t="6874" r="10512" b="7061">Log-Linear</wd>

<space/>

</ln>

<ln l="6365" t="7094" r="10512" b="7277" baseLine="7234" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="7094" r="6883" b="7238">Model</wd>

<space/>

<wd l="6974" t="7094" r="7210" b="7238">for</wd>

<space/>

<wd l="7301" t="7094" r="8395" b="7277">Unsupervised</wd>

<space/>

<wd l="8486" t="7099" r="8851" b="7238">Text</wd>

<space/>

<wd l="8938" t="7094" r="10128" b="7238">Normalization.</wd>

<space/>

<wd l="10344" t="7099" r="10512" b="7234">In</wd>

<space/>

</ln>

<ln l="6365" t="7315" r="10512" b="7498" baseLine="7450" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="7320" r="6773" b="7459">Proc.</wd>

<space/>

<wd l="6845" t="7315" r="7022" b="7498">of</wd>

<space/>

<wd l="7046" t="7315" r="7282" b="7459">the</wd>

<space/>

<wd l="7330" t="7315" r="7728" b="7459">2013</wd>

<space/>

<wd l="7786" t="7315" r="8688" b="7498">Conference</wd>

<space/>

<wd l="8741" t="7363" r="8928" b="7459">on</wd>

<space/>

<wd l="8976" t="7315" r="9778" b="7498">Empirical</wd>

<space/>

<wd l="9821" t="7315" r="10512" b="7459">Methods</wd>

<space/>

</ln>

<ln l="6374" t="7531" r="10502" b="7714" baseLine="7670">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="7536" r="6514" b="7675">in</wd>

<space/>

<wd l="6610" t="7531" r="7234" b="7675">Natural</wd>

<space/>

<wd l="7320" t="7536" r="8117" b="7714">Language</wd>

<space/>

<wd l="8213" t="7536" r="9086" b="7714">Processing</wd>

<space/>

<wd l="9187" t="7536" r="9907" b="7709">(EMNLP</wd>

<space/>

</run>

<wd l="9998" t="7531" r="10502" b="7709"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2013)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="6365" t="7752" r="7896" b="7939" baseLine="7891" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="7795" r="6811" b="7939">pages</wd>

<space/>

<wd l="6874" t="7752" r="7402" b="7896">61–72.</wd>

<space/>

<wd l="7464" t="7752" r="7896" b="7896">ACL.</wd>

</ln>

</para>

</column>

</section>

<dd l="1436" t="15746" r="10530" b="15975">

<para l="5771" t="15787" r="6191" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15787" r="6125" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="27">

<wd l="5837" t="15787" r="6125" b="15946">105</wd>

</ln>

</para>

</dd>

</body>

</page>

</document>

