<?xml version="1.0" encoding="UTF-16"?>

<!--XML document generated using OCR technology from Nuance Communications, Inc.-->

<document xmlns="http://www.scansoft.com/omnipage/xml/ssdoc-schema3.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4311.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1416" marginTop="1420" marginRight="1402" marginBottom="358" offsetX="2" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1416" t="1420" r="10507" b="2071">

<column l="1416" t="1420" r="10507" b="2071">

<para l="2654" t="1493" r="9250" b="1766" alignment="centered" spaceBefore="9" spaceAfter="280" lsp="exactly" lspExact="350" language="en">

<ln l="2654" t="1493" r="9250" b="1766" baseLine="1694" bold="true" underlined="none" subsuperscript="none" fontSize="1500" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2654" t="1493" r="3830" b="1766">IHS_RD:</wd>

<space/>

<wd l="3931" t="1493" r="4858" b="1704">Lexical</wd>

<space/>

<wd l="4934" t="1493" r="6773" b="1704">Normalization</wd>

<space/>

<wd l="6869" t="1493" r="7238" b="1704">for</wd>

<space/>

<wd l="7320" t="1493" r="8275" b="1766">English</wd>

<space/>

<wd l="8371" t="1498" r="9250" b="1704">Tweets</wd>

</ln>

</para>

</column>

</section>

<section l="1416" t="2071" r="10507" b="14929">

<column l="1416" t="2071" r="5813" b="14929">

<para l="2194" t="2122" r="5074" b="2563" alignment="justified" li="720" ri="720" spaceBefore="6" fli="432" lsp="exactly" lspExact="268" language="en">

<ln l="2578" t="2122" r="4685" b="2338" baseLine="2285" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2578" t="2122" r="3322" b="2338">Dmitry</wd>

<space/>

<wd l="3389" t="2122" r="4685" b="2338">Supranovich</wd>

<space/>

</ln>

<ln l="2194" t="2390" r="5074" b="2563" baseLine="2554" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2194" t="2395" r="2563" b="2563">IHS</wd>

<space/>

<wd l="2640" t="2395" r="2981" b="2563">Inc.</wd>

<space/>

<wd l="3058" t="2390" r="3125" b="2563">/</wd>

<space/>

<wd l="3192" t="2395" r="3562" b="2563">IHS</wd>

<space/>

<wd l="3634" t="2390" r="4282" b="2563">Global</wd>

<space/>

<wd l="4349" t="2390" r="5074" b="2563">Belarus</wd>

</ln>

</para>

<para l="2165" t="2664" r="5102" b="3437" alignment="justified" li="864" ri="720" fli="216" lsp="exactly" lspExact="277" language="en">

<ln l="2549" t="2664" r="4738" b="2885" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="2549" t="2669" r="2856" b="2837">131</wd>

<space/>

<wd l="2962" t="2664" r="4478" b="2885">Starovilenskaya</wd>

<space/>

<wd l="4550" t="2669" r="4738" b="2837">St</wd>

<space/>

</ln>

<ln l="2486" t="2942" r="4776" b="3154" baseLine="3106" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="2486" t="2947" r="3250" b="3154">220123,</wd>

<space/>

<wd l="3322" t="2942" r="3979" b="3154">Minsk,</wd>

<space/>

<wd l="4051" t="2942" r="4776" b="3115">Belarus</wd>

<space/>

</ln>

<ln l="2165" t="3216" r="5102" b="3437" baseLine="3384" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="2165" t="3216" r="5102" b="3437">Dmitry.Supranovich@ihs.com</wd>

</ln>

</para>

<para l="3154" t="4248" r="4046" b="4416" alignment="centered" spaceBefore="750" lsp="exactly" lspExact="275" language="en">

<ln l="3154" t="4248" r="4046" b="4416" baseLine="4406" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3154" t="4248" r="4046" b="4416">Abstract</wd>

</ln>

</para>

<para l="1757" t="4747" r="5448" b="7920" alignment="justified" li="216" ri="360" spaceBefore="252" lsp="exactly" lspExact="229" language="en">

<ln l="1766" t="4747" r="5438" b="4930" baseLine="4882" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1766" t="4747" r="2112" b="4891">This</wd>

<space/>

<wd l="2184" t="4790" r="2640" b="4930">paper</wd>

<space/>

<wd l="2712" t="4747" r="3446" b="4891">describes</wd>

<space/>

<wd l="3528" t="4747" r="3768" b="4891">the</wd>

<space/>

<wd l="3850" t="4747" r="4435" b="4891">Twitter</wd>

<space/>

<wd l="4512" t="4747" r="5035" b="4891">lexical</wd>

<space/>

<wd l="5112" t="4790" r="5438" b="4891">nor-</wd>

</ln>

<ln l="1762" t="4978" r="5438" b="5160" baseLine="5112" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1762" t="4978" r="2606" b="5122">malization</wd>

<space/>

<wd l="2722" t="4997" r="3274" b="5160">system</wd>

<space/>

<wd l="3384" t="4978" r="4162" b="5122">submitted</wd>

<space/>

<wd l="4267" t="4978" r="4474" b="5160">by</wd>

<space/>

<wd l="4584" t="4978" r="4891" b="5122">IHS</wd>

<space/>

<wd l="5011" t="4978" r="5438" b="5122">R&amp;D</wd>

<space/>

</ln>

<ln l="1762" t="5208" r="5448" b="5390" baseLine="5342" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1762" t="5208" r="2366" b="5352">Belarus</wd>

<space/>

<wd l="2429" t="5227" r="2822" b="5352">team</wd>

<space/>

<wd l="2885" t="5208" r="3115" b="5352">for</wd>

<space/>

<wd l="3173" t="5208" r="3413" b="5352">the</wd>

<space/>

<wd l="3475" t="5208" r="3874" b="5352">ACL</wd>

<space/>

<wd l="3936" t="5208" r="4325" b="5352">2015</wd>

<space/>

<wd l="4397" t="5208" r="5179" b="5390">workshop</wd>

<space/>

<wd l="5251" t="5251" r="5448" b="5352">on</wd>

<space/>

</ln>

<ln l="1762" t="5438" r="5443" b="5621" baseLine="5573" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1762" t="5438" r="2194" b="5621">noisy</wd>

<space/>

<wd l="2266" t="5438" r="3437" b="5621">user-generated</wd>

<space/>

<wd l="3514" t="5458" r="3850" b="5582">text.</wd>

<space/>

<wd l="3941" t="5438" r="4243" b="5582">The</wd>

<space/>

<wd l="4315" t="5438" r="5054" b="5621">proposed</wd>

<space/>

<wd l="5136" t="5482" r="5443" b="5621">sys-</wd>

</ln>

<ln l="1762" t="5669" r="5443" b="5851" baseLine="5803" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1762" t="5688" r="2064" b="5813">tem</wd>

<space/>

<wd l="2184" t="5669" r="2808" b="5813">consists</wd>

<space/>

<wd l="2942" t="5669" r="3130" b="5813">of</wd>

<space/>

<wd l="3226" t="5688" r="3518" b="5813">two</wd>

<space/>

<wd l="3648" t="5688" r="4656" b="5851">components:</wd>

<space/>

<wd l="4795" t="5712" r="4882" b="5813">a</wd>

<space/>

<wd l="5006" t="5669" r="5443" b="5813">CRF-</wd>

</ln>

<ln l="1757" t="5894" r="5443" b="6077" baseLine="6029" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1757" t="5894" r="2218" b="6038">based</wd>

<space/>

<wd l="2294" t="5894" r="3024" b="6077">approach</wd>

<space/>

<wd l="3101" t="5914" r="3250" b="6038">to</wd>

<space/>

<wd l="3336" t="5894" r="3950" b="6077">identify</wd>

<space/>

<wd l="4018" t="5894" r="4675" b="6077">possible</wd>

<space/>

<wd l="4757" t="5894" r="5443" b="6038">normali-</wd>

</ln>

<ln l="1762" t="6125" r="5438" b="6307" baseLine="6264" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1762" t="6125" r="2246" b="6269">zation</wd>

<space/>

<wd l="2323" t="6125" r="3202" b="6298">candidates,</wd>

<space/>

<wd l="3283" t="6125" r="3571" b="6269">and</wd>

<space/>

<wd l="3643" t="6168" r="3730" b="6269">a</wd>

<space/>

<wd l="3792" t="6125" r="5050" b="6307">post-processing</wd>

<space/>

<wd l="5131" t="6144" r="5438" b="6307">step</wd>

<space/>

</ln>

<ln l="1766" t="6355" r="5448" b="6538" baseLine="6490" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1766" t="6355" r="1915" b="6494">in</wd>

<space/>

<wd l="1987" t="6398" r="2174" b="6499">an</wd>

<space/>

<wd l="2242" t="6374" r="2842" b="6538">attempt</wd>

<space/>

<wd l="2904" t="6374" r="3058" b="6499">to</wd>

<space/>

<wd l="3130" t="6355" r="3922" b="6499">normalize</wd>

<space/>

<wd l="3998" t="6355" r="4483" b="6499">words</wd>

<space/>

<wd l="4555" t="6355" r="4853" b="6499">that</wd>

<space/>

<wd l="4925" t="6355" r="5117" b="6499">do</wd>

<space/>

<wd l="5189" t="6374" r="5448" b="6499">not</wd>

<space/>

</ln>

<ln l="1762" t="6586" r="5429" b="6730" baseLine="6720" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1762" t="6586" r="2131" b="6730">have</wd>

<space/>

<wd l="2242" t="6586" r="3350" b="6730">normalization</wd>

<space/>

<wd l="3456" t="6586" r="4085" b="6730">variants</wd>

<space/>

<wd l="4200" t="6586" r="4354" b="6725">in</wd>

<space/>

<wd l="4454" t="6586" r="4694" b="6730">the</wd>

<space/>

<wd l="4810" t="6586" r="5429" b="6730">lexicon.</wd>

<space/>

</ln>

<ln l="1762" t="6816" r="5448" b="6960" baseLine="6955" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1762" t="6816" r="2626" b="6960">Evaluation</wd>

<space/>

<wd l="2722" t="6859" r="2918" b="6960">on</wd>

<space/>

<wd l="3005" t="6816" r="3245" b="6960">the</wd>

<space/>

<wd l="3341" t="6835" r="3619" b="6960">test</wd>

<space/>

<wd l="3710" t="6816" r="4042" b="6960">data</wd>

<space/>

<wd l="4142" t="6835" r="4354" b="6960">set</wd>

<space/>

<wd l="4454" t="6816" r="5054" b="6960">showed</wd>

<space/>

<wd l="5146" t="6816" r="5448" b="6960">that</wd>

<space/>

</ln>

<ln l="1766" t="7046" r="5443" b="7229" baseLine="7181" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1766" t="7090" r="2030" b="7190">our</wd>

<space/>

<wd l="2126" t="7046" r="3250" b="7190">unconstrained</wd>

<space/>

<wd l="3360" t="7066" r="3912" b="7229">system</wd>

<space/>

<wd l="4013" t="7046" r="4718" b="7190">achieved</wd>

<space/>

<wd l="4819" t="7046" r="5059" b="7190">the</wd>

<space/>

<wd l="5266" t="7051" r="5443" b="7186">F-</wd>

</ln>

<ln l="1762" t="7277" r="5438" b="7459" baseLine="7411" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1762" t="7320" r="2424" b="7421">measure</wd>

<space/>

<wd l="2510" t="7277" r="2698" b="7421">of</wd>

<space/>

<wd l="2755" t="7277" r="3293" b="7421">0.8272</wd>

<space/>

<wd l="3384" t="7277" r="3802" b="7459">(rank</wd>

<space/>

<wd l="3898" t="7277" r="3955" b="7416">1</wd>

<space/>

<wd l="4061" t="7296" r="4310" b="7421">out</wd>

<space/>

<wd l="4392" t="7277" r="4579" b="7421">of</wd>

<space/>

<wd l="4642" t="7282" r="4718" b="7421">5</wd>

<space/>

<wd l="4824" t="7277" r="5438" b="7421">submis-</wd>

</ln>

<ln l="1771" t="7507" r="5448" b="7680" baseLine="7642" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1771" t="7507" r="2165" b="7651">sions</wd>

<space/>

<wd l="2242" t="7507" r="2477" b="7651">for</wd>

<space/>

<wd l="2539" t="7507" r="2779" b="7651">the</wd>

<space/>

<wd l="2846" t="7507" r="3970" b="7651">unconstrained</wd>

<space/>

<wd l="4042" t="7507" r="4526" b="7680">mode,</wd>

<space/>

<wd l="4603" t="7507" r="4958" b="7651">rank</wd>

<space/>

<wd l="5021" t="7507" r="5112" b="7646">2</wd>

<space/>

<wd l="5194" t="7526" r="5448" b="7651">out</wd>

<space/>

</ln>

<ln l="1766" t="7738" r="3557" b="7920" baseLine="7872" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1766" t="7738" r="1954" b="7882">of</wd>

<space/>

<wd l="1978" t="7738" r="2170" b="7882">all</wd>

<space/>

<wd l="2246" t="7738" r="2405" b="7877">11</wd>

<space/>

<wd l="2486" t="7738" r="3557" b="7920">submissions).</wd>

</ln>

</para>

<para l="1435" t="8222" r="3154" b="8390" alignment="left" spaceBefore="247" lsp="exactly" lspExact="275" language="en">

<ln l="1435" t="8222" r="3154" b="8390" baseLine="8386" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="15">

<wd l="1435" t="8222" r="1522" b="8386">1</wd>

<space/>

<wd l="1858" t="8222" r="3154" b="8390">Introduction</wd>

</ln>

</para>

<para l="1416" t="8645" r="5808" b="11083" alignment="justified" spaceBefore="153" lsp="exactly" lspExact="252" language="en">

<ln l="1430" t="8645" r="5779" b="8808" baseLine="8798" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1430" t="8650" r="1968" b="8808">Social</wd>

<space/>

<wd l="2098" t="8650" r="2640" b="8808">media</wd>

<space/>

<wd l="2760" t="8669" r="3173" b="8808">texts</wd>

<space/>

<wd l="3307" t="8650" r="3821" b="8808">found</wd>

<space/>

<wd l="3946" t="8650" r="4114" b="8803">in</wd>

<space/>

<wd l="4248" t="8650" r="4642" b="8808">such</wd>

<space/>

<wd l="4781" t="8650" r="5472" b="8808">services</wd>

<space/>

<wd l="5606" t="8698" r="5779" b="8808">as</wd>

<space/>

</ln>

<ln l="1426" t="8890" r="5789" b="9101" baseLine="9053" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="8899" r="2074" b="9058">Twitter</wd>

<space/>

<wd l="2184" t="8947" r="2366" b="9058">or</wd>

<space/>

<wd l="2472" t="8899" r="3331" b="9058">Facebook</wd>

<space/>

<wd l="3437" t="8899" r="3850" b="9058">have</wd>

<space/>

<wd l="3970" t="8947" r="4066" b="9058">a</wd>

<space/>

<wd l="4176" t="8918" r="4613" b="9101">great</wd>

<space/>

<wd l="4728" t="8899" r="5789" b="9101">data-mining</wd>

<space/>

</ln>

<ln l="1416" t="9144" r="5784" b="9355" baseLine="9302" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1416" t="9154" r="2237" b="9355">potential,</wd>

<space/>

<wd l="2318" t="9202" r="2491" b="9312">as</wd>

<space/>

<wd l="2568" t="9154" r="2942" b="9355">they</wd>

<space/>

<wd l="3019" t="9154" r="3446" b="9312">offer</wd>

<space/>

<wd l="3509" t="9154" r="4296" b="9312">real-time</wd>

<space/>

<wd l="4373" t="9154" r="4742" b="9312">data</wd>

<space/>

<wd l="4805" t="9154" r="5136" b="9312">that</wd>

<space/>

<wd l="5208" t="9202" r="5510" b="9312">can</wd>

<space/>

<wd l="5573" t="9154" r="5784" b="9312">be</wd>

<space/>

</ln>

<ln l="1421" t="9398" r="5779" b="9610" baseLine="9557" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="9408" r="1954" b="9566">useful</wd>

<space/>

<wd l="2102" t="9427" r="2270" b="9566">to</wd>

<space/>

<wd l="2424" t="9408" r="3120" b="9566">monitor</wd>

<space/>

<wd l="3259" t="9408" r="3806" b="9610">public</wd>

<space/>

<wd l="3965" t="9408" r="4632" b="9610">opinion</wd>

<space/>

<wd l="4786" t="9456" r="4997" b="9566">on</wd>

<space/>

<wd l="5141" t="9408" r="5779" b="9600">brands,</wd>

<space/>

</ln>

<ln l="1416" t="9648" r="5784" b="9859" baseLine="9811" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1416" t="9658" r="2227" b="9859">products,</wd>

<space/>

<wd l="2333" t="9677" r="2942" b="9850">events,</wd>

<space/>

<wd l="3048" t="9677" r="3341" b="9816">etc.</wd>

<space/>

<wd l="3451" t="9662" r="4306" b="9850">However,</wd>

<space/>

<wd l="4411" t="9677" r="5030" b="9816">current</wd>

<space/>

<wd l="5122" t="9658" r="5784" b="9816">Natural</wd>

<space/>

</ln>

<ln l="1421" t="9902" r="5779" b="10114" baseLine="10066" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="9917" r="2285" b="10114">Language</wd>

<space/>

<wd l="2390" t="9912" r="3346" b="10114">Processing</wd>

<space/>

<wd l="3461" t="9931" r="4142" b="10114">systems</wd>

<space/>

<wd l="4258" t="9960" r="4522" b="10070">are</wd>

<space/>

<wd l="4627" t="9912" r="5266" b="10114">usually</wd>

<space/>

<wd l="5376" t="9912" r="5779" b="10114">opti-</wd>

</ln>

<ln l="1421" t="10157" r="5808" b="10368" baseLine="10315" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="10166" r="1958" b="10325">mized</wd>

<space/>

<wd l="2059" t="10166" r="2314" b="10325">for</wd>

<space/>

<wd l="2414" t="10166" r="2870" b="10325">clean</wd>

<space/>

<wd l="2981" t="10166" r="3389" b="10358">data,</wd>

<space/>

<wd l="3494" t="10166" r="4032" b="10325">which</wd>

<space/>

<wd l="4138" t="10166" r="4272" b="10325">is</wd>

<space/>

<wd l="4378" t="10186" r="4661" b="10325">not</wd>

<space/>

<wd l="4757" t="10166" r="5026" b="10325">the</wd>

<space/>

<wd l="5126" t="10186" r="5501" b="10368">type</wd>

<space/>

<wd l="5606" t="10166" r="5808" b="10325">of</wd>

<space/>

</ln>

<ln l="1426" t="10406" r="5789" b="10618" baseLine="10565" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="10416" r="1790" b="10574">data</wd>

<space/>

<wd l="1848" t="10416" r="2362" b="10574">found</wd>

<space/>

<wd l="2419" t="10416" r="2582" b="10570">in</wd>

<space/>

<wd l="2650" t="10416" r="3154" b="10574">social</wd>

<space/>

<wd l="3211" t="10416" r="3754" b="10574">media</wd>

<space/>

<wd l="3802" t="10435" r="4272" b="10608">texts,</wd>

<space/>

<wd l="4339" t="10464" r="4512" b="10574">as</wd>

<space/>

<wd l="4574" t="10416" r="4949" b="10618">they</wd>

<space/>

<wd l="5011" t="10464" r="5275" b="10574">are</wd>

<space/>

<wd l="5338" t="10416" r="5789" b="10574">often</wd>

<space/>

</ln>

<ln l="1421" t="10661" r="5784" b="10872" baseLine="10824" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="10670" r="1944" b="10872">noisy,</wd>

<space/>

<wd l="2050" t="10670" r="2976" b="10872">containing</wd>

<space/>

<wd l="3072" t="10718" r="3168" b="10829">a</wd>

<space/>

<wd l="3264" t="10670" r="3490" b="10829">lot</wd>

<space/>

<wd l="3586" t="10670" r="3787" b="10829">of</wd>

<space/>

<wd l="3869" t="10670" r="4373" b="10872">slang,</wd>

<space/>

<wd l="4474" t="10690" r="4997" b="10872">typos,</wd>

<space/>

<wd l="5102" t="10670" r="5419" b="10829">and</wd>

<space/>

<wd l="5510" t="10670" r="5784" b="10829">ab-</wd>

</ln>

<ln l="1416" t="10920" r="2443" b="11083" baseLine="11074" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1416" t="10925" r="2443" b="11083">breviations.</wd>

</ln>

</para>

<para l="1421" t="11170" r="5789" b="12346" alignment="justified" fli="216" lsp="exactly" lspExact="252" language="en">

<ln l="1642" t="11170" r="5789" b="11381" baseLine="11328" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="11179" r="2760" b="11381">Normalizing</wd>

<space/>

<wd l="2822" t="11179" r="3216" b="11338">such</wd>

<space/>

<wd l="3274" t="11198" r="3605" b="11338">text</wd>

<space/>

<wd l="3662" t="11179" r="3802" b="11338">is</wd>

<space/>

<wd l="3869" t="11179" r="4930" b="11381">challenging.</wd>

<space/>

<wd l="4997" t="11184" r="5299" b="11338">We</wd>

<space/>

<wd l="5357" t="11198" r="5789" b="11338">want</wd>

<space/>

</ln>

<ln l="1421" t="11419" r="5779" b="11630" baseLine="11578" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="11448" r="1584" b="11587">to</wd>

<space/>

<wd l="1690" t="11429" r="2352" b="11587">achieve</wd>

<space/>

<wd l="2443" t="11429" r="2837" b="11630">high</wd>

<space/>

<wd l="2928" t="11429" r="3466" b="11621">recall,</wd>

<space/>

<wd l="3562" t="11429" r="4214" b="11630">making</wd>

<space/>

<wd l="4310" t="11477" r="4483" b="11587">as</wd>

<space/>

<wd l="4584" t="11477" r="5069" b="11630">many</wd>

<space/>

<wd l="5165" t="11477" r="5779" b="11587">correc-</wd>

</ln>

<ln l="1421" t="11674" r="5779" b="11885" baseLine="11832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="11683" r="1843" b="11842">tions</wd>

<space/>

<wd l="1920" t="11731" r="2093" b="11842">as</wd>

<space/>

<wd l="2155" t="11683" r="2933" b="11885">possible,</wd>

<space/>

<wd l="3000" t="11683" r="3283" b="11842">but</wd>

<space/>

<wd l="3350" t="11702" r="3629" b="11842">not</wd>

<space/>

<wd l="3701" t="11702" r="3854" b="11842">at</wd>

<space/>

<wd l="3917" t="11683" r="4186" b="11842">the</wd>

<space/>

<wd l="4258" t="11731" r="4958" b="11885">expense</wd>

<space/>

<wd l="5030" t="11683" r="5232" b="11842">of</wd>

<space/>

<wd l="5270" t="11683" r="5779" b="11885">preci-</wd>

</ln>

<ln l="1430" t="11928" r="5774" b="12139" baseLine="12086" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1430" t="11938" r="1790" b="12096">sion</wd>

<space/>

<wd l="1872" t="12034" r="1992" b="12043">–</wd>

<space/>

<wd l="2074" t="11938" r="2606" b="12096">words</wd>

<space/>

<wd l="2712" t="11938" r="3293" b="12096">should</wd>

<space/>

<wd l="3379" t="11957" r="3662" b="12096">not</wd>

<space/>

<wd l="3744" t="11938" r="3955" b="12096">be</wd>

<space/>

<wd l="4051" t="11938" r="5002" b="12139">incorrectly</wd>

<space/>

<wd l="5088" t="11938" r="5774" b="12096">normal-</wd>

</ln>

<ln l="1426" t="12182" r="1829" b="12346" baseLine="12336" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="12187" r="1829" b="12346">ized.</wd>

</ln>

</para>

<para l="1421" t="12432" r="5789" b="14918" alignment="justified" spaceBefore="4" fli="216" lsp="exactly" lspExact="251" language="en">

<ln l="1646" t="12432" r="5789" b="12643" baseLine="12590" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="12442" r="2414" b="12600">Previous</wd>

<space/>

<wd l="2510" t="12442" r="3490" b="12643">approaches</wd>

<space/>

<wd l="3576" t="12461" r="3744" b="12600">to</wd>

<space/>

<wd l="3835" t="12442" r="4147" b="12600">this</wd>

<space/>

<wd l="4234" t="12442" r="4594" b="12600">task</wd>

<space/>

<wd l="4680" t="12442" r="5789" b="12643">incorporated</wd>

<space/>

</ln>

<ln l="1426" t="12691" r="5779" b="12888" baseLine="12845" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="12696" r="2179" b="12854">different</wd>

<space/>

<wd l="2304" t="12696" r="2726" b="12854">tools</wd>

<space/>

<wd l="2866" t="12696" r="3182" b="12854">and</wd>

<space/>

<wd l="3302" t="12696" r="4090" b="12854">methods:</wd>

<space/>

<wd l="4243" t="12696" r="5309" b="12888">dictionaries,</wd>

<space/>

<wd l="5448" t="12696" r="5779" b="12854">lan-</wd>

</ln>

<ln l="1426" t="12941" r="5779" b="13147" baseLine="13094" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="12994" r="1939" b="13147">guage</wd>

<space/>

<wd l="2040" t="12946" r="2722" b="13138">models,</wd>

<space/>

<wd l="2827" t="12946" r="3288" b="13104">finite</wd>

<space/>

<wd l="3394" t="12965" r="3787" b="13104">state</wd>

<space/>

<wd l="3878" t="12946" r="4930" b="13138">transducers,</wd>

<space/>

<wd l="5040" t="12946" r="5357" b="13104">and</wd>

<space/>

<wd l="5443" t="12994" r="5779" b="13104">ma-</wd>

</ln>

<ln l="1426" t="13190" r="5784" b="13358" baseLine="13349" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="13200" r="1896" b="13358">chine</wd>

<space/>

<wd l="1992" t="13200" r="2918" b="13358">translation</wd>

<space/>

<wd l="3019" t="13200" r="3696" b="13358">models.</wd>

<space/>

<wd l="3811" t="13200" r="4296" b="13358">Some</wd>

<space/>

<wd l="4402" t="13200" r="4603" b="13358">of</wd>

<space/>

<wd l="4675" t="13200" r="4944" b="13358">the</wd>

<space/>

<wd l="5040" t="13200" r="5784" b="13358">methods</wd>

<space/>

</ln>

<ln l="1426" t="13454" r="5779" b="13656" baseLine="13603" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="13502" r="1690" b="13613">are</wd>

<space/>

<wd l="1771" t="13454" r="2981" b="13656">unsupervised,</wd>

<space/>

<wd l="3072" t="13454" r="3682" b="13656">though</wd>

<space/>

<wd l="3768" t="13454" r="4214" b="13613">often</wd>

<space/>

<wd l="4296" t="13454" r="5102" b="13656">requiring</wd>

<space/>

<wd l="5189" t="13454" r="5779" b="13656">adjust-</wd>

</ln>

<ln l="1421" t="13709" r="5789" b="13910" baseLine="13858" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="13728" r="1858" b="13867">ment</wd>

<space/>

<wd l="1920" t="13709" r="2122" b="13867">of</wd>

<space/>

<wd l="2150" t="13728" r="3120" b="13910">parameters</wd>

<space/>

<wd l="3173" t="13709" r="3682" b="13867">based</wd>

<space/>

<wd l="3739" t="13757" r="3955" b="13867">on</wd>

<space/>

<wd l="4018" t="13709" r="4872" b="13867">annotated</wd>

<space/>

<wd l="4930" t="13709" r="5290" b="13867">data</wd>

<space/>

<wd l="5352" t="13709" r="5789" b="13910">(Han</wd>

<space/>

</ln>

<ln l="1426" t="13958" r="5789" b="14160" baseLine="14112" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="13958" r="1742" b="14117">and</wd>

<space/>

<wd l="1886" t="13958" r="2630" b="14117">Baldwin</wd>

<space/>

<wd l="2779" t="13958" r="3408" b="14160">(2011),</wd>

<space/>

<wd l="3566" t="13958" r="3869" b="14117">Liu</wd>

<space/>

<wd l="4018" t="13978" r="4171" b="14117">et</wd>

<space/>

<wd l="4325" t="13958" r="4522" b="14117">al.</wd>

<space/>

<wd l="4685" t="13958" r="5314" b="14160">(2011),</wd>

<space/>

<wd l="5472" t="13958" r="5789" b="14117">and</wd>

<space/>

</ln>

<ln l="1426" t="14213" r="5784" b="14414" baseLine="14362" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="14213" r="2040" b="14371">Gouws</wd>

<space/>

<wd l="2126" t="14232" r="2280" b="14371">et</wd>

<space/>

<wd l="2366" t="14213" r="2568" b="14371">al.</wd>

<space/>

<wd l="2659" t="14213" r="3360" b="14414">(2011)).</wd>

<space/>

<wd l="3461" t="14213" r="3950" b="14371">Some</wd>

<space/>

<wd l="4037" t="14261" r="4301" b="14371">are</wd>

<space/>

<wd l="4392" t="14213" r="5371" b="14414">supervised,</wd>

<space/>

<wd l="5462" t="14213" r="5784" b="14371">like</wd>

<space/>

</ln>

<ln l="1421" t="14467" r="5779" b="14669" baseLine="14616" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="14467" r="1752" b="14626">that</wd>

<space/>

<wd l="1829" t="14467" r="1992" b="14621">in</wd>

<space/>

<wd l="2069" t="14467" r="2875" b="14669">Chrupała</wd>

<space/>

<wd l="2947" t="14467" r="3576" b="14669">(2014),</wd>

<space/>

<wd l="3658" t="14467" r="4310" b="14669">making</wd>

<space/>

<wd l="4382" t="14515" r="4675" b="14626">use</wd>

<space/>

<wd l="4757" t="14467" r="4958" b="14626">of</wd>

<space/>

<wd l="5011" t="14515" r="5107" b="14626">a</wd>

<space/>

<wd l="5179" t="14467" r="5779" b="14626">Condi-</wd>

</ln>

<ln l="1421" t="14717" r="5779" b="14918" baseLine="14870" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="14717" r="1915" b="14875">tional</wd>

<space/>

<wd l="2030" t="14717" r="2779" b="14875">Random</wd>

<space/>

<wd l="2880" t="14717" r="3341" b="14875">Field</wd>

<space/>

<wd l="3451" t="14717" r="4238" b="14918">(Lafferty</wd>

<space/>

<wd l="4349" t="14736" r="4502" b="14875">et</wd>

<space/>

<wd l="4618" t="14717" r="4877" b="14909">al.,</wd>

<space/>

<wd l="4997" t="14717" r="5501" b="14918">2001)</wd>

<space/>

<wd l="5616" t="14736" r="5779" b="14875">to</wd>

</ln>

</para>

</column>

<column l="6110" t="2071" r="10507" b="14929">

<para l="6787" t="2122" r="9744" b="3437" alignment="centered" lsp="exactly" lspExact="274" language="en">

<ln l="7176" t="2122" r="9370" b="2338" baseLine="2285" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="7176" t="2122" r="8304" b="2290">Viachaslau</wd>

<space/>

<wd l="8376" t="2122" r="9370" b="2338">Patsepnia
</wd>

</ln>

<ln l="7872" t="2395" r="8664" b="2563" baseLine="2554" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="7872" t="2395" r="8242" b="2563">IHS</wd>

<space/>

<wd l="8318" t="2395" r="8664" b="2563">Inc.
</wd>

</ln>

<ln l="6787" t="2664" r="9744" b="2885" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="6787" t="2669" r="7003" b="2837">55</wd>

<space/>

<wd l="7085" t="2664" r="8136" b="2885">Cambridge</wd>

<space/>

<wd l="8198" t="2664" r="8784" b="2885">pkwy,</wd>

<space/>

<wd l="8870" t="2664" r="9346" b="2837">Suite</wd>

<space/>

<wd l="9422" t="2669" r="9744" b="2837">601
</wd>

</ln>

<ln l="6864" t="2942" r="9691" b="3163" baseLine="3106" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="6864" t="2942" r="7968" b="3163">Cambridge,</wd>

<space/>

<wd l="8040" t="2947" r="8429" b="3110">MA</wd>

<space/>

<wd l="8496" t="2947" r="9139" b="3154">02142,</wd>

<space/>

<wd l="9211" t="2947" r="9691" b="3115">USA
</wd>

</ln>

<ln l="7046" t="3216" r="9518" b="3437" baseLine="3384" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="7046" t="3216" r="9518" b="3437">Slava.Patsepnia@ihs.com</wd>

</ln>

</para>

<para l="6120" t="3989" r="10483" b="4406" alignment="justified" spaceBefore="496" lsp="exactly" lspExact="258" language="en">

<ln l="6130" t="3989" r="10483" b="4195" baseLine="4142" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="3994" r="6557" b="4152">learn</wd>

<space/>

<wd l="6662" t="3994" r="6926" b="4152">the</wd>

<space/>

<wd l="7037" t="4042" r="7915" b="4195">sequences</wd>

<space/>

<wd l="8021" t="3994" r="8222" b="4152">of</wd>

<space/>

<wd l="8299" t="3994" r="8626" b="4152">edit</wd>

<space/>

<wd l="8726" t="3994" r="9634" b="4195">operations</wd>

<space/>

<wd l="9739" t="3994" r="10166" b="4152">from</wd>

<space/>

<wd l="10262" t="3994" r="10483" b="4152">la-</wd>

</ln>

<ln l="6120" t="4243" r="7128" b="4406" baseLine="4402" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6120" t="4248" r="6667" b="4406">belled</wd>

<space/>

<wd l="6725" t="4248" r="7128" b="4406">data.</wd>

</ln>

</para>

<para l="6125" t="4493" r="10493" b="5208" alignment="justified" fli="288" lsp="exactly" lspExact="252" language="en">

<ln l="6355" t="4493" r="10493" b="4704" baseLine="4651" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6355" t="4507" r="6533" b="4656">In</wd>

<space/>

<wd l="6590" t="4502" r="6907" b="4661">this</wd>

<space/>

<wd l="6965" t="4550" r="7507" b="4704">paper,</wd>

<space/>

<wd l="7574" t="4550" r="7829" b="4661">we</wd>

<space/>

<wd l="7882" t="4522" r="8525" b="4704">present</wd>

<space/>

<wd l="8587" t="4550" r="8784" b="4661">an</wd>

<space/>

<wd l="8851" t="4502" r="9653" b="4704">approach</wd>

<space/>

<wd l="9706" t="4502" r="10214" b="4661">based</wd>

<space/>

<wd l="10277" t="4550" r="10493" b="4661">on</wd>

<space/>

</ln>

<ln l="6125" t="4747" r="10483" b="4958" baseLine="4906" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="4757" r="6389" b="4915">the</wd>

<space/>

<wd l="6485" t="4805" r="6979" b="4958">usage</wd>

<space/>

<wd l="7075" t="4757" r="7277" b="4915">of</wd>

<space/>

<wd l="7344" t="4757" r="8568" b="4915">normalization</wd>

<space/>

<wd l="8659" t="4757" r="9384" b="4915">lexicons</wd>

<space/>

<wd l="9485" t="4757" r="9802" b="4915">and</wd>

<space/>

<wd l="9893" t="4805" r="9989" b="4915">a</wd>

<space/>

<wd l="10080" t="4757" r="10483" b="4915">CRF</wd>

<space/>

</ln>

<ln l="6125" t="4997" r="9859" b="5208" baseLine="5155" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="5006" r="6667" b="5165">model</wd>

<space/>

<wd l="6734" t="5006" r="6989" b="5165">for</wd>

<space/>

<wd l="7046" t="5006" r="8006" b="5208">identifying</wd>

<space/>

<wd l="8054" t="5006" r="8827" b="5208">potential</wd>

<space/>

<wd l="8890" t="5006" r="9859" b="5165">candidates.</wd>

</ln>

</para>

<para l="6130" t="5472" r="8232" b="6058" alignment="left" ri="2232" spaceBefore="50" lsp="exactly" lspExact="423" language="en">

<ln l="6130" t="5472" r="8232" b="5688" baseLine="5630" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="5472" r="6235" b="5635">2</wd>

<space/>

<wd l="6490" t="5472" r="6994" b="5640">Task</wd>

<space/>

<wd l="7051" t="5472" r="8232" b="5688">Description</wd>

<space/>

</ln>

<ln l="6130" t="5894" r="7406" b="6058" baseLine="6053" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="5899" r="6379" b="6058">2.1</wd>

<space/>

<wd l="6701" t="5904" r="7406" b="6058">Dataset</wd>

</ln>

</para>

<para l="6125" t="6264" r="10488" b="6979" alignment="justified" spaceBefore="116" lsp="exactly" lspExact="253" language="en">

<ln l="6130" t="6264" r="10483" b="6470" baseLine="6422" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="6269" r="6466" b="6427">The</wd>

<space/>

<wd l="6566" t="6317" r="7142" b="6470">corpus</wd>

<space/>

<wd l="7234" t="6269" r="8026" b="6470">provided</wd>

<space/>

<wd l="8107" t="6269" r="8333" b="6470">by</wd>

<space/>

<wd l="8424" t="6269" r="8688" b="6427">the</wd>

<space/>

<wd l="8789" t="6269" r="9696" b="6470">organizers</wd>

<space/>

<wd l="9797" t="6269" r="10483" b="6427">consists</wd>

<space/>

</ln>

<ln l="6130" t="6514" r="10488" b="6682" baseLine="6672" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="6523" r="6331" b="6682">of</wd>

<space/>

<wd l="6370" t="6523" r="6802" b="6682">2950</wd>

<space/>

<wd l="6864" t="6523" r="7718" b="6682">annotated</wd>

<space/>

<wd l="7771" t="6542" r="8381" b="6682">tweets.</wd>

<space/>

<wd l="8448" t="6523" r="8784" b="6682">The</wd>

<space/>

<wd l="8851" t="6523" r="9854" b="6682">annotations</wd>

<space/>

<wd l="9922" t="6523" r="10488" b="6682">follow</wd>

<space/>

</ln>

<ln l="6125" t="6768" r="9562" b="6979" baseLine="6926" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="6778" r="6576" b="6936">these</wd>

<space/>

<wd l="6634" t="6778" r="7531" b="6979">guidelines</wd>

<space/>

<wd l="7598" t="6778" r="8410" b="6979">(Baldwin</wd>

<space/>

<wd l="8467" t="6797" r="8626" b="6936">et</wd>

<space/>

<wd l="8683" t="6778" r="8942" b="6970">al.,</wd>

<space/>

<wd l="9010" t="6778" r="9562" b="6979">2015):</wd>

</ln>

</para>

<para l="6408" t="7320" r="10493" b="10056" alignment="justified" li="576" spaceBefore="296" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6408" t="7320" r="10488" b="7483" baseLine="7474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6408" t="7330" r="6686" b="7474">•</wd>

<tab position="6489"/>

<wd l="6686" t="7325" r="7896" b="7483">Non-standard</wd>

<space/>

<wd l="7954" t="7325" r="8486" b="7483">words</wd>

<space/>

<wd l="8558" t="7373" r="8822" b="7483">are</wd>

<space/>

<wd l="8885" t="7325" r="9878" b="7483">normalized</wd>

<space/>

<wd l="9936" t="7344" r="10104" b="7483">to</wd>

<space/>

<wd l="10176" t="7373" r="10488" b="7483">one</wd>

<space/>

</ln>

<ln l="6696" t="7570" r="10493" b="7781" baseLine="7728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6696" t="7627" r="6878" b="7738">or</wd>

<space/>

<wd l="6941" t="7627" r="7387" b="7738">more</wd>

<space/>

<wd l="7459" t="7579" r="8294" b="7738">canonical</wd>

<space/>

<wd l="8366" t="7579" r="9038" b="7781">English</wd>

<space/>

<wd l="9101" t="7579" r="9634" b="7738">words</wd>

<space/>

<wd l="9701" t="7579" r="10210" b="7738">based</wd>

<space/>

<wd l="10277" t="7627" r="10493" b="7738">on</wd>

<space/>

</ln>

<ln l="6696" t="7819" r="10488" b="8030" baseLine="7978">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6696" t="7877" r="6792" b="7987">a</wd>

<space/>

<wd l="6850" t="7829" r="7872" b="8030">pre-defined</wd>

<space/>

<wd l="7939" t="7829" r="8630" b="7987">lexicon.</wd>

<space/>

<wd l="8707" t="7834" r="9014" b="7987">For</wd>

<space/>

<wd l="9082" t="7829" r="9845" b="8021">instance,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9926" t="7829" r="9989" b="7987">l</wd>

<space/>

<wd l="10056" t="7882" r="10157" b="7987">o</wd>

<space/>

<wd l="10234" t="7882" r="10330" b="7987">v</wd>

<space/>

<wd l="10397" t="7882" r="10488" b="7987">e</wd>

<space/>

</run>

</ln>

<ln l="6701" t="8078" r="10483" b="8285" baseLine="8232">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6701" t="8083" r="7282" b="8242">should</wd>

<space/>

<wd l="7330" t="8083" r="7541" b="8242">be</wd>

<space/>

<wd l="7598" t="8083" r="8592" b="8242">normalized</wd>

<space/>

<wd l="8640" t="8102" r="8808" b="8242">to</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8875" t="8083" r="9235" b="8242">love</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9298" t="8083" r="10483" b="8285">(many-to-one</wd>

<space/>

</run>

</ln>

<ln l="6691" t="8338" r="10483" b="8539" baseLine="8486">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6691" t="8338" r="8035" b="8539">normalization),</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8107" t="8366" r="8558" b="8496">tmrw</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8616" t="8357" r="8784" b="8496">to</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8856" t="8366" r="9720" b="8496">tomorrow</wd>

<space/>

</run>

<wd l="9787" t="8338" r="10483" b="8539" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(one-to-</wd>

</ln>

<ln l="6696" t="8587" r="10483" b="8789" baseLine="8741">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6696" t="8635" r="7008" b="8746">one</wd>

<space/>

<wd l="7147" t="8587" r="8491" b="8789">normalization),</wd>

<space/>

<wd l="8645" t="8587" r="8962" b="8746">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9096" t="8640" r="9293" b="8746">cu</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9442" t="8606" r="9605" b="8746">to</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9749" t="8640" r="10027" b="8746">see</wd>

<space/>

<wd l="10152" t="8640" r="10483" b="8789">you</wd>

<space/>

</run>

</ln>

<ln l="6696" t="8842" r="10483" b="9043" baseLine="8990" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6696" t="8842" r="7886" b="9043">(one-to-many</wd>

<space/>

<wd l="8002" t="8842" r="9341" b="9043">normalization).</wd>

<space/>

<wd l="9475" t="8842" r="10483" b="9000">Additional-</wd>

</ln>

<ln l="6696" t="9096" r="10488" b="9298" baseLine="9245">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6696" t="9096" r="6907" b="9298">ly,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6970" t="9101" r="7392" b="9250">IBM</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7440" t="9096" r="8021" b="9254">should</wd>

<space/>

<wd l="8074" t="9096" r="8285" b="9254">be</wd>

<space/>

<wd l="8352" t="9096" r="8645" b="9254">left</wd>

<space/>

<wd l="8702" t="9096" r="9624" b="9254">untouched</wd>

<space/>

<wd l="9686" t="9144" r="9859" b="9254">as</wd>

<space/>

<wd l="9931" t="9096" r="10046" b="9254">it</wd>

<space/>

<wd l="10114" t="9096" r="10253" b="9254">is</wd>

<space/>

<wd l="10320" t="9096" r="10488" b="9250">in</wd>

<space/>

</run>

</ln>

<ln l="6691" t="9350" r="10483" b="9542" baseLine="9499" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6691" t="9350" r="6955" b="9509">the</wd>

<space/>

<wd l="7037" t="9350" r="7685" b="9509">lexicon</wd>

<space/>

<wd l="7762" t="9350" r="8078" b="9509">and</wd>

<space/>

<wd l="8150" t="9350" r="8270" b="9509">it</wd>

<space/>

<wd l="8347" t="9350" r="8486" b="9509">is</wd>

<space/>

<wd l="8568" t="9350" r="8736" b="9504">in</wd>

<space/>

<wd l="8813" t="9350" r="9010" b="9509">its</wd>

<space/>

<wd l="9096" t="9350" r="9931" b="9509">canonical</wd>

<space/>

<wd l="10013" t="9350" r="10483" b="9542">form,</wd>

<space/>

</ln>

<ln l="6696" t="9600" r="10483" b="9802" baseLine="9754">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6696" t="9600" r="7013" b="9758">and</wd>

<space/>

<wd l="7066" t="9600" r="7334" b="9758">the</wd>

<space/>

<wd l="7402" t="9600" r="8146" b="9758">informal</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8218" t="9600" r="8448" b="9758">lol</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8515" t="9600" r="9096" b="9758">should</wd>

<space/>

<wd l="9144" t="9600" r="9355" b="9758">be</wd>

<space/>

<wd l="9422" t="9600" r="10262" b="9802">expanded</wd>

<space/>

<wd l="10320" t="9619" r="10483" b="9758">to</wd>

<space/>

</run>

</ln>

<ln l="6696" t="9854" r="8299" b="10056" baseLine="10003">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6696" t="9854" r="7478" b="10056">laughing</wd>

<space/>

<wd l="7531" t="9883" r="7814" b="10013">out</wd>

<space/>

</run>

<wd l="7867" t="9854" r="8299" b="10013"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">loud</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6408" t="10123" r="10493" b="11338" alignment="justified" li="576" spaceBefore="15" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6408" t="10123" r="10483" b="10325" baseLine="10272" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6408" t="10128" r="6686" b="10272">•</wd>

<tab position="6489"/>

<wd l="6686" t="10123" r="7896" b="10282">Non-standard</wd>

<space/>

<wd l="7963" t="10123" r="8496" b="10282">words</wd>

<space/>

<wd l="8573" t="10171" r="8952" b="10325">may</wd>

<space/>

<wd l="9014" t="10123" r="9230" b="10282">be</wd>

<space/>

<wd l="9307" t="10123" r="9806" b="10282">either</wd>

<space/>

<wd l="9883" t="10123" r="10483" b="10282">out-of-</wd>

</ln>

<ln l="6691" t="10378" r="10493" b="10579" baseLine="10526">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="6691" t="10378" r="7666" b="10579">vocabulary</wd>

<space/>

<wd l="7766" t="10378" r="8376" b="10579">(OOV)</wd>

<space/>

<wd l="8477" t="10378" r="9048" b="10536">tokens</wd>

<space/>

<wd l="9149" t="10378" r="9586" b="10579">(e.g.,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="9691" t="10406" r="10138" b="10536">tmrw</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="10238" t="10378" r="10493" b="10536">for</wd>

<space/>

</run>

</ln>

<ln l="6696" t="10627" r="10483" b="10829" baseLine="10776">

<wd l="6696" t="10627" r="7627" b="10829"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">tomorrow</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><space/>

<wd l="7762" t="10675" r="7944" b="10786">or</wd>

<space/>

<wd l="8069" t="10627" r="9283" b="10829">in-vocabulary</wd>

<space/>

<wd l="9413" t="10627" r="9782" b="10829">(IV)</wd>

<space/>

<wd l="9912" t="10627" r="10483" b="10786">tokens</wd>

<space/>

</run>

</ln>

<ln l="6696" t="10882" r="10493" b="11083" baseLine="11030">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="6696" t="10882" r="7128" b="11083">(e.g.,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="7262" t="10891" r="7536" b="11040">wit</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="7661" t="10882" r="7915" b="11040">for</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="8040" t="10882" r="8414" b="11040">with</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1"><wd l="8549" t="10882" r="8717" b="11035">in</wd>

<space/>

<wd l="8846" t="10882" r="9014" b="11035">“I</wd>

<space/>

<wd l="9139" t="10882" r="9475" b="11040">will</wd>

<space/>

<wd l="9614" t="10930" r="10080" b="11040">come</wd>

<space/>

<wd l="10210" t="10882" r="10493" b="11040">wit</wd>

<space/>

</run>

</ln>

<ln l="6691" t="11136" r="7234" b="11338" baseLine="11285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="11136" r="7234" b="11338">you”).</wd>

</ln>

</para>

<para l="6408" t="11400" r="10493" b="12869" alignment="justified" li="576" spaceBefore="13" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6408" t="11400" r="10483" b="11602" baseLine="11549">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6408" t="11400" r="6696" b="11549">•</wd>

<tab position="6491"/>

<wd l="6696" t="11400" r="7133" b="11602">Only</wd>

<space/>

<wd l="7248" t="11400" r="8434" b="11602">alphanumeric</wd>

<space/>

<wd l="8554" t="11400" r="9120" b="11558">tokens</wd>

<space/>

<wd l="9245" t="11400" r="9677" b="11602">(e.g.,</wd>

<space/>

</run>

<wd l="9797" t="11400" r="9955" b="11592"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10080" t="11405" r="10483" b="11558">4eva</wd>

<space/>

</run>

</ln>

<ln l="6696" t="11654" r="10483" b="11856" baseLine="11803">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6696" t="11654" r="7013" b="11813">and</wd>

<space/>

</run>

<wd l="7118" t="11654" r="7632" b="11856"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">tmrw</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7747" t="11654" r="8064" b="11813">and</wd>

<space/>

<wd l="8170" t="11654" r="9206" b="11856">apostrophes</wd>

<space/>

<wd l="9317" t="11654" r="9725" b="11813">used</wd>

<space/>

<wd l="9826" t="11654" r="9994" b="11808">in</wd>

<space/>

<wd l="10104" t="11702" r="10483" b="11813">con-</wd>

</run>

</ln>

<ln l="6691" t="11909" r="10493" b="12110" baseLine="12058">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6691" t="11909" r="7445" b="12067">tractions</wd>

<space/>

<wd l="7526" t="11909" r="7963" b="12110">(e.g.,</wd>

<space/>

</run>

<wd l="8026" t="11909" r="8779" b="12110"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">yoou&apos;ve</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8866" t="11957" r="9130" b="12067">are</wd>

<space/>

<wd l="9206" t="11909" r="10162" b="12067">considered</wd>

<space/>

<wd l="10238" t="11909" r="10493" b="12067">for</wd>

<space/>

</run>

</ln>

<ln l="6691" t="12163" r="10478" b="12365" baseLine="12312" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6691" t="12163" r="7958" b="12322">normalization.</wd>

<space/>

<wd l="8054" t="12163" r="8693" b="12322">Tokens</wd>

<space/>

<wd l="8789" t="12163" r="9614" b="12365">including</wd>

<space/>

<wd l="9701" t="12163" r="10478" b="12365">hyphens,</wd>

<space/>

</ln>

<ln l="6701" t="12418" r="10483" b="12619" baseLine="12566" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6701" t="12418" r="7214" b="12619">single</wd>

<space/>

<wd l="7315" t="12437" r="7882" b="12619">quotes</wd>

<space/>

<wd l="7982" t="12418" r="8299" b="12576">and</wd>

<space/>

<wd l="8395" t="12418" r="8842" b="12576">other</wd>

<space/>

<wd l="8933" t="12437" r="9394" b="12619">types</wd>

<space/>

<wd l="9499" t="12418" r="9696" b="12576">of</wd>

<space/>

<wd l="9773" t="12437" r="10483" b="12576">contrac-</wd>

</ln>

<ln l="6691" t="12667" r="8794" b="12869" baseLine="12816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6691" t="12667" r="7114" b="12826">tions</wd>

<space/>

<wd l="7181" t="12667" r="7766" b="12826">should</wd>

<space/>

<wd l="7810" t="12667" r="8021" b="12826">be</wd>

<space/>

<wd l="8083" t="12667" r="8794" b="12869">ignored.</wd>

</ln>

</para>

<para l="6408" t="12936" r="10488" b="13646" alignment="justified" li="576" spaceBefore="21" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6408" t="12936" r="10488" b="13138" baseLine="13085" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6408" t="12941" r="6691" b="13085">•</wd>

<tab position="6489"/>

<wd l="6691" t="12936" r="7397" b="13094">Domain</wd>

<space/>

<wd l="7493" t="12936" r="8160" b="13138">specific</wd>

<space/>

<wd l="8256" t="12936" r="8880" b="13094">entities</wd>

<space/>

<wd l="8971" t="12984" r="9235" b="13094">are</wd>

<space/>

<wd l="9326" t="12936" r="9994" b="13138">ignored</wd>

<space/>

<wd l="10080" t="12984" r="10488" b="13094">even</wd>

<space/>

</ln>

<ln l="6696" t="13190" r="10483" b="13392" baseLine="13339" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6696" t="13190" r="6845" b="13344">if</wd>

<space/>

<wd l="6950" t="13190" r="7330" b="13392">they</wd>

<space/>

<wd l="7459" t="13238" r="7723" b="13349">are</wd>

<space/>

<wd l="7858" t="13190" r="8021" b="13344">in</wd>

<space/>

<wd l="8150" t="13190" r="9298" b="13349">non-standard</wd>

<space/>

<wd l="9427" t="13190" r="9979" b="13382">forms,</wd>

<space/>

<wd l="10123" t="13238" r="10483" b="13392">e.g.,</wd>

<space/>

</ln>

<ln l="6691" t="13445" r="7699" b="13646" baseLine="13594">

<wd l="6691" t="13445" r="7133" b="13646"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">#ttyl</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7205" t="13445" r="7699" b="13646">@nyc</wd>

</run>

</ln>

</para>

<para l="6408" t="13709" r="10488" b="14880" alignment="justified" li="576" spaceBefore="9" fli="-288" lsp="exactly" lspExact="250" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6408" t="13709" r="10483" b="13910" baseLine="13858" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6408" t="13714" r="6696" b="13858">•</wd>

<tab position="6489"/>

<wd l="6696" t="13714" r="6821" b="13867">It</wd>

<space/>

<wd l="6912" t="13709" r="7046" b="13867">is</wd>

<space/>

<wd l="7133" t="13709" r="7858" b="13910">possible</wd>

<space/>

<wd l="7949" t="13709" r="8203" b="13867">for</wd>

<space/>

<wd l="8290" t="13757" r="8386" b="13867">a</wd>

<space/>

<wd l="8467" t="13728" r="8942" b="13867">tweet</wd>

<space/>

<wd l="9029" t="13728" r="9192" b="13867">to</wd>

<space/>

<wd l="9283" t="13709" r="9696" b="13867">have</wd>

<space/>

<wd l="9782" t="13757" r="9998" b="13867">no</wd>

<space/>

<wd l="10085" t="13757" r="10483" b="13867">non-</wd>

</ln>

<ln l="6701" t="13963" r="10483" b="14165" baseLine="14117" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6701" t="13963" r="7445" b="14122">standard</wd>

<space/>

<wd l="7493" t="13963" r="8064" b="14122">tokens</wd>

<space/>

<wd l="8122" t="13963" r="8410" b="14122">but</wd>

<space/>

<wd l="8477" t="13963" r="8794" b="14122">still</wd>

<space/>

<wd l="8856" t="13963" r="9480" b="14165">require</wd>

<space/>

<wd l="9538" t="13963" r="10483" b="14122">normaliza-</wd>

</ln>

<ln l="6691" t="14218" r="10488" b="14419" baseLine="14371">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6691" t="14218" r="7037" b="14376">tion</wd>

<space/>

<wd l="7094" t="14218" r="7526" b="14419">(e.g.,</wd>

<space/>

<wd l="7594" t="14218" r="7858" b="14376">the</wd>

<space/>

<wd l="7920" t="14218" r="8659" b="14419">example</wd>

<space/>

<wd l="8726" t="14218" r="8923" b="14376">of</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8962" t="14227" r="9230" b="14376">wit</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9288" t="14218" r="9931" b="14419">above),</wd>

<space/>

<wd l="9998" t="14218" r="10315" b="14376">and</wd>

<space/>

<wd l="10373" t="14218" r="10488" b="14376">it</wd>

<space/>

</run>

</ln>

<ln l="6696" t="14472" r="10483" b="14674" baseLine="14621" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6696" t="14472" r="6830" b="14630">is</wd>

<space/>

<wd l="6912" t="14472" r="7258" b="14630">also</wd>

<space/>

<wd l="7330" t="14472" r="8050" b="14674">possible</wd>

<space/>

<wd l="8126" t="14472" r="8381" b="14630">for</wd>

<space/>

<wd l="8448" t="14472" r="8717" b="14630">the</wd>

<space/>

<wd l="8789" t="14491" r="9264" b="14630">tweet</wd>

<space/>

<wd l="9336" t="14491" r="9499" b="14630">to</wd>

<space/>

<wd l="9576" t="14472" r="10195" b="14674">require</wd>

<space/>

<wd l="10267" t="14520" r="10483" b="14630">no</wd>

<space/>

</ln>

<ln l="6691" t="14722" r="9014" b="14880" baseLine="14870" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6691" t="14722" r="7915" b="14880">normalization</wd>

<space/>

<wd l="7968" t="14722" r="9014" b="14880">whatsoever.</wd>

</ln>

</para>

</column>

</section>

<section l="1416" t="14929" r="10507" b="16480">

<column l="1416" t="14929" r="10507" b="16480">

<para l="5800" t="15792" r="6143" b="15946" alignment="centered" spaceBefore="815" lsp="exactly" lspExact="249" language="en">

<ln l="5866" t="15792" r="6077" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="40">

<wd l="5866" t="15792" r="6077" b="15946">78</wd>

</ln>

</para>

<para l="2918" t="16133" r="8981" b="16469" alignment="centered" spaceBefore="139" lsp="exactly" lspExact="170" language="en">

<ln l="2918" t="16133" r="8981" b="16301" baseLine="16253" forcedEOF="true">

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2918" t="16133" r="3802" b="16296">Proceedings</wd>

<space/>

<wd l="3854" t="16133" r="4018" b="16296">of</wd>

<space/>

<wd l="4037" t="16133" r="4248" b="16262">the</wd>

<space/>

<wd l="4286" t="16138" r="4622" b="16262">ACL</wd>

<space/>

<wd l="4666" t="16133" r="5026" b="16262">2015</wd>

<space/>

<wd l="5078" t="16133" r="5779" b="16296">Workshop</wd>

<space/>

<wd l="5832" t="16176" r="6000" b="16262">on</wd>

<space/>

<wd l="6043" t="16138" r="6456" b="16296">Noisy</wd>

<space/>

<wd l="6518" t="16133" r="7627" b="16296">User-generated</wd>

<space/>

</run>

<wd l="7675" t="16138" r="7992" b="16286"><run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Text</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8045" t="16171" r="8443" b="16301">pages</wd>

<space/>

<wd l="8496" t="16133" r="8981" b="16286">78–81,</wd>

</run>

</ln>

<ln l="3029" t="16296" r="8870" b="16469" baseLine="16425" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3029" t="16301" r="3595" b="16469">Beijing,</wd>

<space/>

<wd l="3653" t="16301" r="4114" b="16454">China,</wd>

<space/>

<wd l="4166" t="16301" r="4459" b="16469">July</wd>

<space/>

<wd l="4512" t="16301" r="4723" b="16454">31,</wd>

<space/>

<wd l="4781" t="16301" r="5170" b="16430">2015.</wd>

<space/>

</run>

<wd l="5246" t="16296" r="5770" b="16469"><run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">©2015</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5822" t="16301" r="6672" b="16430">Association</wd>

<space/>

<wd l="6715" t="16301" r="6926" b="16430">for</wd>

<space/>

<wd l="6974" t="16301" r="8035" b="16469">Computational</wd>

<space/>

<wd l="8078" t="16301" r="8870" b="16469">Linguistics</wd>

</run>

</ln>

</para>

</column>

</section>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4311.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1416" marginTop="1389" marginRight="1390" marginBottom="1302" offsetX="-8" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1416" t="1389" r="10519" b="15426">

<column l="1416" t="1389" r="5813" b="15426">

<para l="1704" t="1478" r="5789" b="2189" alignment="justified" li="576" spaceBefore="48" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1704" t="1478" r="5774" b="1680" baseLine="1627" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1704" t="1483" r="1982" b="1627">•</wd>

<tab position="1785"/>

<wd l="1982" t="1483" r="2578" b="1680">Proper</wd>

<space/>

<wd l="2698" t="1526" r="3221" b="1637">nouns</wd>

<space/>

<wd l="3360" t="1478" r="3941" b="1637">should</wd>

<space/>

<wd l="4056" t="1478" r="4267" b="1637">be</wd>

<space/>

<wd l="4397" t="1478" r="4690" b="1637">left</wd>

<space/>

<wd l="4814" t="1478" r="5774" b="1670">untouched,</wd>

<space/>

</ln>

<ln l="1987" t="1733" r="5789" b="1934" baseLine="1882" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1987" t="1781" r="2400" b="1891">even</wd>

<space/>

<wd l="2501" t="1733" r="2650" b="1886">if</wd>

<space/>

<wd l="2722" t="1733" r="3106" b="1934">they</wd>

<space/>

<wd l="3202" t="1781" r="3461" b="1891">are</wd>

<space/>

<wd l="3557" t="1752" r="3840" b="1891">not</wd>

<space/>

<wd l="3936" t="1733" r="4099" b="1886">in</wd>

<space/>

<wd l="4195" t="1733" r="4459" b="1891">the</wd>

<space/>

<wd l="4560" t="1733" r="5040" b="1934">given</wd>

<space/>

<wd l="5141" t="1733" r="5789" b="1891">lexicon</wd>

<space/>

</ln>

<ln l="1987" t="1987" r="3240" b="2189" baseLine="2136">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1987" t="1987" r="2424" b="2189">(e.g.,</wd>

<space/>

</run>

<wd l="2501" t="1987" r="3240" b="2189"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Twitter</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1704" t="2256" r="5779" b="2962" alignment="justified" li="576" spaceBefore="19" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1704" t="2256" r="5779" b="2414" baseLine="2405" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1704" t="2256" r="1982" b="2405">•</wd>

<tab position="1787"/>

<wd l="1982" t="2256" r="2261" b="2410">All</wd>

<space/>

<wd l="2352" t="2256" r="3658" b="2414">normalizations</wd>

<space/>

<wd l="3758" t="2256" r="4339" b="2414">should</wd>

<space/>

<wd l="4416" t="2304" r="4709" b="2414">use</wd>

<space/>

<wd l="4795" t="2256" r="5064" b="2414">the</wd>

<space/>

<wd l="5150" t="2256" r="5779" b="2414">Ameri-</wd>

</ln>

<ln l="1987" t="2510" r="5779" b="2712" baseLine="2659">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1987" t="2558" r="2285" b="2669">can</wd>

<space/>

<wd l="2381" t="2510" r="3072" b="2712">spelling</wd>

<space/>

<wd l="3158" t="2510" r="3590" b="2712">(e.g.,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3686" t="2510" r="4402" b="2669">tokenize</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4483" t="2510" r="4997" b="2669">rather</wd>

<space/>

<wd l="5078" t="2510" r="5453" b="2669">than</wd>

<space/>

</run>

<wd l="5544" t="2539" r="5779" b="2669" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">to-</wd>

</ln>

<ln l="1982" t="2760" r="2650" b="2962" baseLine="2914">

<wd l="1982" t="2760" r="2650" b="2962"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">kenise</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1426" t="3298" r="3019" b="3456" alignment="left" spaceBefore="275" lsp="exactly" lspExact="257" language="en">

<ln l="1426" t="3298" r="3019" b="3456" baseLine="3446" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="15">

<wd l="1426" t="3298" r="1685" b="3456">2.2</wd>

<space/>

<wd l="1997" t="3298" r="3019" b="3456">Evaluation</wd>

</ln>

</para>

<para l="1421" t="3667" r="5779" b="4114" alignment="justified" spaceBefore="118" lsp="exactly" lspExact="253" language="en">

<ln l="1421" t="3667" r="5779" b="3869" baseLine="3816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="3667" r="2376" b="3826">Evaluation</wd>

<space/>

<wd l="2482" t="3715" r="2822" b="3826">was</wd>

<space/>

<wd l="2933" t="3686" r="3101" b="3826">to</wd>

<space/>

<wd l="3211" t="3667" r="3418" b="3826">be</wd>

<space/>

<wd l="3533" t="3667" r="4147" b="3826">carried</wd>

<space/>

<wd l="4253" t="3686" r="4531" b="3826">out</wd>

<space/>

<wd l="4642" t="3667" r="5506" b="3869">according</wd>

<space/>

<wd l="5611" t="3686" r="5779" b="3826">to</wd>

<space/>

</ln>

<ln l="1421" t="3922" r="4373" b="4114" baseLine="4070" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="3922" r="2290" b="4114">Precision,</wd>

<space/>

<wd l="2352" t="3922" r="2962" b="4114">Recall,</wd>

<space/>

<wd l="3029" t="3922" r="3346" b="4080">and</wd>

<space/>

<wd l="3394" t="3922" r="3605" b="4075">F1</wd>

<space/>

<wd l="3682" t="3922" r="4373" b="4080">metrics.</wd>

</ln>

</para>

<para l="1421" t="4382" r="3888" b="4598" alignment="left" spaceBefore="205" lsp="exactly" lspExact="273" language="en">

<ln l="1421" t="4382" r="3888" b="4598" baseLine="4546" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">

<wd l="1421" t="4382" r="1531" b="4550">3</wd>

<space/>

<wd l="1858" t="4382" r="3250" b="4598">Experimental</wd>

<space/>

<wd l="3322" t="4382" r="3888" b="4598">Setup</wd>

</ln>

</para>

<para l="1421" t="4810" r="5789" b="5472" alignment="justified" spaceBefore="160" lsp="exactly" lspExact="253" language="en">

<ln l="1421" t="4810" r="5789" b="5011" baseLine="4958" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="4810" r="1872" b="5002">First,</wd>

<space/>

<wd l="2035" t="4858" r="2131" b="4968">a</wd>

<space/>

<wd l="2275" t="4810" r="3499" b="4968">normalization</wd>

<space/>

<wd l="3648" t="4810" r="4291" b="4968">lexicon</wd>

<space/>

<wd l="4445" t="4858" r="4776" b="4968">was</wd>

<space/>

<wd l="4939" t="4810" r="5789" b="5011">generated</wd>

<space/>

</ln>

<ln l="1426" t="5064" r="5784" b="5266" baseLine="5213" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="5064" r="1853" b="5222">from</wd>

<space/>

<wd l="1939" t="5064" r="2208" b="5222">the</wd>

<space/>

<wd l="2309" t="5064" r="2789" b="5266">given</wd>

<space/>

<wd l="2885" t="5064" r="3571" b="5266">training</wd>

<space/>

<wd l="3667" t="5064" r="4080" b="5256">data,</wd>

<space/>

<wd l="4186" t="5064" r="4944" b="5222">enriched</wd>

<space/>

<wd l="5035" t="5064" r="5424" b="5222">with</wd>

<space/>

<wd l="5515" t="5064" r="5784" b="5222">the</wd>

<space/>

</ln>

<ln l="1426" t="5314" r="3706" b="5472" baseLine="5467" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="5314" r="1790" b="5472">data</wd>

<space/>

<wd l="1848" t="5314" r="2270" b="5472">from</wd>

<space/>

<wd l="2333" t="5314" r="2942" b="5472">several</wd>

<space/>

<wd l="3014" t="5362" r="3706" b="5472">sources:</wd>

</ln>

</para>

<para l="1704" t="5582" r="5779" b="6293" alignment="justified" li="576" spaceBefore="14" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1704" t="5582" r="5779" b="5784" baseLine="5731" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1704" t="5587" r="1982" b="5731">•</wd>

<tab position="1785"/>

<wd l="1982" t="5582" r="2491" b="5741">Word</wd>

<space/>

<wd l="2616" t="5582" r="3048" b="5784">pairs</wd>

<space/>

<wd l="3187" t="5582" r="3998" b="5741">extracted</wd>

<space/>

<wd l="4128" t="5582" r="4550" b="5741">from</wd>

<space/>

<wd l="4680" t="5582" r="4949" b="5741">the</wd>

<space/>

<wd l="5093" t="5582" r="5779" b="5741">datasets</wd>

<space/>

</ln>

<ln l="1982" t="5837" r="5770" b="6038" baseLine="5986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1982" t="5837" r="2395" b="5995">used</wd>

<space/>

<wd l="2462" t="5837" r="2717" b="5995">for</wd>

<space/>

<wd l="2784" t="5837" r="3365" b="5995">lexical</wd>

<space/>

<wd l="3437" t="5837" r="4656" b="5995">normalization</wd>

<space/>

<wd l="4728" t="5837" r="5208" b="6038">(Han,</wd>

<space/>

<wd l="5290" t="5837" r="5770" b="6029">2011;</wd>

<space/>

</ln>

<ln l="1982" t="6091" r="2909" b="6293" baseLine="6240" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1982" t="6091" r="2338" b="6283">Liu,</wd>

<space/>

<wd l="2405" t="6091" r="2909" b="6293">2011)</wd>

</ln>

</para>

<para l="1704" t="6355" r="5789" b="8333" alignment="justified" li="576" spaceBefore="16" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1704" t="6355" r="5784" b="6514" baseLine="6504" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1704" t="6360" r="1987" b="6504">•</wd>

<tab position="1785"/>

<wd l="1987" t="6355" r="2328" b="6514">The</wd>

<space/>

<wd l="2434" t="6355" r="2971" b="6514">online</wd>

<space/>

<wd l="3082" t="6355" r="3586" b="6514">social</wd>

<space/>

<wd l="3686" t="6355" r="4224" b="6514">media</wd>

<space/>

<wd l="4325" t="6355" r="5419" b="6514">abbreviation</wd>

<space/>

<wd l="5520" t="6355" r="5784" b="6514">list</wd>

<space/>

</ln>

<ln l="1987" t="6566" r="5779" b="6811" baseLine="6755">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1987" t="6610" r="2189" b="6768">of</wd>

<space/>

<wd l="2232" t="6610" r="2635" b="6768">Beal</wd>

<space/>

</run>

<wd l="2707" t="6566" r="3398" b="6811"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">(2015)</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">1</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="3480" t="6610" r="4397" b="6811">Compared</wd>

<space/>

<wd l="4459" t="6629" r="4622" b="6768">to</wd>

<space/>

<wd l="4694" t="6610" r="4963" b="6768">the</wd>

<space/>

<wd l="5026" t="6610" r="5779" b="6811">previous</wd>

<space/>

</run>

</ln>

<ln l="1982" t="6864" r="5779" b="7066" baseLine="7013" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1982" t="6864" r="2933" b="7066">workshops</wd>

<space/>

<wd l="3125" t="6864" r="3514" b="7022">with</wd>

<space/>

<wd l="3701" t="6883" r="4646" b="7022">one-to-one</wd>

<space/>

<wd l="4834" t="6864" r="5779" b="7022">normaliza-</wd>

</ln>

<ln l="1982" t="7118" r="5779" b="7310" baseLine="7267" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1982" t="7118" r="2462" b="7310">tions,</wd>

<space/>

<wd l="2554" t="7118" r="2818" b="7277">the</wd>

<space/>

<wd l="2909" t="7138" r="3528" b="7277">current</wd>

<space/>

<wd l="3610" t="7118" r="3970" b="7277">task</wd>

<space/>

<wd l="4046" t="7118" r="4392" b="7277">also</wd>

<space/>

<wd l="4483" t="7118" r="5309" b="7277">considers</wd>

<space/>

<wd l="5400" t="7166" r="5779" b="7277">one-</wd>

</ln>

<ln l="1982" t="7373" r="5789" b="7574" baseLine="7522" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1982" t="7392" r="2722" b="7574">to-many</wd>

<space/>

<wd l="2779" t="7373" r="4138" b="7565">normalizations,</wd>

<space/>

<wd l="4205" t="7373" r="4522" b="7531">and</wd>

<space/>

<wd l="4584" t="7373" r="5443" b="7574">obviously</wd>

<space/>

<wd l="5506" t="7392" r="5789" b="7531">not</wd>

<space/>

</ln>

<ln l="1987" t="7622" r="5784" b="7824" baseLine="7771" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1987" t="7622" r="2203" b="7781">all</wd>

<space/>

<wd l="2270" t="7622" r="3446" b="7781">abbreviations</wd>

<space/>

<wd l="3518" t="7670" r="3778" b="7781">are</wd>

<space/>

<wd l="3840" t="7642" r="4478" b="7824">present</wd>

<space/>

<wd l="4546" t="7622" r="4709" b="7776">in</wd>

<space/>

<wd l="4771" t="7622" r="5040" b="7781">the</wd>

<space/>

<wd l="5102" t="7622" r="5784" b="7824">training</wd>

<space/>

</ln>

<ln l="1987" t="7877" r="5789" b="8069" baseLine="8026" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1987" t="7877" r="2400" b="8069">data,</wd>

<space/>

<wd l="2510" t="7925" r="2693" b="8035">so</wd>

<space/>

<wd l="2789" t="7877" r="3058" b="8035">the</wd>

<space/>

<wd l="3154" t="7925" r="3442" b="8035">use</wd>

<space/>

<wd l="3542" t="7877" r="3744" b="8035">of</wd>

<space/>

<wd l="3821" t="7925" r="3917" b="8035">a</wd>

<space/>

<wd l="4008" t="7877" r="4272" b="8035">list</wd>

<space/>

<wd l="4368" t="7877" r="4570" b="8035">of</wd>

<space/>

<wd l="4651" t="7877" r="5150" b="8035">social</wd>

<space/>

<wd l="5251" t="7877" r="5789" b="8035">media</wd>

<space/>

</ln>

<ln l="1987" t="8131" r="5501" b="8333" baseLine="8280" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1987" t="8131" r="3168" b="8290">abbreviations</wd>

<space/>

<wd l="3230" t="8179" r="3533" b="8290">can</wd>

<space/>

<wd l="3581" t="8131" r="3792" b="8290">be</wd>

<space/>

<wd l="3850" t="8131" r="4238" b="8290">vital</wd>

<space/>

<wd l="4296" t="8150" r="4464" b="8290">to</wd>

<space/>

<wd l="4522" t="8131" r="4790" b="8290">the</wd>

<space/>

<wd l="4858" t="8150" r="5501" b="8333">system.</wd>

</ln>

</para>

<para l="1416" t="8381" r="5789" b="10104" alignment="justified" fli="216" lsp="exactly" lspExact="253" language="en">

<ln l="1646" t="8381" r="5779" b="8582" baseLine="8530" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="8381" r="1867" b="8539">At</wd>

<space/>

<wd l="1958" t="8381" r="2227" b="8539">the</wd>

<space/>

<wd l="2323" t="8400" r="2942" b="8539">current</wd>

<space/>

<wd l="3043" t="8400" r="3480" b="8582">stage</wd>

<space/>

<wd l="3581" t="8381" r="3778" b="8539">of</wd>

<space/>

<wd l="3854" t="8381" r="4978" b="8582">development</wd>

<space/>

<wd l="5074" t="8381" r="5338" b="8539">the</wd>

<space/>

<wd l="5443" t="8429" r="5779" b="8582">sys-</wd>

</ln>

<ln l="1421" t="8635" r="5784" b="8794" baseLine="8784" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="8654" r="1752" b="8794">tem</wd>

<space/>

<wd l="1872" t="8635" r="2006" b="8794">is</wd>

<space/>

<wd l="2131" t="8635" r="2717" b="8794">unable</wd>

<space/>

<wd l="2832" t="8654" r="3000" b="8794">to</wd>

<space/>

<wd l="3130" t="8635" r="4195" b="8794">differentiate</wd>

<space/>

<wd l="4310" t="8635" r="5045" b="8794">between</wd>

<space/>

<wd l="5174" t="8635" r="5784" b="8794">several</wd>

<space/>

</ln>

<ln l="1421" t="8890" r="5779" b="9082" baseLine="9038" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="8890" r="2645" b="9048">normalization</wd>

<space/>

<wd l="2731" t="8890" r="3475" b="9082">variants;</wd>

<space/>

<wd l="3581" t="8890" r="3994" b="9082">thus,</wd>

<space/>

<wd l="4094" t="8890" r="4675" b="9048">entries</wd>

<space/>

<wd l="4766" t="8890" r="5160" b="9048">with</wd>

<space/>

<wd l="5251" t="8890" r="5779" b="9048">multi-</wd>

</ln>

<ln l="1416" t="9139" r="5784" b="9341" baseLine="9293" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1416" t="9139" r="1685" b="9341">ple</wd>

<space/>

<wd l="1762" t="9139" r="2482" b="9341">possible</wd>

<space/>

<wd l="2563" t="9139" r="3254" b="9298">variants</wd>

<space/>

<wd l="3336" t="9187" r="3758" b="9298">were</wd>

<space/>

<wd l="3835" t="9139" r="4651" b="9298">reviewed</wd>

<space/>

<wd l="4718" t="9158" r="4886" b="9298">to</wd>

<space/>

<wd l="4968" t="9139" r="5438" b="9298">make</wd>

<space/>

<wd l="5515" t="9139" r="5784" b="9298">the</wd>

<space/>

</ln>

<ln l="1421" t="9394" r="5789" b="9595" baseLine="9542" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="9413" r="1843" b="9552">most</wd>

<space/>

<wd l="1930" t="9394" r="2602" b="9552">suitable</wd>

<space/>

<wd l="2683" t="9394" r="3293" b="9552">variant</wd>

<space/>

<wd l="3370" t="9394" r="3720" b="9552">first</wd>

<space/>

<wd l="3797" t="9394" r="3965" b="9547">in</wd>

<space/>

<wd l="4037" t="9394" r="4306" b="9552">the</wd>

<space/>

<wd l="4387" t="9394" r="4651" b="9552">list</wd>

<space/>

<wd l="4728" t="9394" r="5376" b="9595">(entries</wd>

<space/>

<wd l="5458" t="9394" r="5789" b="9552">that</wd>

<space/>

</ln>

<ln l="1426" t="9648" r="5784" b="9850" baseLine="9797" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="9696" r="1690" b="9806">are</wd>

<space/>

<wd l="1752" t="9667" r="2179" b="9806">most</wd>

<space/>

<wd l="2246" t="9648" r="2976" b="9850">frequent</wd>

<space/>

<wd l="3043" t="9648" r="3206" b="9802">in</wd>

<space/>

<wd l="3278" t="9648" r="3960" b="9806">datasets</wd>

<space/>

<wd l="4037" t="9696" r="4296" b="9806">are</wd>

<space/>

<wd l="4358" t="9648" r="4939" b="9850">placed</wd>

<space/>

<wd l="5002" t="9648" r="5400" b="9840">first,</wd>

<space/>

<wd l="5472" t="9696" r="5784" b="9850">any</wd>

<space/>

</ln>

<ln l="1421" t="9902" r="4061" b="10104" baseLine="10051" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="9902" r="1723" b="10061">ties</wd>

<space/>

<wd l="1781" t="9950" r="2208" b="10061">were</wd>

<space/>

<wd l="2261" t="9902" r="3082" b="10104">manually</wd>

<space/>

<wd l="3139" t="9902" r="4061" b="10104">reviewed).</wd>

</ln>

</para>

<para l="1416" t="10152" r="5784" b="11366" alignment="justified" spaceBefore="2" fli="216" lsp="exactly" lspExact="252" language="en">

<ln l="1656" t="10152" r="5784" b="10344" baseLine="10306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="10152" r="2342" b="10344">Second,</wd>

<space/>

<wd l="2429" t="10200" r="2525" b="10310">a</wd>

<space/>

<wd l="2602" t="10152" r="3005" b="10310">CRF</wd>

<space/>

<wd l="3082" t="10152" r="3624" b="10310">model</wd>

<space/>

<wd l="3706" t="10200" r="4042" b="10310">was</wd>

<space/>

<wd l="4118" t="10152" r="4776" b="10310">trained.</wd>

<space/>

<wd l="4862" t="10152" r="5203" b="10310">The</wd>

<space/>

<wd l="5280" t="10152" r="5784" b="10310">labels</wd>

<space/>

</ln>

<ln l="1426" t="10406" r="5784" b="10608" baseLine="10555" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="10406" r="2035" b="10565">chosen</wd>

<space/>

<wd l="2093" t="10454" r="2515" b="10565">were</wd>

<space/>

<wd l="2587" t="10406" r="3197" b="10565">CAND</wd>

<space/>

<wd l="3269" t="10406" r="3586" b="10565">and</wd>

<space/>

<wd l="3638" t="10406" r="4877" b="10608">NOT_CAND,</wd>

<space/>

<wd l="4944" t="10406" r="5784" b="10608">reflecting</wd>

<space/>

</ln>

<ln l="1416" t="10661" r="5779" b="10862" baseLine="10810" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1416" t="10661" r="2189" b="10862">potential</wd>

<space/>

<wd l="2338" t="10661" r="3562" b="10819">normalization</wd>

<space/>

<wd l="3710" t="10661" r="4632" b="10819">candidates</wd>

<space/>

<wd l="4786" t="10661" r="5102" b="10819">and</wd>

<space/>

<wd l="5246" t="10661" r="5779" b="10819">words</wd>

<space/>

</ln>

<ln l="1421" t="10910" r="5784" b="11112" baseLine="11064" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="10910" r="1752" b="11069">that</wd>

<space/>

<wd l="1838" t="10910" r="2419" b="11069">should</wd>

<space/>

<wd l="2491" t="10930" r="2770" b="11069">not</wd>

<space/>

<wd l="2842" t="10910" r="3053" b="11069">be</wd>

<space/>

<wd l="3130" t="10910" r="4162" b="11102">normalized,</wd>

<space/>

<wd l="4248" t="10910" r="5357" b="11112">respectively.</wd>

<space/>

<wd l="5448" t="10910" r="5784" b="11069">The</wd>

<space/>

</ln>

<ln l="1426" t="11165" r="4013" b="11366" baseLine="11318" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="11165" r="2275" b="11366">following</wd>

<space/>

<wd l="2338" t="11165" r="3024" b="11323">features</wd>

<space/>

<wd l="3082" t="11213" r="3509" b="11323">were</wd>

<space/>

<wd l="3566" t="11165" r="4013" b="11323">used:</wd>

</ln>

</para>

<para l="1421" t="11419" r="5808" b="11827" alignment="justified" fli="216" lsp="exactly" lspExact="251" language="en">

<ln l="1651" t="11419" r="5808" b="11621" baseLine="11568">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="11424" r="2304" b="11578">Token:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2429" t="11419" r="2808" b="11578">This</wd>

<space/>

<wd l="2923" t="11419" r="3528" b="11578">feature</wd>

<space/>

<wd l="3634" t="11438" r="4522" b="11621">represents</wd>

<space/>

<wd l="4627" t="11419" r="4896" b="11578">the</wd>

<space/>

<wd l="5011" t="11419" r="5501" b="11621">string</wd>

<space/>

<wd l="5606" t="11419" r="5808" b="11578">of</wd>

<space/>

</run>

</ln>

<ln l="1421" t="11669" r="2952" b="11827" baseLine="11818" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="11669" r="1685" b="11827">the</wd>

<space/>

<wd l="1752" t="11688" r="2366" b="11827">current</wd>

<space/>

<wd l="2419" t="11669" r="2952" b="11827">token.</wd>

</ln>

</para>

<para l="1416" t="11923" r="5794" b="13138" alignment="justified" spaceBefore="2" fli="216" lsp="exactly" lspExact="253" language="en">

<ln l="1651" t="11923" r="5794" b="12082" baseLine="12077">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="11923" r="2390" b="12082">Context</wd>

<space/>

<wd l="2506" t="11928" r="3293" b="12082">Feature:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3408" t="11923" r="3749" b="12082">The</wd>

<space/>

<wd l="3850" t="11923" r="4334" b="12082">token</wd>

<space/>

<wd l="4435" t="11942" r="4603" b="12082">to</wd>

<space/>

<wd l="4709" t="11923" r="4973" b="12082">the</wd>

<space/>

<wd l="5083" t="11923" r="5371" b="12082">left</wd>

<space/>

<wd l="5477" t="11923" r="5794" b="12082">and</wd>

<space/>

</run>

</ln>

<ln l="1421" t="12178" r="5779" b="12379" baseLine="12326" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="12178" r="1685" b="12336">the</wd>

<space/>

<wd l="1747" t="12178" r="2232" b="12336">token</wd>

<space/>

<wd l="2294" t="12197" r="2458" b="12336">to</wd>

<space/>

<wd l="2525" t="12178" r="2789" b="12336">the</wd>

<space/>

<wd l="2851" t="12178" r="3264" b="12379">right</wd>

<space/>

<wd l="3326" t="12226" r="3590" b="12336">are</wd>

<space/>

<wd l="3648" t="12178" r="4056" b="12336">used</wd>

<space/>

<wd l="4114" t="12226" r="4286" b="12336">as</wd>

<space/>

<wd l="4354" t="12197" r="4680" b="12336">two</wd>

<space/>

<wd l="4742" t="12197" r="5386" b="12336">context</wd>

<space/>

<wd l="5448" t="12178" r="5779" b="12336">fea-</wd>

</ln>

<ln l="1421" t="12432" r="5784" b="12634" baseLine="12581" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="12451" r="1891" b="12590">tures.</wd>

<space/>

<wd l="2040" t="12432" r="2376" b="12590">The</wd>

<space/>

<wd l="2525" t="12432" r="3576" b="12634">surrounding</wd>

<space/>

<wd l="3710" t="12432" r="4243" b="12590">words</wd>

<space/>

<wd l="4382" t="12432" r="5016" b="12634">usually</wd>

<space/>

<wd l="5155" t="12480" r="5784" b="12634">convey</wd>

<space/>

</ln>

<ln l="1421" t="12682" r="5784" b="12883" baseLine="12830" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="12682" r="1954" b="12840">useful</wd>

<space/>

<wd l="2040" t="12682" r="3072" b="12840">information</wd>

<space/>

<wd l="3154" t="12682" r="3643" b="12840">about</wd>

<space/>

<wd l="3725" t="12730" r="3821" b="12840">a</wd>

<space/>

<wd l="3893" t="12682" r="4378" b="12840">token</wd>

<space/>

<wd l="4459" t="12682" r="4997" b="12840">which</wd>

<space/>

<wd l="5074" t="12682" r="5534" b="12883">helps</wd>

<space/>

<wd l="5621" t="12682" r="5784" b="12835">in</wd>

<space/>

</ln>

<ln l="1416" t="12936" r="4982" b="13138" baseLine="13085" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1416" t="12936" r="2314" b="13138">predicting</wd>

<space/>

<wd l="2366" t="12936" r="2635" b="13094">the</wd>

<space/>

<wd l="2698" t="12955" r="3302" b="13094">correct</wd>

<space/>

<wd l="3355" t="12955" r="3629" b="13138">tag</wd>

<space/>

<wd l="3686" t="12936" r="3941" b="13094">for</wd>

<space/>

<wd l="3994" t="12936" r="4397" b="13094">each</wd>

<space/>

<wd l="4450" t="12936" r="4982" b="13094">token.</wd>

</ln>

</para>

<para l="1421" t="13190" r="5784" b="14150" alignment="justified" spaceBefore="1" spaceAfter="717" fli="216" lsp="exactly" lspExact="253" language="en">

<ln l="1646" t="13190" r="5784" b="13392" baseLine="13339">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1646" t="13190" r="3005" b="13392">Alphanumeric</wd>

<space/>

<wd l="3120" t="13190" r="3850" b="13349">feature:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3974" t="13190" r="4358" b="13349">This</wd>

<space/>

<wd l="4474" t="13190" r="5078" b="13349">feature</wd>

<space/>

<wd l="5194" t="13190" r="5784" b="13349">checks</wd>

<space/>

</run>

</ln>

<ln l="1421" t="13440" r="5784" b="13598" baseLine="13589" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="13440" r="2131" b="13598">whether</wd>

<space/>

<wd l="2270" t="13440" r="2539" b="13598">the</wd>

<space/>

<wd l="2683" t="13440" r="3173" b="13598">token</wd>

<space/>

<wd l="3322" t="13440" r="3979" b="13598">adheres</wd>

<space/>

<wd l="4128" t="13459" r="4296" b="13598">to</wd>

<space/>

<wd l="4445" t="13440" r="4709" b="13598">the</wd>

<space/>

<wd l="4862" t="13440" r="5784" b="13598">annotation</wd>

<space/>

</ln>

<ln l="1426" t="13694" r="5779" b="13896" baseLine="13843" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="13694" r="2323" b="13896">guidelines</wd>

<space/>

<wd l="2410" t="13694" r="2726" b="13853">and</wd>

<space/>

<wd l="2798" t="13694" r="3350" b="13853">makes</wd>

<space/>

<wd l="3446" t="13742" r="3802" b="13853">sure</wd>

<space/>

<wd l="3883" t="13694" r="4210" b="13853">that</wd>

<space/>

<wd l="4291" t="13694" r="5462" b="13896">non-adhering</wd>

<space/>

<wd l="5539" t="13714" r="5779" b="13853">to-</wd>

</ln>

<ln l="1421" t="13949" r="5290" b="14150" baseLine="14098" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="13949" r="1814" b="14107">kens</wd>

<space/>

<wd l="1882" t="13997" r="2146" b="14107">are</wd>

<space/>

<wd l="2203" t="13968" r="2486" b="14107">not</wd>

<space/>

<wd l="2539" t="13949" r="3202" b="14107">marked</wd>

<space/>

<wd l="3254" t="13997" r="3432" b="14107">as</wd>

<space/>

<wd l="3490" t="13949" r="4258" b="14150">potential</wd>

<space/>

<wd l="4325" t="13949" r="5290" b="14107">candidates.</wd>

</ln>

</para>

<rulerline l="1416" t="14894" r="4301" b="14894" type="single" width="14" color="000000"/>

<para l="1426" t="15010" r="5755" b="15418" alignment="justified" ri="72" spaceBefore="114" fli="288" lsp="exactly" lspExact="211" language="en">

<ln l="1714" t="15010" r="5755" b="15216" baseLine="15166">

<wd l="1714" t="15010" r="5755" b="15216"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">1</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">http://www.webopedia.com/quick_ref/textmessageabbr</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

</ln>

<ln l="1426" t="15250" r="2352" b="15418" baseLine="15379" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1426" t="15250" r="2352" b="15418">eviations.asp</wd>

</ln>

</para>

</column>

<column l="6122" t="1389" r="10519" b="15426">

<para l="6125" t="1464" r="10488" b="2174" alignment="justified" spaceBefore="34" fli="216" lsp="exactly" lspExact="253" language="en">

<ln l="6350" t="1464" r="10483" b="1666" baseLine="1613">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6350" t="1464" r="7704" b="1622">Normalization</wd>

<space/>

<wd l="7800" t="1464" r="8760" b="1666">dictionary</wd>

<space/>

<wd l="8851" t="1464" r="9581" b="1622">feature:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9682" t="1464" r="10061" b="1622">This</wd>

<space/>

<wd l="10152" t="1464" r="10483" b="1622">fea-</wd>

</run>

</ln>

<ln l="6125" t="1718" r="10488" b="1920" baseLine="1867" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="1738" r="6466" b="1877">ture</wd>

<space/>

<wd l="6566" t="1718" r="7152" b="1877">checks</wd>

<space/>

<wd l="7248" t="1718" r="7958" b="1877">whether</wd>

<space/>

<wd l="8050" t="1718" r="8318" b="1877">the</wd>

<space/>

<wd l="8410" t="1718" r="8894" b="1877">token</wd>

<space/>

<wd l="8995" t="1718" r="9130" b="1877">is</wd>

<space/>

<wd l="9226" t="1738" r="9864" b="1920">present</wd>

<space/>

<wd l="9965" t="1718" r="10128" b="1872">in</wd>

<space/>

<wd l="10219" t="1718" r="10488" b="1877">the</wd>

<space/>

</ln>

<ln l="6130" t="1973" r="9005" b="2174" baseLine="2122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="1973" r="6984" b="2174">generated</wd>

<space/>

<wd l="7037" t="1973" r="8256" b="2131">normalization</wd>

<space/>

<wd l="8318" t="1973" r="9005" b="2131">lexicon.</wd>

</ln>

</para>

<para l="6130" t="2222" r="10488" b="3182" alignment="justified" fli="216" lsp="exactly" lspExact="252" language="en">

<ln l="6355" t="2222" r="10483" b="2381" baseLine="2376">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6355" t="2222" r="7306" b="2381">Canonical</wd>

<space/>

<wd l="7373" t="2222" r="8030" b="2381">lexicon</wd>

<space/>

</run>

<wd l="8102" t="2222" r="8813" b="2381"><run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">feature</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8957" t="2222" r="9336" b="2381">This</wd>

<space/>

<wd l="9408" t="2222" r="10013" b="2381">feature</wd>

<space/>

<wd l="10080" t="2222" r="10483" b="2381">indi-</wd>

</run>

</ln>

<ln l="6130" t="2477" r="10488" b="2678" baseLine="2626" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="2496" r="6562" b="2635">cates</wd>

<space/>

<wd l="6653" t="2477" r="7363" b="2635">whether</wd>

<space/>

<wd l="7450" t="2525" r="7632" b="2635">or</wd>

<space/>

<wd l="7714" t="2496" r="7997" b="2635">not</wd>

<space/>

<wd l="8083" t="2477" r="8347" b="2635">the</wd>

<space/>

<wd l="8434" t="2477" r="8918" b="2635">token</wd>

<space/>

<wd l="9014" t="2477" r="9149" b="2635">is</wd>

<space/>

<wd l="9240" t="2496" r="9878" b="2678">present</wd>

<space/>

<wd l="9970" t="2477" r="10133" b="2630">in</wd>

<space/>

<wd l="10219" t="2477" r="10488" b="2635">the</wd>

<space/>

</ln>

<ln l="6130" t="2731" r="10483" b="2933" baseLine="2880" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="2731" r="6965" b="2890">canonical</wd>

<space/>

<wd l="7051" t="2731" r="7694" b="2890">lexicon</wd>

<space/>

<wd l="7771" t="2731" r="8563" b="2933">provided</wd>

<space/>

<wd l="8630" t="2731" r="8856" b="2933">by</wd>

<space/>

<wd l="8933" t="2731" r="9202" b="2890">the</wd>

<space/>

<wd l="9283" t="2731" r="10147" b="2933">workshop</wd>

<space/>

<wd l="10238" t="2779" r="10483" b="2890">or-</wd>

</ln>

<ln l="6130" t="2981" r="6898" b="3182" baseLine="3134" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="2981" r="6898" b="3182">ganizers.</wd>

</ln>

</para>

<para l="6125" t="3235" r="10488" b="4195" alignment="justified" fli="216" lsp="exactly" lspExact="252" language="en">

<ln l="6350" t="3235" r="10488" b="3437" baseLine="3389">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6350" t="3240" r="6898" b="3394">Word</wd>

<space/>

<wd l="7008" t="3240" r="7594" b="3437">length</wd>

<space/>

<wd l="7714" t="3240" r="8054" b="3394">and</wd>

<space/>

<wd l="8170" t="3240" r="8904" b="3394">number</wd>

<space/>

<wd l="9019" t="3235" r="9211" b="3394">of</wd>

<space/>

</run>

<wd l="9302" t="3240" r="9970" b="3394"><run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">vowels</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="10090" t="3240" r="10488" b="3394">Two</wd>

<space/>

</run>

</ln>

<ln l="6134" t="3490" r="10483" b="3691" baseLine="3638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6134" t="3509" r="6845" b="3691">separate</wd>

<space/>

<wd l="6931" t="3490" r="7618" b="3648">features</wd>

<space/>

<wd l="7709" t="3538" r="7882" b="3648">as</wd>

<space/>

<wd l="7963" t="3490" r="8338" b="3648">well</wd>

<space/>

<wd l="8429" t="3538" r="8602" b="3648">as</wd>

<space/>

<wd l="8688" t="3490" r="9096" b="3648">their</wd>

<space/>

<wd l="9178" t="3490" r="10171" b="3682">correlation,</wd>

<space/>

<wd l="10262" t="3490" r="10483" b="3648">al-</wd>

</ln>

<ln l="6130" t="3744" r="10483" b="3946" baseLine="3893" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="3744" r="6734" b="3946">lowing</wd>

<space/>

<wd l="6864" t="3763" r="7032" b="3902">to</wd>

<space/>

<wd l="7166" t="3763" r="7430" b="3946">tag</wd>

<space/>

<wd l="7560" t="3744" r="8098" b="3902">words</wd>

<space/>

<wd l="8232" t="3744" r="8621" b="3902">with</wd>

<space/>

<wd l="8750" t="3792" r="9734" b="3902">uncommon</wd>

<space/>

<wd l="9869" t="3744" r="10483" b="3946">length-</wd>

</ln>

<ln l="6125" t="3994" r="9235" b="4195" baseLine="4142">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6125" t="3994" r="6658" b="4152">vowel</wd>

<space/>

<wd l="6720" t="3994" r="7718" b="4186">correlation,</wd>

<space/>

<wd l="7786" t="3994" r="8107" b="4152">like</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8170" t="3994" r="8491" b="4176">bcz,</wd>

<space/>

<wd l="8539" t="3994" r="8861" b="4195">pls,</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8942" t="4013" r="9235" b="4152">etc.</wd>

</run>

</ln>

</para>

<para l="6125" t="4248" r="10488" b="4910" alignment="justified" fli="216" lsp="exactly" lspExact="253" language="en">

<ln l="6350" t="4248" r="10483" b="4406" baseLine="4397">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6350" t="4248" r="6754" b="4406">Edit</wd>

<space/>

<wd l="6854" t="4248" r="7613" b="4406">distance</wd>

<space/>

<wd l="7714" t="4248" r="8438" b="4406">feature:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8549" t="4248" r="9077" b="4406">marks</wd>

<space/>

<wd l="9173" t="4296" r="9269" b="4406">a</wd>

<space/>

<wd l="9355" t="4248" r="9840" b="4406">token</wd>

<space/>

<wd l="9926" t="4248" r="10258" b="4406">that</wd>

<space/>

<wd l="10349" t="4248" r="10483" b="4406">is</wd>

<space/>

</run>

</ln>

<ln l="6125" t="4502" r="10488" b="4704" baseLine="4651" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="4502" r="6686" b="4661">within</wd>

<space/>

<wd l="6802" t="4550" r="6998" b="4661">an</wd>

<space/>

<wd l="7118" t="4502" r="7445" b="4661">edit</wd>

<space/>

<wd l="7560" t="4502" r="8275" b="4661">distance</wd>

<space/>

<wd l="8390" t="4502" r="8592" b="4661">of</wd>

<space/>

<wd l="8683" t="4502" r="8784" b="4656">2</wd>

<space/>

<wd l="8904" t="4550" r="9086" b="4661">or</wd>

<space/>

<wd l="9202" t="4502" r="9518" b="4661">less</wd>

<space/>

<wd l="9638" t="4502" r="10066" b="4661">from</wd>

<space/>

<wd l="10176" t="4550" r="10488" b="4704">any</wd>

<space/>

</ln>

<ln l="6125" t="4752" r="8770" b="4910" baseLine="4901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="4752" r="6581" b="4910">word</wd>

<space/>

<wd l="6638" t="4752" r="6802" b="4906">in</wd>

<space/>

<wd l="6859" t="4752" r="7123" b="4910">the</wd>

<space/>

<wd l="7186" t="4752" r="8021" b="4910">canonical</wd>

<space/>

<wd l="8083" t="4752" r="8770" b="4910">lexicon.</wd>

</ln>

</para>

<para l="6355" t="5006" r="8894" b="5198" alignment="justified" li="216" spaceBefore="1" lsp="exactly" lspExact="253" language="en">

<ln l="6355" t="5006" r="8894" b="5198" baseLine="5155" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6355" t="5006" r="6893" b="5198">Third,</wd>

<space/>

<wd l="6950" t="5006" r="7219" b="5165">the</wd>

<space/>

<wd l="7277" t="5026" r="7608" b="5165">text</wd>

<space/>

<wd l="7666" t="5006" r="7800" b="5165">is</wd>

<space/>

<wd l="7862" t="5006" r="8894" b="5165">normalized:</wd>

</ln>

</para>

<para l="6408" t="5275" r="10493" b="5938" alignment="justified" li="504" spaceBefore="14" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6408" t="5275" r="10483" b="5477" baseLine="5424" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6408" t="5275" r="6691" b="5424">•</wd>

<tab position="6491"/>

<wd l="6691" t="5275" r="6970" b="5429">All</wd>

<space/>

<wd l="7066" t="5275" r="7637" b="5434">tokens</wd>

<space/>

<wd l="7738" t="5275" r="8323" b="5477">tagged</wd>

<space/>

<wd l="8424" t="5323" r="8597" b="5434">as</wd>

<space/>

<wd l="8693" t="5275" r="9461" b="5477">potential</wd>

<space/>

<wd l="9566" t="5275" r="10483" b="5434">candidates</wd>

<space/>

</ln>

<ln l="6686" t="5530" r="10493" b="5731" baseLine="5678" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6686" t="5530" r="6912" b="5731">by</wd>

<space/>

<wd l="6984" t="5530" r="7248" b="5688">the</wd>

<space/>

<wd l="7334" t="5530" r="7738" b="5688">CRF</wd>

<space/>

<wd l="7814" t="5530" r="8357" b="5688">model</wd>

<space/>

<wd l="8443" t="5578" r="8707" b="5688">are</wd>

<space/>

<wd l="8779" t="5530" r="9773" b="5688">normalized</wd>

<space/>

<wd l="9840" t="5549" r="10008" b="5688">to</wd>

<space/>

<wd l="10085" t="5530" r="10493" b="5688">their</wd>

<space/>

</ln>

<ln l="6696" t="5779" r="8136" b="5938" baseLine="5928" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6696" t="5779" r="7339" b="5938">lexicon</wd>

<space/>

<wd l="7397" t="5779" r="8136" b="5938">variants.</wd>

</ln>

</para>

<para l="6408" t="6048" r="10493" b="7219" alignment="justified" li="504" spaceBefore="21" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6408" t="6048" r="10483" b="6250" baseLine="6202" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6408" t="6048" r="6691" b="6202">•</wd>

<tab position="6494"/>

<wd l="6691" t="6048" r="6970" b="6202">All</wd>

<space/>

<wd l="7046" t="6048" r="8232" b="6250">alphanumeric</wd>

<space/>

<wd l="8309" t="6048" r="8846" b="6206">words</wd>

<space/>

<wd l="8923" t="6096" r="9182" b="6206">are</wd>

<space/>

<wd l="9254" t="6048" r="10253" b="6206">normalized</wd>

<space/>

<wd l="10315" t="6067" r="10483" b="6206">to</wd>

<space/>

</ln>

<ln l="6691" t="6302" r="10493" b="6504" baseLine="6451" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6691" t="6302" r="6955" b="6461">the</wd>

<space/>

<wd l="7085" t="6302" r="7944" b="6461">American</wd>

<space/>

<wd l="8083" t="6302" r="8770" b="6504">spelling</wd>

<space/>

<wd l="8890" t="6302" r="9278" b="6461">with</wd>

<space/>

<wd l="9403" t="6302" r="9672" b="6461">the</wd>

<space/>

<wd l="9792" t="6302" r="10493" b="6461">VarCon</wd>

<space/>

</ln>

<ln l="6691" t="6514" r="10488" b="6758" baseLine="6703">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6691" t="6557" r="7027" b="6715">tool</wd>

<space/>

<wd l="7133" t="6557" r="8059" b="6758">(Atkinson,</wd>

<space/>

</run>

<wd l="8165" t="6514" r="8798" b="6758"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015)</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8909" t="6557" r="9293" b="6715">This</wd>

<space/>

<wd l="9398" t="6557" r="10118" b="6715">includes</wd>

<space/>

<wd l="10219" t="6557" r="10488" b="6715">the</wd>

<space/>

</run>

</ln>

<ln l="6691" t="6811" r="10493" b="7013" baseLine="6960" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6691" t="6811" r="7258" b="6970">tokens</wd>

<space/>

<wd l="7325" t="6811" r="7862" b="6970">which</wd>

<space/>

<wd l="7930" t="6859" r="8189" b="6970">are</wd>

<space/>

<wd l="8261" t="6811" r="8904" b="7013">already</wd>

<space/>

<wd l="8962" t="6811" r="9955" b="6970">normalized</wd>

<space/>

<wd l="10013" t="6811" r="10493" b="7013">using</wd>

<space/>

</ln>

<ln l="6691" t="7061" r="7709" b="7219" baseLine="7214" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6691" t="7061" r="6955" b="7219">the</wd>

<space/>

<wd l="7018" t="7061" r="7709" b="7219">lexicon.</wd>

</ln>

</para>

<para l="6408" t="7330" r="10512" b="14870" alignment="justified" li="504" spaceBefore="14" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6408" t="7330" r="10478" b="7531" baseLine="7478" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6408" t="7334" r="6691" b="7478">•</wd>

<tab position="6489"/>

<wd l="6691" t="7334" r="6994" b="7488">We</wd>

<space/>

<wd l="7061" t="7330" r="7474" b="7488">have</wd>

<space/>

<wd l="7546" t="7330" r="7891" b="7488">also</wd>

<space/>

<wd l="7958" t="7330" r="8366" b="7488">tried</wd>

<space/>

<wd l="8429" t="7349" r="8592" b="7488">to</wd>

<space/>

<wd l="8669" t="7330" r="9389" b="7531">improve</wd>

<space/>

<wd l="9456" t="7330" r="9725" b="7488">the</wd>

<space/>

<wd l="9792" t="7330" r="10478" b="7488">normal-</wd>

</ln>

<ln l="6696" t="7584" r="10478" b="7786" baseLine="7733" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="7584" r="7291" b="7742">ization</wd>

<space/>

<wd l="7411" t="7584" r="7982" b="7742">results</wd>

<space/>

<wd l="8098" t="7584" r="8323" b="7786">by</wd>

<space/>

<wd l="8443" t="7584" r="8918" b="7786">using</wd>

<space/>

<wd l="9043" t="7632" r="9139" b="7742">a</wd>

<space/>

<wd l="9259" t="7584" r="10478" b="7786">did-you-mean</wd>

<space/>

</ln>

<ln l="6696" t="7838" r="10483" b="8040" baseLine="7987" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="7838" r="7344" b="8040">(DYM)</wd>

<space/>

<wd l="7426" t="7838" r="8078" b="7997">module</wd>

<space/>

<wd l="8155" t="7838" r="8486" b="7997">that</wd>

<space/>

<wd l="8563" t="7838" r="8702" b="7997">is</wd>

<space/>

<wd l="8784" t="7838" r="9571" b="8040">currently</wd>

<space/>

<wd l="9638" t="7838" r="10138" b="8040">being</wd>

<space/>

<wd l="10210" t="7838" r="10483" b="7997">de-</wd>

</ln>

<ln l="6691" t="8088" r="10488" b="8290" baseLine="8237" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="8088" r="7392" b="8290">veloped</wd>

<space/>

<wd l="7522" t="8107" r="7675" b="8246">at</wd>

<space/>

<wd l="7810" t="8088" r="8150" b="8246">IHS</wd>

<space/>

<wd l="8285" t="8088" r="8755" b="8246">R&amp;D</wd>

<space/>

<wd l="8890" t="8107" r="9360" b="8246">team.</wd>

<space/>

<wd l="9509" t="8088" r="9845" b="8246">The</wd>

<space/>

<wd l="9979" t="8093" r="10488" b="8242">DYM</wd>

<space/>

</ln>

<ln l="6691" t="8342" r="10483" b="8544" baseLine="8491" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="8342" r="7344" b="8501">module</wd>

<space/>

<wd l="7536" t="8362" r="8222" b="8501">corrects</wd>

<space/>

<wd l="8405" t="8390" r="8774" b="8501">user</wd>

<space/>

<wd l="8957" t="8342" r="10483" b="8544">queries/sentences</wd>

<space/>

</ln>

<ln l="6691" t="8597" r="10493" b="8798" baseLine="8746" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="8597" r="7080" b="8755">with</wd>

<space/>

<wd l="7186" t="8597" r="8280" b="8798">misspellings</wd>

<space/>

<wd l="8386" t="8597" r="8611" b="8798">by</wd>

<space/>

<wd l="8707" t="8597" r="9571" b="8798">providing</wd>

<space/>

<wd l="9677" t="8597" r="10493" b="8755">corrected</wd>

<space/>

</ln>

<ln l="6691" t="8846" r="10483" b="9048" baseLine="9000" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="8846" r="7526" b="9048">variant(s)</wd>

<space/>

<wd l="7627" t="8846" r="8016" b="9005">with</wd>

<space/>

<wd l="8112" t="8894" r="8208" b="9005">a</wd>

<space/>

<wd l="8299" t="8846" r="9254" b="9005">confidence</wd>

<space/>

<wd l="9350" t="8894" r="10080" b="9005">measure</wd>

<space/>

<wd l="10176" t="8846" r="10483" b="9048">(in-</wd>

</ln>

<ln l="6696" t="9101" r="10483" b="9302" baseLine="9254" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="9101" r="7349" b="9302">cluding</wd>

<space/>

<wd l="7416" t="9149" r="7632" b="9259">no</wd>

<space/>

<wd l="7709" t="9101" r="8597" b="9259">correction</wd>

<space/>

<wd l="8664" t="9101" r="9274" b="9259">variant</wd>

<space/>

<wd l="9341" t="9101" r="9730" b="9259">with</wd>

<space/>

<wd l="9802" t="9101" r="10066" b="9259">the</wd>

<space/>

<wd l="10142" t="9149" r="10483" b="9259">cor-</wd>

</ln>

<ln l="6691" t="9355" r="10488" b="9557" baseLine="9504" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="9355" r="7670" b="9557">responding</wd>

<space/>

<wd l="7891" t="9355" r="8846" b="9514">confidence</wd>

<space/>

<wd l="9067" t="9355" r="9917" b="9557">measure).</wd>

<space/>

<wd l="10152" t="9355" r="10488" b="9514">The</wd>

<space/>

</ln>

<ln l="6691" t="9610" r="10488" b="9768" baseLine="9758" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="9614" r="7200" b="9763">DYM</wd>

<space/>

<wd l="7262" t="9610" r="7920" b="9768">module</wd>

<space/>

<wd l="7987" t="9610" r="8126" b="9768">is</wd>

<space/>

<wd l="8194" t="9658" r="8390" b="9768">an</wd>

<space/>

<wd l="8467" t="9610" r="8928" b="9768">SVM</wd>

<space/>

<wd l="8990" t="9610" r="9533" b="9768">model</wd>

<space/>

<wd l="9600" t="9610" r="10214" b="9768">trained</wd>

<space/>

<wd l="10277" t="9658" r="10488" b="9768">on</wd>

<space/>

</ln>

<ln l="6696" t="9859" r="10483" b="10061" baseLine="10013" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="9907" r="6792" b="10018">a</wd>

<space/>

<wd l="6888" t="9878" r="7123" b="10018">set</wd>

<space/>

<wd l="7224" t="9859" r="7421" b="10018">of</wd>

<space/>

<wd l="7498" t="9859" r="8184" b="10018">features</wd>

<space/>

<wd l="8285" t="9859" r="8539" b="10018">for</wd>

<space/>

<wd l="8630" t="9859" r="9029" b="10018">each</wd>

<space/>

<wd l="9125" t="9859" r="9326" b="10018">of</wd>

<space/>

<wd l="9394" t="9859" r="9662" b="10018">the</wd>

<space/>

<wd l="9754" t="9859" r="10483" b="10061">multiple</wd>

<space/>

</ln>

<ln l="6696" t="10114" r="10483" b="10315" baseLine="10262" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="10114" r="7613" b="10272">candidates</wd>

<space/>

<wd l="7766" t="10114" r="8621" b="10315">generated</wd>

<space/>

<wd l="8765" t="10114" r="9019" b="10272">for</wd>

<space/>

<wd l="9158" t="10162" r="9355" b="10272">an</wd>

<space/>

<wd l="9509" t="10114" r="9960" b="10315">input</wd>

<space/>

<wd l="10104" t="10162" r="10483" b="10315">que-</wd>

</ln>

<ln l="6691" t="10368" r="10483" b="10570" baseLine="10517" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="10368" r="7733" b="10570">ry/sentence.</wd>

<space/>

<wd l="7862" t="10373" r="8165" b="10526">We</wd>

<space/>

<wd l="8280" t="10368" r="8688" b="10526">used</wd>

<space/>

<wd l="8798" t="10368" r="9062" b="10526">the</wd>

<space/>

<wd l="9182" t="10368" r="10037" b="10570">following</wd>

<space/>

<wd l="10152" t="10368" r="10483" b="10526">fea-</wd>

</ln>

<ln l="6691" t="10618" r="10483" b="10810" baseLine="10766" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="10637" r="7162" b="10776">tures:</wd>

<space/>

<wd l="7267" t="10666" r="7694" b="10776">error</wd>

<space/>

<wd l="7771" t="10618" r="8314" b="10776">model</wd>

<space/>

<wd l="8410" t="10666" r="8914" b="10810">score,</wd>

<space/>

<wd l="9005" t="10618" r="10075" b="10776">Levenshtein</wd>

<space/>

<wd l="10166" t="10618" r="10483" b="10776">dis-</wd>

</ln>

<ln l="6691" t="10872" r="10512" b="11074" baseLine="11026" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="10891" r="7200" b="11064">tance,</wd>

<space/>

<wd l="7310" t="10872" r="8093" b="11074">language</wd>

<space/>

<wd l="8189" t="10872" r="8731" b="11030">model</wd>

<space/>

<wd l="8842" t="10920" r="9346" b="11064">score,</wd>

<space/>

<wd l="9446" t="10872" r="9715" b="11030">the</wd>

<space/>

<wd l="9811" t="10872" r="10210" b="11030">ratio</wd>

<space/>

<wd l="10310" t="10872" r="10512" b="11030">of</wd>

<space/>

</ln>

<ln l="6696" t="11126" r="10483" b="11328" baseLine="11275" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="11174" r="7459" b="11285">common</wd>

<space/>

<wd l="7526" t="11174" r="7968" b="11285">noun</wd>

<space/>

<wd l="8040" t="11126" r="9014" b="11328">vocabulary</wd>

<space/>

<wd l="9086" t="11126" r="9672" b="11318">words,</wd>

<space/>

<wd l="9749" t="11126" r="10013" b="11285">the</wd>

<space/>

<wd l="10085" t="11126" r="10483" b="11285">ratio</wd>

<space/>

</ln>

<ln l="6696" t="11376" r="10488" b="11578" baseLine="11525" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="11376" r="6898" b="11534">of</wd>

<space/>

<wd l="6946" t="11424" r="7526" b="11578">proper</wd>

<space/>

<wd l="7598" t="11424" r="8040" b="11534">noun</wd>

<space/>

<wd l="8112" t="11376" r="9086" b="11578">vocabulary</wd>

<space/>

<wd l="9163" t="11376" r="9749" b="11568">words,</wd>

<space/>

<wd l="9835" t="11376" r="10152" b="11534">and</wd>

<space/>

<wd l="10219" t="11376" r="10488" b="11534">the</wd>

<space/>

</ln>

<ln l="6691" t="11630" r="10488" b="11832" baseLine="11779" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="11630" r="7363" b="11789">number</wd>

<space/>

<wd l="7560" t="11630" r="7762" b="11789">of</wd>

<space/>

<wd l="7939" t="11630" r="8640" b="11832">changes</wd>

<space/>

<wd l="8846" t="11630" r="9010" b="11784">in</wd>

<space/>

<wd l="9206" t="11630" r="10488" b="11789">non-lowercase</wd>

<space/>

</ln>

<ln l="6691" t="11885" r="10493" b="12043" baseLine="12034" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="11885" r="7272" b="12043">words.</wd>

<space/>

<wd l="7349" t="11885" r="7618" b="12038">An</wd>

<space/>

<wd l="7690" t="11933" r="8117" b="12043">error</wd>

<space/>

<wd l="8179" t="11885" r="8722" b="12043">model</wd>

<space/>

<wd l="8803" t="11933" r="9254" b="12043">score</wd>

<space/>

<wd l="9326" t="11933" r="9662" b="12043">was</wd>

<space/>

<wd l="9739" t="11885" r="10493" b="12043">obtained</wd>

<space/>

</ln>

<ln l="6696" t="12139" r="10483" b="12341" baseLine="12288" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="12139" r="7123" b="12298">from</wd>

<space/>

<wd l="7243" t="12187" r="7440" b="12298">an</wd>

<space/>

<wd l="7570" t="12139" r="8933" b="12341">autocompletion</wd>

<space/>

<wd l="9053" t="12139" r="9370" b="12298">and</wd>

<space/>

<wd l="9494" t="12158" r="10483" b="12298">autocorrec-</wd>

</ln>

<ln l="6691" t="12389" r="10488" b="12590" baseLine="12538" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="12389" r="7037" b="12547">tion</wd>

<space/>

<wd l="7142" t="12389" r="7795" b="12547">module</wd>

<space/>

<wd l="7915" t="12389" r="8563" b="12590">(AAM)</wd>

<space/>

<wd l="8683" t="12389" r="8938" b="12547">for</wd>

<space/>

<wd l="9038" t="12389" r="9581" b="12547">which</wd>

<space/>

<wd l="9691" t="12437" r="9888" b="12547">an</wd>

<space/>

<wd l="10008" t="12389" r="10488" b="12547">index</wd>

<space/>

</ln>

<ln l="6691" t="12643" r="10483" b="12845" baseLine="12792" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="12691" r="7027" b="12802">was</wd>

<space/>

<wd l="7128" t="12643" r="7536" b="12802">built</wd>

<space/>

<wd l="7637" t="12643" r="8064" b="12802">from</wd>

<space/>

<wd l="8184" t="12643" r="8736" b="12802">12.4M</wd>

<space/>

<wd l="8846" t="12643" r="9787" b="12802">documents</wd>

<space/>

<wd l="9898" t="12643" r="10483" b="12845">(scien-</wd>

</ln>

<ln l="6691" t="12893" r="10483" b="13099" baseLine="13046" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="12898" r="7042" b="13056">tific</wd>

<space/>

<wd l="7133" t="12946" r="7704" b="13099">papers</wd>

<space/>

<wd l="7810" t="12994" r="7872" b="13013">-</wd>

<space/>

<wd l="7963" t="12898" r="8582" b="13090">42.1%,</wd>

<space/>

<wd l="8683" t="12898" r="9600" b="13099">Wikipedia</wd>

<space/>

<wd l="9696" t="12898" r="10320" b="13056">articles</wd>

<space/>

<wd l="10421" t="12989" r="10483" b="13013">-</wd>

<space/>

</ln>

<ln l="6691" t="13147" r="10478" b="13349" baseLine="13296" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="13147" r="7306" b="13339">23.5%,</wd>

<space/>

<wd l="7382" t="13166" r="8006" b="13349">patents</wd>

<space/>

<wd l="8088" t="13243" r="8150" b="13262">-</wd>

<space/>

<wd l="8246" t="13147" r="8842" b="13339">19.4%,</wd>

<space/>

<wd l="8933" t="13147" r="9432" b="13306">social</wd>

<space/>

<wd l="9509" t="13166" r="9922" b="13306">texts</wd>

<space/>

<wd l="10003" t="13243" r="10066" b="13262">-</wd>

<space/>

<wd l="10147" t="13147" r="10478" b="13339">8%,</wd>

<space/>

</ln>

<ln l="6696" t="13402" r="10483" b="13603" baseLine="13550" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="13402" r="7013" b="13560">and</wd>

<space/>

<wd l="7138" t="13450" r="7584" b="13560">news</wd>

<space/>

<wd l="7723" t="13498" r="7786" b="13517">-</wd>

<space/>

<wd l="7920" t="13402" r="8328" b="13603">7%).</wd>

<space/>

<wd l="8467" t="13402" r="8803" b="13560">The</wd>

<space/>

<wd l="8938" t="13402" r="9566" b="13603">2-gram</wd>

<space/>

<wd l="9696" t="13402" r="10483" b="13603">language</wd>

<space/>

</ln>

<ln l="6691" t="13656" r="10488" b="13858" baseLine="13805" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="13656" r="7234" b="13814">model</wd>

<space/>

<wd l="7296" t="13704" r="7637" b="13814">was</wd>

<space/>

<wd l="7694" t="13656" r="8102" b="13814">built</wd>

<space/>

<wd l="8165" t="13656" r="8592" b="13814">from</wd>

<space/>

<wd l="8669" t="13656" r="9139" b="13814">177K</wd>

<space/>

<wd l="9187" t="13675" r="9811" b="13858">patents</wd>

<space/>

<wd l="9878" t="13656" r="10488" b="13858">(1.36G</wd>

<space/>

</ln>

<ln l="6691" t="13910" r="10493" b="14112" baseLine="14059" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="13910" r="7224" b="14069">words</wd>

<space/>

<wd l="7286" t="13910" r="7608" b="14069">and</wd>

<space/>

<wd l="7666" t="13910" r="8126" b="14069">2.6M</wd>

<space/>

<wd l="8189" t="13910" r="9278" b="14112">vocabulary).</wd>

<space/>

<wd l="9360" t="13910" r="9835" b="14069">Since</wd>

<space/>

<wd l="9898" t="13958" r="10152" b="14069">we</wd>

<space/>

<wd l="10214" t="13910" r="10493" b="14069">did</wd>

<space/>

</ln>

<ln l="6691" t="14160" r="10483" b="14362" baseLine="14309" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6691" t="14179" r="6974" b="14318">not</wd>

<space/>

<wd l="7046" t="14160" r="7459" b="14318">have</wd>

<space/>

<wd l="7541" t="14160" r="8184" b="14362">enough</wd>

<space/>

<wd l="8261" t="14160" r="8645" b="14318">time</wd>

<space/>

<wd l="8722" t="14179" r="8890" b="14318">to</wd>

<space/>

<wd l="8971" t="14160" r="9437" b="14318">tailor</wd>

<space/>

<wd l="9504" t="14160" r="9902" b="14318">both</wd>

<space/>

<wd l="9974" t="14165" r="10483" b="14314">DYM</wd>

<space/>

</ln>

<ln l="6696" t="14414" r="10483" b="14616" baseLine="14563" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="14414" r="7013" b="14573">and</wd>

<space/>

<wd l="7138" t="14414" r="7646" b="14568">AAM</wd>

<space/>

<wd l="7776" t="14414" r="8515" b="14573">modules</wd>

<space/>

<wd l="8650" t="14414" r="8904" b="14573">for</wd>

<space/>

<wd l="9038" t="14414" r="9538" b="14573">social</wd>

<space/>

<wd l="9667" t="14434" r="9998" b="14573">text</wd>

<space/>

<wd l="10118" t="14462" r="10483" b="14616">pro-</wd>

</ln>

<ln l="6696" t="14669" r="10488" b="14870" baseLine="14818" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="6696" t="14669" r="7387" b="14870">cessing,</wd>

<space/>

<wd l="7507" t="14674" r="8016" b="14822">DYM</wd>

<space/>

<wd l="8141" t="14669" r="8458" b="14827">and</wd>

<space/>

<wd l="8573" t="14669" r="9082" b="14822">AAM</wd>

<space/>

<wd l="9202" t="14669" r="9941" b="14827">modules</wd>

<space/>

<wd l="10061" t="14717" r="10488" b="14827">were</wd>

</ln>

</para>

<para l="6408" t="15221" r="8813" b="15418" alignment="left" li="216" spaceBefore="338" lsp="exactly" lspExact="206" language="en">

<ln l="6408" t="15221" r="8813" b="15418" baseLine="15376">

<wd l="6408" t="15221" r="8813" b="15418"><run underlined="none" subsuperscript="none" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">http://wordlist.aspell.net/varcon/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<rulerline l="6120" t="15106" r="9005" b="15106" type="single" width="19" color="000000"/>

<dd l="1416" t="15736" r="10519" b="15977">

<para l="5800" t="15792" r="6143" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5866" t="15792" r="6077" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="41">

<wd l="5866" t="15792" r="6077" b="15946">79</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4311.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1282" marginTop="1417" marginRight="1392" marginBottom="1292" offsetX="52" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1282" t="1417" r="10517" b="15344">

<column l="1282" t="1417" r="5908" b="15344">

<para l="1982" t="1464" r="5789" b="2131" alignment="justified" li="648" ri="72" spaceBefore="5" lsp="exactly" lspExact="253" language="en">

<ln l="1982" t="1464" r="5784" b="1622" baseLine="1613" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1982" t="1464" r="2395" b="1622">used</wd>

<space/>

<wd l="2467" t="1464" r="2722" b="1622">for</wd>

<space/>

<wd l="2794" t="1464" r="3106" b="1622">this</wd>

<space/>

<wd l="3187" t="1464" r="3835" b="1622">Twitter</wd>

<space/>

<wd l="3907" t="1464" r="4488" b="1622">lexical</wd>

<space/>

<wd l="4565" t="1464" r="5784" b="1622">normalization</wd>

<space/>

</ln>

<ln l="1992" t="1718" r="5789" b="1920" baseLine="1867" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1992" t="1738" r="2597" b="1920">system</wd>

<space/>

<wd l="2717" t="1766" r="2890" b="1877">as</wd>

<space/>

<wd l="3014" t="1718" r="3206" b="1910">is,</wd>

<space/>

<wd l="3322" t="1718" r="3816" b="1920">being</wd>

<space/>

<wd l="3936" t="1718" r="4627" b="1920">actually</wd>

<space/>

<wd l="4742" t="1718" r="5419" b="1877">tailored</wd>

<space/>

<wd l="5534" t="1718" r="5789" b="1877">for</wd>

<space/>

</ln>

<ln l="1982" t="1973" r="4526" b="2131" baseLine="2122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1982" t="1973" r="2779" b="2131">technical</wd>

<space/>

<wd l="2842" t="1973" r="3158" b="2131">and</wd>

<space/>

<wd l="3216" t="1973" r="4008" b="2131">scientific</wd>

<space/>

<wd l="4070" t="1992" r="4526" b="2131">texts.</wd>

</ln>

</para>

<para l="1421" t="2640" r="4440" b="2842" alignment="left" li="144" ri="72" spaceBefore="411" lsp="exactly" lspExact="259" language="en">

<ln l="1421" t="2640" r="4440" b="2842" baseLine="2789" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">

<wd l="1421" t="2640" r="1675" b="2798">3.1</wd>

<space/>

<wd l="1997" t="2645" r="2678" b="2798">Results</wd>

<space/>

<wd l="2746" t="2645" r="3091" b="2798">and</wd>

<space/>

<wd l="3154" t="2688" r="3643" b="2798">error</wd>

<space/>

<wd l="3710" t="2640" r="4440" b="2842">analysis</wd>

</ln>

</para>

<para l="1426" t="3010" r="5808" b="3422" alignment="justified" li="144" ri="72" spaceBefore="115" lsp="exactly" lspExact="253" language="en">

<ln l="1426" t="3010" r="5808" b="3211" baseLine="3158" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="3010" r="2078" b="3211">Testing</wd>

<space/>

<wd l="2136" t="3058" r="2477" b="3168">was</wd>

<space/>

<wd l="2534" t="3010" r="3456" b="3211">performed</wd>

<space/>

<wd l="3518" t="3058" r="3734" b="3168">on</wd>

<space/>

<wd l="3792" t="3010" r="4056" b="3168">the</wd>

<space/>

<wd l="4114" t="3010" r="4906" b="3211">provided</wd>

<space/>

<wd l="4963" t="3058" r="5539" b="3211">corpus</wd>

<space/>

<wd l="5606" t="3010" r="5808" b="3168">of</wd>

<space/>

</ln>

<ln l="1445" t="3264" r="2520" b="3422" baseLine="3413" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="3264" r="1853" b="3422">1967</wd>

<space/>

<wd l="1915" t="3283" r="2520" b="3422">tweets.</wd>

</ln>

</para>

<para l="1426" t="3514" r="5779" b="3926" alignment="justified" li="144" ri="72" spaceBefore="3" fli="216" lsp="exactly" lspExact="253" language="en">

<ln l="1651" t="3514" r="5779" b="3715" baseLine="3667" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="3514" r="2146" b="3672">Table</wd>

<space/>

<wd l="2275" t="3514" r="2338" b="3667">1</wd>

<space/>

<wd l="2472" t="3514" r="3010" b="3672">shows</wd>

<space/>

<wd l="3110" t="3514" r="3379" b="3672">the</wd>

<space/>

<wd l="3475" t="3514" r="4584" b="3715">performance</wd>

<space/>

<wd l="4694" t="3514" r="4896" b="3672">of</wd>

<space/>

<wd l="4982" t="3562" r="5275" b="3672">our</wd>

<space/>

<wd l="5376" t="3514" r="5779" b="3672">CRF</wd>

<space/>

</ln>

<ln l="1426" t="3768" r="4920" b="3926" baseLine="3922" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="3768" r="2261" b="3926">candidate</wd>

<space/>

<wd l="2318" t="3768" r="2861" b="3926">model</wd>

<space/>

<wd l="2923" t="3768" r="3312" b="3926">with</wd>

<space/>

<wd l="3374" t="3768" r="4128" b="3926">different</wd>

<space/>

<wd l="4186" t="3768" r="4920" b="3926">features:</wd>

</ln>

</para>

<para l="1704" t="4037" r="5789" b="4493" alignment="justified" li="648" ri="72" spaceBefore="12" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1704" t="4037" r="5789" b="4238" baseLine="4186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1704" t="4037" r="1982" b="4186">•</wd>

<tab position="1787"/>

<wd l="1982" t="4037" r="2141" b="4190">A</wd>

<space/>

<wd l="2203" t="4037" r="2928" b="4195">baseline</wd>

<space/>

<wd l="3000" t="4037" r="3542" b="4195">model</wd>

<space/>

<wd l="3614" t="4037" r="4003" b="4195">with</wd>

<space/>

<wd l="4075" t="4037" r="4464" b="4238">only</wd>

<space/>

<wd l="4526" t="4037" r="5064" b="4229">token,</wd>

<space/>

<wd l="5146" t="4056" r="5789" b="4195">context</wd>

<space/>

</ln>

<ln l="1987" t="4291" r="4349" b="4493" baseLine="4440" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1987" t="4291" r="2309" b="4450">and</wd>

<space/>

<wd l="2362" t="4291" r="3547" b="4493">alphanumeric</wd>

<space/>

<wd l="3619" t="4291" r="4349" b="4450">features.</wd>

</ln>

</para>

<para l="1704" t="4560" r="5784" b="5222" alignment="justified" li="648" ri="72" spaceBefore="14" fli="-288" lsp="exactly" lspExact="253" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1704" t="4560" r="5784" b="4718" baseLine="4709" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1704" t="4560" r="1982" b="4709">•</wd>

<tab position="1787"/>

<wd l="1982" t="4560" r="2141" b="4714">A</wd>

<space/>

<wd l="2237" t="4560" r="2962" b="4718">baseline</wd>

<space/>

<wd l="3062" t="4560" r="3605" b="4718">model</wd>

<space/>

<wd l="3710" t="4560" r="4099" b="4718">with</wd>

<space/>

<wd l="4195" t="4560" r="4464" b="4718">the</wd>

<space/>

<wd l="4565" t="4560" r="5784" b="4718">normalization</wd>

<space/>

</ln>

<ln l="1987" t="4814" r="5779" b="5016" baseLine="4963" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1987" t="4814" r="2880" b="5016">dictionary</wd>

<space/>

<wd l="2981" t="4814" r="3298" b="4973">and</wd>

<space/>

<wd l="3394" t="4814" r="3658" b="4973">the</wd>

<space/>

<wd l="3763" t="4814" r="4598" b="4973">canonical</wd>

<space/>

<wd l="4704" t="4814" r="5347" b="4973">lexicon</wd>

<space/>

<wd l="5448" t="4814" r="5779" b="4973">fea-</wd>

</ln>

<ln l="1982" t="5064" r="3038" b="5222" baseLine="5213" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1982" t="5083" r="2410" b="5222">tures</wd>

<space/>

<wd l="2472" t="5064" r="3038" b="5222">added.</wd>

</ln>

</para>

<para l="1704" t="5333" r="5006" b="5491" alignment="justified" li="648" ri="72" spaceBefore="16" fli="-288" lsp="exactly" lspExact="252" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1704" t="5333" r="5006" b="5491" baseLine="5482" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1704" t="5333" r="1982" b="5482">•</wd>

<tab position="1787"/>

<wd l="1982" t="5333" r="2141" b="5486">A</wd>

<space/>

<wd l="2198" t="5333" r="2741" b="5491">model</wd>

<space/>

<wd l="2803" t="5333" r="3197" b="5491">with</wd>

<space/>

<wd l="3254" t="5333" r="3470" b="5491">all</wd>

<space/>

<wd l="3533" t="5333" r="4219" b="5491">features</wd>

<space/>

<wd l="4282" t="5333" r="5006" b="5491">enabled.</wd>

</ln>

</para>

<para l="1421" t="5587" r="5784" b="6250" alignment="justified" li="144" ri="72" spaceAfter="238" fli="216" lsp="exactly" lspExact="253" language="en">

<ln l="1709" t="5587" r="5784" b="5746" baseLine="5736" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1709" t="5587" r="2203" b="5746">Table</wd>

<space/>

<wd l="2299" t="5587" r="2400" b="5741">2</wd>

<space/>

<wd l="2491" t="5587" r="3134" b="5746">reflects</wd>

<space/>

<wd l="3230" t="5635" r="3523" b="5746">our</wd>

<space/>

<wd l="3619" t="5587" r="4478" b="5746">submitted</wd>

<space/>

<wd l="4565" t="5587" r="5784" b="5746">normalization</wd>

<space/>

</ln>

<ln l="1421" t="5842" r="5779" b="6000" baseLine="5990" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="5842" r="1910" b="6000">result</wd>

<space/>

<wd l="1987" t="5842" r="2304" b="6000">and</wd>

<space/>

<wd l="2376" t="5890" r="2472" b="6000">a</wd>

<space/>

<wd l="2539" t="5842" r="3029" b="6000">result</wd>

<space/>

<wd l="3106" t="5842" r="3778" b="6000">without</wd>

<space/>

<wd l="3845" t="5842" r="4114" b="6000">the</wd>

<space/>

<wd l="4190" t="5846" r="4699" b="5995">DYM</wd>

<space/>

<wd l="4776" t="5842" r="5429" b="6000">module</wd>

<space/>

<wd l="5510" t="5842" r="5779" b="6000">de-</wd>

</ln>

<ln l="1430" t="6091" r="2678" b="6250" baseLine="6240" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1430" t="6091" r="2059" b="6250">scribed</wd>

<space/>

<wd l="2117" t="6091" r="2678" b="6250">above.</wd>

</ln>

</para>

<table l="1282" t="6562" r="5908" b="9158" alignment="left" spaceBefore="14" spaceAfter="14">

<topBorder type="single" width="34"/>

<bottomBorder type="single" width="14"/>

<gridTable>

<gridCol>1651</gridCol>

<gridCol>1113</gridCol>

<gridCol>917</gridCol>

<gridCol>945</gridCol>

<gridRow>787</gridRow>

<gridRow>773</gridRow>

<gridRow>518</gridRow>

<gridRow>518</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<topBorder type="single" width="34"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="1282" t="6562" r="2933" b="7349" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="34"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="3058" t="6634" r="3907" b="7334" alignment="centered" lsp="exactly" lspExact="253" language="en">

<ln l="3058" t="6634" r="3907" b="6787" baseLine="6778" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3058" t="6634" r="3907" b="6787">Precision
</wd>

</ln>

<ln l="3202" t="6883" r="3758" b="7085" baseLine="7032" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3202" t="6883" r="3691" b="7085">(CRF</wd>

<space/>

<wd l="3744" t="6883" r="3758" b="7085">|
</wd>

</ln>

<ln l="3206" t="7133" r="3758" b="7334" baseLine="7286" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3206" t="7133" r="3758" b="7334">Final)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="34"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="4214" t="6629" r="4795" b="7334" alignment="centered" lsp="exactly" lspExact="253" language="en">

<ln l="4214" t="6629" r="4795" b="6787" baseLine="6778" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="4214" t="6629" r="4795" b="6787">Recall
</wd>

</ln>

<ln l="4219" t="6883" r="4776" b="7085" baseLine="7032" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="4219" t="6883" r="4704" b="7085">(CRF</wd>

<space/>

<wd l="4762" t="6883" r="4776" b="7085">|
</wd>

</ln>

<ln l="4219" t="7133" r="4771" b="7334" baseLine="7286" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="4219" t="7133" r="4771" b="7334">Final)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="34"/>

<bottomBorder type="single" width="14"/>

<para l="5141" t="6629" r="5698" b="7334" alignment="centered" lsp="exactly" lspExact="253" language="en">

<ln l="5294" t="6629" r="5534" b="6782" baseLine="6778" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="5294" t="6629" r="5534" b="6782">F1
</wd>

</ln>

<ln l="5141" t="6883" r="5698" b="7085" baseLine="7032" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="5141" t="6883" r="5626" b="7085">(CRF</wd>

<space/>

<wd l="5683" t="6883" r="5698" b="7085">|
</wd>

</ln>

<ln l="5141" t="7133" r="5693" b="7334" baseLine="7286" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="5141" t="7133" r="5693" b="7334">Final)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="top">

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="1493" t="7402" r="2746" b="8112" alignment="centered" spaceAfter="3" lsp="exactly" lspExact="253" language="en">

<ln l="1709" t="7402" r="2534" b="7560" baseLine="7550" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1709" t="7402" r="2352" b="7560">Tokens</wd>

<space/>

<wd l="2410" t="7421" r="2534" b="7541">+
</wd>

</ln>

<ln l="1690" t="7656" r="2558" b="7819" baseLine="7805" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1690" t="7656" r="2381" b="7814">Context</wd>

<space/>

<wd l="2434" t="7675" r="2558" b="7795">+
</wd>

</ln>

<ln l="1493" t="7786" r="2746" b="8112" baseLine="8059" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1493" t="7910" r="2746" b="8112">Alphanumeric</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="3197" t="7531" r="3773" b="7733" alignment="left" spaceBefore="137" lsp="exactly" lspExact="253" language="en">

<tabs position="3197"/>

<ln l="3197" t="7531" r="3773" b="7733" baseLine="7680" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3197" t="7531" r="3667" b="7690">0.991</wd>

<space/>

<wd l="3758" t="7531" r="3773" b="7733">|</wd>

</ln>

</para>

<para l="3192" t="7781" r="3792" b="7939" alignment="left" spaceBefore="1" spaceAfter="128" lsp="exactly" lspExact="253" language="en">

<tabs position="3192"/>

<ln l="3192" t="7781" r="3792" b="7939" baseLine="7934" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3192" t="7781" r="3792" b="7939">0.8782</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="4267" t="7531" r="4733" b="7733" alignment="centered" spaceBefore="137" lsp="exactly" lspExact="253" language="en">

<ln l="4267" t="7531" r="4733" b="7733" baseLine="7680" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4267" t="7531" r="4642" b="7690">0.57</wd>

<space/>

<wd l="4718" t="7531" r="4733" b="7733">|</wd>

</ln>

</para>

<para l="4210" t="7781" r="4810" b="7939" alignment="centered" spaceBefore="1" spaceAfter="128" lsp="exactly" lspExact="253" language="en">

<ln l="4210" t="7781" r="4810" b="7939" baseLine="7934" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4210" t="7781" r="4795" b="7939">0.6013</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="5078" t="7531" r="5765" b="7733" alignment="left" spaceBefore="137" lsp="exactly" lspExact="253" language="en">

<tabs position="5078"/>

<ln l="5078" t="7531" r="5765" b="7733" baseLine="7680" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5078" t="7531" r="5674" b="7690">0.7237</wd>

<space/>

<wd l="5750" t="7531" r="5765" b="7733">|</wd>

</ln>

</para>

<para l="5126" t="7781" r="5726" b="7939" alignment="left" spaceBefore="1" spaceAfter="128" lsp="exactly" lspExact="253" language="en">

<tabs position="5126"/>

<ln l="5126" t="7781" r="5726" b="7939" baseLine="7934" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="5126" t="7781" r="5726" b="7939">0.7139</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="top">

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="1459" t="8174" r="2779" b="8630" alignment="centered" spaceAfter="3" lsp="exactly" lspExact="253" language="en">

<ln l="1459" t="8174" r="2779" b="8333" baseLine="8323" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1459" t="8174" r="2050" b="8333">Added</wd>

<space/>

<wd l="2107" t="8174" r="2779" b="8333">diction-
</wd>

</ln>

<ln l="1608" t="8429" r="2635" b="8630" baseLine="8578" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1608" t="8477" r="1886" b="8630">ary</wd>

<space/>

<wd l="1944" t="8429" r="2635" b="8587">features</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="3197" t="8174" r="3773" b="8376" alignment="left" lsp="exactly" lspExact="253" language="en">

<tabs position="3197"/>

<ln l="3197" t="8174" r="3773" b="8376" baseLine="8323" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3197" t="8174" r="3682" b="8333">0.907</wd>

<space/>

<wd l="3758" t="8174" r="3773" b="8376">|</wd>

</ln>

</para>

<para l="3192" t="8429" r="3792" b="8587" alignment="left" spaceBefore="2" spaceAfter="3" lsp="exactly" lspExact="253" language="en">

<tabs position="3192"/>

<ln l="3192" t="8429" r="3792" b="8587" baseLine="8578" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3192" t="8429" r="3792" b="8587">0.8376</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="4214" t="8174" r="4790" b="8376" alignment="centered" lsp="exactly" lspExact="253" language="en">

<ln l="4214" t="8174" r="4790" b="8376" baseLine="8323" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4214" t="8174" r="4699" b="8333">0.824</wd>

<space/>

<wd l="4776" t="8174" r="4790" b="8376">|</wd>

</ln>

</para>

<para l="4210" t="8429" r="4795" b="8587" alignment="centered" spaceBefore="2" spaceAfter="3" lsp="exactly" lspExact="253" language="en">

<ln l="4210" t="8429" r="4795" b="8587" baseLine="8578" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4210" t="8429" r="4795" b="8587">0.8133</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="5078" t="8174" r="5765" b="8376" alignment="left" lsp="exactly" lspExact="253" language="en">

<tabs position="5078"/>

<ln l="5078" t="8174" r="5765" b="8376" baseLine="8323" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5078" t="8174" r="5669" b="8333">0.8635</wd>

<space/>

<wd l="5750" t="8174" r="5765" b="8376">|</wd>

</ln>

</para>

<para l="5126" t="8429" r="5717" b="8587" alignment="left" spaceBefore="2" spaceAfter="3" lsp="exactly" lspExact="253" language="en">

<tabs position="5126"/>

<ln l="5126" t="8429" r="5717" b="8587" baseLine="8578" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5126" t="8429" r="5717" b="8587">0.8253</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="1603" t="8818" r="2635" b="8976" alignment="centered" spaceBefore="132" spaceAfter="119" lsp="exactly" lspExact="253" language="en">

<ln l="1603" t="8818" r="2635" b="8976" baseLine="8966" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1603" t="8818" r="1882" b="8971">All</wd>

<space/>

<wd l="1949" t="8818" r="2635" b="8976">features</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="3197" t="8693" r="3773" b="8894" alignment="left" lsp="exactly" lspExact="253" language="en">

<tabs position="3197"/>

<ln l="3197" t="8693" r="3773" b="8894" baseLine="8842" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3197" t="8693" r="3677" b="8851">0.915</wd>

<space/>

<wd l="3758" t="8693" r="3773" b="8894">|</wd>

</ln>

</para>

<para l="3192" t="8947" r="3787" b="9106" alignment="left" spaceBefore="1" lsp="exactly" lspExact="242" language="en">

<tabs position="3192"/>

<ln l="3192" t="8947" r="3787" b="9106" baseLine="9096" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3192" t="8947" r="3787" b="9106">0.8469</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="4214" t="8693" r="4790" b="8894" alignment="centered" lsp="exactly" lspExact="253" language="en">

<ln l="4214" t="8693" r="4790" b="8894" baseLine="8842" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4214" t="8693" r="4694" b="8851">0.817</wd>

<space/>

<wd l="4776" t="8693" r="4790" b="8894">|</wd>

</ln>

</para>

<para l="4210" t="8947" r="4795" b="9106" alignment="centered" spaceBefore="1" lsp="exactly" lspExact="242" language="en">

<ln l="4210" t="8947" r="4795" b="9106" baseLine="9096" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4210" t="8947" r="4795" b="9106">0.8083</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="top">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="5078" t="8693" r="5765" b="8894" alignment="left" lsp="exactly" lspExact="253" language="en">

<tabs position="5078"/>

<ln l="5078" t="8693" r="5765" b="8894" baseLine="8842" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5078" t="8693" r="5678" b="8851">0.8632</wd>

<space/>

<wd l="5750" t="8693" r="5765" b="8894">|</wd>

</ln>

</para>

<para l="5126" t="8952" r="5722" b="9110" alignment="left" spaceBefore="3" lsp="exactly" lspExact="240" language="en">

<tabs position="5126"/>

<ln l="5126" t="8952" r="5722" b="9110" baseLine="9101" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="5126" t="8952" r="5722" b="9110">0.8272</wd>

</ln>

</para>

</cell>

</table>

<para l="1421" t="9206" r="5779" b="10171" alignment="justified" li="144" ri="72" spaceAfter="234" lsp="exactly" lspExact="253" language="en">

<ln l="1426" t="9206" r="5779" b="9365" baseLine="9355" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1426" t="9206" r="1920" b="9365">Table</wd>

<space/>

<wd l="2016" t="9206" r="2146" b="9365">1.</wd>

<space/>

<wd l="2232" t="9206" r="2789" b="9365">Result</wd>

<space/>

<wd l="2866" t="9206" r="3504" b="9365">metrics</wd>

<space/>

<wd l="3586" t="9206" r="3787" b="9365">of</wd>

<space/>

<wd l="3840" t="9206" r="4675" b="9365">candidate</wd>

<space/>

<wd l="4757" t="9206" r="5160" b="9365">CRF</wd>

<space/>

<wd l="5237" t="9206" r="5779" b="9365">model</wd>

<space/>

</ln>

<ln l="1421" t="9461" r="5779" b="9662" baseLine="9610" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1421" t="9461" r="1810" b="9619">with</wd>

<space/>

<wd l="1891" t="9461" r="2645" b="9619">different</wd>

<space/>

<wd l="2722" t="9461" r="3408" b="9619">features</wd>

<space/>

<wd l="3490" t="9461" r="3883" b="9662">(and</wd>

<space/>

<wd l="3955" t="9461" r="4157" b="9619">its</wd>

<space/>

<wd l="4238" t="9461" r="4829" b="9662">impact</wd>

<space/>

<wd l="4910" t="9509" r="5126" b="9619">on</wd>

<space/>

<wd l="5198" t="9461" r="5467" b="9619">the</wd>

<space/>

<wd l="5544" t="9509" r="5779" b="9619">re-</wd>

</ln>

<ln l="1430" t="9715" r="5779" b="9917" baseLine="9864" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1430" t="9715" r="1738" b="9874">sult</wd>

<space/>

<wd l="1848" t="9715" r="2251" b="9874">after</wd>

<space/>

<wd l="2352" t="9715" r="3571" b="9874">normalization</wd>

<space/>

<wd l="3677" t="9715" r="4152" b="9917">using</wd>

<space/>

<wd l="4262" t="9763" r="4358" b="9874">a</wd>

<space/>

<wd l="4469" t="9715" r="5333" b="9874">submitted</wd>

<space/>

<wd l="5438" t="9763" r="5779" b="9917">sys-</wd>

</ln>

<ln l="1421" t="9970" r="1867" b="10171" baseLine="10118" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1421" t="9970" r="1867" b="10171">tem).</wd>

</ln>

</para>

<table l="1282" t="10435" r="5908" b="12514" alignment="left" spaceBefore="14" spaceAfter="14">

<topBorder type="single" width="34"/>

<bottomBorder type="single" width="14"/>

<gridTable>

<gridCol>1555</gridCol>

<gridCol>1061</gridCol>

<gridCol>1065</gridCol>

<gridCol>945</gridCol>

<gridRow>283</gridRow>

<gridRow>1023</gridRow>

<gridRow>773</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<topBorder type="single" width="34"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="1282" t="10435" r="2837" b="10718" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="34"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="2938" t="10507" r="3787" b="10661" alignment="centered" lsp="exactly" lspExact="250" language="en">

<ln l="2938" t="10507" r="3787" b="10661" baseLine="10656" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2938" t="10507" r="3787" b="10661">Precision</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="34"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="4138" t="10502" r="4718" b="10661" alignment="centered" lsp="exactly" lspExact="250" language="en">

<ln l="4138" t="10502" r="4718" b="10661" baseLine="10656" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="4138" t="10502" r="4718" b="10661">Recall</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="34"/>

<bottomBorder type="single" width="14"/>

<para l="5294" t="10502" r="5534" b="10656" alignment="centered" lsp="exactly" lspExact="250" language="en">

<ln l="5294" t="10502" r="5534" b="10656" baseLine="10656" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5294" t="10502" r="5534" b="10656">F1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="top">

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="1416" t="10771" r="2693" b="11731" alignment="left" li="144" ri="144" lsp="exactly" lspExact="251" language="en">

<ln l="1421" t="10771" r="2141" b="10930" baseLine="10920" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1421" t="10771" r="2141" b="10930">Lexicon</wd>

<space/>

</ln>

<ln l="1416" t="11026" r="2693" b="11184" baseLine="11174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1416" t="11026" r="2693" b="11184">Normalization</wd>

<space/>

</ln>

<ln l="1421" t="11261" r="2107" b="11429" baseLine="11429" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1421" t="11294" r="1546" b="11414">+</wd>

<space/>

<wd l="1598" t="11280" r="2107" b="11429">DYM</wd>

<space/>

</ln>

<ln l="1426" t="11530" r="2429" b="11731" baseLine="11683" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1426" t="11530" r="2429" b="11731">(submitted)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="3072" t="11150" r="3662" b="11309" alignment="centered" spaceBefore="392" spaceAfter="373" lsp="exactly" lspExact="253" language="en">

<ln l="3072" t="11150" r="3662" b="11309" baseLine="11304" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3072" t="11150" r="3662" b="11309">0.8469</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="4133" t="11150" r="4718" b="11309" alignment="centered" spaceBefore="392" spaceAfter="373" lsp="exactly" lspExact="253" language="en">

<ln l="4133" t="11150" r="4718" b="11309" baseLine="11304" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4133" t="11150" r="4718" b="11309">0.8083</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="5126" t="11150" r="5726" b="11309" alignment="centered" spaceBefore="392" spaceAfter="373" lsp="exactly" lspExact="253" language="en">

<ln l="5126" t="11150" r="5726" b="11309" baseLine="11304" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="5126" t="11150" r="5726" b="11309">0.8272</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="top">

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="1416" t="11794" r="2693" b="12456" alignment="left" li="108" spaceAfter="8" lsp="exactly" lspExact="253" language="en">

<ln l="1421" t="11794" r="2141" b="11952" baseLine="11942" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="11794" r="2141" b="11952">Lexicon</wd>

<space/>

</ln>

<ln l="1416" t="12048" r="2693" b="12206" baseLine="12197" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1416" t="12048" r="2693" b="12206">Normalization</wd>

<space/>

</ln>

<ln l="1421" t="12298" r="2654" b="12456" baseLine="12446" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="12298" r="2093" b="12456">without</wd>

<space/>

<wd l="2146" t="12302" r="2654" b="12451">DYM</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="3072" t="12048" r="3658" b="12206" alignment="centered" spaceBefore="262" spaceAfter="257" lsp="exactly" lspExact="253" language="en">

<ln l="3072" t="12048" r="3658" b="12206" baseLine="12197" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3072" t="12048" r="3658" b="12206">0.8765</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<rightBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="4133" t="12048" r="4723" b="12206" alignment="centered" spaceBefore="262" spaceAfter="257" lsp="exactly" lspExact="253" language="en">

<ln l="4133" t="12048" r="4723" b="12206" baseLine="12197" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4133" t="12048" r="4723" b="12206">0.7949</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="14"/>

<topBorder type="single" width="14"/>

<bottomBorder type="single" width="14"/>

<para l="5126" t="12053" r="5726" b="12211" alignment="centered" spaceBefore="264" spaceAfter="249" lsp="exactly" lspExact="259" language="en">

<ln l="5126" t="12053" r="5726" b="12211" baseLine="12202" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="5126" t="12053" r="5726" b="12211">0.8337</wd>

</ln>

</para>

</cell>

</table>

<para l="1421" t="12562" r="5774" b="13018" alignment="justified" li="144" ri="72" lsp="exactly" lspExact="253" language="en">

<ln l="1426" t="12562" r="5774" b="12763" baseLine="12715" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="12562" r="1920" b="12720">Table</wd>

<space/>

<wd l="1982" t="12562" r="2131" b="12720">2.</wd>

<space/>

<wd l="2203" t="12562" r="2765" b="12720">Result</wd>

<space/>

<wd l="2822" t="12562" r="3466" b="12720">metrics</wd>

<space/>

<wd l="3533" t="12562" r="3730" b="12720">of</wd>

<space/>

<wd l="3763" t="12581" r="4090" b="12720">two</wd>

<space/>

<wd l="4152" t="12562" r="5371" b="12720">normalization</wd>

<space/>

<wd l="5438" t="12610" r="5774" b="12763">sys-</wd>

</ln>

<ln l="1421" t="12816" r="3120" b="13018" baseLine="12965" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="12835" r="1752" b="12974">tem</wd>

<space/>

<wd l="1810" t="12816" r="3120" b="13018">configurations.</wd>

</ln>

</para>

<para l="1382" t="13320" r="5789" b="15293" alignment="justified" li="144" ri="72" spaceBefore="253" spaceAfter="35" fli="216" lsp="exactly" lspExact="253" language="en">

<ln l="1709" t="13320" r="5789" b="13522" baseLine="13474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1709" t="13320" r="2045" b="13478">The</wd>

<space/>

<wd l="2117" t="13325" r="2626" b="13474">DYM</wd>

<space/>

<wd l="2707" t="13320" r="3312" b="13478">feature</wd>

<space/>

<wd l="3389" t="13320" r="3782" b="13478">does</wd>

<space/>

<wd l="3864" t="13368" r="3960" b="13478">a</wd>

<space/>

<wd l="4037" t="13320" r="4474" b="13522">good</wd>

<space/>

<wd l="4522" t="13320" r="4819" b="13522">job</wd>

<space/>

<wd l="4901" t="13320" r="5789" b="13522">correcting</wd>

<space/>

</ln>

<ln l="1421" t="13574" r="5784" b="13776" baseLine="13723" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1421" t="13594" r="1891" b="13776">typos</wd>

<space/>

<wd l="2011" t="13574" r="2328" b="13733">and</wd>

<space/>

<wd l="2434" t="13574" r="3269" b="13776">removing</wd>

<space/>

<wd l="3384" t="13574" r="4224" b="13733">excessive</wd>

<space/>

<wd l="4339" t="13574" r="5136" b="13776">duplicate</wd>

<space/>

<wd l="5251" t="13574" r="5784" b="13733">letters</wd>

<space/>

</ln>

<ln l="1426" t="13819" r="5789" b="14030" baseLine="13978">

<wd l="1426" t="13829" r="2170" b="14030"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">beutiful</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-5"><wd l="2333" t="13819" r="2520" b="13982">4</wd>

<space/>

</run>

<wd l="2693" t="13829" r="3518" b="14030"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">beautiful</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><wd l="3686" t="13858" r="4128" b="13987">tosee</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-5"><wd l="4301" t="13819" r="4488" b="13982">4</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><wd l="4656" t="13858" r="4819" b="13987">to</wd>

<space/>

</run>

<wd l="4973" t="13882" r="5309" b="14021"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">see</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><space/>

<wd l="5472" t="13829" r="5789" b="13987">and</wd>

<space/>

</run>

</ln>

<ln l="1416" t="14069" r="5784" b="14280" baseLine="14227">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><wd l="1416" t="14078" r="2371" b="14237">smileeeeee</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-5"><wd l="2453" t="14069" r="2640" b="14232">4</wd>

<space/>

</run>

<wd l="2712" t="14078" r="3298" b="14280"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">smile</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><space/>

<wd l="3374" t="14083" r="4229" b="14270">However,</wd>

<space/>

<wd l="4306" t="14126" r="4714" b="14237">even</wd>

<space/>

<wd l="4781" t="14078" r="5170" b="14237">with</wd>

<space/>

<wd l="5237" t="14126" r="5333" b="14237">a</wd>

<space/>

<wd l="5395" t="14078" r="5784" b="14280">high</wd>

<space/>

</run>

</ln>

<ln l="1426" t="14333" r="5784" b="14534" baseLine="14486" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1426" t="14333" r="2381" b="14491">confidence</wd>

<space/>

<wd l="2486" t="14333" r="3350" b="14525">threshold,</wd>

<space/>

<wd l="3466" t="14333" r="3898" b="14534">quite</wd>

<space/>

<wd l="4003" t="14381" r="4099" b="14491">a</wd>

<space/>

<wd l="4195" t="14333" r="4867" b="14491">number</wd>

<space/>

<wd l="4968" t="14333" r="5170" b="14491">of</wd>

<space/>

<wd l="5246" t="14333" r="5784" b="14491">words</wd>

<space/>

</ln>

<ln l="1426" t="14587" r="5784" b="14789" baseLine="14736" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1426" t="14635" r="1690" b="14746">are</wd>

<space/>

<wd l="1757" t="14587" r="2750" b="14746">normalized</wd>

<space/>

<wd l="2813" t="14587" r="3869" b="14789">excessively,</wd>

<space/>

<wd l="3941" t="14587" r="4555" b="14789">mainly</wd>

<space/>

<wd l="4618" t="14587" r="5083" b="14746">those</wd>

<space/>

<wd l="5150" t="14587" r="5318" b="14741">in</wd>

<space/>

<wd l="5386" t="14635" r="5784" b="14746">non-</wd>

</ln>

<ln l="1421" t="14827" r="5774" b="15038" baseLine="14986">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><wd l="1421" t="14837" r="2093" b="15038">English</wd>

<space/>

<wd l="2174" t="14837" r="2429" b="15038">(or</wd>

<space/>

<wd l="2496" t="14837" r="3235" b="15038">partially</wd>

<space/>

<wd l="3307" t="14837" r="4046" b="15038">English)</wd>

<space/>

<wd l="4128" t="14856" r="4742" b="15029">tweets,</wd>

<space/>

<wd l="4829" t="14885" r="5126" b="15038">e.g.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><wd l="5174" t="14837" r="5501" b="15038">jeil</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-5"><wd l="5587" t="14827" r="5774" b="14990">4</wd>

<space/>

</run>

</ln>

<ln l="1382" t="15082" r="5779" b="15293" baseLine="15240">

<wd l="1382" t="15091" r="1762" b="15293"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">jail</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><wd l="1829" t="15091" r="2203" b="15293">hoje</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-5"><wd l="2285" t="15082" r="2472" b="15245">4</wd>

<space/>

</run>

<wd l="2544" t="15091" r="3019" b="15293"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">hope</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><space/>

<wd l="3091" t="15091" r="3408" b="15250">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><wd l="3466" t="15144" r="4022" b="15250">wasan</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-5"><wd l="4104" t="15082" r="4291" b="15245">4</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><wd l="4363" t="15144" r="4704" b="15250">was</wd>

<space/>

</run>

<wd l="4771" t="15144" r="5035" b="15283"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">an</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><space/>

<wd l="5107" t="15091" r="5275" b="15245">in</wd>

<space/>

<wd l="5342" t="15091" r="5779" b="15250">addi-</wd>

</run>

</ln>

<ln l="0" t="0" r="0" b="0" baseLine="0" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<space/>

</ln>

</para>

</column>

<column l="6120" t="1417" r="10517" b="14709">

<para l="6125" t="1464" r="10498" b="4910" alignment="justified" spaceBefore="1" lsp="exactly" lspExact="253" language="en">

<ln l="6125" t="1464" r="10498" b="1666" baseLine="1613">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6125" t="1464" r="6470" b="1622">tion</wd>

<space/>

<wd l="6542" t="1483" r="6710" b="1622">to</wd>

<space/>

<wd l="6802" t="1512" r="7253" b="1622">some</wd>

<space/>

<wd l="7334" t="1464" r="8112" b="1622">incorrect</wd>

<space/>

<wd l="8189" t="1464" r="9494" b="1622">normalizations</wd>

<space/>

<wd l="9576" t="1464" r="9898" b="1622">like</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="9950" t="1464" r="10498" b="1666">parkd</wd>

<space/>

</run>

</ln>

<ln l="6139" t="1709" r="10483" b="1920" baseLine="1867">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1"><wd l="6139" t="1709" r="6326" b="1872">4</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6379" t="1718" r="6821" b="1920">park</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6883" t="1718" r="7579" b="1920">(instead</wd>

<space/>

<wd l="7646" t="1718" r="7848" b="1877">of</wd>

<space/>

</run>

<wd l="7862" t="1718" r="8568" b="1920"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">parked</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="8645" t="1766" r="8827" b="1877">or</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="8894" t="1718" r="9744" b="1877">hundread</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1"><wd l="9816" t="1709" r="10003" b="1872">4</wd>

<space/>

</run>

<wd l="10085" t="1718" r="10483" b="1877" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">hun-</wd>

</ln>

<ln l="6125" t="1973" r="10488" b="2174" baseLine="2122">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6125" t="1973" r="6610" b="2131">dreds</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6715" t="1973" r="7411" b="2174">(instead</wd>

<space/>

<wd l="7507" t="1973" r="7709" b="2131">of</wd>

<space/>

</run>

<wd l="7781" t="1973" r="8630" b="2174"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">hundred</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="8741" t="1973" r="9259" b="2131">These</wd>

<space/>

<wd l="9360" t="1973" r="10118" b="2131">mistakes</wd>

<space/>

<wd l="10229" t="2021" r="10488" b="2131">are</wd>

<space/>

</run>

</ln>

<ln l="6130" t="2222" r="10483" b="2424" baseLine="2376" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6130" t="2222" r="6902" b="2424">frequent,</wd>

<space/>

<wd l="6998" t="2222" r="7315" b="2381">and</wd>

<space/>

<wd l="7392" t="2270" r="7589" b="2381">an</wd>

<space/>

<wd l="7680" t="2222" r="8395" b="2381">increase</wd>

<space/>

<wd l="8482" t="2222" r="8645" b="2376">in</wd>

<space/>

<wd l="8726" t="2222" r="9211" b="2381">recall</wd>

<space/>

<wd l="9298" t="2222" r="9691" b="2381">does</wd>

<space/>

<wd l="9778" t="2242" r="10056" b="2381">not</wd>

<space/>

<wd l="10142" t="2242" r="10483" b="2381">out-</wd>

</ln>

<ln l="6125" t="2477" r="10488" b="2678" baseLine="2626" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="2477" r="6662" b="2678">weigh</wd>

<space/>

<wd l="6773" t="2525" r="6869" b="2635">a</wd>

<space/>

<wd l="6974" t="2477" r="7306" b="2635">loss</wd>

<space/>

<wd l="7421" t="2477" r="7584" b="2630">in</wd>

<space/>

<wd l="7685" t="2477" r="8544" b="2678">precision;</wd>

<space/>

<wd l="8664" t="2477" r="9077" b="2669">thus,</wd>

<space/>

<wd l="9187" t="2477" r="9456" b="2635">the</wd>

<space/>

<wd l="9562" t="2482" r="10488" b="2635">F-measure</wd>

<space/>

</ln>

<ln l="6125" t="2731" r="10483" b="2890" baseLine="2880" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="2731" r="6797" b="2890">without</wd>

<space/>

<wd l="6893" t="2731" r="7157" b="2890">the</wd>

<space/>

<wd l="7253" t="2736" r="7762" b="2885">DYM</wd>

<space/>

<wd l="7862" t="2731" r="8467" b="2890">feature</wd>

<space/>

<wd l="8568" t="2731" r="8731" b="2885">in</wd>

<space/>

<wd l="8832" t="2731" r="9029" b="2890">its</wd>

<space/>

<wd l="9134" t="2750" r="9754" b="2890">current</wd>

<space/>

<wd l="9854" t="2750" r="10248" b="2890">state</wd>

<space/>

<wd l="10349" t="2731" r="10483" b="2890">is</wd>

<space/>

</ln>

<ln l="6130" t="2981" r="10493" b="3182" baseLine="3134" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6130" t="3029" r="6538" b="3139">even</wd>

<space/>

<wd l="6605" t="3029" r="6701" b="3139">a</wd>

<space/>

<wd l="6768" t="2981" r="7166" b="3139">little</wd>

<space/>

<wd l="7224" t="2981" r="7464" b="3139">bit</wd>

<space/>

<wd l="7526" t="2981" r="8088" b="3182">higher</wd>

<space/>

<wd l="8150" t="2981" r="8530" b="3139">than</wd>

<space/>

<wd l="8597" t="3029" r="8890" b="3139">our</wd>

<space/>

<wd l="8957" t="2981" r="9821" b="3139">submitted</wd>

<space/>

<wd l="9888" t="3000" r="10493" b="3182">system</wd>

<space/>

</ln>

<ln l="6125" t="3235" r="10488" b="3437" baseLine="3389" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="3235" r="6514" b="3394">with</wd>

<space/>

<wd l="6576" t="3235" r="6734" b="3394">it.</wd>

<space/>

<wd l="6806" t="3235" r="7661" b="3437">Lowering</wd>

<space/>

<wd l="7718" t="3235" r="7982" b="3394">the</wd>

<space/>

<wd l="8050" t="3235" r="9010" b="3394">confidence</wd>

<space/>

<wd l="9067" t="3235" r="9888" b="3394">threshold</wd>

<space/>

<wd l="9936" t="3235" r="10488" b="3437">brings</wd>

<space/>

</ln>

<ln l="6125" t="3490" r="10483" b="3682" baseLine="3638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="3538" r="6571" b="3648">more</wd>

<space/>

<wd l="6667" t="3509" r="7277" b="3648">correct</wd>

<space/>

<wd l="7363" t="3490" r="8722" b="3682">normalizations,</wd>

<space/>

<wd l="8813" t="3490" r="9101" b="3648">but</wd>

<space/>

<wd l="9192" t="3490" r="9504" b="3648">due</wd>

<space/>

<wd l="9590" t="3509" r="9758" b="3648">to</wd>

<space/>

<wd l="9850" t="3490" r="10118" b="3648">the</wd>

<space/>

<wd l="10210" t="3538" r="10483" b="3648">na-</wd>

</ln>

<ln l="6125" t="3744" r="10493" b="3946" baseLine="3893" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="3763" r="6466" b="3902">ture</wd>

<space/>

<wd l="6547" t="3744" r="6749" b="3902">of</wd>

<space/>

<wd l="6802" t="3763" r="7358" b="3902">tweets</wd>

<space/>

<wd l="7440" t="3792" r="7848" b="3902">even</wd>

<space/>

<wd l="7925" t="3792" r="8371" b="3902">more</wd>

<space/>

<wd l="8458" t="3744" r="9235" b="3902">incorrect</wd>

<space/>

<wd l="9317" t="3792" r="9758" b="3936">ones,</wd>

<space/>

<wd l="9850" t="3744" r="10493" b="3946">leading</wd>

<space/>

</ln>

<ln l="6125" t="3994" r="10488" b="4195" baseLine="4142" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="4013" r="6288" b="4152">to</wd>

<space/>

<wd l="6374" t="4042" r="6571" b="4152">an</wd>

<space/>

<wd l="6658" t="3994" r="7262" b="4152">overall</wd>

<space/>

<wd l="7344" t="3994" r="7738" b="4195">drop</wd>

<space/>

<wd l="7824" t="3994" r="7987" b="4147">in</wd>

<space/>

<wd l="8064" t="3994" r="8275" b="4147">F1</wd>

<space/>

<wd l="8381" t="4042" r="8880" b="4152">score.</wd>

<space/>

<wd l="8962" t="3994" r="10152" b="4186">Nevertheless,</wd>

<space/>

<wd l="10234" t="4042" r="10488" b="4152">we</wd>

<space/>

</ln>

<ln l="6130" t="4248" r="10483" b="4450" baseLine="4397" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6130" t="4248" r="6811" b="4406">decided</wd>

<space/>

<wd l="6869" t="4267" r="7032" b="4406">to</wd>

<space/>

<wd l="7094" t="4296" r="7387" b="4406">use</wd>

<space/>

<wd l="7450" t="4248" r="7771" b="4406">and</wd>

<space/>

<wd l="7834" t="4248" r="8419" b="4406">submit</wd>

<space/>

<wd l="8477" t="4248" r="8746" b="4406">the</wd>

<space/>

<wd l="8813" t="4267" r="9418" b="4450">system</wd>

<space/>

<wd l="9470" t="4248" r="9864" b="4406">with</wd>

<space/>

<wd l="9922" t="4253" r="10483" b="4440">DYM,</wd>

<space/>

</ln>

<ln l="6134" t="4502" r="10483" b="4704" baseLine="4651" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6134" t="4502" r="6576" b="4661">since</wd>

<space/>

<wd l="6653" t="4550" r="6907" b="4661">we</wd>

<space/>

<wd l="6979" t="4502" r="7618" b="4661">believe</wd>

<space/>

<wd l="7694" t="4502" r="7958" b="4661">the</wd>

<space/>

<wd l="8040" t="4522" r="8366" b="4661">text</wd>

<space/>

<wd l="8443" t="4502" r="9437" b="4661">normalized</wd>

<space/>

<wd l="9509" t="4502" r="9821" b="4661">this</wd>

<space/>

<wd l="9902" t="4550" r="10267" b="4704">way</wd>

<space/>

<wd l="10344" t="4502" r="10483" b="4661">is</wd>

<space/>

</ln>

<ln l="6125" t="4752" r="8669" b="4910" baseLine="4901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="4800" r="6571" b="4910">more</wd>

<space/>

<wd l="6638" t="4752" r="7315" b="4910">suitable</wd>

<space/>

<wd l="7373" t="4752" r="7632" b="4910">for</wd>

<space/>

<wd l="7685" t="4752" r="8285" b="4910">further</wd>

<space/>

<wd l="8338" t="4800" r="8669" b="4910">use.</wd>

</ln>

</para>

<para l="6120" t="5006" r="10512" b="9720" alignment="justified" spaceBefore="2" fli="288" lsp="exactly" lspExact="253" language="en">

<ln l="6408" t="5006" r="10483" b="5208" baseLine="5155" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6408" t="5006" r="7210" b="5208">Attempts</wd>

<space/>

<wd l="7315" t="5054" r="7738" b="5165">were</wd>

<space/>

<wd l="7838" t="5006" r="8309" b="5165">made</wd>

<space/>

<wd l="8410" t="5026" r="8578" b="5165">to</wd>

<space/>

<wd l="8688" t="5006" r="9408" b="5208">improve</wd>

<space/>

<wd l="9509" t="5006" r="9778" b="5165">the</wd>

<space/>

<wd l="9874" t="5006" r="10483" b="5208">perfor-</wd>

</ln>

<ln l="6125" t="5261" r="10493" b="5419" baseLine="5410" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="5309" r="6691" b="5419">mance</wd>

<space/>

<wd l="6787" t="5261" r="6989" b="5419">of</wd>

<space/>

<wd l="7046" t="5261" r="7315" b="5419">the</wd>

<space/>

<wd l="7402" t="5266" r="7910" b="5414">DYM</wd>

<space/>

<wd l="7997" t="5261" r="8654" b="5419">module</wd>

<space/>

<wd l="8746" t="5309" r="8918" b="5419">as</wd>

<space/>

<wd l="9005" t="5261" r="9379" b="5419">well</wd>

<space/>

<wd l="9475" t="5309" r="9648" b="5419">as</wd>

<space/>

<wd l="9734" t="5280" r="9898" b="5419">to</wd>

<space/>

<wd l="9998" t="5261" r="10493" b="5419">select</wd>

<space/>

</ln>

<ln l="6125" t="5510" r="10483" b="5669" baseLine="5659" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="5510" r="6389" b="5669">the</wd>

<space/>

<wd l="6480" t="5530" r="7090" b="5669">correct</wd>

<space/>

<wd l="7176" t="5510" r="8011" b="5669">candidate</wd>

<space/>

<wd l="8098" t="5510" r="8520" b="5669">from</wd>

<space/>

<wd l="8606" t="5558" r="8702" b="5669">a</wd>

<space/>

<wd l="8779" t="5510" r="10003" b="5669">normalization</wd>

<space/>

<wd l="10090" t="5510" r="10483" b="5669">lexi-</wd>

</ln>

<ln l="6130" t="5765" r="10493" b="5966" baseLine="5914" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="5813" r="6442" b="5923">con</wd>

<space/>

<wd l="6523" t="5765" r="6672" b="5918">if</wd>

<space/>

<wd l="6725" t="5765" r="7166" b="5923">there</wd>

<space/>

<wd l="7248" t="5765" r="7387" b="5923">is</wd>

<space/>

<wd l="7464" t="5813" r="7910" b="5923">more</wd>

<space/>

<wd l="7992" t="5765" r="8362" b="5923">than</wd>

<space/>

<wd l="8448" t="5813" r="8760" b="5923">one</wd>

<space/>

<wd l="8837" t="5765" r="9446" b="5923">variant</wd>

<space/>

<wd l="9518" t="5784" r="10157" b="5966">present</wd>

<space/>

<wd l="10238" t="5765" r="10493" b="5966">(ur</wd>

<space/>

</ln>

<ln l="6139" t="6010" r="10488" b="6221" baseLine="6168">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="6139" t="6010" r="6326" b="6173">4</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6456" t="6019" r="7080" b="6221">you’re,</wd>

<space/>

<wd l="7205" t="6067" r="7656" b="6221">your,</wd>

<space/>

<wd l="7781" t="6019" r="8227" b="6221">you).</wd>

<space/>

<wd l="8357" t="6024" r="8664" b="6178">For</wd>

<space/>

<wd l="8784" t="6019" r="9571" b="6221">example,</wd>

<space/>

<wd l="9701" t="6019" r="10488" b="6221">language</wd>

<space/>

</run>

</ln>

<ln l="6130" t="6274" r="10488" b="6475" baseLine="6422" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="6274" r="6931" b="6432">detection</wd>

<space/>

<wd l="7032" t="6274" r="7565" b="6432">works</wd>

<space/>

<wd l="7670" t="6274" r="8045" b="6432">well</wd>

<space/>

<wd l="8155" t="6322" r="8371" b="6432">on</wd>

<space/>

<wd l="8467" t="6274" r="9096" b="6475">regular</wd>

<space/>

<wd l="9202" t="6274" r="9754" b="6432">search</wd>

<space/>

<wd l="9859" t="6274" r="10488" b="6475">queries</wd>

<space/>

</ln>

<ln l="6130" t="6523" r="10512" b="6725" baseLine="6672" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="6523" r="6446" b="6682">and</wd>

<space/>

<wd l="6514" t="6523" r="7003" b="6682">could</wd>

<space/>

<wd l="7061" t="6523" r="8011" b="6725">potentially</wd>

<space/>

<wd l="8078" t="6523" r="8616" b="6682">forbid</wd>

<space/>

<wd l="8678" t="6523" r="8947" b="6682">the</wd>

<space/>

<wd l="9019" t="6523" r="10238" b="6682">normalization</wd>

<space/>

<wd l="10310" t="6523" r="10512" b="6682">of</wd>

<space/>

</ln>

<ln l="6125" t="6778" r="10493" b="6979" baseLine="6926" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="6778" r="6658" b="6936">words</wd>

<space/>

<wd l="6730" t="6778" r="6893" b="6931">in</wd>

<space/>

<wd l="6955" t="6778" r="8030" b="6979">non-English</wd>

<space/>

<wd l="8093" t="6797" r="8698" b="6936">tweets.</wd>

<space/>

<wd l="8774" t="6782" r="9629" b="6970">However,</wd>

<space/>

<wd l="9701" t="6778" r="9816" b="6936">it</wd>

<space/>

<wd l="9874" t="6778" r="10493" b="6979">proved</wd>

<space/>

</ln>

<ln l="6125" t="7032" r="10488" b="7234" baseLine="7181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="7051" r="6288" b="7190">to</wd>

<space/>

<wd l="6379" t="7032" r="6590" b="7190">be</wd>

<space/>

<wd l="6677" t="7051" r="6960" b="7190">not</wd>

<space/>

<wd l="7046" t="7032" r="7666" b="7234">helpful</wd>

<space/>

<wd l="7762" t="7032" r="8016" b="7190">for</wd>

<space/>

<wd l="8102" t="7051" r="8659" b="7190">tweets</wd>

<space/>

<wd l="8746" t="7128" r="8866" b="7138">–</wd>

<space/>

<wd l="8947" t="7032" r="9211" b="7190">the</wd>

<space/>

<wd l="9302" t="7080" r="10128" b="7234">messages</wd>

<space/>

<wd l="10224" t="7080" r="10488" b="7190">are</wd>

<space/>

</ln>

<ln l="6134" t="7282" r="10493" b="7483" baseLine="7435" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6134" t="7282" r="6614" b="7474">short,</wd>

<space/>

<wd l="6691" t="7330" r="7142" b="7440">some</wd>

<space/>

<wd l="7214" t="7282" r="7416" b="7440">of</wd>

<space/>

<wd l="7454" t="7282" r="7896" b="7440">them</wd>

<space/>

<wd l="7958" t="7330" r="8222" b="7440">are</wd>

<space/>

<wd l="8290" t="7330" r="8386" b="7440">a</wd>

<space/>

<wd l="8443" t="7282" r="9125" b="7440">mixture</wd>

<space/>

<wd l="9197" t="7282" r="9398" b="7440">of</wd>

<space/>

<wd l="9437" t="7282" r="10109" b="7483">English</wd>

<space/>

<wd l="10176" t="7282" r="10493" b="7440">and</wd>

<space/>

</ln>

<ln l="6134" t="7536" r="10483" b="7738" baseLine="7685" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6134" t="7584" r="6586" b="7694">some</wd>

<space/>

<wd l="6662" t="7536" r="7118" b="7694">other</wd>

<space/>

<wd l="7190" t="7536" r="7978" b="7738">language</wd>

<space/>

<wd l="8059" t="7536" r="8544" b="7738">(thus,</wd>

<space/>

<wd l="8626" t="7536" r="8774" b="7690">if</wd>

<space/>

<wd l="8827" t="7536" r="9269" b="7694">there</wd>

<space/>

<wd l="9346" t="7536" r="9485" b="7694">is</wd>

<space/>

<wd l="9566" t="7584" r="9662" b="7694">a</wd>

<space/>

<wd l="9734" t="7536" r="10483" b="7694">normali-</wd>

</ln>

<ln l="6125" t="7790" r="10483" b="7992" baseLine="7939" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="7790" r="6662" b="7949">zation</wd>

<space/>

<wd l="6744" t="7790" r="7637" b="7949">restriction</wd>

<space/>

<wd l="7728" t="7838" r="7939" b="7949">on</wd>

<space/>

<wd l="8035" t="7790" r="8424" b="7949">such</wd>

<space/>

<wd l="8510" t="7810" r="9120" b="7982">tweets,</wd>

<space/>

<wd l="9206" t="7790" r="9974" b="7992">potential</wd>

<space/>

<wd l="10066" t="7795" r="10483" b="7992">Eng-</wd>

</ln>

<ln l="6130" t="8040" r="10483" b="8242" baseLine="8194" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="8040" r="6442" b="8198">lish</wd>

<space/>

<wd l="6523" t="8040" r="7829" b="8198">normalizations</wd>

<space/>

<wd l="7920" t="8088" r="8179" b="8198">are</wd>

<space/>

<wd l="8270" t="8040" r="8702" b="8242">lost),</wd>

<space/>

<wd l="8798" t="8040" r="9115" b="8198">and</wd>

<space/>

<wd l="9202" t="8040" r="9720" b="8242">slang-</wd>

<space/>

<wd l="9811" t="8040" r="10128" b="8198">and</wd>

<space/>

<wd l="10210" t="8040" r="10483" b="8198">ab-</wd>

</ln>

<ln l="6120" t="8294" r="10483" b="8496" baseLine="8448" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6120" t="8294" r="7430" b="8453">breviation-rich</wd>

<space/>

<wd l="7498" t="8314" r="8054" b="8453">tweets</wd>

<space/>

<wd l="8126" t="8342" r="8390" b="8453">are</wd>

<space/>

<wd l="8458" t="8294" r="8851" b="8453">hard</wd>

<space/>

<wd l="8909" t="8314" r="9077" b="8453">to</wd>

<space/>

<wd l="9154" t="8294" r="9850" b="8496">analyse.</wd>

<space/>

<wd l="9926" t="8294" r="10085" b="8448">A</wd>

<space/>

<wd l="10152" t="8294" r="10483" b="8453">lan-</wd>

</ln>

<ln l="6130" t="8549" r="10493" b="8750" baseLine="8698" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="8597" r="6643" b="8750">guage</wd>

<space/>

<wd l="6730" t="8549" r="7272" b="8707">model</wd>

<space/>

<wd l="7363" t="8597" r="7699" b="8707">was</wd>

<space/>

<wd l="7786" t="8549" r="8194" b="8707">used</wd>

<space/>

<wd l="8275" t="8549" r="8443" b="8702">in</wd>

<space/>

<wd l="8530" t="8597" r="8726" b="8707">an</wd>

<space/>

<wd l="8818" t="8568" r="9475" b="8750">attempt</wd>

<space/>

<wd l="9557" t="8568" r="9720" b="8707">to</wd>

<space/>

<wd l="9821" t="8549" r="10310" b="8707">select</wd>

<space/>

<wd l="10397" t="8597" r="10493" b="8707">a</wd>

<space/>

</ln>

<ln l="6130" t="8803" r="10493" b="9005" baseLine="8952" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="8822" r="6734" b="8962">correct</wd>

<space/>

<wd l="6802" t="8803" r="8026" b="8962">normalization</wd>

<space/>

<wd l="8098" t="8803" r="8520" b="8962">from</wd>

<space/>

<wd l="8587" t="8803" r="9317" b="9005">multiple</wd>

<space/>

<wd l="9389" t="8803" r="10133" b="8995">variants,</wd>

<space/>

<wd l="10205" t="8803" r="10493" b="8962">but</wd>

<space/>

</ln>

<ln l="6125" t="9053" r="10488" b="9254" baseLine="9206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="9053" r="6437" b="9211">this</wd>

<space/>

<wd l="6518" t="9053" r="6802" b="9211">did</wd>

<space/>

<wd l="6869" t="9072" r="7152" b="9211">not</wd>

<space/>

<wd l="7219" t="9101" r="7723" b="9254">prove</wd>

<space/>

<wd l="7795" t="9072" r="7963" b="9211">to</wd>

<space/>

<wd l="8035" t="9053" r="8246" b="9211">be</wd>

<space/>

<wd l="8328" t="9053" r="9134" b="9245">effective,</wd>

<space/>

<wd l="9221" t="9053" r="9720" b="9254">likely</wd>

<space/>

<wd l="9787" t="9053" r="10488" b="9211">because</wd>

<space/>

</ln>

<ln l="6125" t="9307" r="10493" b="9466" baseLine="9456" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="9307" r="6389" b="9466">the</wd>

<space/>

<wd l="6466" t="9307" r="7008" b="9466">model</wd>

<space/>

<wd l="7085" t="9307" r="7493" b="9466">used</wd>

<space/>

<wd l="7560" t="9355" r="7896" b="9466">was</wd>

<space/>

<wd l="7973" t="9326" r="8256" b="9466">not</wd>

<space/>

<wd l="8328" t="9307" r="9014" b="9466">focused</wd>

<space/>

<wd l="9082" t="9355" r="9298" b="9466">on</wd>

<space/>

<wd l="9379" t="9307" r="9878" b="9466">social</wd>

<space/>

<wd l="9955" t="9307" r="10493" b="9466">media</wd>

<space/>

</ln>

<ln l="6125" t="9566" r="6586" b="9720" baseLine="9710" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="9581" r="6586" b="9720">texts.</wd>

</ln>

</para>

<para l="6125" t="9811" r="10493" b="11491" alignment="justified" spaceBefore="1" fli="288" lsp="exactly" lspExact="253" language="en">

<ln l="6408" t="9811" r="10488" b="10013" baseLine="9960" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6408" t="9816" r="6710" b="9970">We</wd>

<space/>

<wd l="6835" t="9859" r="7099" b="9970">see</wd>

<space/>

<wd l="7214" t="9859" r="7680" b="9970">room</wd>

<space/>

<wd l="7790" t="9811" r="8045" b="9970">for</wd>

<space/>

<wd l="8150" t="9811" r="8918" b="10013">potential</wd>

<space/>

<wd l="9038" t="9811" r="10205" b="10013">improvement</wd>

<space/>

<wd l="10320" t="9811" r="10488" b="9965">in</wd>

<space/>

</ln>

<ln l="6125" t="10066" r="10483" b="10267" baseLine="10214" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="10066" r="6686" b="10267">tuning</wd>

<space/>

<wd l="6787" t="10066" r="7051" b="10224">the</wd>

<space/>

<wd l="7157" t="10070" r="7666" b="10219">DYM</wd>

<space/>

<wd l="7771" t="10066" r="8107" b="10224">tool</wd>

<space/>

<wd l="8213" t="10085" r="8381" b="10224">to</wd>

<space/>

<wd l="8496" t="10066" r="8995" b="10224">social</wd>

<space/>

<wd l="9101" t="10066" r="9638" b="10224">media</wd>

<space/>

<wd l="9734" t="10085" r="10200" b="10258">texts,</wd>

<space/>

<wd l="10310" t="10114" r="10483" b="10224">as</wd>

<space/>

</ln>

<ln l="6125" t="10320" r="10483" b="10522" baseLine="10469" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="10320" r="6499" b="10478">well</wd>

<space/>

<wd l="6581" t="10368" r="6754" b="10478">as</wd>

<space/>

<wd l="6840" t="10320" r="7003" b="10474">in</wd>

<space/>

<wd l="7085" t="10320" r="7786" b="10522">filtering</wd>

<space/>

<wd l="7862" t="10320" r="8933" b="10522">non-English</wd>

<space/>

<wd l="9010" t="10320" r="9542" b="10478">words</wd>

<space/>

<wd l="9624" t="10320" r="10051" b="10478">from</wd>

<space/>

<wd l="10123" t="10368" r="10483" b="10478">nor-</wd>

</ln>

<ln l="6125" t="10574" r="10488" b="10776" baseLine="10723" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="10574" r="7056" b="10733">malization</wd>

<space/>

<wd l="7171" t="10574" r="8146" b="10766">candidates,</wd>

<space/>

<wd l="8266" t="10574" r="9533" b="10776">experimenting</wd>

<space/>

<wd l="9643" t="10574" r="10037" b="10733">with</wd>

<space/>

<wd l="10152" t="10574" r="10488" b="10733">lan-</wd>

</ln>

<ln l="6130" t="10824" r="10493" b="11026" baseLine="10973" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="10872" r="6643" b="11026">guage</wd>

<space/>

<wd l="6730" t="10824" r="7363" b="10982">models</wd>

<space/>

<wd l="7450" t="10824" r="8126" b="10982">tailored</wd>

<space/>

<wd l="8203" t="10843" r="8371" b="10982">to</wd>

<space/>

<wd l="8467" t="10824" r="8966" b="10982">social</wd>

<space/>

<wd l="9053" t="10824" r="9595" b="10982">media</wd>

<space/>

<wd l="9672" t="10843" r="10085" b="10982">texts</wd>

<space/>

<wd l="10176" t="10824" r="10493" b="10982">and</wd>

<space/>

</ln>

<ln l="6130" t="11078" r="10483" b="11280" baseLine="11227" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6130" t="11078" r="6725" b="11237">further</wd>

<space/>

<wd l="6811" t="11078" r="7637" b="11280">enriching</wd>

<space/>

<wd l="7723" t="11078" r="7987" b="11237">the</wd>

<space/>

<wd l="8078" t="11078" r="8722" b="11237">lexicon</wd>

<space/>

<wd l="8808" t="11078" r="9197" b="11237">with</wd>

<space/>

<wd l="9283" t="11126" r="9648" b="11237">new</wd>

<space/>

<wd l="9734" t="11078" r="10483" b="11237">normali-</wd>

</ln>

<ln l="6125" t="11333" r="7128" b="11491" baseLine="11482" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6125" t="11333" r="6662" b="11491">zation</wd>

<space/>

<wd l="6725" t="11333" r="7128" b="11491">data.</wd>

</ln>

</para>

<para l="6130" t="11794" r="7699" b="11962" alignment="left" spaceBefore="205" lsp="exactly" lspExact="273" language="en">

<ln l="6130" t="11794" r="7699" b="11962" baseLine="11957" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="18">

<wd l="6130" t="11794" r="6240" b="11957">4</wd>

<space/>

<wd l="6566" t="11794" r="7699" b="11962">Conclusion</wd>

</ln>

</para>

<para l="6120" t="12221" r="10493" b="14654" alignment="justified" spaceBefore="160" lsp="exactly" lspExact="252" language="en">

<ln l="6130" t="12221" r="10493" b="12422" baseLine="12370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6130" t="12226" r="6302" b="12374">In</wd>

<space/>

<wd l="6365" t="12221" r="6677" b="12379">this</wd>

<space/>

<wd l="6739" t="12269" r="7282" b="12422">paper,</wd>

<space/>

<wd l="7349" t="12269" r="7603" b="12379">we</wd>

<space/>

<wd l="7661" t="12221" r="8510" b="12422">presented</wd>

<space/>

<wd l="8568" t="12269" r="8664" b="12379">a</wd>

<space/>

<wd l="8731" t="12240" r="9336" b="12422">system</wd>

<space/>

<wd l="9398" t="12221" r="10176" b="12422">designed</wd>

<space/>

<wd l="10238" t="12221" r="10493" b="12379">for</wd>

<space/>

</ln>

<ln l="6120" t="12475" r="10478" b="12677" baseLine="12624" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6120" t="12475" r="7238" b="12677">participation</wd>

<space/>

<wd l="7315" t="12475" r="7483" b="12629">in</wd>

<space/>

<wd l="7570" t="12475" r="8136" b="12634">shared</wd>

<space/>

<wd l="8208" t="12475" r="8568" b="12634">task</wd>

<space/>

<wd l="8635" t="12475" r="8851" b="12634">#2</wd>

<space/>

<wd l="8938" t="12475" r="9139" b="12634">of</wd>

<space/>

<wd l="9192" t="12475" r="9456" b="12634">the</wd>

<space/>

<wd l="9538" t="12475" r="9974" b="12634">ACL</wd>

<space/>

<wd l="10056" t="12475" r="10478" b="12634">2015</wd>

<space/>

</ln>

<ln l="6125" t="12725" r="10483" b="12926" baseLine="12874" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="12725" r="6984" b="12926">workshop</wd>

<space/>

<wd l="7070" t="12773" r="7286" b="12883">on</wd>

<space/>

<wd l="7354" t="12725" r="7834" b="12926">noisy</wd>

<space/>

<wd l="7901" t="12725" r="9202" b="12926">user-generated</wd>

<space/>

<wd l="9269" t="12744" r="9643" b="12883">text.</wd>

<space/>

<wd l="9730" t="12725" r="10070" b="12883">Our</wd>

<space/>

<wd l="10147" t="12773" r="10483" b="12926">sys-</wd>

</ln>

<ln l="6125" t="12979" r="10488" b="13181" baseLine="13128" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="12998" r="6456" b="13138">tem</wd>

<space/>

<wd l="6538" t="12979" r="7090" b="13138">makes</wd>

<space/>

<wd l="7181" t="13027" r="7474" b="13138">use</wd>

<space/>

<wd l="7565" t="12979" r="7766" b="13138">of</wd>

<space/>

<wd l="7834" t="12979" r="8237" b="13138">CRF</wd>

<space/>

<wd l="8333" t="12979" r="8587" b="13138">for</wd>

<space/>

<wd l="8674" t="12979" r="9634" b="13181">identifying</wd>

<space/>

<wd l="9715" t="12979" r="10488" b="13181">potential</wd>

<space/>

</ln>

<ln l="6130" t="13234" r="10493" b="13426" baseLine="13382" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6130" t="13234" r="7099" b="13426">candidates,</wd>

<space/>

<wd l="7238" t="13234" r="7963" b="13392">lexicons</wd>

<space/>

<wd l="8088" t="13253" r="8256" b="13392">to</wd>

<space/>

<wd l="8386" t="13234" r="9259" b="13392">normalize</wd>

<space/>

<wd l="9389" t="13234" r="9826" b="13392">them</wd>

<space/>

<wd l="9955" t="13234" r="10272" b="13392">and</wd>

<space/>

<wd l="10397" t="13282" r="10493" b="13392">a</wd>

<space/>

</ln>

<ln l="6125" t="13483" r="10493" b="13685" baseLine="13637" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="13488" r="6634" b="13637">DYM</wd>

<space/>

<wd l="6696" t="13483" r="7349" b="13642">module</wd>

<space/>

<wd l="7416" t="13531" r="7589" b="13642">as</wd>

<space/>

<wd l="7661" t="13531" r="7757" b="13642">a</wd>

<space/>

<wd l="7805" t="13483" r="9192" b="13685">post-processing</wd>

<space/>

<wd l="9259" t="13502" r="9600" b="13685">step</wd>

<space/>

<wd l="9658" t="13502" r="9830" b="13642">to</wd>

<space/>

<wd l="9898" t="13483" r="10493" b="13642">further</wd>

<space/>

</ln>

<ln l="6130" t="13738" r="10483" b="13939" baseLine="13891" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6130" t="13757" r="6734" b="13896">correct</wd>

<space/>

<wd l="6830" t="13786" r="7282" b="13896">some</wd>

<space/>

<wd l="7378" t="13738" r="7579" b="13896">of</wd>

<space/>

<wd l="7642" t="13738" r="7910" b="13896">the</wd>

<space/>

<wd l="8002" t="13738" r="8942" b="13939">misspelled</wd>

<space/>

<wd l="9029" t="13738" r="9605" b="13896">words.</wd>

<space/>

<wd l="9710" t="13738" r="10051" b="13896">Our</wd>

<space/>

<wd l="10147" t="13786" r="10483" b="13939">sys-</wd>

</ln>

<ln l="6125" t="13992" r="10488" b="14194" baseLine="14141" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="14011" r="6456" b="14150">tem</wd>

<space/>

<wd l="6571" t="13992" r="7171" b="14150">ranked</wd>

<space/>

<wd l="7296" t="13992" r="7906" b="14150">second</wd>

<space/>

<wd l="8026" t="14040" r="8616" b="14194">among</wd>

<space/>

<wd l="8736" t="13992" r="8952" b="14150">all</wd>

<space/>

<wd l="9096" t="13992" r="9269" b="14146">11</wd>

<space/>

<wd l="9422" t="13992" r="10488" b="14150">submissions</wd>

<space/>

</ln>

<ln l="6125" t="14242" r="10474" b="14443" baseLine="14395" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6125" t="14242" r="6514" b="14400">with</wd>

<space/>

<wd l="6586" t="14242" r="7186" b="14400">0.8272</wd>

<space/>

<wd l="7253" t="14246" r="8179" b="14400">F-measure</wd>

<space/>

<wd l="8251" t="14242" r="8568" b="14400">and</wd>

<space/>

<wd l="8630" t="14242" r="9230" b="14400">ranked</wd>

<space/>

<wd l="9302" t="14242" r="9653" b="14400">first</wd>

<space/>

<wd l="9720" t="14290" r="10315" b="14443">among</wd>

<space/>

<wd l="10387" t="14246" r="10474" b="14400">5</wd>

<space/>

</ln>

<ln l="6134" t="14496" r="9710" b="14654" baseLine="14650" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6134" t="14496" r="7195" b="14654">submissions</wd>

<space/>

<wd l="7258" t="14496" r="7517" b="14654">for</wd>

<space/>

<wd l="7565" t="14496" r="7834" b="14654">the</wd>

<space/>

<wd l="7891" t="14496" r="9130" b="14654">unconstrained</wd>

<space/>

<wd l="9178" t="14496" r="9710" b="14654">mode.</wd>

</ln>

</para>

</column>

</section>

<dd l="5776" t="15746" r="6181" b="15975">

<para l="5809" t="15792" r="6148" b="15946" alignment="left" lsp="exactly" lspExact="223" language="en">

<ln l="5875" t="15792" r="6082" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="29">

<wd l="5875" t="15792" r="6082" b="15946">80</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4311.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1421" marginTop="1420" marginRight="6068" marginBottom="858" offsetX="8" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1421" t="1420" r="5841" b="15980">

<column l="1421" t="1420" r="5841" b="15980">

<para l="1421" t="1478" r="2530" b="1646" alignment="left" spaceBefore="6" lsp="exactly" lspExact="273" language="en">

<ln l="1421" t="1478" r="2530" b="1646" baseLine="1637" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="1478" r="2530" b="1646">References</wd>

</ln>

</para>

<para l="1421" t="1853" r="5765" b="2270" alignment="justified" li="216" ri="72" spaceBefore="113" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1421" t="1853" r="5765" b="2002" baseLine="1992">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1421" t="1858" r="1910" b="2002">Kevin</wd>

<space/>

<wd l="1978" t="1858" r="2750" b="2002">Atkinson.</wd>

<space/>

<wd l="2832" t="1858" r="3504" b="2002">VarCon.</wd>

<space/>

<wd l="3586" t="1862" r="4003" b="2002">Vers.</wd>

<space/>

<wd l="4090" t="1858" r="5030" b="2002">2015.02.15.</wd>

<space/>

</run>

<wd l="5136" t="1858" r="5501" b="2002"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Web</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5592" t="1858" r="5765" b="2002">01</wd>

<space/>

</run>

</ln>

<ln l="1646" t="2088" r="5160" b="2270" baseLine="2222" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="2088" r="1992" b="2270">Apr.</wd>

<space/>

<wd l="2054" t="2088" r="2501" b="2232">2015.</wd>

<space/>

<wd l="2563" t="2088" r="5160" b="2270">http://wordlist.aspell.net/varcon/</wd>

</ln>

</para>

<para l="1426" t="2434" r="5827" b="3998" alignment="justified" li="216" spaceBefore="114" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1426" t="2434" r="5779" b="2616" baseLine="2573" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="2434" r="2107" b="2616">Timothy</wd>

<space/>

<wd l="2189" t="2434" r="2909" b="2606">Baldwin,</wd>

<space/>

<wd l="3000" t="2434" r="4315" b="2578">Marie-Catherine</wd>

<space/>

<wd l="4406" t="2434" r="4589" b="2578">de</wd>

<space/>

<wd l="4670" t="2434" r="5458" b="2606">Marneffe,</wd>

<space/>

<wd l="5549" t="2438" r="5779" b="2578">Bo</wd>

<space/>

</ln>

<ln l="1646" t="2664" r="5774" b="2846" baseLine="2798" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="2669" r="2021" b="2837">Han,</wd>

<space/>

<wd l="2107" t="2669" r="3110" b="2846">Young-Bum</wd>

<space/>

<wd l="3182" t="2664" r="3581" b="2837">Kim,</wd>

<space/>

<wd l="3667" t="2664" r="4056" b="2808">Alan</wd>

<space/>

<wd l="4133" t="2664" r="4632" b="2837">Ritter,</wd>

<space/>

<wd l="4718" t="2664" r="5002" b="2808">and</wd>

<space/>

<wd l="5078" t="2664" r="5410" b="2808">Wei</wd>

<space/>

<wd l="5491" t="2669" r="5774" b="2808">Xu.</wd>

<space/>

</ln>

<ln l="1646" t="2894" r="5789" b="3077" baseLine="3034" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="2894" r="2088" b="3038">2015.</wd>

<space/>

<wd l="2174" t="2894" r="2717" b="3038">Shared</wd>

<space/>

<wd l="2779" t="2894" r="3173" b="3038">tasks</wd>

<space/>

<wd l="3245" t="2894" r="3432" b="3038">of</wd>

<space/>

<wd l="3466" t="2894" r="3710" b="3038">the</wd>

<space/>

<wd l="3773" t="2894" r="4162" b="3038">2015</wd>

<space/>

<wd l="4243" t="2894" r="5021" b="3077">workshop</wd>

<space/>

<wd l="5093" t="2938" r="5290" b="3038">on</wd>

<space/>

<wd l="5352" t="2894" r="5789" b="3077">noisy</wd>

<space/>

</ln>

<ln l="1646" t="3125" r="5784" b="3307" baseLine="3259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="3125" r="2822" b="3307">user-generated</wd>

<space/>

<wd l="2918" t="3144" r="3259" b="3269">text:</wd>

<space/>

<wd l="3370" t="3125" r="3960" b="3269">Twitter</wd>

<space/>

<wd l="4051" t="3125" r="4574" b="3269">lexical</wd>

<space/>

<wd l="4675" t="3125" r="5784" b="3269">normalization</wd>

<space/>

</ln>

<ln l="1651" t="3355" r="5827" b="3538" baseLine="3490">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="3355" r="1934" b="3499">and</wd>

<space/>

<wd l="2030" t="3355" r="2563" b="3499">named</wd>

<space/>

<wd l="2664" t="3355" r="3120" b="3538">entity</wd>

<space/>

<wd l="3211" t="3355" r="4162" b="3538">recognition.</wd>

<space/>

<wd l="4272" t="3360" r="4435" b="3494">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4526" t="3355" r="5534" b="3538">Proceedings</wd>

<space/>

<wd l="5635" t="3355" r="5827" b="3538">of</wd>

<space/>

</run>

</ln>

<ln l="1651" t="3586" r="5789" b="3768" baseLine="3725" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="3586" r="1886" b="3730">the</wd>

<space/>

<wd l="2083" t="3586" r="2866" b="3768">Workshop</wd>

<space/>

<wd l="3038" t="3634" r="3230" b="3730">on</wd>

<space/>

<wd l="3394" t="3590" r="3859" b="3768">Noisy</wd>

<space/>

<wd l="4042" t="3586" r="5285" b="3768">User-generated</wd>

<space/>

<wd l="5453" t="3590" r="5789" b="3730">Text</wd>

<space/>

</ln>

<ln l="1656" t="3816" r="4090" b="3998" baseLine="3950">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="3816" r="2285" b="3998">(WNUT</wd>

<space/>

</run>

<wd l="2314" t="3816" r="2827" b="3998"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2885" t="3816" r="3518" b="3998">Beijing,</wd>

<space/>

<wd l="3581" t="3816" r="4090" b="3960">China.</wd>

</run>

</ln>

</para>

<para l="1421" t="4166" r="5779" b="5040" alignment="left" li="216" spaceBefore="115" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1421" t="4166" r="5779" b="4349" baseLine="4301" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="4166" r="1992" b="4349">Vangie</wd>

<space/>

<wd l="2074" t="4166" r="2477" b="4310">Beal.</wd>

<space/>

<wd l="2568" t="4171" r="2933" b="4310">Text</wd>

<space/>

<wd l="3010" t="4166" r="3845" b="4349">messaging</wd>

<space/>

<wd l="3931" t="4166" r="4214" b="4310">and</wd>

<space/>

<wd l="4296" t="4166" r="4786" b="4310">online</wd>

<space/>

<wd l="4872" t="4166" r="5198" b="4310">chat</wd>

<space/>

<wd l="5280" t="4166" r="5779" b="4310">abbre-</wd>

</ln>

<ln l="1646" t="4392" r="3936" b="4579" baseLine="4531">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1646" t="4397" r="2318" b="4541">viations.</wd>

<space/>

</run>

<wd l="2405" t="4397" r="2774" b="4541"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Web</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2842" t="4397" r="3014" b="4541">01</wd>

<space/>

<wd l="3086" t="4397" r="3432" b="4579">Apr.</wd>

<space/>

<wd l="3494" t="4397" r="3936" b="4541">2015.</wd>

<space/>

</run>

</ln>

<ln l="1646" t="4627" r="5722" b="4810" baseLine="4762" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="4627" r="5722" b="4810">http://www.webopedia.com/quick_ref/textmessage</wd>

<space/>

</ln>

<ln l="1651" t="4858" r="3034" b="5040" baseLine="4992" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="4858" r="3034" b="5040">abbreviations.asp</wd>

</ln>

</para>

<para l="1426" t="5208" r="5784" b="6307" alignment="justified" li="216" spaceBefore="120" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1426" t="5208" r="5784" b="5390" baseLine="5342" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1426" t="5208" r="2160" b="5390">Grzegorz</wd>

<space/>

<wd l="2270" t="5208" r="3034" b="5390">Chrupała.</wd>

<space/>

<wd l="3149" t="5208" r="3590" b="5352">2014.</wd>

<space/>

<wd l="3701" t="5208" r="4709" b="5390">Normalizing</wd>

<space/>

<wd l="4814" t="5227" r="5318" b="5352">tweets</wd>

<space/>

<wd l="5429" t="5208" r="5784" b="5352">with</wd>

<space/>

</ln>

<ln l="1651" t="5434" r="5784" b="5616" baseLine="5573" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="5434" r="1949" b="5578">edit</wd>

<space/>

<wd l="2059" t="5434" r="2568" b="5616">scripts</wd>

<space/>

<wd l="2678" t="5434" r="2966" b="5578">and</wd>

<space/>

<wd l="3067" t="5453" r="3792" b="5578">recurrent</wd>

<space/>

<wd l="3893" t="5434" r="4392" b="5578">neural</wd>

<space/>

<wd l="4502" t="5434" r="5501" b="5616">embeddings.</wd>

<space/>

<wd l="5621" t="5438" r="5784" b="5573">In</wd>

<space/>

</ln>

<ln l="1642" t="5664" r="5784" b="5846" baseLine="5798" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="5664" r="2650" b="5846">Proceedings</wd>

<space/>

<wd l="2707" t="5664" r="2899" b="5846">of</wd>

<space/>

<wd l="2918" t="5664" r="3154" b="5808">the</wd>

<space/>

<wd l="3216" t="5664" r="3624" b="5808">52nd</wd>

<space/>

<wd l="3658" t="5664" r="4253" b="5808">Annual</wd>

<space/>

<wd l="4291" t="5669" r="4958" b="5846">Meeting</wd>

<space/>

<wd l="5016" t="5664" r="5208" b="5846">of</wd>

<space/>

<wd l="5227" t="5664" r="5462" b="5808">the</wd>

<space/>

<wd l="5510" t="5664" r="5784" b="5808">As-</wd>

</ln>

<ln l="1642" t="5894" r="5779" b="6077" baseLine="6029" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="5904" r="2376" b="6038">sociation</wd>

<space/>

<wd l="2510" t="5894" r="2784" b="6077">for</wd>

<space/>

<wd l="2957" t="5894" r="4152" b="6077">Computational</wd>

<space/>

<wd l="4301" t="5899" r="5184" b="6077">Linguistics</wd>

<space/>

<wd l="5362" t="5894" r="5779" b="6077">(ACL</wd>

<space/>

</ln>

<ln l="1646" t="6125" r="4858" b="6307" baseLine="6264">

<wd l="1646" t="6125" r="2160" b="6307"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2014)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2213" t="6168" r="2664" b="6307">pages</wd>

<space/>

<wd l="2726" t="6125" r="3466" b="6298">680–686,</wd>

<space/>

<wd l="3523" t="6125" r="4363" b="6298">Baltimore,</wd>

<space/>

<wd l="4421" t="6125" r="4858" b="6269">USA.</wd>

</run>

</ln>

</para>

<para l="1430" t="6475" r="5789" b="7579" alignment="justified" li="216" spaceBefore="109" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1430" t="6475" r="5770" b="6658" baseLine="6614" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1430" t="6475" r="2054" b="6658">Stephan</wd>

<space/>

<wd l="2184" t="6475" r="2789" b="6648">Gouws,</wd>

<space/>

<wd l="2909" t="6475" r="3278" b="6614">Dirk</wd>

<space/>

<wd l="3394" t="6480" r="3883" b="6658">Hovy,</wd>

<space/>

<wd l="4008" t="6475" r="4291" b="6619">and</wd>

<space/>

<wd l="4406" t="6475" r="4997" b="6619">Donald</wd>

<space/>

<wd l="5112" t="6475" r="5770" b="6619">Metzler.</wd>

<space/>

</ln>

<ln l="1646" t="6706" r="5789" b="6888" baseLine="6840" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="6706" r="2088" b="6850">2011.</wd>

<space/>

<wd l="2146" t="6706" r="3245" b="6888">Unsupervised</wd>

<space/>

<wd l="3298" t="6706" r="3859" b="6888">mining</wd>

<space/>

<wd l="3917" t="6706" r="4104" b="6850">of</wd>

<space/>

<wd l="4133" t="6706" r="4656" b="6850">lexical</wd>

<space/>

<wd l="4709" t="6706" r="5338" b="6850">variants</wd>

<space/>

<wd l="5400" t="6706" r="5789" b="6850">from</wd>

<space/>

</ln>

<ln l="1646" t="6936" r="5784" b="7118" baseLine="7070">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1646" t="6936" r="2083" b="7118">noisy</wd>

<space/>

<wd l="2131" t="6955" r="2467" b="7080">text.</wd>

<space/>

<wd l="2539" t="6941" r="2702" b="7075">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2750" t="6936" r="3754" b="7118">Proceedings</wd>

<space/>

<wd l="3811" t="6936" r="4003" b="7118">of</wd>

<space/>

<wd l="4022" t="6936" r="4258" b="7080">the</wd>

<space/>

<wd l="4310" t="6941" r="4709" b="7080">First</wd>

<space/>

<wd l="4752" t="6936" r="5530" b="7118">workshop</wd>

<space/>

<wd l="5592" t="6984" r="5784" b="7080">on</wd>

<space/>

</run>

</ln>

<ln l="1666" t="7166" r="5784" b="7349" baseLine="7301">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1666" t="7166" r="2755" b="7349">Unsupervised</wd>

<space/>

<wd l="2813" t="7171" r="3562" b="7349">Learning</wd>

<space/>

<wd l="3634" t="7176" r="3782" b="7310">in</wd>

<space/>

</run>

<wd l="3850" t="7171" r="4267" b="7339"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">NLP</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4344" t="7210" r="4795" b="7349">pages</wd>

<space/>

<wd l="4886" t="7166" r="5419" b="7339">82–90,</wd>

<space/>

<wd l="5501" t="7166" r="5784" b="7310">Ed-</wd>

</run>

</ln>

<ln l="1651" t="7397" r="2693" b="7579" baseLine="7531" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="7397" r="2309" b="7579">inburgh,</wd>

<space/>

<wd l="2366" t="7402" r="2693" b="7541">UK.</wd>

</ln>

</para>

<para l="1522" t="7747" r="5789" b="8846" alignment="justified" li="216" spaceBefore="120" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1522" t="7747" r="5779" b="7930" baseLine="7882" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1522" t="7752" r="1747" b="7891">Bo</wd>

<space/>

<wd l="1838" t="7752" r="2174" b="7891">Han</wd>

<space/>

<wd l="2261" t="7747" r="2549" b="7891">and</wd>

<space/>

<wd l="2635" t="7747" r="3322" b="7930">Timothy</wd>

<space/>

<wd l="3408" t="7747" r="4128" b="7891">Baldwin.</wd>

<space/>

<wd l="4224" t="7747" r="4666" b="7891">2011.</wd>

<space/>

<wd l="4766" t="7747" r="5357" b="7891">Lexical</wd>

<space/>

<wd l="5453" t="7790" r="5779" b="7891">nor-</wd>

</ln>

<ln l="1646" t="7978" r="5789" b="8160" baseLine="8112" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="7978" r="2491" b="8122">malization</wd>

<space/>

<wd l="2597" t="7978" r="2784" b="8122">of</wd>

<space/>

<wd l="2870" t="7978" r="3264" b="8122">short</wd>

<space/>

<wd l="3365" t="7997" r="3667" b="8122">text</wd>

<space/>

<wd l="3768" t="8021" r="4565" b="8160">messages:</wd>

<space/>

<wd l="4680" t="7978" r="5150" b="8122">Makn</wd>

<space/>

<wd l="5261" t="8021" r="5587" b="8122">sens</wd>

<space/>

<wd l="5702" t="8021" r="5789" b="8122">a</wd>

<space/>

</ln>

<ln l="1646" t="8203" r="5784" b="8386" baseLine="8338">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1646" t="8203" r="2304" b="8347">#twitter.</wd>

<space/>

<wd l="2395" t="8208" r="2554" b="8342">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2621" t="8203" r="3629" b="8386">Proceedings</wd>

<space/>

<wd l="3706" t="8203" r="3898" b="8386">of</wd>

<space/>

<wd l="3931" t="8203" r="4166" b="8347">the</wd>

<space/>

<wd l="4248" t="8203" r="4598" b="8347">49th</wd>

<space/>

<wd l="4666" t="8203" r="5256" b="8347">Annual</wd>

<space/>

<wd l="5314" t="8208" r="5784" b="8347">Meet-</wd>

</run>

</ln>

<ln l="1651" t="8434" r="5784" b="8616" baseLine="8568" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="8443" r="1906" b="8616">ing</wd>

<space/>

<wd l="1982" t="8434" r="2174" b="8616">of</wd>

<space/>

<wd l="2213" t="8434" r="2448" b="8578">the</wd>

<space/>

<wd l="2520" t="8434" r="3456" b="8578">Association</wd>

<space/>

<wd l="3499" t="8434" r="3773" b="8616">for</wd>

<space/>

<wd l="3854" t="8434" r="5054" b="8616">Computational</wd>

<space/>

<wd l="5112" t="8438" r="5784" b="8616">Linguis-</wd>

</ln>

<ln l="1651" t="8664" r="5510" b="8846" baseLine="8803">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="8674" r="1925" b="8808">tics</wd>

<space/>

<wd l="1982" t="8664" r="2400" b="8846">(ACL</wd>

<space/>

</run>

<wd l="2453" t="8664" r="2966" b="8846"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2011)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3019" t="8707" r="3475" b="8846">pages</wd>

<space/>

<wd l="3533" t="8664" r="4243" b="8837">368-378,</wd>

<space/>

<wd l="4301" t="8664" r="5021" b="8837">Portland,</wd>

<space/>

<wd l="5078" t="8664" r="5510" b="8808">USA.</wd>

</run>

</ln>

</para>

<para l="1421" t="9014" r="5784" b="10570" alignment="justified" li="216" spaceBefore="108" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1421" t="9014" r="5779" b="9197" baseLine="9154" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="9014" r="1800" b="9158">John</wd>

<space/>

<wd l="1877" t="9019" r="2059" b="9158">D.</wd>

<space/>

<wd l="2155" t="9014" r="2851" b="9197">Lafferty,</wd>

<space/>

<wd l="2942" t="9014" r="3590" b="9158">Andrew</wd>

<space/>

<wd l="3667" t="9014" r="4565" b="9187">McCallum,</wd>

<space/>

<wd l="4661" t="9014" r="4944" b="9158">and</wd>

<space/>

<wd l="5026" t="9014" r="5779" b="9158">Fernando</wd>

<space/>

</ln>

<ln l="1651" t="9245" r="5770" b="9389" baseLine="9379" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="9245" r="1819" b="9389">C.</wd>

<space/>

<wd l="1915" t="9250" r="2098" b="9389">N.</wd>

<space/>

<wd l="2203" t="9245" r="2808" b="9389">Pereira.</wd>

<space/>

<wd l="2909" t="9245" r="3346" b="9389">2001.</wd>

<space/>

<wd l="3451" t="9245" r="4382" b="9389">Conditional</wd>

<space/>

<wd l="4474" t="9245" r="5155" b="9389">Random</wd>

<space/>

<wd l="5237" t="9245" r="5770" b="9389">Fields:</wd>

<space/>

</ln>

<ln l="1646" t="9475" r="5784" b="9658" baseLine="9610" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="9475" r="2654" b="9619">Probabilistic</wd>

<space/>

<wd l="2755" t="9475" r="3322" b="9619">models</wd>

<space/>

<wd l="3427" t="9475" r="3658" b="9619">for</wd>

<space/>

<wd l="3758" t="9475" r="4666" b="9658">segmenting</wd>

<space/>

<wd l="4766" t="9475" r="5050" b="9619">and</wd>

<space/>

<wd l="5146" t="9475" r="5784" b="9658">labeling</wd>

<space/>

</ln>

<ln l="1656" t="9706" r="5784" b="9888" baseLine="9840">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="9749" r="2376" b="9888">sequence</wd>

<space/>

</run>

<wd l="2434" t="9706" r="2794" b="9850"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">data</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2870" t="9710" r="3029" b="9845">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3077" t="9706" r="4080" b="9888">Proceedings</wd>

<space/>

<wd l="4138" t="9706" r="4330" b="9888">of</wd>

<space/>

<wd l="4344" t="9706" r="4584" b="9850">the</wd>

<space/>

<wd l="4627" t="9706" r="5501" b="9888">Eighteenth</wd>

<space/>

<wd l="5544" t="9710" r="5784" b="9850">In-</wd>

</run>

</ln>

<ln l="1651" t="9936" r="5779" b="10118" baseLine="10070">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="9936" r="2544" b="10080">ternational</wd>

<space/>

<wd l="2707" t="9936" r="3619" b="10118">Conference</wd>

<space/>

<wd l="3787" t="9984" r="3979" b="10080">on</wd>

<space/>

<wd l="4133" t="9936" r="4838" b="10080">Machine</wd>

<space/>

</run>

<wd l="4992" t="9941" r="5779" b="10118"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Learning</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="1651" t="10166" r="5779" b="10349" baseLine="10301" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="10166" r="2424" b="10339">ICML&apos;01,</wd>

<space/>

<wd l="2486" t="10210" r="2942" b="10349">pages</wd>

<space/>

<wd l="3005" t="10166" r="3744" b="10310">282–289.</wd>

<space/>

<wd l="3816" t="10171" r="4440" b="10349">Morgan</wd>

<space/>

<wd l="4502" t="10166" r="5347" b="10310">Kaufmann</wd>

<space/>

<wd l="5405" t="10166" r="5779" b="10310">Pub-</wd>

</ln>

<ln l="1651" t="10397" r="4627" b="10570" baseLine="10531" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="10397" r="2165" b="10541">lishers</wd>

<space/>

<wd l="2222" t="10402" r="2563" b="10570">Inc.,</wd>

<space/>

<wd l="2635" t="10397" r="2918" b="10541">San</wd>

<space/>

<wd l="2976" t="10397" r="3792" b="10570">Francisco,</wd>

<space/>

<wd l="3854" t="10397" r="4171" b="10570">CA,</wd>

<space/>

<wd l="4229" t="10397" r="4627" b="10541">USA</wd>

</ln>

</para>

<para l="1522" t="10747" r="5827" b="12298" alignment="justified" li="216" spaceBefore="111" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1522" t="10747" r="5779" b="10930" baseLine="10882" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1522" t="10747" r="1771" b="10891">Fei</wd>

<space/>

<wd l="1853" t="10747" r="2174" b="10920">Liu,</wd>

<space/>

<wd l="2261" t="10747" r="2866" b="10930">Fuliang</wd>

<space/>

<wd l="2947" t="10752" r="3466" b="10930">Weng,</wd>

<space/>

<wd l="3552" t="10747" r="4296" b="10930">Bingqing</wd>

<space/>

<wd l="4378" t="10752" r="4896" b="10930">Wang,</wd>

<space/>

<wd l="4987" t="10747" r="5270" b="10891">and</wd>

<space/>

<wd l="5352" t="10752" r="5779" b="10930">Yang</wd>

<space/>

</ln>

<ln l="1646" t="10978" r="5774" b="11150" baseLine="11112" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="10978" r="1963" b="11122">Liu.</wd>

<space/>

<wd l="2117" t="10978" r="2558" b="11122">2011.</wd>

<space/>

<wd l="2717" t="10978" r="3466" b="11150">Insertion,</wd>

<space/>

<wd l="3619" t="10978" r="4301" b="11150">deletion,</wd>

<space/>

<wd l="4459" t="11021" r="4627" b="11122">or</wd>

<space/>

<wd l="4776" t="10978" r="5774" b="11122">substitution?</wd>

<space/>

</ln>

<ln l="1642" t="11203" r="5779" b="11386" baseLine="11342" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="11203" r="2654" b="11386">Normalizing</wd>

<space/>

<wd l="2942" t="11222" r="3245" b="11347">text</wd>

<space/>

<wd l="3528" t="11246" r="4277" b="11386">messages</wd>

<space/>

<wd l="4570" t="11203" r="5179" b="11347">without</wd>

<space/>

<wd l="5458" t="11246" r="5779" b="11386">pre-</wd>

</ln>

<ln l="1651" t="11434" r="5827" b="11616" baseLine="11568">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="11434" r="2779" b="11616">categorization</wd>

<space/>

<wd l="2870" t="11477" r="3139" b="11578">nor</wd>

<space/>

<wd l="3235" t="11434" r="4186" b="11616">supervision.</wd>

<space/>

<wd l="4291" t="11438" r="4450" b="11573">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4536" t="11434" r="5539" b="11616">Proceedings</wd>

<space/>

<wd l="5635" t="11434" r="5827" b="11616">of</wd>

<space/>

</run>

</ln>

<ln l="1651" t="11664" r="5789" b="11846" baseLine="11798" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="11664" r="1886" b="11808">the</wd>

<space/>

<wd l="2002" t="11664" r="2352" b="11808">49th</wd>

<space/>

<wd l="2453" t="11664" r="3043" b="11808">Annual</wd>

<space/>

<wd l="3134" t="11669" r="3802" b="11846">Meeting</wd>

<space/>

<wd l="3907" t="11664" r="4099" b="11846">of</wd>

<space/>

<wd l="4166" t="11664" r="4402" b="11808">the</wd>

<space/>

<wd l="4502" t="11664" r="5438" b="11808">Association</wd>

<space/>

<wd l="5515" t="11664" r="5789" b="11846">for</wd>

<space/>

</ln>

<ln l="1656" t="11894" r="5779" b="12077" baseLine="12034">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="11894" r="2856" b="12077">Computational</wd>

<space/>

<wd l="2918" t="11899" r="3802" b="12077">Linguistics</wd>

<space/>

<wd l="3893" t="11894" r="4306" b="12077">(ACL</wd>

<space/>

</run>

<wd l="4392" t="11894" r="4901" b="12077"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2011)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4982" t="11938" r="5434" b="12077">pages</wd>

<space/>

<wd l="5520" t="11894" r="5779" b="12038">71-</wd>

<space/>

</run>

</ln>

<ln l="1651" t="12125" r="3163" b="12298" baseLine="12259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="12125" r="1891" b="12298">76,</wd>

<space/>

<wd l="1949" t="12125" r="2669" b="12298">Portland,</wd>

<space/>

<wd l="2726" t="12125" r="3163" b="12269">USA.</wd>

</ln>

</para>

<para l="1421" t="12475" r="5794" b="13771" alignment="justified" li="216" spaceBefore="117" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1421" t="12475" r="5784" b="12658" baseLine="12610" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="12475" r="1670" b="12619">Fei</wd>

<space/>

<wd l="1786" t="12475" r="2107" b="12648">Liu,</wd>

<space/>

<wd l="2227" t="12475" r="2832" b="12658">Fuliang</wd>

<space/>

<wd l="2947" t="12480" r="3470" b="12658">Weng,</wd>

<space/>

<wd l="3595" t="12475" r="3878" b="12619">and</wd>

<space/>

<wd l="3994" t="12475" r="4373" b="12619">Xiao</wd>

<space/>

<wd l="4493" t="12475" r="4954" b="12658">Jiang.</wd>

<space/>

<wd l="5078" t="12475" r="5515" b="12619">2012.</wd>

<space/>

<wd l="5640" t="12475" r="5784" b="12614">A</wd>

<space/>

</ln>

<ln l="1642" t="12706" r="5779" b="12888" baseLine="12840" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="12706" r="2890" b="12888">broad-coverage</wd>

<space/>

<wd l="3024" t="12706" r="4133" b="12850">normalization</wd>

<space/>

<wd l="4272" t="12725" r="4824" b="12888">system</wd>

<space/>

<wd l="4958" t="12706" r="5189" b="12850">for</wd>

<space/>

<wd l="5328" t="12706" r="5779" b="12850">social</wd>

<space/>

</ln>

<ln l="1646" t="12936" r="5794" b="13118" baseLine="13070">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1646" t="12936" r="2136" b="13080">media</wd>

<space/>

<wd l="2194" t="12936" r="2947" b="13118">language.</wd>

<space/>

<wd l="3019" t="12941" r="3182" b="13075">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3230" t="12936" r="4238" b="13118">Proceedings</wd>

<space/>

<wd l="4296" t="12936" r="4488" b="13118">of</wd>

<space/>

<wd l="4507" t="12936" r="4742" b="13080">the</wd>

<space/>

<wd l="4805" t="12936" r="5150" b="13080">50th</wd>

<space/>

<wd l="5203" t="12936" r="5794" b="13080">Annual</wd>

<space/>

</run>

</ln>

<ln l="1637" t="13166" r="5784" b="13349" baseLine="13301" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1637" t="13171" r="2309" b="13349">Meeting</wd>

<space/>

<wd l="2371" t="13166" r="2563" b="13349">of</wd>

<space/>

<wd l="2592" t="13166" r="2827" b="13310">the</wd>

<space/>

<wd l="2885" t="13166" r="3821" b="13310">Association</wd>

<space/>

<wd l="3854" t="13166" r="4128" b="13349">for</wd>

<space/>

<wd l="4200" t="13166" r="5400" b="13349">Computational</wd>

<space/>

<wd l="5448" t="13171" r="5784" b="13310">Lin-</wd>

</ln>

<ln l="1637" t="13397" r="5774" b="13579" baseLine="13531">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1637" t="13406" r="2256" b="13579">guistics</wd>

<space/>

<wd l="2323" t="13397" r="2741" b="13579">(ACL</wd>

<space/>

</run>

<wd l="2803" t="13397" r="3317" b="13579"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2012)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3374" t="13440" r="3830" b="13579">pages</wd>

<space/>

<wd l="3912" t="13397" r="4805" b="13570">1035-1044,</wd>

<space/>

<wd l="4867" t="13397" r="5194" b="13579">Jeju</wd>

<space/>

<wd l="5251" t="13397" r="5774" b="13570">Island,</wd>

<space/>

</run>

</ln>

<ln l="1646" t="13632" r="2174" b="13771" baseLine="13762" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="13632" r="2174" b="13771">Korea.</wd>

</ln>

</para>

<para l="1421" t="13973" r="5784" b="15067" alignment="justified" li="216" spaceBefore="117" spaceAfter="883" fli="-216" lsp="exactly" lspExact="231" language="en">

<ln l="1421" t="13973" r="5784" b="14155" baseLine="14107" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1421" t="13973" r="1613" b="14112">Yi</wd>

<space/>

<wd l="1723" t="13978" r="2155" b="14155">Yang</wd>

<space/>

<wd l="2266" t="13973" r="2554" b="14117">and</wd>

<space/>

<wd l="2659" t="13973" r="3110" b="14117">Jacob</wd>

<space/>

<wd l="3221" t="13973" r="4080" b="14117">Eisenstein.</wd>

<space/>

<wd l="4200" t="13973" r="4642" b="14117">2013.</wd>

<space/>

<wd l="4757" t="13973" r="4901" b="14112">A</wd>

<space/>

<wd l="5011" t="13973" r="5784" b="14155">log-linear</wd>

<space/>

</ln>

<ln l="1646" t="14203" r="5779" b="14386" baseLine="14342">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1646" t="14203" r="2141" b="14347">model</wd>

<space/>

<wd l="2213" t="14203" r="2443" b="14347">for</wd>

<space/>

<wd l="2501" t="14203" r="3552" b="14386">unsupervised</wd>

<space/>

<wd l="3614" t="14222" r="3912" b="14347">text</wd>

<space/>

<wd l="3974" t="14203" r="5122" b="14347">normalization.</wd>

<space/>

<wd l="5198" t="14208" r="5357" b="14342">In</wd>

<space/>

</run>

<wd l="5414" t="14208" r="5779" b="14347" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Pro-</wd>

</ln>

<ln l="1651" t="14434" r="5779" b="14616" baseLine="14573" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="14434" r="2347" b="14616">ceedings</wd>

<space/>

<wd l="2438" t="14434" r="2630" b="14616">of</wd>

<space/>

<wd l="2688" t="14434" r="3595" b="14616">Conference</wd>

<space/>

<wd l="3691" t="14482" r="3883" b="14578">on</wd>

<space/>

<wd l="3965" t="14434" r="4771" b="14616">Empirical</wd>

<space/>

<wd l="4843" t="14434" r="5544" b="14578">Methods</wd>

<space/>

<wd l="5635" t="14443" r="5779" b="14578">in</wd>

<space/>

</ln>

<ln l="1637" t="14659" r="5779" b="14846" baseLine="14798">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1637" t="14669" r="2208" b="14808">Natura</wd>

<space/>

<wd l="2270" t="14669" r="3077" b="14846">Language</wd>

<space/>

<wd l="3139" t="14669" r="4037" b="14846">Processing</wd>

<space/>

</run>

<wd l="4104" t="14664" r="4925" b="14846"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(EMNLP)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4992" t="14707" r="5448" b="14846">pages</wd>

<space/>

<wd l="5520" t="14664" r="5779" b="14808">61-</wd>

<space/>

</run>

</ln>

<ln l="1651" t="14894" r="3029" b="15067" baseLine="15034" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="14894" r="1891" b="15067">72,</wd>

<space/>

<wd l="1958" t="14894" r="2534" b="15067">Seattle,</wd>

<space/>

<wd l="2592" t="14894" r="3029" b="15038">USA.</wd>

</ln>

</para>

</column>

</section>

<dd l="5841" t="15751" r="6161" b="15980">

<para l="5841" t="15787" r="6128" b="15946" alignment="left" lsp="exactly" lspExact="218" language="en">

<ln l="5875" t="15787" r="6062" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="900" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="4">

<wd l="5875" t="15792" r="6062" b="15946">81</wd>

</ln>

</para>

</dd>

</body>

</page>

</document>

