<?xml version="1.0" encoding="UTF-16"?>

<!--XML document generated using OCR technology from Nuance Communications, Inc.-->

<document xmlns="http://www.scansoft.com/omnipage/xml/ssdoc-schema3.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4309.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1361" marginTop="1360" marginRight="1227" marginBottom="358" offsetX="-22" offsetY="-18" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1361" t="1360" r="10682" b="4092">

<column l="1361" t="1360" r="10682" b="4092">

<para l="1608" t="1435" r="10344" b="1963" alignment="centered" spaceBefore="34" lsp="exactly" lspExact="317" language="en">

<ln l="1608" t="1435" r="10344" b="1699" baseLine="1632" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1608" t="1435" r="2534" b="1642">Lattice:</wd>

<space/>

<wd l="2645" t="1440" r="3235" b="1642">Data</wd>

<space/>

<wd l="3307" t="1435" r="4694" b="1699">Adaptation</wd>

<space/>

<wd l="4766" t="1435" r="5122" b="1642">for</wd>

<space/>

<wd l="5198" t="1440" r="6067" b="1646">Named</wd>

<space/>

<wd l="6144" t="1435" r="6907" b="1699">Entity</wd>

<space/>

<wd l="6989" t="1435" r="8448" b="1699">Recognition</wd>

<space/>

<wd l="8525" t="1498" r="8822" b="1642">on</wd>

<space/>

<wd l="8899" t="1440" r="9730" b="1642">Tweets</wd>

<space/>

<wd l="9811" t="1435" r="10344" b="1642">with
</wd>

</ln>

<ln l="4781" t="1752" r="7162" b="1963" baseLine="1949" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="4781" t="1752" r="6499" b="1958">Features-Rich</wd>

<space/>

<wd l="6590" t="1752" r="7162" b="1963">CRF</wd>

</ln>

</para>

<para l="2429" t="2419" r="9917" b="2592" alignment="left" li="1080" spaceBefore="334" lsp="exactly" lspExact="274" language="en">

<tabs position="2429"/>

<tabs alignment="left" position="2592" leaderChar=" "/>

<ln l="2429" t="2419" r="9917" b="2592" baseLine="2574" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2429" t="2419" r="2894" b="2592">Tian</wd>

<space/>

<wd l="2962" t="2419" r="3547" b="2592">TIAN</wd>

<tab position="3547"/>

<wd l="5160" t="2424" r="5827" b="2592">Marco</wd>

<space/>

<wd l="5894" t="2419" r="6787" b="2592">Dinarelli</wd>

<tab position="6787"/>

<wd l="8016" t="2424" r="8794" b="2592">Isabelle</wd>

<space/>

<wd l="8856" t="2424" r="9917" b="2587">TELLIER</wd>

</ln>

</para>

<para l="1680" t="2698" r="10267" b="2870" alignment="centered" spaceBefore="14" lsp="exactly" lspExact="274" language="en">

<ln l="1680" t="2698" r="10267" b="2870" baseLine="2862" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">

<wd l="1680" t="2702" r="2342" b="2870">Lattice</wd>

<space/>

<wd l="2400" t="2702" r="2477" b="2870">/</wd>

<space/>

<wd l="2554" t="2702" r="2626" b="2866">1</wd>

<space/>

<wd l="2707" t="2702" r="3504" b="2870">Maurice</wd>

<space/>

<wd l="3566" t="2702" r="4291" b="2870">Arnoux</wd>

<space/>

<wd l="4666" t="2702" r="5333" b="2870">Lattice</wd>

<space/>

<wd l="5386" t="2702" r="5462" b="2870">/</wd>

<space/>

<wd l="5539" t="2702" r="5611" b="2866">1</wd>

<space/>

<wd l="5698" t="2702" r="6494" b="2870">Maurice</wd>

<space/>

<wd l="6552" t="2702" r="7282" b="2870">Arnoux</wd>

<space/>

<wd l="7656" t="2702" r="8318" b="2870">Lattice</wd>

<space/>

<wd l="8376" t="2702" r="8453" b="2870">/</wd>

<space/>

<wd l="8530" t="2702" r="8602" b="2866">1</wd>

<space/>

<wd l="8683" t="2702" r="9480" b="2870">Maurice</wd>

<space/>

<wd l="9542" t="2702" r="10267" b="2870">Arnoux</wd>

</ln>

</para>

<para l="1906" t="2981" r="10046" b="3154" alignment="left" li="504" lsp="exactly" lspExact="274" language="en">

<tabs position="1906"/>

<tabs alignment="left" position="3154" leaderChar=" "/>

<ln l="1906" t="2981" r="10046" b="3154" baseLine="3137" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1906" t="2981" r="2491" b="3154">92120</wd>

<space/>

<wd l="2558" t="2981" r="4075" b="3149">MONTROUGE</wd>

<tab position="4075"/>

<wd l="4891" t="2981" r="5482" b="3154">92120</wd>

<space/>

<wd l="5544" t="2981" r="7061" b="3149">MONTROUGE</wd>

<tab position="7061"/>

<wd l="7882" t="2981" r="8467" b="3154">92120</wd>

<space/>

<wd l="8534" t="2981" r="10046" b="3149">MONTROUGE</wd>

</ln>

</para>

<para l="2078" t="3307" r="10622" b="3456" alignment="left" li="720" spaceBefore="82" spaceAfter="633" lsp="exactly" lspExact="176" language="en">

<tabs position="2078"/>

<ln l="2078" t="3307" r="10622" b="3456" baseLine="3419" underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">

<wd l="2078" t="3307" r="3898" b="3437">tian.tian@live.cn</wd>

<tab position="3898"/>

<wd l="4790" t="3307" r="7152" b="3437">marco.dinarelli@ens.fr</wd>

<space/>

<wd l="7310" t="3307" r="10622" b="3456">isabelle.tellier@univ-paris3.fr</wd>

</ln>

</para>

</column>

</section>

<section l="1361" t="4092" r="10682" b="15336">

<column l="1361" t="4092" r="5901" b="15336">

<para l="3178" t="4142" r="4070" b="4315" alignment="centered" li="72" spaceBefore="3" lsp="exactly" lspExact="274" language="en">

<ln l="3178" t="4142" r="4070" b="4315" baseLine="4306" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3178" t="4142" r="4070" b="4315">Abstract</wd>

</ln>

</para>

<para l="1781" t="4704" r="5467" b="8112" alignment="justified" li="360" ri="432" spaceBefore="268" lsp="exactly" lspExact="271" language="en">

<ln l="1781" t="4704" r="5453" b="4862" baseLine="4853" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="4704" r="2160" b="4862">This</wd>

<space/>

<wd l="2237" t="4704" r="2774" b="4862">article</wd>

<space/>

<wd l="2842" t="4704" r="3643" b="4862">describes</wd>

<space/>

<wd l="3720" t="4757" r="4008" b="4862">our</wd>

<space/>

<wd l="4070" t="4709" r="4478" b="4862">CRF</wd>

<space/>

<wd l="4541" t="4704" r="5126" b="4862">named</wd>

<space/>

<wd l="5194" t="4757" r="5453" b="4862">en-</wd>

</ln>

<ln l="1781" t="4973" r="5453" b="5174" baseLine="5122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="4973" r="2069" b="5174">tity</wd>

<space/>

<wd l="2126" t="4997" r="2899" b="5131">extractor</wd>

<space/>

<wd l="2947" t="4973" r="3202" b="5131">for</wd>

<space/>

<wd l="3250" t="4973" r="3878" b="5131">Twitter</wd>

<space/>

<wd l="3931" t="4973" r="4334" b="5131">data.</wd>

<space/>

<wd l="4411" t="4978" r="4694" b="5131">We</wd>

<space/>

<wd l="4752" t="4973" r="5088" b="5131">first</wd>

<space/>

<wd l="5141" t="4973" r="5453" b="5131">dis-</wd>

</ln>

<ln l="1786" t="5242" r="5462" b="5443" baseLine="5395" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="5294" r="2146" b="5400">cuss</wd>

<space/>

<wd l="2218" t="5294" r="2669" b="5400">some</wd>

<space/>

<wd l="2731" t="5242" r="3744" b="5443">specificities</wd>

<space/>

<wd l="3811" t="5242" r="3998" b="5400">of</wd>

<space/>

<wd l="4042" t="5242" r="4306" b="5400">the</wd>

<space/>

<wd l="4358" t="5242" r="4752" b="5429">task,</wd>

<space/>

<wd l="4819" t="5242" r="5208" b="5400">with</wd>

<space/>

<wd l="5266" t="5294" r="5462" b="5400">an</wd>

<space/>

</ln>

<ln l="1786" t="5515" r="5467" b="5717" baseLine="5664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="5515" r="2515" b="5717">example</wd>

<space/>

<wd l="2587" t="5515" r="3096" b="5674">found</wd>

<space/>

<wd l="3163" t="5515" r="3336" b="5669">in</wd>

<space/>

<wd l="3403" t="5515" r="3667" b="5674">the</wd>

<space/>

<wd l="3739" t="5515" r="4416" b="5717">training</wd>

<space/>

<wd l="4493" t="5515" r="4896" b="5674">data.</wd>

<space/>

<wd l="5016" t="5515" r="5467" b="5674">Then</wd>

<space/>

</ln>

<ln l="1781" t="5784" r="5453" b="5986" baseLine="5938" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="5837" r="2035" b="5942">we</wd>

<space/>

<wd l="2102" t="5808" r="2736" b="5986">present</wd>

<space/>

<wd l="2803" t="5784" r="3168" b="5942">how</wd>

<space/>

<wd l="3240" t="5837" r="3494" b="5942">we</wd>

<space/>

<wd l="3562" t="5784" r="3960" b="5942">built</wd>

<space/>

<wd l="4032" t="5837" r="4320" b="5942">our</wd>

<space/>

<wd l="4392" t="5789" r="4795" b="5942">CRF</wd>

<space/>

<wd l="4867" t="5784" r="5453" b="5971">model,</wd>

<space/>

</ln>

<ln l="1786" t="6058" r="5453" b="6259" baseLine="6206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="6058" r="2650" b="6259">especially</wd>

<space/>

<wd l="2726" t="6058" r="2995" b="6216">the</wd>

<space/>

<wd l="3067" t="6110" r="3427" b="6259">way</wd>

<space/>

<wd l="3504" t="6058" r="4186" b="6216">features</wd>

<space/>

<wd l="4272" t="6110" r="4694" b="6216">were</wd>

<space/>

<wd l="4771" t="6058" r="5453" b="6216">defined.</wd>

<space/>

</ln>

<ln l="1781" t="6326" r="5462" b="6528" baseLine="6480" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="6326" r="2117" b="6485">The</wd>

<space/>

<wd l="2198" t="6326" r="2760" b="6485">results</wd>

<space/>

<wd l="2851" t="6326" r="3043" b="6485">of</wd>

<space/>

<wd l="3110" t="6326" r="3557" b="6485">these</wd>

<space/>

<wd l="3643" t="6326" r="3979" b="6485">first</wd>

<space/>

<wd l="4061" t="6326" r="5112" b="6528">experiments</wd>

<space/>

<wd l="5203" t="6379" r="5462" b="6485">are</wd>

<space/>

</ln>

<ln l="1786" t="6600" r="5467" b="6802" baseLine="6749" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="6600" r="2299" b="6802">given.</wd>

<space/>

<wd l="2544" t="6605" r="2827" b="6758">We</wd>

<space/>

<wd l="2947" t="6600" r="3288" b="6758">also</wd>

<space/>

<wd l="3403" t="6600" r="3912" b="6758">tested</wd>

<space/>

<wd l="4027" t="6653" r="4315" b="6758">our</wd>

<space/>

<wd l="4421" t="6600" r="4963" b="6758">model</wd>

<space/>

<wd l="5078" t="6600" r="5467" b="6758">with</wd>

<space/>

</ln>

<ln l="1786" t="6869" r="5453" b="7070" baseLine="7022" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="6869" r="2088" b="7027">dev</wd>

<space/>

<wd l="2174" t="6869" r="2592" b="7027">2015</wd>

<space/>

<wd l="2702" t="6869" r="3067" b="7027">data</wd>

<space/>

<wd l="3163" t="6869" r="3475" b="7027">and</wd>

<space/>

<wd l="3566" t="6922" r="3821" b="7027">we</wd>

<space/>

<wd l="3922" t="6869" r="4646" b="7027">describe</wd>

<space/>

<wd l="4742" t="6869" r="5006" b="7027">the</wd>

<space/>

<wd l="5102" t="6922" r="5453" b="7070">pro-</wd>

</ln>

<ln l="1786" t="7142" r="5453" b="7344" baseLine="7291" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="7142" r="2362" b="7301">cedure</wd>

<space/>

<wd l="2434" t="7195" r="2683" b="7301">we</wd>

<space/>

<wd l="2755" t="7142" r="3158" b="7301">have</wd>

<space/>

<wd l="3230" t="7142" r="3629" b="7301">used</wd>

<space/>

<wd l="3701" t="7166" r="3864" b="7301">to</wd>

<space/>

<wd l="3941" t="7142" r="4411" b="7344">adapt</wd>

<space/>

<wd l="4483" t="7142" r="4934" b="7301">older</wd>

<space/>

<wd l="4997" t="7142" r="5453" b="7301">Twit-</wd>

</ln>

<ln l="1781" t="7411" r="5453" b="7570" baseLine="7560" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="7435" r="2016" b="7570">ter</wd>

<space/>

<wd l="2078" t="7411" r="2443" b="7570">data</wd>

<space/>

<wd l="2501" t="7435" r="2669" b="7570">to</wd>

<space/>

<wd l="2736" t="7411" r="3000" b="7570">the</wd>

<space/>

<wd l="3067" t="7411" r="3432" b="7570">data</wd>

<space/>

<wd l="3494" t="7411" r="4267" b="7570">available</wd>

<space/>

<wd l="4334" t="7411" r="4589" b="7570">for</wd>

<space/>

<wd l="4651" t="7411" r="4958" b="7570">this</wd>

<space/>

<wd l="5035" t="7411" r="5453" b="7570">2015</wd>

<space/>

</ln>

<ln l="1790" t="7685" r="5467" b="7843" baseLine="7834" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1790" t="7685" r="2352" b="7843">shared</wd>

<space/>

<wd l="2419" t="7685" r="2813" b="7843">task.</wd>

<space/>

<wd l="2947" t="7690" r="3288" b="7843">Our</wd>

<space/>

<wd l="3355" t="7685" r="3739" b="7843">final</wd>

<space/>

<wd l="3811" t="7685" r="4373" b="7843">results</wd>

<space/>

<wd l="4450" t="7685" r="4709" b="7843">for</wd>

<space/>

<wd l="4776" t="7685" r="5040" b="7843">the</wd>

<space/>

<wd l="5112" t="7685" r="5467" b="7843">task</wd>

<space/>

</ln>

<ln l="1786" t="7954" r="2981" b="8112" baseLine="8102" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="8006" r="2045" b="8112">are</wd>

<space/>

<wd l="2107" t="7954" r="2981" b="8112">discussed.</wd>

</ln>

</para>

<para l="1454" t="8491" r="3091" b="8664" alignment="left" li="72" spaceBefore="288" lsp="exactly" lspExact="274" language="en">

<ln l="1454" t="8491" r="3091" b="8664" baseLine="8659" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="1454" t="8491" r="1550" b="8659">1</wd>

<space/>

<wd l="1805" t="8491" r="3091" b="8664">Introduction</wd>

</ln>

</para>

<para l="1440" t="8966" r="5818" b="12917" alignment="justified" li="72" ri="72" spaceBefore="183" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="8966" r="5818" b="9168" baseLine="9115" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8971" r="1622" b="9120">In</wd>

<space/>

<wd l="1685" t="8966" r="1992" b="9125">this</wd>

<space/>

<wd l="2069" t="8966" r="2630" b="9125">shared</wd>

<space/>

<wd l="2688" t="8966" r="3086" b="9154">task,</wd>

<space/>

<wd l="3158" t="9019" r="3413" b="9125">we</wd>

<space/>

<wd l="3475" t="8966" r="3878" b="9125">have</wd>

<space/>

<wd l="3941" t="8990" r="4104" b="9125">to</wd>

<space/>

<wd l="4176" t="8990" r="4762" b="9125">extract</wd>

<space/>

<wd l="4848" t="8971" r="5035" b="9125">10</wd>

<space/>

<wd l="5102" t="8990" r="5554" b="9168">types</wd>

<space/>

<wd l="5630" t="8966" r="5818" b="9125">of</wd>

<space/>

</ln>

<ln l="1450" t="9235" r="5803" b="9437" baseLine="9389" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="9240" r="1699" b="9432">(or</wd>

<space/>

<wd l="1762" t="9259" r="2040" b="9394">not</wd>

<space/>

<wd l="2107" t="9235" r="2654" b="9437">typed)</wd>

<space/>

<wd l="2731" t="9235" r="3312" b="9394">named</wd>

<space/>

<wd l="3379" t="9235" r="3998" b="9394">entities</wd>

<space/>

<wd l="4075" t="9235" r="4243" b="9389">in</wd>

<space/>

<wd l="4310" t="9235" r="4939" b="9394">Twitter</wd>

<space/>

<wd l="5006" t="9235" r="5405" b="9394">data.</wd>

<space/>

<wd l="5520" t="9240" r="5803" b="9394">We</wd>

<space/>

</ln>

<ln l="1440" t="9509" r="5808" b="9710" baseLine="9658" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9509" r="1843" b="9667">have</wd>

<space/>

<wd l="1934" t="9533" r="2093" b="9667">at</wd>

<space/>

<wd l="2179" t="9562" r="2472" b="9667">our</wd>

<space/>

<wd l="2558" t="9509" r="3264" b="9710">disposal</wd>

<space/>

<wd l="3355" t="9533" r="3677" b="9667">two</wd>

<space/>

<wd l="3768" t="9509" r="4459" b="9667">labelled</wd>

<space/>

<wd l="4550" t="9562" r="5256" b="9710">corpora:</wd>

<space/>

<wd l="5405" t="9509" r="5808" b="9667">train</wd>

<space/>

</ln>

<ln l="1445" t="9778" r="5794" b="9979" baseLine="9931" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="9778" r="1757" b="9936">and</wd>

<space/>

<wd l="1838" t="9778" r="2170" b="9936">dev.</wd>

<space/>

<wd l="2318" t="9778" r="2659" b="9936">The</wd>

<space/>

<wd l="2741" t="9778" r="3077" b="9936">first</wd>

<space/>

<wd l="3163" t="9778" r="3773" b="9936">section</wd>

<space/>

<wd l="3859" t="9778" r="4382" b="9936">shows</wd>

<space/>

<wd l="4478" t="9830" r="4925" b="9936">some</wd>

<space/>

<wd l="5016" t="9778" r="5794" b="9979">specifici-</wd>

</ln>

<ln l="1440" t="10051" r="5803" b="10253" baseLine="10200" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10051" r="1733" b="10210">ties</wd>

<space/>

<wd l="1814" t="10051" r="2006" b="10210">of</wd>

<space/>

<wd l="2059" t="10051" r="2323" b="10210">the</wd>

<space/>

<wd l="2395" t="10051" r="2798" b="10238">data,</wd>

<space/>

<wd l="2880" t="10051" r="3307" b="10210">from</wd>

<space/>

<wd l="3374" t="10104" r="3571" b="10210">an</wd>

<space/>

<wd l="3648" t="10051" r="4378" b="10253">example</wd>

<space/>

<wd l="4445" t="10051" r="4570" b="10210">it</wd>

<space/>

<wd l="4637" t="10051" r="5405" b="10210">contains.</wd>

<space/>

<wd l="5520" t="10056" r="5803" b="10210">We</wd>

<space/>

</ln>

<ln l="1440" t="10320" r="5803" b="10522" baseLine="10469" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10320" r="1819" b="10478">then</wd>

<space/>

<wd l="1872" t="10344" r="2669" b="10478">construct</wd>

<space/>

<wd l="2726" t="10373" r="2822" b="10478">a</wd>

<space/>

<wd l="2875" t="10325" r="3278" b="10478">CRF</wd>

<space/>

<wd l="3331" t="10320" r="3874" b="10478">model</wd>

<space/>

<wd l="3931" t="10320" r="4190" b="10478">for</wd>

<space/>

<wd l="4238" t="10320" r="4502" b="10478">the</wd>

<space/>

<wd l="4555" t="10320" r="4949" b="10507">task,</wd>

<space/>

<wd l="5016" t="10320" r="5482" b="10522">using</wd>

<space/>

<wd l="5539" t="10320" r="5803" b="10478">the</wd>

<space/>

</ln>

<ln l="1450" t="10594" r="5803" b="10795" baseLine="10742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="10594" r="2189" b="10752">software</wd>

<space/>

<wd l="2280" t="10594" r="2899" b="10795">Wapiti.</wd>

<space/>

<wd l="3086" t="10598" r="3422" b="10752">Our</wd>

<space/>

<wd l="3509" t="10594" r="4190" b="10752">features</wd>

<space/>

<wd l="4291" t="10594" r="4546" b="10752">for</wd>

<space/>

<wd l="4632" t="10594" r="4939" b="10752">this</wd>

<space/>

<wd l="5040" t="10598" r="5448" b="10752">CRF</wd>

<space/>

<wd l="5544" t="10646" r="5803" b="10752">are</wd>

<space/>

</ln>

<ln l="1445" t="10862" r="5803" b="11064" baseLine="11011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="10862" r="2050" b="11021">chosen</wd>

<space/>

<wd l="2126" t="10862" r="2981" b="11064">according</wd>

<space/>

<wd l="3062" t="10886" r="3230" b="11021">to</wd>

<space/>

<wd l="3312" t="10862" r="3576" b="11021">the</wd>

<space/>

<wd l="3662" t="10862" r="4992" b="11050">state-of-the-art,</wd>

<space/>

<wd l="5088" t="10862" r="5458" b="11064">they</wd>

<space/>

<wd l="5544" t="10915" r="5803" b="11021">are</wd>

<space/>

</ln>

<ln l="1445" t="11131" r="5808" b="11290" baseLine="11285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="11131" r="2275" b="11290">described</wd>

<space/>

<wd l="2338" t="11131" r="2506" b="11285">in</wd>

<space/>

<wd l="2568" t="11131" r="2832" b="11290">the</wd>

<space/>

<wd l="2904" t="11131" r="3499" b="11290">second</wd>

<space/>

<wd l="3566" t="11131" r="4219" b="11290">section.</wd>

<space/>

<wd l="4315" t="11131" r="4656" b="11290">The</wd>

<space/>

<wd l="4714" t="11131" r="5126" b="11290">third</wd>

<space/>

<wd l="5198" t="11131" r="5808" b="11290">section</wd>

<space/>

</ln>

<ln l="1440" t="11405" r="5803" b="11606" baseLine="11554" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11405" r="2088" b="11563">focuses</wd>

<space/>

<wd l="2179" t="11458" r="2395" b="11563">on</wd>

<space/>

<wd l="2482" t="11458" r="2933" b="11563">some</wd>

<space/>

<wd l="3014" t="11405" r="4066" b="11606">experiments</wd>

<space/>

<wd l="4157" t="11405" r="4546" b="11563">with</wd>

<space/>

<wd l="4622" t="11405" r="5021" b="11563">train</wd>

<space/>

<wd l="5107" t="11405" r="5419" b="11563">and</wd>

<space/>

<wd l="5501" t="11405" r="5803" b="11563">dev</wd>

<space/>

</ln>

<ln l="1445" t="11674" r="5808" b="11875" baseLine="11827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="11674" r="1757" b="11832">and</wd>

<space/>

<wd l="1824" t="11674" r="2261" b="11875">gives</wd>

<space/>

<wd l="2333" t="11674" r="2597" b="11832">the</wd>

<space/>

<wd l="2664" t="11674" r="3413" b="11832">obtained</wd>

<space/>

<wd l="3475" t="11674" r="4090" b="11832">results.</wd>

<space/>

<wd l="4190" t="11674" r="4526" b="11832">The</wd>

<space/>

<wd l="4594" t="11674" r="5126" b="11832">fourth</wd>

<space/>

<wd l="5198" t="11674" r="5808" b="11832">section</wd>

<space/>

</ln>

<ln l="1440" t="11947" r="5794" b="12149" baseLine="12096" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11947" r="1579" b="12106">is</wd>

<space/>

<wd l="1632" t="11947" r="2117" b="12106">about</wd>

<space/>

<wd l="2160" t="11947" r="2424" b="12106">the</wd>

<space/>

<wd l="2467" t="11947" r="3341" b="12149">procedure</wd>

<space/>

<wd l="3384" t="12000" r="3638" b="12106">we</wd>

<space/>

<wd l="3682" t="11947" r="4085" b="12106">have</wd>

<space/>

<wd l="4133" t="11947" r="4531" b="12106">used</wd>

<space/>

<wd l="4574" t="11971" r="4742" b="12106">to</wd>

<space/>

<wd l="4790" t="11947" r="5232" b="12106">build</wd>

<space/>

<wd l="5280" t="12000" r="5573" b="12106">our</wd>

<space/>

<wd l="5616" t="11947" r="5794" b="12101">fi-</wd>

</ln>

<ln l="1440" t="12216" r="5794" b="12418" baseLine="12370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12216" r="1704" b="12374">nal</wd>

<space/>

<wd l="1766" t="12216" r="2352" b="12403">model,</wd>

<space/>

<wd l="2424" t="12216" r="2640" b="12418">by</wd>

<space/>

<wd l="2707" t="12216" r="3461" b="12418">applying</wd>

<space/>

<wd l="3528" t="12269" r="3624" b="12374">a</wd>

<space/>

<wd l="3682" t="12216" r="4334" b="12374">domain</wd>

<space/>

<wd l="4397" t="12216" r="5299" b="12418">adaptation</wd>

<space/>

<wd l="5366" t="12240" r="5794" b="12374">strat-</wd>

</ln>

<ln l="1445" t="12490" r="5803" b="12691" baseLine="12638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="12542" r="1781" b="12691">egy.</wd>

<space/>

<wd l="1939" t="12494" r="2122" b="12643">In</wd>

<space/>

<wd l="2203" t="12490" r="2467" b="12648">the</wd>

<space/>

<wd l="2549" t="12490" r="2856" b="12648">last</wd>

<space/>

<wd l="2942" t="12490" r="3595" b="12677">section,</wd>

<space/>

<wd l="3696" t="12542" r="3950" b="12648">we</wd>

<space/>

<wd l="4037" t="12490" r="4651" b="12648">discuss</wd>

<space/>

<wd l="4752" t="12542" r="5203" b="12648">some</wd>

<space/>

<wd l="5285" t="12490" r="5803" b="12648">future</wd>

<space/>

</ln>

<ln l="1440" t="12758" r="3638" b="12917" baseLine="12912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12758" r="1886" b="12917">work</wd>

<space/>

<wd l="1939" t="12758" r="2198" b="12917">for</wd>

<space/>

<wd l="2251" t="12758" r="2558" b="12917">this</wd>

<space/>

<wd l="2630" t="12758" r="3192" b="12917">shared</wd>

<space/>

<wd l="3245" t="12758" r="3638" b="12917">task.</wd>

</ln>

</para>

<para l="1440" t="13277" r="3206" b="13498" alignment="left" li="72" spaceBefore="264" lsp="exactly" lspExact="274" language="en">

<ln l="1440" t="13277" r="3206" b="13498" baseLine="13445" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="1440" t="13277" r="1555" b="13445">2</wd>

<space/>

<wd l="1800" t="13282" r="2290" b="13450">Data</wd>

<space/>

<wd l="2352" t="13277" r="3206" b="13498">Analysis</wd>

</ln>

</para>

<para l="1440" t="13752" r="5808" b="15302" alignment="justified" li="72" ri="72" spaceBefore="183" spaceAfter="19" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="13752" r="5803" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="13752" r="2266" b="13954">Although</wd>

<space/>

<wd l="2318" t="13752" r="2904" b="13910">named</wd>

<space/>

<wd l="2962" t="13752" r="3451" b="13954">entity</wd>

<space/>

<wd l="3509" t="13752" r="4502" b="13954">recognition</wd>

<space/>

<wd l="4555" t="13752" r="4694" b="13910">is</wd>

<space/>

<wd l="4762" t="13805" r="4858" b="13910">a</wd>

<space/>

<wd l="4910" t="13752" r="5803" b="13910">traditional</wd>

<space/>

</ln>

<ln l="1440" t="14021" r="5808" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="14021" r="1795" b="14179">task</wd>

<space/>

<wd l="1867" t="14021" r="2054" b="14179">of</wd>

<space/>

<wd l="2112" t="14021" r="2717" b="14179">natural</wd>

<space/>

<wd l="2789" t="14021" r="3571" b="14222">language</wd>

<space/>

<wd l="3643" t="14021" r="4574" b="14222">processing</wd>

<space/>

<wd l="4656" t="14026" r="5194" b="14218">(NLP)</wd>

<space/>

<wd l="5270" t="14021" r="5808" b="14179">which</wd>

<space/>

</ln>

<ln l="1440" t="14294" r="5794" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="14294" r="1723" b="14453">has</wd>

<space/>

<wd l="1810" t="14294" r="2285" b="14496">given</wd>

<space/>

<wd l="2357" t="14294" r="2674" b="14453">rise</wd>

<space/>

<wd l="2750" t="14318" r="2914" b="14453">to</wd>

<space/>

<wd l="3000" t="14347" r="3096" b="14453">a</wd>

<space/>

<wd l="3168" t="14294" r="3600" b="14496">large</wd>

<space/>

<wd l="3677" t="14294" r="4109" b="14496">body</wd>

<space/>

<wd l="4190" t="14294" r="4382" b="14453">of</wd>

<space/>

<wd l="4445" t="14294" r="4968" b="14453">works</wd>

<space/>

<wd l="5050" t="14294" r="5309" b="14453">for</wd>

<space/>

<wd l="5381" t="14294" r="5794" b="14453">writ-</wd>

</ln>

<ln l="1440" t="14563" r="5808" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="14587" r="1709" b="14722">ten</wd>

<space/>

<wd l="1771" t="14563" r="2443" b="14765">English</wd>

<space/>

<wd l="2515" t="14563" r="3134" b="14760">(Finkel</wd>

<space/>

<wd l="3206" t="14587" r="3360" b="14722">et</wd>

<space/>

<wd l="3432" t="14563" r="3682" b="14750">al.,</wd>

<space/>

<wd l="3768" t="14563" r="4262" b="14760">2005)</wd>

<space/>

<wd l="4344" t="14616" r="4526" b="14722">or</wd>

<space/>

<wd l="4589" t="14616" r="5021" b="14722">news</wd>

<space/>

<wd l="5098" t="14563" r="5563" b="14722">wires</wd>

<space/>

<wd l="5635" t="14563" r="5808" b="14717">in</wd>

<space/>

</ln>

<ln l="1440" t="14837" r="5808" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="14837" r="2050" b="14995">French</wd>

<space/>

<wd l="2098" t="14842" r="2621" b="15034">(Stern</wd>

<space/>

<wd l="2669" t="14837" r="2981" b="14995">and</wd>

<space/>

<wd l="3024" t="14842" r="3562" b="15038">Sagot,</wd>

<space/>

<wd l="3619" t="14842" r="4171" b="15034">2010),</wd>

<space/>

<wd l="4224" t="14837" r="4493" b="14995">the</wd>

<space/>

<wd l="4541" t="14890" r="4982" b="14995">same</wd>

<space/>

<wd l="5026" t="14837" r="5376" b="14995">task</wd>

<space/>

<wd l="5419" t="14837" r="5808" b="14995">with</wd>

<space/>

</ln>

<ln l="1440" t="15106" r="5794" b="15302" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="15106" r="2069" b="15264">Twitter</wd>

<space/>

<wd l="2131" t="15106" r="2496" b="15264">data</wd>

<space/>

<wd l="2554" t="15106" r="3235" b="15264">remains</wd>

<space/>

<wd l="3312" t="15106" r="3994" b="15264">difficult</wd>

<space/>

<wd l="4066" t="15106" r="4632" b="15302">(Ritter</wd>

<space/>

<wd l="4694" t="15130" r="4848" b="15264">et</wd>

<space/>

<wd l="4915" t="15106" r="5165" b="15293">al.,</wd>

<space/>

<wd l="5246" t="15110" r="5794" b="15302">2011).</wd>

</ln>

</para>

</column>

<column l="6142" t="4102" r="10682" b="15336">

<frame l="6152" t="4102" r="10672" b="4459">

<leftBorder type="single" width="10" color="000000"/>

<topBorder type="single" width="10" color="000000"/>

<rightBorder type="single" width="10" color="000000"/>

<bottomBorder type="single" width="10" color="000000"/>

<para l="6336" t="4238" r="10450" b="4406" alignment="left" li="144" spaceBefore="86" spaceAfter="40" lsp="exactly" lspExact="221" language="en">

<ln l="6336" t="4238" r="10450" b="4406" baseLine="4358">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6336" t="4238" r="6778" b="4406">Today</wd>

<space/>

<wd l="6826" t="4277" r="7176" b="4368">wasz</wd>

<space/>

<wd l="7224" t="4243" r="7507" b="4368">Fun</wd>

<space/>

<wd l="7550" t="4277" r="7862" b="4368">cusz</wd>

<space/>

<wd l="7915" t="4277" r="8251" b="4368">anna</wd>

<space/>

<wd l="8299" t="4238" r="8712" b="4368">Came</wd>

<space/>

<wd l="8746" t="4238" r="9029" b="4406">juss</wd>

<space/>

<wd l="9082" t="4238" r="9293" b="4368">for</wd>

<space/>

<wd l="9336" t="4277" r="9552" b="4368">me</wd>

<space/>

</run>

<wd l="9614" t="4238" r="9874" b="4373"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&lt;</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">3:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9941" t="4238" r="10450" b="4368">hahaha</wd>

</run>

</ln>

</para>

</frame>

<para l="6989" t="4680" r="9672" b="4882" alignment="centered" spaceBefore="147" lsp="exactly" lspExact="271" language="en">

<ln l="6989" t="4680" r="9672" b="4882" baseLine="4829" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6989" t="4680" r="7555" b="4882">Figure</wd>

<space/>

<wd l="7637" t="4685" r="7762" b="4838">1:</wd>

<space/>

<wd l="7848" t="4685" r="8117" b="4834">An</wd>

<space/>

<wd l="8174" t="4680" r="8904" b="4882">example</wd>

<space/>

<wd l="8966" t="4680" r="9154" b="4838">of</wd>

<space/>

<wd l="9197" t="4704" r="9672" b="4838">tweet</wd>

</ln>

</para>

<para l="6144" t="5448" r="10507" b="5923" alignment="justified" ri="144" spaceBefore="499" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="5448" r="10507" b="5650" baseLine="5602" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5448" r="6523" b="5606">This</wd>

<space/>

<wd l="6590" t="5448" r="6725" b="5606">is</wd>

<space/>

<wd l="6792" t="5472" r="7070" b="5606">not</wd>

<space/>

<wd l="7128" t="5448" r="7512" b="5650">only</wd>

<space/>

<wd l="7570" t="5448" r="8261" b="5606">because</wd>

<space/>

<wd l="8318" t="5448" r="8510" b="5606">of</wd>

<space/>

<wd l="8554" t="5448" r="8818" b="5606">the</wd>

<space/>

<wd l="8875" t="5448" r="9226" b="5606">task</wd>

<space/>

<wd l="9283" t="5448" r="9763" b="5635">itself,</wd>

<space/>

<wd l="9830" t="5448" r="10104" b="5606">but</wd>

<space/>

<wd l="10166" t="5448" r="10507" b="5606">also</wd>

<space/>

</ln>

<ln l="6144" t="5722" r="9456" b="5923" baseLine="5870" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5722" r="6835" b="5880">because</wd>

<space/>

<wd l="6898" t="5722" r="7085" b="5880">of</wd>

<space/>

<wd l="7128" t="5722" r="7392" b="5880">the</wd>

<space/>

<wd l="7450" t="5774" r="7805" b="5923">way</wd>

<space/>

<wd l="7862" t="5746" r="8414" b="5880">tweets</wd>

<space/>

<wd l="8482" t="5774" r="8741" b="5880">are</wd>

<space/>

<wd l="8798" t="5722" r="9456" b="5880">written.</wd>

</ln>

</para>

<para l="6144" t="5995" r="10512" b="7008" alignment="justified" ri="144" spaceBefore="6" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="5995" r="10502" b="6197" baseLine="6144" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="5995" r="6931" b="6197">Figure</wd>

<space/>

<wd l="7027" t="6000" r="7090" b="6149">1</wd>

<space/>

<wd l="7190" t="5995" r="7714" b="6154">shows</wd>

<space/>

<wd l="7795" t="6048" r="7992" b="6154">an</wd>

<space/>

<wd l="8069" t="5995" r="8798" b="6197">example</wd>

<space/>

<wd l="8875" t="5995" r="9062" b="6154">of</wd>

<space/>

<wd l="9120" t="6019" r="9634" b="6154">tweet.</wd>

<space/>

<wd l="9758" t="5995" r="10094" b="6154">The</wd>

<space/>

<wd l="10171" t="6048" r="10502" b="6154">cor-</wd>

</ln>

<ln l="6144" t="6264" r="10512" b="6466" baseLine="6418" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6288" r="6475" b="6422">rect</wd>

<space/>

<wd l="6562" t="6288" r="7301" b="6422">sentence</wd>

<space/>

<wd l="7387" t="6264" r="7963" b="6422">should</wd>

<space/>

<wd l="8040" t="6264" r="8290" b="6422">be:</wd>

<space/>

<wd l="8419" t="6264" r="8957" b="6466">Today</wd>

<space/>

<wd l="9038" t="6317" r="9365" b="6422">was</wd>

<space/>

<wd l="9451" t="6264" r="9744" b="6422">fun</wd>

<space/>

<wd l="9821" t="6264" r="10512" b="6422">because</wd>

<space/>

</ln>

<ln l="6144" t="6538" r="10512" b="6739" baseLine="6686">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="6542" r="6624" b="6696">Anna</wd>

<space/>

<wd l="6686" t="6590" r="7142" b="6696">came</wd>

<space/>

<wd l="7186" t="6538" r="7522" b="6739">just</wd>

<space/>

<wd l="7584" t="6538" r="7843" b="6696">for</wd>

<space/>

<wd l="7901" t="6590" r="8165" b="6696">me</wd>

<space/>

</run>

<wd l="8246" t="6542" r="8554" b="6701"><run underlined="none" subsuperscript="none" fontSize="1350" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&lt;</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">3:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8654" t="6538" r="9317" b="6696">hahaha.</wd>

<space/>

<wd l="9422" t="6542" r="9706" b="6696">We</wd>

<space/>

<wd l="9773" t="6590" r="10070" b="6696">can</wd>

<space/>

<wd l="10133" t="6562" r="10512" b="6696">note</wd>

<space/>

</run>

</ln>

<ln l="6144" t="6806" r="8414" b="7008" baseLine="6960" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6806" r="6413" b="6965">the</wd>

<space/>

<wd l="6466" t="6806" r="7306" b="7008">following</wd>

<space/>

<wd l="7363" t="6806" r="8414" b="7008">phenomena:</wd>

</ln>

</para>

<para l="6384" t="7267" r="10502" b="7742" alignment="justified" li="432" ri="144" spaceBefore="188" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="7267" r="10502" b="7469" baseLine="7421" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="7320" r="6590" b="7421">•</wd>

<tab position="6441"/>

<wd l="6590" t="7267" r="7267" b="7469">spelling</wd>

<space/>

<wd l="7397" t="7267" r="8198" b="7426">mistakes:</wd>

<space/>

<wd l="8419" t="7320" r="8846" b="7426">wasz</wd>

<space/>

<wd l="8986" t="7272" r="9499" b="7464">(was),</wd>

<space/>

<wd l="9653" t="7320" r="10032" b="7426">cusz</wd>

<space/>

<wd l="10171" t="7267" r="10502" b="7464">(be-</wd>

</ln>

<ln l="6586" t="7541" r="8093" b="7742" baseLine="7690" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="7546" r="7181" b="7738">cause),</wd>

<space/>

<wd l="7229" t="7541" r="7579" b="7742">juss</wd>

<space/>

<wd l="7651" t="7541" r="8093" b="7742">(just)</wd>

</ln>

</para>

<para l="6384" t="8002" r="10498" b="8472" alignment="justified" li="432" ri="144" spaceBefore="192" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="8002" r="10498" b="8203" baseLine="8150" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="8054" r="6586" b="8150">•</wd>

<tab position="6438"/>

<wd l="6586" t="8002" r="7445" b="8160">confusion</wd>

<space/>

<wd l="7536" t="8002" r="7728" b="8160">of</wd>

<space/>

<wd l="7800" t="8002" r="8851" b="8203">upper/lower</wd>

<space/>

<wd l="8942" t="8054" r="9442" b="8160">cases:</wd>

<space/>

<wd l="9590" t="8006" r="9931" b="8160">Fun</wd>

<space/>

<wd l="10032" t="8002" r="10498" b="8198">(fun),</wd>

<space/>

</ln>

<ln l="6586" t="8280" r="8933" b="8472" baseLine="8424" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="8328" r="6998" b="8434">anna</wd>

<space/>

<wd l="7056" t="8280" r="7709" b="8472">(Anna),</wd>

<space/>

<wd l="7781" t="8280" r="8285" b="8434">Came</wd>

<space/>

<wd l="8347" t="8280" r="8933" b="8472">(came)</wd>

</ln>

</para>

<para l="6384" t="8736" r="7786" b="8899" alignment="justified" li="432" spaceBefore="198" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="8736" r="7786" b="8899" baseLine="8885">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="8789" r="6586" b="8885">•</wd>

<tab position="6438"/>

<wd l="6586" t="8736" r="7435" b="8894">emoticon:</wd>

<space/>

</run>

<wd l="7536" t="8741" r="7786" b="8899"><run underlined="none" subsuperscript="none" fontSize="1350" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&lt;</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">3</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6384" t="9197" r="8328" b="9398" alignment="justified" li="432" spaceBefore="182" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="9197" r="8328" b="9398" baseLine="9346" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="9197" r="6581" b="9346">•</wd>

<tab position="6467"/>

<wd l="6581" t="9197" r="7618" b="9398">interjection:</wd>

<space/>

<wd l="7704" t="9197" r="8328" b="9355">hahaha</wd>

</ln>

</para>

<para l="6144" t="9658" r="10517" b="10944" alignment="justified" ri="144" spaceBefore="190" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="9658" r="10502" b="9859" baseLine="9811" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="9662" r="6648" b="9816">We</wd>

<space/>

<wd l="6715" t="9658" r="7334" b="9816">remark</wd>

<space/>

<wd l="7402" t="9658" r="7776" b="9816">here</wd>

<space/>

<wd l="7848" t="9658" r="8174" b="9816">that</wd>

<space/>

<wd l="8242" t="9658" r="8510" b="9816">the</wd>

<space/>

<wd l="8582" t="9658" r="8962" b="9859">only</wd>

<space/>

<wd l="9034" t="9710" r="9504" b="9816">name</wd>

<space/>

<wd l="9576" t="9658" r="9859" b="9816">has</wd>

<space/>

<wd l="9936" t="9710" r="10147" b="9816">no</wd>

<space/>

<wd l="10219" t="9710" r="10502" b="9859">up-</wd>

</ln>

<ln l="6144" t="9931" r="10517" b="10133" baseLine="10080" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="9984" r="6427" b="10133">per</wd>

<space/>

<wd l="6514" t="9984" r="6883" b="10090">case</wd>

<space/>

<wd l="6965" t="9931" r="7493" b="10090">letters</wd>

<space/>

<wd l="7584" t="9931" r="8290" b="10090">whereas</wd>

<space/>

<wd l="8386" t="9931" r="8832" b="10090">other</wd>

<space/>

<wd l="8914" t="9931" r="9437" b="10090">words</wd>

<space/>

<wd l="9528" t="9931" r="9931" b="10090">have</wd>

<space/>

<wd l="10013" t="9984" r="10517" b="10133">upper</wd>

<space/>

</ln>

<ln l="6149" t="10200" r="10502" b="10397" baseLine="10354" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="10253" r="6600" b="10358">cases</wd>

<space/>

<wd l="6677" t="10200" r="7061" b="10397">(like</wd>

<space/>

<wd l="7128" t="10205" r="7699" b="10387">”Fun”,</wd>

<space/>

<wd l="7776" t="10205" r="8592" b="10397">”Came”).</wd>

<space/>

<wd l="8688" t="10205" r="8957" b="10387">So,</wd>

<space/>

<wd l="9029" t="10200" r="9154" b="10358">it</wd>

<space/>

<wd l="9211" t="10200" r="9758" b="10358">would</wd>

<space/>

<wd l="9816" t="10200" r="10018" b="10358">be</wd>

<space/>

<wd l="10085" t="10200" r="10502" b="10358">diffi-</wd>

</ln>

<ln l="6149" t="10474" r="10512" b="10675" baseLine="10622" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="10474" r="6475" b="10632">cult</wd>

<space/>

<wd l="6518" t="10474" r="6778" b="10632">for</wd>

<space/>

<wd l="6826" t="10526" r="6922" b="10632">a</wd>

<space/>

<wd l="6965" t="10474" r="7546" b="10632">named</wd>

<space/>

<wd l="7594" t="10474" r="8083" b="10675">entity</wd>

<space/>

<wd l="8141" t="10498" r="8909" b="10632">extractor</wd>

<space/>

<wd l="8952" t="10498" r="9120" b="10632">to</wd>

<space/>

<wd l="9173" t="10474" r="9941" b="10675">correctly</wd>

<space/>

<wd l="9994" t="10474" r="10512" b="10632">detect</wd>

<space/>

</ln>

<ln l="6144" t="10742" r="7666" b="10944" baseLine="10891" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10742" r="6451" b="10901">this</wd>

<space/>

<wd l="6514" t="10795" r="7099" b="10944">person</wd>

<space/>

<wd l="7152" t="10795" r="7666" b="10901">name.</wd>

</ln>

</para>

<para l="6144" t="11213" r="10066" b="11813" alignment="left" ri="576" spaceBefore="70" lsp="exactly" lspExact="422" language="en">

<ln l="6144" t="11213" r="10066" b="11434" baseLine="11381" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11213" r="6259" b="11386">3</wd>

<space/>

<wd l="6514" t="11213" r="6994" b="11386">CRF</wd>

<space/>

<wd l="7061" t="11213" r="8688" b="11434">Implementation</wd>

<space/>

<wd l="8755" t="11218" r="9130" b="11386">and</wd>

<space/>

<wd l="9192" t="11218" r="10066" b="11386">Features</wd>

<space/>

</ln>

<ln l="6144" t="11654" r="7939" b="11813" baseLine="11803" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11654" r="6408" b="11813">3.1</wd>

<space/>

<wd l="6648" t="11654" r="7080" b="11813">CRF</wd>

<space/>

<wd l="7138" t="11659" r="7939" b="11813">Features</wd>

</ln>

</para>

<para l="6144" t="11971" r="10517" b="14914" alignment="justified" ri="144" spaceBefore="84" spaceAfter="105" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="11971" r="10488" b="12211" baseLine="12154">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6144" t="12014" r="6432" b="12168">We</wd>

<space/>

<wd l="6509" t="12010" r="6912" b="12168">used</wd>

<space/>

<wd l="6984" t="12010" r="7253" b="12168">the</wd>

<space/>

<wd l="7334" t="12014" r="7742" b="12168">CRF</wd>

<space/>

<wd l="7819" t="12010" r="9192" b="12211">implementation</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="9283" t="12019" r="9826" b="12211">Wapiti</wd>

<space/>

<wd l="9917" t="12014" r="10344" b="12168">1.5.0</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="10435" t="11971" r="10488" b="12082">1</wd>

<space/>

</run>

</ln>

<ln l="6144" t="12278" r="10502" b="12480" baseLine="12432" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="12302" r="6312" b="12437">to</wd>

<space/>

<wd l="6408" t="12302" r="6922" b="12437">create</wd>

<space/>

<wd l="7018" t="12331" r="7306" b="12437">our</wd>

<space/>

<wd l="7397" t="12283" r="7805" b="12437">CRF</wd>

<space/>

<wd l="7891" t="12278" r="8482" b="12437">model.</wd>

<space/>

<wd l="8664" t="12278" r="9000" b="12437">The</wd>

<space/>

<wd l="9096" t="12278" r="10195" b="12480">optimization</wd>

<space/>

<wd l="10286" t="12278" r="10502" b="12437">al-</wd>

</ln>

<ln l="6149" t="12552" r="10517" b="12754" baseLine="12701" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="12552" r="6840" b="12754">gorithm</wd>

<space/>

<wd l="6922" t="12605" r="7171" b="12710">we</wd>

<space/>

<wd l="7262" t="12552" r="7752" b="12710">chose</wd>

<space/>

<wd l="7838" t="12605" r="8165" b="12710">was</wd>

<space/>

<wd l="8256" t="12595" r="8894" b="12754">rprop+.</wd>

<space/>

<wd l="9062" t="12552" r="9398" b="12710">The</wd>

<space/>

<wd l="9485" t="12552" r="10166" b="12710">features</wd>

<space/>

<wd l="10258" t="12552" r="10517" b="12710">for</wd>

<space/>

</ln>

<ln l="6144" t="12821" r="10502" b="13022" baseLine="12974" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="12821" r="6413" b="12979">the</wd>

<space/>

<wd l="6490" t="12821" r="7051" b="12979">tokens</wd>

<space/>

<wd l="7138" t="12874" r="7402" b="12979">are</wd>

<space/>

<wd l="7483" t="12821" r="7694" b="12979">all</wd>

<space/>

<wd l="7771" t="12821" r="7944" b="12974">in</wd>

<space/>

<wd l="8021" t="12821" r="8822" b="13022">unigrams</wd>

<space/>

<wd l="8914" t="12821" r="9226" b="12979">and</wd>

<space/>

<wd l="9302" t="12821" r="9859" b="12979">within</wd>

<space/>

<wd l="9941" t="12874" r="10037" b="12979">a</wd>

<space/>

<wd l="10109" t="12821" r="10502" b="12979">win-</wd>

</ln>

<ln l="6149" t="13094" r="10512" b="13296" baseLine="13243" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="13094" r="6514" b="13253">dow</wd>

<space/>

<wd l="6595" t="13094" r="6787" b="13253">of</wd>

<space/>

<wd l="6854" t="13094" r="7186" b="13253">size</wd>

<space/>

<wd l="7262" t="13099" r="7354" b="13253">3</wd>

<space/>

<wd l="7450" t="13094" r="8251" b="13296">(previous</wd>

<space/>

<wd l="8333" t="13094" r="8861" b="13282">token,</wd>

<space/>

<wd l="8952" t="13118" r="9566" b="13253">current</wd>

<space/>

<wd l="9638" t="13094" r="10123" b="13253">token</wd>

<space/>

<wd l="10200" t="13094" r="10512" b="13253">and</wd>

<space/>

</ln>

<ln l="6144" t="13363" r="10498" b="13565" baseLine="13517" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="13387" r="6518" b="13522">next</wd>

<space/>

<wd l="6576" t="13363" r="7171" b="13560">token).</wd>

<space/>

<wd l="7258" t="13363" r="7598" b="13522">The</wd>

<space/>

<wd l="7651" t="13363" r="8347" b="13565">bigrams</wd>

<space/>

<wd l="8419" t="13416" r="8678" b="13522">are</wd>

<space/>

<wd l="8741" t="13363" r="9120" b="13565">only</wd>

<space/>

<wd l="9182" t="13363" r="9653" b="13522">made</wd>

<space/>

<wd l="9715" t="13363" r="9902" b="13522">of</wd>

<space/>

<wd l="9946" t="13363" r="10498" b="13550">labels,</wd>

<space/>

</ln>

<ln l="6149" t="13637" r="10502" b="13838" baseLine="13786" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="13637" r="7378" b="13838">characterizing</wd>

<space/>

<wd l="7483" t="13637" r="7906" b="13795">label</wd>

<space/>

<wd l="8006" t="13637" r="8962" b="13795">transitions.</wd>

<space/>

<wd l="9178" t="13637" r="9658" b="13795">Table</wd>

<space/>

<wd l="9782" t="13642" r="9845" b="13790">1</wd>

<space/>

<wd l="9979" t="13637" r="10502" b="13795">shows</wd>

<space/>

</ln>

<ln l="6144" t="13906" r="10502" b="14107" baseLine="14054" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="13906" r="6413" b="14064">the</wd>

<space/>

<wd l="6514" t="13906" r="7195" b="14064">features</wd>

<space/>

<wd l="7301" t="13958" r="7555" b="14064">we</wd>

<space/>

<wd l="7656" t="13906" r="8837" b="14107">implemented.</wd>

<space/>

<wd l="9053" t="13906" r="9576" b="14064">These</wd>

<space/>

<wd l="9677" t="13906" r="10502" b="14107">templates</wd>

<space/>

</ln>

<ln l="6144" t="14179" r="10498" b="14381" baseLine="14328" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="14179" r="6547" b="14338">have</wd>

<space/>

<wd l="6619" t="14179" r="7032" b="14338">been</wd>

<space/>

<wd l="7109" t="14179" r="7709" b="14338">chosen</wd>

<space/>

<wd l="7781" t="14179" r="8616" b="14381">following</wd>

<space/>

<wd l="8702" t="14179" r="9370" b="14376">(Suzuki</wd>

<space/>

<wd l="9446" t="14179" r="9758" b="14338">and</wd>

<space/>

<wd l="9826" t="14179" r="10498" b="14366">Isozaki,</wd>

<space/>

</ln>

<ln l="6149" t="14448" r="10512" b="14650" baseLine="14597" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="14453" r="6696" b="14645">2008),</wd>

<space/>

<wd l="6782" t="14453" r="7656" b="14650">(Lavergne</wd>

<space/>

<wd l="7723" t="14472" r="7882" b="14606">et</wd>

<space/>

<wd l="7944" t="14448" r="8194" b="14635">al.,</wd>

<space/>

<wd l="8275" t="14453" r="8822" b="14645">2010),</wd>

<space/>

<wd l="8909" t="14448" r="10291" b="14645">(Nooralahzadeh</wd>

<space/>

<wd l="10358" t="14472" r="10512" b="14606">et</wd>

<space/>

</ln>

<ln l="6149" t="14717" r="9336" b="14914" baseLine="14870" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="14717" r="6403" b="14904">al.,</wd>

<space/>

<wd l="6470" t="14722" r="6965" b="14914">2014)</wd>

<space/>

<wd l="7037" t="14717" r="7349" b="14875">and</wd>

<space/>

<wd l="7411" t="14722" r="8251" b="14914">(Constant</wd>

<space/>

<wd l="8309" t="14741" r="8462" b="14875">et</wd>

<space/>

<wd l="8520" t="14717" r="8770" b="14904">al.,</wd>

<space/>

<wd l="8842" t="14722" r="9336" b="14914">2011)</wd>

</ln>

</para>

<rulerline l="6142" t="15048" r="7344" b="15048" type="single" width="10" color="000000"/>

<para l="6408" t="15101" r="7982" b="15302" alignment="left" li="216" spaceBefore="57" spaceAfter="31" lsp="exactly" lspExact="206" language="en">

<ln l="6408" t="15101" r="7982" b="15302" baseLine="15255">

<wd l="6408" t="15101" r="7982" b="15302"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">https://wapiti.limsi.fr</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<section l="2918" t="15336" r="9038" b="16480">

<column l="2918" t="15336" r="9038" b="16480">

<para l="5804" t="15787" r="6143" b="15946" alignment="centered" spaceBefore="387" lsp="exactly" lspExact="271" language="en">

<ln l="5870" t="15787" r="6077" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="39">

<wd l="5870" t="15787" r="6077" b="15946">68</wd>

</ln>

</para>

<para l="2918" t="16133" r="8981" b="16469" alignment="justified" ri="72" spaceBefore="138" lsp="exactly" lspExact="170" language="en">

<ln l="2918" t="16133" r="8981" b="16301" baseLine="16253">

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="2918" t="16133" r="3802" b="16296">Proceedings</wd>

<space/>

<wd l="3854" t="16133" r="4018" b="16296">of</wd>

<space/>

<wd l="4037" t="16133" r="4248" b="16262">the</wd>

<space/>

<wd l="4286" t="16138" r="4622" b="16262">ACL</wd>

<space/>

<wd l="4666" t="16133" r="5026" b="16262">2015</wd>

<space/>

<wd l="5078" t="16133" r="5779" b="16296">Workshop</wd>

<space/>

<wd l="5832" t="16176" r="6000" b="16262">on</wd>

<space/>

<wd l="6043" t="16138" r="6456" b="16296">Noisy</wd>

<space/>

<wd l="6518" t="16133" r="7627" b="16296">User-generated</wd>

<space/>

</run>

<wd l="7675" t="16138" r="7992" b="16286"><run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">Text</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="8045" t="16171" r="8443" b="16301">pages</wd>

<space/>

<wd l="8501" t="16133" r="8981" b="16286">68–71,</wd>

<space/>

</run>

</ln>

<ln l="3029" t="16296" r="8870" b="16469" baseLine="16425">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="3029" t="16301" r="3595" b="16469">Beijing,</wd>

<space/>

<wd l="3653" t="16301" r="4114" b="16454">China,</wd>

<space/>

<wd l="4166" t="16301" r="4459" b="16469">July</wd>

<space/>

<wd l="4512" t="16301" r="4723" b="16454">31,</wd>

<space/>

<wd l="4781" t="16301" r="5170" b="16430">2015.</wd>

<space/>

</run>

<wd l="5246" t="16296" r="5770" b="16469"><run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">c</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-3">�</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">2015</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="5822" t="16301" r="6672" b="16430">Association</wd>

<space/>

<wd l="6715" t="16301" r="6926" b="16430">for</wd>

<space/>

<wd l="6974" t="16301" r="8035" b="16469">Computational</wd>

<space/>

<wd l="8078" t="16301" r="8870" b="16469">Linguistics</wd>

</run>

</ln>

</para>

</column>

</section>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4309.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1323" marginTop="1248" marginRight="1265" marginBottom="1302" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1323" t="1248" r="10644" b="15325">

<column l="1323" t="1248" r="5863" b="15325">

<table l="1714" t="1258" r="5534" b="10814" alignment="left" li="391" ri="329" spaceBefore="10" spaceAfter="151">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<gridTable>

<gridCol>3820</gridCol>

<gridRow>283</gridRow>

<gridRow>2717</gridRow>

<gridRow>2990</gridRow>

<gridRow>548</gridRow>

<gridRow>2174</gridRow>

<gridRow>283</gridRow>

<gridRow>279</gridRow>

<gridRow>282</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="3120" t="1301" r="4123" b="1459" alignment="centered" spaceAfter="33" lsp="exactly" lspExact="249" language="en">

<ln l="3120" t="1301" r="4123" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3120" t="1301" r="3605" b="1459">token</wd>

<space/>

<wd l="3658" t="1301" r="4123" b="1459">value</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1843" t="1579" r="5400" b="4219" alignment="centered" spaceAfter="20" lsp="exactly" lspExact="268" language="en">

<ln l="3240" t="1579" r="4008" b="1781" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3240" t="1579" r="4008" b="1781">fstUpper
</wd>

</ln>

<ln l="3240" t="1853" r="4013" b="2054" baseLine="2002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3240" t="1853" r="4013" b="2054">shortCap
</wd>

</ln>

<ln l="3254" t="2122" r="3989" b="2323" baseLine="2270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3254" t="2122" r="3989" b="2323">longCap
</wd>

</ln>

<ln l="3278" t="2390" r="3965" b="2592" baseLine="2544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3278" t="2390" r="3965" b="2592">mixCap
</wd>

</ln>

<ln l="3206" t="2664" r="4046" b="2866" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3206" t="2664" r="4046" b="2866">hasUpper
</wd>

</ln>

<ln l="3245" t="2933" r="4008" b="3134" baseLine="3086" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3245" t="2933" r="4008" b="3134">allUpper
</wd>

</ln>

<ln l="1843" t="3206" r="5400" b="3408" baseLine="3355" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1843" t="3211" r="2616" b="3408">capType:</wd>

<space/>

<wd l="2702" t="3206" r="3792" b="3365">combination</wd>

<space/>

<wd l="3850" t="3206" r="4042" b="3365">of</wd>

<space/>

<wd l="4085" t="3206" r="4186" b="3365">6</wd>

<space/>

<wd l="4243" t="3206" r="4800" b="3408">binary</wd>

<space/>

<wd l="4858" t="3206" r="5400" b="3365">values
</wd>

</ln>

<ln l="3259" t="3475" r="3998" b="3634" baseLine="3629" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3259" t="3475" r="3998" b="3634">allLetter
</wd>

</ln>

<ln l="3110" t="3749" r="4147" b="3950" baseLine="3898" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3110" t="3749" r="4147" b="3950">singleLetter
</wd>

</ln>

<ln l="2146" t="4018" r="5098" b="4219" baseLine="4171" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="2146" t="4018" r="3101" b="4219">tokenType:</wd>

<space/>

<wd l="3187" t="4018" r="4258" b="4219">punctuation,</wd>

<space/>

<wd l="4330" t="4022" r="4478" b="4205">9,</wd>

<space/>

<wd l="4546" t="4070" r="4651" b="4171">x</wd>

<space/>

<wd l="4714" t="4070" r="4891" b="4176">or</wd>

<space/>

<wd l="4944" t="4022" r="5098" b="4171">X</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2707" t="4296" r="4531" b="7166" alignment="centered" spaceAfter="29" lsp="exactly" lspExact="268" language="en">

<ln l="3120" t="4296" r="4128" b="4454" baseLine="4450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3120" t="4296" r="4128" b="4454">hasNumber
</wd>

</ln>

<ln l="3163" t="4570" r="4094" b="4728" baseLine="4718" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3163" t="4570" r="4094" b="4728">allNumber
</wd>

</ln>

<ln l="3182" t="4838" r="4061" b="4997" baseLine="4992" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3182" t="4838" r="4061" b="4997">isDecimal
</wd>

</ln>

<ln l="3221" t="5117" r="4032" b="5270" baseLine="5261" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3221" t="5117" r="4032" b="5270">onePunct
</wd>

</ln>

<ln l="3269" t="5381" r="3984" b="5539" baseLine="5534" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3269" t="5381" r="3984" b="5539">allPunct
</wd>

</ln>

<ln l="3230" t="5654" r="4018" b="5813" baseLine="5803" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3230" t="5654" r="4018" b="5813">hasPunct
</wd>

</ln>

<ln l="3182" t="5923" r="4066" b="6125" baseLine="6072" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3182" t="5923" r="4066" b="6125">longPunct
</wd>

</ln>

<ln l="3043" t="6197" r="4205" b="6394" baseLine="6346" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3043" t="6197" r="4205" b="6394">hasQuotation
</wd>

</ln>

<ln l="2707" t="6466" r="4531" b="6667" baseLine="6614" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="2707" t="6466" r="4531" b="6667">hasAtLeast2periodes
</wd>

</ln>

<ln l="2822" t="6734" r="4426" b="6936" baseLine="6888" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="2822" t="6734" r="4426" b="6936">finishedByPeriode
</wd>

</ln>

<ln l="3254" t="7008" r="3994" b="7166" baseLine="7157" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3254" t="7008" r="3994" b="7166">hasDash</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="3379" t="7286" r="3874" b="7445" alignment="centered" lsp="exactly" lspExact="244" language="en">

<ln l="3379" t="7286" r="3874" b="7445" baseLine="7435" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3379" t="7286" r="3874" b="7445">lower</wd>

</ln>

</para>

<para l="2707" t="7555" r="4541" b="7714" alignment="centered" spaceBefore="3" spaceAfter="24" lsp="exactly" lspExact="271" language="en">

<ln l="2707" t="7555" r="4541" b="7714" baseLine="7709" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2707" t="7555" r="4541" b="7714">returnUnicodeVector</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="3163" t="7838" r="4075" b="9893" alignment="centered" spaceAfter="24" lsp="exactly" lspExact="268" language="en">

<ln l="3322" t="7838" r="3922" b="7997" baseLine="7987" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3322" t="7838" r="3922" b="7997">isEmal
</wd>

</ln>

<ln l="3331" t="8107" r="3917" b="8266" baseLine="8256" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3331" t="8107" r="3917" b="8266">isURL
</wd>

</ln>

<ln l="3418" t="8376" r="3826" b="8534" baseLine="8530" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3418" t="8376" r="3826" b="8534">isRT
</wd>

</ln>

<ln l="3336" t="8650" r="3907" b="8808" baseLine="8798" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3336" t="8650" r="3907" b="8808">isUSR
</wd>

</ln>

<ln l="3163" t="8918" r="4075" b="9120" baseLine="9072" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3163" t="8918" r="4075" b="9120">isHashTag
</wd>

</ln>

<ln l="3346" t="9192" r="3902" b="9350" baseLine="9341" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3346" t="9192" r="3902" b="9350">isDate
</wd>

</ln>

<ln l="3322" t="9461" r="3922" b="9619" baseLine="9614" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3322" t="9461" r="3922" b="9619">isTime
</wd>

</ln>

<ln l="3226" t="9734" r="4018" b="9893" baseLine="9883" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="3226" t="9734" r="4018" b="9893">isAbbrev</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2352" t="10013" r="4882" b="10214" alignment="centered" spaceAfter="33" lsp="exactly" lspExact="249" language="en">

<ln l="2352" t="10013" r="4882" b="10214" baseLine="10162" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2352" t="10013" r="2952" b="10214">prefixe</wd>

<space/>

<wd l="3034" t="10066" r="3187" b="10200">n,</wd>

<space/>

<wd l="3259" t="10013" r="3835" b="10171">suffixe</wd>

<space/>

<wd l="3917" t="10066" r="4027" b="10166">n</wd>

<space/>

<wd l="4090" t="10018" r="4262" b="10210">(n</wd>

<space/>

<wd l="4320" t="10080" r="4435" b="10142">=</wd>

<space/>

<wd l="4517" t="10013" r="4882" b="10210">1..5)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="6" gridRowTill="6" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2136" t="10291" r="5098" b="10493" alignment="centered" spaceAfter="29" lsp="exactly" lspExact="244" language="en">

<ln l="2136" t="10291" r="5098" b="10493" baseLine="10440" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2136" t="10315" r="2702" b="10493">postag</wd>

<space/>

<wd l="2760" t="10291" r="2933" b="10445">in</wd>

<space/>

<wd l="2986" t="10296" r="3427" b="10450">PTB:</wd>

<space/>

<wd l="3499" t="10291" r="3893" b="10450">with</wd>

<space/>

<wd l="3946" t="10291" r="4498" b="10493">binary</wd>

<space/>

<wd l="4555" t="10291" r="5098" b="10450">values</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="7" gridRowTill="7" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1858" t="10570" r="5395" b="10771" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="243" language="en">

<ln l="1858" t="10570" r="5395" b="10771" baseLine="10718" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1858" t="10594" r="2597" b="10771">category</wd>

<space/>

<wd l="2654" t="10570" r="2822" b="10723">in</wd>

<space/>

<wd l="2880" t="10574" r="3466" b="10728">Brown</wd>

<space/>

<wd l="3528" t="10570" r="4147" b="10728">cluster:</wd>

<space/>

<wd l="4229" t="10570" r="4402" b="10723">in</wd>

<space/>

<wd l="4454" t="10570" r="5011" b="10771">binary</wd>

<space/>

<wd l="5069" t="10594" r="5395" b="10728">tree</wd>

</ln>

</para>

</cell>

</table>

<para l="2659" t="11026" r="4579" b="11184" alignment="centered" lsp="exactly" lspExact="271" language="en">

<ln l="2659" t="11026" r="4579" b="11184" baseLine="11179" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2659" t="11026" r="3139" b="11184">Table</wd>

<space/>

<wd l="3216" t="11030" r="3346" b="11184">1:</wd>

<space/>

<wd l="3437" t="11030" r="3840" b="11184">CRF</wd>

<space/>

<wd l="3898" t="11026" r="4579" b="11184">features</wd>

</ln>

</para>

<para l="1440" t="11856" r="5818" b="15302" alignment="justified" li="72" ri="72" spaceBefore="566" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="1656" t="11856" r="5789" b="12058" baseLine="12005" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="11856" r="1997" b="12014">The</wd>

<space/>

<wd l="2050" t="11861" r="2779" b="12058">capType</wd>

<space/>

<wd l="2827" t="11856" r="3509" b="12014">features</wd>

<space/>

<wd l="3566" t="11909" r="4238" b="12058">regroup</wd>

<space/>

<wd l="4296" t="11856" r="4397" b="12014">6</wd>

<space/>

<wd l="4450" t="11856" r="5002" b="12058">binary</wd>

<space/>

<wd l="5054" t="11856" r="5789" b="12014">features:</wd>

<space/>

</ln>

<ln l="1445" t="12125" r="5794" b="12326" baseLine="12278" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="12125" r="2237" b="12326">allUpper,</wd>

<space/>

<wd l="2328" t="12125" r="3149" b="12326">shortCap,</wd>

<space/>

<wd l="3235" t="12125" r="4018" b="12326">longCap,</wd>

<space/>

<wd l="4104" t="12125" r="4915" b="12312">allLower,</wd>

<space/>

<wd l="4997" t="12125" r="5794" b="12326">fstUpper,</wd>

<space/>

</ln>

<ln l="1440" t="12398" r="5794" b="12600" baseLine="12547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12398" r="2174" b="12600">mixCap.</wd>

<space/>

<wd l="2309" t="12398" r="2650" b="12557">The</wd>

<space/>

<wd l="2722" t="12398" r="3634" b="12600">tokenType</wd>

<space/>

<wd l="3710" t="12398" r="4315" b="12557">feature</wd>

<space/>

<wd l="4387" t="12398" r="5314" b="12557">transforms</wd>

<space/>

<wd l="5400" t="12451" r="5496" b="12557">a</wd>

<space/>

<wd l="5563" t="12422" r="5794" b="12557">to-</wd>

</ln>

<ln l="1440" t="12667" r="5794" b="12854" baseLine="12816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12667" r="1752" b="12826">ken</wd>

<space/>

<wd l="1834" t="12667" r="2170" b="12826">into</wd>

<space/>

<wd l="2261" t="12720" r="2357" b="12826">a</wd>

<space/>

<wd l="2438" t="12667" r="3394" b="12826">”skeleton”:</wd>

<space/>

<wd l="3533" t="12667" r="3701" b="12821">in</wd>

<space/>

<wd l="3782" t="12667" r="4090" b="12826">this</wd>

<space/>

<wd l="4190" t="12667" r="4949" b="12854">skeleton,</wd>

<space/>

<wd l="5050" t="12667" r="5261" b="12826">all</wd>

<space/>

<wd l="5347" t="12720" r="5794" b="12826">num-</wd>

</ln>

<ln l="1440" t="12941" r="5803" b="13142" baseLine="13090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12941" r="1795" b="13099">bers</wd>

<space/>

<wd l="1867" t="12994" r="2131" b="13099">are</wd>

<space/>

<wd l="2194" t="12941" r="2933" b="13142">replaced</wd>

<space/>

<wd l="2990" t="12941" r="3206" b="13142">by</wd>

<space/>

<wd l="3274" t="12946" r="3422" b="13128">9,</wd>

<space/>

<wd l="3499" t="12941" r="3710" b="13099">all</wd>

<space/>

<wd l="3773" t="12941" r="4301" b="13099">letters</wd>

<space/>

<wd l="4368" t="12941" r="4541" b="13094">in</wd>

<space/>

<wd l="4598" t="12941" r="5093" b="13099">lower</wd>

<space/>

<wd l="5155" t="12994" r="5525" b="13099">case</wd>

<space/>

<wd l="5587" t="12941" r="5803" b="13142">by</wd>

<space/>

</ln>

<ln l="1440" t="13210" r="5794" b="13411" baseLine="13358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="13262" r="1594" b="13397">x,</wd>

<space/>

<wd l="1680" t="13210" r="1891" b="13368">all</wd>

<space/>

<wd l="1963" t="13210" r="2486" b="13368">letters</wd>

<space/>

<wd l="2563" t="13210" r="2736" b="13363">in</wd>

<space/>

<wd l="2803" t="13262" r="3302" b="13411">upper</wd>

<space/>

<wd l="3370" t="13262" r="3744" b="13368">case</wd>

<space/>

<wd l="3811" t="13210" r="4027" b="13411">by</wd>

<space/>

<wd l="4099" t="13214" r="4253" b="13363">X</wd>

<space/>

<wd l="4330" t="13210" r="4642" b="13368">and</wd>

<space/>

<wd l="4709" t="13210" r="4973" b="13368">the</wd>

<space/>

<wd l="5040" t="13234" r="5794" b="13411">punctua-</wd>

</ln>

<ln l="1440" t="13478" r="5798" b="13680" baseLine="13632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="13478" r="1858" b="13637">tions</wd>

<space/>

<wd l="1934" t="13478" r="2539" b="13637">remain</wd>

<space/>

<wd l="2606" t="13478" r="3595" b="13680">unchanged.</wd>

<space/>

<wd l="3715" t="13478" r="4056" b="13637">The</wd>

<space/>

<wd l="4123" t="13478" r="5386" b="13680">part-of-speech</wd>

<space/>

<wd l="5453" t="13502" r="5798" b="13680">tags</wd>

<space/>

</ln>

<ln l="1450" t="13752" r="5808" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="13757" r="2232" b="13954">(postags)</wd>

<space/>

<wd l="2294" t="13752" r="2486" b="13910">of</wd>

<space/>

<wd l="2520" t="13752" r="2789" b="13910">the</wd>

<space/>

<wd l="2837" t="13757" r="3274" b="13910">Penn</wd>

<space/>

<wd l="3322" t="13757" r="3715" b="13910">Tree</wd>

<space/>

<wd l="3768" t="13752" r="4229" b="13910">Bank</wd>

<space/>

<wd l="4286" t="13757" r="4810" b="13949">(PTB)</wd>

<space/>

<wd l="4882" t="13757" r="5592" b="13949">(Marcus</wd>

<space/>

<wd l="5654" t="13776" r="5808" b="13910">et</wd>

<space/>

</ln>

<ln l="1445" t="14021" r="5803" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="14021" r="1694" b="14208">al.,</wd>

<space/>

<wd l="1805" t="14026" r="2280" b="14218">1993)</wd>

<space/>

<wd l="2366" t="14045" r="3101" b="14222">generate</wd>

<space/>

<wd l="3168" t="14021" r="3374" b="14179">45</wd>

<space/>

<wd l="3466" t="14021" r="4104" b="14179">distinct</wd>

<space/>

<wd l="4171" t="14021" r="4906" b="14179">features.</wd>

<space/>

<wd l="5030" t="14021" r="5472" b="14179">Each</wd>

<space/>

<wd l="5539" t="14045" r="5803" b="14222">tag</wd>

<space/>

</ln>

<ln l="1440" t="14294" r="5794" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="14294" r="1613" b="14448">in</wd>

<space/>

<wd l="1666" t="14294" r="1930" b="14453">the</wd>

<space/>

<wd l="1987" t="14299" r="2376" b="14448">PTB</wd>

<space/>

<wd l="2443" t="14294" r="3197" b="14453">becomes</wd>

<space/>

<wd l="3269" t="14347" r="3365" b="14453">a</wd>

<space/>

<wd l="3413" t="14294" r="4018" b="14453">feature</wd>

<space/>

<wd l="4075" t="14294" r="4464" b="14453">with</wd>

<space/>

<wd l="4522" t="14347" r="4618" b="14453">a</wd>

<space/>

<wd l="4670" t="14294" r="5227" b="14496">binary</wd>

<space/>

<wd l="5285" t="14294" r="5794" b="14453">value.</wd>

<space/>

</ln>

<ln l="1440" t="14563" r="5818" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="14563" r="1781" b="14722">The</wd>

<space/>

<wd l="1838" t="14568" r="2674" b="14765">”category</wd>

<space/>

<wd l="2731" t="14563" r="2904" b="14717">in</wd>

<space/>

<wd l="2957" t="14568" r="3547" b="14722">Brown</wd>

<space/>

<wd l="3605" t="14563" r="4272" b="14722">cluster”</wd>

<space/>

<wd l="4334" t="14616" r="4699" b="14722">uses</wd>

<space/>

<wd l="4762" t="14563" r="5030" b="14722">the</wd>

<space/>

<wd l="5083" t="14563" r="5573" b="14722">result</wd>

<space/>

<wd l="5630" t="14563" r="5818" b="14722">of</wd>

<space/>

</ln>

<ln l="1440" t="14837" r="5808" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="14842" r="2030" b="14995">Brown</wd>

<space/>

<wd l="2126" t="14837" r="2976" b="15038">clustering</wd>

<space/>

<wd l="3082" t="14842" r="3734" b="15034">(Brown</wd>

<space/>

<wd l="3826" t="14861" r="3979" b="14995">et</wd>

<space/>

<wd l="4075" t="14837" r="4325" b="15024">al.,</wd>

<space/>

<wd l="4459" t="14842" r="4934" b="15034">1992)</wd>

<space/>

<wd l="5040" t="14837" r="5808" b="14995">executed</wd>

<space/>

</ln>

<ln l="1440" t="15106" r="5784" b="15302" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1440" t="15106" r="1829" b="15264">with</wd>

<space/>

<wd l="1949" t="15106" r="2914" b="15293">56,345,753</wd>

<space/>

<wd l="3043" t="15130" r="3595" b="15264">tweets</wd>

<space/>

<wd l="3725" t="15106" r="4498" b="15264">available</wd>

<space/>

<wd l="4618" t="15130" r="4771" b="15264">at</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-3"><wd l="4896" t="15110" r="5784" b="15302">http://</wd>

</run>

</ln>

</para>

</column>

<column l="6104" t="1248" r="10644" b="15325">

<table l="6360" t="1258" r="10296" b="2102" alignment="left" li="256" ri="348" spaceBefore="10" spaceAfter="151">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>1070</gridCol>

<gridCol>1037</gridCol>

<gridCol>912</gridCol>

<gridCol>917</gridCol>

<gridRow>283</gridRow>

<gridRow>279</gridRow>

<gridRow>282</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6360" t="1258" r="7430" b="1541" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7550" t="1301" r="8347" b="1502" alignment="centered" spaceAfter="33" lsp="exactly" lspExact="249" language="en">

<ln l="7550" t="1301" r="8347" b="1502" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="7550" t="1301" r="8347" b="1502">precision</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8683" t="1301" r="9163" b="1459" alignment="centered" spaceAfter="33" lsp="exactly" lspExact="249" language="en">

<ln l="8683" t="1301" r="9163" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="8683" t="1301" r="9163" b="1459">recall</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9648" t="1306" r="9998" b="1454" alignment="centered" spaceAfter="33" lsp="exactly" lspExact="249" language="en">

<ln l="9648" t="1306" r="9998" b="1454" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">

<wd l="9648" t="1306" r="9998" b="1454">FB1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6749" t="1579" r="7046" b="1738" alignment="centered" spaceAfter="29" lsp="exactly" lspExact="244" language="en">

<ln l="6749" t="1579" r="7046" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="6749" t="1579" r="7046" b="1738">dev</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7618" t="1579" r="8275" b="1738" alignment="centered" spaceAfter="29" lsp="exactly" lspExact="244" language="en">

<ln l="7618" t="1579" r="8275" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7618" t="1579" r="8275" b="1738">69.01%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8592" t="1579" r="9250" b="1738" alignment="centered" spaceAfter="29" lsp="exactly" lspExact="244" language="en">

<ln l="8592" t="1579" r="9250" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="8592" t="1579" r="9250" b="1738">33.15%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9499" t="1584" r="10162" b="1738" alignment="centered" spaceAfter="29" lsp="exactly" lspExact="244" language="en">

<ln l="9499" t="1584" r="10162" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="9499" t="1584" r="10162" b="1738">44.78%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6490" t="1858" r="7296" b="2016" alignment="centered" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="6490" t="1858" r="7296" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6490" t="1858" r="6792" b="2016">dev</wd>

<space/>

<wd l="6878" t="1858" r="7296" b="2016">2015</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7613" t="1858" r="8275" b="2016" alignment="centered" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="7613" t="1858" r="8275" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="7613" t="1858" r="8275" b="2016">43.26%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8592" t="1862" r="9250" b="2016" alignment="centered" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="8592" t="1862" r="9250" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="8592" t="1862" r="9250" b="2016">22.43%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9504" t="1858" r="10162" b="2016" alignment="centered" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="9504" t="1858" r="10162" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="9504" t="1858" r="10162" b="2016">29.54%</wd>

</ln>

</para>

</cell>

</table>

<para l="6144" t="2314" r="10512" b="2746" alignment="justified" ri="144" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="2314" r="10512" b="2515" baseLine="2467" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2314" r="6624" b="2472">Table</wd>

<space/>

<wd l="6682" t="2318" r="6830" b="2472">2:</wd>

<space/>

<wd l="6912" t="2314" r="7930" b="2515">Experiment</wd>

<space/>

<wd l="7982" t="2314" r="8544" b="2472">results</wd>

<space/>

<wd l="8602" t="2314" r="8990" b="2472">with</wd>

<space/>

<wd l="9038" t="2314" r="9581" b="2472">model</wd>

<space/>

<wd l="9638" t="2314" r="10243" b="2472">trained</wd>

<space/>

<wd l="10296" t="2366" r="10512" b="2472">on</wd>

<space/>

</ln>

<ln l="6144" t="2587" r="6878" b="2746" baseLine="2736" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2587" r="6547" b="2746">train</wd>

<space/>

<wd l="6605" t="2587" r="6878" b="2746">file</wd>

</ln>

</para>

<para l="6144" t="3360" r="10512" b="6269" alignment="justified" ri="144" spaceBefore="504" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="3360" r="10512" b="3533" baseLine="3509">

<wd l="6149" t="3365" r="9854" b="3533"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">www.ark.cs.cmu.edu/TweetNLP/</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="10171" t="3360" r="10512" b="3518">The</wd>

<space/>

</run>

</ln>

<ln l="6149" t="3629" r="10507" b="3830" baseLine="3782" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="3629" r="6562" b="3787">class</wd>

<space/>

<wd l="6643" t="3629" r="6835" b="3787">of</wd>

<space/>

<wd l="6898" t="3629" r="7291" b="3787">each</wd>

<space/>

<wd l="7363" t="3629" r="7848" b="3787">token</wd>

<space/>

<wd l="7915" t="3629" r="8054" b="3787">is</wd>

<space/>

<wd l="8131" t="3629" r="9139" b="3830">represented</wd>

<space/>

<wd l="9206" t="3629" r="9595" b="3787">with</wd>

<space/>

<wd l="9691" t="3634" r="9869" b="3787">13</wd>

<space/>

<wd l="9955" t="3629" r="10507" b="3830">binary</wd>

<space/>

</ln>

<ln l="6144" t="3902" r="10507" b="4104" baseLine="4051" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3902" r="6739" b="4061">values.</wd>

<space/>

<wd l="6859" t="3902" r="7378" b="4061">These</wd>

<space/>

<wd l="7450" t="3902" r="7992" b="4061">values</wd>

<space/>

<wd l="8069" t="3926" r="8870" b="4104">represent</wd>

<space/>

<wd l="8933" t="3902" r="9720" b="4061">therefore</wd>

<space/>

<wd l="9792" t="3955" r="9888" b="4061">a</wd>

<space/>

<wd l="9955" t="3902" r="10507" b="4104">binary</wd>

<space/>

</ln>

<ln l="6144" t="4171" r="10507" b="4373" baseLine="4325" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4195" r="6514" b="4330">tree.</wd>

<space/>

<wd l="6701" t="4171" r="7138" b="4330">Each</wd>

<space/>

<wd l="7224" t="4171" r="7690" b="4330">value</wd>

<space/>

<wd l="7781" t="4224" r="8333" b="4330">means</wd>

<space/>

<wd l="8434" t="4224" r="8741" b="4330">one</wd>

<space/>

<wd l="8832" t="4171" r="9245" b="4330">level</wd>

<space/>

<wd l="9336" t="4171" r="9509" b="4325">in</wd>

<space/>

<wd l="9595" t="4171" r="9864" b="4330">the</wd>

<space/>

<wd l="9955" t="4171" r="10507" b="4373">binary</wd>

<space/>

</ln>

<ln l="6144" t="4445" r="10498" b="4632" baseLine="4594" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4469" r="6514" b="4603">tree.</wd>

<space/>

<wd l="6691" t="4450" r="6917" b="4603">So</wd>

<space/>

<wd l="7003" t="4498" r="7258" b="4603">we</wd>

<space/>

<wd l="7344" t="4445" r="7733" b="4603">took</wd>

<space/>

<wd l="7819" t="4445" r="8083" b="4603">the</wd>

<space/>

<wd l="8174" t="4445" r="8510" b="4603">first</wd>

<space/>

<wd l="8597" t="4445" r="9062" b="4603">value</wd>

<space/>

<wd l="9149" t="4445" r="9408" b="4603">for</wd>

<space/>

<wd l="9494" t="4445" r="9888" b="4603">each</wd>

<space/>

<wd l="9974" t="4445" r="10498" b="4632">token,</wd>

<space/>

</ln>

<ln l="6144" t="4714" r="10512" b="4915" baseLine="4867" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4714" r="6403" b="4872">i.e.</wd>

<space/>

<wd l="6504" t="4714" r="6701" b="4872">its</wd>

<space/>

<wd l="6778" t="4738" r="7517" b="4915">category</wd>

<space/>

<wd l="7579" t="4714" r="7968" b="4872">with</wd>

<space/>

<wd l="8035" t="4714" r="8414" b="4915">only</wd>

<space/>

<wd l="8486" t="4766" r="8794" b="4872">one</wd>

<space/>

<wd l="8856" t="4714" r="9269" b="4872">level</wd>

<space/>

<wd l="9346" t="4718" r="9730" b="4910">(two</wd>

<space/>

<wd l="9797" t="4714" r="10512" b="4915">possible</wd>

<space/>

</ln>

<ln l="6144" t="4987" r="10512" b="5184" baseLine="5136" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4987" r="7109" b="5184">values).We</wd>

<space/>

<wd l="7181" t="4987" r="7560" b="5146">then</wd>

<space/>

<wd l="7627" t="4987" r="8016" b="5146">took</wd>

<space/>

<wd l="8088" t="4987" r="8352" b="5146">the</wd>

<space/>

<wd l="8434" t="4987" r="8770" b="5146">first</wd>

<space/>

<wd l="8837" t="5011" r="9158" b="5146">two</wd>

<space/>

<wd l="9235" t="4987" r="9778" b="5146">values</wd>

<space/>

<wd l="9864" t="4987" r="10051" b="5146">of</wd>

<space/>

<wd l="10118" t="4987" r="10512" b="5146">each</wd>

<space/>

</ln>

<ln l="6144" t="5256" r="10502" b="5458" baseLine="5405" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5256" r="6672" b="5443">token,</wd>

<space/>

<wd l="6749" t="5256" r="7507" b="5458">resulting</wd>

<space/>

<wd l="7574" t="5256" r="7747" b="5410">in</wd>

<space/>

<wd l="7810" t="5256" r="8074" b="5414">the</wd>

<space/>

<wd l="8146" t="5256" r="8995" b="5458">clustering</wd>

<space/>

<wd l="9067" t="5256" r="9259" b="5414">of</wd>

<space/>

<wd l="9312" t="5256" r="9883" b="5414">twitter</wd>

<space/>

<wd l="9946" t="5256" r="10502" b="5414">tokens</wd>

<space/>

</ln>

<ln l="6144" t="5530" r="10498" b="5717" baseLine="5678" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5530" r="6480" b="5688">into</wd>

<space/>

<wd l="6547" t="5530" r="6912" b="5688">four</wd>

<space/>

<wd l="6974" t="5530" r="7618" b="5717">classes,</wd>

<space/>

<wd l="7699" t="5554" r="7992" b="5688">etc.</wd>

<space/>

<wd l="8088" t="5534" r="8376" b="5688">We</wd>

<space/>

<wd l="8438" t="5530" r="8827" b="5688">took</wd>

<space/>

<wd l="8885" t="5530" r="9283" b="5688">until</wd>

<space/>

<wd l="9350" t="5530" r="9562" b="5688">all</wd>

<space/>

<wd l="9648" t="5534" r="9830" b="5688">13</wd>

<space/>

<wd l="9902" t="5530" r="10498" b="5717">values,</wd>

<space/>

</ln>

<ln l="6144" t="5798" r="10512" b="6000" baseLine="5947" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5822" r="6312" b="5957">to</wd>

<space/>

<wd l="6379" t="5822" r="6643" b="6000">get</wd>

<space/>

<wd l="6696" t="5798" r="6960" b="5957">the</wd>

<space/>

<wd l="7022" t="5798" r="7618" b="5957">classes</wd>

<space/>

<wd l="7690" t="5798" r="7877" b="5957">of</wd>

<space/>

<wd l="7920" t="5798" r="8189" b="5957">the</wd>

<space/>

<wd l="8246" t="5798" r="8731" b="5957">token</wd>

<space/>

<wd l="8789" t="5822" r="8942" b="5957">at</wd>

<space/>

<wd l="9005" t="5851" r="9470" b="6000">every</wd>

<space/>

<wd l="9533" t="5798" r="9946" b="5957">level</wd>

<space/>

<wd l="10008" t="5798" r="10200" b="5957">of</wd>

<space/>

<wd l="10243" t="5798" r="10512" b="5957">the</wd>

<space/>

</ln>

<ln l="6144" t="6067" r="7128" b="6269" baseLine="6221" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6067" r="6701" b="6269">binary</wd>

<space/>

<wd l="6758" t="6091" r="7128" b="6226">tree.</wd>

</ln>

</para>

<para l="6144" t="6610" r="8938" b="6768" alignment="left" spaceBefore="288" lsp="exactly" lspExact="249" language="en">

<ln l="6144" t="6610" r="8938" b="6768" baseLine="6758" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">

<wd l="6144" t="6610" r="6413" b="6768">3.2</wd>

<space/>

<wd l="6638" t="6614" r="6974" b="6768">Use</wd>

<space/>

<wd l="7037" t="6610" r="7224" b="6768">of</wd>

<space/>

<wd l="7267" t="6610" r="7944" b="6768">Lexical</wd>

<space/>

<wd l="8006" t="6614" r="8938" b="6768">Resources</wd>

</ln>

</para>

<para l="6144" t="7008" r="10526" b="12629" alignment="justified" ri="144" spaceBefore="150" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="7008" r="10502" b="7210" baseLine="7162" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="7013" r="6379" b="7166">As</wd>

<space/>

<wd l="6490" t="7008" r="6859" b="7210">they</wd>

<space/>

<wd l="6965" t="7061" r="7387" b="7166">were</wd>

<space/>

<wd l="7493" t="7008" r="8218" b="7166">attached</wd>

<space/>

<wd l="8314" t="7008" r="8702" b="7166">with</wd>

<space/>

<wd l="8803" t="7008" r="9072" b="7166">the</wd>

<space/>

<wd l="9178" t="7008" r="9950" b="7166">available</wd>

<space/>

<wd l="10051" t="7008" r="10502" b="7166">base-</wd>

</ln>

<ln l="6144" t="7282" r="10512" b="7483" baseLine="7430" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="7282" r="6518" b="7469">line,</wd>

<space/>

<wd l="6586" t="7334" r="6840" b="7440">we</wd>

<space/>

<wd l="6902" t="7282" r="7762" b="7483">processed</wd>

<space/>

<wd l="7824" t="7334" r="7920" b="7440">a</wd>

<space/>

<wd l="7982" t="7306" r="8218" b="7440">set</wd>

<space/>

<wd l="8280" t="7282" r="8472" b="7440">of</wd>

<space/>

<wd l="8520" t="7282" r="9010" b="7483">entity</wd>

<space/>

<wd l="9077" t="7282" r="10133" b="7440">dictionaries.</wd>

<space/>

<wd l="10224" t="7286" r="10512" b="7440">We</wd>

<space/>

</ln>

<ln l="6144" t="7550" r="10507" b="7709" baseLine="7704" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="7550" r="6547" b="7709">tried</wd>

<space/>

<wd l="6643" t="7574" r="6806" b="7709">to</wd>

<space/>

<wd l="6912" t="7550" r="7694" b="7709">associate</wd>

<space/>

<wd l="7790" t="7550" r="8237" b="7709">these</wd>

<space/>

<wd l="8338" t="7550" r="9346" b="7709">dictionaries</wd>

<space/>

<wd l="9446" t="7550" r="9835" b="7709">with</wd>

<space/>

<wd l="9931" t="7550" r="10195" b="7709">the</wd>

<space/>

<wd l="10315" t="7555" r="10507" b="7709">10</wd>

<space/>

</ln>

<ln l="6144" t="7824" r="10512" b="8026" baseLine="7973" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="7848" r="6600" b="8026">types</wd>

<space/>

<wd l="6686" t="7824" r="6878" b="7982">of</wd>

<space/>

<wd l="6946" t="7824" r="7565" b="7982">entities</wd>

<space/>

<wd l="7651" t="7824" r="8290" b="7982">defined</wd>

<space/>

<wd l="8366" t="7824" r="8626" b="7982">for</wd>

<space/>

<wd l="8698" t="7824" r="8962" b="7982">the</wd>

<space/>

<wd l="9048" t="7824" r="9610" b="7982">shared</wd>

<space/>

<wd l="9686" t="7824" r="10080" b="7982">task.</wd>

<space/>

<wd l="10224" t="7829" r="10512" b="7982">We</wd>

<space/>

</ln>

<ln l="6149" t="8088" r="10507" b="8294" baseLine="8246" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="8093" r="6778" b="8251">deleted</wd>

<space/>

<wd l="6835" t="8093" r="7742" b="8294">duplicated</wd>

<space/>

<wd l="7805" t="8093" r="8165" b="8251">data</wd>

<space/>

<wd l="8227" t="8098" r="8467" b="8290">(as</wd>

<space/>

<wd l="8530" t="8146" r="8784" b="8251">we</wd>

<space/>

<wd l="8842" t="8093" r="9216" b="8294">kept</wd>

<space/>

<wd l="9278" t="8093" r="9658" b="8294">only</wd>

<space/>

<wd l="9720" t="8098" r="10507" b="8294">cap.1000</wd>

<space/>

</ln>

<ln l="6144" t="8366" r="10512" b="8568" baseLine="8515" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="8366" r="6422" b="8525">but</wd>

<space/>

<wd l="6518" t="8390" r="6797" b="8525">not</wd>

<space/>

<wd l="6902" t="8371" r="7469" b="8568">cap.10</wd>

<space/>

<wd l="7570" t="8419" r="7862" b="8525">nor</wd>

<space/>

<wd l="7963" t="8366" r="8534" b="8554">others,</wd>

<space/>

<wd l="8659" t="8371" r="9024" b="8563">etc).</wd>

<space/>

<wd l="9235" t="8366" r="9686" b="8525">Then</wd>

<space/>

<wd l="9782" t="8419" r="10037" b="8525">we</wd>

<space/>

<wd l="10138" t="8366" r="10512" b="8525">read</wd>

<space/>

</ln>

<ln l="6149" t="8635" r="10502" b="8837" baseLine="8789" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="8688" r="6619" b="8837">every</wd>

<space/>

<wd l="6730" t="8635" r="7123" b="8794">item</wd>

<space/>

<wd l="7234" t="8635" r="7426" b="8794">of</wd>

<space/>

<wd l="7522" t="8635" r="7786" b="8794">the</wd>

<space/>

<wd l="7896" t="8635" r="8290" b="8794">lists.</wd>

<space/>

<wd l="8534" t="8640" r="8770" b="8794">As</wd>

<space/>

<wd l="8894" t="8688" r="9346" b="8794">some</wd>

<space/>

<wd l="9456" t="8635" r="9922" b="8794">items</wd>

<space/>

<wd l="10046" t="8635" r="10502" b="8832">(enti-</wd>

</ln>

<ln l="6144" t="8909" r="10512" b="9106" baseLine="9058" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="8909" r="6509" b="9106">ties)</wd>

<space/>

<wd l="6614" t="8909" r="7253" b="9067">contain</wd>

<space/>

<wd l="7339" t="8962" r="7786" b="9067">more</wd>

<space/>

<wd l="7872" t="8909" r="8246" b="9067">than</wd>

<space/>

<wd l="8342" t="8962" r="8650" b="9067">one</wd>

<space/>

<wd l="8741" t="8909" r="9264" b="9096">token,</wd>

<space/>

<wd l="9374" t="8962" r="9624" b="9067">we</wd>

<space/>

<wd l="9720" t="8909" r="10512" b="9067">extracted</wd>

<space/>

</ln>

<ln l="6144" t="9178" r="10502" b="9379" baseLine="9331" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="9178" r="6413" b="9336">the</wd>

<space/>

<wd l="6494" t="9178" r="6830" b="9336">first</wd>

<space/>

<wd l="6902" t="9178" r="7464" b="9336">tokens</wd>

<space/>

<wd l="7555" t="9182" r="7805" b="9374">(or</wd>

<space/>

<wd l="7877" t="9178" r="8141" b="9336">the</wd>

<space/>

<wd l="8222" t="9178" r="8602" b="9379">only</wd>

<space/>

<wd l="8678" t="9178" r="9163" b="9336">token</wd>

<space/>

<wd l="9240" t="9178" r="9499" b="9336">for</wd>

<space/>

<wd l="9571" t="9178" r="10502" b="9336">one-token-</wd>

</ln>

<ln l="6149" t="9451" r="10507" b="9653" baseLine="9600" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="9451" r="6840" b="9648">entities)</wd>

<space/>

<wd l="6960" t="9451" r="7272" b="9610">and</wd>

<space/>

<wd l="7373" t="9451" r="7642" b="9610">the</wd>

<space/>

<wd l="7747" t="9451" r="8626" b="9653">remaining</wd>

<space/>

<wd l="8741" t="9504" r="9130" b="9610">ones</wd>

<space/>

<wd l="9240" t="9451" r="9797" b="9610">before</wd>

<space/>

<wd l="9917" t="9451" r="10507" b="9653">storing</wd>

<space/>

</ln>

<ln l="6144" t="9720" r="10502" b="9922" baseLine="9869" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="9720" r="6586" b="9878">them</wd>

<space/>

<wd l="6686" t="9720" r="7022" b="9878">into</wd>

<space/>

<wd l="7133" t="9720" r="7877" b="9878">different</wd>

<space/>

<wd l="7978" t="9720" r="8376" b="9878">lists.</wd>

<space/>

<wd l="8606" t="9725" r="8875" b="9907">So,</wd>

<space/>

<wd l="9005" t="9720" r="9259" b="9878">for</wd>

<space/>

<wd l="9365" t="9773" r="9835" b="9922">every</wd>

<space/>

<wd l="9946" t="9720" r="10502" b="9878">dictio-</wd>

</ln>

<ln l="6144" t="9994" r="10507" b="10195" baseLine="10142" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="10046" r="6528" b="10195">nary</wd>

<space/>

<wd l="6600" t="10046" r="6854" b="10152">we</wd>

<space/>

<wd l="6922" t="9994" r="7277" b="10181">had,</wd>

<space/>

<wd l="7358" t="10046" r="7613" b="10152">we</wd>

<space/>

<wd l="7685" t="9994" r="8309" b="10152">created</wd>

<space/>

<wd l="8381" t="9998" r="8482" b="10147">2</wd>

<space/>

<wd l="8549" t="9994" r="8942" b="10152">lists:</wd>

<space/>

<wd l="9058" t="10046" r="9154" b="10152">a</wd>

<space/>

<wd l="9221" t="9994" r="10507" b="10195">”B-dictionary”</wd>

<space/>

</ln>

<ln l="6149" t="10262" r="10502" b="10464" baseLine="10411" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="10262" r="6461" b="10421">and</wd>

<space/>

<wd l="6581" t="10315" r="6677" b="10421">a</wd>

<space/>

<wd l="6792" t="10262" r="8054" b="10464">”I-dictionary”,</wd>

<space/>

<wd l="8194" t="10262" r="9024" b="10464">preparing</wd>

<space/>

<wd l="9144" t="10262" r="9408" b="10421">the</wd>

<space/>

<wd l="9523" t="10267" r="9898" b="10421">BIO</wd>

<space/>

<wd l="10013" t="10262" r="10502" b="10421">label-</wd>

</ln>

<ln l="6144" t="10531" r="10507" b="10733" baseLine="10685" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="10531" r="6552" b="10733">ings.</wd>

<space/>

<wd l="6638" t="10531" r="7286" b="10733">Finally,</wd>

<space/>

<wd l="7354" t="10584" r="7608" b="10690">we</wd>

<space/>

<wd l="7666" t="10531" r="8534" b="10733">integrated</wd>

<space/>

<wd l="8592" t="10531" r="9038" b="10690">these</wd>

<space/>

<wd l="9101" t="10531" r="10109" b="10690">dictionaries</wd>

<space/>

<wd l="10171" t="10531" r="10507" b="10690">into</wd>

<space/>

</ln>

<ln l="6144" t="10805" r="10526" b="11006" baseLine="10954" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="10805" r="6413" b="10963">the</wd>

<space/>

<wd l="6499" t="10805" r="7042" b="10963">model</wd>

<space/>

<wd l="7138" t="10805" r="7349" b="11006">by</wd>

<space/>

<wd l="7445" t="10805" r="7997" b="11006">binary</wd>

<space/>

<wd l="8088" t="10805" r="8683" b="10963">values.</wd>

<space/>

<wd l="8866" t="10810" r="9168" b="10963">For</wd>

<space/>

<wd l="9259" t="10805" r="9658" b="10963">each</wd>

<space/>

<wd l="9744" t="10805" r="10267" b="10992">token,</wd>

<space/>

<wd l="10378" t="10805" r="10526" b="10958">if</wd>

<space/>

</ln>

<ln l="6144" t="11074" r="10502" b="11275" baseLine="11227" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="11074" r="6269" b="11232">it</wd>

<space/>

<wd l="6370" t="11074" r="6504" b="11232">is</wd>

<space/>

<wd l="6614" t="11098" r="7248" b="11275">present</wd>

<space/>

<wd l="7349" t="11074" r="7517" b="11227">in</wd>

<space/>

<wd l="7622" t="11126" r="7718" b="11232">a</wd>

<space/>

<wd l="7824" t="11074" r="8698" b="11275">dictionary</wd>

<space/>

<wd l="8813" t="11074" r="9979" b="11275">(B-dictionary</wd>

<space/>

<wd l="10085" t="11126" r="10267" b="11232">or</wd>

<space/>

<wd l="10368" t="11078" r="10502" b="11227">I-</wd>

</ln>

<ln l="6149" t="11347" r="10502" b="11549" baseLine="11496" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="11347" r="7147" b="11549">dictionary),</wd>

<space/>

<wd l="7262" t="11347" r="7459" b="11506">its</wd>

<space/>

<wd l="7560" t="11347" r="8026" b="11506">value</wd>

<space/>

<wd l="8122" t="11347" r="8381" b="11506">for</wd>

<space/>

<wd l="8472" t="11347" r="8736" b="11506">the</wd>

<space/>

<wd l="8837" t="11347" r="10075" b="11549">corresponding</wd>

<space/>

<wd l="10171" t="11347" r="10502" b="11506">fea-</wd>

</ln>

<ln l="6144" t="11616" r="10512" b="11803" baseLine="11770" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="11640" r="6485" b="11774">ture</wd>

<space/>

<wd l="6566" t="11616" r="6701" b="11774">is</wd>

<space/>

<wd l="6797" t="11640" r="7032" b="11774">set</wd>

<space/>

<wd l="7109" t="11640" r="7277" b="11774">to</wd>

<space/>

<wd l="7382" t="11621" r="7512" b="11803">1,</wd>

<space/>

<wd l="7613" t="11616" r="7925" b="11774">and</wd>

<space/>

<wd l="8006" t="11621" r="8107" b="11774">0</wd>

<space/>

<wd l="8198" t="11616" r="9082" b="11774">otherwise.</wd>

<space/>

<wd l="9235" t="11616" r="9614" b="11774">And</wd>

<space/>

<wd l="9691" t="11669" r="9946" b="11774">we</wd>

<space/>

<wd l="10032" t="11616" r="10512" b="11774">could</wd>

<space/>

</ln>

<ln l="6149" t="11890" r="10512" b="12091" baseLine="12038" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="11890" r="6739" b="12091">always</wd>

<space/>

<wd l="6854" t="11914" r="7094" b="12091">try</wd>

<space/>

<wd l="7205" t="11890" r="7594" b="12048">with</wd>

<space/>

<wd l="7704" t="11890" r="8150" b="12048">other</wd>

<space/>

<wd l="8251" t="11942" r="9154" b="12048">ressources</wd>

<space/>

<wd l="9269" t="11890" r="9590" b="12048">like</wd>

<space/>

<wd l="9701" t="11894" r="10512" b="12048">FreeBase</wd>

<space/>

</ln>

<ln l="6149" t="12154" r="10517" b="12360" baseLine="12312">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-1"><wd l="6149" t="12163" r="9398" b="12355">https://www.freebase.com/</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="9466" t="12158" r="9778" b="12317">and</wd>

<space/>

<wd l="9826" t="12158" r="10517" b="12360">dbpedia</wd>

<space/>

</run>

</ln>

<ln l="6149" t="12437" r="8678" b="12629" baseLine="12581">

<wd l="6149" t="12437" r="8678" b="12629"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-1">http://dbpedia.org/</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="12984" r="9667" b="13205" alignment="left" spaceBefore="280" lsp="exactly" lspExact="279" language="en">

<ln l="6144" t="12984" r="9667" b="13205" baseLine="13147" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">

<wd l="6144" t="12984" r="6259" b="13152">4</wd>

<space/>

<wd l="6509" t="12984" r="7061" b="13157">Some</wd>

<space/>

<wd l="7123" t="12984" r="8419" b="13205">Experiments</wd>

<space/>

<wd l="8486" t="12989" r="8866" b="13157">and</wd>

<space/>

<wd l="8933" t="12989" r="9667" b="13157">Results</wd>

</ln>

</para>

<para l="6144" t="13478" r="10526" b="15264" alignment="justified" ri="144" spaceBefore="204" spaceAfter="5" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="13478" r="10502" b="13680" baseLine="13632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13478" r="6576" b="13637">With</wd>

<space/>

<wd l="6667" t="13478" r="6931" b="13637">the</wd>

<space/>

<wd l="7027" t="13478" r="7858" b="13680">templates</wd>

<space/>

<wd l="7963" t="13478" r="8602" b="13637">defined</wd>

<space/>

<wd l="8693" t="13478" r="8866" b="13632">in</wd>

<space/>

<wd l="8957" t="13478" r="9226" b="13637">the</wd>

<space/>

<wd l="9322" t="13478" r="10056" b="13680">previous</wd>

<space/>

<wd l="10171" t="13531" r="10502" b="13637">sec-</wd>

</ln>

<ln l="6144" t="13752" r="10512" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13752" r="6528" b="13939">tion,</wd>

<space/>

<wd l="6648" t="13805" r="6898" b="13910">we</wd>

<space/>

<wd l="6998" t="13752" r="7397" b="13910">used</wd>

<space/>

<wd l="7493" t="13795" r="8088" b="13954">rprop+</wd>

<space/>

<wd l="8189" t="13805" r="8357" b="13910">as</wd>

<space/>

<wd l="8467" t="13752" r="9566" b="13954">optimization</wd>

<space/>

<wd l="9667" t="13752" r="10512" b="13954">algorithm</wd>

<space/>

</ln>

<ln l="6144" t="14021" r="10507" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14021" r="6317" b="14174">in</wd>

<space/>

<wd l="6427" t="14021" r="7003" b="14222">Wapiti</wd>

<space/>

<wd l="7123" t="14021" r="7435" b="14179">and</wd>

<space/>

<wd l="7546" t="14074" r="7795" b="14179">we</wd>

<space/>

<wd l="7915" t="14021" r="8189" b="14179">did</wd>

<space/>

<wd l="8314" t="14074" r="8760" b="14179">some</wd>

<space/>

<wd l="8880" t="14021" r="9931" b="14222">experiments</wd>

<space/>

<wd l="10061" t="14021" r="10507" b="14222">(only</wd>

<space/>

</ln>

<ln l="6144" t="14294" r="10502" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14294" r="6533" b="14453">with</wd>

<space/>

<wd l="6614" t="14294" r="6883" b="14453">the</wd>

<space/>

<wd l="6989" t="14299" r="7181" b="14453">10</wd>

<space/>

<wd l="7267" t="14294" r="7910" b="14453">distinct</wd>

<space/>

<wd l="7987" t="14318" r="8443" b="14496">types</wd>

<space/>

<wd l="8534" t="14294" r="8726" b="14453">of</wd>

<space/>

<wd l="8798" t="14294" r="9490" b="14491">entities)</wd>

<space/>

<wd l="9581" t="14294" r="9970" b="14453">with</wd>

<space/>

<wd l="10051" t="14294" r="10502" b="14453">mod-</wd>

</ln>

<ln l="6149" t="14563" r="10512" b="14750" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="14563" r="6379" b="14722">els</wd>

<space/>

<wd l="6466" t="14563" r="7070" b="14722">trained</wd>

<space/>

<wd l="7147" t="14563" r="7536" b="14722">with</wd>

<space/>

<wd l="7618" t="14563" r="8198" b="14722">”train”</wd>

<space/>

<wd l="8290" t="14563" r="8602" b="14722">and</wd>

<space/>

<wd l="8674" t="14563" r="9187" b="14722">tested</wd>

<space/>

<wd l="9264" t="14616" r="9480" b="14722">on</wd>

<space/>

<wd l="9562" t="14563" r="10104" b="14750">”dev”,</wd>

<space/>

<wd l="10200" t="14563" r="10512" b="14722">and</wd>

<space/>

</ln>

<ln l="6144" t="14837" r="10526" b="14995" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14837" r="6538" b="14995">later</wd>

<space/>

<wd l="6581" t="14837" r="7094" b="14995">tested</wd>

<space/>

<wd l="7142" t="14890" r="7358" b="14995">on</wd>

<space/>

<wd l="7411" t="14837" r="7810" b="14995">”dev</wd>

<space/>

<wd l="7896" t="14837" r="8467" b="14995">2015”.</wd>

<space/>

<wd l="8544" t="14837" r="9024" b="14995">Table</wd>

<space/>

<wd l="9077" t="14842" r="9178" b="14990">2</wd>

<space/>

<wd l="9240" t="14837" r="9763" b="14995">shows</wd>

<space/>

<wd l="9830" t="14890" r="10282" b="14995">some</wd>

<space/>

<wd l="10334" t="14837" r="10526" b="14995">of</wd>

<space/>

</ln>

<ln l="6144" t="15106" r="7262" b="15264" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="15106" r="6595" b="15264">these</wd>

<space/>

<wd l="6648" t="15106" r="7262" b="15264">results.</wd>

</ln>

</para>

</column>

</section>

<dd l="1323" t="15736" r="10644" b="15977">

<para l="5804" t="15787" r="6143" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5870" t="15787" r="6077" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="39">

<wd l="5870" t="15787" r="6077" b="15946">69</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4309.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1318" marginTop="1248" marginRight="1270" marginBottom="1302" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1318" t="1248" r="10639" b="15356">

<column l="1318" t="1248" r="5858" b="15356">

<para l="1445" t="1306" r="5323" b="1810" alignment="left" li="432" ri="504" spaceBefore="13" fli="-360" lsp="exactly" lspExact="278" language="en">

<ln l="1445" t="1306" r="5323" b="1526" baseLine="1474" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="1310" r="1555" b="1478">5</wd>

<space/>

<wd l="1810" t="1306" r="2290" b="1478">CRF</wd>

<space/>

<wd l="2352" t="1310" r="2995" b="1478">Model</wd>

<space/>

<wd l="3067" t="1306" r="3946" b="1526">Training</wd>

<space/>

<wd l="4013" t="1306" r="4454" b="1478">with</wd>

<space/>

<wd l="4517" t="1306" r="5323" b="1478">Domain</wd>

<space/>

</ln>

<ln l="1800" t="1589" r="3504" b="1810" baseLine="1752" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1800" t="1594" r="2290" b="1762">Data</wd>

<space/>

<wd l="2352" t="1589" r="3504" b="1810">Adaptation</wd>

</ln>

</para>

<para l="1440" t="2054" r="5808" b="3614" alignment="justified" li="72" spaceBefore="177" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="2054" r="5808" b="2256" baseLine="2208" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2059" r="1675" b="2213">As</wd>

<space/>

<wd l="1771" t="2107" r="2026" b="2213">we</wd>

<space/>

<wd l="2117" t="2107" r="2414" b="2213">can</wd>

<space/>

<wd l="2515" t="2107" r="2784" b="2213">see</wd>

<space/>

<wd l="2870" t="2054" r="3043" b="2208">in</wd>

<space/>

<wd l="3130" t="2054" r="3394" b="2213">the</wd>

<space/>

<wd l="3485" t="2054" r="4219" b="2256">previous</wd>

<space/>

<wd l="4330" t="2054" r="4978" b="2242">section,</wd>

<space/>

<wd l="5093" t="2107" r="5381" b="2213">our</wd>

<space/>

<wd l="5472" t="2054" r="5808" b="2213">first</wd>

<space/>

</ln>

<ln l="1440" t="2328" r="5794" b="2530" baseLine="2477" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2328" r="1982" b="2486">model</wd>

<space/>

<wd l="2088" t="2328" r="2866" b="2530">performs</wd>

<space/>

<wd l="2976" t="2328" r="3542" b="2530">poorly</wd>

<space/>

<wd l="3653" t="2381" r="3864" b="2486">on</wd>

<space/>

<wd l="3970" t="2328" r="4272" b="2486">dev</wd>

<space/>

<wd l="4358" t="2328" r="4776" b="2486">2105</wd>

<space/>

<wd l="4896" t="2328" r="5261" b="2486">data</wd>

<space/>

<wd l="5362" t="2381" r="5794" b="2486">com-</wd>

</ln>

<ln l="1440" t="2597" r="5808" b="2798" baseLine="2750" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2597" r="1925" b="2798">pared</wd>

<space/>

<wd l="2045" t="2621" r="2213" b="2755">to</wd>

<space/>

<wd l="2338" t="2597" r="2674" b="2755">dev.</wd>

<space/>

<wd l="2952" t="2597" r="3331" b="2755">This</wd>

<space/>

<wd l="3466" t="2621" r="4190" b="2798">suggests</wd>

<space/>

<wd l="4315" t="2597" r="4646" b="2755">that</wd>

<space/>

<wd l="4766" t="2597" r="5030" b="2755">the</wd>

<space/>

<wd l="5155" t="2597" r="5520" b="2755">data</wd>

<space/>

<wd l="5635" t="2597" r="5808" b="2750">in</wd>

<space/>

</ln>

<ln l="1445" t="2870" r="5803" b="3072" baseLine="3019" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="2870" r="1747" b="3029">dev</wd>

<space/>

<wd l="1834" t="2870" r="2251" b="3029">2015</wd>

<space/>

<wd l="2347" t="2923" r="2606" b="3029">are</wd>

<space/>

<wd l="2683" t="2923" r="3062" b="3072">very</wd>

<space/>

<wd l="3149" t="2870" r="3893" b="3029">different</wd>

<space/>

<wd l="3965" t="2870" r="4392" b="3029">from</wd>

<space/>

<wd l="4469" t="2870" r="4733" b="3029">the</wd>

<space/>

<wd l="4814" t="2870" r="5179" b="3029">data</wd>

<space/>

<wd l="5251" t="2870" r="5419" b="3024">in</wd>

<space/>

<wd l="5501" t="2870" r="5803" b="3029">dev</wd>

<space/>

</ln>

<ln l="1445" t="3139" r="5794" b="3298" baseLine="3288" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="3139" r="1757" b="3298">and</wd>

<space/>

<wd l="1853" t="3139" r="2299" b="3298">train.</wd>

<space/>

<wd l="2510" t="3139" r="2890" b="3298">This</wd>

<space/>

<wd l="2995" t="3139" r="3739" b="3298">intuition</wd>

<space/>

<wd l="3835" t="3139" r="4118" b="3298">has</wd>

<space/>

<wd l="4224" t="3139" r="4810" b="3298">indeed</wd>

<space/>

<wd l="4906" t="3139" r="5318" b="3298">been</wd>

<space/>

<wd l="5424" t="3192" r="5794" b="3298">con-</wd>

</ln>

<ln l="1445" t="3413" r="4190" b="3614" baseLine="3562" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="3413" r="2011" b="3571">firmed</wd>

<space/>

<wd l="2064" t="3413" r="2280" b="3614">by</wd>

<space/>

<wd l="2342" t="3466" r="2438" b="3571">a</wd>

<space/>

<wd l="2491" t="3413" r="2976" b="3614">quick</wd>

<space/>

<wd l="3034" t="3413" r="3394" b="3571">data</wd>

<space/>

<wd l="3451" t="3413" r="4190" b="3614">analysis.</wd>

</ln>

</para>

<para l="1440" t="3696" r="5808" b="9048" alignment="justified" li="72" spaceBefore="13" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="3696" r="5808" b="3898" baseLine="3845" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="3701" r="1891" b="3854">As</wd>

<space/>

<wd l="1978" t="3749" r="2074" b="3854">a</wd>

<space/>

<wd l="2141" t="3749" r="3298" b="3898">consequence,</wd>

<space/>

<wd l="3384" t="3749" r="3634" b="3854">we</wd>

<space/>

<wd l="3706" t="3696" r="4022" b="3854">had</wd>

<space/>

<wd l="4090" t="3696" r="4358" b="3854">the</wd>

<space/>

<wd l="4430" t="3696" r="4795" b="3854">idea</wd>

<space/>

<wd l="4862" t="3720" r="5030" b="3854">to</wd>

<space/>

<wd l="5102" t="3696" r="5808" b="3898">perform</wd>

<space/>

</ln>

<ln l="1445" t="3965" r="5803" b="4166" baseLine="4118" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="4018" r="1541" b="4123">a</wd>

<space/>

<wd l="1603" t="3965" r="1992" b="4123">kind</wd>

<space/>

<wd l="2059" t="3965" r="2251" b="4123">of</wd>

<space/>

<wd l="2309" t="3965" r="2962" b="4123">domain</wd>

<space/>

<wd l="3029" t="3965" r="3394" b="4123">data</wd>

<space/>

<wd l="3461" t="3965" r="4406" b="4166">adaptation,</wd>

<space/>

<wd l="4488" t="3965" r="5189" b="4166">inspired</wd>

<space/>

<wd l="5256" t="3965" r="5467" b="4166">by</wd>

<space/>

<wd l="5539" t="3965" r="5803" b="4123">the</wd>

<space/>

</ln>

<ln l="1440" t="4238" r="5798" b="4440" baseLine="4387" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="4238" r="1886" b="4397">work</wd>

<space/>

<wd l="1982" t="4238" r="2174" b="4397">of</wd>

<space/>

<wd l="2261" t="4238" r="3173" b="4440">(Raymond</wd>

<space/>

<wd l="3269" t="4238" r="3581" b="4397">and</wd>

<space/>

<wd l="3667" t="4238" r="4363" b="4440">Fayolle,</wd>

<space/>

<wd l="4478" t="4243" r="5026" b="4435">2010).</wd>

<space/>

<wd l="5218" t="4243" r="5400" b="4392">In</wd>

<space/>

<wd l="5491" t="4238" r="5798" b="4397">this</wd>

<space/>

</ln>

<ln l="1445" t="4507" r="5798" b="4709" baseLine="4661">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1445" t="4531" r="2122" b="4694">context,</wd>

<space/>

<wd l="2189" t="4507" r="2453" b="4666">the</wd>

<space/>

<wd l="2510" t="4507" r="2875" b="4666">data</wd>

<space/>

<wd l="2923" t="4560" r="3178" b="4666">we</wd>

<space/>

<wd l="3235" t="4531" r="3658" b="4666">want</wd>

<space/>

<wd l="3710" t="4531" r="3874" b="4666">to</wd>

<space/>

<wd l="3936" t="4507" r="4406" b="4709">adapt</wd>

<space/>

<wd l="4459" t="4507" r="4594" b="4666">is</wd>

<space/>

<wd l="4661" t="4507" r="5179" b="4666">called</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="5232" t="4560" r="5798" b="4666">source</wd>

<space/>

</run>

</ln>

<ln l="1440" t="4781" r="5803" b="4982" baseLine="4930">

<wd l="1440" t="4781" r="2136" b="4939"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">domain</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="2275" t="4786" r="2458" b="4934">In</wd>

<space/>

<wd l="2534" t="4834" r="2827" b="4939">our</wd>

<space/>

<wd l="2899" t="4834" r="3317" b="4968">case,</wd>

<space/>

<wd l="3403" t="4781" r="3806" b="4939">train</wd>

<space/>

<wd l="3883" t="4781" r="4195" b="4939">and</wd>

<space/>

<wd l="4272" t="4781" r="4574" b="4939">dev</wd>

<space/>

<wd l="4656" t="4781" r="5021" b="4939">data</wd>

<space/>

<wd l="5088" t="4781" r="5462" b="4982">play</wd>

<space/>

<wd l="5539" t="4781" r="5803" b="4939">the</wd>

<space/>

</run>

</ln>

<ln l="1440" t="5050" r="5794" b="5251" baseLine="5203">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="5050" r="1781" b="5208">role</wd>

<space/>

<wd l="1848" t="5050" r="2035" b="5208">of</wd>

<space/>

<wd l="2083" t="5050" r="2390" b="5208">this</wd>

<space/>

<wd l="2472" t="5102" r="3034" b="5208">source</wd>

<space/>

<wd l="3101" t="5050" r="3792" b="5208">domain.</wd>

<space/>

<wd l="3893" t="5050" r="4234" b="5208">The</wd>

<space/>

<wd l="4296" t="5050" r="4632" b="5208">role</wd>

<space/>

<wd l="4704" t="5050" r="4891" b="5208">of</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="4944" t="5083" r="5458" b="5251">target</wd>

<space/>

<wd l="5515" t="5050" r="5794" b="5208">do-</wd>

</run>

</ln>

<ln l="1440" t="5323" r="5808" b="5525" baseLine="5472">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="5333" r="1872" b="5482">main</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1954" t="5323" r="2093" b="5482">is</wd>

<space/>

<wd l="2179" t="5323" r="2760" b="5525">played</wd>

<space/>

<wd l="2837" t="5323" r="3053" b="5525">by</wd>

<space/>

<wd l="3134" t="5323" r="3398" b="5482">the</wd>

<space/>

<wd l="3480" t="5376" r="3830" b="5482">new</wd>

<space/>

<wd l="3917" t="5323" r="4555" b="5482">version</wd>

<space/>

<wd l="4637" t="5323" r="4829" b="5482">of</wd>

<space/>

<wd l="4891" t="5347" r="5366" b="5482">tweet</wd>

<space/>

<wd l="5448" t="5323" r="5808" b="5482">data</wd>

<space/>

</run>

</ln>

<ln l="1440" t="5592" r="5794" b="5794" baseLine="5746" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="5592" r="2213" b="5794">provided</wd>

<space/>

<wd l="2261" t="5592" r="2520" b="5750">for</wd>

<space/>

<wd l="2563" t="5592" r="2827" b="5750">the</wd>

<space/>

<wd l="2885" t="5592" r="3446" b="5750">shared</wd>

<space/>

<wd l="3494" t="5592" r="3888" b="5779">task,</wd>

<space/>

<wd l="3946" t="5592" r="4277" b="5750">that</wd>

<space/>

<wd l="4325" t="5592" r="4459" b="5750">is</wd>

<space/>

<wd l="4522" t="5592" r="4819" b="5750">dev</wd>

<space/>

<wd l="4910" t="5592" r="5328" b="5750">2105</wd>

<space/>

<wd l="5390" t="5592" r="5794" b="5750">data.</wd>

<space/>

</ln>

<ln l="1440" t="5866" r="5794" b="6067" baseLine="6014" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="5866" r="1781" b="6024">The</wd>

<space/>

<wd l="1829" t="5866" r="2626" b="6067">approach</wd>

<space/>

<wd l="2678" t="5866" r="3509" b="6024">described</wd>

<space/>

<wd l="3552" t="5866" r="3725" b="6019">in</wd>

<space/>

<wd l="3782" t="5866" r="4694" b="6067">(Raymond</wd>

<space/>

<wd l="4742" t="5866" r="5054" b="6024">and</wd>

<space/>

<wd l="5098" t="5866" r="5794" b="6067">Fayolle,</wd>

<space/>

</ln>

<ln l="1445" t="6134" r="5808" b="6336" baseLine="6283" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="6139" r="1939" b="6331">2010)</wd>

<space/>

<wd l="1997" t="6134" r="2510" b="6293">mixes</wd>

<space/>

<wd l="2568" t="6134" r="3283" b="6336">together</wd>

<space/>

<wd l="3336" t="6134" r="3696" b="6293">data</wd>

<space/>

<wd l="3744" t="6134" r="4171" b="6293">from</wd>

<space/>

<wd l="4214" t="6134" r="4483" b="6293">the</wd>

<space/>

<wd l="4541" t="6187" r="5102" b="6293">source</wd>

<space/>

<wd l="5155" t="6134" r="5808" b="6293">domain</wd>

<space/>

</ln>

<ln l="1445" t="6408" r="5803" b="6610" baseLine="6557" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="6408" r="1757" b="6566">and</wd>

<space/>

<wd l="1805" t="6408" r="2232" b="6566">from</wd>

<space/>

<wd l="2280" t="6408" r="2544" b="6566">the</wd>

<space/>

<wd l="2597" t="6432" r="3091" b="6610">target</wd>

<space/>

<wd l="3144" t="6408" r="3797" b="6566">domain</wd>

<space/>

<wd l="3845" t="6408" r="4018" b="6562">in</wd>

<space/>

<wd l="4070" t="6408" r="4531" b="6566">order</wd>

<space/>

<wd l="4574" t="6432" r="4742" b="6566">to</wd>

<space/>

<wd l="4795" t="6408" r="5198" b="6566">train</wd>

<space/>

<wd l="5251" t="6461" r="5347" b="6566">a</wd>

<space/>

<wd l="5400" t="6413" r="5803" b="6566">CRF</wd>

<space/>

</ln>

<ln l="1440" t="6677" r="5798" b="6878" baseLine="6826" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="6677" r="2030" b="6835">model.</wd>

<space/>

<wd l="2179" t="6677" r="2515" b="6835">The</wd>

<space/>

<wd l="2602" t="6677" r="3504" b="6878">originality</wd>

<space/>

<wd l="3590" t="6677" r="3778" b="6835">of</wd>

<space/>

<wd l="3845" t="6677" r="4152" b="6835">this</wd>

<space/>

<wd l="4243" t="6677" r="5040" b="6878">approach</wd>

<space/>

<wd l="5122" t="6677" r="5798" b="6835">consists</wd>

<space/>

</ln>

<ln l="1440" t="6946" r="5808" b="7147" baseLine="7099" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="6946" r="1613" b="7099">in</wd>

<space/>

<wd l="1661" t="6946" r="2131" b="7147">using</wd>

<space/>

<wd l="2184" t="6998" r="2630" b="7104">more</wd>

<space/>

<wd l="2688" t="6950" r="3091" b="7104">CRF</wd>

<space/>

<wd l="3144" t="6946" r="3826" b="7104">features</wd>

<space/>

<wd l="3883" t="6946" r="4142" b="7104">for</wd>

<space/>

<wd l="4186" t="6946" r="4454" b="7104">the</wd>

<space/>

<wd l="4502" t="6974" r="4843" b="7147">part</wd>

<space/>

<wd l="4901" t="6946" r="5088" b="7104">of</wd>

<space/>

<wd l="5126" t="6946" r="5390" b="7104">the</wd>

<space/>

<wd l="5448" t="6946" r="5808" b="7104">data</wd>

<space/>

</ln>

<ln l="1445" t="7219" r="5803" b="7421" baseLine="7368" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="7219" r="2467" b="7421">constituting</wd>

<space/>

<wd l="2520" t="7219" r="2784" b="7378">the</wd>

<space/>

<wd l="2832" t="7243" r="3326" b="7421">target</wd>

<space/>

<wd l="3379" t="7219" r="4027" b="7378">domain</wd>

<space/>

<wd l="4075" t="7219" r="4454" b="7378">than</wd>

<space/>

<wd l="4498" t="7219" r="5179" b="7378">features</wd>

<space/>

<wd l="5237" t="7219" r="5496" b="7378">for</wd>

<space/>

<wd l="5539" t="7219" r="5803" b="7378">the</wd>

<space/>

</ln>

<ln l="1445" t="7488" r="5794" b="7690" baseLine="7642" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="7488" r="1810" b="7646">data</wd>

<space/>

<wd l="1886" t="7488" r="2909" b="7690">constituting</wd>

<space/>

<wd l="2986" t="7488" r="3254" b="7646">the</wd>

<space/>

<wd l="3341" t="7541" r="3898" b="7646">source</wd>

<space/>

<wd l="3984" t="7488" r="4675" b="7646">domain.</wd>

<space/>

<wd l="4819" t="7488" r="5160" b="7646">The</wd>

<space/>

<wd l="5242" t="7541" r="5794" b="7646">conse-</wd>

</ln>

<ln l="1445" t="7762" r="5803" b="7963" baseLine="7910" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="7814" r="2059" b="7963">quence</wd>

<space/>

<wd l="2112" t="7762" r="2304" b="7920">of</wd>

<space/>

<wd l="2342" t="7762" r="2650" b="7920">this</wd>

<space/>

<wd l="2712" t="7762" r="3278" b="7920">choice</wd>

<space/>

<wd l="3331" t="7762" r="3466" b="7920">is</wd>

<space/>

<wd l="3528" t="7762" r="3854" b="7920">that</wd>

<space/>

<wd l="3907" t="7762" r="4171" b="7920">the</wd>

<space/>

<wd l="4229" t="7766" r="4637" b="7920">CRF</wd>

<space/>

<wd l="4690" t="7762" r="5309" b="7920">models</wd>

<space/>

<wd l="5371" t="7762" r="5803" b="7920">learn</wd>

<space/>

</ln>

<ln l="1440" t="8030" r="5808" b="8232" baseLine="8184" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="8030" r="2381" b="8189">word-label</wd>

<space/>

<wd l="2462" t="8030" r="3624" b="8232">dependencies</wd>

<space/>

<wd l="3706" t="8030" r="4133" b="8189">from</wd>

<space/>

<wd l="4200" t="8030" r="4589" b="8189">both</wd>

<space/>

<wd l="4666" t="8030" r="5443" b="8218">domains,</wd>

<space/>

<wd l="5530" t="8030" r="5808" b="8189">but</wd>

<space/>

</ln>

<ln l="1440" t="8304" r="5808" b="8506" baseLine="8453" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="8328" r="1718" b="8506">put</wd>

<space/>

<wd l="1786" t="8304" r="2270" b="8462">much</wd>

<space/>

<wd l="2342" t="8328" r="3053" b="8506">stronger</wd>

<space/>

<wd l="3115" t="8304" r="4094" b="8506">importance</wd>

<space/>

<wd l="4171" t="8304" r="4838" b="8501">(feature</wd>

<space/>

<wd l="4915" t="8309" r="5510" b="8501">scores)</wd>

<space/>

<wd l="5592" t="8357" r="5808" b="8462">on</wd>

<space/>

</ln>

<ln l="1440" t="8573" r="5794" b="8774" baseLine="8726" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="8573" r="2122" b="8731">features</wd>

<space/>

<wd l="2213" t="8573" r="2386" b="8726">in</wd>

<space/>

<wd l="2467" t="8573" r="2731" b="8731">the</wd>

<space/>

<wd l="2818" t="8597" r="3312" b="8774">target</wd>

<space/>

<wd l="3398" t="8573" r="4090" b="8760">domain,</wd>

<space/>

<wd l="4200" t="8573" r="4637" b="8731">since</wd>

<space/>

<wd l="4723" t="8573" r="5093" b="8774">they</wd>

<space/>

<wd l="5184" t="8626" r="5443" b="8731">are</wd>

<space/>

<wd l="5530" t="8573" r="5794" b="8731">de-</wd>

</ln>

<ln l="1450" t="8846" r="4862" b="9048" baseLine="8995" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1450" t="8846" r="2074" b="9005">scribed</wd>

<space/>

<wd l="2126" t="8846" r="2338" b="9048">by</wd>

<space/>

<wd l="2395" t="8899" r="2846" b="9005">more</wd>

<space/>

<wd l="2899" t="8846" r="3931" b="9005">information</wd>

<space/>

<wd l="3994" t="8846" r="4862" b="9043">(features).</wd>

</ln>

</para>

<para l="1440" t="9130" r="5808" b="11501" alignment="justified" li="72" spaceBefore="14" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="9130" r="5794" b="9331" baseLine="9278" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="9134" r="1944" b="9288">We</wd>

<space/>

<wd l="2093" t="9130" r="2938" b="9288">annotated</wd>

<space/>

<wd l="3091" t="9130" r="3994" b="9288">afterwards</wd>

<space/>

<wd l="4147" t="9130" r="4416" b="9288">the</wd>

<space/>

<wd l="4560" t="9130" r="5237" b="9331">training</wd>

<space/>

<wd l="5390" t="9130" r="5794" b="9317">data,</wd>

<space/>

</ln>

<ln l="1440" t="9403" r="5803" b="9605" baseLine="9552" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9403" r="1973" b="9562">which</wd>

<space/>

<wd l="2064" t="9456" r="2318" b="9562">we</wd>

<space/>

<wd l="2410" t="9403" r="2813" b="9562">have</wd>

<space/>

<wd l="2904" t="9403" r="3542" b="9605">already</wd>

<space/>

<wd l="3643" t="9456" r="4022" b="9562">seen</wd>

<space/>

<wd l="4114" t="9403" r="4675" b="9605">during</wd>

<space/>

<wd l="4771" t="9403" r="5035" b="9562">the</wd>

<space/>

<wd l="5126" t="9403" r="5803" b="9605">training</wd>

<space/>

</ln>

<ln l="1440" t="9672" r="5794" b="9874" baseLine="9821" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9672" r="1982" b="9874">phase,</wd>

<space/>

<wd l="2078" t="9672" r="2467" b="9830">with</wd>

<space/>

<wd l="2554" t="9672" r="2947" b="9830">such</wd>

<space/>

<wd l="3029" t="9725" r="3125" b="9830">a</wd>

<space/>

<wd l="3202" t="9672" r="3792" b="9830">model.</wd>

<space/>

<wd l="3946" t="9672" r="4104" b="9826">If</wd>

<space/>

<wd l="4171" t="9672" r="4440" b="9830">the</wd>

<space/>

<wd l="4517" t="9672" r="5059" b="9830">model</wd>

<space/>

<wd l="5150" t="9725" r="5443" b="9830">can</wd>

<space/>

<wd l="5530" t="9725" r="5794" b="9874">ap-</wd>

</ln>

<ln l="1440" t="9941" r="5794" b="10142" baseLine="10094" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9941" r="1714" b="10142">ply</wd>

<space/>

<wd l="1776" t="9965" r="2486" b="10142">stronger</wd>

<space/>

<wd l="2539" t="9941" r="3701" b="10142">dependencies</wd>

<space/>

<wd l="3758" t="9941" r="4402" b="10099">learned</wd>

<space/>

<wd l="4450" t="9941" r="4877" b="10099">from</wd>

<space/>

<wd l="4925" t="9941" r="5189" b="10099">the</wd>

<space/>

<wd l="5242" t="9965" r="5794" b="10142">target-</wd>

</ln>

<ln l="1445" t="10214" r="5808" b="10416" baseLine="10363" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="10214" r="2098" b="10373">domain</wd>

<space/>

<wd l="2150" t="10243" r="2491" b="10416">part</wd>

<space/>

<wd l="2544" t="10214" r="2736" b="10373">of</wd>

<space/>

<wd l="2774" t="10214" r="3043" b="10373">the</wd>

<space/>

<wd l="3096" t="10214" r="3773" b="10416">training</wd>

<space/>

<wd l="3835" t="10214" r="4234" b="10402">data,</wd>

<space/>

<wd l="4301" t="10214" r="4421" b="10373">it</wd>

<space/>

<wd l="4474" t="10214" r="4805" b="10373">will</wd>

<space/>

<wd l="4872" t="10214" r="5347" b="10416">apply</wd>

<space/>

<wd l="5414" t="10214" r="5808" b="10373">such</wd>

<space/>

</ln>

<ln l="1445" t="10483" r="5794" b="10685" baseLine="10637" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="10483" r="2606" b="10685">dependencies</wd>

<space/>

<wd l="2707" t="10483" r="3686" b="10685">performing</wd>

<space/>

<wd l="3782" t="10483" r="4138" b="10642">thus</wd>

<space/>

<wd l="4238" t="10483" r="4502" b="10642">the</wd>

<space/>

<wd l="4603" t="10483" r="5227" b="10642">desired</wd>

<space/>

<wd l="5328" t="10483" r="5794" b="10685">adap-</wd>

</ln>

<ln l="1440" t="10757" r="5798" b="10958" baseLine="10906" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="10757" r="1982" b="10915">tation.</wd>

<space/>

<wd l="2136" t="10757" r="3024" b="10915">Otherwise</wd>

<space/>

<wd l="3106" t="10757" r="3230" b="10915">it</wd>

<space/>

<wd l="3302" t="10757" r="3643" b="10915">will</wd>

<space/>

<wd l="3725" t="10757" r="4205" b="10958">apply</wd>

<space/>

<wd l="4286" t="10757" r="4550" b="10915">the</wd>

<space/>

<wd l="4637" t="10757" r="5798" b="10958">dependencies</wd>

<space/>

</ln>

<ln l="1440" t="11026" r="5794" b="11227" baseLine="11179" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="11026" r="2083" b="11184">learned</wd>

<space/>

<wd l="2150" t="11026" r="2578" b="11184">from</wd>

<space/>

<wd l="2640" t="11026" r="2909" b="11184">the</wd>

<space/>

<wd l="2986" t="11026" r="4277" b="11184">source-domain</wd>

<space/>

<wd l="4339" t="11054" r="4685" b="11227">part</wd>

<space/>

<wd l="4752" t="11026" r="4944" b="11184">of</wd>

<space/>

<wd l="4997" t="11026" r="5266" b="11184">the</wd>

<space/>

<wd l="5333" t="11026" r="5794" b="11184">train-</wd>

</ln>

<ln l="1440" t="11299" r="5026" b="11501" baseLine="11448" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="11299" r="1714" b="11501">ing</wd>

<space/>

<wd l="1776" t="11299" r="2179" b="11486">data,</wd>

<space/>

<wd l="2246" t="11299" r="2602" b="11458">thus</wd>

<space/>

<wd l="2664" t="11299" r="3350" b="11501">keeping</wd>

<space/>

<wd l="3408" t="11299" r="3672" b="11458">the</wd>

<space/>

<wd l="3734" t="11299" r="4008" b="11458">old</wd>

<space/>

<wd l="4066" t="11299" r="5026" b="11458">annotation.</wd>

</ln>

</para>

<para l="1440" t="11582" r="5808" b="15307" alignment="justified" li="72" spaceBefore="17" spaceAfter="33" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="11582" r="5794" b="11784" baseLine="11736" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="11587" r="1944" b="11741">We</wd>

<space/>

<wd l="2030" t="11582" r="2410" b="11784">only</wd>

<space/>

<wd l="2496" t="11582" r="3134" b="11784">applied</wd>

<space/>

<wd l="3221" t="11635" r="3418" b="11741">an</wd>

<space/>

<wd l="3509" t="11582" r="4776" b="11784">approximation</wd>

<space/>

<wd l="4862" t="11582" r="5050" b="11741">of</wd>

<space/>

<wd l="5117" t="11582" r="5424" b="11741">this</wd>

<space/>

<wd l="5520" t="11582" r="5794" b="11741">do-</wd>

</ln>

<ln l="1440" t="11856" r="5794" b="12058" baseLine="12005" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11856" r="1877" b="12014">main</wd>

<space/>

<wd l="1934" t="11856" r="2842" b="12058">adaptation</wd>

<space/>

<wd l="2894" t="11856" r="3768" b="12058">procedure</wd>

<space/>

<wd l="3830" t="11856" r="4018" b="12014">of</wd>

<space/>

<wd l="4070" t="11856" r="4982" b="12058">(Raymond</wd>

<space/>

<wd l="5045" t="11856" r="5357" b="12014">and</wd>

<space/>

<wd l="5410" t="11861" r="5794" b="12058">Fay-</wd>

</ln>

<ln l="1445" t="12125" r="5808" b="12322" baseLine="12278" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12125" r="1810" b="12312">olle,</wd>

<space/>

<wd l="1901" t="12130" r="2448" b="12322">2010),</wd>

<space/>

<wd l="2530" t="12125" r="3221" b="12283">because</wd>

<space/>

<wd l="3293" t="12125" r="3485" b="12283">of</wd>

<space/>

<wd l="3542" t="12178" r="3638" b="12283">a</wd>

<space/>

<wd l="3715" t="12125" r="4315" b="12283">serious</wd>

<space/>

<wd l="4392" t="12125" r="4757" b="12283">lack</wd>

<space/>

<wd l="4829" t="12125" r="5016" b="12283">of</wd>

<space/>

<wd l="5074" t="12125" r="5501" b="12283">time.</wd>

<space/>

<wd l="5626" t="12130" r="5808" b="12278">In</wd>

<space/>

</ln>

<ln l="1445" t="12398" r="5808" b="12586" baseLine="12547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12398" r="1906" b="12557">order</wd>

<space/>

<wd l="1949" t="12422" r="2117" b="12557">to</wd>

<space/>

<wd l="2174" t="12422" r="2688" b="12557">create</wd>

<space/>

<wd l="2746" t="12451" r="3034" b="12557">our</wd>

<space/>

<wd l="3086" t="12398" r="3466" b="12557">final</wd>

<space/>

<wd l="3518" t="12398" r="4104" b="12586">model,</wd>

<space/>

<wd l="4166" t="12451" r="4421" b="12557">we</wd>

<space/>

<wd l="4469" t="12398" r="5078" b="12557">trained</wd>

<space/>

<wd l="5131" t="12451" r="5419" b="12557">our</wd>

<space/>

<wd l="5472" t="12398" r="5808" b="12557">first</wd>

<space/>

</ln>

<ln l="1445" t="12667" r="5803" b="12869" baseLine="12816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12672" r="1853" b="12826">CRF</wd>

<space/>

<wd l="1920" t="12667" r="2462" b="12826">model</wd>

<space/>

<wd l="2549" t="12667" r="3000" b="12864">(with</wd>

<space/>

<wd l="3067" t="12667" r="3331" b="12826">the</wd>

<space/>

<wd l="3403" t="12667" r="4234" b="12869">templates</wd>

<space/>

<wd l="4310" t="12667" r="5232" b="12826">mentioned</wd>

<space/>

<wd l="5299" t="12667" r="5472" b="12821">in</wd>

<space/>

<wd l="5539" t="12667" r="5803" b="12826">the</wd>

<space/>

</ln>

<ln l="1440" t="12941" r="5808" b="13142" baseLine="13090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="12941" r="2179" b="13142">previous</wd>

<space/>

<wd l="2251" t="12941" r="2923" b="13138">section)</wd>

<space/>

<wd l="2990" t="12941" r="3379" b="13099">with</wd>

<space/>

<wd l="3442" t="12941" r="3739" b="13099">dev</wd>

<space/>

<wd l="3826" t="12941" r="4301" b="13099">2015.</wd>

<space/>

<wd l="4387" t="12946" r="4675" b="13099">We</wd>

<space/>

<wd l="4733" t="12941" r="5107" b="13099">then</wd>

<space/>

<wd l="5170" t="12941" r="5808" b="13142">applied</wd>

<space/>

</ln>

<ln l="1440" t="13210" r="5808" b="13368" baseLine="13358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13210" r="1747" b="13368">this</wd>

<space/>

<wd l="1853" t="13210" r="2189" b="13368">first</wd>

<space/>

<wd l="2285" t="13214" r="2693" b="13368">CRF</wd>

<space/>

<wd l="2789" t="13210" r="3331" b="13368">model</wd>

<space/>

<wd l="3427" t="13234" r="3595" b="13368">to</wd>

<space/>

<wd l="3691" t="13210" r="4094" b="13368">train</wd>

<space/>

<wd l="4190" t="13210" r="4502" b="13368">and</wd>

<space/>

<wd l="4598" t="13210" r="4901" b="13368">dev</wd>

<space/>

<wd l="4997" t="13234" r="5165" b="13368">to</wd>

<space/>

<wd l="5266" t="13210" r="5808" b="13368">obtain</wd>

<space/>

</ln>

<ln l="1440" t="13478" r="5808" b="13666" baseLine="13632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13478" r="1843" b="13637">train</wd>

<space/>

<wd l="1925" t="13478" r="2174" b="13637">crf</wd>

<space/>

<wd l="2242" t="13478" r="2554" b="13637">and</wd>

<space/>

<wd l="2630" t="13478" r="2933" b="13637">dev</wd>

<space/>

<wd l="3019" t="13478" r="3302" b="13637">crf.</wd>

<space/>

<wd l="3446" t="13483" r="3715" b="13666">So,</wd>

<space/>

<wd l="3811" t="13478" r="4258" b="13637">these</wd>

<space/>

<wd l="4339" t="13478" r="4699" b="13637">data</wd>

<space/>

<wd l="4776" t="13531" r="5040" b="13637">are</wd>

<space/>

<wd l="5117" t="13478" r="5808" b="13637">labelled</wd>

<space/>

</ln>

<ln l="1440" t="13752" r="5794" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13752" r="1829" b="13910">with</wd>

<space/>

<wd l="1896" t="13805" r="2184" b="13910">our</wd>

<space/>

<wd l="2251" t="13752" r="2587" b="13910">first</wd>

<space/>

<wd l="2650" t="13757" r="3058" b="13910">CRF</wd>

<space/>

<wd l="3120" t="13752" r="3710" b="13910">model.</wd>

<space/>

<wd l="3811" t="13757" r="4099" b="13910">We</wd>

<space/>

<wd l="4166" t="13776" r="4440" b="13954">got</wd>

<space/>

<wd l="4502" t="13752" r="4747" b="13910">rid</wd>

<space/>

<wd l="4814" t="13752" r="5002" b="13910">of</wd>

<space/>

<wd l="5054" t="13752" r="5318" b="13910">the</wd>

<space/>

<wd l="5386" t="13752" r="5794" b="13954">orig-</wd>

</ln>

<ln l="1440" t="14021" r="5803" b="14208" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="14021" r="1766" b="14179">inal</wd>

<space/>

<wd l="1834" t="14021" r="2338" b="14179">labels</wd>

<space/>

<wd l="2410" t="14021" r="2669" b="14179">for</wd>

<space/>

<wd l="2731" t="14021" r="3134" b="14179">train</wd>

<space/>

<wd l="3206" t="14021" r="3518" b="14179">and</wd>

<space/>

<wd l="3586" t="14021" r="3922" b="14179">dev.</wd>

<space/>

<wd l="4037" t="14021" r="4459" b="14208">And,</wd>

<space/>

<wd l="4541" t="14021" r="4709" b="14174">in</wd>

<space/>

<wd l="4776" t="14021" r="5045" b="14179">the</wd>

<space/>

<wd l="5117" t="14021" r="5467" b="14208">end,</wd>

<space/>

<wd l="5549" t="14074" r="5803" b="14179">we</wd>

<space/>

</ln>

<ln l="1440" t="14294" r="5794" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="14294" r="2050" b="14453">trained</wd>

<space/>

<wd l="2098" t="14347" r="2386" b="14453">our</wd>

<space/>

<wd l="2429" t="14294" r="2813" b="14453">final</wd>

<space/>

<wd l="2861" t="14294" r="3403" b="14453">model</wd>

<space/>

<wd l="3461" t="14294" r="4114" b="14496">(always</wd>

<space/>

<wd l="4166" t="14294" r="4555" b="14453">with</wd>

<space/>

<wd l="4603" t="14294" r="4867" b="14453">the</wd>

<space/>

<wd l="4920" t="14347" r="5362" b="14453">same</wd>

<space/>

<wd l="5405" t="14318" r="5794" b="14453">tem-</wd>

</ln>

<ln l="1440" t="14563" r="5794" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="14563" r="2011" b="14765">plates)</wd>

<space/>

<wd l="2078" t="14563" r="2467" b="14722">with</wd>

<space/>

<wd l="2525" t="14563" r="2827" b="14722">dev</wd>

<space/>

<wd l="2914" t="14563" r="3389" b="14750">2015,</wd>

<space/>

<wd l="3456" t="14563" r="3859" b="14722">train</wd>

<space/>

<wd l="3941" t="14563" r="4190" b="14722">crf</wd>

<space/>

<wd l="4238" t="14563" r="4550" b="14722">and</wd>

<space/>

<wd l="4608" t="14563" r="4910" b="14722">dev</wd>

<space/>

<wd l="4997" t="14563" r="5246" b="14722">crf</wd>

<space/>

<wd l="5294" t="14563" r="5506" b="14722">all</wd>

<space/>

<wd l="5563" t="14587" r="5794" b="14722">to-</wd>

</ln>

<ln l="1445" t="14837" r="5798" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="14837" r="2016" b="15038">gether.</wd>

<space/>

<wd l="2093" t="14842" r="2376" b="14995">We</wd>

<space/>

<wd l="2429" t="14837" r="2702" b="14995">did</wd>

<space/>

<wd l="2746" t="14837" r="3014" b="14995">the</wd>

<space/>

<wd l="3067" t="14890" r="3509" b="14995">same</wd>

<space/>

<wd l="3552" t="14837" r="4426" b="15038">procedure</wd>

<space/>

<wd l="4469" t="14837" r="4728" b="14995">for</wd>

<space/>

<wd l="4771" t="14837" r="5035" b="14995">the</wd>

<space/>

<wd l="5107" t="14842" r="5294" b="14995">10</wd>

<space/>

<wd l="5347" t="14861" r="5798" b="15038">types</wd>

<space/>

</ln>

<ln l="1445" t="15106" r="5794" b="15307" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="15106" r="2064" b="15264">entities</wd>

<space/>

<wd l="2136" t="15106" r="2448" b="15264">and</wd>

<space/>

<wd l="2510" t="15106" r="2770" b="15264">for</wd>

<space/>

<wd l="2827" t="15158" r="3043" b="15264">no</wd>

<space/>

<wd l="3106" t="15106" r="3595" b="15307">typed</wd>

<space/>

<wd l="3658" t="15106" r="4061" b="15264">data.</wd>

<space/>

<wd l="4171" t="15110" r="4507" b="15264">Our</wd>

<space/>

<wd l="4565" t="15106" r="5126" b="15264">results</wd>

<space/>

<wd l="5203" t="15158" r="5462" b="15264">are</wd>

<space/>

<wd l="5530" t="15106" r="5794" b="15264">de-</wd>

</run>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>

</run>

</ln>

</para>

</column>

<column l="6099" t="1248" r="10639" b="15356">

<table l="6408" t="1258" r="10253" b="2102" alignment="left" li="309" ri="386" spaceBefore="10" spaceAfter="152">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>974</gridCol>

<gridCol>1042</gridCol>

<gridCol>912</gridCol>

<gridCol>917</gridCol>

<gridRow>283</gridRow>

<gridRow>279</gridRow>

<gridRow>282</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6408" t="1258" r="7382" b="1541" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7502" t="1301" r="8304" b="1502" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="7502" t="1301" r="8304" b="1502" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="7502" t="1301" r="8304" b="1502">precision</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8635" t="1301" r="9115" b="1459" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="8635" t="1301" r="9115" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="8635" t="1301" r="9110" b="1459">recall</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9600" t="1306" r="9955" b="1454" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="9600" t="1306" r="9955" b="1454" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="9600" t="1306" r="9955" b="1454">FB1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6552" t="1584" r="7258" b="1781" alignment="centered" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<ln l="6552" t="1584" r="7258" b="1781" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6552" t="1584" r="6744" b="1738">10</wd>

<space/>

<wd l="6802" t="1603" r="7258" b="1781">types</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7570" t="1579" r="8232" b="1738" alignment="centered" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<ln l="7570" t="1579" r="8232" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="7570" t="1579" r="8232" b="1738">55.17%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8602" t="1579" r="9149" b="1738" alignment="centered" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<ln l="8602" t="1579" r="9149" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="8602" t="1579" r="9149" b="1738">9.68%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9475" t="1579" r="10118" b="1738" alignment="centered" spaceAfter="28" lsp="exactly" lspExact="245" language="en">

<ln l="9475" t="1579" r="10118" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="9475" t="1579" r="10118" b="1738">16.47%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6571" t="1867" r="7219" b="2059" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="6571" t="1867" r="7219" b="2059" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6571" t="1910" r="6787" b="2016">no</wd>

<space/>

<wd l="6845" t="1882" r="7219" b="2059">type</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7570" t="1858" r="8232" b="2016" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="7570" t="1858" r="8232" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="7570" t="1858" r="8232" b="2016">58.42%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8549" t="1858" r="9206" b="2016" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="8549" t="1858" r="9206" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="8549" t="1858" r="9206" b="2016">25.72%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="9456" t="1858" r="10118" b="2016" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="9456" t="1858" r="10118" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="9456" t="1858" r="10118" b="2016">35.71%</wd>

</ln>

</para>

</cell>

</table>

<para l="6144" t="2314" r="10498" b="2789" alignment="justified" ri="72" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="2314" r="10498" b="2472" baseLine="2467" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2314" r="6624" b="2472">Table</wd>

<space/>

<wd l="6696" t="2318" r="6845" b="2472">3:</wd>

<space/>

<wd l="6955" t="2314" r="7589" b="2472">Results</wd>

<space/>

<wd l="7661" t="2314" r="8050" b="2472">with</wd>

<space/>

<wd l="8117" t="2314" r="8659" b="2472">model</wd>

<space/>

<wd l="8731" t="2314" r="9336" b="2472">trained</wd>

<space/>

<wd l="9408" t="2366" r="9619" b="2472">on</wd>

<space/>

<wd l="9691" t="2314" r="9994" b="2472">dev</wd>

<space/>

<wd l="10080" t="2314" r="10498" b="2472">2015</wd>

<space/>

</ln>

<ln l="6144" t="2587" r="9043" b="2789" baseLine="2736" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2587" r="6523" b="2746">then</wd>

<space/>

<wd l="6581" t="2587" r="7219" b="2789">applied</wd>

<space/>

<wd l="7272" t="2611" r="7440" b="2746">to</wd>

<space/>

<wd l="7498" t="2587" r="7896" b="2746">train</wd>

<space/>

<wd l="7958" t="2587" r="8266" b="2746">and</wd>

<space/>

<wd l="8328" t="2587" r="8626" b="2746">dev</wd>

<space/>

<wd l="8688" t="2587" r="9043" b="2746">files</wd>

</ln>

</para>

<para l="6154" t="3331" r="7742" b="3490" alignment="justified" ri="72" spaceBefore="473" lsp="exactly" lspExact="271" language="en">

<ln l="6154" t="3331" r="7742" b="3490" baseLine="3480" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="3331" r="6778" b="3490">scribed</wd>

<space/>

<wd l="6830" t="3331" r="7003" b="3485">in</wd>

<space/>

<wd l="7056" t="3331" r="7531" b="3490">Table</wd>

<space/>

<wd l="7594" t="3336" r="7742" b="3490">3.</wd>

</ln>

</para>

<para l="6144" t="3600" r="10517" b="6509" alignment="justified" ri="72" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6370" t="3600" r="10517" b="3802" baseLine="3754" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="3600" r="7272" b="3802">Compared</wd>

<space/>

<wd l="7354" t="3624" r="7517" b="3758">to</wd>

<space/>

<wd l="7603" t="3600" r="8165" b="3758">results</wd>

<space/>

<wd l="8251" t="3600" r="8640" b="3758">with</wd>

<space/>

<wd l="8726" t="3600" r="9024" b="3758">dev</wd>

<space/>

<wd l="9110" t="3600" r="9586" b="3787">2015,</wd>

<space/>

<wd l="9686" t="3653" r="9936" b="3758">we</wd>

<space/>

<wd l="10018" t="3600" r="10334" b="3758">had</wd>

<space/>

<wd l="10421" t="3653" r="10517" b="3758">a</wd>

<space/>

</ln>

<ln l="6144" t="3874" r="10502" b="4075" baseLine="4022" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3874" r="6648" b="4032">better</wd>

<space/>

<wd l="6720" t="3874" r="7565" b="4075">precision,</wd>

<space/>

<wd l="7661" t="3874" r="8194" b="4032">which</wd>

<space/>

<wd l="8280" t="3874" r="9029" b="4032">confirms</wd>

<space/>

<wd l="9115" t="3874" r="9446" b="4032">that</wd>

<space/>

<wd l="9523" t="3874" r="9787" b="4032">the</wd>

<space/>

<wd l="9874" t="3874" r="10502" b="4075">adapta-</wd>

</ln>

<ln l="6144" t="4142" r="10517" b="4344" baseLine="4296" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4142" r="6485" b="4301">tion</wd>

<space/>

<wd l="6576" t="4195" r="6907" b="4301">was</wd>

<space/>

<wd l="7008" t="4142" r="7517" b="4301">worth</wd>

<space/>

<wd l="7613" t="4142" r="8146" b="4344">doing.</wd>

<space/>

<wd l="8338" t="4147" r="9130" b="4301">However</wd>

<space/>

<wd l="9216" t="4195" r="9470" b="4301">we</wd>

<space/>

<wd l="9566" t="4142" r="9912" b="4301">also</wd>

<space/>

<wd l="10008" t="4142" r="10325" b="4301">had</wd>

<space/>

<wd l="10421" t="4195" r="10517" b="4301">a</wd>

<space/>

</ln>

<ln l="6144" t="4416" r="10502" b="4618" baseLine="4565" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4416" r="6634" b="4574">much</wd>

<space/>

<wd l="6691" t="4469" r="7210" b="4574">worse</wd>

<space/>

<wd l="7272" t="4416" r="7800" b="4603">recall,</wd>

<space/>

<wd l="7872" t="4416" r="8410" b="4574">which</wd>

<space/>

<wd l="8472" t="4416" r="8957" b="4574">could</wd>

<space/>

<wd l="9014" t="4416" r="9221" b="4574">be</wd>

<space/>

<wd l="9293" t="4469" r="10094" b="4618">someway</wd>

<space/>

<wd l="10162" t="4469" r="10502" b="4618">pre-</wd>

</ln>

<ln l="6149" t="4685" r="10517" b="4843" baseLine="4834" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="4685" r="6682" b="4843">dicted</wd>

<space/>

<wd l="6782" t="4685" r="7219" b="4843">since</wd>

<space/>

<wd l="7315" t="4685" r="7579" b="4843">the</wd>

<space/>

<wd l="7680" t="4685" r="7982" b="4843">dev</wd>

<space/>

<wd l="8069" t="4685" r="8486" b="4843">2015</wd>

<space/>

<wd l="8597" t="4685" r="8962" b="4843">data</wd>

<space/>

<wd l="9053" t="4685" r="9187" b="4843">is</wd>

<space/>

<wd l="9288" t="4685" r="9778" b="4843">much</wd>

<space/>

<wd l="9878" t="4685" r="10517" b="4843">smaller</wd>

<space/>

</ln>

<ln l="6144" t="4958" r="10507" b="5160" baseLine="5107" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4958" r="6518" b="5117">than</wd>

<space/>

<wd l="6576" t="4958" r="6840" b="5117">the</wd>

<space/>

<wd l="6893" t="4958" r="7570" b="5160">training</wd>

<space/>

<wd l="7627" t="4958" r="8030" b="5117">data.</wd>

<space/>

<wd l="8107" t="4963" r="8246" b="5117">It</wd>

<space/>

<wd l="8294" t="4958" r="8650" b="5117">thus</wd>

<space/>

<wd l="8717" t="4982" r="9307" b="5117">creates</wd>

<space/>

<wd l="9374" t="5011" r="9470" b="5117">a</wd>

<space/>

<wd l="9528" t="4958" r="10128" b="5117">serious</wd>

<space/>

<wd l="10190" t="4958" r="10507" b="5117">low</wd>

<space/>

</ln>

<ln l="6149" t="5227" r="10512" b="5429" baseLine="5376" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="5227" r="6898" b="5429">covering</wd>

<space/>

<wd l="6950" t="5227" r="7718" b="5429">problem.</wd>

<space/>

<wd l="7800" t="5227" r="8232" b="5386">Such</wd>

<space/>

<wd l="8280" t="5227" r="9010" b="5429">problem</wd>

<space/>

<wd l="9058" t="5280" r="9355" b="5386">can</wd>

<space/>

<wd l="9403" t="5227" r="9610" b="5386">be</wd>

<space/>

<wd l="9662" t="5280" r="10512" b="5386">overcome</wd>

<space/>

</ln>

<ln l="6144" t="5496" r="10502" b="5698" baseLine="5650" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5496" r="6360" b="5698">by</wd>

<space/>

<wd l="6470" t="5496" r="7224" b="5698">applying</wd>

<space/>

<wd l="7330" t="5496" r="7594" b="5654">the</wd>

<space/>

<wd l="7699" t="5520" r="8155" b="5654">exact</wd>

<space/>

<wd l="8256" t="5496" r="9163" b="5698">adaptation</wd>

<space/>

<wd l="9259" t="5496" r="10133" b="5698">procedure</wd>

<space/>

<wd l="10238" t="5496" r="10502" b="5654">de-</wd>

</ln>

<ln l="6154" t="5770" r="10517" b="5971" baseLine="5918" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="5770" r="6778" b="5928">scribed</wd>

<space/>

<wd l="6835" t="5770" r="7003" b="5923">in</wd>

<space/>

<wd l="7070" t="5770" r="7982" b="5971">(Raymond</wd>

<space/>

<wd l="8045" t="5770" r="8357" b="5928">and</wd>

<space/>

<wd l="8410" t="5770" r="9106" b="5971">Fayolle,</wd>

<space/>

<wd l="9178" t="5774" r="9725" b="5966">2010),</wd>

<space/>

<wd l="9797" t="5770" r="10517" b="5971">together</wd>

<space/>

</ln>

<ln l="6144" t="6038" r="10502" b="6235" baseLine="6192" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6038" r="6533" b="6197">with</wd>

<space/>

<wd l="6610" t="6038" r="6874" b="6197">the</wd>

<space/>

<wd l="6955" t="6091" r="7243" b="6197">use</wd>

<space/>

<wd l="7325" t="6038" r="7517" b="6197">of</wd>

<space/>

<wd l="7579" t="6091" r="8026" b="6197">more</wd>

<space/>

<wd l="8107" t="6038" r="8798" b="6197">external</wd>

<space/>

<wd l="8880" t="6091" r="9696" b="6197">resources</wd>

<space/>

<wd l="9792" t="6038" r="10253" b="6235">(such</wd>

<space/>

<wd l="10334" t="6091" r="10502" b="6197">as</wd>

<space/>

</ln>

<ln l="6144" t="6312" r="7142" b="6509" baseLine="6461" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6365" r="6619" b="6470">name</wd>

<space/>

<wd l="6672" t="6312" r="7142" b="6509">lists).</wd>

</ln>

</para>

<para l="6149" t="6768" r="7795" b="6941" alignment="left" ri="72" spaceBefore="201" lsp="exactly" lspExact="276" language="en">

<ln l="6149" t="6768" r="7795" b="6941" baseLine="6931" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">

<wd l="6149" t="6768" r="6259" b="6941">6</wd>

<space/>

<wd l="6504" t="6773" r="7205" b="6941">Future</wd>

<space/>

<wd l="7267" t="6773" r="7795" b="6941">work</wd>

</ln>

</para>

<para l="6144" t="7195" r="10517" b="9518" alignment="justified" ri="72" spaceBefore="137" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="7195" r="10502" b="7397" baseLine="7344" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="7200" r="6326" b="7349">In</wd>

<space/>

<wd l="6418" t="7195" r="6686" b="7354">the</wd>

<space/>

<wd l="6778" t="7195" r="7339" b="7382">future,</wd>

<space/>

<wd l="7454" t="7248" r="7704" b="7354">we</wd>

<space/>

<wd l="7805" t="7195" r="8285" b="7354">could</wd>

<space/>

<wd l="8381" t="7195" r="8587" b="7354">do</wd>

<space/>

<wd l="8693" t="7248" r="9144" b="7354">some</wd>

<space/>

<wd l="9235" t="7248" r="9811" b="7397">proper</wd>

<space/>

<wd l="9902" t="7195" r="10502" b="7397">experi-</wd>

</ln>

<ln l="6144" t="7464" r="10498" b="7666" baseLine="7618" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="7488" r="6658" b="7622">ments</wd>

<space/>

<wd l="6754" t="7464" r="6926" b="7618">in</wd>

<space/>

<wd l="7013" t="7517" r="7450" b="7622">cross</wd>

<space/>

<wd l="7546" t="7464" r="8414" b="7622">validation</wd>

<space/>

<wd l="8501" t="7464" r="8890" b="7622">with</wd>

<space/>

<wd l="8976" t="7464" r="9240" b="7622">the</wd>

<space/>

<wd l="9326" t="7464" r="10003" b="7666">training</wd>

<space/>

<wd l="10099" t="7464" r="10498" b="7651">data,</wd>

<space/>

</ln>

<ln l="6144" t="7738" r="10512" b="7939" baseLine="7886" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="7738" r="6317" b="7891">in</wd>

<space/>

<wd l="6384" t="7738" r="6845" b="7896">order</wd>

<space/>

<wd l="6902" t="7762" r="7066" b="7896">to</wd>

<space/>

<wd l="7138" t="7738" r="7474" b="7896">find</wd>

<space/>

<wd l="7536" t="7738" r="8035" b="7896">better</wd>

<space/>

<wd l="8093" t="7738" r="8976" b="7939">templates,</wd>

<space/>

<wd l="9058" t="7738" r="9365" b="7896">and</wd>

<space/>

<wd l="9432" t="7738" r="9768" b="7896">find</wd>

<space/>

<wd l="9830" t="7738" r="10094" b="7896">the</wd>

<space/>

<wd l="10162" t="7738" r="10512" b="7896">best</wd>

<space/>

</ln>

<ln l="6144" t="8006" r="10498" b="8208" baseLine="8160" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="8011" r="6365" b="8160">L1</wd>

<space/>

<wd l="6466" t="8006" r="6778" b="8165">and</wd>

<space/>

<wd l="6845" t="8011" r="7085" b="8160">L2</wd>

<space/>

<wd l="7162" t="8006" r="8371" b="8208">regularization</wd>

<space/>

<wd l="8443" t="8030" r="9389" b="8208">parameters</wd>

<space/>

<wd l="9475" t="8006" r="9667" b="8165">of</wd>

<space/>

<wd l="9725" t="8006" r="9989" b="8165">the</wd>

<space/>

<wd l="10066" t="8011" r="10498" b="8165">CRF.</wd>

<space/>

</ln>

<ln l="6144" t="8280" r="10502" b="8482" baseLine="8429" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="8285" r="6432" b="8438">We</wd>

<space/>

<wd l="6509" t="8280" r="7128" b="8438">believe</wd>

<space/>

<wd l="7210" t="8280" r="7536" b="8438">that</wd>

<space/>

<wd l="7618" t="8280" r="8386" b="8482">correctly</wd>

<space/>

<wd l="8467" t="8280" r="9442" b="8482">performing</wd>

<space/>

<wd l="9523" t="8280" r="9792" b="8438">the</wd>

<space/>

<wd l="9874" t="8280" r="10502" b="8482">adapta-</wd>

</ln>

<ln l="6144" t="8549" r="10502" b="8750" baseLine="8698" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="8549" r="6485" b="8707">tion</wd>

<space/>

<wd l="6571" t="8549" r="7440" b="8750">procedure</wd>

<space/>

<wd l="7531" t="8549" r="7723" b="8707">of</wd>

<space/>

<wd l="7805" t="8549" r="8717" b="8750">(Raymond</wd>

<space/>

<wd l="8808" t="8549" r="9120" b="8707">and</wd>

<space/>

<wd l="9202" t="8549" r="9898" b="8750">Fayolle,</wd>

<space/>

<wd l="10008" t="8554" r="10502" b="8746">2010)</wd>

<space/>

</ln>

<ln l="6149" t="8822" r="10517" b="9024" baseLine="8971" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6149" t="8822" r="6461" b="8981">and</wd>

<space/>

<wd l="6557" t="8822" r="6912" b="8981">thus</wd>

<space/>

<wd l="7022" t="8822" r="7838" b="9024">obtaining</wd>

<space/>

<wd l="7939" t="8875" r="8035" b="8981">a</wd>

<space/>

<wd l="8126" t="8822" r="8630" b="8981">better</wd>

<space/>

<wd l="8726" t="8827" r="9130" b="8981">CRF</wd>

<space/>

<wd l="9230" t="8822" r="9773" b="8981">model</wd>

<space/>

<wd l="9869" t="8822" r="10128" b="8981">for</wd>

<space/>

<wd l="10224" t="8875" r="10517" b="8981">our</wd>

<space/>

</ln>

<ln l="6144" t="9091" r="10517" b="9293" baseLine="9240" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="9091" r="6730" b="9250">named</wd>

<space/>

<wd l="6797" t="9091" r="7286" b="9293">entity</wd>

<space/>

<wd l="7358" t="9115" r="8131" b="9250">extractor</wd>

<space/>

<wd l="8194" t="9091" r="8736" b="9250">would</wd>

<space/>

<wd l="8798" t="9091" r="9163" b="9250">lead</wd>

<space/>

<wd l="9230" t="9115" r="9394" b="9250">to</wd>

<space/>

<wd l="9466" t="9091" r="9950" b="9250">much</wd>

<space/>

<wd l="10013" t="9091" r="10517" b="9250">better</wd>

<space/>

</ln>

<ln l="6144" t="9360" r="6758" b="9518" baseLine="9514" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="9360" r="6758" b="9518">results.</wd>

</ln>

</para>

<para l="6149" t="10070" r="7248" b="10243" alignment="left" ri="72" spaceBefore="455" lsp="exactly" lspExact="276" language="en">

<ln l="6149" t="10070" r="7248" b="10243" baseLine="10238" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="10070" r="7248" b="10243">References</wd>

</ln>

</para>

<para l="6144" t="10450" r="10502" b="11472" alignment="justified" li="216" ri="72" spaceBefore="110" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="10450" r="10502" b="10618" baseLine="10584" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">

<wd l="6144" t="10454" r="6557" b="10594">Peter</wd>

<space/>

<wd l="6653" t="10454" r="6787" b="10594">F.</wd>

<space/>

<wd l="6898" t="10454" r="7478" b="10618">Brown,</wd>

<space/>

<wd l="7594" t="10454" r="8006" b="10594">Peter</wd>

<space/>

<wd l="8102" t="10454" r="8261" b="10594">V.</wd>

<space/>

<wd l="8376" t="10450" r="9086" b="10618">deSouza,</wd>

<space/>

<wd l="9206" t="10450" r="9749" b="10594">Robert</wd>

<space/>

<wd l="9845" t="10454" r="10008" b="10594">L.</wd>

<space/>

<wd l="10118" t="10454" r="10502" b="10594">Mer-</wd>

</ln>

<ln l="6370" t="10670" r="10498" b="10838" baseLine="10805" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">

<wd l="6370" t="10714" r="6643" b="10838">cer,</wd>

<space/>

<wd l="6763" t="10670" r="7387" b="10814">Vincent</wd>

<space/>

<wd l="7483" t="10675" r="7598" b="10814">J.</wd>

<space/>

<wd l="7714" t="10670" r="8150" b="10814">Della</wd>

<space/>

<wd l="8246" t="10670" r="8755" b="10838">Pietra,</wd>

<space/>

<wd l="8880" t="10670" r="9168" b="10814">and</wd>

<space/>

<wd l="9269" t="10670" r="9811" b="10814">Jenifer</wd>

<space/>

<wd l="9917" t="10670" r="10080" b="10814">C.</wd>

<space/>

<wd l="10195" t="10670" r="10498" b="10814">Lai.</wd>

<space/>

</ln>

<ln l="6384" t="10886" r="10502" b="11074" baseLine="11026" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">

<wd l="6384" t="10886" r="6802" b="11030">1992.</wd>

<space/>

<wd l="6984" t="10886" r="7934" b="11030">Class-based</wd>

<space/>

<wd l="8011" t="10930" r="8592" b="11074">n-gram</wd>

<space/>

<wd l="8669" t="10886" r="9235" b="11030">models</wd>

<space/>

<wd l="9326" t="10886" r="9499" b="11030">of</wd>

<space/>

<wd l="9566" t="10886" r="10118" b="11030">natural</wd>

<space/>

<wd l="10200" t="10886" r="10502" b="11030">lan-</wd>

</ln>

<ln l="6370" t="11107" r="10502" b="11294" baseLine="11242">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6"><wd l="6370" t="11150" r="6878" b="11294">guage.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6"><wd l="7018" t="11112" r="7670" b="11290">Comput.</wd>

<space/>

</run>

<wd l="7752" t="11112" r="8501" b="11290"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">Linguist.</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6"><space/>

<wd l="8597" t="11107" r="9806" b="11285">18(4):467–479,</wd>

<space/>

<wd l="9878" t="11112" r="10502" b="11251">Decem-</wd>

</run>

</ln>

<ln l="6365" t="11328" r="6648" b="11472" baseLine="11462" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">

<wd l="6365" t="11328" r="6648" b="11472">ber.</wd>

</ln>

</para>

<para l="6144" t="11717" r="10512" b="12998" alignment="justified" li="216" ri="72" spaceBefore="165" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="11717" r="10502" b="11904" baseLine="11851" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11717" r="6859" b="11861">Matthieu</wd>

<space/>

<wd l="6970" t="11717" r="7714" b="11885">Constant,</wd>

<space/>

<wd l="7834" t="11717" r="8453" b="11861">Isabelle</wd>

<space/>

<wd l="8554" t="11717" r="9106" b="11885">Tellier,</wd>

<space/>

<wd l="9221" t="11722" r="9725" b="11904">Denys</wd>

<space/>

<wd l="9826" t="11717" r="10502" b="11885">Duchier,</wd>

<space/>

</ln>

<ln l="6365" t="11933" r="10502" b="12120" baseLine="12072" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="11938" r="6874" b="12077">Yoann</wd>

<space/>

<wd l="6950" t="11938" r="7594" b="12115">Dupont,</wd>

<space/>

<wd l="7685" t="11933" r="8376" b="12120">Anthony</wd>

<space/>

<wd l="8462" t="11933" r="9154" b="12120">Sigogne,</wd>

<space/>

<wd l="9250" t="11933" r="9538" b="12077">and</wd>

<space/>

<wd l="9619" t="11933" r="10118" b="12120">Sylvie</wd>

<space/>

<wd l="10200" t="11933" r="10502" b="12072">Bil-</wd>

</ln>

<ln l="6365" t="12154" r="10507" b="12341" baseLine="12288" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="12154" r="6614" b="12298">lot.</wd>

<space/>

<wd l="6734" t="12154" r="7166" b="12298">2011.</wd>

<space/>

<wd l="7286" t="12154" r="7915" b="12341">Intégrer</wd>

<space/>

<wd l="7982" t="12154" r="8237" b="12298">des</wd>

<space/>

<wd l="8309" t="12154" r="9427" b="12298">connaissances</wd>

<space/>

<wd l="9494" t="12154" r="10507" b="12341">linguistiques</wd>

<space/>

</ln>

<ln l="6370" t="12370" r="10512" b="12562" baseLine="12509" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="12374" r="6725" b="12518">dans</wd>

<space/>

<wd l="6816" t="12418" r="7018" b="12518">un</wd>

<space/>

<wd l="7104" t="12374" r="7478" b="12518">CRF</wd>

<space/>

<wd l="7579" t="12418" r="7603" b="12518">:</wd>

<space/>

<wd l="7709" t="12374" r="8592" b="12557">application</wd>

<space/>

<wd l="8683" t="12370" r="8770" b="12518">à</wd>

<space/>

<wd l="8851" t="12374" r="10056" b="12562">l’apprentissage</wd>

<space/>

<wd l="10152" t="12374" r="10512" b="12518">d’un</wd>

<space/>

</ln>

<ln l="6374" t="12590" r="10502" b="12778" baseLine="12729">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="12590" r="8141" b="12778">segmenteur-étiqueteur</wd>

<space/>

<wd l="8222" t="12590" r="8414" b="12734">du</wd>

<space/>

</run>

<wd l="8501" t="12590" r="9168" b="12773"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">français.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9350" t="12595" r="9518" b="12730">In</wd>

<space/>

</run>

<wd l="9605" t="12595" r="10109" b="12758"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">TALN</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="10195" t="12590" r="10502" b="12734">vol-</wd>

</run>

</ln>

<ln l="6365" t="12811" r="9859" b="12998" baseLine="12946" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="12854" r="6706" b="12955">ume</wd>

<space/>

<wd l="6778" t="12811" r="6898" b="12979">1,</wd>

<space/>

<wd l="6955" t="12854" r="7330" b="12998">page</wd>

<space/>

<wd l="7387" t="12811" r="7723" b="12979">321,</wd>

<space/>

<wd l="7781" t="12811" r="8755" b="12994">Montpellier,</wd>

<space/>

<wd l="8813" t="12816" r="9398" b="12979">France,</wd>

<space/>

<wd l="9456" t="12816" r="9859" b="12955">June.</wd>

</ln>

</para>

<para l="6144" t="13200" r="10512" b="14702" alignment="justified" li="216" ri="72" spaceBefore="164" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="13200" r="10512" b="13387" baseLine="13334" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13205" r="6605" b="13387">Jenny</wd>

<space/>

<wd l="6715" t="13205" r="6888" b="13344">R.</wd>

<space/>

<wd l="7003" t="13200" r="7555" b="13368">Finkel,</wd>

<space/>

<wd l="7685" t="13200" r="8165" b="13344">Trond</wd>

<space/>

<wd l="8275" t="13200" r="9048" b="13387">Grenager,</wd>

<space/>

<wd l="9178" t="13200" r="9466" b="13344">and</wd>

<space/>

<wd l="9576" t="13200" r="10512" b="13382">Christopher</wd>

<space/>

</ln>

<ln l="6365" t="13416" r="10502" b="13603" baseLine="13555" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="13416" r="7123" b="13603">Manning.</wd>

<space/>

<wd l="7267" t="13416" r="7699" b="13560">2005.</wd>

<space/>

<wd l="7838" t="13416" r="8923" b="13603">Incorporating</wd>

<space/>

<wd l="8995" t="13416" r="9744" b="13560">non-local</wd>

<space/>

<wd l="9816" t="13416" r="10502" b="13560">informa-</wd>

</ln>

<ln l="6365" t="13637" r="10507" b="13824" baseLine="13771" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="13637" r="6677" b="13781">tion</wd>

<space/>

<wd l="6754" t="13637" r="7061" b="13781">into</wd>

<space/>

<wd l="7147" t="13637" r="8088" b="13781">information</wd>

<space/>

<wd l="8174" t="13637" r="8962" b="13781">extraction</wd>

<space/>

<wd l="9053" t="13656" r="9667" b="13824">systems</wd>

<space/>

<wd l="9754" t="13637" r="9950" b="13824">by</wd>

<space/>

<wd l="10042" t="13637" r="10507" b="13781">Gibbs</wd>

<space/>

</ln>

<ln l="6374" t="13858" r="10502" b="14045" baseLine="13992">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="13858" r="7133" b="14045">sampling.</wd>

<space/>

<wd l="7229" t="13862" r="7397" b="13997">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7450" t="13858" r="8434" b="14040">Proceedings</wd>

<space/>

<wd l="8491" t="13858" r="8674" b="14040">of</wd>

<space/>

<wd l="8702" t="13858" r="8938" b="14002">the</wd>

<space/>

<wd l="8995" t="13858" r="9370" b="14002">43rd</wd>

<space/>

<wd l="9403" t="13858" r="9994" b="14002">Annual</wd>

<space/>

<wd l="10042" t="13862" r="10502" b="14002">Meet-</wd>

</run>

</ln>

<ln l="6374" t="14074" r="10502" b="14256" baseLine="14213">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="14078" r="6614" b="14256">ing</wd>

<space/>

<wd l="6706" t="14122" r="6898" b="14218">on</wd>

<space/>

<wd l="6970" t="14078" r="7910" b="14218">Association</wd>

<space/>

<wd l="7958" t="14074" r="8237" b="14256">for</wd>

<space/>

<wd l="8318" t="14074" r="9509" b="14256">Computational</wd>

<space/>

</run>

<wd l="9581" t="14078" r="10502" b="14256"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Linguistics</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="6365" t="14294" r="10498" b="14482" baseLine="14429" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="14294" r="6754" b="14438">ACL</wd>

<space/>

<wd l="6845" t="14294" r="7142" b="14462">’05,</wd>

<space/>

<wd l="7234" t="14338" r="7680" b="14482">pages</wd>

<space/>

<wd l="7771" t="14294" r="8506" b="14462">363–370,</wd>

<space/>

<wd l="8602" t="14294" r="9605" b="14482">Stroudsburg,</wd>

<space/>

<wd l="9701" t="14299" r="9979" b="14462">PA,</wd>

<space/>

<wd l="10061" t="14294" r="10498" b="14438">USA.</wd>

<space/>

</ln>

<ln l="6365" t="14515" r="9797" b="14702" baseLine="14650" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="14515" r="7306" b="14659">Association</wd>

<space/>

<wd l="7354" t="14515" r="7589" b="14659">for</wd>

<space/>

<wd l="7642" t="14515" r="8818" b="14698">Computational</wd>

<space/>

<wd l="8870" t="14515" r="9797" b="14702">Linguistics.</wd>

</ln>

</para>

<para l="6144" t="14899" r="10502" b="15307" alignment="justified" li="216" ri="72" spaceBefore="171" spaceAfter="37" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="14899" r="10498" b="15086" baseLine="15038">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="14899" r="6782" b="15043">Thomas</wd>

<space/>

<wd l="6845" t="14904" r="7632" b="15086">Lavergne,</wd>

<space/>

<wd l="7699" t="14899" r="8256" b="15043">Olivier</wd>

<space/>

<wd l="8318" t="14899" r="8866" b="15086">Cappé,</wd>

<space/>

<wd l="8938" t="14899" r="9221" b="15043">and</wd>

<space/>

</run>

<wd l="9278" t="14899" r="9960" b="15082"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">François</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="10022" t="14904" r="10498" b="15043">Yvon.</wd>

<space/>

</run>

</ln>

<ln l="6370" t="15120" r="10502" b="15307" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6370" t="15120" r="6802" b="15264">2010.</wd>

<space/>

<wd l="6950" t="15120" r="7642" b="15264">Practical</wd>

<space/>

<wd l="7714" t="15163" r="8064" b="15307">very</wd>

<space/>

<wd l="8136" t="15120" r="8530" b="15307">large</wd>

<space/>

<wd l="8611" t="15120" r="8995" b="15264">scale</wd>

<space/>

<wd l="9072" t="15120" r="9408" b="15264">crfs.</wd>

<space/>

<wd l="9552" t="15125" r="9720" b="15259">In</wd>

<space/>

</run>

<wd l="9787" t="15120" r="10502" b="15264" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Proceed-</wd>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<dd l="1318" t="15736" r="10639" b="15977">

<para l="5800" t="15792" r="6148" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5866" t="15792" r="6082" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="43">

<wd l="5866" t="15792" r="6082" b="15946">70</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4309.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1280" marginRight="6089" marginBottom="858" offsetX="8" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1280" r="5820" b="15980">

<column l="1440" t="1280" r="5820" b="15980">

<para l="1622" t="1334" r="5808" b="2179" alignment="justified" li="216" spaceBefore="22" lsp="exactly" lspExact="220" language="en">

<ln l="1666" t="1334" r="5803" b="1517" baseLine="1474" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1666" t="1339" r="1992" b="1517">ings</wd>

<space/>

<wd l="2059" t="1334" r="2242" b="1517">of</wd>

<space/>

<wd l="2275" t="1334" r="2515" b="1478">the</wd>

<space/>

<wd l="2578" t="1334" r="2928" b="1478">48th</wd>

<space/>

<wd l="2981" t="1334" r="3576" b="1478">Annual</wd>

<space/>

<wd l="3629" t="1339" r="4282" b="1517">Meeting</wd>

<space/>

<wd l="4354" t="1334" r="4536" b="1517">of</wd>

<space/>

<wd l="4574" t="1334" r="4810" b="1478">the</wd>

<space/>

<wd l="4862" t="1339" r="5803" b="1478">Association</wd>

<space/>

</ln>

<ln l="1622" t="1555" r="5808" b="1742" baseLine="1694">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1622" t="1555" r="1901" b="1738">for</wd>

<space/>

<wd l="1939" t="1555" r="3130" b="1738">Computational</wd>

<space/>

</run>

<wd l="3158" t="1560" r="4080" b="1738"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Linguistics</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4128" t="1555" r="4517" b="1699">ACL</wd>

<space/>

<wd l="4574" t="1555" r="4867" b="1723">’10,</wd>

<space/>

<wd l="4915" t="1598" r="5362" b="1742">pages</wd>

<space/>

<wd l="5410" t="1555" r="5808" b="1699">504–</wd>

<space/>

</run>

</ln>

<ln l="1661" t="1776" r="5798" b="1963" baseLine="1910" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="1776" r="2002" b="1944">513,</wd>

<space/>

<wd l="2083" t="1776" r="3091" b="1963">Stroudsburg,</wd>

<space/>

<wd l="3168" t="1781" r="3451" b="1944">PA,</wd>

<space/>

<wd l="3523" t="1776" r="3960" b="1920">USA.</wd>

<space/>

<wd l="4042" t="1776" r="4982" b="1920">Association</wd>

<space/>

<wd l="5050" t="1776" r="5285" b="1920">for</wd>

<space/>

<wd l="5357" t="1776" r="5798" b="1920">Com-</wd>

</ln>

<ln l="1656" t="1992" r="3427" b="2179" baseLine="2131" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="1992" r="2453" b="2174">putational</wd>

<space/>

<wd l="2506" t="1992" r="3427" b="2179">Linguistics.</wd>

</ln>

</para>

<para l="1440" t="2390" r="5808" b="3226" alignment="justified" li="216" spaceBefore="176" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="2390" r="5808" b="2578" baseLine="2530" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="2390" r="2107" b="2534">Mitchell</wd>

<space/>

<wd l="2170" t="2395" r="2299" b="2534">P.</wd>

<space/>

<wd l="2366" t="2395" r="3005" b="2558">Marcus,</wd>

<space/>

<wd l="3072" t="2390" r="3734" b="2534">Beatrice</wd>

<space/>

<wd l="3797" t="2390" r="4565" b="2558">Santorini,</wd>

<space/>

<wd l="4637" t="2390" r="4920" b="2534">and</wd>

<space/>

<wd l="4973" t="2395" r="5400" b="2578">Mary</wd>

<space/>

<wd l="5462" t="2395" r="5808" b="2530">Ann</wd>

<space/>

</ln>

<ln l="1656" t="2611" r="5808" b="2798" baseLine="2750" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="2611" r="2885" b="2755">Marcinkiewicz.</wd>

<space/>

<wd l="3062" t="2611" r="3480" b="2755">1993.</wd>

<space/>

<wd l="3634" t="2611" r="4325" b="2798">Building</wd>

<space/>

<wd l="4406" t="2654" r="4493" b="2755">a</wd>

<space/>

<wd l="4565" t="2611" r="4958" b="2798">large</wd>

<space/>

<wd l="5035" t="2611" r="5808" b="2755">annotated</wd>

<space/>

</ln>

<ln l="1661" t="2832" r="5798" b="3019" baseLine="2966">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1661" t="2875" r="2184" b="3014">corpus</wd>

<space/>

<wd l="2251" t="2832" r="2424" b="2976">of</wd>

<space/>

<wd l="2472" t="2832" r="3082" b="3019">english:</wd>

<space/>

<wd l="3173" t="2832" r="3480" b="2976">The</wd>

<space/>

<wd l="3538" t="2875" r="3926" b="3014">penn</wd>

<space/>

<wd l="3979" t="2832" r="4704" b="2976">treebank.</wd>

<space/>

</run>

<wd l="4819" t="2837" r="5798" b="2976" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">COMPUTA-</wd>

</ln>

<ln l="1666" t="3048" r="4886" b="3226" baseLine="3187">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1666" t="3053" r="2342" b="3192">TIONAL</wd>

<space/>

</run>

<wd l="2386" t="3053" r="3605" b="3216"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">LINGUISTICS</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="3682" t="3048" r="4886" b="3226">19(2):313–330.</wd>

</run>

</ln>

</para>

<para l="1440" t="3446" r="5813" b="4733" alignment="justified" li="216" spaceBefore="175" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="3446" r="5803" b="3614" baseLine="3586" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="3446" r="1992" b="3590">Farhad</wd>

<space/>

<wd l="2098" t="3446" r="3350" b="3614">Nooralahzadeh,</wd>

<space/>

<wd l="3485" t="3446" r="4162" b="3590">Caroline</wd>

<space/>

<wd l="4272" t="3451" r="4714" b="3614">Brun,</wd>

<space/>

<wd l="4848" t="3446" r="5131" b="3590">and</wd>

<space/>

<wd l="5246" t="3446" r="5803" b="3590">Claude</wd>

<space/>

</ln>

<ln l="1656" t="3667" r="5803" b="3854" baseLine="3806" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="3672" r="2126" b="3811">Roux.</wd>

<space/>

<wd l="2218" t="3667" r="2650" b="3811">2014.</wd>

<space/>

<wd l="2736" t="3672" r="3053" b="3811">Part</wd>

<space/>

<wd l="3096" t="3667" r="3269" b="3811">of</wd>

<space/>

<wd l="3307" t="3667" r="3840" b="3850">speech</wd>

<space/>

<wd l="3883" t="3667" r="4474" b="3854">tagging</wd>

<space/>

<wd l="4517" t="3667" r="4752" b="3811">for</wd>

<space/>

<wd l="4790" t="3667" r="5299" b="3811">french</wd>

<space/>

<wd l="5352" t="3667" r="5803" b="3811">social</wd>

<space/>

</ln>

<ln l="1656" t="3888" r="5808" b="4056" baseLine="4022">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1656" t="3888" r="2146" b="4032">media</wd>

<space/>

<wd l="2222" t="3888" r="2592" b="4032">data.</wd>

<space/>

<wd l="2750" t="3893" r="2918" b="4027">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="3000" t="3893" r="3725" b="4032">COLING</wd>

<space/>

<wd l="3797" t="3888" r="4224" b="4056">2014,</wd>

<space/>

<wd l="4325" t="3888" r="4675" b="4032">25th</wd>

<space/>

<wd l="4747" t="3888" r="5808" b="4032">International</wd>

<space/>

</run>

</ln>

<ln l="1666" t="4104" r="5798" b="4286" baseLine="4243" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1666" t="4104" r="2568" b="4286">Conference</wd>

<space/>

<wd l="2621" t="4152" r="2813" b="4248">on</wd>

<space/>

<wd l="2875" t="4104" r="4066" b="4286">Computational</wd>

<space/>

<wd l="4104" t="4109" r="5016" b="4286">Linguistics,</wd>

<space/>

<wd l="5083" t="4104" r="5798" b="4248">Proceed-</wd>

</ln>

<ln l="1666" t="4325" r="5813" b="4507" baseLine="4464" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1666" t="4330" r="1992" b="4507">ings</wd>

<space/>

<wd l="2074" t="4325" r="2256" b="4507">of</wd>

<space/>

<wd l="2309" t="4325" r="2544" b="4469">the</wd>

<space/>

<wd l="2640" t="4325" r="3595" b="4507">Conference:</wd>

<space/>

<wd l="3739" t="4325" r="4493" b="4469">Technical</wd>

<space/>

<wd l="4574" t="4330" r="5146" b="4507">Papers,</wd>

<space/>

<wd l="5242" t="4330" r="5813" b="4507">August</wd>

<space/>

</ln>

<ln l="1656" t="4546" r="5491" b="4733" baseLine="4680">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1656" t="4546" r="2150" b="4714">23-29,</wd>

<space/>

<wd l="2222" t="4546" r="2650" b="4714">2014,</wd>

<space/>

<wd l="2717" t="4546" r="3302" b="4714">Dublin,</wd>

<space/>

</run>

<wd l="3370" t="4546" r="3998" b="4714"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Ireland</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="4051" t="4589" r="4502" b="4733">pages</wd>

<space/>

<wd l="4574" t="4546" r="5491" b="4690">1764–1772.</wd>

</run>

</ln>

</para>

<para l="1445" t="4944" r="5803" b="6005" alignment="justified" li="216" spaceBefore="175" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1445" t="4944" r="5798" b="5131" baseLine="5078" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="1445" t="4944" r="2165" b="5088">Christian</wd>

<space/>

<wd l="2227" t="4944" r="3005" b="5131">Raymond</wd>

<space/>

<wd l="3067" t="4944" r="3350" b="5088">and</wd>

<space/>

<wd l="3408" t="4944" r="3883" b="5088">Julien</wd>

<space/>

<wd l="3941" t="4944" r="4574" b="5131">Fayolle.</wd>

<space/>

<wd l="4690" t="4944" r="5122" b="5088">2010.</wd>

<space/>

<wd l="5232" t="4949" r="5798" b="5088">Recon-</wd>

</ln>

<ln l="1656" t="5160" r="5803" b="5342" baseLine="5299" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="1656" t="5160" r="2419" b="5304">naissance</wd>

<space/>

<wd l="2462" t="5160" r="3043" b="5304">robuste</wd>

<space/>

<wd l="3086" t="5160" r="3763" b="5304">d’entités</wd>

<space/>

<wd l="3811" t="5160" r="4570" b="5304">nommées</wd>

<space/>

<wd l="4622" t="5203" r="4858" b="5304">sur</wd>

<space/>

<wd l="4901" t="5160" r="5083" b="5304">de</wd>

<space/>

<wd l="5122" t="5160" r="5270" b="5304">la</wd>

<space/>

<wd l="5309" t="5160" r="5803" b="5342">parole</wd>

<space/>

</ln>

<ln l="1656" t="5381" r="5798" b="5563" baseLine="5520">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6"><wd l="1656" t="5381" r="2395" b="5525">transcrite</wd>

<space/>

<wd l="2477" t="5381" r="3893" b="5563">automatiquement.</wd>

<space/>

<wd l="4046" t="5386" r="4214" b="5520">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6"><wd l="4291" t="5381" r="5194" b="5563">Conférence</wd>

<space/>

<wd l="5275" t="5386" r="5798" b="5525">Traite-</wd>

</run>

</ln>

<ln l="1656" t="5602" r="5798" b="5784" baseLine="5736">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6"><wd l="1656" t="5630" r="2054" b="5746">ment</wd>

<space/>

<wd l="2098" t="5606" r="3091" b="5784">automatique</wd>

<space/>

<wd l="3144" t="5602" r="3408" b="5746">des</wd>

<space/>

<wd l="3466" t="5602" r="4080" b="5784">langues</wd>

<space/>

<wd l="4133" t="5602" r="4949" b="5770">naturelles,</wd>

<space/>

</run>

<wd l="5035" t="5602" r="5798" b="5770"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">TALN’10</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6"><space/>

</run>

</ln>

<ln l="1656" t="5818" r="4987" b="6005" baseLine="5957" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="1656" t="5818" r="2434" b="5986">Montréal,</wd>

<space/>

<wd l="2491" t="5818" r="3139" b="5995">Québec,</wd>

<space/>

<wd l="3202" t="5818" r="3835" b="5986">Canada,</wd>

<space/>

<wd l="3893" t="5818" r="4253" b="6005">July.</wd>

<space/>

<wd l="4310" t="5822" r="4987" b="5962">ATALA.</wd>

</ln>

</para>

<para l="1440" t="6221" r="5803" b="7718" alignment="justified" li="216" spaceBefore="173" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="6221" r="5794" b="6389" baseLine="6355" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6221" r="1824" b="6365">Alan</wd>

<space/>

<wd l="1910" t="6221" r="2395" b="6389">Ritter,</wd>

<space/>

<wd l="2496" t="6221" r="2851" b="6365">Sam</wd>

<space/>

<wd l="2933" t="6221" r="3413" b="6389">Clark,</wd>

<space/>

<wd l="3509" t="6226" r="4238" b="6389">Mausam,</wd>

<space/>

<wd l="4339" t="6221" r="4622" b="6365">and</wd>

<space/>

<wd l="4704" t="6221" r="5102" b="6365">Oren</wd>

<space/>

<wd l="5179" t="6221" r="5794" b="6365">Etzioni.</wd>

<space/>

</ln>

<ln l="1661" t="6437" r="5798" b="6624" baseLine="6576" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="6437" r="2093" b="6581">2011.</wd>

<space/>

<wd l="2232" t="6437" r="2808" b="6581">Named</wd>

<space/>

<wd l="2875" t="6437" r="3322" b="6624">entity</wd>

<space/>

<wd l="3394" t="6437" r="4301" b="6624">recognition</wd>

<space/>

<wd l="4363" t="6437" r="4522" b="6576">in</wd>

<space/>

<wd l="4584" t="6456" r="5131" b="6581">tweets:</wd>

<space/>

<wd l="5246" t="6442" r="5491" b="6576">An</wd>

<space/>

<wd l="5558" t="6480" r="5798" b="6581">ex-</wd>

</ln>

<ln l="1656" t="6658" r="5803" b="6845" baseLine="6792">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="6658" r="2506" b="6840">perimental</wd>

<space/>

<wd l="2573" t="6658" r="3024" b="6845">study.</wd>

<space/>

<wd l="3125" t="6662" r="3288" b="6797">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3346" t="6658" r="4330" b="6840">Proceedings</wd>

<space/>

<wd l="4392" t="6658" r="4570" b="6840">of</wd>

<space/>

<wd l="4598" t="6658" r="4838" b="6802">the</wd>

<space/>

<wd l="4906" t="6658" r="5803" b="6840">Conference</wd>

<space/>

</run>

</ln>

<ln l="1661" t="6874" r="5798" b="7056" baseLine="7013" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="6922" r="1853" b="7018">on</wd>

<space/>

<wd l="1944" t="6874" r="2746" b="7056">Empirical</wd>

<space/>

<wd l="2832" t="6874" r="3523" b="7018">Methods</wd>

<space/>

<wd l="3624" t="6878" r="3763" b="7018">in</wd>

<space/>

<wd l="3854" t="6874" r="4478" b="7018">Natural</wd>

<space/>

<wd l="4560" t="6878" r="5357" b="7056">Language</wd>

<space/>

<wd l="5448" t="6878" r="5798" b="7018">Pro-</wd>

</ln>

<ln l="1661" t="7094" r="5798" b="7282" baseLine="7234">

<wd l="1661" t="7099" r="2290" b="7277"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">cessing</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2386" t="7099" r="3062" b="7238">EMNLP</wd>

<space/>

<wd l="3158" t="7094" r="3456" b="7262">’11,</wd>

<space/>

<wd l="3552" t="7138" r="4003" b="7282">pages</wd>

<space/>

<wd l="4109" t="7094" r="5030" b="7262">1524–1534,</wd>

<space/>

<wd l="5136" t="7094" r="5798" b="7238">Strouds-</wd>

</run>

</ln>

<ln l="1656" t="7315" r="5798" b="7502" baseLine="7450" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="7315" r="2059" b="7502">burg,</wd>

<space/>

<wd l="2117" t="7320" r="2395" b="7483">PA,</wd>

<space/>

<wd l="2453" t="7315" r="2890" b="7459">USA.</wd>

<space/>

<wd l="2952" t="7315" r="3893" b="7459">Association</wd>

<space/>

<wd l="3946" t="7315" r="4176" b="7459">for</wd>

<space/>

<wd l="4234" t="7315" r="5410" b="7498">Computational</wd>

<space/>

<wd l="5462" t="7315" r="5798" b="7454">Lin-</wd>

</ln>

<ln l="1661" t="7531" r="2304" b="7718" baseLine="7670" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="7531" r="2304" b="7718">guistics.</wd>

</ln>

</para>

<para l="1440" t="7930" r="5808" b="8554" alignment="justified" li="216" spaceBefore="176" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="7930" r="5808" b="8117" baseLine="8069" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="7934" r="1843" b="8074">Rosa</wd>

<space/>

<wd l="1920" t="7930" r="2338" b="8074">Stern</wd>

<space/>

<wd l="2424" t="7930" r="2707" b="8074">and</wd>

<space/>

<wd l="2784" t="7934" r="3317" b="8074">Benoit</wd>

<space/>

<wd l="3398" t="7930" r="3888" b="8117">Sagot.</wd>

<space/>

<wd l="4066" t="7930" r="4498" b="8074">2010.</wd>

<space/>

<wd l="4675" t="7934" r="5486" b="8074">Resources</wd>

<space/>

<wd l="5573" t="7930" r="5808" b="8074">for</wd>

<space/>

</ln>

<ln l="1656" t="8150" r="5798" b="8338" baseLine="8290" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="8150" r="2189" b="8294">named</wd>

<space/>

<wd l="2294" t="8150" r="2741" b="8338">entity</wd>

<space/>

<wd l="2846" t="8150" r="3754" b="8338">recognition</wd>

<space/>

<wd l="3859" t="8150" r="4147" b="8294">and</wd>

<space/>

<wd l="4243" t="8150" r="5045" b="8294">resolution</wd>

<space/>

<wd l="5146" t="8150" r="5299" b="8290">in</wd>

<space/>

<wd l="5400" t="8194" r="5798" b="8294">news</wd>

<space/>

</ln>

<ln l="1656" t="8371" r="5419" b="8554" baseLine="8506">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="8371" r="2126" b="8515">wires.</wd>

<space/>

<wd l="2213" t="8376" r="2381" b="8510">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2424" t="8376" r="2899" b="8554">Entity</wd>

<space/>

<wd l="2952" t="8371" r="3350" b="8515">2010</wd>

<space/>

<wd l="3413" t="8371" r="4186" b="8554">Workshop</wd>

<space/>

<wd l="4238" t="8400" r="4402" b="8515">at</wd>

<space/>

<wd l="4440" t="8376" r="4939" b="8515">LREC</wd>

<space/>

</run>

<wd l="4982" t="8371" r="5419" b="8515"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2010</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="8770" r="5808" b="9350" alignment="justified" li="216" spaceBefore="180" spaceAfter="6572" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="8770" r="5808" b="8952" baseLine="8904" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="8774" r="1718" b="8914">Jun</wd>

<space/>

<wd l="1762" t="8770" r="2309" b="8914">Suzuki</wd>

<space/>

<wd l="2352" t="8770" r="2635" b="8914">and</wd>

<space/>

<wd l="2674" t="8770" r="3216" b="8914">Hideki</wd>

<space/>

<wd l="3254" t="8770" r="3869" b="8914">Isozaki.</wd>

<space/>

<wd l="3960" t="8770" r="4392" b="8914">2008.</wd>

<space/>

<wd l="4483" t="8770" r="5808" b="8952">Semi-supervised</wd>

<space/>

</ln>

<ln l="1666" t="8990" r="5798" b="9178" baseLine="9125" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1666" t="8990" r="2462" b="9173">sequential</wd>

<space/>

<wd l="2568" t="8990" r="3206" b="9178">labeling</wd>

<space/>

<wd l="3317" t="8990" r="3600" b="9134">and</wd>

<space/>

<wd l="3710" t="8990" r="4762" b="9178">segmentation</wd>

<space/>

<wd l="4862" t="8990" r="5290" b="9178">using</wd>

<space/>

<wd l="5400" t="8990" r="5798" b="9178">giga-</wd>

</ln>

<ln l="1656" t="9206" r="4670" b="9350" baseLine="9346">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="9206" r="2069" b="9350">word</wd>

<space/>

<wd l="2126" t="9206" r="2510" b="9350">scale</wd>

<space/>

<wd l="2563" t="9206" r="3341" b="9350">unlabeled</wd>

<space/>

<wd l="3394" t="9206" r="3758" b="9350">data.</wd>

<space/>

<wd l="3840" t="9211" r="4008" b="9346">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4051" t="9211" r="4219" b="9350">In</wd>

<space/>

</run>

<wd l="4258" t="9211" r="4670" b="9350"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ACL</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<dd l="5820" t="15746" r="6161" b="15980">

<para l="5820" t="15787" r="6128" b="15946" alignment="left" lsp="exactly" lspExact="223" language="en">

<ln l="5866" t="15787" r="6062" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="7">

<wd l="5866" t="15792" r="6062" b="15946">71</wd>

</ln>

</para>

</dd>

</body>

</page>

</document>

