<?xml version="1.0" encoding="UTF-16"?>

<!--XML document generated using OCR technology from Nuance Communications, Inc.-->

<document xmlns="http://www.scansoft.com/omnipage/xml/ssdoc-schema3.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4320.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1437" marginTop="1340" marginRight="1378" marginBottom="358" offsetX="-26" offsetY="12" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="2194" t="1340" r="10474" b="4092">

<column l="2194" t="1340" r="10474" b="4092">

<para l="2400" t="1406" r="9547" b="1992" alignment="left" li="2448" ri="936" spaceBefore="27" fli="-2232" lsp="exactly" lspExact="317" language="en">

<ln l="2400" t="1406" r="9547" b="1670" baseLine="1608" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2400" t="1406" r="3720" b="1670">Enhancing</wd>

<space/>

<wd l="3797" t="1411" r="4666" b="1618">Named</wd>

<space/>

<wd l="4742" t="1406" r="5506" b="1670">Entity</wd>

<space/>

<wd l="5587" t="1406" r="7046" b="1670">Recognition</wd>

<space/>

<wd l="7118" t="1406" r="7358" b="1608">in</wd>

<space/>

<wd l="7435" t="1406" r="8328" b="1613">Twitter</wd>

<space/>

<wd l="8405" t="1411" r="9547" b="1670">Messages</wd>

<space/>

</ln>

<ln l="4685" t="1728" r="7262" b="1992" baseLine="1925" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4685" t="1728" r="5381" b="1992">Using</wd>

<space/>

<wd l="5458" t="1728" r="6216" b="1992">Entity</wd>

<space/>

<wd l="6298" t="1728" r="7262" b="1992">Linking</wd>

</ln>

</para>

<para l="2194" t="2270" r="9912" b="2525" alignment="left" spaceBefore="247" lsp="exactly" lspExact="292" language="en">

<tabs position="2194"/>

<tabs alignment="left" position="2525" leaderChar=" "/>

<ln l="2194" t="2270" r="9912" b="2525" baseLine="2451">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="2194" t="2309" r="2789" b="2525">Ikuya</wd>

<space/>

</run>

<wd l="2846" t="2275" r="3763" b="2477"><run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="-1">Yamada</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-1">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-1"><space/>

<wd l="3811" t="2275" r="3883" b="2386">2</wd>

<space/>

<wd l="3922" t="2275" r="3998" b="2390">3</wd>

<tab position="3998"/>

</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="5155" t="2304" r="5957" b="2477">Hideaki</wd>

<space/>

</run>

<wd l="6024" t="2275" r="6845" b="2477"><run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="-1">Takeda</run>

<run underlined="none" subsuperscript="superscript" fontSize="1200" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-1">2</run>

</wd>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="-1"><tab position="6845"/>

<wd l="7896" t="2304" r="8914" b="2525">Yoshiyasu</wd>

<space/>

</run>

<wd l="8981" t="2275" r="9912" b="2525"><run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Arial" fontFamily="roman" fontPitch="variable" spacing="-1">Takefuji</run>

<run underlined="none" subsuperscript="superscript" fontSize="1200" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-1">3</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-1"><nl orig="true"/>

</run>

</ln>

</para>

<para l="2203" t="2616" r="10402" b="3086" alignment="left" li="1008" ri="72" fli="-1008" lsp="exactly" lspExact="274" language="en">

<tabs position="2203"/>

<ln l="2203" t="2616" r="10402" b="2798" baseLine="2750" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0" forcedEOF="true">

<wd l="2203" t="2616" r="4008" b="2798">ikuya@ousia.jp</wd>

<tab position="4008"/>

<wd l="4963" t="2616" r="7042" b="2798">takeda@nii.ac.jp</wd>

<space/>

<wd l="7406" t="2616" r="10402" b="2798">takefuji@sfc.keio.ac.jp
</wd>

</ln>

<ln l="3187" t="2846" r="8774" b="3086" baseLine="3032" forcedEOF="true">

<wd l="3187" t="2846" r="3830" b="3043"><run underlined="none" subsuperscript="superscript" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Studio</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3893" t="2885" r="4440" b="3072">Ousia,</wd>

<space/>

<wd l="4507" t="2885" r="5722" b="3043">4489-105-221</wd>

<space/>

<wd l="5798" t="2885" r="6302" b="3072">Endo,</wd>

<space/>

<wd l="6370" t="2885" r="7195" b="3086">Fujisawa,</wd>

<space/>

<wd l="7262" t="2890" r="8218" b="3086">Kanagawa,</wd>

<space/>

<wd l="8285" t="2890" r="8774" b="3086">Japan</wd>

</run>

</ln>

</para>

<para l="2597" t="3125" r="9355" b="3365" alignment="left" li="360" spaceBefore="7" lsp="exactly" lspExact="271" language="en">

<ln l="2597" t="3125" r="9355" b="3365" baseLine="3311">

<wd l="2597" t="3125" r="3437" b="3322"><run underlined="none" subsuperscript="superscript" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">2</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">National</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="3494" t="3163" r="4210" b="3322">Institute</wd>

<space/>

<wd l="4267" t="3163" r="4459" b="3322">of</wd>

<space/>

<wd l="4502" t="3163" r="5549" b="3350">Informatics,</wd>

<space/>

<wd l="5621" t="3168" r="6086" b="3317">2-1-2</wd>

<space/>

<wd l="6144" t="3163" r="7286" b="3350">Hitotsubashi,</wd>

<space/>

<wd l="7358" t="3163" r="8136" b="3365">Chiyoda,</wd>

<space/>

<wd l="8203" t="3163" r="8794" b="3365">Tokyo,</wd>

<space/>

<wd l="8861" t="3168" r="9355" b="3365">Japan</wd>

</run>

</ln>

</para>

<para l="3456" t="3403" r="8496" b="3643" alignment="left" li="1224" spaceBefore="7" spaceAfter="444" lsp="exactly" lspExact="271" language="en">

<ln l="3456" t="3403" r="8496" b="3643" baseLine="3588">

<wd l="3456" t="3403" r="3960" b="3600"><run underlined="none" subsuperscript="superscript" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">3</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">Keio</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="4018" t="3442" r="4963" b="3643">University,</wd>

<space/>

<wd l="5030" t="3442" r="5458" b="3600">5322</wd>

<space/>

<wd l="5520" t="3442" r="6024" b="3629">Endo,</wd>

<space/>

<wd l="6086" t="3442" r="6912" b="3643">Fujisawa,</wd>

<space/>

<wd l="6984" t="3446" r="7934" b="3643">Kanagawa,</wd>

<space/>

<wd l="8002" t="3446" r="8496" b="3643">Japan</wd>

</run>

</ln>

</para>

</column>

</section>

<section l="1437" t="4092" r="10531" b="15336">

<column l="1437" t="4092" r="5824" b="15336">

<para l="3178" t="4142" r="4070" b="4315" alignment="centered" spaceBefore="3" lsp="exactly" lspExact="273" language="en">

<ln l="3178" t="4142" r="4070" b="4315" baseLine="4306" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3178" t="4142" r="4070" b="4315">Abstract</wd>

</ln>

</para>

<para l="1781" t="4622" r="5467" b="10243" alignment="justified" li="216" ri="360" spaceBefore="188" lsp="exactly" lspExact="271" language="en">

<ln l="1781" t="4622" r="5467" b="4824" baseLine="4771" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="4627" r="1963" b="4776">In</wd>

<space/>

<wd l="2059" t="4622" r="2366" b="4781">this</wd>

<space/>

<wd l="2467" t="4675" r="2990" b="4824">paper,</wd>

<space/>

<wd l="3106" t="4675" r="3360" b="4781">we</wd>

<space/>

<wd l="3461" t="4622" r="4181" b="4781">describe</wd>

<space/>

<wd l="4282" t="4675" r="4574" b="4781">our</wd>

<space/>

<wd l="4670" t="4622" r="5467" b="4824">approach</wd>

<space/>

</ln>

<ln l="1781" t="4891" r="5453" b="5093" baseLine="5045">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1781" t="4891" r="2040" b="5050">for</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2112" t="4891" r="2741" b="5050">Named</wd>

<space/>

<wd l="2808" t="4901" r="3331" b="5093">Entity</wd>

<space/>

<wd l="3408" t="4901" r="4464" b="5093">Recognition</wd>

<space/>

<wd l="4555" t="4901" r="4714" b="5050">in</wd>

<space/>

</run>

<wd l="4805" t="4901" r="5453" b="5078"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Twitter</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="1786" t="5165" r="5462" b="5366" baseLine="5314" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="5218" r="1882" b="5323">a</wd>

<space/>

<wd l="1997" t="5165" r="2558" b="5323">shared</wd>

<space/>

<wd l="2664" t="5165" r="3019" b="5323">task</wd>

<space/>

<wd l="3125" t="5165" r="3384" b="5323">for</wd>

<space/>

<wd l="3490" t="5170" r="3922" b="5323">ACL</wd>

<space/>

<wd l="4032" t="5165" r="4450" b="5323">2015</wd>

<space/>

<wd l="4574" t="5165" r="5462" b="5366">Workshop</wd>

<space/>

</ln>

<ln l="1786" t="5434" r="5467" b="5635" baseLine="5587" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="5486" r="2002" b="5592">on</wd>

<space/>

<wd l="2050" t="5434" r="2568" b="5635">Noisy</wd>

<space/>

<wd l="2626" t="5434" r="3955" b="5635">User-generated</wd>

<space/>

<wd l="4008" t="5438" r="4392" b="5592">Text</wd>

<space/>

<wd l="4454" t="5434" r="5256" b="5630">(Baldwin</wd>

<space/>

<wd l="5314" t="5458" r="5467" b="5592">et</wd>

<space/>

</ln>

<ln l="1786" t="5707" r="5453" b="5909" baseLine="5856" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="5707" r="2035" b="5894">al.,</wd>

<space/>

<wd l="2155" t="5707" r="2702" b="5904">2015).</wd>

<space/>

<wd l="2899" t="5712" r="3624" b="5866">Because</wd>

<space/>

<wd l="3725" t="5707" r="3917" b="5866">of</wd>

<space/>

<wd l="3998" t="5707" r="4262" b="5866">the</wd>

<space/>

<wd l="4358" t="5707" r="4858" b="5909">noisy,</wd>

<space/>

<wd l="4982" t="5707" r="5453" b="5894">short,</wd>

<space/>

</ln>

<ln l="1786" t="5976" r="5453" b="6178" baseLine="6125" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="5976" r="2098" b="6134">and</wd>

<space/>

<wd l="2179" t="5976" r="3043" b="6178">colloquial</wd>

<space/>

<wd l="3130" t="6000" r="3672" b="6134">nature</wd>

<space/>

<wd l="3758" t="5976" r="3950" b="6134">of</wd>

<space/>

<wd l="4013" t="5976" r="4675" b="6163">Twitter,</wd>

<space/>

<wd l="4771" t="5976" r="5035" b="6134">the</wd>

<space/>

<wd l="5117" t="6029" r="5453" b="6178">per-</wd>

</ln>

<ln l="1781" t="6245" r="5467" b="6446" baseLine="6398" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="6245" r="2602" b="6403">formance</wd>

<space/>

<wd l="2722" t="6245" r="2914" b="6403">of</wd>

<space/>

<wd l="3010" t="6245" r="3643" b="6403">Named</wd>

<space/>

<wd l="3754" t="6245" r="4282" b="6446">Entity</wd>

<space/>

<wd l="4397" t="6245" r="5467" b="6446">Recognition</wd>

<space/>

</ln>

<ln l="1790" t="6518" r="5458" b="6720" baseLine="6667" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1790" t="6523" r="2352" b="6715">(NER)</wd>

<space/>

<wd l="2438" t="6518" r="3197" b="6720">degrades</wd>

<space/>

<wd l="3288" t="6518" r="4387" b="6720">significantly.</wd>

<space/>

<wd l="4517" t="6523" r="4738" b="6677">To</wd>

<space/>

<wd l="4814" t="6518" r="5458" b="6677">address</wd>

<space/>

</ln>

<ln l="1781" t="6787" r="5467" b="6989" baseLine="6941" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="6787" r="2088" b="6946">this</wd>

<space/>

<wd l="2165" t="6787" r="2933" b="6989">problem,</wd>

<space/>

<wd l="3019" t="6840" r="3269" b="6946">we</wd>

<space/>

<wd l="3341" t="6840" r="4032" b="6989">propose</wd>

<space/>

<wd l="4104" t="6840" r="4200" b="6946">a</wd>

<space/>

<wd l="4262" t="6787" r="4738" b="6946">novel</wd>

<space/>

<wd l="4810" t="6787" r="5467" b="6946">method</wd>

<space/>

</ln>

<ln l="1781" t="7061" r="5467" b="7262" baseLine="7210" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="7085" r="1949" b="7219">to</wd>

<space/>

<wd l="2016" t="7061" r="2722" b="7219">enhance</wd>

<space/>

<wd l="2784" t="7061" r="3048" b="7219">the</wd>

<space/>

<wd l="3110" t="7061" r="4214" b="7262">performance</wd>

<space/>

<wd l="4277" t="7061" r="4469" b="7219">of</wd>

<space/>

<wd l="4512" t="7061" r="4781" b="7219">the</wd>

<space/>

<wd l="4838" t="7061" r="5467" b="7219">Twitter</wd>

<space/>

</ln>

<ln l="1781" t="7330" r="5467" b="7531" baseLine="7483">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1781" t="7334" r="2213" b="7488">NER</wd>

<space/>

<wd l="2299" t="7330" r="2650" b="7488">task</wd>

<space/>

<wd l="2731" t="7330" r="2942" b="7531">by</wd>

<space/>

<wd l="3029" t="7330" r="3499" b="7531">using</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3576" t="7339" r="4104" b="7531">Entity</wd>

<space/>

<wd l="4181" t="7330" r="4848" b="7531">Linking</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4930" t="7330" r="5467" b="7488">which</wd>

<space/>

</run>

</ln>

<ln l="1781" t="7603" r="5458" b="7805" baseLine="7752" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="7603" r="1920" b="7762">is</wd>

<space/>

<wd l="2002" t="7656" r="2098" b="7762">a</wd>

<space/>

<wd l="2170" t="7603" r="2822" b="7762">method</wd>

<space/>

<wd l="2894" t="7603" r="3154" b="7762">for</wd>

<space/>

<wd l="3226" t="7603" r="4018" b="7805">detecting</wd>

<space/>

<wd l="4099" t="7603" r="4589" b="7805">entity</wd>

<space/>

<wd l="4666" t="7603" r="5458" b="7762">mentions</wd>

<space/>

</ln>

<ln l="1781" t="7872" r="5453" b="8074" baseLine="8026" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="7872" r="1954" b="8026">in</wd>

<space/>

<wd l="2021" t="7896" r="2347" b="8030">text</wd>

<space/>

<wd l="2419" t="7872" r="2731" b="8030">and</wd>

<space/>

<wd l="2798" t="7872" r="3605" b="8074">resolving</wd>

<space/>

<wd l="3677" t="7872" r="4118" b="8030">them</wd>

<space/>

<wd l="4186" t="7896" r="4349" b="8030">to</wd>

<space/>

<wd l="4430" t="7872" r="5453" b="8074">correspond-</wd>

</ln>

<ln l="1781" t="8146" r="5458" b="8347" baseLine="8294" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="8146" r="2054" b="8347">ing</wd>

<space/>

<wd l="2170" t="8146" r="2741" b="8304">entries</wd>

<space/>

<wd l="2856" t="8146" r="3029" b="8299">in</wd>

<space/>

<wd l="3134" t="8146" r="4085" b="8347">knowledge</wd>

<space/>

<wd l="4195" t="8146" r="4661" b="8304">bases</wd>

<space/>

<wd l="4786" t="8146" r="5174" b="8304">such</wd>

<space/>

<wd l="5290" t="8198" r="5458" b="8304">as</wd>

<space/>

</ln>

<ln l="1781" t="8414" r="5453" b="8616" baseLine="8568" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="8414" r="2722" b="8616">Wikipedia.</wd>

<space/>

<wd l="2808" t="8419" r="3144" b="8573">Our</wd>

<space/>

<wd l="3197" t="8414" r="3850" b="8573">method</wd>

<space/>

<wd l="3902" t="8414" r="4042" b="8573">is</wd>

<space/>

<wd l="4104" t="8414" r="4598" b="8573">based</wd>

<space/>

<wd l="4656" t="8467" r="4872" b="8573">on</wd>

<space/>

<wd l="4934" t="8467" r="5453" b="8616">super-</wd>

</ln>

<ln l="1781" t="8688" r="5453" b="8890" baseLine="8837" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="8688" r="2242" b="8846">vised</wd>

<space/>

<wd l="2294" t="8688" r="3821" b="8890">machine-learning</wd>

<space/>

<wd l="3883" t="8688" r="4195" b="8846">and</wd>

<space/>

<wd l="4253" t="8741" r="4618" b="8846">uses</wd>

<space/>

<wd l="4680" t="8688" r="4949" b="8846">the</wd>

<space/>

<wd l="5006" t="8688" r="5453" b="8890">high-</wd>

</ln>

<ln l="1786" t="8957" r="5462" b="9158" baseLine="9106" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="8957" r="2381" b="9158">quality</wd>

<space/>

<wd l="2472" t="8957" r="3422" b="9158">knowledge</wd>

<space/>

<wd l="3514" t="8957" r="4262" b="9115">obtained</wd>

<space/>

<wd l="4349" t="8957" r="4776" b="9115">from</wd>

<space/>

<wd l="4867" t="8957" r="5462" b="9115">several</wd>

<space/>

</ln>

<ln l="1786" t="9230" r="5467" b="9432" baseLine="9379" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="9283" r="2208" b="9432">open</wd>

<space/>

<wd l="2318" t="9230" r="3269" b="9432">knowledge</wd>

<space/>

<wd l="3384" t="9230" r="3898" b="9389">bases.</wd>

<space/>

<wd l="4152" t="9235" r="4334" b="9384">In</wd>

<space/>

<wd l="4454" t="9230" r="5467" b="9432">comparison</wd>

<space/>

</ln>

<ln l="1781" t="9499" r="5458" b="9701" baseLine="9648" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="9499" r="2170" b="9658">with</wd>

<space/>

<wd l="2256" t="9499" r="2520" b="9658">the</wd>

<space/>

<wd l="2611" t="9499" r="3062" b="9658">other</wd>

<space/>

<wd l="3154" t="9523" r="3826" b="9701">systems</wd>

<space/>

<wd l="3922" t="9499" r="4723" b="9701">proposed</wd>

<space/>

<wd l="4810" t="9499" r="5069" b="9658">for</wd>

<space/>

<wd l="5150" t="9499" r="5458" b="9658">this</wd>

<space/>

</ln>

<ln l="1790" t="9768" r="5467" b="9955" baseLine="9922" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1790" t="9768" r="2352" b="9926">shared</wd>

<space/>

<wd l="2414" t="9768" r="2808" b="9955">task,</wd>

<space/>

<wd l="2890" t="9821" r="3178" b="9926">our</wd>

<space/>

<wd l="3235" t="9768" r="3893" b="9926">method</wd>

<space/>

<wd l="3960" t="9768" r="4723" b="9926">achieved</wd>

<space/>

<wd l="4786" t="9768" r="5050" b="9926">the</wd>

<space/>

<wd l="5112" t="9768" r="5467" b="9926">best</wd>

<space/>

</ln>

<ln l="1781" t="10042" r="2928" b="10243" baseLine="10190" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="10042" r="2928" b="10243">performance.</wd>

</ln>

</para>

<para l="1454" t="10498" r="3091" b="10670" alignment="left" spaceBefore="208" lsp="exactly" lspExact="273" language="en">

<ln l="1454" t="10498" r="3091" b="10670" baseLine="10666" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="1454" t="10498" r="1550" b="10666">1</wd>

<space/>

<wd l="1805" t="10498" r="3091" b="10670">Introduction</wd>

</ln>

</para>

<para l="1440" t="10930" r="5818" b="13800" alignment="justified" spaceBefore="133" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="10930" r="5803" b="11131" baseLine="11083" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10930" r="2074" b="11088">Named</wd>

<space/>

<wd l="2174" t="10930" r="2702" b="11131">Entity</wd>

<space/>

<wd l="2813" t="10930" r="3878" b="11131">Recognition</wd>

<space/>

<wd l="3989" t="10934" r="4550" b="11126">(NER)</wd>

<space/>

<wd l="4666" t="10930" r="5155" b="11088">refers</wd>

<space/>

<wd l="5266" t="10954" r="5434" b="11088">to</wd>

<space/>

<wd l="5539" t="10930" r="5803" b="11088">the</wd>

<space/>

</ln>

<ln l="1440" t="11203" r="5794" b="11405" baseLine="11352" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11203" r="1795" b="11362">task</wd>

<space/>

<wd l="1862" t="11203" r="2054" b="11362">of</wd>

<space/>

<wd l="2107" t="11203" r="3062" b="11405">identifying</wd>

<space/>

<wd l="3134" t="11203" r="3926" b="11362">mentions</wd>

<space/>

<wd l="4003" t="11203" r="4195" b="11362">of</wd>

<space/>

<wd l="4253" t="11203" r="4872" b="11362">entities</wd>

<space/>

<wd l="4954" t="11208" r="5376" b="11405">(e.g.,</wd>

<space/>

<wd l="5458" t="11256" r="5794" b="11405">per-</wd>

</ln>

<ln l="1450" t="11472" r="5794" b="11674" baseLine="11621" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1450" t="11525" r="1872" b="11659">sons,</wd>

<space/>

<wd l="1987" t="11472" r="2818" b="11659">locations,</wd>

<space/>

<wd l="2938" t="11472" r="4166" b="11674">organizations)</wd>

<space/>

<wd l="4272" t="11472" r="4829" b="11630">within</wd>

<space/>

<wd l="4925" t="11496" r="5290" b="11630">text.</wd>

<space/>

<wd l="5491" t="11477" r="5794" b="11630">Be-</wd>

</ln>

<ln l="1445" t="11746" r="5818" b="11947" baseLine="11894" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="11798" r="1925" b="11904">cause</wd>

<space/>

<wd l="1992" t="11746" r="2184" b="11904">of</wd>

<space/>

<wd l="2232" t="11746" r="2501" b="11904">the</wd>

<space/>

<wd l="2563" t="11746" r="3067" b="11947">noisy,</wd>

<space/>

<wd l="3154" t="11746" r="3624" b="11933">short,</wd>

<space/>

<wd l="3706" t="11746" r="4018" b="11904">and</wd>

<space/>

<wd l="4085" t="11746" r="4949" b="11947">colloquial</wd>

<space/>

<wd l="5016" t="11770" r="5558" b="11904">nature</wd>

<space/>

<wd l="5630" t="11746" r="5818" b="11904">of</wd>

<space/>

</ln>

<ln l="1440" t="12014" r="5818" b="12216" baseLine="12163">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1440" t="12014" r="2069" b="12173">Twitter</wd>

<space/>

<wd l="2136" t="12067" r="2952" b="12216">messages</wd>

<space/>

<wd l="3043" t="12019" r="3293" b="12211">(or</wd>

<space/>

</run>

<wd l="3365" t="12019" r="4022" b="12211"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">tweets</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">),</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="4109" t="12014" r="4378" b="12173">the</wd>

<space/>

<wd l="4450" t="12014" r="5549" b="12216">performance</wd>

<space/>

<wd l="5630" t="12014" r="5818" b="12173">of</wd>

<space/>

</run>

</ln>

<ln l="1450" t="12283" r="5808" b="12485" baseLine="12437" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1450" t="12283" r="2179" b="12442">standard</wd>

<space/>

<wd l="2251" t="12288" r="2688" b="12442">NER</wd>

<space/>

<wd l="2774" t="12283" r="3509" b="12442">software</wd>

<space/>

<wd l="3595" t="12283" r="4661" b="12485">significantly</wd>

<space/>

<wd l="4747" t="12283" r="5371" b="12442">suffers.</wd>

<space/>

<wd l="5506" t="12288" r="5808" b="12442">For</wd>

<space/>

</ln>

<ln l="1445" t="12557" r="5794" b="12758" baseLine="12706" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12557" r="2218" b="12758">example,</wd>

<space/>

<wd l="2342" t="12557" r="3331" b="12758">Derczynski</wd>

<space/>

<wd l="3442" t="12581" r="3595" b="12715">et</wd>

<space/>

<wd l="3701" t="12557" r="3898" b="12715">al.</wd>

<space/>

<wd l="4123" t="12557" r="5179" b="12758">(Derczynski</wd>

<space/>

<wd l="5285" t="12581" r="5438" b="12715">et</wd>

<space/>

<wd l="5544" t="12557" r="5794" b="12744">al.,</wd>

<space/>

</ln>

<ln l="1445" t="12826" r="5803" b="13027" baseLine="12979" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12826" r="1939" b="13022">2015)</wd>

<space/>

<wd l="2006" t="12826" r="2702" b="13027">recently</wd>

<space/>

<wd l="2770" t="12826" r="3941" b="12984">demonstrated</wd>

<space/>

<wd l="3998" t="12826" r="4325" b="12984">that</wd>

<space/>

<wd l="4382" t="12826" r="4646" b="12984">the</wd>

<space/>

<wd l="4704" t="12826" r="5803" b="13027">performance</wd>

<space/>

</ln>

<ln l="1445" t="13099" r="5794" b="13301" baseLine="13248" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="13099" r="1637" b="13258">of</wd>

<space/>

<wd l="1747" t="13099" r="2376" b="13258">various</wd>

<space/>

<wd l="2515" t="13099" r="3806" b="13258">state-of-the-art</wd>

<space/>

<wd l="3931" t="13104" r="4363" b="13258">NER</wd>

<space/>

<wd l="4498" t="13099" r="5237" b="13258">software</wd>

<space/>

<wd l="5371" t="13104" r="5794" b="13301">(e.g.,</wd>

<space/>

</ln>

<ln l="1445" t="13368" r="5803" b="13570" baseLine="13522" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="13368" r="2194" b="13526">Stanford</wd>

<space/>

<wd l="2242" t="13373" r="2674" b="13526">NER</wd>

<space/>

<wd l="2726" t="13368" r="3038" b="13526">and</wd>

<space/>

<wd l="3086" t="13373" r="3826" b="13565">ANNIE)</wd>

<space/>

<wd l="3888" t="13368" r="4022" b="13526">is</wd>

<space/>

<wd l="4080" t="13368" r="4838" b="13570">typically</wd>

<space/>

<wd l="4891" t="13368" r="5386" b="13526">lower</wd>

<space/>

<wd l="5429" t="13368" r="5803" b="13526">than</wd>

<space/>

</ln>

<ln l="1445" t="13603" r="3178" b="13800" baseLine="13782">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="13642" r="1829" b="13800">50%</wd>

<space/>

</run>

<wd l="1896" t="13603" r="2194" b="13795"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">F1</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="2270" t="13642" r="2530" b="13800">for</wd>

<space/>

<wd l="2578" t="13666" r="3178" b="13800">tweets.</wd>

</run>

</ln>

</para>

<para l="1440" t="13910" r="5808" b="14928" alignment="justified" spaceBefore="6" spaceAfter="101" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="13910" r="5794" b="14112" baseLine="14064" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="13910" r="2189" b="14112">Entity</wd>

<space/>

<wd l="2290" t="13910" r="2976" b="14112">Linking</wd>

<space/>

<wd l="3082" t="13915" r="3475" b="14107">(EL)</wd>

<space/>

<wd l="3581" t="13910" r="4070" b="14069">refers</wd>

<space/>

<wd l="4176" t="13934" r="4339" b="14069">to</wd>

<space/>

<wd l="4440" t="13910" r="4704" b="14069">the</wd>

<space/>

<wd l="4800" t="13910" r="5155" b="14069">task</wd>

<space/>

<wd l="5256" t="13910" r="5443" b="14069">of</wd>

<space/>

<wd l="5530" t="13910" r="5794" b="14069">de-</wd>

</ln>

<ln l="1440" t="14184" r="5808" b="14386" baseLine="14333" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14184" r="2030" b="14386">tecting</wd>

<space/>

<wd l="2122" t="14184" r="2707" b="14342">textual</wd>

<space/>

<wd l="2798" t="14184" r="3288" b="14386">entity</wd>

<space/>

<wd l="3379" t="14184" r="4171" b="14342">mentions</wd>

<space/>

<wd l="4267" t="14184" r="4579" b="14342">and</wd>

<space/>

<wd l="4666" t="14184" r="5280" b="14386">linking</wd>

<space/>

<wd l="5371" t="14184" r="5808" b="14342">them</wd>

<space/>

</ln>

<ln l="1440" t="14453" r="5798" b="14654" baseLine="14602" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14477" r="1608" b="14611">to</wd>

<space/>

<wd l="1690" t="14453" r="2933" b="14654">corresponding</wd>

<space/>

<wd l="3014" t="14453" r="3586" b="14611">entries</wd>

<space/>

<wd l="3672" t="14453" r="4229" b="14611">within</wd>

<space/>

<wd l="4306" t="14453" r="5256" b="14654">knowledge</wd>

<space/>

<wd l="5333" t="14453" r="5798" b="14611">bases</wd>

<space/>

</ln>

<ln l="1450" t="14726" r="5794" b="14928" baseLine="14875" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="14731" r="1872" b="14928">(e.g.,</wd>

<space/>

<wd l="2006" t="14726" r="2947" b="14928">Wikipedia,</wd>

<space/>

<wd l="3082" t="14726" r="3864" b="14928">DBpedia</wd>

<space/>

<wd l="3979" t="14731" r="4478" b="14923">(Auer</wd>

<space/>

<wd l="4589" t="14750" r="4747" b="14885">et</wd>

<space/>

<wd l="4858" t="14726" r="5107" b="14914">al.,</wd>

<space/>

<wd l="5246" t="14731" r="5794" b="14923">2007),</wd>

</ln>

</para>

<rulerline l="1437" t="15048" r="2640" b="15048" type="single" width="10" color="000000"/>

<para l="1704" t="15101" r="4872" b="15302" alignment="left" li="216" spaceBefore="58" spaceAfter="32" lsp="exactly" lspExact="204" language="en">

<ln l="1704" t="15101" r="4872" b="15302" baseLine="15257">

<wd l="1704" t="15101" r="2040" b="15264"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">The</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2088" t="15134" r="2760" b="15264">harmonic</wd>

<space/>

<wd l="2808" t="15173" r="3192" b="15264">mean</wd>

<space/>

<wd l="3245" t="15134" r="3403" b="15264">of</wd>

<space/>

<wd l="3437" t="15134" r="4094" b="15302">precision</wd>

<space/>

<wd l="4142" t="15134" r="4397" b="15264">and</wd>

<space/>

<wd l="4440" t="15134" r="4872" b="15264">recall.</wd>

</run>

</ln>

</para>

</column>

<column l="6144" t="4092" r="10531" b="15336">

<para l="6144" t="4157" r="10526" b="8650" alignment="justified" spaceBefore="3" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="4157" r="10526" b="4354" baseLine="4306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4157" r="6922" b="4315">Freebase</wd>

<space/>

<wd l="7027" t="4157" r="7944" b="4354">(Bollacker</wd>

<space/>

<wd l="8040" t="4181" r="8194" b="4315">et</wd>

<space/>

<wd l="8299" t="4157" r="8549" b="4344">al.,</wd>

<space/>

<wd l="8674" t="4162" r="9293" b="4354">2008)).</wd>

<space/>

<wd l="9504" t="4162" r="10229" b="4315">Because</wd>

<space/>

<wd l="10334" t="4157" r="10526" b="4315">of</wd>

<space/>

</ln>

<ln l="6144" t="4426" r="10512" b="4627" baseLine="4579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4426" r="6413" b="4584">the</wd>

<space/>

<wd l="6499" t="4450" r="7032" b="4584">recent</wd>

<space/>

<wd l="7123" t="4478" r="8054" b="4627">emergence</wd>

<space/>

<wd l="8146" t="4426" r="8338" b="4584">of</wd>

<space/>

<wd l="8410" t="4426" r="8842" b="4627">large</wd>

<space/>

<wd l="8933" t="4426" r="9470" b="4584">online</wd>

<space/>

<wd l="9557" t="4426" r="10512" b="4627">knowledge</wd>

<space/>

</ln>

<ln l="6144" t="4699" r="10502" b="4901" baseLine="4848" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4699" r="6610" b="4858">bases</wd>

<space/>

<wd l="6686" t="4704" r="7166" b="4896">(KB),</wd>

<space/>

<wd l="7238" t="4704" r="7507" b="4853">EL</wd>

<space/>

<wd l="7565" t="4699" r="7848" b="4858">has</wd>

<space/>

<wd l="7910" t="4699" r="8611" b="4901">recently</wd>

<space/>

<wd l="8678" t="4699" r="9254" b="4901">gained</wd>

<space/>

<wd l="9322" t="4699" r="10224" b="4901">significant</wd>

<space/>

<wd l="10286" t="4723" r="10502" b="4858">at-</wd>

</ln>

<ln l="6144" t="4968" r="10512" b="5170" baseLine="5122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4968" r="6797" b="5126">tention.</wd>

<space/>

<wd l="6931" t="4973" r="7066" b="5126">It</wd>

<space/>

<wd l="7138" t="4968" r="7277" b="5126">is</wd>

<space/>

<wd l="7363" t="4968" r="7997" b="5126">evident</wd>

<space/>

<wd l="8069" t="4968" r="8400" b="5126">that</wd>

<space/>

<wd l="8472" t="4968" r="8736" b="5126">the</wd>

<space/>

<wd l="8813" t="4968" r="9912" b="5170">performance</wd>

<space/>

<wd l="9994" t="4968" r="10186" b="5126">of</wd>

<space/>

<wd l="10243" t="4973" r="10512" b="5122">EL</wd>

<space/>

</ln>

<ln l="6149" t="5242" r="10507" b="5443" baseLine="5390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="5242" r="6494" b="5400">also</wd>

<space/>

<wd l="6562" t="5242" r="7320" b="5443">degrades</wd>

<space/>

<wd l="7387" t="5242" r="7862" b="5400">when</wd>

<space/>

<wd l="7925" t="5242" r="8765" b="5443">analyzing</wd>

<space/>

<wd l="8827" t="5266" r="9379" b="5400">tweets</wd>

<space/>

<wd l="9456" t="5242" r="10507" b="5443">(Derczynski</wd>

<space/>

</ln>

<ln l="6149" t="5510" r="10507" b="5712" baseLine="5664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="5534" r="6307" b="5669">et</wd>

<space/>

<wd l="6398" t="5510" r="6648" b="5698">al.,</wd>

<space/>

<wd l="6763" t="5510" r="7243" b="5698">2015;</wd>

<space/>

<wd l="7358" t="5510" r="7757" b="5712">Meij</wd>

<space/>

<wd l="7867" t="5534" r="8021" b="5669">et</wd>

<space/>

<wd l="8112" t="5510" r="8362" b="5698">al.,</wd>

<space/>

<wd l="8477" t="5515" r="9024" b="5707">2012).</wd>

<space/>

<wd l="9206" t="5515" r="10027" b="5698">However,</wd>

<space/>

<wd l="10142" t="5515" r="10507" b="5669">Guo</wd>

<space/>

</ln>

<ln l="6149" t="5784" r="10512" b="5986" baseLine="5933" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="5808" r="6307" b="5942">et</wd>

<space/>

<wd l="6403" t="5784" r="6600" b="5942">al.</wd>

<space/>

<wd l="6806" t="5789" r="7238" b="5981">(Guo</wd>

<space/>

<wd l="7344" t="5808" r="7498" b="5942">et</wd>

<space/>

<wd l="7594" t="5784" r="7843" b="5971">al.,</wd>

<space/>

<wd l="7963" t="5789" r="8458" b="5981">2013)</wd>

<space/>

<wd l="8563" t="5784" r="9264" b="5986">recently</wd>

<space/>

<wd l="9360" t="5784" r="10090" b="5942">revealed</wd>

<space/>

<wd l="10186" t="5784" r="10512" b="5942">that</wd>

<space/>

</ln>

<ln l="6144" t="6053" r="10512" b="6211" baseLine="6206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6053" r="6413" b="6211">the</wd>

<space/>

<wd l="6485" t="6053" r="6922" b="6211">main</wd>

<space/>

<wd l="6998" t="6053" r="7642" b="6211">failures</wd>

<space/>

<wd l="7728" t="6053" r="7920" b="6211">of</wd>

<space/>

<wd l="7978" t="6053" r="8606" b="6211">Twitter</wd>

<space/>

<wd l="8678" t="6058" r="8947" b="6206">EL</wd>

<space/>

<wd l="9024" t="6106" r="9283" b="6211">are</wd>

<space/>

<wd l="9365" t="6053" r="9955" b="6211">caused</wd>

<space/>

<wd l="10027" t="6053" r="10512" b="6211">while</wd>

<space/>

</ln>

<ln l="6149" t="6326" r="10502" b="6528" baseLine="6475" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="6326" r="6941" b="6528">detecting</wd>

<space/>

<wd l="7032" t="6326" r="7522" b="6528">entity</wd>

<space/>

<wd l="7608" t="6326" r="8400" b="6485">mentions</wd>

<space/>

<wd l="8491" t="6326" r="8918" b="6485">from</wd>

<space/>

<wd l="8995" t="6350" r="9365" b="6514">text,</wd>

<space/>

<wd l="9461" t="6326" r="10152" b="6485">because</wd>

<space/>

<wd l="10238" t="6379" r="10502" b="6485">ex-</wd>

</ln>

<ln l="6144" t="6595" r="10512" b="6797" baseLine="6749" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="6595" r="6629" b="6797">isting</wd>

<space/>

<wd l="6730" t="6600" r="6998" b="6749">EL</wd>

<space/>

<wd l="7099" t="6595" r="7829" b="6754">methods</wd>

<space/>

<wd l="7939" t="6595" r="8568" b="6797">usually</wd>

<space/>

<wd l="8678" t="6595" r="9317" b="6754">address</wd>

<space/>

<wd l="9427" t="6595" r="9696" b="6754">the</wd>

<space/>

<wd l="9797" t="6595" r="10512" b="6754">mention</wd>

<space/>

</ln>

<ln l="6149" t="6869" r="10512" b="7070" baseLine="7018" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="6869" r="6946" b="7027">detection</wd>

<space/>

<wd l="7051" t="6869" r="7406" b="7027">task</wd>

<space/>

<wd l="7512" t="6869" r="7723" b="7070">by</wd>

<space/>

<wd l="7834" t="6869" r="8304" b="7070">using</wd>

<space/>

<wd l="8419" t="6869" r="9110" b="7027">external</wd>

<space/>

<wd l="9221" t="6874" r="9653" b="7027">NER</wd>

<space/>

<wd l="9773" t="6869" r="10512" b="7027">software</wd>

<space/>

</ln>

<ln l="6144" t="7138" r="10507" b="7339" baseLine="7286" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7138" r="6701" b="7296">whose</wd>

<space/>

<wd l="6758" t="7138" r="7862" b="7339">performance</wd>

<space/>

<wd l="7920" t="7138" r="8054" b="7296">is</wd>

<space/>

<wd l="8122" t="7138" r="8990" b="7296">unreliable</wd>

<space/>

<wd l="9048" t="7138" r="9523" b="7296">when</wd>

<space/>

<wd l="9576" t="7138" r="10507" b="7339">processing</wd>

<space/>

</ln>

<ln l="6144" t="7406" r="10512" b="7608" baseLine="7560" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7430" r="6744" b="7565">tweets.</wd>

<space/>

<wd l="6845" t="7406" r="8069" b="7608">Consequently,</wd>

<space/>

<wd l="8146" t="7406" r="8746" b="7565">several</wd>

<space/>

<wd l="8813" t="7406" r="9778" b="7608">approaches</wd>

<space/>

<wd l="9854" t="7411" r="10291" b="7603">(Guo</wd>

<space/>

<wd l="10358" t="7430" r="10512" b="7565">et</wd>

<space/>

</ln>

<ln l="6149" t="7680" r="10512" b="7882" baseLine="7829" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="7680" r="6403" b="7867">al.,</wd>

<space/>

<wd l="6461" t="7685" r="6941" b="7867">2013;</wd>

<space/>

<wd l="7003" t="7680" r="7709" b="7838">Yamada</wd>

<space/>

<wd l="7752" t="7704" r="7906" b="7838">et</wd>

<space/>

<wd l="7954" t="7680" r="8203" b="7867">al.,</wd>

<space/>

<wd l="8266" t="7680" r="8760" b="7877">2015)</wd>

<space/>

<wd l="8808" t="7680" r="9216" b="7838">have</wd>

<space/>

<wd l="9259" t="7680" r="9672" b="7838">been</wd>

<space/>

<wd l="9710" t="7680" r="10512" b="7882">proposed</wd>

<space/>

</ln>

<ln l="6144" t="7949" r="10507" b="8107" baseLine="8102" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7949" r="6533" b="8107">with</wd>

<space/>

<wd l="6600" t="7949" r="7421" b="8107">enhanced</wd>

<space/>

<wd l="7483" t="7949" r="8160" b="8107">abilities</wd>

<space/>

<wd l="8232" t="7949" r="8558" b="8107">that</wd>

<space/>

<wd l="8626" t="7949" r="9264" b="8107">address</wd>

<space/>

<wd l="9336" t="7949" r="9600" b="8107">the</wd>

<space/>

<wd l="9662" t="7949" r="10013" b="8107">task</wd>

<space/>

<wd l="10075" t="7949" r="10243" b="8102">in</wd>

<space/>

<wd l="10310" t="8002" r="10507" b="8107">an</wd>

<space/>

</ln>

<ln l="6149" t="8222" r="10507" b="8424" baseLine="8371">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="8222" r="7099" b="8381">end-to-end</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7152" t="8275" r="7810" b="8381">manner</wd>

<space/>

<wd l="7858" t="8222" r="8525" b="8381">without</wd>

<space/>

<wd l="8582" t="8222" r="9547" b="8424">completely</wd>

<space/>

<wd l="9605" t="8222" r="10507" b="8424">depending</wd>

<space/>

</run>

</ln>

<ln l="6149" t="8491" r="7699" b="8650" baseLine="8645" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="8544" r="6365" b="8650">on</wd>

<space/>

<wd l="6418" t="8496" r="6854" b="8650">NER</wd>

<space/>

<wd l="6917" t="8491" r="7699" b="8650">software.</wd>

</ln>

</para>

<para l="6144" t="8818" r="10526" b="12274" alignment="justified" spaceBefore="53" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="8818" r="10512" b="9019" baseLine="8971" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6365" t="8818" r="6701" b="8976">The</wd>

<space/>

<wd l="6749" t="8818" r="7186" b="8976">main</wd>

<space/>

<wd l="7234" t="8818" r="8021" b="9019">objective</wd>

<space/>

<wd l="8074" t="8818" r="8261" b="8976">of</wd>

<space/>

<wd l="8294" t="8818" r="8602" b="8976">this</wd>

<space/>

<wd l="8664" t="8818" r="9125" b="9019">study</wd>

<space/>

<wd l="9173" t="8818" r="9312" b="8976">is</wd>

<space/>

<wd l="9365" t="8842" r="9528" b="8976">to</wd>

<space/>

<wd l="9581" t="8818" r="10512" b="9019">investigate</wd>

<space/>

</ln>

<ln l="6144" t="9091" r="10526" b="9293" baseLine="9240" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="9091" r="6413" b="9250">the</wd>

<space/>

<wd l="6504" t="9091" r="7411" b="9293">possibility</wd>

<space/>

<wd l="7512" t="9091" r="7704" b="9250">of</wd>

<space/>

<wd l="7790" t="9091" r="8678" b="9293">enhancing</wd>

<space/>

<wd l="8774" t="9091" r="9038" b="9250">the</wd>

<space/>

<wd l="9134" t="9091" r="10234" b="9293">performance</wd>

<space/>

<wd l="10334" t="9091" r="10526" b="9250">of</wd>

<space/>

</ln>

<ln l="6144" t="9360" r="10512" b="9562" baseLine="9514" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="9360" r="6773" b="9518">Twitter</wd>

<space/>

<wd l="6816" t="9365" r="7253" b="9518">NER</wd>

<space/>

<wd l="7296" t="9360" r="7512" b="9562">by</wd>

<space/>

<wd l="7560" t="9360" r="8030" b="9562">using</wd>

<space/>

<wd l="8083" t="9413" r="8280" b="9518">an</wd>

<space/>

<wd l="8333" t="9360" r="9278" b="9518">end-to-end</wd>

<space/>

<wd l="9322" t="9365" r="9629" b="9518">EL.</wd>

<space/>

<wd l="9686" t="9360" r="10512" b="9562">Although</wd>

<space/>

</ln>

<ln l="6144" t="9634" r="10526" b="9835" baseLine="9782">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6144" t="9638" r="6413" b="9787">EL</wd>

<space/>

<wd l="6494" t="9634" r="6629" b="9792">is</wd>

<space/>

<wd l="6720" t="9634" r="7478" b="9835">typically</wd>

<space/>

<wd l="7565" t="9634" r="8477" b="9835">performed</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="8554" t="9638" r="8976" b="9835">after</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="9053" t="9638" r="9490" b="9792">NER</wd>

<space/>

<wd l="9571" t="9634" r="9744" b="9787">in</wd>

<space/>

<wd l="9826" t="9658" r="10248" b="9792">most</wd>

<space/>

<wd l="10334" t="9634" r="10526" b="9792">of</wd>

<space/>

</run>

</ln>

<ln l="6144" t="9902" r="10512" b="10104" baseLine="10051" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="9902" r="6413" b="10061">the</wd>

<space/>

<wd l="6494" t="9902" r="7176" b="10104">existing</wd>

<space/>

<wd l="7258" t="9902" r="8040" b="10090">methods,</wd>

<space/>

<wd l="8136" t="9955" r="8429" b="10061">our</wd>

<space/>

<wd l="8506" t="9902" r="9302" b="10104">approach</wd>

<space/>

<wd l="9379" t="9902" r="10157" b="10104">performs</wd>

<space/>

<wd l="10243" t="9907" r="10512" b="10056">EL</wd>

<space/>

</ln>

<ln l="6149" t="10176" r="10512" b="10378" baseLine="10325">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6149" t="10176" r="6691" b="10378">before</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6744" t="10181" r="7176" b="10334">NER</wd>

<space/>

<wd l="7234" t="10176" r="7546" b="10334">and</wd>

<space/>

<wd l="7594" t="10229" r="7958" b="10334">uses</wd>

<space/>

<wd l="8016" t="10176" r="8280" b="10334">the</wd>

<space/>

<wd l="8328" t="10181" r="8597" b="10330">EL</wd>

<space/>

<wd l="8645" t="10176" r="9206" b="10334">results</wd>

<space/>

<wd l="9264" t="10200" r="9427" b="10334">to</wd>

<space/>

<wd l="9485" t="10176" r="10195" b="10334">enhance</wd>

<space/>

<wd l="10243" t="10176" r="10512" b="10334">the</wd>

<space/>

</run>

</ln>

<ln l="6144" t="10445" r="10502" b="10646" baseLine="10594" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="10450" r="6581" b="10603">NER</wd>

<space/>

<wd l="6643" t="10445" r="7786" b="10646">performance.</wd>

<space/>

<wd l="7882" t="10445" r="8765" b="10646">Resolving</wd>

<space/>

<wd l="8827" t="10445" r="9091" b="10603">the</wd>

<space/>

<wd l="9158" t="10445" r="9648" b="10646">entity</wd>

<space/>

<wd l="9710" t="10445" r="10502" b="10603">mentions</wd>

<space/>

</ln>

<ln l="6144" t="10714" r="10507" b="10915" baseLine="10867" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="10738" r="6312" b="10872">to</wd>

<space/>

<wd l="6360" t="10714" r="6624" b="10872">the</wd>

<space/>

<wd l="6677" t="10718" r="6965" b="10867">KB</wd>

<space/>

<wd l="7022" t="10714" r="7594" b="10872">entries</wd>

<space/>

<wd l="7651" t="10714" r="8290" b="10872">enables</wd>

<space/>

<wd l="8342" t="10766" r="8530" b="10872">us</wd>

<space/>

<wd l="8582" t="10738" r="8750" b="10872">to</wd>

<space/>

<wd l="8798" t="10766" r="9086" b="10872">use</wd>

<space/>

<wd l="9134" t="10714" r="9398" b="10872">the</wd>

<space/>

<wd l="9446" t="10714" r="10507" b="10915">high-quality</wd>

<space/>

</ln>

<ln l="6144" t="10987" r="10502" b="11189" baseLine="11136" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="10987" r="7094" b="11189">knowledge</wd>

<space/>

<wd l="7166" t="10987" r="7339" b="11141">in</wd>

<space/>

<wd l="7411" t="10992" r="7699" b="11141">KB</wd>

<space/>

<wd l="7776" t="10987" r="8035" b="11146">for</wd>

<space/>

<wd l="8107" t="10987" r="8995" b="11189">enhancing</wd>

<space/>

<wd l="9067" t="10987" r="9336" b="11146">the</wd>

<space/>

<wd l="9403" t="10992" r="9840" b="11146">NER</wd>

<space/>

<wd l="9912" t="10987" r="10502" b="11189">perfor-</wd>

</ln>

<ln l="6144" t="11256" r="10502" b="11458" baseLine="11410" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="11309" r="6758" b="11414">mance.</wd>

<space/>

<wd l="6922" t="11256" r="7301" b="11414">This</wd>

<space/>

<wd l="7387" t="11256" r="8342" b="11458">knowledge</wd>

<space/>

<wd l="8424" t="11256" r="9144" b="11414">includes</wd>

<space/>

<wd l="9230" t="11256" r="9758" b="11458">things</wd>

<space/>

<wd l="9859" t="11256" r="10248" b="11414">such</wd>

<space/>

<wd l="10334" t="11309" r="10502" b="11414">as</wd>

<space/>

</ln>

<ln l="6144" t="11530" r="10502" b="11731" baseLine="11678" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="11530" r="6413" b="11688">the</wd>

<space/>

<wd l="6480" t="11530" r="7373" b="11731">popularity</wd>

<space/>

<wd l="7450" t="11530" r="7642" b="11688">of</wd>

<space/>

<wd l="7694" t="11530" r="7963" b="11688">the</wd>

<space/>

<wd l="8035" t="11530" r="8558" b="11731">entity,</wd>

<space/>

<wd l="8640" t="11530" r="8904" b="11688">the</wd>

<space/>

<wd l="8981" t="11530" r="9571" b="11688">classes</wd>

<space/>

<wd l="9653" t="11530" r="9845" b="11688">of</wd>

<space/>

<wd l="9898" t="11530" r="10162" b="11688">the</wd>

<space/>

<wd l="10238" t="11582" r="10502" b="11688">en-</wd>

</ln>

<ln l="6144" t="11798" r="10512" b="12000" baseLine="11952" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="11798" r="6466" b="12000">tity,</wd>

<space/>

<wd l="6566" t="11798" r="6878" b="11957">and</wd>

<space/>

<wd l="6955" t="11798" r="7224" b="11957">the</wd>

<space/>

<wd l="7306" t="11798" r="8189" b="11957">likelihood</wd>

<space/>

<wd l="8266" t="11798" r="8597" b="11957">that</wd>

<space/>

<wd l="8674" t="11798" r="8938" b="11957">the</wd>

<space/>

<wd l="9024" t="11798" r="9514" b="12000">entity</wd>

<space/>

<wd l="9600" t="11851" r="10253" b="12000">appears</wd>

<space/>

<wd l="10339" t="11798" r="10512" b="11952">in</wd>

<space/>

</ln>

<ln l="6144" t="12072" r="7680" b="12274" baseLine="12221" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="12072" r="6413" b="12230">the</wd>

<space/>

<wd l="6470" t="12072" r="6946" b="12274">given</wd>

<space/>

<wd l="7003" t="12096" r="7680" b="12230">context.</wd>

</ln>

</para>

<para l="6144" t="12398" r="10517" b="15307" alignment="justified" spaceBefore="57" spaceAfter="20" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="12398" r="10512" b="12600" baseLine="12547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6365" t="12403" r="6648" b="12557">We</wd>

<space/>

<wd l="6706" t="12398" r="7190" b="12600">begin</wd>

<space/>

<wd l="7248" t="12398" r="7464" b="12600">by</wd>

<space/>

<wd l="7526" t="12398" r="8088" b="12600">briefly</wd>

<space/>

<wd l="8150" t="12398" r="9154" b="12600">introducing</wd>

<space/>

<wd l="9221" t="12451" r="9514" b="12557">our</wd>

<space/>

<wd l="9571" t="12398" r="10512" b="12557">end-to-end</wd>

<space/>

</ln>

<ln l="6144" t="12667" r="10498" b="12869" baseLine="12816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="12672" r="6413" b="12821">EL</wd>

<space/>

<wd l="6518" t="12667" r="7176" b="12826">method</wd>

<space/>

<wd l="7282" t="12667" r="7608" b="12826">that</wd>

<space/>

<wd l="7723" t="12667" r="8702" b="12869">specifically</wd>

<space/>

<wd l="8813" t="12667" r="9461" b="12826">focuses</wd>

<space/>

<wd l="9581" t="12720" r="9792" b="12826">on</wd>

<space/>

<wd l="9898" t="12691" r="10498" b="12826">tweets.</wd>

<space/>

</ln>

<ln l="6149" t="12941" r="10502" b="13142" baseLine="13090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="12946" r="6490" b="13099">Our</wd>

<space/>

<wd l="6557" t="12946" r="6826" b="13094">EL</wd>

<space/>

<wd l="6893" t="12941" r="7550" b="13099">method</wd>

<space/>

<wd l="7622" t="12941" r="7757" b="13099">is</wd>

<space/>

<wd l="7838" t="12941" r="8333" b="13099">based</wd>

<space/>

<wd l="8410" t="12994" r="8626" b="13099">on</wd>

<space/>

<wd l="8702" t="12941" r="9629" b="13142">supervised</wd>

<space/>

<wd l="9701" t="12941" r="10502" b="13099">machine-</wd>

</ln>

<ln l="6144" t="13210" r="10512" b="13411" baseLine="13358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="13210" r="6859" b="13411">learning</wd>

<space/>

<wd l="6946" t="13210" r="7258" b="13368">and</wd>

<space/>

<wd l="7339" t="13210" r="8165" b="13368">addresses</wd>

<space/>

<wd l="8251" t="13210" r="8515" b="13368">the</wd>

<space/>

<wd l="8597" t="13210" r="8952" b="13368">task</wd>

<space/>

<wd l="9029" t="13210" r="9202" b="13363">in</wd>

<space/>

<wd l="9283" t="13262" r="9480" b="13368">an</wd>

<space/>

<wd l="9571" t="13210" r="10512" b="13368">end-to-end</wd>

<space/>

</ln>

<ln l="6144" t="13478" r="10517" b="13680" baseLine="13632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="13531" r="6830" b="13637">manner.</wd>

<space/>

<wd l="6984" t="13483" r="7118" b="13637">It</wd>

<space/>

<wd l="7200" t="13478" r="8011" b="13637">considers</wd>

<space/>

<wd l="8102" t="13531" r="8568" b="13680">every</wd>

<space/>

<wd l="8650" t="13478" r="9365" b="13680">possible</wd>

<space/>

<wd l="9446" t="13531" r="10080" b="13680">n-gram</wd>

<space/>

<wd l="10157" t="13531" r="10330" b="13637">as</wd>

<space/>

<wd l="10421" t="13531" r="10517" b="13637">a</wd>

<space/>

</ln>

<ln l="6149" t="13752" r="10512" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="13752" r="6979" b="13910">candidate</wd>

<space/>

<wd l="7056" t="13752" r="7546" b="13954">entity</wd>

<space/>

<wd l="7618" t="13752" r="8333" b="13910">mention</wd>

<space/>

<wd l="8405" t="13752" r="8717" b="13910">and</wd>

<space/>

<wd l="8789" t="13752" r="9384" b="13910">detects</wd>

<space/>

<wd l="9461" t="13752" r="9725" b="13910">the</wd>

<space/>

<wd l="9797" t="13752" r="10512" b="13910">mention</wd>

<space/>

</ln>

<ln l="6144" t="14021" r="10502" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="14021" r="6533" b="14179">with</wd>

<space/>

<wd l="6581" t="14074" r="6677" b="14179">a</wd>

<space/>

<wd l="6720" t="14021" r="7958" b="14222">corresponding</wd>

<space/>

<wd l="8006" t="14021" r="8347" b="14174">link</wd>

<space/>

<wd l="8390" t="14045" r="8554" b="14179">to</wd>

<space/>

<wd l="8606" t="14074" r="8702" b="14179">a</wd>

<space/>

<wd l="8746" t="14026" r="9034" b="14174">KB</wd>

<space/>

<wd l="9091" t="14045" r="9533" b="14222">entry</wd>

<space/>

<wd l="9576" t="14021" r="9725" b="14174">if</wd>

<space/>

<wd l="9754" t="14021" r="10018" b="14179">the</wd>

<space/>

<wd l="10061" t="14074" r="10502" b="14179">men-</wd>

</ln>

<ln l="6144" t="14294" r="10512" b="14482" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="14294" r="6485" b="14453">tion</wd>

<space/>

<wd l="6562" t="14294" r="7042" b="14453">exists</wd>

<space/>

<wd l="7123" t="14294" r="7296" b="14448">in</wd>

<space/>

<wd l="7368" t="14294" r="7632" b="14453">the</wd>

<space/>

<wd l="7714" t="14299" r="8054" b="14453">KB.</wd>

<space/>

<wd l="8136" t="14294" r="9269" b="14482">Furthermore,</wd>

<space/>

<wd l="9360" t="14294" r="9485" b="14453">it</wd>

<space/>

<wd l="9557" t="14347" r="9854" b="14453">can</wd>

<space/>

<wd l="9931" t="14294" r="10512" b="14453">handle</wd>

<space/>

</ln>

<ln l="6144" t="14563" r="10502" b="14765" baseLine="14717">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6144" t="14563" r="6936" b="14722">mentions</wd>

<space/>

<wd l="7003" t="14563" r="7330" b="14722">that</wd>

<space/>

<wd l="7392" t="14616" r="7973" b="14765">appear</wd>

<space/>

<wd l="8030" t="14616" r="8198" b="14722">as</wd>

<space/>

<wd l="8266" t="14563" r="9014" b="14765">irregular</wd>

<space/>

<wd l="9067" t="14563" r="9571" b="14722">forms</wd>

<space/>

<wd l="9643" t="14568" r="10066" b="14765">(e.g.,</wd>

<space/>

</run>

<wd l="10133" t="14573" r="10502" b="14722" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">mis-</wd>

</ln>

<ln l="6144" t="14837" r="10507" b="15038" baseLine="14986">

<wd l="6144" t="14837" r="6965" b="15038"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">spellings</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

</run>

<wd l="7051" t="14837" r="8285" b="15024"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">abbreviations</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="8371" t="14842" r="9278" b="15038">acronyms)</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="9355" t="14837" r="9826" b="15038">using</wd>

<space/>

<wd l="9912" t="14837" r="10507" b="14995">several</wd>

<space/>

</run>

</ln>

<ln l="6149" t="15106" r="9686" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="15106" r="7234" b="15307">approximate</wd>

<space/>

<wd l="7301" t="15106" r="7786" b="15307">string</wd>

<space/>

<wd l="7843" t="15106" r="8650" b="15307">matching</wd>

<space/>

<wd l="8712" t="15106" r="9686" b="15307">algorithms.</wd>

</ln>

</para>

</column>

</section>

<section l="1437" t="15336" r="10531" b="16480">

<column l="1437" t="15336" r="10531" b="16480">

<para l="5771" t="15787" r="6200" b="15946" alignment="centered" spaceBefore="386" lsp="exactly" lspExact="271" language="en">

<ln l="5837" t="15787" r="6134" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="24">

<wd l="5837" t="15787" r="6134" b="15946">136</wd>

</ln>

</para>

<para l="2827" t="16133" r="9072" b="16469" alignment="centered" spaceBefore="139" lsp="exactly" lspExact="170" language="en">

<ln l="2827" t="16133" r="9072" b="16301" baseLine="16253" forcedEOF="true">

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2827" t="16133" r="3710" b="16296">Proceedings</wd>

<space/>

<wd l="3763" t="16133" r="3926" b="16296">of</wd>

<space/>

<wd l="3950" t="16133" r="4162" b="16262">the</wd>

<space/>

<wd l="4200" t="16138" r="4531" b="16262">ACL</wd>

<space/>

<wd l="4574" t="16133" r="4934" b="16262">2015</wd>

<space/>

<wd l="4987" t="16133" r="5688" b="16296">Workshop</wd>

<space/>

<wd l="5741" t="16176" r="5914" b="16262">on</wd>

<space/>

<wd l="5957" t="16138" r="6365" b="16296">Noisy</wd>

<space/>

<wd l="6427" t="16133" r="7536" b="16296">User-generated</wd>

<space/>

</run>

<wd l="7584" t="16138" r="7901" b="16286"><run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Text</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7954" t="16171" r="8352" b="16301">pages</wd>

<space/>

<wd l="8424" t="16133" r="9072" b="16286">136–140,
</wd>

</run>

</ln>

<ln l="3029" t="16296" r="8870" b="16469" baseLine="16425" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3029" t="16301" r="3595" b="16469">Beijing,</wd>

<space/>

<wd l="3653" t="16301" r="4114" b="16454">China,</wd>

<space/>

<wd l="4166" t="16301" r="4459" b="16469">July</wd>

<space/>

<wd l="4512" t="16301" r="4723" b="16454">31,</wd>

<space/>

<wd l="4781" t="16301" r="5170" b="16430">2015.</wd>

<space/>

</run>

<wd l="5246" t="16296" r="5770" b="16469"><run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">c</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">�</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5822" t="16301" r="6672" b="16430">Association</wd>

<space/>

<wd l="6715" t="16301" r="6926" b="16430">for</wd>

<space/>

<wd l="6974" t="16301" r="8035" b="16469">Computational</wd>

<space/>

<wd l="8078" t="16301" r="8870" b="16469">Linguistics</wd>

</run>

</ln>

</para>

</column>

</section>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4320.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1437" marginTop="1260" marginRight="1378" marginBottom="1292" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1437" t="1260" r="10531" b="15359">

<column l="1437" t="1260" r="5824" b="15359">

<para l="1440" t="1320" r="5808" b="3106" alignment="justified" spaceBefore="1" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="1320" r="5794" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="1320" r="1997" b="1478">The</wd>

<space/>

<wd l="2093" t="1325" r="2525" b="1478">NER</wd>

<space/>

<wd l="2621" t="1320" r="2971" b="1478">task</wd>

<space/>

<wd l="3062" t="1320" r="3202" b="1478">is</wd>

<space/>

<wd l="3312" t="1320" r="3682" b="1522">split</wd>

<space/>

<wd l="3773" t="1320" r="4109" b="1478">into</wd>

<space/>

<wd l="4205" t="1344" r="4526" b="1478">two</wd>

<space/>

<wd l="4632" t="1344" r="5338" b="1522">separate</wd>

<space/>

<wd l="5438" t="1320" r="5794" b="1478">sub-</wd>

</ln>

<ln l="1440" t="1594" r="5803" b="1795" baseLine="1742">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="1594" r="1920" b="1752">tasks:</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2098" t="1603" r="3250" b="1795">segmentation</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3360" t="1594" r="3672" b="1752">and</wd>

<space/>

</run>

<wd l="3778" t="1594" r="4968" b="1795"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">classification</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5189" t="1594" r="5803" b="1795">During</wd>

<space/>

</run>

</ln>

<ln l="1450" t="1862" r="5808" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="1862" r="2645" b="2064">segmentation,</wd>

<space/>

<wd l="2784" t="1862" r="3053" b="2021">the</wd>

<space/>

<wd l="3173" t="1862" r="3662" b="2064">entity</wd>

<space/>

<wd l="3782" t="1862" r="4574" b="2021">mentions</wd>

<space/>

<wd l="4699" t="1915" r="4963" b="2021">are</wd>

<space/>

<wd l="5083" t="1862" r="5808" b="2021">detected</wd>

<space/>

</ln>

<ln l="1440" t="2136" r="5794" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2136" r="1867" b="2294">from</wd>

<space/>

<wd l="1939" t="2160" r="2539" b="2294">tweets.</wd>

<space/>

<wd l="2678" t="2136" r="3173" b="2323">Then,</wd>

<space/>

<wd l="3264" t="2136" r="3528" b="2294">the</wd>

<space/>

<wd l="3610" t="2136" r="4099" b="2338">entity</wd>

<space/>

<wd l="4176" t="2136" r="4968" b="2294">mentions</wd>

<space/>

<wd l="5059" t="2189" r="5318" b="2294">are</wd>

<space/>

<wd l="5400" t="2136" r="5794" b="2294">clas-</wd>

</ln>

<ln l="1450" t="2405" r="5798" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="2405" r="1915" b="2563">sified</wd>

<space/>

<wd l="1978" t="2405" r="2314" b="2563">into</wd>

<space/>

<wd l="2386" t="2405" r="2650" b="2563">the</wd>

<space/>

<wd l="2717" t="2405" r="3638" b="2606">predefined</wd>

<space/>

<wd l="3706" t="2405" r="4195" b="2606">entity</wd>

<space/>

<wd l="4262" t="2429" r="4766" b="2606">types.</wd>

<space/>

<wd l="4882" t="2405" r="5304" b="2563">Both</wd>

<space/>

<wd l="5371" t="2405" r="5798" b="2563">tasks</wd>

<space/>

</ln>

<ln l="1440" t="2678" r="5798" b="2880" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2678" r="2078" b="2837">involve</wd>

<space/>

<wd l="2150" t="2678" r="3072" b="2880">supervised</wd>

<space/>

<wd l="3134" t="2678" r="4656" b="2880">machine-learning</wd>

<space/>

<wd l="4718" t="2678" r="5107" b="2837">with</wd>

<space/>

<wd l="5170" t="2678" r="5798" b="2837">various</wd>

<space/>

</ln>

<ln l="1440" t="2947" r="2174" b="3106" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2947" r="2174" b="3106">features.</wd>

</ln>

</para>

<para l="1440" t="3240" r="5808" b="4752" alignment="justified" spaceBefore="20" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="3240" r="5808" b="3442" baseLine="3389" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="3245" r="1963" b="3398">For</wd>

<space/>

<wd l="2006" t="3240" r="2275" b="3398">the</wd>

<space/>

<wd l="2338" t="3240" r="3490" b="3442">segmentation</wd>

<space/>

<wd l="3538" t="3240" r="3931" b="3427">task,</wd>

<space/>

<wd l="3994" t="3293" r="4248" b="3398">we</wd>

<space/>

<wd l="4301" t="3293" r="4589" b="3398">use</wd>

<space/>

<wd l="4646" t="3240" r="5006" b="3398">data</wd>

<space/>

<wd l="5059" t="3240" r="5808" b="3398">obtained</wd>

<space/>

</ln>

<ln l="1440" t="3509" r="5794" b="3710" baseLine="3662" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="3509" r="1867" b="3667">from</wd>

<space/>

<wd l="1968" t="3509" r="2232" b="3667">the</wd>

<space/>

<wd l="2342" t="3514" r="2630" b="3662">KB</wd>

<space/>

<wd l="2750" t="3509" r="2942" b="3667">of</wd>

<space/>

<wd l="3034" t="3509" r="3298" b="3667">the</wd>

<space/>

<wd l="3408" t="3509" r="4646" b="3710">corresponding</wd>

<space/>

<wd l="4762" t="3509" r="5251" b="3710">entity</wd>

<space/>

<wd l="5357" t="3562" r="5794" b="3667">men-</wd>

</ln>

<ln l="1440" t="3782" r="5803" b="3984" baseLine="3931" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="3782" r="1781" b="3941">tion</wd>

<space/>

<wd l="1853" t="3782" r="2578" b="3941">detected</wd>

<space/>

<wd l="2645" t="3782" r="2861" b="3984">by</wd>

<space/>

<wd l="2933" t="3782" r="3197" b="3941">the</wd>

<space/>

<wd l="3269" t="3787" r="3538" b="3936">EL</wd>

<space/>

<wd l="3610" t="3782" r="3922" b="3941">and</wd>

<space/>

<wd l="3989" t="3782" r="4253" b="3941">the</wd>

<space/>

<wd l="4330" t="3806" r="4886" b="3984">output</wd>

<space/>

<wd l="4958" t="3782" r="5146" b="3941">of</wd>

<space/>

<wd l="5208" t="3835" r="5304" b="3941">a</wd>

<space/>

<wd l="5371" t="3787" r="5803" b="3941">NER</wd>

<space/>

</ln>

<ln l="1450" t="4051" r="5794" b="4253" baseLine="4205" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="4051" r="2189" b="4210">software</wd>

<space/>

<wd l="2285" t="4104" r="2453" b="4210">as</wd>

<space/>

<wd l="2554" t="4051" r="2822" b="4210">the</wd>

<space/>

<wd l="2914" t="4051" r="3350" b="4210">main</wd>

<space/>

<wd l="3442" t="4051" r="4963" b="4253">machine-learning</wd>

<space/>

<wd l="5059" t="4051" r="5794" b="4210">features.</wd>

<space/>

</ln>

<ln l="1440" t="4325" r="5798" b="4512" baseLine="4474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="4325" r="2573" b="4512">Furthermore,</wd>

<space/>

<wd l="2640" t="4378" r="2890" b="4483">we</wd>

<space/>

<wd l="2942" t="4325" r="3586" b="4483">include</wd>

<space/>

<wd l="3648" t="4325" r="4243" b="4483">several</wd>

<space/>

<wd l="4306" t="4378" r="5064" b="4483">common</wd>

<space/>

<wd l="5117" t="4325" r="5798" b="4483">features</wd>

<space/>

</ln>

<ln l="1440" t="4594" r="4344" b="4752" baseLine="4747" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="4594" r="1843" b="4752">used</wd>

<space/>

<wd l="1896" t="4594" r="2064" b="4747">in</wd>

<space/>

<wd l="2117" t="4594" r="3014" b="4752">traditional</wd>

<space/>

<wd l="3072" t="4598" r="3504" b="4752">NER</wd>

<space/>

<wd l="3562" t="4594" r="4344" b="4752">methods.</wd>

</ln>

</para>

<para l="1440" t="4886" r="5808" b="7795" alignment="justified" spaceBefore="19" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="4886" r="5803" b="5088" baseLine="5035" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="4891" r="1963" b="5045">For</wd>

<space/>

<wd l="2040" t="4886" r="2304" b="5045">the</wd>

<space/>

<wd l="2390" t="4886" r="3528" b="5045">classification</wd>

<space/>

<wd l="3605" t="4886" r="3998" b="5074">task,</wd>

<space/>

<wd l="4099" t="4886" r="4363" b="5045">the</wd>

<space/>

<wd l="4445" t="4886" r="5285" b="5088">following</wd>

<space/>

<wd l="5371" t="4886" r="5803" b="5045">three</wd>

<space/>

</ln>

<ln l="1440" t="5160" r="5794" b="5362" baseLine="5309" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="5184" r="1891" b="5362">types</wd>

<space/>

<wd l="1973" t="5160" r="2165" b="5318">of</wd>

<space/>

<wd l="2218" t="5160" r="2899" b="5318">features</wd>

<space/>

<wd l="2981" t="5213" r="3240" b="5318">are</wd>

<space/>

<wd l="3307" t="5160" r="3710" b="5318">used</wd>

<space/>

<wd l="3778" t="5213" r="3946" b="5318">as</wd>

<space/>

<wd l="4022" t="5160" r="4709" b="5362">primary</wd>

<space/>

<wd l="4781" t="5160" r="5515" b="5318">features:</wd>

<space/>

<wd l="5650" t="5165" r="5794" b="5357">1)</wd>

<space/>

</ln>

<ln l="1440" t="5429" r="5794" b="5630" baseLine="5578" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="5429" r="1704" b="5587">the</wd>

<space/>

<wd l="1781" t="5434" r="2064" b="5582">KB</wd>

<space/>

<wd l="2146" t="5453" r="2597" b="5630">types</wd>

<space/>

<wd l="2678" t="5429" r="2870" b="5587">of</wd>

<space/>

<wd l="2923" t="5429" r="3187" b="5587">the</wd>

<space/>

<wd l="3259" t="5429" r="3749" b="5630">entity</wd>

<space/>

<wd l="3826" t="5429" r="4550" b="5587">detected</wd>

<space/>

<wd l="4618" t="5429" r="4829" b="5630">by</wd>

<space/>

<wd l="4901" t="5429" r="5165" b="5587">the</wd>

<space/>

<wd l="5237" t="5434" r="5544" b="5616">EL,</wd>

<space/>

<wd l="5630" t="5434" r="5794" b="5626">2)</wd>

<space/>

</ln>

<ln l="1440" t="5698" r="5808" b="5899" baseLine="5851" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="5698" r="1704" b="5856">the</wd>

<space/>

<wd l="1757" t="5698" r="2246" b="5899">entity</wd>

<space/>

<wd l="2299" t="5722" r="2750" b="5899">types</wd>

<space/>

<wd l="2808" t="5698" r="3533" b="5856">detected</wd>

<space/>

<wd l="3576" t="5698" r="3792" b="5899">by</wd>

<space/>

<wd l="3845" t="5698" r="4109" b="5856">the</wd>

<space/>

<wd l="4157" t="5702" r="4589" b="5856">NER</wd>

<space/>

<wd l="4646" t="5698" r="5429" b="5885">software,</wd>

<space/>

<wd l="5496" t="5698" r="5808" b="5856">and</wd>

<space/>

</ln>

<ln l="1445" t="5971" r="5808" b="6173" baseLine="6120" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="5976" r="1613" b="6168">3)</wd>

<space/>

<wd l="1690" t="5971" r="1954" b="6130">the</wd>

<space/>

<wd l="2026" t="5995" r="2573" b="6130">vector</wd>

<space/>

<wd l="2635" t="5971" r="3874" b="6173">representation</wd>

<space/>

<wd l="3946" t="5971" r="4138" b="6130">of</wd>

<space/>

<wd l="4190" t="5971" r="4454" b="6130">the</wd>

<space/>

<wd l="4531" t="5971" r="5021" b="6173">entity</wd>

<space/>

<wd l="5088" t="5971" r="5808" b="6130">mention</wd>

<space/>

</ln>

<ln l="1445" t="6240" r="5794" b="6442" baseLine="6394" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="6240" r="2088" b="6398">derived</wd>

<space/>

<wd l="2155" t="6240" r="2582" b="6398">from</wd>

<space/>

<wd l="2650" t="6240" r="3096" b="6398">word</wd>

<space/>

<wd l="3168" t="6240" r="4262" b="6442">embeddings.</wd>

<space/>

<wd l="4382" t="6240" r="4723" b="6398">The</wd>

<space/>

<wd l="4795" t="6240" r="5424" b="6442">entity’s</wd>

<space/>

<wd l="5506" t="6245" r="5794" b="6394">KB</wd>

<space/>

</ln>

<ln l="1440" t="6514" r="5798" b="6715" baseLine="6662" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="6538" r="1891" b="6715">types</wd>

<space/>

<wd l="1958" t="6566" r="2218" b="6672">are</wd>

<space/>

<wd l="2280" t="6514" r="3072" b="6672">extracted</wd>

<space/>

<wd l="3125" t="6514" r="3552" b="6672">from</wd>

<space/>

<wd l="3600" t="6514" r="3869" b="6672">the</wd>

<space/>

<wd l="3926" t="6514" r="5165" b="6715">corresponding</wd>

<space/>

<wd l="5227" t="6514" r="5798" b="6672">entries</wd>

<space/>

</ln>

<ln l="1440" t="6782" r="5794" b="6984" baseLine="6936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="6782" r="1613" b="6936">in</wd>

<space/>

<wd l="1685" t="6782" r="2462" b="6984">DBpedia</wd>

<space/>

<wd l="2534" t="6782" r="2846" b="6941">and</wd>

<space/>

<wd l="2918" t="6782" r="3739" b="6941">Freebase.</wd>

<space/>

<wd l="3874" t="6782" r="5006" b="6970">Furthermore,</wd>

<space/>

<wd l="5093" t="6782" r="5362" b="6941">the</wd>

<space/>

<wd l="5434" t="6835" r="5794" b="6941">vec-</wd>

</ln>

<ln l="1440" t="7056" r="5808" b="7258" baseLine="7205" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="7080" r="1685" b="7214">tor</wd>

<space/>

<wd l="1742" t="7056" r="2981" b="7258">representation</wd>

<space/>

<wd l="3048" t="7056" r="3240" b="7214">of</wd>

<space/>

<wd l="3288" t="7056" r="3552" b="7214">the</wd>

<space/>

<wd l="3619" t="7056" r="4109" b="7258">entity</wd>

<space/>

<wd l="4176" t="7056" r="4891" b="7214">mention</wd>

<space/>

<wd l="4954" t="7056" r="5088" b="7214">is</wd>

<space/>

<wd l="5165" t="7056" r="5808" b="7214">derived</wd>

<space/>

</ln>

<ln l="1440" t="7325" r="5794" b="7526" baseLine="7478" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="7325" r="1910" b="7526">using</wd>

<space/>

<wd l="1973" t="7325" r="2525" b="7483">GloVe</wd>

<space/>

<wd l="2587" t="7325" r="3034" b="7483">word</wd>

<space/>

<wd l="3091" t="7325" r="4133" b="7526">embeddings</wd>

<space/>

<wd l="4210" t="7325" r="5270" b="7526">(Pennington</wd>

<space/>

<wd l="5328" t="7349" r="5482" b="7483">et</wd>

<space/>

<wd l="5544" t="7325" r="5794" b="7512">al.,</wd>

<space/>

</ln>

<ln l="1445" t="7603" r="1992" b="7795" baseLine="7747" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="7603" r="1992" b="7795">2014).</wd>

</ln>

</para>

<para l="1440" t="7886" r="5803" b="9710" alignment="justified" spaceBefore="16" fli="216" lsp="exactly" lspExact="272" language="en">

<ln l="1656" t="7886" r="5803" b="8088" baseLine="8040" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="7891" r="1882" b="8045">To</wd>

<space/>

<wd l="1958" t="7886" r="2362" b="8045">train</wd>

<space/>

<wd l="2443" t="7886" r="2755" b="8045">and</wd>

<space/>

<wd l="2832" t="7886" r="3542" b="8045">evaluate</wd>

<space/>

<wd l="3624" t="7939" r="3917" b="8045">our</wd>

<space/>

<wd l="3998" t="7910" r="4637" b="8088">system,</wd>

<space/>

<wd l="4733" t="7939" r="4982" b="8045">we</wd>

<space/>

<wd l="5064" t="7886" r="5462" b="8045">used</wd>

<space/>

<wd l="5539" t="7886" r="5803" b="8045">the</wd>

<space/>

</ln>

<ln l="1445" t="8160" r="5803" b="8362" baseLine="8309">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="8160" r="2050" b="8318">dataset</wd>

<space/>

<wd l="2112" t="8160" r="2587" b="8362">given</wd>

<space/>

<wd l="2645" t="8160" r="2861" b="8362">by</wd>

<space/>

<wd l="2928" t="8160" r="3192" b="8318">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="3250" t="8160" r="3883" b="8318">Named</wd>

<space/>

<wd l="3931" t="8170" r="4459" b="8362">Entity</wd>

<space/>

<wd l="4517" t="8170" r="5568" b="8362">Recognition</wd>

<space/>

<wd l="5645" t="8170" r="5803" b="8318">in</wd>

<space/>

</run>

</ln>

<ln l="1450" t="8429" r="5794" b="8630" baseLine="8582">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1450" t="8438" r="2059" b="8587">Twitter</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2126" t="8429" r="2688" b="8587">shared</wd>

<space/>

<wd l="2741" t="8429" r="3139" b="8587">task.</wd>

<space/>

<wd l="3226" t="8434" r="3566" b="8587">Our</wd>

<space/>

<wd l="3619" t="8429" r="4421" b="8630">proposed</wd>

<space/>

<wd l="4474" t="8429" r="5131" b="8587">method</wd>

<space/>

<wd l="5198" t="8429" r="5794" b="8630">signifi-</wd>

</run>

</ln>

<ln l="1445" t="8702" r="5803" b="8904" baseLine="8851" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="8702" r="1968" b="8904">cantly</wd>

<space/>

<wd l="2035" t="8702" r="3221" b="8904">outperformed</wd>

<space/>

<wd l="3278" t="8702" r="3547" b="8861">the</wd>

<space/>

<wd l="3614" t="8702" r="4214" b="8861">second</wd>

<space/>

<wd l="4272" t="8702" r="4862" b="8861">ranked</wd>

<space/>

<wd l="4930" t="8726" r="5530" b="8904">system</wd>

<space/>

<wd l="5587" t="8702" r="5803" b="8904">by</wd>

<space/>

</ln>

<ln l="1445" t="8971" r="5794" b="9173" baseLine="9125">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="9024" r="1541" b="9130">a</wd>

<space/>

<wd l="1584" t="8971" r="2006" b="9130">wide</wd>

<space/>

<wd l="2054" t="8971" r="2717" b="9173">margin;</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2789" t="8976" r="3331" b="9130">10.3%</wd>

<space/>

<wd l="3389" t="8976" r="3610" b="9125">F1</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="3682" t="8995" r="3835" b="9130">at</wd>

<space/>

<wd l="3878" t="8971" r="4147" b="9130">the</wd>

<space/>

<wd l="4200" t="8971" r="5352" b="9173">segmentation</wd>

<space/>

<wd l="5400" t="8971" r="5794" b="9158">task,</wd>

<space/>

</run>

</ln>

<ln l="1445" t="9245" r="5794" b="9446" baseLine="9394">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="9245" r="1757" b="9403">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1819" t="9250" r="2266" b="9403">5.0%</wd>

<space/>

<wd l="2338" t="9250" r="2563" b="9398">F1</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2654" t="9269" r="2808" b="9403">at</wd>

<space/>

<wd l="2870" t="9245" r="3134" b="9403">the</wd>

<space/>

<wd l="3206" t="9245" r="4147" b="9403">end-to-end</wd>

<space/>

<wd l="4219" t="9245" r="4675" b="9442">(both</wd>

<space/>

<wd l="4738" t="9245" r="5002" b="9403">the</wd>

<space/>

<wd l="5078" t="9298" r="5794" b="9446">segmen-</wd>

</run>

</ln>

<ln l="1440" t="9514" r="4344" b="9710" baseLine="9667" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="9514" r="1939" b="9672">tation</wd>

<space/>

<wd l="1997" t="9514" r="2309" b="9672">and</wd>

<space/>

<wd l="2362" t="9514" r="2626" b="9672">the</wd>

<space/>

<wd l="2688" t="9514" r="3883" b="9710">classification)</wd>

<space/>

<wd l="3950" t="9514" r="4344" b="9672">task.</wd>

</ln>

</para>

<para l="1440" t="10046" r="3998" b="10733" alignment="left" ri="1800" spaceBefore="78" lsp="exactly" lspExact="471" language="en">

<ln l="1440" t="10046" r="3998" b="10267" baseLine="10214" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="10046" r="1555" b="10214">2</wd>

<space/>

<wd l="1805" t="10051" r="2198" b="10219">The</wd>

<space/>

<wd l="2256" t="10051" r="3206" b="10267">Proposed</wd>

<space/>

<wd l="3274" t="10046" r="3998" b="10267">System</wd>

<space/>

</ln>

<ln l="1440" t="10531" r="3230" b="10733" baseLine="10685" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="10531" r="1704" b="10690">2.1</wd>

<space/>

<wd l="1930" t="10531" r="3230" b="10733">Preprocessing</wd>

</ln>

</para>

<para l="1440" t="10925" r="5803" b="12206" alignment="justified" spaceBefore="116" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="10925" r="5803" b="11126" baseLine="11074" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="10925" r="1781" b="11083">The</wd>

<space/>

<wd l="1901" t="10949" r="2501" b="11126">system</wd>

<space/>

<wd l="2611" t="10925" r="2952" b="11083">first</wd>

<space/>

<wd l="3062" t="10925" r="3682" b="11126">assigns</wd>

<space/>

<wd l="3802" t="10925" r="5064" b="11126">part-of-speech</wd>

<space/>

<wd l="5174" t="10949" r="5515" b="11126">tags</wd>

<space/>

<wd l="5635" t="10949" r="5803" b="11083">to</wd>

<space/>

</ln>

<ln l="1440" t="11194" r="5794" b="11395" baseLine="11342" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11194" r="1704" b="11352">the</wd>

<space/>

<wd l="1795" t="11194" r="2554" b="11395">resulting</wd>

<space/>

<wd l="2650" t="11194" r="3206" b="11352">tokens</wd>

<space/>

<wd l="3307" t="11194" r="3773" b="11395">using</wd>

<space/>

<wd l="3869" t="11198" r="4330" b="11347">ARK</wd>

<space/>

<wd l="4416" t="11194" r="5045" b="11352">Twitter</wd>

<space/>

<wd l="5131" t="11194" r="5794" b="11352">Part-of-</wd>

</ln>

<ln l="1445" t="11462" r="5794" b="11664" baseLine="11616" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="11462" r="2074" b="11664">Speech</wd>

<space/>

<wd l="2150" t="11467" r="2755" b="11664">Tagger</wd>

<space/>

<wd l="2837" t="11462" r="3552" b="11664">(Gimpel</wd>

<space/>

<wd l="3638" t="11486" r="3792" b="11621">et</wd>

<space/>

<wd l="3874" t="11462" r="4123" b="11650">al.,</wd>

<space/>

<wd l="4224" t="11467" r="4771" b="11659">2011).</wd>

<space/>

<wd l="4920" t="11467" r="5054" b="11621">It</wd>

<space/>

<wd l="5136" t="11462" r="5482" b="11621">also</wd>

<space/>

<wd l="5563" t="11486" r="5794" b="11621">to-</wd>

</ln>

<ln l="1440" t="11736" r="5794" b="11938" baseLine="11885" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11736" r="2083" b="11894">kenizes</wd>

<space/>

<wd l="2165" t="11736" r="2794" b="11894">Twitter</wd>

<space/>

<wd l="2866" t="11736" r="3610" b="11938">hashtags</wd>

<space/>

<wd l="3691" t="11736" r="4162" b="11938">using</wd>

<space/>

<wd l="4243" t="11789" r="4536" b="11894">our</wd>

<space/>

<wd l="4608" t="11736" r="5429" b="11894">enhanced</wd>

<space/>

<wd l="5501" t="11736" r="5794" b="11890">im-</wd>

</ln>

<ln l="1440" t="12005" r="5030" b="12206" baseLine="12158" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12005" r="2582" b="12206">plementation</wd>

<space/>

<wd l="2640" t="12005" r="2827" b="12163">of</wd>

<space/>

<wd l="2870" t="12005" r="3134" b="12163">the</wd>

<space/>

<wd l="3192" t="12005" r="3854" b="12206">hashtag</wd>

<space/>

<wd l="3912" t="12005" r="5030" b="12163">tokenization.</wd>

</ln>

</para>

<para l="1440" t="12528" r="3302" b="12730" alignment="left" spaceBefore="268" lsp="exactly" lspExact="253" language="en">

<ln l="1440" t="12528" r="3302" b="12730" baseLine="12677" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">

<wd l="1440" t="12528" r="1709" b="12686">2.2</wd>

<space/>

<wd l="1930" t="12528" r="2510" b="12730">Entity</wd>

<space/>

<wd l="2568" t="12528" r="3302" b="12730">Linking</wd>

</ln>

</para>

<para l="1440" t="12917" r="5808" b="14472" alignment="justified" spaceBefore="119" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="12917" r="5808" b="13075" baseLine="13070" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12922" r="1723" b="13075">We</wd>

<space/>

<wd l="1819" t="12917" r="2654" b="13075">formalize</wd>

<space/>

<wd l="2760" t="12970" r="3048" b="13075">our</wd>

<space/>

<wd l="3139" t="12922" r="3408" b="13070">EL</wd>

<space/>

<wd l="3504" t="12917" r="3854" b="13075">task</wd>

<space/>

<wd l="3955" t="12970" r="4123" b="13075">as</wd>

<space/>

<wd l="4229" t="12917" r="4920" b="13075">follows:</wd>

<space/>

<wd l="5093" t="12917" r="5616" b="13075">Given</wd>

<space/>

<wd l="5712" t="12970" r="5808" b="13075">a</wd>

<space/>

</ln>

<ln l="1440" t="13190" r="5803" b="13392" baseLine="13339" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13214" r="1954" b="13378">tweet,</wd>

<space/>

<wd l="2093" t="13243" r="2386" b="13349">our</wd>

<space/>

<wd l="2491" t="13190" r="2861" b="13392">goal</wd>

<space/>

<wd l="2971" t="13190" r="3110" b="13349">is</wd>

<space/>

<wd l="3226" t="13214" r="3394" b="13349">to</wd>

<space/>

<wd l="3504" t="13190" r="4354" b="13392">recognize</wd>

<space/>

<wd l="4469" t="13243" r="4565" b="13349">a</wd>

<space/>

<wd l="4675" t="13214" r="4910" b="13349">set</wd>

<space/>

<wd l="5021" t="13190" r="5213" b="13349">of</wd>

<space/>

<wd l="5314" t="13190" r="5803" b="13392">entity</wd>

<space/>

</ln>

<ln l="1440" t="13459" r="5808" b="13661" baseLine="13608">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="13459" r="2232" b="13618">mentions</wd>

<space/>

<wd l="2304" t="13464" r="2726" b="13661">(e.g.,</wd>

<space/>

</run>

<wd l="2803" t="13459" r="3480" b="13646"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Obama</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3547" t="13459" r="4382" b="13618">President</wd>

<space/>

</run>

<wd l="4440" t="13459" r="5117" b="13646"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Obama</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5179" t="13459" r="5808" b="13618">Barack</wd>

<space/>

</run>

</ln>

<ln l="1450" t="13733" r="5803" b="13934" baseLine="13882">

<wd l="1450" t="13733" r="2146" b="13930"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Obama</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2232" t="13733" r="2563" b="13891">that</wd>

<space/>

<wd l="2645" t="13786" r="3226" b="13934">appear</wd>

<space/>

<wd l="3298" t="13733" r="3470" b="13886">in</wd>

<space/>

<wd l="3552" t="13786" r="3648" b="13891">a</wd>

<space/>

<wd l="3720" t="13757" r="4238" b="13920">tweet,</wd>

<space/>

<wd l="4334" t="13733" r="4646" b="13891">and</wd>

<space/>

<wd l="4723" t="13733" r="5102" b="13891">then</wd>

<space/>

<wd l="5179" t="13733" r="5803" b="13891">resolve</wd>

<space/>

</run>

</ln>

<ln l="1440" t="13982" r="5794" b="14203" baseLine="14150">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="14002" r="1704" b="14160">the</wd>

<space/>

<wd l="1776" t="14002" r="2568" b="14160">mentions</wd>

<space/>

<wd l="2645" t="14002" r="2981" b="14160">into</wd>

<space/>

<wd l="3058" t="14002" r="3677" b="14160">entities</wd>

<space/>

<wd l="3763" t="14006" r="4186" b="14203">(e.g.,</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4282" t="13992" r="4944" b="14165">Barack</wd>

<space/>

</run>

<wd l="5021" t="13992" r="5794" b="14198"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Obama</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="1440" t="14270" r="3686" b="14472" baseLine="14424" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14270" r="1613" b="14424">in</wd>

<space/>

<wd l="1666" t="14270" r="2568" b="14472">Wikipedia</wd>

<space/>

<wd l="2621" t="14270" r="2765" b="14424">if</wd>

<space/>

<wd l="2808" t="14270" r="3178" b="14472">they</wd>

<space/>

<wd l="3240" t="14270" r="3686" b="14429">exist.</wd>

</ln>

</para>

<para l="1440" t="14563" r="5803" b="15307" alignment="justified" spaceBefore="21" spaceAfter="32" fli="216" lsp="exactly" lspExact="272" language="en">

<ln l="1661" t="14563" r="5794" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1661" t="14568" r="2002" b="14722">Our</wd>

<space/>

<wd l="2050" t="14568" r="2318" b="14717">EL</wd>

<space/>

<wd l="2381" t="14587" r="2981" b="14765">system</wd>

<space/>

<wd l="3034" t="14563" r="3859" b="14722">addresses</wd>

<space/>

<wd l="3922" t="14563" r="4186" b="14722">the</wd>

<space/>

<wd l="4238" t="14563" r="4594" b="14722">task</wd>

<space/>

<wd l="4646" t="14563" r="5112" b="14765">using</wd>

<space/>

<wd l="5170" t="14563" r="5438" b="14722">the</wd>

<space/>

<wd l="5491" t="14563" r="5794" b="14722">fol-</wd>

</ln>

<ln l="1440" t="14837" r="5803" b="15038" baseLine="14986">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1440" t="14837" r="2035" b="15038">lowing</wd>

<space/>

<wd l="2126" t="14861" r="2448" b="14995">two</wd>

<space/>

<wd l="2544" t="14861" r="3019" b="15038">steps;</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="3134" t="14846" r="3830" b="14995">mention</wd>

<space/>

<wd l="3926" t="14837" r="4776" b="14995">candidate</wd>

<space/>

<wd l="4867" t="14846" r="5803" b="15038">generation</wd>

<space/>

</run>

</ln>

<ln l="1445" t="15106" r="5203" b="15307" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="15106" r="1757" b="15264">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1810" t="15115" r="2510" b="15264">mention</wd>

<space/>

<wd l="2568" t="15106" r="3365" b="15264">detection</wd>

<space/>

<wd l="3422" t="15106" r="3754" b="15264">and</wd>

<space/>

</run>

<wd l="3802" t="15106" r="5203" b="15307"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">disambiguation</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

</ln>

</para>

</column>

<column l="6144" t="1260" r="10531" b="15359">

<para l="6144" t="1320" r="9720" b="1478" alignment="left" spaceBefore="20" lsp="exactly" lspExact="253" language="en">

<ln l="6144" t="1320" r="9720" b="1478" baseLine="1474" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1320" r="6576" b="1478">2.2.1</wd>

<space/>

<wd l="6802" t="1320" r="7589" b="1478">Mention</wd>

<space/>

<wd l="7651" t="1320" r="8611" b="1478">Candidate</wd>

<space/>

<wd l="8674" t="1320" r="9720" b="1478">Generation</wd>

</ln>

</para>

<para l="6144" t="1651" r="10526" b="3706" alignment="justified" spaceBefore="52" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="1651" r="10502" b="1853" baseLine="1800" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="1656" r="6490" b="1810">Our</wd>

<space/>

<wd l="6571" t="1675" r="7171" b="1853">system</wd>

<space/>

<wd l="7253" t="1651" r="7589" b="1810">first</wd>

<space/>

<wd l="7670" t="1675" r="8477" b="1853">generates</wd>

<space/>

<wd l="8568" t="1704" r="8664" b="1810">a</wd>

<space/>

<wd l="8750" t="1675" r="8986" b="1810">set</wd>

<space/>

<wd l="9062" t="1651" r="9254" b="1810">of</wd>

<space/>

<wd l="9322" t="1651" r="10152" b="1810">candidate</wd>

<space/>

<wd l="10238" t="1704" r="10502" b="1810">en-</wd>

</ln>

<ln l="6144" t="1920" r="10502" b="2122" baseLine="2069" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="1920" r="6432" b="2122">tity</wd>

<space/>

<wd l="6504" t="1920" r="7296" b="2078">mentions</wd>

<space/>

<wd l="7368" t="1920" r="7762" b="2078">with</wd>

<space/>

<wd l="7824" t="1920" r="8093" b="2078">the</wd>

<space/>

<wd l="8170" t="1944" r="8405" b="2078">set</wd>

<space/>

<wd l="8472" t="1920" r="8664" b="2078">of</wd>

<space/>

<wd l="8722" t="1920" r="9960" b="2122">corresponding</wd>

<space/>

<wd l="10032" t="1920" r="10502" b="2078">refer-</wd>

</ln>

<ln l="6149" t="2189" r="10526" b="2390" baseLine="2342" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="2213" r="6413" b="2347">ent</wd>

<space/>

<wd l="6490" t="2189" r="7162" b="2347">entities.</wd>

<space/>

<wd l="7296" t="2189" r="7632" b="2347">The</wd>

<space/>

<wd l="7718" t="2213" r="8318" b="2390">system</wd>

<space/>

<wd l="8390" t="2189" r="8827" b="2347">takes</wd>

<space/>

<wd l="8914" t="2189" r="9125" b="2347">all</wd>

<space/>

<wd l="9202" t="2189" r="9466" b="2347">the</wd>

<space/>

<wd l="9542" t="2242" r="10248" b="2390">n-grams</wd>

<space/>

<wd l="10334" t="2189" r="10526" b="2347">of</wd>

<space/>

</ln>

<ln l="6149" t="2462" r="10498" b="2664" baseLine="2611">

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><wd l="6149" t="2515" r="6269" b="2621">n</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1400" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><wd l="6360" t="2477" r="6499" b="2650">≤</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><wd l="6605" t="2467" r="6797" b="2621">10</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6869" t="2462" r="7181" b="2621">and</wd>

<space/>

<wd l="7238" t="2462" r="7704" b="2621">looks</wd>

<space/>

<wd l="7771" t="2515" r="7987" b="2664">up</wd>

<space/>

<wd l="8054" t="2462" r="8453" b="2621">each</wd>

<space/>

<wd l="8510" t="2515" r="9144" b="2664">n-gram</wd>

<space/>

<wd l="9202" t="2462" r="9370" b="2616">in</wd>

<space/>

<wd l="9432" t="2515" r="9528" b="2621">a</wd>

<space/>

<wd l="9590" t="2462" r="10498" b="2664">dictionary,</wd>

<space/>

</run>

</ln>

<ln l="6144" t="2731" r="10502" b="2933" baseLine="2885" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2755" r="6610" b="2890">treats</wd>

<space/>

<wd l="6677" t="2784" r="6874" b="2890">an</wd>

<space/>

<wd l="6931" t="2784" r="7565" b="2933">n-gram</wd>

<space/>

<wd l="7618" t="2784" r="7786" b="2890">as</wd>

<space/>

<wd l="7853" t="2784" r="7949" b="2890">a</wd>

<space/>

<wd l="8002" t="2731" r="8832" b="2890">candidate</wd>

<space/>

<wd l="8890" t="2731" r="9605" b="2890">mention</wd>

<space/>

<wd l="9658" t="2731" r="9802" b="2885">if</wd>

<space/>

<wd l="9845" t="2731" r="9965" b="2890">it</wd>

<space/>

<wd l="10022" t="2731" r="10502" b="2890">exists</wd>

<space/>

</ln>

<ln l="6144" t="3005" r="10512" b="3206" baseLine="3154" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="3005" r="6317" b="3158">in</wd>

<space/>

<wd l="6384" t="3005" r="6653" b="3163">the</wd>

<space/>

<wd l="6730" t="3005" r="7637" b="3206">dictionary,</wd>

<space/>

<wd l="7728" t="3005" r="8040" b="3163">and</wd>

<space/>

<wd l="8112" t="3005" r="8698" b="3206">finally,</wd>

<space/>

<wd l="8789" t="3029" r="9600" b="3206">generates</wd>

<space/>

<wd l="9682" t="3058" r="9878" b="3163">an</wd>

<space/>

<wd l="9960" t="3029" r="10512" b="3206">output</wd>

<space/>

</ln>

<ln l="6149" t="3274" r="10512" b="3475" baseLine="3427" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="3274" r="6341" b="3432">of</wd>

<space/>

<wd l="6394" t="3274" r="6806" b="3475">pairs</wd>

<space/>

<wd l="6883" t="3274" r="7075" b="3432">of</wd>

<space/>

<wd l="7128" t="3274" r="7920" b="3432">mentions</wd>

<space/>

<wd l="7997" t="3274" r="8309" b="3432">and</wd>

<space/>

<wd l="8371" t="3274" r="8774" b="3432">their</wd>

<space/>

<wd l="8842" t="3274" r="9734" b="3432">associated</wd>

<space/>

<wd l="9797" t="3274" r="10512" b="3475">possible</wd>

<space/>

</ln>

<ln l="6144" t="3547" r="7550" b="3706" baseLine="3696" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="3547" r="6826" b="3706">referent</wd>

<space/>

<wd l="6883" t="3547" r="7550" b="3706">entities.</wd>

</ln>

</para>

<para l="6144" t="3974" r="10517" b="6888" alignment="justified" spaceBefore="158" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="3974" r="10517" b="4176" baseLine="4128">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="3974" r="7584" b="4176">Mention-Entity</wd>

<space/>

<wd l="7642" t="3974" r="8693" b="4176">Dictionary:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8928" t="3974" r="9264" b="4133">The</wd>

<space/>

<wd l="9331" t="3998" r="9931" b="4176">system</wd>

<space/>

<wd l="9984" t="4027" r="10349" b="4133">uses</wd>

<space/>

<wd l="10421" t="4027" r="10517" b="4133">a</wd>

<space/>

</run>

</ln>

<ln l="6144" t="4248" r="10502" b="4450" baseLine="4397">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="4258" r="7406" b="4450">mention-entity</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7459" t="4248" r="8333" b="4450">dictionary</wd>

<space/>

<wd l="8386" t="4248" r="8717" b="4406">that</wd>

<space/>

<wd l="8760" t="4301" r="9211" b="4450">maps</wd>

<space/>

<wd l="9274" t="4301" r="9370" b="4406">a</wd>

<space/>

<wd l="9413" t="4248" r="10128" b="4406">mention</wd>

<space/>

<wd l="10186" t="4301" r="10502" b="4406">sur-</wd>

</run>

</ln>

<ln l="6144" t="4517" r="10502" b="4718" baseLine="4666">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="4517" r="6504" b="4675">face</wd>

<space/>

<wd l="6595" t="4522" r="7013" b="4718">(e.g.,</wd>

<space/>

</run>

<wd l="7109" t="4517" r="7656" b="4718"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">apple</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="7742" t="4541" r="7910" b="4675">to</wd>

<space/>

<wd l="7992" t="4517" r="8256" b="4675">the</wd>

<space/>

<wd l="8333" t="4517" r="9048" b="4718">possible</wd>

<space/>

<wd l="9125" t="4517" r="9806" b="4675">referent</wd>

<space/>

<wd l="9883" t="4517" r="10502" b="4675">entities</wd>

<space/>

</run>

</ln>

<ln l="6154" t="4781" r="10512" b="4992" baseLine="4939">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6154" t="4795" r="6576" b="4992">(e.g.,</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6691" t="4781" r="7243" b="4992">Apple</wd>

<space/>

</run>

<wd l="7368" t="4781" r="7747" b="4978"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">Inc.</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7858" t="4781" r="8410" b="4992">Apple</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8520" t="4790" r="9173" b="4987">(food)).</wd>

<space/>

<wd l="9365" t="4790" r="9701" b="4949">The</wd>

<space/>

<wd l="9797" t="4790" r="10512" b="4992">possible</wd>

<space/>

</run>

</ln>

<ln l="6144" t="5059" r="10512" b="5261" baseLine="5208" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5059" r="6864" b="5218">mention</wd>

<space/>

<wd l="6950" t="5059" r="7646" b="5218">surfaces</wd>

<space/>

<wd l="7738" t="5059" r="7930" b="5218">of</wd>

<space/>

<wd l="8002" t="5112" r="8198" b="5218">an</wd>

<space/>

<wd l="8290" t="5059" r="8779" b="5261">entity</wd>

<space/>

<wd l="8866" t="5112" r="9130" b="5218">are</wd>

<space/>

<wd l="9216" t="5059" r="10008" b="5218">extracted</wd>

<space/>

<wd l="10085" t="5059" r="10512" b="5218">from</wd>

<space/>

</ln>

<ln l="6144" t="5328" r="10512" b="5530" baseLine="5482" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5328" r="6413" b="5486">the</wd>

<space/>

<wd l="6494" t="5328" r="7733" b="5530">corresponding</wd>

<space/>

<wd l="7814" t="5328" r="8717" b="5530">Wikipedia</wd>

<space/>

<wd l="8789" t="5381" r="9202" b="5530">page</wd>

<space/>

<wd l="9278" t="5328" r="9662" b="5515">title,</wd>

<space/>

<wd l="9754" t="5328" r="10022" b="5486">the</wd>

<space/>

<wd l="10099" t="5381" r="10512" b="5530">page</wd>

<space/>

</ln>

<ln l="6144" t="5602" r="10512" b="5803" baseLine="5750" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5602" r="6562" b="5760">titles</wd>

<space/>

<wd l="6658" t="5602" r="6850" b="5760">of</wd>

<space/>

<wd l="6917" t="5602" r="7186" b="5760">the</wd>

<space/>

<wd l="7267" t="5602" r="8174" b="5803">Wikipedia</wd>

<space/>

<wd l="8251" t="5654" r="8741" b="5803">pages</wd>

<space/>

<wd l="8832" t="5602" r="9158" b="5760">that</wd>

<space/>

<wd l="9240" t="5602" r="9912" b="5760">redirect</wd>

<space/>

<wd l="9994" t="5626" r="10157" b="5760">to</wd>

<space/>

<wd l="10243" t="5602" r="10512" b="5760">the</wd>

<space/>

</ln>

<ln l="6144" t="5870" r="10517" b="6072" baseLine="6024" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5923" r="6557" b="6072">page</wd>

<space/>

<wd l="6634" t="5870" r="6826" b="6029">of</wd>

<space/>

<wd l="6883" t="5870" r="7147" b="6029">the</wd>

<space/>

<wd l="7229" t="5870" r="7747" b="6072">entity,</wd>

<space/>

<wd l="7838" t="5870" r="8150" b="6029">and</wd>

<space/>

<wd l="8227" t="5870" r="8822" b="6029">anchor</wd>

<space/>

<wd l="8890" t="5894" r="9288" b="6029">texts</wd>

<space/>

<wd l="9370" t="5870" r="9542" b="6024">in</wd>

<space/>

<wd l="9610" t="5870" r="10517" b="6072">Wikipedia</wd>

<space/>

</ln>

<ln l="6149" t="6144" r="10512" b="6346" baseLine="6293" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="6144" r="6768" b="6302">articles</wd>

<space/>

<wd l="6859" t="6144" r="7190" b="6302">that</wd>

<space/>

<wd l="7272" t="6144" r="7723" b="6346">point</wd>

<space/>

<wd l="7805" t="6168" r="7973" b="6302">to</wd>

<space/>

<wd l="8064" t="6144" r="8328" b="6302">the</wd>

<space/>

<wd l="8414" t="6197" r="8822" b="6346">page</wd>

<space/>

<wd l="8914" t="6144" r="9106" b="6302">of</wd>

<space/>

<wd l="9178" t="6144" r="9442" b="6302">the</wd>

<space/>

<wd l="9533" t="6144" r="10056" b="6346">entity.</wd>

<space/>

<wd l="10224" t="6149" r="10512" b="6302">We</wd>

<space/>

</ln>

<ln l="6149" t="6413" r="10498" b="6614" baseLine="6566" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="6413" r="7152" b="6571">constructed</wd>

<space/>

<wd l="7200" t="6413" r="7507" b="6571">this</wd>

<space/>

<wd l="7574" t="6413" r="8448" b="6614">dictionary</wd>

<space/>

<wd l="8506" t="6413" r="8971" b="6614">using</wd>

<space/>

<wd l="9029" t="6413" r="9293" b="6571">the</wd>

<space/>

<wd l="9346" t="6418" r="10022" b="6614">January</wd>

<space/>

<wd l="10080" t="6413" r="10498" b="6571">2015</wd>

<space/>

</ln>

<ln l="6149" t="6686" r="7877" b="6888" baseLine="6835" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="6686" r="6638" b="6888">dump</wd>

<space/>

<wd l="6701" t="6686" r="6893" b="6845">of</wd>

<space/>

<wd l="6931" t="6686" r="7877" b="6888">Wikipedia.</wd>

</ln>

</para>

<para l="6144" t="7114" r="10512" b="9211" alignment="justified" spaceBefore="160" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="7114" r="10512" b="7315" baseLine="7267">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="7114" r="7373" b="7315">Approximate</wd>

<space/>

<wd l="7613" t="7114" r="8573" b="7272">Candidate</wd>

<space/>

<wd l="8808" t="7114" r="9912" b="7272">Generation:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="10152" t="7118" r="10512" b="7272">One</wd>

<space/>

</run>

</ln>

<ln l="6144" t="7387" r="10502" b="7589" baseLine="7536" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7387" r="6658" b="7589">major</wd>

<space/>

<wd l="6778" t="7387" r="7507" b="7589">problem</wd>

<space/>

<wd l="7632" t="7387" r="7824" b="7546">of</wd>

<space/>

<wd l="7934" t="7387" r="8198" b="7546">the</wd>

<space/>

<wd l="8323" t="7387" r="9043" b="7546">mention</wd>

<space/>

<wd l="9168" t="7387" r="9998" b="7546">candidate</wd>

<space/>

<wd l="10128" t="7440" r="10502" b="7589">gen-</wd>

</ln>

<ln l="6149" t="7656" r="10512" b="7858" baseLine="7810" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="7656" r="6754" b="7814">eration</wd>

<space/>

<wd l="6893" t="7656" r="7243" b="7814">task</wd>

<space/>

<wd l="7387" t="7656" r="7522" b="7814">is</wd>

<space/>

<wd l="7670" t="7656" r="8002" b="7814">that</wd>

<space/>

<wd l="8141" t="7709" r="8616" b="7858">many</wd>

<space/>

<wd l="8765" t="7656" r="9254" b="7858">entity</wd>

<space/>

<wd l="9398" t="7656" r="10190" b="7814">mentions</wd>

<space/>

<wd l="10339" t="7656" r="10512" b="7810">in</wd>

<space/>

</ln>

<ln l="6144" t="7930" r="10502" b="8131" baseLine="8078" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="7954" r="6696" b="8088">tweets</wd>

<space/>

<wd l="6773" t="7954" r="7354" b="8088">cannot</wd>

<space/>

<wd l="7416" t="7930" r="7622" b="8088">be</wd>

<space/>

<wd l="7694" t="7930" r="8419" b="8088">detected</wd>

<space/>

<wd l="8486" t="7930" r="9173" b="8088">because</wd>

<space/>

<wd l="9240" t="7930" r="9610" b="8131">they</wd>

<space/>

<wd l="9686" t="7982" r="10267" b="8131">appear</wd>

<space/>

<wd l="10334" t="7982" r="10502" b="8088">as</wd>

<space/>

</ln>

<ln l="6144" t="8198" r="10498" b="8400" baseLine="8347">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="8198" r="6898" b="8400">irregular</wd>

<space/>

<wd l="6946" t="8198" r="7450" b="8357">forms</wd>

<space/>

<wd l="7522" t="8203" r="7944" b="8400">(e.g.,</wd>

<space/>

</run>

<wd l="8006" t="8198" r="9130" b="8400"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">misspellings</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

<wd l="9197" t="8198" r="10498" b="8395"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">abbreviations</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

</ln>

<ln l="6144" t="8472" r="10512" b="8674" baseLine="8621" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8477" r="6326" b="8626">In</wd>

<space/>

<wd l="6432" t="8472" r="6893" b="8630">order</wd>

<space/>

<wd l="6989" t="8496" r="7157" b="8630">to</wd>

<space/>

<wd l="7267" t="8472" r="7910" b="8630">address</wd>

<space/>

<wd l="8021" t="8472" r="8328" b="8630">this</wd>

<space/>

<wd l="8434" t="8472" r="9206" b="8674">problem,</wd>

<space/>

<wd l="9331" t="8525" r="9586" b="8630">we</wd>

<space/>

<wd l="9686" t="8472" r="10512" b="8630">introduce</wd>

<space/>

</ln>

<ln l="6144" t="8741" r="10507" b="8942" baseLine="8890" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8741" r="6413" b="8899">the</wd>

<space/>

<wd l="6499" t="8741" r="7339" b="8942">following</wd>

<space/>

<wd l="7430" t="8741" r="7862" b="8899">three</wd>

<space/>

<wd l="7958" t="8741" r="9043" b="8942">approximate</wd>

<space/>

<wd l="9139" t="8741" r="10507" b="8942">string-matching</wd>

<space/>

</ln>

<ln l="6144" t="9010" r="9874" b="9211" baseLine="9163" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9010" r="6878" b="9168">methods</wd>

<space/>

<wd l="6941" t="9034" r="7104" b="9168">to</wd>

<space/>

<wd l="7162" t="9010" r="7882" b="9211">improve</wd>

<space/>

<wd l="7939" t="9010" r="8203" b="9168">the</wd>

<space/>

<wd l="8266" t="9010" r="8813" b="9211">ability</wd>

<space/>

<wd l="8875" t="9010" r="9067" b="9168">of</wd>

<space/>

<wd l="9110" t="9010" r="9418" b="9168">this</wd>

<space/>

<wd l="9480" t="9010" r="9874" b="9168">task:</wd>

</ln>

</para>

<para l="6384" t="9494" r="10512" b="10512" alignment="justified" li="432" spaceBefore="212" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="9494" r="10502" b="9696" baseLine="9648">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6384" t="9504" r="6581" b="9648">•</wd>

<tab position="6465"/>

<wd l="6581" t="9504" r="7090" b="9696">Fuzzy</wd>

<space/>

<wd l="7142" t="9494" r="7666" b="9653">match</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7728" t="9494" r="8453" b="9653">searches</wd>

<space/>

<wd l="8510" t="9494" r="8774" b="9653">the</wd>

<space/>

<wd l="8827" t="9494" r="9542" b="9653">mention</wd>

<space/>

<wd l="9595" t="9494" r="10502" b="9653">candidates</wd>

<space/>

</run>

</ln>

<ln l="6581" t="9768" r="10502" b="9926" baseLine="9917" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="9768" r="6912" b="9926">that</wd>

<space/>

<wd l="6994" t="9768" r="7397" b="9926">have</wd>

<space/>

<wd l="7483" t="9792" r="7805" b="9926">text</wd>

<space/>

<wd l="7896" t="9768" r="8592" b="9926">surfaces</wd>

<space/>

<wd l="8683" t="9768" r="9245" b="9926">within</wd>

<space/>

<wd l="9331" t="9821" r="9427" b="9926">a</wd>

<space/>

<wd l="9514" t="9768" r="10099" b="9926">certain</wd>

<space/>

<wd l="10190" t="9768" r="10502" b="9926">dis-</wd>

</ln>

<ln l="6581" t="10037" r="10512" b="10238" baseLine="10190" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="10061" r="7042" b="10195">tance</wd>

<space/>

<wd l="7114" t="10037" r="7306" b="10195">of</wd>

<space/>

<wd l="7358" t="10037" r="7627" b="10195">the</wd>

<space/>

<wd l="7704" t="10037" r="8323" b="10195">surface</wd>

<space/>

<wd l="8395" t="10037" r="8587" b="10195">of</wd>

<space/>

<wd l="8640" t="10037" r="8909" b="10195">the</wd>

<space/>

<wd l="8976" t="10090" r="9610" b="10238">n-gram</wd>

<space/>

<wd l="9677" t="10037" r="10512" b="10195">measured</wd>

<space/>

</ln>

<ln l="6581" t="10310" r="7997" b="10512" baseLine="10459" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="10310" r="6797" b="10512">by</wd>

<space/>

<wd l="6859" t="10310" r="7186" b="10469">edit</wd>

<space/>

<wd l="7243" t="10310" r="7997" b="10469">distance.</wd>

</ln>

</para>

<para l="6384" t="10670" r="10512" b="11693" alignment="justified" li="432" spaceBefore="97" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="10675" r="10512" b="10877" baseLine="10829">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="10680" r="6566" b="10829">•</wd>

<tab position="6467"/>

<wd l="6566" t="10680" r="7694" b="10877">Approximate</wd>

<space/>

<wd l="7810" t="10675" r="8270" b="10834">token</wd>

<space/>

<wd l="8381" t="10675" r="8947" b="10834">search</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9062" t="10675" r="9682" b="10834">obtains</wd>

<space/>

<wd l="9797" t="10675" r="10512" b="10834">mention</wd>

<space/>

</run>

</ln>

<ln l="6586" t="10949" r="10502" b="11150" baseLine="11098" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="10949" r="7493" b="11107">candidates</wd>

<space/>

<wd l="7560" t="10949" r="8117" b="11107">whose</wd>

<space/>

<wd l="8174" t="10973" r="8501" b="11107">text</wd>

<space/>

<wd l="8563" t="10949" r="9259" b="11107">surfaces</wd>

<space/>

<wd l="9326" t="10949" r="9730" b="11107">have</wd>

<space/>

<wd l="9792" t="11002" r="9888" b="11107">a</wd>

<space/>

<wd l="9950" t="10949" r="10502" b="11150">signif-</wd>

</ln>

<ln l="6581" t="11218" r="10502" b="11376" baseLine="11371" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="11218" r="7008" b="11376">icant</wd>

<space/>

<wd l="7066" t="11218" r="7459" b="11376">ratio</wd>

<space/>

<wd l="7526" t="11218" r="7718" b="11376">of</wd>

<space/>

<wd l="7762" t="11218" r="8285" b="11376">words</wd>

<space/>

<wd l="8352" t="11218" r="8525" b="11371">in</wd>

<space/>

<wd l="8587" t="11270" r="9346" b="11376">common</wd>

<space/>

<wd l="9403" t="11218" r="9792" b="11376">with</wd>

<space/>

<wd l="9850" t="11218" r="10118" b="11376">the</wd>

<space/>

<wd l="10186" t="11270" r="10502" b="11376">sur-</wd>

</ln>

<ln l="6581" t="11491" r="8227" b="11693" baseLine="11640" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="11491" r="6941" b="11650">face</wd>

<space/>

<wd l="7003" t="11491" r="7195" b="11650">of</wd>

<space/>

<wd l="7234" t="11491" r="7498" b="11650">the</wd>

<space/>

<wd l="7555" t="11544" r="8227" b="11693">n-gram.</wd>

</ln>

</para>

<para l="6384" t="11856" r="10502" b="12600" alignment="justified" li="432" spaceBefore="94" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="11856" r="10502" b="12058" baseLine="12010">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6384" t="11861" r="6566" b="12010">•</wd>

<tab position="6467"/>

<wd l="6566" t="11861" r="7354" b="12058">Acronym</wd>

<space/>

<wd l="7411" t="11856" r="7978" b="12014">search</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="8030" t="11856" r="8765" b="12014">retrieves</wd>

<space/>

<wd l="8822" t="11856" r="9542" b="12014">mention</wd>

<space/>

<wd l="9595" t="11856" r="10502" b="12014">candidates</wd>

<space/>

</run>

</ln>

<ln l="6581" t="12091" r="10502" b="12331" baseLine="12274">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6581" t="12130" r="6970" b="12288">with</wd>

<space/>

<wd l="7022" t="12130" r="7738" b="12331">possible</wd>

<space/>

</run>

<wd l="7795" t="12091" r="8712" b="12331"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">acronyms</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="8779" t="12130" r="9110" b="12288">that</wd>

<space/>

<wd l="9158" t="12130" r="9802" b="12288">include</wd>

<space/>

<wd l="9854" t="12130" r="10123" b="12288">the</wd>

<space/>

<wd l="10186" t="12182" r="10502" b="12288">sur-</wd>

</run>

</ln>

<ln l="6581" t="12398" r="8227" b="12600" baseLine="12547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="12398" r="6941" b="12557">face</wd>

<space/>

<wd l="7003" t="12398" r="7195" b="12557">of</wd>

<space/>

<wd l="7234" t="12398" r="7498" b="12557">the</wd>

<space/>

<wd l="7555" t="12451" r="8227" b="12600">n-gram.</wd>

</ln>

</para>

<para l="6144" t="12883" r="10512" b="14712" alignment="justified" spaceBefore="215" spaceAfter="116" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="12883" r="10512" b="13085" baseLine="13032" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6365" t="12883" r="6888" b="13042">When</wd>

<space/>

<wd l="6974" t="12883" r="7445" b="13085">using</wd>

<space/>

<wd l="7536" t="12883" r="7800" b="13042">the</wd>

<space/>

<wd l="7896" t="12883" r="8405" b="13042">above</wd>

<space/>

<wd l="8491" t="12883" r="9274" b="13070">methods,</wd>

<space/>

<wd l="9384" t="12936" r="9638" b="13042">we</wd>

<space/>

<wd l="9730" t="12883" r="10512" b="13042">observed</wd>

<space/>

</ln>

<ln l="6144" t="13157" r="10502" b="13315" baseLine="13306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="13157" r="6475" b="13315">that</wd>

<space/>

<wd l="6562" t="13157" r="6826" b="13315">the</wd>

<space/>

<wd l="6912" t="13157" r="7584" b="13315">number</wd>

<space/>

<wd l="7670" t="13157" r="7862" b="13315">of</wd>

<space/>

<wd l="7939" t="13157" r="8654" b="13315">mention</wd>

<space/>

<wd l="8746" t="13157" r="9653" b="13315">candidates</wd>

<space/>

<wd l="9749" t="13157" r="10502" b="13315">becomes</wd>

<space/>

</ln>

<ln l="6144" t="13426" r="10502" b="13627" baseLine="13574" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="13478" r="6528" b="13627">very</wd>

<space/>

<wd l="6595" t="13426" r="7070" b="13627">large.</wd>

<space/>

<wd l="7176" t="13430" r="7397" b="13584">To</wd>

<space/>

<wd l="7469" t="13426" r="7824" b="13584">deal</wd>

<space/>

<wd l="7891" t="13426" r="8280" b="13584">with</wd>

<space/>

<wd l="8342" t="13426" r="8702" b="13613">this,</wd>

<space/>

<wd l="8779" t="13478" r="9034" b="13584">we</wd>

<space/>

<wd l="9096" t="13478" r="9384" b="13584">use</wd>

<space/>

<wd l="9456" t="13478" r="9552" b="13584">a</wd>

<space/>

<wd l="9619" t="13426" r="10190" b="13627">simple</wd>

<space/>

<wd l="10262" t="13426" r="10502" b="13579">fil-</wd>

</ln>

<ln l="6144" t="13690" r="10498" b="13896" baseLine="13848">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6144" t="13694" r="6653" b="13896">tering</wd>

<space/>

<wd l="6734" t="13694" r="7392" b="13853">method</wd>

<space/>

<wd l="7474" t="13694" r="7968" b="13853">based</wd>

<space/>

<wd l="8054" t="13747" r="8270" b="13853">on</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="8347" t="13699" r="8669" b="13896">soft</wd>

<space/>

<wd l="8750" t="13694" r="9206" b="13896">tf-idf</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="9293" t="13694" r="9926" b="13891">(Cohen</wd>

<space/>

<wd l="10013" t="13718" r="10166" b="13853">et</wd>

<space/>

<wd l="10248" t="13694" r="10498" b="13882">al.,</wd>

<space/>

</run>

</ln>

<ln l="6149" t="13968" r="10502" b="14170" baseLine="14117" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="13973" r="6701" b="14165">2003);</wd>

<space/>

<wd l="6768" t="14021" r="7022" b="14126">we</wd>

<space/>

<wd l="7085" t="13968" r="7666" b="14170">simply</wd>

<space/>

<wd l="7723" t="14021" r="8011" b="14126">use</wd>

<space/>

<wd l="8069" t="13968" r="8448" b="14170">only</wd>

<space/>

<wd l="8506" t="13968" r="8770" b="14126">the</wd>

<space/>

<wd l="8822" t="13968" r="9538" b="14126">mention</wd>

<space/>

<wd l="9595" t="13968" r="10502" b="14126">candidates</wd>

<space/>

</ln>

<ln l="6144" t="14237" r="10502" b="14438" baseLine="14390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="14237" r="6475" b="14395">that</wd>

<space/>

<wd l="6518" t="14237" r="6922" b="14395">have</wd>

<space/>

<wd l="6974" t="14290" r="7070" b="14395">a</wd>

<space/>

<wd l="7123" t="14237" r="7949" b="14438">similarity</wd>

<space/>

<wd l="8002" t="14261" r="8606" b="14438">greater</wd>

<space/>

<wd l="8650" t="14237" r="9029" b="14395">than</wd>

<space/>

<wd l="9077" t="14290" r="9173" b="14395">a</wd>

<space/>

<wd l="9216" t="14237" r="10027" b="14395">threshold</wd>

<space/>

<wd l="10075" t="14290" r="10502" b="14395">mea-</wd>

</ln>

<ln l="6154" t="14510" r="10512" b="14712" baseLine="14659" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="14510" r="6619" b="14669">sured</wd>

<space/>

<wd l="6662" t="14510" r="6878" b="14712">by</wd>

<space/>

<wd l="6926" t="14510" r="7190" b="14669">the</wd>

<space/>

<wd l="7248" t="14510" r="7565" b="14669">soft</wd>

<space/>

<wd l="7608" t="14510" r="8102" b="14669">tf-idf.</wd>

<space/>

<wd l="8179" t="14515" r="8462" b="14669">We</wd>

<space/>

<wd l="8506" t="14563" r="8798" b="14669">use</wd>

<space/>

<wd l="8846" t="14515" r="9106" b="14669">0.9</wd>

<space/>

<wd l="9163" t="14563" r="9336" b="14669">as</wd>

<space/>

<wd l="9389" t="14510" r="9653" b="14669">the</wd>

<space/>

<wd l="9701" t="14510" r="10512" b="14669">threshold</wd>

</ln>

</para>

<rulerline l="6144" t="14846" r="7344" b="14846" type="single" width="10" color="000000"/>

<para l="6149" t="14904" r="10507" b="15302" alignment="justified" spaceBefore="66" spaceAfter="38" fli="216" lsp="exactly" lspExact="203" language="en">

<ln l="6398" t="14904" r="10507" b="15106" baseLine="15056">

<wd l="6398" t="14904" r="6701" b="15067"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">2</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">We</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="6744" t="14957" r="7344" b="15106">generate</wd>

<space/>

<wd l="7387" t="14976" r="8069" b="15106">acronyms</wd>

<space/>

<wd l="8112" t="14938" r="8290" b="15106">by</wd>

<space/>

<wd l="8328" t="14938" r="9077" b="15106">tokenizing</wd>

<space/>

<wd l="9115" t="14938" r="9331" b="15067">the</wd>

<space/>

<wd l="9370" t="14938" r="9960" b="15067">mention</wd>

<space/>

<wd l="9998" t="14938" r="10507" b="15067">surface</wd>

<space/>

</run>

</ln>

<ln l="6149" t="15134" r="10464" b="15302" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="15134" r="6408" b="15264">and</wd>

<space/>

<wd l="6456" t="15134" r="6936" b="15302">simply</wd>

<space/>

<wd l="6984" t="15134" r="7426" b="15302">taking</wd>

<space/>

<wd l="7474" t="15134" r="7690" b="15264">the</wd>

<space/>

<wd l="7742" t="15134" r="8021" b="15264">first</wd>

<space/>

<wd l="8064" t="15134" r="8784" b="15264">characters</wd>

<space/>

<wd l="8842" t="15134" r="8995" b="15264">of</wd>

<space/>

<wd l="9029" t="15134" r="9245" b="15264">the</wd>

<space/>

<wd l="9293" t="15134" r="9917" b="15302">resulting</wd>

<space/>

<wd l="9965" t="15134" r="10464" b="15264">tokens.</wd>

</ln>

</para>

</column>

</section>

<dd l="1437" t="15746" r="10531" b="15975">

<para l="5771" t="15792" r="6196" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15792" r="6130" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="28">

<wd l="5837" t="15792" r="6130" b="15946">137</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4320.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1437" marginTop="1262" marginRight="1378" marginBottom="1292" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1437" t="1262" r="10531" b="15318">

<column l="1437" t="1262" r="5824" b="15318">

<para l="1440" t="1320" r="5808" b="1795" alignment="justified" lsp="exactly" lspExact="269" language="en">

<ln l="1440" t="1320" r="5808" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1320" r="2131" b="1478">because</wd>

<space/>

<wd l="2194" t="1320" r="2501" b="1478">this</wd>

<space/>

<wd l="2578" t="1320" r="3307" b="1478">achieves</wd>

<space/>

<wd l="3374" t="1320" r="3643" b="1478">the</wd>

<space/>

<wd l="3706" t="1320" r="4056" b="1478">best</wd>

<space/>

<wd l="4118" t="1320" r="5218" b="1522">performance</wd>

<space/>

<wd l="5285" t="1320" r="5453" b="1474">in</wd>

<space/>

<wd l="5520" t="1373" r="5808" b="1478">our</wd>

<space/>

</ln>

<ln l="1445" t="1594" r="3106" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="1594" r="2496" b="1795">experiments</wd>

<space/>

<wd l="2563" t="1594" r="2755" b="1752">of</wd>

<space/>

<wd l="2794" t="1598" r="3106" b="1752">EL.</wd>

</ln>

</para>

<para l="1440" t="2040" r="5760" b="2242" alignment="justified" spaceBefore="199" lsp="exactly" lspExact="253" language="en">

<ln l="1440" t="2040" r="5760" b="2242" baseLine="2194" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="2040" r="1872" b="2198">2.2.2</wd>

<space/>

<wd l="2093" t="2040" r="2880" b="2198">Mention</wd>

<space/>

<wd l="2938" t="2040" r="3821" b="2198">Detection</wd>

<space/>

<wd l="3883" t="2045" r="4229" b="2198">and</wd>

<space/>

<wd l="4282" t="2040" r="5760" b="2242">Disambiguation</wd>

</ln>

</para>

<para l="1440" t="2381" r="5803" b="3350" alignment="justified" spaceBefore="63" lsp="exactly" lspExact="271" language="en">

<ln l="1445" t="2381" r="5794" b="2582" baseLine="2530" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="2381" r="1968" b="2539">Given</wd>

<space/>

<wd l="2045" t="2434" r="2141" b="2539">a</wd>

<space/>

<wd l="2218" t="2381" r="2558" b="2582">pair</wd>

<space/>

<wd l="2635" t="2381" r="2827" b="2539">of</wd>

<space/>

<wd l="2894" t="2434" r="2990" b="2539">a</wd>

<space/>

<wd l="3067" t="2381" r="3782" b="2539">mention</wd>

<space/>

<wd l="3864" t="2381" r="4176" b="2539">and</wd>

<space/>

<wd l="4248" t="2381" r="4450" b="2539">its</wd>

<space/>

<wd l="4531" t="2381" r="5246" b="2582">possible</wd>

<space/>

<wd l="5323" t="2381" r="5794" b="2539">refer-</wd>

</ln>

<ln l="1445" t="2650" r="5803" b="2851" baseLine="2798" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="2674" r="1709" b="2808">ent</wd>

<space/>

<wd l="1762" t="2650" r="2285" b="2851">entity,</wd>

<space/>

<wd l="2347" t="2650" r="2472" b="2808">it</wd>

<space/>

<wd l="2525" t="2650" r="3010" b="2808">needs</wd>

<space/>

<wd l="3072" t="2674" r="3240" b="2808">to</wd>

<space/>

<wd l="3293" t="2650" r="3499" b="2808">be</wd>

<space/>

<wd l="3557" t="2650" r="4536" b="2808">determined</wd>

<space/>

<wd l="4584" t="2650" r="4733" b="2803">if</wd>

<space/>

<wd l="4771" t="2650" r="5035" b="2808">the</wd>

<space/>

<wd l="5088" t="2650" r="5803" b="2851">possible</wd>

<space/>

</ln>

<ln l="1440" t="2923" r="5794" b="3125" baseLine="3072" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2923" r="2122" b="3082">referent</wd>

<space/>

<wd l="2184" t="2923" r="2674" b="3125">entity</wd>

<space/>

<wd l="2741" t="2923" r="2875" b="3082">is</wd>

<space/>

<wd l="2947" t="2923" r="3533" b="3082">indeed</wd>

<space/>

<wd l="3590" t="2923" r="3859" b="3082">the</wd>

<space/>

<wd l="3926" t="2947" r="4526" b="3082">correct</wd>

<space/>

<wd l="4594" t="2976" r="4901" b="3082">one</wd>

<space/>

<wd l="4968" t="2923" r="5222" b="3082">for</wd>

<space/>

<wd l="5285" t="2923" r="5482" b="3082">its</wd>

<space/>

<wd l="5554" t="2976" r="5794" b="3082">as-</wd>

</ln>

<ln l="1450" t="3192" r="2966" b="3350" baseLine="3341" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="3192" r="2155" b="3350">sociated</wd>

<space/>

<wd l="2208" t="3192" r="2966" b="3350">mention.</wd>

</ln>

</para>

<para l="1440" t="3470" r="5808" b="4757" alignment="justified" spaceBefore="8" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="3470" r="5794" b="3672" baseLine="3624" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="3475" r="1843" b="3624">In</wd>

<space/>

<wd l="1925" t="3470" r="2232" b="3629">this</wd>

<space/>

<wd l="2333" t="3494" r="2976" b="3672">system,</wd>

<space/>

<wd l="3077" t="3523" r="3331" b="3629">we</wd>

<space/>

<wd l="3418" t="3523" r="3706" b="3629">use</wd>

<space/>

<wd l="3797" t="3523" r="3893" b="3629">a</wd>

<space/>

<wd l="3984" t="3470" r="4910" b="3672">supervised</wd>

<space/>

<wd l="4992" t="3470" r="5794" b="3629">machine-</wd>

</ln>

<ln l="1440" t="3744" r="5803" b="3946" baseLine="3893" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3744" r="2150" b="3946">learning</wd>

<space/>

<wd l="2237" t="3744" r="3082" b="3946">algorithm</wd>

<space/>

<wd l="3158" t="3768" r="3322" b="3902">to</wd>

<space/>

<wd l="3408" t="3744" r="3950" b="3946">assign</wd>

<space/>

<wd l="4027" t="3797" r="4123" b="3902">a</wd>

<space/>

<wd l="4200" t="3744" r="5021" b="3902">relevance</wd>

<space/>

<wd l="5107" t="3797" r="5558" b="3902">score</wd>

<space/>

<wd l="5635" t="3768" r="5803" b="3902">to</wd>

<space/>

</ln>

<ln l="1445" t="4013" r="5808" b="4214" baseLine="4166" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="4013" r="1843" b="4171">each</wd>

<space/>

<wd l="1891" t="4013" r="2083" b="4171">of</wd>

<space/>

<wd l="2112" t="4013" r="2381" b="4171">the</wd>

<space/>

<wd l="2424" t="4013" r="2842" b="4214">pairs</wd>

<space/>

<wd l="2899" t="4013" r="3211" b="4171">and</wd>

<space/>

<wd l="3269" t="4013" r="3758" b="4171">select</wd>

<space/>

<wd l="3802" t="4013" r="4066" b="4171">the</wd>

<space/>

<wd l="4118" t="4013" r="4608" b="4214">entity</wd>

<space/>

<wd l="4656" t="4013" r="5371" b="4171">mention</wd>

<space/>

<wd l="5419" t="4013" r="5808" b="4171">with</wd>

<space/>

</ln>

<ln l="1440" t="4286" r="5803" b="4488" baseLine="4435">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="4286" r="1704" b="4445">the</wd>

<space/>

<wd l="1790" t="4286" r="2424" b="4488">highest</wd>

<space/>

<wd l="2520" t="4339" r="3010" b="4445">score.</wd>

<space/>

<wd l="3182" t="4291" r="3470" b="4445">We</wd>

<space/>

<wd l="3557" t="4339" r="3845" b="4445">use</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3941" t="4286" r="4603" b="4445">random</wd>

<space/>

<wd l="4661" t="4291" r="5189" b="4488">forest</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5275" t="4339" r="5443" b="4445">as</wd>

<space/>

<wd l="5539" t="4286" r="5803" b="4445">the</wd>

<space/>

</run>

</ln>

<ln l="1440" t="4555" r="3912" b="4757" baseLine="4704" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="4555" r="2962" b="4757">machine-learning</wd>

<space/>

<wd l="3024" t="4555" r="3912" b="4757">algorithm.</wd>

</ln>

</para>

<para l="1440" t="4834" r="5808" b="7474" alignment="justified" spaceBefore="12" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="4834" r="5803" b="5035" baseLine="4987" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="4838" r="2126" b="5021">Here,</wd>

<space/>

<wd l="2189" t="4886" r="2443" b="4992">we</wd>

<space/>

<wd l="2496" t="4886" r="2784" b="4992">use</wd>

<space/>

<wd l="2837" t="4834" r="4363" b="5035">machine-learning</wd>

<space/>

<wd l="4416" t="4834" r="5098" b="4992">features</wd>

<space/>

<wd l="5160" t="4834" r="5491" b="4992">that</wd>

<space/>

<wd l="5544" t="4886" r="5803" b="4992">are</wd>

<space/>

</ln>

<ln l="1440" t="5107" r="5794" b="5309" baseLine="5256" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="5107" r="2030" b="5309">mostly</wd>

<space/>

<wd l="2136" t="5107" r="2885" b="5266">identical</wd>

<space/>

<wd l="2990" t="5131" r="3158" b="5266">to</wd>

<space/>

<wd l="3264" t="5107" r="3528" b="5266">the</wd>

<space/>

<wd l="3629" t="5107" r="4286" b="5266">method</wd>

<space/>

<wd l="4387" t="5107" r="5189" b="5309">proposed</wd>

<space/>

<wd l="5290" t="5107" r="5794" b="5309">previ-</wd>

</ln>

<ln l="1445" t="5376" r="5794" b="5578" baseLine="5530" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="5376" r="1910" b="5578">ously</wd>

<space/>

<wd l="1968" t="5376" r="2741" b="5573">(Yamada</wd>

<space/>

<wd l="2789" t="5400" r="2942" b="5534">et</wd>

<space/>

<wd l="2990" t="5376" r="3240" b="5563">al.,</wd>

<space/>

<wd l="3302" t="5376" r="3850" b="5573">2015).</wd>

<space/>

<wd l="3926" t="5376" r="4766" b="5578">Basically,</wd>

<space/>

<wd l="4829" t="5429" r="5083" b="5534">we</wd>

<space/>

<wd l="5126" t="5429" r="5419" b="5534">use</wd>

<space/>

<wd l="5462" t="5429" r="5794" b="5534">var-</wd>

</ln>

<ln l="1440" t="5650" r="5808" b="5851" baseLine="5798" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="5650" r="1795" b="5808">ious</wd>

<space/>

<wd l="1886" t="5650" r="2568" b="5808">features</wd>

<space/>

<wd l="2654" t="5650" r="2986" b="5808">that</wd>

<space/>

<wd l="3067" t="5702" r="3326" b="5808">are</wd>

<space/>

<wd l="3413" t="5650" r="4339" b="5851">commonly</wd>

<space/>

<wd l="4430" t="5650" r="5208" b="5808">observed</wd>

<space/>

<wd l="5290" t="5650" r="5458" b="5803">in</wd>

<space/>

<wd l="5539" t="5654" r="5808" b="5803">EL</wd>

<space/>

</ln>

<ln l="1450" t="5918" r="5803" b="6120" baseLine="6072" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1450" t="5918" r="2040" b="6077">studies</wd>

<space/>

<wd l="2141" t="5918" r="2453" b="6077">and</wd>

<space/>

<wd l="2549" t="5918" r="3259" b="6077">enhance</wd>

<space/>

<wd l="3350" t="5918" r="3614" b="6077">the</wd>

<space/>

<wd l="3710" t="5918" r="4810" b="6120">performance</wd>

<space/>

<wd l="4901" t="5918" r="5501" b="6077">further</wd>

<space/>

<wd l="5587" t="5918" r="5803" b="6120">by</wd>

<space/>

</ln>

<ln l="1440" t="6192" r="5794" b="6394" baseLine="6341" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="6192" r="2443" b="6394">introducing</wd>

<space/>

<wd l="2525" t="6216" r="2846" b="6350">two</wd>

<space/>

<wd l="2928" t="6245" r="3278" b="6350">new</wd>

<space/>

<wd l="3360" t="6192" r="4094" b="6350">features:</wd>

<space/>

<wd l="4253" t="6197" r="4397" b="6389">1)</wd>

<space/>

<wd l="4488" t="6192" r="4752" b="6350">the</wd>

<space/>

<wd l="4834" t="6192" r="5323" b="6394">entity</wd>

<space/>

<wd l="5405" t="6245" r="5794" b="6394">pop-</wd>

</ln>

<ln l="1440" t="6461" r="5803" b="6662" baseLine="6610" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="6461" r="2006" b="6662">ularity</wd>

<space/>

<wd l="2074" t="6461" r="3024" b="6662">knowledge</wd>

<space/>

<wd l="3091" t="6461" r="3883" b="6619">extracted</wd>

<space/>

<wd l="3946" t="6461" r="4373" b="6619">from</wd>

<space/>

<wd l="4430" t="6461" r="5338" b="6662">Wikipedia</wd>

<space/>

<wd l="5395" t="6514" r="5803" b="6662">page</wd>

<space/>

</ln>

<ln l="1440" t="6696" r="5808" b="6936" baseLine="6881">

<wd l="1440" t="6696" r="2078" b="6922"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">views</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">3</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="2179" t="6734" r="2491" b="6893">and</wd>

<space/>

<wd l="2573" t="6739" r="2741" b="6931">2)</wd>

<space/>

<wd l="2832" t="6734" r="3096" b="6893">the</wd>

<space/>

<wd l="3182" t="6734" r="4080" b="6893">contextual</wd>

<space/>

<wd l="4171" t="6734" r="4997" b="6936">similarity</wd>

<space/>

<wd l="5078" t="6734" r="5808" b="6893">between</wd>

<space/>

</run>

</ln>

<ln l="1440" t="7003" r="5794" b="7205" baseLine="7152" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="7003" r="1704" b="7162">the</wd>

<space/>

<wd l="1762" t="7003" r="2251" b="7205">entity</wd>

<space/>

<wd l="2309" t="7003" r="2616" b="7162">and</wd>

<space/>

<wd l="2664" t="7003" r="2933" b="7162">the</wd>

<space/>

<wd l="2981" t="7027" r="3456" b="7162">tweet</wd>

<space/>

<wd l="3504" t="7003" r="4339" b="7162">measured</wd>

<space/>

<wd l="4387" t="7003" r="4603" b="7205">by</wd>

<space/>

<wd l="4656" t="7003" r="5102" b="7162">word</wd>

<space/>

<wd l="5155" t="7003" r="5794" b="7162">embed-</wd>

</ln>

<ln l="1445" t="7272" r="1958" b="7474" baseLine="7426" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="7272" r="1958" b="7474">dings.</wd>

</ln>

</para>

<para l="1440" t="7752" r="4402" b="7954" alignment="left" spaceBefore="222" lsp="exactly" lspExact="253" language="en">

<ln l="1440" t="7752" r="4402" b="7954" baseLine="7901" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="7752" r="1709" b="7910">2.3</wd>

<space/>

<wd l="1930" t="7757" r="2597" b="7910">Named</wd>

<space/>

<wd l="2654" t="7752" r="3230" b="7954">Entity</wd>

<space/>

<wd l="3293" t="7752" r="4402" b="7954">Recognition</wd>

</ln>

</para>

<para l="1440" t="8117" r="5794" b="8592" alignment="justified" spaceBefore="98" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="8117" r="5794" b="8318" baseLine="8270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="8122" r="1723" b="8275">We</wd>

<space/>

<wd l="1790" t="8117" r="2429" b="8275">address</wd>

<space/>

<wd l="2496" t="8117" r="2765" b="8275">the</wd>

<space/>

<wd l="2822" t="8122" r="3259" b="8275">NER</wd>

<space/>

<wd l="3317" t="8117" r="3672" b="8275">task</wd>

<space/>

<wd l="3730" t="8117" r="3941" b="8318">by</wd>

<space/>

<wd l="4003" t="8117" r="4982" b="8318">performing</wd>

<space/>

<wd l="5045" t="8141" r="5366" b="8275">two</wd>

<space/>

<wd l="5438" t="8117" r="5794" b="8275">sub-</wd>

</ln>

<ln l="1440" t="8390" r="4776" b="8592" baseLine="8539">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="8390" r="1920" b="8549">tasks:</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2006" t="8400" r="3158" b="8592">segmentation</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3221" t="8390" r="3533" b="8549">and</wd>

<space/>

</run>

<wd l="3590" t="8390" r="4776" b="8592"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">classification</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="8837" r="5093" b="9038" alignment="left" spaceBefore="196" lsp="exactly" lspExact="253" language="en">

<ln l="1440" t="8837" r="5093" b="9038" baseLine="8990" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="8837" r="1867" b="8995">2.3.1</wd>

<space/>

<wd l="2098" t="8837" r="3365" b="9038">Segmentation</wd>

<space/>

<wd l="3427" t="8837" r="3619" b="8995">of</wd>

<space/>

<wd l="3658" t="8842" r="4325" b="8995">Named</wd>

<space/>

<wd l="4378" t="8837" r="5093" b="8995">Entities</wd>

</ln>

</para>

<para l="1440" t="9178" r="5808" b="11818" alignment="justified" spaceBefore="65" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="9178" r="5808" b="9379" baseLine="9326" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="9182" r="1622" b="9331">In</wd>

<space/>

<wd l="1728" t="9178" r="2035" b="9336">this</wd>

<space/>

<wd l="2155" t="9202" r="2544" b="9379">step,</wd>

<space/>

<wd l="2674" t="9178" r="3163" b="9379">entity</wd>

<space/>

<wd l="3274" t="9178" r="4066" b="9336">mentions</wd>

<space/>

<wd l="4181" t="9230" r="4445" b="9336">are</wd>

<space/>

<wd l="4555" t="9178" r="5280" b="9336">detected</wd>

<space/>

<wd l="5381" t="9178" r="5808" b="9336">from</wd>

<space/>

</ln>

<ln l="1440" t="9446" r="5808" b="9605" baseLine="9595" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="9470" r="2040" b="9605">tweets.</wd>

<space/>

<wd l="2160" t="9451" r="2443" b="9605">We</wd>

<space/>

<wd l="2515" t="9446" r="3350" b="9605">formalize</wd>

<space/>

<wd l="3418" t="9446" r="3725" b="9605">this</wd>

<space/>

<wd l="3802" t="9446" r="4152" b="9605">task</wd>

<space/>

<wd l="4224" t="9499" r="4392" b="9605">as</wd>

<space/>

<wd l="4469" t="9446" r="5160" b="9605">follows.</wd>

<space/>

<wd l="5285" t="9446" r="5808" b="9605">Given</wd>

<space/>

</ln>

<ln l="1445" t="9720" r="5798" b="9922" baseLine="9869" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="9773" r="1642" b="9878">an</wd>

<space/>

<wd l="1757" t="9773" r="2386" b="9922">n-gram</wd>

<space/>

<wd l="2491" t="9720" r="2664" b="9874">in</wd>

<space/>

<wd l="2774" t="9773" r="2870" b="9878">a</wd>

<space/>

<wd l="2976" t="9744" r="3494" b="9907">tweet,</wd>

<space/>

<wd l="3624" t="9720" r="3893" b="9878">the</wd>

<space/>

<wd l="4008" t="9720" r="4373" b="9922">goal</wd>

<space/>

<wd l="4493" t="9720" r="4680" b="9878">of</wd>

<space/>

<wd l="4776" t="9720" r="5083" b="9878">this</wd>

<space/>

<wd l="5198" t="9720" r="5554" b="9878">task</wd>

<space/>

<wd l="5659" t="9720" r="5798" b="9878">is</wd>

<space/>

</ln>

<ln l="1445" t="9989" r="5808" b="10190" baseLine="10138" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="9989" r="2261" b="10190">assigning</wd>

<space/>

<wd l="2362" t="10042" r="2458" b="10147">a</wd>

<space/>

<wd l="2544" t="9989" r="3096" b="10190">binary</wd>

<space/>

<wd l="3192" t="9989" r="3614" b="10147">label</wd>

<space/>

<wd l="3710" t="9989" r="4037" b="10147">that</wd>

<space/>

<wd l="4128" t="10013" r="5002" b="10190">represents</wd>

<space/>

<wd l="5102" t="9989" r="5808" b="10147">whether</wd>

<space/>

</ln>

<ln l="1440" t="10258" r="5794" b="10459" baseLine="10411" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="10258" r="1704" b="10416">the</wd>

<space/>

<wd l="1786" t="10310" r="2419" b="10459">n-gram</wd>

<space/>

<wd l="2501" t="10258" r="3077" b="10416">should</wd>

<space/>

<wd l="3154" t="10258" r="3355" b="10416">be</wd>

<space/>

<wd l="3442" t="10258" r="4162" b="10416">detected</wd>

<space/>

<wd l="4243" t="10310" r="4411" b="10416">as</wd>

<space/>

<wd l="4502" t="10310" r="4699" b="10416">an</wd>

<space/>

<wd l="4786" t="10258" r="5275" b="10459">entity</wd>

<space/>

<wd l="5357" t="10310" r="5794" b="10416">men-</wd>

</ln>

<ln l="1440" t="10531" r="5794" b="10733" baseLine="10680" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="10531" r="1824" b="10690">tion.</wd>

<space/>

<wd l="2026" t="10536" r="2448" b="10690">Note</wd>

<space/>

<wd l="2544" t="10531" r="2870" b="10690">that</wd>

<space/>

<wd l="2966" t="10531" r="3139" b="10685">in</wd>

<space/>

<wd l="3235" t="10531" r="3696" b="10690">order</wd>

<space/>

<wd l="3787" t="10555" r="3955" b="10690">to</wd>

<space/>

<wd l="4056" t="10531" r="4622" b="10690">enable</wd>

<space/>

<wd l="4718" t="10531" r="4982" b="10690">the</wd>

<space/>

<wd l="5088" t="10531" r="5794" b="10733">straight-</wd>

</ln>

<ln l="1440" t="10800" r="5794" b="11002" baseLine="10954" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="10800" r="2131" b="10958">forward</wd>

<space/>

<wd l="2213" t="10800" r="3154" b="11002">integration</wd>

<space/>

<wd l="3240" t="10800" r="3432" b="10958">of</wd>

<space/>

<wd l="3504" t="10805" r="3768" b="10954">EL</wd>

<space/>

<wd l="3854" t="10800" r="4166" b="10958">and</wd>

<space/>

<wd l="4248" t="10800" r="4555" b="10958">this</wd>

<space/>

<wd l="4646" t="10800" r="5045" b="10987">task,</wd>

<space/>

<wd l="5146" t="10853" r="5400" b="10958">we</wd>

<space/>

<wd l="5482" t="10800" r="5794" b="10958">for-</wd>

</ln>

<ln l="1440" t="11074" r="5798" b="11275" baseLine="11222" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11074" r="2021" b="11232">malize</wd>

<space/>

<wd l="2136" t="11074" r="2443" b="11232">this</wd>

<space/>

<wd l="2563" t="11074" r="2918" b="11232">task</wd>

<space/>

<wd l="3034" t="11126" r="3202" b="11232">as</wd>

<space/>

<wd l="3336" t="11074" r="3917" b="11275">simply</wd>

<space/>

<wd l="4037" t="11074" r="4973" b="11275">classifying</wd>

<space/>

<wd l="5093" t="11126" r="5798" b="11275">n-grams</wd>

<space/>

</ln>

<ln l="1440" t="11342" r="5794" b="11544" baseLine="11496" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11342" r="2059" b="11501">instead</wd>

<space/>

<wd l="2150" t="11342" r="2342" b="11501">of</wd>

<space/>

<wd l="2419" t="11342" r="2683" b="11501">the</wd>

<space/>

<wd l="2779" t="11342" r="4181" b="11544">commonly-used</wd>

<space/>

<wd l="4272" t="11347" r="4632" b="11501">IOB</wd>

<space/>

<wd l="4733" t="11342" r="5434" b="11544">labeling</wd>

<space/>

<wd l="5530" t="11395" r="5794" b="11544">ap-</wd>

</ln>

<ln l="1440" t="11616" r="4757" b="11818" baseLine="11765" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11616" r="2035" b="11818">proach</wd>

<space/>

<wd l="2098" t="11616" r="3014" b="11813">(Ramshaw</wd>

<space/>

<wd l="3077" t="11616" r="3389" b="11774">and</wd>

<space/>

<wd l="3442" t="11621" r="4138" b="11803">Marcus,</wd>

<space/>

<wd l="4229" t="11616" r="4757" b="11813">1995).</wd>

</ln>

</para>

<para l="1440" t="11894" r="5808" b="13450" alignment="justified" spaceBefore="11" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="11894" r="5794" b="12096" baseLine="12043" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="11894" r="1997" b="12053">The</wd>

<space/>

<wd l="2050" t="11894" r="2491" b="12053">basic</wd>

<space/>

<wd l="2558" t="11918" r="3235" b="12096">strategy</wd>

<space/>

<wd l="3288" t="11894" r="3619" b="12053">that</wd>

<space/>

<wd l="3667" t="11947" r="3922" b="12053">we</wd>

<space/>

<wd l="3979" t="11894" r="4459" b="12096">adopt</wd>

<space/>

<wd l="4512" t="11894" r="4886" b="12053">here</wd>

<space/>

<wd l="4939" t="11894" r="5074" b="12053">is</wd>

<space/>

<wd l="5136" t="11918" r="5304" b="12053">to</wd>

<space/>

<wd l="5362" t="11947" r="5794" b="12053">com-</wd>

</ln>

<ln l="1440" t="12163" r="5794" b="12365" baseLine="12317" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12163" r="1814" b="12322">bine</wd>

<space/>

<wd l="1930" t="12163" r="2194" b="12322">the</wd>

<space/>

<wd l="2314" t="12187" r="2870" b="12365">output</wd>

<space/>

<wd l="2986" t="12163" r="3178" b="12322">of</wd>

<space/>

<wd l="3278" t="12168" r="3715" b="12322">NER</wd>

<space/>

<wd l="3840" t="12163" r="4579" b="12322">software</wd>

<space/>

<wd l="4699" t="12163" r="5006" b="12322">and</wd>

<space/>

<wd l="5122" t="12163" r="5386" b="12322">the</wd>

<space/>

<wd l="5506" t="12168" r="5794" b="12317">KB</wd>

<space/>

</ln>

<ln l="1440" t="12437" r="5808" b="12638" baseLine="12586" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12437" r="2390" b="12638">knowledge</wd>

<space/>

<wd l="2496" t="12437" r="2688" b="12595">of</wd>

<space/>

<wd l="2774" t="12437" r="3043" b="12595">the</wd>

<space/>

<wd l="3149" t="12437" r="4387" b="12638">corresponding</wd>

<space/>

<wd l="4498" t="12437" r="4987" b="12638">entity</wd>

<space/>

<wd l="5088" t="12437" r="5808" b="12595">mention</wd>

<space/>

</ln>

<ln l="1445" t="12706" r="5794" b="12907" baseLine="12859" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="12706" r="2170" b="12864">detected</wd>

<space/>

<wd l="2280" t="12706" r="2491" b="12907">by</wd>

<space/>

<wd l="2606" t="12706" r="2875" b="12864">the</wd>

<space/>

<wd l="2986" t="12710" r="3254" b="12859">EL</wd>

<space/>

<wd l="3365" t="12706" r="3835" b="12907">using</wd>

<space/>

<wd l="3960" t="12706" r="4882" b="12907">supervised</wd>

<space/>

<wd l="4992" t="12706" r="5794" b="12864">machine-</wd>

</ln>

<ln l="1440" t="12979" r="5803" b="13181" baseLine="13128">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="12979" r="2198" b="13181">learning.</wd>

<space/>

<wd l="2458" t="12984" r="2741" b="13138">We</wd>

<space/>

<wd l="2861" t="12979" r="3326" b="13181">again</wd>

<space/>

<wd l="3442" t="13032" r="3730" b="13138">use</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3854" t="12979" r="4517" b="13138">random</wd>

<space/>

<wd l="4603" t="12984" r="5131" b="13181">forest</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5246" t="13032" r="5414" b="13138">as</wd>

<space/>

<wd l="5539" t="12979" r="5803" b="13138">the</wd>

<space/>

</run>

</ln>

<ln l="1440" t="13248" r="3912" b="13450" baseLine="13402" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13248" r="2962" b="13450">machine-learning</wd>

<space/>

<wd l="3024" t="13248" r="3912" b="13450">algorithm.</wd>

</ln>

</para>

<para l="1440" t="13493" r="5808" b="14270" alignment="justified" spaceBefore="7" spaceAfter="133" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="13493" r="5808" b="13690" baseLine="13676">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><wd l="1656" t="13536" r="1944" b="13690">We</wd>

<space/>

<wd l="1987" t="13584" r="2275" b="13690">use</wd>

<space/>

<wd l="2323" t="13531" r="3072" b="13690">Stanford</wd>

<space/>

</run>

<wd l="3110" t="13493" r="3624" b="13690"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">NER</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">4</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5"><space/>

<wd l="3682" t="13584" r="3850" b="13690">as</wd>

<space/>

<wd l="3902" t="13531" r="4166" b="13690">the</wd>

<space/>

<wd l="4210" t="13536" r="4646" b="13690">NER</wd>

<space/>

<wd l="4699" t="13531" r="5434" b="13690">software</wd>

<space/>

<wd l="5477" t="13531" r="5808" b="13690">that</wd>

<space/>

</run>

</ln>

<ln l="1445" t="13800" r="5794" b="14002" baseLine="13949" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1445" t="13800" r="2174" b="13958">achieves</wd>

<space/>

<wd l="2232" t="13800" r="3043" b="14002">relatively</wd>

<space/>

<wd l="3101" t="13800" r="3600" b="13958">better</wd>

<space/>

<wd l="3648" t="13800" r="4747" b="14002">performance</wd>

<space/>

<wd l="4800" t="13800" r="4973" b="13954">in</wd>

<space/>

<wd l="5021" t="13800" r="5285" b="13958">the</wd>

<space/>

<wd l="5338" t="13800" r="5794" b="13958">Twit-</wd>

</ln>

<ln l="1440" t="14069" r="5794" b="14270" baseLine="14222" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1440" t="14093" r="1675" b="14227">ter</wd>

<space/>

<wd l="1738" t="14074" r="2170" b="14227">NER</wd>

<space/>

<wd l="2237" t="14069" r="2587" b="14227">task</wd>

<space/>

<wd l="2654" t="14069" r="2822" b="14222">in</wd>

<space/>

<wd l="2894" t="14122" r="2990" b="14227">a</wd>

<space/>

<wd l="3048" t="14093" r="3586" b="14227">recent</wd>

<space/>

<wd l="3658" t="14069" r="4118" b="14270">study</wd>

<space/>

<wd l="4195" t="14069" r="5246" b="14270">(Derczynski</wd>

<space/>

<wd l="5323" t="14093" r="5477" b="14227">et</wd>

<space/>

<wd l="5544" t="14069" r="5794" b="14256">al.,</wd>

</ln>

</para>

<rulerline l="1437" t="14429" r="2640" b="14429" type="single" width="10" color="000000"/>

<para l="1440" t="14486" r="5299" b="14875" alignment="justified" spaceBefore="53" fli="216" lsp="exactly" lspExact="201" language="en">

<ln l="1699" t="14486" r="5299" b="14678" baseLine="14637">

<wd l="1699" t="14486" r="5299" b="14678"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">3</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">http://dumps.wikimedia.org/other/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><space/>

</run>

</ln>

<ln l="1440" t="14722" r="3048" b="14875" baseLine="14842" underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">

<wd l="1440" t="14722" r="3048" b="14875">pagecounts-raw/</wd>

</ln>

</para>

<para l="1450" t="14904" r="5299" b="15264" alignment="justified" spaceBefore="15" spaceAfter="12" fli="216" lsp="exactly" lspExact="201" language="en">

<ln l="1694" t="14904" r="5299" b="15096" baseLine="15055">

<wd l="1694" t="14904" r="5299" b="15096"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">4</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">http://nlp.stanford.edu/software/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><space/>

</run>

</ln>

<ln l="1450" t="15144" r="2832" b="15264" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">

<wd l="1450" t="15149" r="2832" b="15264">CRF-NER.shtml</wd>

</ln>

</para>

</column>

<column l="6144" t="1262" r="10531" b="15318">

<para l="6144" t="1320" r="10512" b="2880" alignment="justified" lsp="exactly" lspExact="270" language="en">

<ln l="6149" t="1320" r="10512" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="1320" r="6696" b="1517">2015).</wd>

<space/>

<wd l="6874" t="1325" r="7339" b="1507">Here,</wd>

<space/>

<wd l="7450" t="1373" r="7699" b="1478">we</wd>

<space/>

<wd l="7795" t="1320" r="8275" b="1522">adopt</wd>

<space/>

<wd l="8362" t="1344" r="8683" b="1478">two</wd>

<space/>

<wd l="8774" t="1320" r="9394" b="1478">models</wd>

<space/>

<wd l="9494" t="1320" r="9686" b="1478">of</wd>

<space/>

<wd l="9763" t="1320" r="10512" b="1478">Stanford</wd>

<space/>

</ln>

<ln l="6144" t="1594" r="10512" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1598" r="6581" b="1752">NER</wd>

<space/>

<wd l="6638" t="1618" r="6806" b="1752">to</wd>

<space/>

<wd l="6874" t="1594" r="7584" b="1752">enhance</wd>

<space/>

<wd l="7642" t="1594" r="7906" b="1752">the</wd>

<space/>

<wd l="7968" t="1594" r="9115" b="1795">performance:</wd>

<space/>

<wd l="9230" t="1598" r="9379" b="1790">1)</wd>

<space/>

<wd l="9446" t="1594" r="9710" b="1752">the</wd>

<space/>

<wd l="9782" t="1594" r="10512" b="1752">standard</wd>

<space/>

</ln>

<ln l="6144" t="1862" r="10502" b="2021" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1862" r="7070" b="2021">three-class</wd>

<space/>

<wd l="7166" t="1862" r="7709" b="2021">model</wd>

<space/>

<wd l="7800" t="1862" r="8338" b="2021">which</wd>

<space/>

<wd l="8424" t="1862" r="8558" b="2021">is</wd>

<space/>

<wd l="8659" t="1862" r="9408" b="2021">included</wd>

<space/>

<wd l="9499" t="1862" r="9667" b="2016">in</wd>

<space/>

<wd l="9754" t="1862" r="10022" b="2021">the</wd>

<space/>

<wd l="10118" t="1862" r="10502" b="2021">soft-</wd>

</ln>

<ln l="6144" t="2136" r="10502" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2189" r="6566" b="2294">ware</wd>

<space/>

<wd l="6638" t="2136" r="6950" b="2294">and</wd>

<space/>

<wd l="7022" t="2141" r="7186" b="2333">2)</wd>

<space/>

<wd l="7267" t="2189" r="7363" b="2294">a</wd>

<space/>

<wd l="7426" t="2136" r="7968" b="2294">model</wd>

<space/>

<wd l="8040" t="2136" r="8366" b="2294">that</wd>

<space/>

<wd l="8438" t="2136" r="8827" b="2294">does</wd>

<space/>

<wd l="8899" t="2160" r="9182" b="2294">not</wd>

<space/>

<wd l="9245" t="2189" r="9533" b="2294">use</wd>

<space/>

<wd l="9605" t="2136" r="10502" b="2338">capitaliza-</wd>

</ln>

<ln l="6144" t="2405" r="10502" b="2592" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2405" r="6485" b="2563">tion</wd>

<space/>

<wd l="6547" t="2458" r="6720" b="2563">as</wd>

<space/>

<wd l="6787" t="2458" r="6883" b="2563">a</wd>

<space/>

<wd l="6941" t="2405" r="7589" b="2592">feature,</wd>

<space/>

<wd l="7661" t="2405" r="7834" b="2558">in</wd>

<space/>

<wd l="7896" t="2405" r="8352" b="2563">order</wd>

<space/>

<wd l="8410" t="2429" r="8573" b="2563">to</wd>

<space/>

<wd l="8640" t="2405" r="9000" b="2563">deal</wd>

<space/>

<wd l="9062" t="2405" r="9451" b="2563">with</wd>

<space/>

<wd l="9509" t="2405" r="9773" b="2563">the</wd>

<space/>

<wd l="9830" t="2405" r="10502" b="2563">unrelia-</wd>

</ln>

<ln l="6144" t="2678" r="8952" b="2880" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2678" r="6605" b="2880">bility</wd>

<space/>

<wd l="6667" t="2678" r="6854" b="2837">of</wd>

<space/>

<wd l="6902" t="2678" r="8074" b="2880">capitalization</wd>

<space/>

<wd l="8126" t="2678" r="8299" b="2832">in</wd>

<space/>

<wd l="8352" t="2702" r="8952" b="2837">tweets.</wd>

</ln>

</para>

<para l="6144" t="2952" r="10512" b="5280" alignment="justified" spaceBefore="4" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="2952" r="10512" b="3154" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="2952" r="6701" b="3110">The</wd>

<space/>

<wd l="6768" t="2952" r="7330" b="3110">results</wd>

<space/>

<wd l="7406" t="2952" r="7598" b="3110">of</wd>

<space/>

<wd l="7646" t="2952" r="7915" b="3110">the</wd>

<space/>

<wd l="7978" t="2957" r="8414" b="3110">NER</wd>

<space/>

<wd l="8486" t="2952" r="8798" b="3110">and</wd>

<space/>

<wd l="8861" t="2952" r="9125" b="3110">the</wd>

<space/>

<wd l="9197" t="2957" r="9485" b="3106">KB</wd>

<space/>

<wd l="9557" t="2952" r="10512" b="3154">knowledge</wd>

<space/>

</ln>

<ln l="6149" t="3221" r="10507" b="3422" baseLine="3374" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="3221" r="6341" b="3379">of</wd>

<space/>

<wd l="6413" t="3221" r="6677" b="3379">the</wd>

<space/>

<wd l="6768" t="3221" r="8011" b="3422">corresponding</wd>

<space/>

<wd l="8102" t="3221" r="8592" b="3422">entity</wd>

<space/>

<wd l="8678" t="3221" r="9398" b="3379">mention</wd>

<space/>

<wd l="9485" t="3221" r="10210" b="3379">detected</wd>

<space/>

<wd l="10291" t="3221" r="10507" b="3422">by</wd>

<space/>

</ln>

<ln l="6144" t="3494" r="10507" b="3696" baseLine="3643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3494" r="6413" b="3653">the</wd>

<space/>

<wd l="6485" t="3499" r="6754" b="3648">EL</wd>

<space/>

<wd l="6826" t="3547" r="7085" b="3653">are</wd>

<space/>

<wd l="7162" t="3494" r="7560" b="3653">used</wd>

<space/>

<wd l="7637" t="3547" r="7805" b="3653">as</wd>

<space/>

<wd l="7882" t="3494" r="8150" b="3653">the</wd>

<space/>

<wd l="8222" t="3494" r="8909" b="3696">primary</wd>

<space/>

<wd l="8986" t="3494" r="10507" b="3696">machine-learning</wd>

<space/>

</ln>

<ln l="6144" t="3763" r="10502" b="3922" baseLine="3917" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3763" r="6878" b="3922">features.</wd>

<space/>

<wd l="7022" t="3768" r="7306" b="3922">We</wd>

<space/>

<wd l="7387" t="3763" r="7733" b="3922">also</wd>

<space/>

<wd l="7810" t="3763" r="8453" b="3922">include</wd>

<space/>

<wd l="8530" t="3763" r="9211" b="3922">features</wd>

<space/>

<wd l="9293" t="3763" r="9624" b="3922">that</wd>

<space/>

<wd l="9701" t="3816" r="9960" b="3922">are</wd>

<space/>

<wd l="10037" t="3763" r="10502" b="3922">tradi-</wd>

</ln>

<ln l="6144" t="4037" r="10502" b="4238" baseLine="4186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4037" r="6811" b="4238">tionally</wd>

<space/>

<wd l="6883" t="4037" r="7286" b="4195">used</wd>

<space/>

<wd l="7354" t="4037" r="7526" b="4190">in</wd>

<space/>

<wd l="7598" t="4042" r="8030" b="4195">NER</wd>

<space/>

<wd l="8112" t="4037" r="8506" b="4195">such</wd>

<space/>

<wd l="8578" t="4090" r="8750" b="4195">as</wd>

<space/>

<wd l="8827" t="4037" r="10090" b="4238">part-of-speech</wd>

<space/>

<wd l="10162" t="4061" r="10502" b="4238">tags</wd>

<space/>

</ln>

<ln l="6149" t="4306" r="10512" b="4507" baseLine="4459" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="4306" r="6461" b="4464">and</wd>

<space/>

<wd l="6538" t="4306" r="6802" b="4464">the</wd>

<space/>

<wd l="6888" t="4306" r="8059" b="4507">capitalization</wd>

<space/>

<wd l="8136" t="4306" r="8870" b="4464">features.</wd>

<space/>

<wd l="9014" t="4306" r="10152" b="4493">Furthermore,</wd>

<space/>

<wd l="10243" t="4306" r="10512" b="4464">the</wd>

<space/>

</ln>

<ln l="6144" t="4579" r="10507" b="4781" baseLine="4728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4579" r="6542" b="4738">ratio</wd>

<space/>

<wd l="6619" t="4579" r="6811" b="4738">of</wd>

<space/>

<wd l="6869" t="4579" r="7133" b="4738">the</wd>

<space/>

<wd l="7210" t="4579" r="8150" b="4781">capitalized</wd>

<space/>

<wd l="8222" t="4579" r="8746" b="4738">words</wd>

<space/>

<wd l="8822" t="4579" r="8995" b="4733">in</wd>

<space/>

<wd l="9062" t="4579" r="9331" b="4738">the</wd>

<space/>

<wd l="9398" t="4603" r="9874" b="4738">tweet</wd>

<space/>

<wd l="9946" t="4579" r="10080" b="4738">is</wd>

<space/>

<wd l="10166" t="4579" r="10507" b="4738">also</wd>

<space/>

</ln>

<ln l="6144" t="4848" r="10502" b="5050" baseLine="5002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4848" r="6547" b="5006">used</wd>

<space/>

<wd l="6619" t="4901" r="6787" b="5006">as</wd>

<space/>

<wd l="6869" t="4901" r="7066" b="5006">an</wd>

<space/>

<wd l="7142" t="4848" r="7920" b="5006">indicator</wd>

<space/>

<wd l="7987" t="4848" r="8179" b="5006">of</wd>

<space/>

<wd l="8237" t="4848" r="8501" b="5006">the</wd>

<space/>

<wd l="8573" t="4848" r="9418" b="5050">reliability</wd>

<space/>

<wd l="9494" t="4848" r="9686" b="5006">of</wd>

<space/>

<wd l="9739" t="4848" r="10003" b="5006">the</wd>

<space/>

<wd l="10080" t="4848" r="10502" b="5050">capi-</wd>

</ln>

<ln l="6144" t="5122" r="7003" b="5280" baseLine="5270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5122" r="7003" b="5280">talization.</wd>

</ln>

</para>

<para l="6149" t="5395" r="10502" b="5822" alignment="justified" spaceBefore="6" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="5395" r="10502" b="5597" baseLine="5544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="5395" r="6701" b="5554">The</wd>

<space/>

<wd l="6773" t="5395" r="8299" b="5597">machine-learning</wd>

<space/>

<wd l="8371" t="5395" r="9053" b="5554">features</wd>

<space/>

<wd l="9134" t="5395" r="9394" b="5554">for</wd>

<space/>

<wd l="9461" t="5395" r="9768" b="5554">this</wd>

<space/>

<wd l="9854" t="5419" r="10195" b="5597">step</wd>

<space/>

<wd l="10267" t="5395" r="10502" b="5549">in-</wd>

</ln>

<ln l="6149" t="5664" r="6662" b="5822" baseLine="5818" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="5664" r="6662" b="5822">clude:</wd>

</ln>

</para>

<para l="6384" t="6154" r="10526" b="6898" alignment="justified" li="432" spaceBefore="214" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="6154" r="10526" b="6312" baseLine="6300">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="6163" r="6576" b="6302">•</wd>

<tab position="6462"/>

<wd l="6576" t="6163" r="6840" b="6307">EL</wd>

<space/>

<wd l="6912" t="6154" r="7733" b="6312">relevance</wd>

<space/>

</run>

<wd l="7805" t="6154" r="8405" b="6312"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">score</run>

<run italic="true" underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">*</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8510" t="6154" r="8846" b="6312">The</wd>

<space/>

<wd l="8914" t="6154" r="9739" b="6312">relevance</wd>

<space/>

<wd l="9811" t="6206" r="10262" b="6312">score</wd>

<space/>

<wd l="10334" t="6154" r="10526" b="6312">of</wd>

<space/>

</run>

</ln>

<ln l="6581" t="6422" r="10502" b="6624" baseLine="6576" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="6422" r="6850" b="6581">the</wd>

<space/>

<wd l="6931" t="6422" r="7421" b="6624">entity</wd>

<space/>

<wd l="7502" t="6422" r="8218" b="6581">mention</wd>

<space/>

<wd l="8299" t="6422" r="9048" b="6624">assigned</wd>

<space/>

<wd l="9125" t="6422" r="9341" b="6624">by</wd>

<space/>

<wd l="9422" t="6422" r="9686" b="6581">the</wd>

<space/>

<wd l="9763" t="6422" r="10502" b="6624">previous</wd>

<space/>

</ln>

<ln l="6581" t="6696" r="7296" b="6898" baseLine="6845" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="6701" r="6850" b="6850">EL</wd>

<space/>

<wd l="6912" t="6720" r="7296" b="6898">step.</wd>

</ln>

</para>

<para l="6384" t="7061" r="10512" b="7810" alignment="justified" li="432" spaceBefore="99" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="7061" r="10502" b="7267" baseLine="7212">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="7075" r="6576" b="7214">•</wd>

<tab position="6462"/>

<wd l="6576" t="7066" r="6974" b="7224">Link</wd>

<space/>

</run>

<wd l="7013" t="7061" r="8131" b="7267"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">probability</run>

<run italic="true" underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">*</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8232" t="7066" r="8573" b="7224">The</wd>

<space/>

<wd l="8635" t="7066" r="9590" b="7267">probability</wd>

<space/>

<wd l="9662" t="7066" r="9854" b="7224">of</wd>

<space/>

<wd l="9902" t="7066" r="10166" b="7224">the</wd>

<space/>

<wd l="10238" t="7118" r="10502" b="7224">en-</wd>

</run>

</ln>

<ln l="6581" t="7334" r="10512" b="7536" baseLine="7488" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="7334" r="6869" b="7536">tity</wd>

<space/>

<wd l="6955" t="7334" r="7675" b="7493">mention</wd>

<space/>

<wd l="7762" t="7334" r="8611" b="7536">appearing</wd>

<space/>

<wd l="8707" t="7387" r="8875" b="7493">as</wd>

<space/>

<wd l="8971" t="7387" r="9168" b="7493">an</wd>

<space/>

<wd l="9259" t="7334" r="9854" b="7493">anchor</wd>

<space/>

<wd l="9931" t="7358" r="10258" b="7493">text</wd>

<space/>

<wd l="10339" t="7334" r="10512" b="7488">in</wd>

<space/>

</ln>

<ln l="6581" t="7608" r="7526" b="7810" baseLine="7757" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="7608" r="7526" b="7810">Wikipedia.</wd>

</ln>

</para>

<para l="6384" t="7973" r="10512" b="8717" alignment="justified" li="432" spaceBefore="99" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="7973" r="10507" b="8174" baseLine="8124">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="7978" r="6595" b="8126">•</wd>

<tab position="6467"/>

<wd l="6595" t="7973" r="7829" b="8174">Capitalization</wd>

<space/>

</run>

<wd l="7891" t="7973" r="9005" b="8174"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">probability</run>

<run italic="true" underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">*</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9134" t="7973" r="9475" b="8131">The</wd>

<space/>

<wd l="9552" t="7973" r="10507" b="8174">probability</wd>

<space/>

</run>

</ln>

<ln l="6586" t="8246" r="10512" b="8448" baseLine="8395" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="8246" r="6778" b="8405">of</wd>

<space/>

<wd l="6874" t="8246" r="7142" b="8405">the</wd>

<space/>

<wd l="7258" t="8246" r="7747" b="8448">entity</wd>

<space/>

<wd l="7862" t="8246" r="8578" b="8405">mention</wd>

<space/>

<wd l="8688" t="8246" r="9168" b="8448">being</wd>

<space/>

<wd l="9288" t="8246" r="10229" b="8448">capitalized</wd>

<space/>

<wd l="10339" t="8246" r="10512" b="8400">in</wd>

<space/>

</ln>

<ln l="6581" t="8515" r="7526" b="8717" baseLine="8669" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="8515" r="7526" b="8717">Wikipedia.</wd>

</ln>

</para>

<para l="6384" t="8885" r="10517" b="9629" alignment="justified" li="432" spaceBefore="94" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="8885" r="10517" b="9086" baseLine="9032">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="8894" r="6590" b="9034">•</wd>

<tab position="6462"/>

<wd l="6590" t="8885" r="6902" b="9043">The</wd>

<space/>

<wd l="6984" t="8885" r="7656" b="9043">number</wd>

<space/>

<wd l="7728" t="8890" r="7930" b="9086">of</wd>

<space/>

<wd l="7978" t="8885" r="8688" b="9043">inbound</wd>

<space/>

</run>

<wd l="8760" t="8885" r="9307" b="9043"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">links</run>

<run italic="true" underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">*</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9432" t="8885" r="9768" b="9043">The</wd>

<space/>

<wd l="9845" t="8885" r="10517" b="9043">number</wd>

<space/>

</run>

</ln>

<ln l="6586" t="9154" r="10507" b="9355" baseLine="9307" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="9154" r="6778" b="9312">of</wd>

<space/>

<wd l="6830" t="9154" r="7550" b="9312">inbound</wd>

<space/>

<wd l="7618" t="9154" r="8035" b="9312">links</wd>

<space/>

<wd l="8117" t="9154" r="8304" b="9312">of</wd>

<space/>

<wd l="8362" t="9154" r="8626" b="9312">the</wd>

<space/>

<wd l="8702" t="9154" r="9941" b="9355">corresponding</wd>

<space/>

<wd l="10018" t="9154" r="10507" b="9355">entity</wd>

<space/>

</ln>

<ln l="6581" t="9427" r="7752" b="9629" baseLine="9576" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="9427" r="6754" b="9581">in</wd>

<space/>

<wd l="6806" t="9427" r="7752" b="9629">Wikipedia.</wd>

</ln>

</para>

<para l="6384" t="9792" r="10512" b="10541" alignment="justified" li="432" spaceBefore="99" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="9792" r="10512" b="9998" baseLine="9943">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="9806" r="6590" b="9946">•</wd>

<tab position="6462"/>

<wd l="6590" t="9797" r="6902" b="9955">The</wd>

<space/>

<wd l="7070" t="9850" r="7762" b="9998">average</wd>

<space/>

<wd l="7906" t="9850" r="8342" b="9998">page</wd>

<space/>

</run>

<wd l="8506" t="9792" r="9043" b="9955"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">view</run>

<run italic="true" underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">*</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9341" t="9797" r="9677" b="9955">The</wd>

<space/>

<wd l="9845" t="9850" r="10512" b="9998">average</wd>

<space/>

</run>

</ln>

<ln l="6581" t="10066" r="10512" b="10267" baseLine="10219" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="10118" r="6994" b="10267">page</wd>

<space/>

<wd l="7118" t="10066" r="7531" b="10224">view</wd>

<space/>

<wd l="7661" t="10066" r="7853" b="10224">of</wd>

<space/>

<wd l="7963" t="10066" r="8227" b="10224">the</wd>

<space/>

<wd l="8357" t="10066" r="9595" b="10267">corresponding</wd>

<space/>

<wd l="9725" t="10066" r="10214" b="10267">entity</wd>

<space/>

<wd l="10339" t="10066" r="10512" b="10219">in</wd>

<space/>

</ln>

<ln l="6581" t="10339" r="7526" b="10541" baseLine="10488" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="10339" r="7526" b="10541">Wikipedia.</wd>

</ln>

</para>

<para l="6384" t="10704" r="10507" b="11405" alignment="justified" li="432" spaceBefore="99" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="10704" r="10502" b="10906" baseLine="10858">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="10714" r="6576" b="10858">•</wd>

<tab position="6465"/>

<wd l="6576" t="10714" r="6989" b="10862">NER</wd>

<space/>

<wd l="7075" t="10757" r="7483" b="10906">span</wd>

<space/>

</run>

<wd l="7565" t="10704" r="8141" b="10862"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">match</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8275" t="10704" r="8866" b="10906">Binary</wd>

<space/>

<wd l="8952" t="10704" r="9494" b="10862">values</wd>

<space/>

<wd l="9581" t="10704" r="9912" b="10862">that</wd>

<space/>

<wd l="9989" t="10757" r="10502" b="10906">repre-</wd>

</run>

</ln>

<ln l="6590" t="10978" r="10507" b="11179" baseLine="11126" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6590" t="11002" r="6936" b="11136">sent</wd>

<space/>

<wd l="6998" t="10978" r="7704" b="11136">whether</wd>

<space/>

<wd l="7766" t="10978" r="8030" b="11136">the</wd>

<space/>

<wd l="8098" t="11030" r="8731" b="11179">n-gram</wd>

<space/>

<wd l="8789" t="10978" r="8928" b="11136">is</wd>

<space/>

<wd l="9005" t="10978" r="9730" b="11136">detected</wd>

<space/>

<wd l="9792" t="10978" r="10008" b="11179">by</wd>

<space/>

<wd l="10075" t="10982" r="10507" b="11136">NER</wd>

<space/>

</ln>

<ln l="6581" t="11246" r="7258" b="11405" baseLine="11400" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="11246" r="7258" b="11405">models.</wd>

</ln>

</para>

<para l="6384" t="11616" r="10526" b="12360" alignment="justified" li="432" spaceBefore="94" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="11616" r="10526" b="11818" baseLine="11765">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="11626" r="6581" b="11765">•</wd>

<tab position="6462"/>

<wd l="6581" t="11616" r="7853" b="11818">Part-of-speech</wd>

<space/>

</run>

<wd l="7958" t="11650" r="8357" b="11818"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">tags</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8520" t="11616" r="9792" b="11818">Part-of-speech</wd>

<space/>

<wd l="9883" t="11640" r="10229" b="11818">tags</wd>

<space/>

<wd l="10334" t="11616" r="10526" b="11774">of</wd>

<space/>

</run>

</ln>

<ln l="6581" t="11890" r="10512" b="12091" baseLine="12038" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="11890" r="6850" b="12048">the</wd>

<space/>

<wd l="6902" t="11890" r="7694" b="12091">previous,</wd>

<space/>

<wd l="7766" t="11890" r="8141" b="12077">first,</wd>

<space/>

<wd l="8208" t="11890" r="8554" b="12077">last,</wd>

<space/>

<wd l="8626" t="11890" r="8938" b="12048">and</wd>

<space/>

<wd l="8995" t="11914" r="9370" b="12048">next</wd>

<space/>

<wd l="9422" t="11890" r="9946" b="12048">words</wd>

<space/>

<wd l="10013" t="11890" r="10205" b="12048">of</wd>

<space/>

<wd l="10243" t="11890" r="10512" b="12048">the</wd>

<space/>

</ln>

<ln l="6581" t="12158" r="7258" b="12360" baseLine="12307" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="12211" r="7258" b="12360">n-gram.</wd>

</ln>

</para>

<para l="6384" t="12528" r="10512" b="13272" alignment="justified" li="432" spaceBefore="99" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="12528" r="10512" b="12730" baseLine="12677">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6384" t="12533" r="6595" b="12677">•</wd>

<tab position="6465"/>

<wd l="6595" t="12533" r="7262" b="12686">Context</wd>

<space/>

</run>

<wd l="7373" t="12528" r="8611" b="12730"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">capitalization</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="8813" t="12528" r="9403" b="12730">Binary</wd>

<space/>

<wd l="9518" t="12528" r="10066" b="12686">values</wd>

<space/>

<wd l="10186" t="12528" r="10512" b="12686">that</wd>

<space/>

</run>

</ln>

<ln l="6581" t="12797" r="10512" b="12998" baseLine="12950" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="12821" r="7382" b="12998">represent</wd>

<space/>

<wd l="7430" t="12797" r="8136" b="12955">whether</wd>

<space/>

<wd l="8179" t="12797" r="8448" b="12955">the</wd>

<space/>

<wd l="8496" t="12797" r="9283" b="12998">previous,</wd>

<space/>

<wd l="9350" t="12797" r="9730" b="12984">first,</wd>

<space/>

<wd l="9787" t="12797" r="10133" b="12984">last,</wd>

<space/>

<wd l="10200" t="12797" r="10512" b="12955">and</wd>

<space/>

</ln>

<ln l="6581" t="13070" r="10147" b="13272" baseLine="13219" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="13094" r="6955" b="13229">next</wd>

<space/>

<wd l="7008" t="13070" r="7531" b="13229">words</wd>

<space/>

<wd l="7598" t="13070" r="7790" b="13229">of</wd>

<space/>

<wd l="7829" t="13070" r="8098" b="13229">the</wd>

<space/>

<wd l="8150" t="13123" r="8784" b="13272">n-gram</wd>

<space/>

<wd l="8842" t="13123" r="9101" b="13229">are</wd>

<space/>

<wd l="9163" t="13070" r="10147" b="13272">capitalized.</wd>

</ln>

</para>

<para l="6384" t="13435" r="10502" b="13910" alignment="justified" li="432" spaceBefore="97" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="13435" r="10502" b="13637" baseLine="13589">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="13440" r="6595" b="13589">•</wd>

<tab position="6467"/>

<wd l="6595" t="13435" r="7483" b="13594">Character</wd>

<space/>

</run>

<wd l="7546" t="13435" r="8131" b="13637"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">length</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8242" t="13435" r="8578" b="13594">The</wd>

<space/>

<wd l="8645" t="13435" r="9317" b="13594">number</wd>

<space/>

<wd l="9384" t="13435" r="9576" b="13594">of</wd>

<space/>

<wd l="9634" t="13435" r="10502" b="13594">characters</wd>

<space/>

</run>

</ln>

<ln l="6581" t="13709" r="9470" b="13910" baseLine="13858" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="13709" r="6960" b="13867">read</wd>

<space/>

<wd l="7013" t="13709" r="7181" b="13862">in</wd>

<space/>

<wd l="7238" t="13709" r="7502" b="13867">the</wd>

<space/>

<wd l="7565" t="13709" r="8184" b="13867">surface</wd>

<space/>

<wd l="8246" t="13709" r="8434" b="13867">of</wd>

<space/>

<wd l="8477" t="13709" r="8741" b="13867">the</wd>

<space/>

<wd l="8798" t="13762" r="9470" b="13910">n-gram.</wd>

</ln>

</para>

<para l="6384" t="14078" r="10512" b="14549" alignment="justified" li="432" spaceBefore="96" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="14078" r="10512" b="14280" baseLine="14227">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="14088" r="6590" b="14227">•</wd>

<tab position="6462"/>

<wd l="6590" t="14078" r="7090" b="14237">Token</wd>

<space/>

</run>

<wd l="7166" t="14078" r="7752" b="14280"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">length</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7867" t="14078" r="8203" b="14237">The</wd>

<space/>

<wd l="8275" t="14078" r="8942" b="14237">number</wd>

<space/>

<wd l="9014" t="14078" r="9206" b="14237">of</wd>

<space/>

<wd l="9259" t="14078" r="9821" b="14237">tokens</wd>

<space/>

<wd l="9898" t="14078" r="10272" b="14237">read</wd>

<space/>

<wd l="10339" t="14078" r="10512" b="14232">in</wd>

<space/>

</run>

</ln>

<ln l="6581" t="14347" r="7574" b="14549" baseLine="14496" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="14347" r="6850" b="14506">the</wd>

<space/>

<wd l="6902" t="14400" r="7574" b="14549">n-gram.</wd>

</ln>

</para>

<para l="6144" t="14832" r="10512" b="15307" alignment="justified" spaceBefore="221" fli="216" lsp="exactly" lspExact="265" language="en">

<ln l="6365" t="14832" r="10512" b="15034" baseLine="14984">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="14842" r="6787" b="14995">Note</wd>

<space/>

<wd l="6888" t="14837" r="7214" b="14995">that</wd>

<space/>

<wd l="7325" t="14890" r="7776" b="14995">some</wd>

<space/>

<wd l="7877" t="14837" r="8558" b="14995">features</wd>

<space/>

<wd l="8674" t="14837" r="9394" b="15034">(marked</wd>

<space/>

<wd l="9490" t="14837" r="9878" b="14995">with</wd>

<space/>

</run>

<wd l="9989" t="14832" r="10133" b="15034"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">*</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="10248" t="14890" r="10512" b="14995">are</wd>

<space/>

</run>

</ln>

<ln l="6144" t="15106" r="10502" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="15106" r="6643" b="15264">based</wd>

<space/>

<wd l="6725" t="15158" r="6936" b="15264">on</wd>

<space/>

<wd l="7018" t="15158" r="7214" b="15264">an</wd>

<space/>

<wd l="7296" t="15106" r="7786" b="15307">entity</wd>

<space/>

<wd l="7862" t="15106" r="8582" b="15264">mention</wd>

<space/>

<wd l="8659" t="15106" r="9384" b="15264">detected</wd>

<space/>

<wd l="9456" t="15106" r="9672" b="15307">by</wd>

<space/>

<wd l="9749" t="15110" r="10061" b="15293">EL,</wd>

<space/>

<wd l="10147" t="15106" r="10502" b="15264">thus</wd>

</ln>

</para>

</column>

</section>

<dd l="1437" t="15746" r="10531" b="15975">

<para l="5771" t="15792" r="6196" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15792" r="6130" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="28">

<wd l="5837" t="15792" r="6130" b="15946">138</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4320.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1406" marginTop="1252" marginRight="1315" marginBottom="1292" offsetX="8" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1406" t="1252" r="10594" b="15310">

<column l="1406" t="1252" r="5856" b="15310">

<para l="1440" t="1320" r="5794" b="1795" alignment="justified" spaceBefore="6" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="1320" r="5794" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1320" r="1886" b="1478">these</wd>

<space/>

<wd l="1954" t="1320" r="2635" b="1478">features</wd>

<space/>

<wd l="2712" t="1373" r="3010" b="1478">can</wd>

<space/>

<wd l="3077" t="1320" r="3283" b="1478">be</wd>

<space/>

<wd l="3346" t="1320" r="4022" b="1522">missing</wd>

<space/>

<wd l="4090" t="1320" r="4238" b="1474">if</wd>

<space/>

<wd l="4291" t="1320" r="4723" b="1478">there</wd>

<space/>

<wd l="4790" t="1320" r="4930" b="1478">is</wd>

<space/>

<wd l="5002" t="1373" r="5218" b="1478">no</wd>

<space/>

<wd l="5290" t="1373" r="5794" b="1478">corre-</wd>

</ln>

<ln l="1450" t="1594" r="5299" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="1594" r="2237" b="1795">sponding</wd>

<space/>

<wd l="2299" t="1594" r="2789" b="1795">entity</wd>

<space/>

<wd l="2846" t="1594" r="3562" b="1752">mention</wd>

<space/>

<wd l="3619" t="1594" r="4344" b="1752">detected</wd>

<space/>

<wd l="4397" t="1594" r="4613" b="1795">by</wd>

<space/>

<wd l="4670" t="1594" r="4934" b="1752">the</wd>

<space/>

<wd l="4992" t="1598" r="5299" b="1752">EL.</wd>

</ln>

</para>

<para l="1440" t="1877" r="5803" b="2621" alignment="justified" spaceBefore="13" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="1877" r="5794" b="2078" baseLine="2030" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="1882" r="1944" b="2035">We</wd>

<space/>

<wd l="2021" t="1877" r="2362" b="2035">also</wd>

<space/>

<wd l="2434" t="1877" r="3062" b="2035">resolve</wd>

<space/>

<wd l="3139" t="1877" r="3854" b="2078">overlaps</wd>

<space/>

<wd l="3941" t="1877" r="4133" b="2035">of</wd>

<space/>

<wd l="4186" t="1877" r="4978" b="2035">mentions</wd>

<space/>

<wd l="5059" t="1877" r="5270" b="2078">by</wd>

<space/>

<wd l="5347" t="1877" r="5794" b="2035">itera-</wd>

</ln>

<ln l="1440" t="2150" r="5803" b="2352" baseLine="2299" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2150" r="1925" b="2352">tively</wd>

<space/>

<wd l="1982" t="2150" r="2746" b="2352">selecting</wd>

<space/>

<wd l="2789" t="2150" r="3058" b="2309">the</wd>

<space/>

<wd l="3101" t="2150" r="3730" b="2352">longest</wd>

<space/>

<wd l="3778" t="2150" r="4267" b="2352">entity</wd>

<space/>

<wd l="4315" t="2150" r="5030" b="2309">mention</wd>

<space/>

<wd l="5074" t="2150" r="5501" b="2309">from</wd>

<space/>

<wd l="5539" t="2150" r="5803" b="2309">the</wd>

<space/>

</ln>

<ln l="1440" t="2419" r="3269" b="2621" baseLine="2568" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2419" r="2304" b="2621">beginning</wd>

<space/>

<wd l="2371" t="2419" r="2558" b="2578">of</wd>

<space/>

<wd l="2606" t="2472" r="2702" b="2578">a</wd>

<space/>

<wd l="2750" t="2443" r="3269" b="2578">tweet.</wd>

</ln>

</para>

<para l="1440" t="2885" r="5069" b="3043" alignment="left" spaceBefore="214" lsp="exactly" lspExact="257" language="en">

<ln l="1440" t="2885" r="5069" b="3043" baseLine="3034" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2885" r="1872" b="3043">2.3.2</wd>

<space/>

<wd l="2102" t="2885" r="3341" b="3043">Classification</wd>

<space/>

<wd l="3403" t="2885" r="3595" b="3043">of</wd>

<space/>

<wd l="3634" t="2890" r="4301" b="3043">Named</wd>

<space/>

<wd l="4354" t="2885" r="5069" b="3043">Entities</wd>

</ln>

</para>

<para l="1440" t="3230" r="5808" b="4786" alignment="justified" spaceBefore="68" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="3230" r="5808" b="3432" baseLine="3379" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="3235" r="1622" b="3384">In</wd>

<space/>

<wd l="1675" t="3230" r="1982" b="3389">this</wd>

<space/>

<wd l="2050" t="3254" r="2434" b="3432">step,</wd>

<space/>

<wd l="2501" t="3230" r="3226" b="3389">detected</wd>

<space/>

<wd l="3283" t="3230" r="3768" b="3432">entity</wd>

<space/>

<wd l="3826" t="3230" r="4618" b="3389">mentions</wd>

<space/>

<wd l="4680" t="3283" r="4939" b="3389">are</wd>

<space/>

<wd l="4997" t="3230" r="5808" b="3389">classified</wd>

<space/>

</ln>

<ln l="1440" t="3490" r="5794" b="3701" baseLine="3653">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="3499" r="1776" b="3658">into</wd>

<space/>

<wd l="1858" t="3499" r="2126" b="3658">the</wd>

<space/>

<wd l="2208" t="3499" r="3130" b="3701">predefined</wd>

<space/>

<wd l="3206" t="3523" r="3658" b="3701">types</wd>

<space/>

<wd l="3758" t="3499" r="4128" b="3696">(i.e.,</wd>

<space/>

</run>

<wd l="4238" t="3533" r="4939" b="3701"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">person</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

<wd l="5040" t="3490" r="5794" b="3701"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">geo-loc</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

</ln>

<ln l="1440" t="3758" r="5794" b="3974" baseLine="3922">

<wd l="1440" t="3763" r="2083" b="3974"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">facility</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

<wd l="2160" t="3763" r="2918" b="3974"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">product</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

<wd l="2990" t="3806" r="3912" b="3974"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">company</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

<wd l="3989" t="3763" r="4598" b="3960"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">movie</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

<wd l="4666" t="3778" r="5794" b="3974"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">sportsteam</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

</ln>

<ln l="1454" t="4032" r="5808" b="4243" baseLine="4195">

<wd l="1454" t="4032" r="2534" b="4229"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">musicartist</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

<wd l="2592" t="4032" r="3312" b="4229"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">tvshow</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="3374" t="4042" r="3686" b="4200">and</wd>

<space/>

</run>

<wd l="3739" t="4032" r="4296" b="4238"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">other</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="4354" t="4042" r="4819" b="4243">using</wd>

<space/>

<wd l="4882" t="4042" r="5808" b="4243">supervised</wd>

<space/>

</run>

</ln>

<ln l="1440" t="4315" r="5794" b="4517" baseLine="4464" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="4315" r="3010" b="4517">machine-learning.</wd>

<space/>

<wd l="3086" t="4320" r="3557" b="4502">Here,</wd>

<space/>

<wd l="3619" t="4315" r="4118" b="4474">linear</wd>

<space/>

<wd l="4176" t="4344" r="4824" b="4517">support</wd>

<space/>

<wd l="4872" t="4339" r="5419" b="4474">vector</wd>

<space/>

<wd l="5467" t="4368" r="5794" b="4474">ma-</wd>

</ln>

<ln l="1445" t="4584" r="5347" b="4786" baseLine="4733" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="4584" r="1910" b="4742">chine</wd>

<space/>

<wd l="1968" t="4584" r="2102" b="4742">is</wd>

<space/>

<wd l="2170" t="4584" r="2568" b="4742">used</wd>

<space/>

<wd l="2626" t="4637" r="2794" b="4742">as</wd>

<space/>

<wd l="2856" t="4584" r="3125" b="4742">the</wd>

<space/>

<wd l="3178" t="4584" r="4704" b="4786">machine-learning</wd>

<space/>

<wd l="4762" t="4584" r="5347" b="4742">model.</wd>

</ln>

</para>

<para l="1440" t="4867" r="5808" b="5885" alignment="justified" spaceBefore="10" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1661" t="4867" r="5803" b="5069" baseLine="5021" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="4872" r="2021" b="5026">One</wd>

<space/>

<wd l="2083" t="4867" r="2520" b="5026">main</wd>

<space/>

<wd l="2582" t="4867" r="4104" b="5069">machine-learning</wd>

<space/>

<wd l="4166" t="4867" r="4771" b="5026">feature</wd>

<space/>

<wd l="4838" t="4867" r="5030" b="5026">of</wd>

<space/>

<wd l="5078" t="4867" r="5386" b="5026">this</wd>

<space/>

<wd l="5462" t="4891" r="5803" b="5069">step</wd>

<space/>

</ln>

<ln l="1440" t="5141" r="5808" b="5342" baseLine="5290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5141" r="1579" b="5299">is</wd>

<space/>

<wd l="1680" t="5141" r="1944" b="5299">the</wd>

<space/>

<wd l="2045" t="5141" r="3283" b="5342">corresponding</wd>

<space/>

<wd l="3384" t="5141" r="3874" b="5342">entity</wd>

<space/>

<wd l="3970" t="5165" r="4421" b="5342">types</wd>

<space/>

<wd l="4522" t="5141" r="5290" b="5299">retrieved</wd>

<space/>

<wd l="5381" t="5141" r="5808" b="5299">from</wd>

<space/>

</ln>

<ln l="1445" t="5410" r="5794" b="5611" baseLine="5563" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="5414" r="1872" b="5568">KBs.</wd>

<space/>

<wd l="2002" t="5414" r="2285" b="5568">We</wd>

<space/>

<wd l="2362" t="5410" r="2904" b="5568">obtain</wd>

<space/>

<wd l="2981" t="5414" r="3269" b="5563">KB</wd>

<space/>

<wd l="3355" t="5410" r="3845" b="5611">entity</wd>

<space/>

<wd l="3917" t="5434" r="4373" b="5611">types</wd>

<space/>

<wd l="4450" t="5410" r="4877" b="5568">from</wd>

<space/>

<wd l="4949" t="5410" r="5213" b="5568">the</wd>

<space/>

<wd l="5290" t="5462" r="5794" b="5568">corre-</wd>

</ln>

<ln l="1450" t="5645" r="5352" b="5885" baseLine="5826">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="5683" r="2237" b="5885">sponding</wd>

<space/>

<wd l="2299" t="5683" r="2870" b="5842">entries</wd>

<space/>

<wd l="2933" t="5683" r="3101" b="5837">in</wd>

<space/>

</run>

<wd l="3154" t="5645" r="4003" b="5885"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">DBpedia</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">5</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4080" t="5683" r="4392" b="5842">and</wd>

<space/>

</run>

<wd l="4445" t="5645" r="5352" b="5842"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Freebase</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">6</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="5966" r="5818" b="10234" alignment="justified" spaceBefore="18" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1661" t="5966" r="5803" b="6168" baseLine="6115" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1661" t="5971" r="2021" b="6125">One</wd>

<space/>

<wd l="2069" t="5966" r="2798" b="6168">problem</wd>

<space/>

<wd l="2846" t="5966" r="3019" b="6120">in</wd>

<space/>

<wd l="3062" t="5966" r="3370" b="6125">this</wd>

<space/>

<wd l="3437" t="5990" r="3778" b="6168">step</wd>

<space/>

<wd l="3826" t="5966" r="3965" b="6125">is</wd>

<space/>

<wd l="4022" t="5966" r="4349" b="6125">that</wd>

<space/>

<wd l="4397" t="5966" r="4834" b="6125">there</wd>

<space/>

<wd l="4886" t="6019" r="5146" b="6125">are</wd>

<space/>

<wd l="5208" t="5966" r="5803" b="6125">several</wd>

<space/>

</ln>

<ln l="1445" t="6235" r="5794" b="6437" baseLine="6389" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="6235" r="1934" b="6437">entity</wd>

<space/>

<wd l="1997" t="6235" r="2789" b="6394">mentions</wd>

<space/>

<wd l="2851" t="6235" r="3182" b="6394">that</wd>

<space/>

<wd l="3245" t="6259" r="3821" b="6394">cannot</wd>

<space/>

<wd l="3878" t="6235" r="4085" b="6394">be</wd>

<space/>

<wd l="4147" t="6235" r="4872" b="6394">detected</wd>

<space/>

<wd l="4925" t="6235" r="5141" b="6437">by</wd>

<space/>

<wd l="5203" t="6240" r="5472" b="6389">EL</wd>

<space/>

<wd l="5525" t="6235" r="5794" b="6394">be-</wd>

</ln>

<ln l="1445" t="6509" r="5803" b="6710" baseLine="6658" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="6562" r="1925" b="6667">cause</wd>

<space/>

<wd l="1973" t="6509" r="2160" b="6667">of</wd>

<space/>

<wd l="2189" t="6509" r="2818" b="6667">various</wd>

<space/>

<wd l="2870" t="6562" r="3514" b="6667">reasons</wd>

<space/>

<wd l="3576" t="6514" r="3998" b="6710">(e.g.,</wd>

<space/>

<wd l="4056" t="6562" r="4152" b="6667">a</wd>

<space/>

<wd l="4190" t="6509" r="5270" b="6667">non-existent</wd>

<space/>

<wd l="5314" t="6509" r="5803" b="6710">entity</wd>

<space/>

</ln>

<ln l="1440" t="6778" r="5794" b="6979" baseLine="6931" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="6778" r="1613" b="6931">in</wd>

<space/>

<wd l="1685" t="6778" r="1954" b="6936">the</wd>

<space/>

<wd l="2035" t="6782" r="2376" b="6965">KB,</wd>

<space/>

<wd l="2467" t="6830" r="2669" b="6936">an</wd>

<space/>

<wd l="2750" t="6830" r="3178" b="6936">error</wd>

<space/>

<wd l="3250" t="6778" r="4224" b="6979">performing</wd>

<space/>

<wd l="4306" t="6782" r="4690" b="6974">EL).</wd>

<space/>

<wd l="4776" t="6782" r="4958" b="6931">In</wd>

<space/>

<wd l="5040" t="6778" r="5794" b="6965">addition,</wd>

<space/>

</ln>

<ln l="1450" t="7051" r="5808" b="7253" baseLine="7200" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1450" t="7104" r="1901" b="7210">some</wd>

<space/>

<wd l="1954" t="7051" r="2482" b="7210">minor</wd>

<space/>

<wd l="2534" t="7051" r="3154" b="7210">entities</wd>

<space/>

<wd l="3216" t="7051" r="3725" b="7253">might</wd>

<space/>

<wd l="3778" t="7075" r="4061" b="7210">not</wd>

<space/>

<wd l="4114" t="7051" r="4517" b="7210">have</wd>

<space/>

<wd l="4574" t="7051" r="5064" b="7253">entity</wd>

<space/>

<wd l="5122" t="7075" r="5573" b="7253">types</wd>

<space/>

<wd l="5635" t="7051" r="5808" b="7205">in</wd>

<space/>

</ln>

<ln l="1440" t="7320" r="5803" b="7522" baseLine="7469" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="7320" r="1704" b="7478">the</wd>

<space/>

<wd l="1786" t="7325" r="2213" b="7478">KBs.</wd>

<space/>

<wd l="2357" t="7325" r="2539" b="7474">In</wd>

<space/>

<wd l="2616" t="7320" r="3077" b="7478">order</wd>

<space/>

<wd l="3149" t="7344" r="3317" b="7478">to</wd>

<space/>

<wd l="3398" t="7320" r="3754" b="7478">deal</wd>

<space/>

<wd l="3835" t="7320" r="4224" b="7478">with</wd>

<space/>

<wd l="4296" t="7320" r="4603" b="7478">this</wd>

<space/>

<wd l="4690" t="7320" r="5458" b="7522">problem,</wd>

<space/>

<wd l="5549" t="7373" r="5803" b="7478">we</wd>

<space/>

</ln>

<ln l="1445" t="7594" r="5808" b="7795" baseLine="7742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="7594" r="1781" b="7752">first</wd>

<space/>

<wd l="1834" t="7594" r="2477" b="7752">include</wd>

<space/>

<wd l="2530" t="7594" r="2794" b="7752">the</wd>

<space/>

<wd l="2856" t="7594" r="3346" b="7795">entity</wd>

<space/>

<wd l="3403" t="7618" r="3854" b="7795">types</wd>

<space/>

<wd l="3917" t="7594" r="4728" b="7795">predicted</wd>

<space/>

<wd l="4781" t="7594" r="4997" b="7795">by</wd>

<space/>

<wd l="5059" t="7594" r="5808" b="7752">Stanford</wd>

<space/>

</ln>

<ln l="1440" t="7862" r="5794" b="8064" baseLine="8011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="7867" r="1877" b="8021">NER</wd>

<space/>

<wd l="1939" t="7915" r="2112" b="8021">as</wd>

<space/>

<wd l="2179" t="7862" r="2914" b="8021">features.</wd>

<space/>

<wd l="3005" t="7867" r="3826" b="8050">However,</wd>

<space/>

<wd l="3898" t="7862" r="4589" b="8021">because</wd>

<space/>

<wd l="4646" t="7862" r="4915" b="8021">the</wd>

<space/>

<wd l="4973" t="7886" r="5467" b="8064">target</wd>

<space/>

<wd l="5530" t="7915" r="5794" b="8021">en-</wd>

</ln>

<ln l="1440" t="8131" r="5808" b="8333" baseLine="8285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="8131" r="1728" b="8333">tity</wd>

<space/>

<wd l="1814" t="8155" r="2266" b="8333">types</wd>

<space/>

<wd l="2362" t="8131" r="2554" b="8290">of</wd>

<space/>

<wd l="2626" t="8184" r="2914" b="8290">our</wd>

<space/>

<wd l="2990" t="8131" r="3346" b="8290">task</wd>

<space/>

<wd l="3432" t="8131" r="3643" b="8290">do</wd>

<space/>

<wd l="3725" t="8155" r="4008" b="8290">not</wd>

<space/>

<wd l="4094" t="8131" r="4752" b="8333">directly</wd>

<space/>

<wd l="4843" t="8131" r="5808" b="8333">correspond</wd>

<space/>

</ln>

<ln l="1440" t="8395" r="5794" b="8606" baseLine="8554">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="8429" r="1608" b="8563">to</wd>

<space/>

<wd l="1670" t="8405" r="1939" b="8563">the</wd>

<space/>

<wd l="2006" t="8458" r="2390" b="8563">ones</wd>

<space/>

<wd l="2467" t="8405" r="2938" b="8606">given</wd>

<space/>

<wd l="3000" t="8405" r="3168" b="8558">in</wd>

<space/>

<wd l="3235" t="8405" r="3984" b="8563">Stanford</wd>

<space/>

<wd l="4042" t="8410" r="4478" b="8563">NER</wd>

<space/>

<wd l="4550" t="8405" r="4925" b="8602">(i.e.,</wd>

<space/>

</run>

<wd l="5011" t="8395" r="5794" b="8592"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">location</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

</run>

</ln>

<ln l="1450" t="8664" r="5818" b="8875" baseLine="8827">

<wd l="1450" t="8707" r="2150" b="8875"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">person</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="2261" t="8674" r="2573" b="8832">and</wd>

<space/>

</run>

<wd l="2659" t="8664" r="3960" b="8875"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">organization</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">),</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="4061" t="8674" r="4330" b="8832">the</wd>

<space/>

<wd l="4421" t="8674" r="5530" b="8832">effectiveness</wd>

<space/>

<wd l="5630" t="8674" r="5818" b="8832">of</wd>

<space/>

</run>

</ln>

<ln l="1440" t="8947" r="5803" b="9149" baseLine="9096" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="8947" r="1886" b="9106">these</wd>

<space/>

<wd l="1949" t="8947" r="2630" b="9106">features</wd>

<space/>

<wd l="2698" t="8947" r="2837" b="9106">is</wd>

<space/>

<wd l="2909" t="8947" r="3758" b="9149">obviously</wd>

<space/>

<wd l="3821" t="8947" r="4483" b="9106">limited.</wd>

<space/>

<wd l="4574" t="8947" r="5477" b="9134">Therefore,</wd>

<space/>

<wd l="5549" t="9000" r="5803" b="9106">we</wd>

<space/>

</ln>

<ln l="1440" t="9216" r="5808" b="9418" baseLine="9370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9216" r="2266" b="9374">introduce</wd>

<space/>

<wd l="2347" t="9216" r="3005" b="9374">another</wd>

<space/>

<wd l="3082" t="9240" r="3456" b="9418">type</wd>

<space/>

<wd l="3542" t="9216" r="3730" b="9374">of</wd>

<space/>

<wd l="3797" t="9216" r="4402" b="9374">feature</wd>

<space/>

<wd l="4483" t="9216" r="4982" b="9374">based</wd>

<space/>

<wd l="5064" t="9269" r="5280" b="9374">on</wd>

<space/>

<wd l="5362" t="9216" r="5808" b="9374">word</wd>

<space/>

</ln>

<ln l="1445" t="9490" r="5794" b="9691" baseLine="9638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="9490" r="2539" b="9691">embeddings.</wd>

<space/>

<wd l="2616" t="9494" r="2918" b="9648">For</wd>

<space/>

<wd l="2966" t="9490" r="3326" b="9677">this,</wd>

<space/>

<wd l="3394" t="9542" r="3643" b="9648">we</wd>

<space/>

<wd l="3701" t="9542" r="3989" b="9648">use</wd>

<space/>

<wd l="4046" t="9490" r="4598" b="9648">GloVe</wd>

<space/>

<wd l="4651" t="9490" r="5098" b="9648">word</wd>

<space/>

<wd l="5155" t="9490" r="5794" b="9648">embed-</wd>

</ln>

<ln l="1445" t="9730" r="5818" b="9960" baseLine="9908">

<wd l="1445" t="9730" r="1987" b="9960"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">dings</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">7</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="2059" t="9782" r="2227" b="9917">to</wd>

<space/>

<wd l="2290" t="9758" r="3058" b="9917">calculate</wd>

<space/>

<wd l="3120" t="9811" r="3317" b="9917">an</wd>

<space/>

<wd l="3384" t="9811" r="4046" b="9960">average</wd>

<space/>

<wd l="4104" t="9782" r="4651" b="9917">vector</wd>

<space/>

<wd l="4709" t="9758" r="4901" b="9917">of</wd>

<space/>

<wd l="4939" t="9782" r="5558" b="9917">vectors</wd>

<space/>

<wd l="5630" t="9758" r="5818" b="9917">of</wd>

<space/>

</run>

</ln>

<ln l="1440" t="10032" r="3302" b="10234" baseLine="10181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="10032" r="1963" b="10190">words</wd>

<space/>

<wd l="2026" t="10032" r="2198" b="10186">in</wd>

<space/>

<wd l="2251" t="10085" r="2885" b="10234">n-gram</wd>

<space/>

<wd l="2933" t="10056" r="3302" b="10190">text.</wd>

</ln>

</para>

<para l="1440" t="10315" r="5808" b="11870" alignment="justified" spaceBefore="11" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="10315" r="5803" b="10517" baseLine="10464" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="10320" r="1944" b="10474">We</wd>

<space/>

<wd l="1997" t="10315" r="2342" b="10474">also</wd>

<space/>

<wd l="2395" t="10315" r="3034" b="10474">include</wd>

<space/>

<wd l="3086" t="10315" r="3350" b="10474">the</wd>

<space/>

<wd l="3403" t="10315" r="4224" b="10474">relevance</wd>

<space/>

<wd l="4286" t="10368" r="4738" b="10474">score</wd>

<space/>

<wd l="4790" t="10315" r="5539" b="10517">assigned</wd>

<space/>

<wd l="5587" t="10315" r="5803" b="10517">by</wd>

<space/>

</ln>

<ln l="1440" t="10584" r="5803" b="10786" baseLine="10738" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10584" r="1704" b="10742">the</wd>

<space/>

<wd l="1781" t="10584" r="2520" b="10786">previous</wd>

<space/>

<wd l="2602" t="10589" r="2870" b="10738">EL</wd>

<space/>

<wd l="2952" t="10608" r="3288" b="10786">step</wd>

<space/>

<wd l="3365" t="10584" r="3696" b="10742">that</wd>

<space/>

<wd l="3768" t="10584" r="4536" b="10742">indicates</wd>

<space/>

<wd l="4618" t="10584" r="4882" b="10742">the</wd>

<space/>

<wd l="4958" t="10584" r="5803" b="10786">reliability</wd>

<space/>

</ln>

<ln l="1445" t="10858" r="5808" b="11059" baseLine="11006" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="10858" r="1637" b="11016">of</wd>

<space/>

<wd l="1685" t="10858" r="1954" b="11016">the</wd>

<space/>

<wd l="2021" t="10862" r="2309" b="11011">KB</wd>

<space/>

<wd l="2390" t="10858" r="2880" b="11059">entity</wd>

<space/>

<wd l="2947" t="10882" r="3398" b="11059">types</wd>

<space/>

<wd l="3470" t="10882" r="3638" b="11016">to</wd>

<space/>

<wd l="3706" t="10858" r="3970" b="11016">the</wd>

<space/>

<wd l="4037" t="10858" r="4627" b="11016">model.</wd>

<space/>

<wd l="4733" t="10858" r="5074" b="11016">The</wd>

<space/>

<wd l="5141" t="10858" r="5808" b="11016">number</wd>

<space/>

</ln>

<ln l="1445" t="11126" r="5794" b="11285" baseLine="11280" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="11126" r="1637" b="11285">of</wd>

<space/>

<wd l="1704" t="11126" r="2227" b="11285">words</wd>

<space/>

<wd l="2318" t="11126" r="2630" b="11285">and</wd>

<space/>

<wd l="2707" t="11126" r="2976" b="11285">the</wd>

<space/>

<wd l="3053" t="11126" r="3725" b="11285">number</wd>

<space/>

<wd l="3806" t="11126" r="3998" b="11285">of</wd>

<space/>

<wd l="4066" t="11126" r="4939" b="11285">characters</wd>

<space/>

<wd l="5026" t="11126" r="5198" b="11280">in</wd>

<space/>

<wd l="5275" t="11126" r="5544" b="11285">the</wd>

<space/>

<wd l="5626" t="11179" r="5794" b="11280">n-</wd>

</ln>

<ln l="1445" t="11400" r="5803" b="11602" baseLine="11549" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="11453" r="1891" b="11602">gram</wd>

<space/>

<wd l="1949" t="11424" r="2270" b="11558">text</wd>

<space/>

<wd l="2333" t="11453" r="2597" b="11558">are</wd>

<space/>

<wd l="2659" t="11400" r="3000" b="11558">also</wd>

<space/>

<wd l="3062" t="11400" r="3816" b="11558">included</wd>

<space/>

<wd l="3878" t="11453" r="4046" b="11558">as</wd>

<space/>

<wd l="4114" t="11400" r="4795" b="11558">features</wd>

<space/>

<wd l="4862" t="11424" r="5030" b="11558">to</wd>

<space/>

<wd l="5098" t="11400" r="5803" b="11558">enhance</wd>

<space/>

</ln>

<ln l="1440" t="11669" r="5366" b="11870" baseLine="11818" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11669" r="1704" b="11827">the</wd>

<space/>

<wd l="1766" t="11669" r="3038" b="11870">expressiveness</wd>

<space/>

<wd l="3106" t="11669" r="3298" b="11827">of</wd>

<space/>

<wd l="3341" t="11722" r="3634" b="11827">our</wd>

<space/>

<wd l="3682" t="11669" r="4224" b="11827">model</wd>

<space/>

<wd l="4286" t="11722" r="4685" b="11827">even</wd>

<space/>

<wd l="4738" t="11669" r="5366" b="11827">further.</wd>

</ln>

</para>

<para l="1445" t="11952" r="5794" b="12384" alignment="justified" spaceBefore="14" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="11952" r="5794" b="12154" baseLine="12106" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="11952" r="1997" b="12110">The</wd>

<space/>

<wd l="2069" t="11952" r="3590" b="12154">machine-learning</wd>

<space/>

<wd l="3667" t="11952" r="4349" b="12110">features</wd>

<space/>

<wd l="4430" t="11952" r="4685" b="12110">for</wd>

<space/>

<wd l="4752" t="11952" r="5059" b="12110">this</wd>

<space/>

<wd l="5150" t="11976" r="5486" b="12154">step</wd>

<space/>

<wd l="5563" t="11952" r="5794" b="12106">in-</wd>

</ln>

<ln l="1445" t="12226" r="1954" b="12384" baseLine="12374" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="12226" r="1954" b="12384">clude:</wd>

</ln>

</para>

<para l="1675" t="12754" r="5803" b="13224" alignment="justified" li="432" spaceBefore="260" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="12754" r="5803" b="12955" baseLine="12902">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1675" t="12763" r="1877" b="12902">•</wd>

<tab position="1753"/>

<wd l="1877" t="12763" r="2150" b="12907">KB</wd>

<space/>

<wd l="2208" t="12763" r="2688" b="12955">entity</wd>

<space/>

</run>

<wd l="2736" t="12787" r="3226" b="12955"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">types</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="3307" t="12754" r="3643" b="12912">The</wd>

<space/>

<wd l="3696" t="12754" r="4186" b="12955">entity</wd>

<space/>

<wd l="4234" t="12778" r="4690" b="12955">types</wd>

<space/>

<wd l="4742" t="12754" r="4915" b="12907">in</wd>

<space/>

<wd l="4963" t="12758" r="5390" b="12912">KBs.</wd>

<space/>

<wd l="5467" t="12754" r="5803" b="12912">The</wd>

<space/>

</run>

</ln>

<ln l="1882" t="13022" r="5486" b="13224" baseLine="13176" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1882" t="13027" r="2256" b="13181">KBs</wd>

<space/>

<wd l="2318" t="13022" r="2722" b="13181">used</wd>

<space/>

<wd l="2774" t="13022" r="3413" b="13181">include</wd>

<space/>

<wd l="3470" t="13022" r="4248" b="13224">DBpedia</wd>

<space/>

<wd l="4306" t="13022" r="4618" b="13181">and</wd>

<space/>

<wd l="4670" t="13022" r="5486" b="13181">Freebase.</wd>

</ln>

</para>

<para l="1675" t="13411" r="5808" b="13843" alignment="justified" li="432" spaceBefore="116" spaceAfter="104" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="13411" r="5798" b="13613" baseLine="13560">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1675" t="13421" r="1872" b="13560">•</wd>

<tab position="1753"/>

<wd l="1872" t="13421" r="2285" b="13570">NER</wd>

<space/>

<wd l="2342" t="13411" r="3077" b="13570">detected</wd>

<space/>

</run>

<wd l="3130" t="13445" r="3533" b="13613"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">type</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3619" t="13411" r="3955" b="13570">The</wd>

<space/>

<wd l="4018" t="13411" r="4738" b="13570">detected</wd>

<space/>

<wd l="4800" t="13411" r="5285" b="13613">entity</wd>

<space/>

<wd l="5347" t="13435" r="5798" b="13613">types</wd>

<space/>

</run>

</ln>

<ln l="1882" t="13685" r="5808" b="13843" baseLine="13834" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="13685" r="2074" b="13843">of</wd>

<space/>

<wd l="2122" t="13685" r="2386" b="13843">the</wd>

<space/>

<wd l="2448" t="13690" r="2885" b="13843">NER</wd>

<space/>

<wd l="2947" t="13685" r="3533" b="13843">model.</wd>

<space/>

<wd l="3634" t="13690" r="3869" b="13843">As</wd>

<space/>

<wd l="3936" t="13685" r="4858" b="13843">mentioned</wd>

<space/>

<wd l="4920" t="13685" r="5093" b="13838">in</wd>

<space/>

<wd l="5155" t="13685" r="5808" b="13843">Section</wd>

</ln>

</para>

<rulerline l="1406" t="14016" r="2640" b="14016" type="single" width="10" color="000000"/>

<para l="1450" t="14064" r="5510" b="14462" alignment="left" ri="360" spaceBefore="54" fli="216" lsp="exactly" lspExact="199" language="en">

<ln l="1694" t="14064" r="5510" b="14261" baseLine="14224">

<wd l="1694" t="14064" r="5510" b="14261"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="-1">5</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1">http://mappings.dbpedia.org/server/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1"><space/>

</run>

</ln>

<ln l="1450" t="14309" r="3254" b="14462" baseLine="14424" underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1">

<wd l="1450" t="14309" r="3254" b="14462">ontology/classes/</wd>

</ln>

</para>

<para l="1694" t="14482" r="5410" b="14678" alignment="left" li="216" spaceBefore="22" lsp="exactly" lspExact="199" language="en">

<ln l="1694" t="14482" r="5410" b="14678" baseLine="14642">

<wd l="1694" t="14482" r="5410" b="14678"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">6</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">http://wiki.freebase.com/wiki/Type</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1450" t="14702" r="5803" b="15293" alignment="justified" ri="72" spaceBefore="11" spaceAfter="13" fli="216" lsp="exactly" lspExact="200" language="en">

<ln l="1694" t="14702" r="5803" b="14904" baseLine="14854">

<wd l="1694" t="14702" r="1997" b="14866"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">7</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">We</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2098" t="14774" r="2338" b="14866">use</wd>

<space/>

<wd l="2438" t="14736" r="2654" b="14866">the</wd>

<space/>

<wd l="2765" t="14736" r="3965" b="14866">300-dimensional</wd>

<space/>

<wd l="4066" t="14736" r="4512" b="14866">model</wd>

<space/>

<wd l="4622" t="14736" r="5318" b="14904">generated</wd>

<space/>

<wd l="5414" t="14736" r="5803" b="14904">using</wd>

<space/>

</run>

</ln>

<ln l="1450" t="14933" r="5765" b="15106" baseLine="15058">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="14938" r="1819" b="15067">840B</wd>

<space/>

<wd l="1886" t="14938" r="2347" b="15067">tokens</wd>

<space/>

<wd l="2414" t="14938" r="3029" b="15067">obtained</wd>

<space/>

<wd l="3086" t="14938" r="3432" b="15067">from</wd>

<space/>

<wd l="3494" t="14938" r="4594" b="15067">CommonCrawl</wd>

<space/>

<wd l="4651" t="14976" r="5165" b="15106">corpus.</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><wd l="5270" t="14952" r="5765" b="15096">http:</wd>

<space/>

</run>

</ln>

<ln l="1459" t="15139" r="5083" b="15293" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">

<wd l="1459" t="15139" r="5083" b="15293">//nlp.stanford.edu/projects/glove/</wd>

</ln>

</para>

</column>

<column l="6144" t="1252" r="10594" b="15310">

<table l="6144" t="1262" r="10594" b="2904" alignment="left" spaceBefore="10" spaceAfter="157">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>1498</gridCol>

<gridCol>1056</gridCol>

<gridCol>931</gridCol>

<gridCol>965</gridCol>

<gridRow>278</gridRow>

<gridRow>250</gridRow>

<gridRow>274</gridRow>

<gridRow>268</gridRow>

<gridRow>269</gridRow>

<gridRow>303</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6293" t="1301" r="7502" b="1502" alignment="centered" spaceAfter="18" lsp="exactly" lspExact="246" language="en">

<ln l="6293" t="1301" r="7502" b="1502" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6293" t="1306" r="6931" b="1502">System</wd>

<space/>

<wd l="6984" t="1306" r="7502" b="1459">Name</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7766" t="1301" r="8578" b="1459" alignment="centered" spaceAfter="18" lsp="exactly" lspExact="246" language="en">

<ln l="7766" t="1301" r="8578" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="7766" t="1301" r="8578" b="1459">Precision</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8890" t="1301" r="9446" b="1459" alignment="centered" spaceAfter="18" lsp="exactly" lspExact="246" language="en">

<ln l="8890" t="1301" r="9446" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8890" t="1301" r="9446" b="1459">Recall</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="10003" t="1301" r="10210" b="1454" alignment="centered" spaceAfter="18" lsp="exactly" lspExact="246" language="en">

<ln l="10003" t="1301" r="10210" b="1454" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-8">

<wd l="10003" t="1306" r="10210" b="1454">F1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="6365" t="1574" r="7435" b="1738" alignment="centered" lsp="exactly" lspExact="245" language="en">

<ln l="6365" t="1574" r="7435" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6365" t="1584" r="6701" b="1738">Our</wd>

<space/>

<wd l="6754" t="1579" r="7435" b="1738">Method</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="7814" t="1574" r="8501" b="1738" alignment="left" lsp="exactly" lspExact="245" language="en">

<tabs position="7814"/>

<ln l="7814" t="1574" r="8501" b="1738" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-8">

<wd l="7814" t="1579" r="8501" b="1738">72.20%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="8822" t="1574" r="9499" b="1738" alignment="left" lsp="exactly" lspExact="245" language="en">

<tabs position="8822"/>

<ln l="8822" t="1574" r="9499" b="1738" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-10">

<wd l="8822" t="1579" r="9499" b="1738">69.14%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="9763" t="1579" r="10445" b="1738" alignment="left" lsp="exactly" lspExact="245" language="en">

<tabs position="9763"/>

<ln l="9763" t="1579" r="10445" b="1738" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-9">

<wd l="9763" t="1579" r="10445" b="1738">70.63%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<para l="6451" t="1853" r="7334" b="2011" alignment="centered" lsp="exactly" lspExact="269" language="en">

<ln l="6451" t="1853" r="7334" b="2011" baseLine="2002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6451" t="1858" r="7334" b="2011">NLANGP</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<para l="7838" t="1848" r="8496" b="2011" alignment="left" lsp="exactly" lspExact="269" language="en">

<tabs position="7838"/>

<ln l="7838" t="1848" r="8496" b="2011" baseLine="2002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7838" t="1853" r="8496" b="2011">67.74%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<para l="8837" t="1853" r="9499" b="2011" alignment="left" lsp="exactly" lspExact="269" language="en">

<tabs position="8837"/>

<ln l="8837" t="1853" r="9499" b="2011" baseLine="2002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="8837" t="1853" r="9499" b="2011">54.31%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<para l="9787" t="1853" r="10445" b="2011" alignment="left" lsp="exactly" lspExact="269" language="en">

<tabs position="9787"/>

<ln l="9787" t="1853" r="10445" b="2011" baseLine="2002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="9787" t="1853" r="10445" b="2011">60.29%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<para l="6614" t="2122" r="7171" b="2280" alignment="centered" lsp="exactly" lspExact="254" language="en">

<ln l="6614" t="2122" r="7171" b="2280" baseLine="2270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6614" t="2126" r="7171" b="2280">USFD</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<para l="7838" t="2122" r="8496" b="2280" alignment="left" lsp="exactly" lspExact="254" language="en">

<tabs position="7838"/>

<ln l="7838" t="2122" r="8496" b="2280" baseLine="2270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7838" t="2122" r="8496" b="2280">63.81%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<para l="8837" t="2122" r="9499" b="2280" alignment="left" lsp="exactly" lspExact="254" language="en">

<tabs position="8837"/>

<ln l="8837" t="2122" r="9499" b="2280" baseLine="2270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="8837" t="2122" r="9499" b="2280">56.28%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<para l="9787" t="2122" r="10445" b="2280" alignment="left" lsp="exactly" lspExact="254" language="en">

<tabs position="9787"/>

<ln l="9787" t="2122" r="10445" b="2280" baseLine="2270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="9787" t="2122" r="10445" b="2280">59.81%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<para l="6264" t="2390" r="7522" b="2549" alignment="centered" lsp="exactly" lspExact="260" language="en">

<ln l="6264" t="2390" r="7522" b="2549" baseLine="2544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6264" t="2390" r="7522" b="2549">multimedialab</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<para l="7838" t="2390" r="8496" b="2549" alignment="left" lsp="exactly" lspExact="260" language="en">

<tabs position="7838"/>

<ln l="7838" t="2390" r="8496" b="2549" baseLine="2544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7838" t="2390" r="8496" b="2549">62.93%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<para l="8837" t="2390" r="9499" b="2549" alignment="left" lsp="exactly" lspExact="260" language="en">

<tabs position="8837"/>

<ln l="8837" t="2390" r="9499" b="2549" baseLine="2544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="8837" t="2390" r="9499" b="2549">55.22%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<para l="9787" t="2390" r="10445" b="2549" alignment="left" lsp="exactly" lspExact="260" language="en">

<tabs position="9787"/>

<ln l="9787" t="2390" r="10445" b="2549" baseLine="2544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="9787" t="2390" r="10445" b="2549">58.82%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="6758" t="2683" r="7027" b="2822" alignment="centered" spaceAfter="23" lsp="exactly" lspExact="270" language="en">

<ln l="6758" t="2683" r="7027" b="2822" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6758" t="2717" r="7027" b="2822">nrc</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="7838" t="2664" r="8496" b="2822" alignment="left" spaceAfter="23" lsp="exactly" lspExact="270" language="en">

<tabs position="7838"/>

<ln l="7838" t="2664" r="8496" b="2822" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7838" t="2664" r="8496" b="2822">62.13%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="8837" t="2664" r="9499" b="2822" alignment="left" spaceAfter="23" lsp="exactly" lspExact="270" language="en">

<tabs position="8837"/>

<ln l="8837" t="2664" r="9499" b="2822" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="8837" t="2664" r="9499" b="2822">54.61%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="9787" t="2664" r="10445" b="2822" alignment="left" spaceAfter="23" lsp="exactly" lspExact="270" language="en">

<tabs position="9787"/>

<ln l="9787" t="2664" r="10445" b="2822" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="9787" t="2664" r="10445" b="2822">58.13%</wd>

</ln>

</para>

</cell>

</table>

<para l="6144" t="3120" r="10512" b="3595" alignment="justified" ri="72" lsp="exactly" lspExact="269" language="en">

<ln l="6144" t="3120" r="10512" b="3322" baseLine="3274" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3120" r="6624" b="3278">Table</wd>

<space/>

<wd l="6706" t="3125" r="6835" b="3278">1:</wd>

<space/>

<wd l="6926" t="3120" r="8117" b="3278">Performances</wd>

<space/>

<wd l="8189" t="3120" r="8381" b="3278">of</wd>

<space/>

<wd l="8424" t="3120" r="8688" b="3278">the</wd>

<space/>

<wd l="8746" t="3120" r="9547" b="3322">proposed</wd>

<space/>

<wd l="9614" t="3144" r="10286" b="3322">systems</wd>

<space/>

<wd l="10358" t="3144" r="10512" b="3278">at</wd>

<space/>

</ln>

<ln l="6154" t="3394" r="7824" b="3595" baseLine="3542" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="3394" r="7147" b="3595">segmenting</wd>

<space/>

<wd l="7210" t="3394" r="7824" b="3552">entities</wd>

</ln>

</para>

<para l="6581" t="4061" r="10502" b="4488" alignment="justified" li="432" ri="72" spaceBefore="399" lsp="exactly" lspExact="271" language="en">

<ln l="6586" t="4061" r="10502" b="4248" baseLine="4210" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="4066" r="7061" b="4248">2.3.1,</wd>

<space/>

<wd l="7157" t="4114" r="7411" b="4219">we</wd>

<space/>

<wd l="7488" t="4114" r="7776" b="4219">use</wd>

<space/>

<wd l="7858" t="4085" r="8179" b="4219">two</wd>

<space/>

<wd l="8266" t="4061" r="9005" b="4219">different</wd>

<space/>

<wd l="9082" t="4061" r="9706" b="4219">models</wd>

<space/>

<wd l="9797" t="4061" r="9989" b="4219">of</wd>

<space/>

<wd l="10056" t="4066" r="10502" b="4219">Stan-</wd>

</ln>

<ln l="6581" t="4330" r="7478" b="4488" baseLine="4483" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="4330" r="6946" b="4488">ford</wd>

<space/>

<wd l="6998" t="4334" r="7478" b="4488">NER.</wd>

</ln>

</para>

<para l="6384" t="4694" r="10512" b="5712" alignment="justified" li="432" ri="72" spaceBefore="92" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="4694" r="10512" b="4896" baseLine="4848">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="4704" r="6576" b="4848">•</wd>

<tab position="6465"/>

<wd l="6576" t="4704" r="7253" b="4896">N-gram</wd>

<space/>

</run>

<wd l="7373" t="4728" r="7963" b="4853"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">vector</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8165" t="4694" r="8506" b="4853">The</wd>

<space/>

<wd l="8621" t="4718" r="9168" b="4853">vector</wd>

<space/>

<wd l="9274" t="4694" r="10512" b="4896">representation</wd>

<space/>

</run>

</ln>

<ln l="6586" t="4968" r="10502" b="5170" baseLine="5117" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="4968" r="6778" b="5126">of</wd>

<space/>

<wd l="6840" t="4968" r="7104" b="5126">the</wd>

<space/>

<wd l="7186" t="5021" r="7814" b="5170">n-gram</wd>

<space/>

<wd l="7896" t="4968" r="8539" b="5126">derived</wd>

<space/>

<wd l="8611" t="4968" r="9082" b="5170">using</wd>

<space/>

<wd l="9163" t="4968" r="9427" b="5126">the</wd>

<space/>

<wd l="9504" t="4968" r="10162" b="5126">method</wd>

<space/>

<wd l="10238" t="5021" r="10502" b="5126">ex-</wd>

</ln>

<ln l="6581" t="5237" r="10512" b="5438" baseLine="5390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="5237" r="7224" b="5438">plained</wd>

<space/>

<wd l="7315" t="5237" r="7824" b="5395">above</wd>

<space/>

<wd l="7910" t="5237" r="8222" b="5395">and</wd>

<space/>

<wd l="8309" t="5237" r="9024" b="5395">includes</wd>

<space/>

<wd l="9125" t="5237" r="9518" b="5395">each</wd>

<space/>

<wd l="9605" t="5237" r="10512" b="5395">dimension</wd>

<space/>

</ln>

<ln l="6586" t="5510" r="9542" b="5712" baseLine="5659" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="5510" r="6778" b="5669">of</wd>

<space/>

<wd l="6816" t="5510" r="7085" b="5669">the</wd>

<space/>

<wd l="7138" t="5534" r="7685" b="5669">vector</wd>

<space/>

<wd l="7742" t="5563" r="7910" b="5669">as</wd>

<space/>

<wd l="7978" t="5563" r="8074" b="5669">a</wd>

<space/>

<wd l="8131" t="5534" r="8837" b="5712">separate</wd>

<space/>

<wd l="8894" t="5510" r="9542" b="5669">feature.</wd>

</ln>

</para>

<para l="6384" t="5875" r="10502" b="6346" alignment="justified" li="432" ri="72" spaceBefore="97" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="5875" r="10502" b="6034" baseLine="6024">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="5885" r="6576" b="6024">•</wd>

<tab position="6462"/>

<wd l="6576" t="5885" r="6840" b="6029">EL</wd>

<space/>

<wd l="6912" t="5875" r="7738" b="6034">relevance</wd>

<space/>

</run>

<wd l="7810" t="5928" r="8318" b="6034"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">score</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8429" t="5875" r="8765" b="6034">The</wd>

<space/>

<wd l="8837" t="5875" r="9658" b="6034">relevance</wd>

<space/>

<wd l="9739" t="5928" r="10186" b="6034">score</wd>

<space/>

<wd l="10262" t="5928" r="10502" b="6034">as-</wd>

</run>

</ln>

<ln l="6590" t="6144" r="9317" b="6346" baseLine="6298" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6590" t="6144" r="7152" b="6346">signed</wd>

<space/>

<wd l="7205" t="6144" r="7421" b="6346">by</wd>

<space/>

<wd l="7478" t="6144" r="7742" b="6302">the</wd>

<space/>

<wd l="7800" t="6144" r="8539" b="6346">previous</wd>

<space/>

<wd l="8602" t="6149" r="8870" b="6298">EL</wd>

<space/>

<wd l="8933" t="6168" r="9317" b="6346">step.</wd>

</ln>

</para>

<para l="6384" t="6509" r="10502" b="6984" alignment="justified" li="432" ri="72" spaceBefore="91" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="6509" r="10502" b="6710" baseLine="6662">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="6514" r="6595" b="6662">•</wd>

<tab position="6467"/>

<wd l="6595" t="6509" r="7483" b="6667">Character</wd>

<space/>

</run>

<wd l="7546" t="6509" r="8131" b="6710"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">length</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8242" t="6509" r="8578" b="6667">The</wd>

<space/>

<wd l="8645" t="6509" r="9317" b="6667">number</wd>

<space/>

<wd l="9384" t="6509" r="9576" b="6667">of</wd>

<space/>

<wd l="9634" t="6509" r="10502" b="6667">characters</wd>

<space/>

</run>

</ln>

<ln l="6581" t="6782" r="8611" b="6984" baseLine="6931" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="6782" r="6960" b="6941">read</wd>

<space/>

<wd l="7013" t="6782" r="7181" b="6936">in</wd>

<space/>

<wd l="7238" t="6782" r="7502" b="6941">the</wd>

<space/>

<wd l="7555" t="6835" r="8189" b="6984">n-gram</wd>

<space/>

<wd l="8242" t="6806" r="8611" b="6941">text.</wd>

</ln>

</para>

<para l="6384" t="7147" r="10512" b="7618" alignment="justified" li="432" ri="72" spaceBefore="92" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="7147" r="10512" b="7349" baseLine="7296">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="7157" r="6590" b="7296">•</wd>

<tab position="6462"/>

<wd l="6590" t="7147" r="7090" b="7306">Token</wd>

<space/>

</run>

<wd l="7166" t="7147" r="7752" b="7349"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">length</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7867" t="7147" r="8203" b="7306">The</wd>

<space/>

<wd l="8275" t="7147" r="8942" b="7306">number</wd>

<space/>

<wd l="9014" t="7147" r="9206" b="7306">of</wd>

<space/>

<wd l="9259" t="7147" r="9821" b="7306">tokens</wd>

<space/>

<wd l="9898" t="7147" r="10272" b="7306">read</wd>

<space/>

<wd l="10339" t="7147" r="10512" b="7301">in</wd>

<space/>

</run>

</ln>

<ln l="6581" t="7416" r="7574" b="7618" baseLine="7565" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="7416" r="6850" b="7574">the</wd>

<space/>

<wd l="6902" t="7469" r="7574" b="7618">n-gram.</wd>

</ln>

</para>

<para l="6144" t="7886" r="7800" b="8107" alignment="left" ri="72" spaceBefore="220" lsp="exactly" lspExact="274" language="en">

<ln l="6144" t="7886" r="7800" b="8107" baseLine="8054" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="12">

<wd l="6144" t="7886" r="6259" b="8059">3</wd>

<space/>

<wd l="6504" t="7886" r="7800" b="8107">Experiments</wd>

</ln>

</para>

<para l="6144" t="8328" r="8491" b="8530" alignment="left" ri="72" spaceBefore="166" lsp="exactly" lspExact="257" language="en">

<ln l="6144" t="8328" r="8491" b="8530" baseLine="8477" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="8328" r="6408" b="8486">3.1</wd>

<space/>

<wd l="6638" t="8328" r="7906" b="8530">Experimental</wd>

<space/>

<wd l="7968" t="8328" r="8491" b="8530">Setup</wd>

</ln>

</para>

<para l="6144" t="8678" r="10517" b="10234" alignment="justified" ri="72" spaceBefore="78" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="8678" r="10512" b="8880" baseLine="8832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="8683" r="6365" b="8837">To</wd>

<space/>

<wd l="6466" t="8678" r="6864" b="8837">train</wd>

<space/>

<wd l="6960" t="8731" r="7253" b="8837">our</wd>

<space/>

<wd l="7339" t="8678" r="8141" b="8880">proposed</wd>

<space/>

<wd l="8232" t="8683" r="8501" b="8832">EL</wd>

<space/>

<wd l="8592" t="8678" r="9288" b="8866">method,</wd>

<space/>

<wd l="9403" t="8731" r="9658" b="8837">we</wd>

<space/>

<wd l="9754" t="8678" r="10152" b="8837">used</wd>

<space/>

<wd l="10243" t="8678" r="10512" b="8837">the</wd>

<space/>

</ln>

<ln l="6144" t="8952" r="10502" b="9154" baseLine="9101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="8952" r="7229" b="9154">#Microposts</wd>

<space/>

<wd l="7306" t="8952" r="7723" b="9110">2015</wd>

<space/>

<wd l="7800" t="8957" r="8069" b="9106">EL</wd>

<space/>

<wd l="8136" t="8952" r="8741" b="9110">dataset</wd>

<space/>

<wd l="8813" t="8952" r="9379" b="9149">(Rizzo</wd>

<space/>

<wd l="9451" t="8976" r="9605" b="9110">et</wd>

<space/>

<wd l="9672" t="8952" r="9926" b="9139">al.,</wd>

<space/>

<wd l="10008" t="8952" r="10502" b="9149">2015)</wd>

<space/>

</ln>

<ln l="6144" t="9221" r="10502" b="9403" baseLine="9374">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="9221" r="6475" b="9379">that</wd>

<space/>

<wd l="6552" t="9221" r="7267" b="9379">contains</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7349" t="9226" r="7843" b="9403">3,998</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7915" t="9245" r="8467" b="9379">tweets</wd>

<space/>

<wd l="8554" t="9221" r="8866" b="9379">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8938" t="9226" r="9427" b="9403">3,993</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="9509" t="9221" r="10502" b="9379">annotations</wd>

<space/>

</run>

</ln>

<ln l="6149" t="9456" r="10512" b="9696" baseLine="9639">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6149" t="9494" r="6341" b="9653">of</wd>

<space/>

</run>

<wd l="6408" t="9456" r="7157" b="9653"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">entities.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">8</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="7306" t="9494" r="7642" b="9653">The</wd>

<space/>

<wd l="7718" t="9494" r="8818" b="9696">performance</wd>

<space/>

<wd l="8899" t="9494" r="9091" b="9653">of</wd>

<space/>

<wd l="9154" t="9547" r="9446" b="9653">our</wd>

<space/>

<wd l="9514" t="9499" r="9782" b="9648">EL</wd>

<space/>

<wd l="9854" t="9494" r="10512" b="9653">method</wd>

<space/>

</run>

</ln>

<ln l="6144" t="9763" r="10517" b="9965" baseLine="9912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="9763" r="6614" b="9965">using</wd>

<space/>

<wd l="6662" t="9763" r="6970" b="9922">this</wd>

<space/>

<wd l="7022" t="9763" r="7862" b="9965">particular</wd>

<space/>

<wd l="7910" t="9763" r="8510" b="9922">dataset</wd>

<space/>

<wd l="8554" t="9763" r="8693" b="9922">is</wd>

<space/>

<wd l="8746" t="9763" r="9475" b="9965">reported</wd>

<space/>

<wd l="9518" t="9763" r="9691" b="9917">in</wd>

<space/>

<wd l="9744" t="9763" r="10517" b="9960">(Yamada</wd>

<space/>

</ln>

<ln l="6149" t="10037" r="7229" b="10234" baseLine="10186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="10061" r="6307" b="10195">et</wd>

<space/>

<wd l="6365" t="10037" r="6614" b="10224">al.,</wd>

<space/>

<wd l="6682" t="10037" r="7229" b="10234">2015).</wd>

</ln>

</para>

<para l="6144" t="10306" r="10512" b="11050" alignment="justified" ri="72" spaceBefore="31" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="10306" r="10512" b="10493" baseLine="10459" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="10310" r="6667" b="10464">For</wd>

<space/>

<wd l="6744" t="10306" r="7051" b="10464">this</wd>

<space/>

<wd l="7147" t="10306" r="7709" b="10464">shared</wd>

<space/>

<wd l="7786" t="10306" r="8179" b="10493">task,</wd>

<space/>

<wd l="8275" t="10358" r="8530" b="10464">we</wd>

<space/>

<wd l="8606" t="10306" r="9216" b="10464">trained</wd>

<space/>

<wd l="9298" t="10306" r="9610" b="10464">and</wd>

<space/>

<wd l="9691" t="10306" r="10512" b="10464">evaluated</wd>

<space/>

</ln>

<ln l="6149" t="10579" r="10502" b="10781" baseLine="10728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="10632" r="6442" b="10738">our</wd>

<space/>

<wd l="6509" t="10579" r="7310" b="10781">proposed</wd>

<space/>

<wd l="7382" t="10579" r="8011" b="10738">Twitter</wd>

<space/>

<wd l="8078" t="10584" r="8510" b="10738">NER</wd>

<space/>

<wd l="8587" t="10579" r="9058" b="10781">using</wd>

<space/>

<wd l="9130" t="10579" r="9398" b="10738">the</wd>

<space/>

<wd l="9475" t="10579" r="10075" b="10738">dataset</wd>

<space/>

<wd l="10147" t="10632" r="10502" b="10781">pro-</wd>

</ln>

<ln l="6144" t="10814" r="8270" b="11050" baseLine="10995">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="10848" r="6634" b="11006">vided</wd>

<space/>

<wd l="6686" t="10848" r="6898" b="11050">by</wd>

<space/>

<wd l="6960" t="10848" r="7224" b="11006">the</wd>

<space/>

</run>

<wd l="7277" t="10814" r="8270" b="11050"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">workshop.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">9</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="11304" r="7310" b="11462" alignment="left" ri="72" spaceBefore="171" lsp="exactly" lspExact="257" language="en">

<ln l="6144" t="11304" r="7310" b="11462" baseLine="11453" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">

<wd l="6144" t="11304" r="6413" b="11462">3.2</wd>

<space/>

<wd l="6643" t="11309" r="7310" b="11462">Results</wd>

</ln>

</para>

<para l="6144" t="11659" r="10512" b="12672" alignment="justified" ri="72" spaceBefore="77" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="11659" r="10512" b="11861" baseLine="11808" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11659" r="6624" b="11818">Table</wd>

<space/>

<wd l="6763" t="11664" r="6826" b="11813">1</wd>

<space/>

<wd l="6970" t="11659" r="7493" b="11818">shows</wd>

<space/>

<wd l="7613" t="11659" r="7882" b="11818">the</wd>

<space/>

<wd l="7992" t="11659" r="8554" b="11818">results</wd>

<space/>

<wd l="8683" t="11659" r="8870" b="11818">of</wd>

<space/>

<wd l="8971" t="11659" r="9235" b="11818">the</wd>

<space/>

<wd l="9360" t="11659" r="10512" b="11861">segmentation</wd>

<space/>

</ln>

<ln l="6144" t="11928" r="10502" b="12130" baseLine="12077" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11928" r="6499" b="12086">task</wd>

<space/>

<wd l="6600" t="11928" r="6792" b="12086">of</wd>

<space/>

<wd l="6874" t="11928" r="7138" b="12086">the</wd>

<space/>

<wd l="7243" t="11928" r="7555" b="12086">five</wd>

<space/>

<wd l="7656" t="11928" r="8669" b="12130">top-ranking</wd>

<space/>

<wd l="8779" t="11952" r="9504" b="12130">systems.</wd>

<space/>

<wd l="9715" t="11933" r="10056" b="12086">Our</wd>

<space/>

<wd l="10147" t="11981" r="10502" b="12130">pro-</wd>

</ln>

<ln l="6144" t="12202" r="10502" b="12403" baseLine="12350" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12202" r="6658" b="12403">posed</wd>

<space/>

<wd l="6744" t="12202" r="7397" b="12360">method</wd>

<space/>

<wd l="7493" t="12202" r="8558" b="12403">significantly</wd>

<space/>

<wd l="8654" t="12202" r="9710" b="12403">outperforms</wd>

<space/>

<wd l="9806" t="12202" r="10070" b="12360">the</wd>

<space/>

<wd l="10171" t="12254" r="10502" b="12360">sec-</wd>

</ln>

<ln l="6149" t="12470" r="9048" b="12672" baseLine="12619" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="12470" r="6475" b="12629">ond</wd>

<space/>

<wd l="6528" t="12470" r="7118" b="12629">ranked</wd>

<space/>

<wd l="7171" t="12470" r="7829" b="12629">method</wd>

<space/>

<wd l="7882" t="12470" r="8098" b="12672">by</wd>

<space/>

<wd l="8179" t="12475" r="8712" b="12629">10.3%</wd>

<space/>

<wd l="8774" t="12475" r="9048" b="12629">F1.</wd>

</ln>

</para>

<para l="6144" t="12744" r="10512" b="14299" alignment="justified" ri="72" spaceBefore="1" spaceAfter="110" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="12744" r="10512" b="12946" baseLine="12893" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="12744" r="6701" b="12902">The</wd>

<space/>

<wd l="6778" t="12744" r="7723" b="12902">end-to-end</wd>

<space/>

<wd l="7790" t="12744" r="8352" b="12902">results</wd>

<space/>

<wd l="8443" t="12744" r="8894" b="12941">(both</wd>

<space/>

<wd l="8976" t="12744" r="10128" b="12946">segmentation</wd>

<space/>

<wd l="10200" t="12744" r="10512" b="12902">and</wd>

<space/>

</ln>

<ln l="6149" t="13013" r="10502" b="13214" baseLine="13166" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13013" r="7286" b="13171">classification</wd>

<space/>

<wd l="7382" t="13013" r="7882" b="13210">tasks)</wd>

<space/>

<wd l="7992" t="13013" r="8184" b="13171">of</wd>

<space/>

<wd l="8266" t="13013" r="8530" b="13171">the</wd>

<space/>

<wd l="8635" t="13013" r="8947" b="13171">five</wd>

<space/>

<wd l="9043" t="13013" r="10061" b="13214">top-ranking</wd>

<space/>

<wd l="10171" t="13066" r="10502" b="13214">sys-</wd>

</ln>

<ln l="6144" t="13286" r="10502" b="13488" baseLine="13435" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13310" r="6552" b="13445">tems</wd>

<space/>

<wd l="6624" t="13339" r="6883" b="13445">are</wd>

<space/>

<wd l="6950" t="13286" r="7507" b="13445">shown</wd>

<space/>

<wd l="7565" t="13286" r="7738" b="13440">in</wd>

<space/>

<wd l="7795" t="13286" r="8275" b="13445">Table</wd>

<space/>

<wd l="8338" t="13291" r="8486" b="13445">2.</wd>

<space/>

<wd l="8582" t="13291" r="9048" b="13474">Here,</wd>

<space/>

<wd l="9125" t="13339" r="9413" b="13445">our</wd>

<space/>

<wd l="9470" t="13286" r="10128" b="13445">method</wd>

<space/>

<wd l="10195" t="13286" r="10502" b="13488">sig-</wd>

</ln>

<ln l="6144" t="13555" r="10512" b="13757" baseLine="13709" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13555" r="6965" b="13757">nificantly</wd>

<space/>

<wd l="7046" t="13555" r="8098" b="13757">outperforms</wd>

<space/>

<wd l="8179" t="13555" r="8443" b="13714">the</wd>

<space/>

<wd l="8525" t="13555" r="9125" b="13714">second</wd>

<space/>

<wd l="9192" t="13555" r="9787" b="13714">ranked</wd>

<space/>

<wd l="9854" t="13555" r="10512" b="13714">method</wd>

<space/>

</ln>

<ln l="6144" t="13829" r="10502" b="14030" baseLine="13978" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13829" r="6360" b="14030">by</wd>

<space/>

<wd l="6432" t="13829" r="6869" b="13987">5.0%</wd>

<space/>

<wd l="6941" t="13834" r="7214" b="13987">F1.</wd>

<space/>

<wd l="7315" t="13829" r="7790" b="13987">Table</wd>

<space/>

<wd l="7858" t="13834" r="7949" b="13987">3</wd>

<space/>

<wd l="8030" t="13829" r="8371" b="13987">also</wd>

<space/>

<wd l="8438" t="13853" r="9144" b="14030">presents</wd>

<space/>

<wd l="9221" t="13829" r="9907" b="13987">detailed</wd>

<space/>

<wd l="9974" t="13882" r="10502" b="13987">scores</wd>

<space/>

</ln>

<ln l="6144" t="14098" r="8664" b="14299" baseLine="14246" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14098" r="6749" b="14256">broken</wd>

<space/>

<wd l="6806" t="14098" r="7286" b="14256">down</wd>

<space/>

<wd l="7339" t="14098" r="7550" b="14299">by</wd>

<space/>

<wd l="7618" t="14098" r="8102" b="14299">entity</wd>

<space/>

<wd l="8160" t="14122" r="8664" b="14299">types.</wd>

</ln>

</para>

<rulerline l="6144" t="14429" r="7344" b="14429" type="single" width="10" color="000000"/>

<para l="6149" t="14486" r="10502" b="14885" alignment="justified" ri="72" spaceBefore="64" fli="216" lsp="exactly" lspExact="201" language="en">

<ln l="6403" t="14486" r="10502" b="14688" baseLine="14638">

<wd l="6403" t="14486" r="6701" b="14650"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">8</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">We</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6763" t="14558" r="6998" b="14650">use</wd>

<space/>

<wd l="7061" t="14520" r="7277" b="14650">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7344" t="14525" r="7910" b="14683">training</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7978" t="14520" r="8232" b="14650">and</wd>

<space/>

<wd l="8290" t="14520" r="8506" b="14650">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8568" t="14520" r="8808" b="14650">dev</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8875" t="14539" r="9072" b="14650">set</wd>

<space/>

<wd l="9134" t="14520" r="9288" b="14650">of</wd>

<space/>

<wd l="9336" t="14520" r="9552" b="14650">the</wd>

<space/>

<wd l="9614" t="14520" r="10502" b="14688">#Microposts</wd>

<space/>

</run>

</ln>

<ln l="6149" t="14717" r="8486" b="14885" baseLine="14842" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="14717" r="6494" b="14846">2015</wd>

<space/>

<wd l="6552" t="14717" r="7051" b="14846">dataset</wd>

<space/>

<wd l="7094" t="14755" r="7234" b="14846">as</wd>

<space/>

<wd l="7286" t="14717" r="7502" b="14846">the</wd>

<space/>

<wd l="7550" t="14717" r="8102" b="14885">training</wd>

<space/>

<wd l="8155" t="14717" r="8486" b="14846">data.</wd>

</ln>

</para>

<para l="6144" t="14904" r="10502" b="15302" alignment="justified" ri="72" spaceBefore="15" spaceAfter="1" fli="216" lsp="exactly" lspExact="201" language="en">

<ln l="6398" t="14904" r="10502" b="15091" baseLine="15056">

<wd l="6398" t="14904" r="6701" b="15067"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">9</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">We</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6749" t="14976" r="6984" b="15067">use</wd>

<space/>

<wd l="7032" t="14938" r="7248" b="15067">the</wd>

<space/>

</run>

<wd l="7306" t="14942" r="7685" b="15091"><run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">train</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7738" t="14938" r="7954" b="15067">the</wd>

<space/>

</run>

<wd l="8002" t="14938" r="8285" b="15091"><run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">dev</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8342" t="14938" r="8597" b="15067">and</wd>

<space/>

<wd l="8640" t="14938" r="8861" b="15067">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8909" t="14938" r="9149" b="15067">dev</wd>

<space/>

<wd l="9221" t="14938" r="9576" b="15067">2015</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9629" t="14957" r="9826" b="15067">set</wd>

<space/>

<wd l="9869" t="14938" r="10080" b="15067">for</wd>

<space/>

<wd l="10123" t="14938" r="10502" b="15067">train-</wd>

</run>

</ln>

<ln l="6144" t="15134" r="7570" b="15302" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="15134" r="6370" b="15302">ing</wd>

<space/>

<wd l="6418" t="15134" r="6634" b="15264">the</wd>

<space/>

<wd l="6682" t="15139" r="7042" b="15264">NER</wd>

<space/>

<wd l="7085" t="15134" r="7570" b="15264">model.</wd>

</ln>

</para>

</column>

</section>

<dd l="5738" t="15746" r="6229" b="15975">

<para l="5771" t="15792" r="6196" b="15946" alignment="left" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15792" r="6130" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="14">

<wd l="5837" t="15792" r="6130" b="15946">139</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4320.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1252" marginRight="1339" marginBottom="1292" offsetX="-34" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1252" r="10570" b="15315">

<column l="1440" t="1252" r="5890" b="15315">

<table l="1440" t="1262" r="5890" b="2904" alignment="left" spaceBefore="10" spaceAfter="158">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>1498</gridCol>

<gridCol>1056</gridCol>

<gridCol>936</gridCol>

<gridCol>960</gridCol>

<gridRow>278</gridRow>

<gridRow>250</gridRow>

<gridRow>274</gridRow>

<gridRow>268</gridRow>

<gridRow>274</gridRow>

<gridRow>298</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="1584" t="1306" r="2798" b="1502" alignment="centered" spaceAfter="17" lsp="exactly" lspExact="247" language="en">

<ln l="1584" t="1306" r="2798" b="1502" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1584" t="1306" r="2227" b="1502">System</wd>

<space/>

<wd l="2280" t="1306" r="2798" b="1459">Name</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3058" t="1301" r="3874" b="1459" alignment="centered" spaceAfter="17" lsp="exactly" lspExact="247" language="en">

<ln l="3058" t="1301" r="3874" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3058" t="1301" r="3874" b="1459">Precision</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4186" t="1301" r="4742" b="1459" alignment="centered" spaceAfter="17" lsp="exactly" lspExact="247" language="en">

<ln l="4186" t="1301" r="4742" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4186" t="1301" r="4742" b="1459">Recall</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5299" t="1306" r="5506" b="1454" alignment="centered" spaceAfter="17" lsp="exactly" lspExact="247" language="en">

<ln l="5299" t="1306" r="5506" b="1454" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-8">

<wd l="5299" t="1306" r="5506" b="1454">F1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="1656" t="1579" r="2726" b="1738" alignment="centered" lsp="exactly" lspExact="245" language="en">

<ln l="1656" t="1579" r="2726" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="1584" r="1997" b="1738">Our</wd>

<space/>

<wd l="2050" t="1579" r="2726" b="1738">Method</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="3134" t="1579" r="3792" b="1738" alignment="left" lsp="exactly" lspExact="245" language="en">

<tabs position="3134"/>

<ln l="3134" t="1579" r="3792" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3134" t="1579" r="3792" b="1738">57.66%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="4114" t="1579" r="4795" b="1738" alignment="left" lsp="exactly" lspExact="245" language="en">

<tabs position="4114"/>

<ln l="4114" t="1579" r="4795" b="1738" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-9">

<wd l="4114" t="1579" r="4795" b="1738">55.22%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="5064" t="1579" r="5741" b="1738" alignment="left" lsp="exactly" lspExact="245" language="en">

<tabs position="5064"/>

<ln l="5064" t="1579" r="5741" b="1738" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-10">

<wd l="5064" t="1579" r="5741" b="1738">56.41%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<para l="1747" t="1858" r="2630" b="2011" alignment="centered" lsp="exactly" lspExact="269" language="en">

<ln l="1747" t="1858" r="2630" b="2011" baseLine="2002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1747" t="1858" r="2630" b="2011">NLANGP</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<para l="3134" t="1853" r="3792" b="2011" alignment="left" lsp="exactly" lspExact="268" language="en">

<tabs position="3134"/>

<ln l="3134" t="1853" r="3792" b="2011" baseLine="2002">

<wd l="3134" t="1853" r="3792" b="2011"><run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">63.62</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">%</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6"><nl orig="true"/>

</run>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<para l="4128" t="1858" r="4790" b="2011" alignment="left" lsp="exactly" lspExact="269" language="en">

<tabs position="4128"/>

<ln l="4128" t="1858" r="4790" b="2011" baseLine="2002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4128" t="1858" r="4790" b="2011">41.12%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<para l="5083" t="1853" r="5741" b="2011" alignment="left" lsp="exactly" lspExact="269" language="en">

<tabs position="5083"/>

<ln l="5083" t="1853" r="5741" b="2011" baseLine="2002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5083" t="1853" r="5741" b="2011">51.40%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<para l="2050" t="2131" r="2323" b="2280" alignment="centered" lsp="exactly" lspExact="254" language="en">

<ln l="2050" t="2131" r="2323" b="2280" baseLine="2270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2050" t="2174" r="2323" b="2280">nrc</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<para l="3134" t="2122" r="3792" b="2280" alignment="left" lsp="exactly" lspExact="254" language="en">

<tabs position="3134"/>

<ln l="3134" t="2122" r="3792" b="2280" baseLine="2270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3134" t="2122" r="3792" b="2280">53.24%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<para l="4133" t="2122" r="4790" b="2280" alignment="left" lsp="exactly" lspExact="254" language="en">

<tabs position="4133"/>

<ln l="4133" t="2122" r="4790" b="2280" baseLine="2270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4133" t="2122" r="4790" b="2280">38.58%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<para l="5078" t="2126" r="5741" b="2280" alignment="left" lsp="exactly" lspExact="254" language="en">

<tabs position="5078"/>

<ln l="5078" t="2126" r="5741" b="2280" baseLine="2270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5078" t="2126" r="5741" b="2280">44.74%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<para l="1560" t="2390" r="2818" b="2549" alignment="centered" lsp="exactly" lspExact="260" language="en">

<ln l="1560" t="2390" r="2818" b="2549" baseLine="2544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1560" t="2390" r="2818" b="2549">multimedialab</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<para l="3130" t="2390" r="3792" b="2549" alignment="left" lsp="exactly" lspExact="260" language="en">

<tabs position="3130"/>

<ln l="3130" t="2390" r="3792" b="2549" baseLine="2544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3130" t="2390" r="3792" b="2549">49.52%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<para l="4133" t="2395" r="4790" b="2549" alignment="left" lsp="exactly" lspExact="260" language="en">

<tabs position="4133"/>

<ln l="4133" t="2395" r="4790" b="2549" baseLine="2544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4133" t="2395" r="4790" b="2549">39.18%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<para l="5078" t="2390" r="5741" b="2549" alignment="left" lsp="exactly" lspExact="260" language="en">

<tabs position="5078"/>

<ln l="5078" t="2390" r="5741" b="2549" baseLine="2544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5078" t="2390" r="5741" b="2549">43.75%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="1910" t="2669" r="2467" b="2822" alignment="centered" spaceAfter="22" lsp="exactly" lspExact="266" language="en">

<ln l="1910" t="2669" r="2467" b="2822" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1910" t="2669" r="2467" b="2822">USFD</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="3130" t="2664" r="3792" b="2822" alignment="left" spaceAfter="22" lsp="exactly" lspExact="266" language="en">

<tabs position="3130"/>

<ln l="3130" t="2664" r="3792" b="2822" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3130" t="2664" r="3792" b="2822">45.72%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="4133" t="2664" r="4790" b="2822" alignment="left" spaceAfter="22" lsp="exactly" lspExact="266" language="en">

<tabs position="4133"/>

<ln l="4133" t="2664" r="4790" b="2822" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4133" t="2664" r="4790" b="2822">39.64%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="5078" t="2664" r="5741" b="2822" alignment="left" spaceAfter="22" lsp="exactly" lspExact="266" language="en">

<tabs position="5078"/>

<ln l="5078" t="2664" r="5741" b="2822" baseLine="2813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5078" t="2664" r="5741" b="2822">42.46%</wd>

</ln>

</para>

</cell>

</table>

<para l="1440" t="3120" r="5808" b="3595" alignment="justified" ri="72" spaceAfter="215" lsp="exactly" lspExact="269" language="en">

<ln l="1440" t="3120" r="5808" b="3322" baseLine="3274" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3120" r="1920" b="3278">Table</wd>

<space/>

<wd l="1982" t="3125" r="2131" b="3278">2:</wd>

<space/>

<wd l="2222" t="3120" r="3413" b="3278">Performances</wd>

<space/>

<wd l="3485" t="3120" r="3672" b="3278">of</wd>

<space/>

<wd l="3715" t="3120" r="3984" b="3278">the</wd>

<space/>

<wd l="4042" t="3120" r="4843" b="3322">proposed</wd>

<space/>

<wd l="4910" t="3144" r="5582" b="3322">systems</wd>

<space/>

<wd l="5654" t="3144" r="5808" b="3278">at</wd>

<space/>

</ln>

<ln l="1440" t="3394" r="5088" b="3595" baseLine="3542" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="3394" r="1829" b="3552">both</wd>

<space/>

<wd l="1891" t="3394" r="3043" b="3595">segmentation</wd>

<space/>

<wd l="3101" t="3394" r="3413" b="3552">and</wd>

<space/>

<wd l="3470" t="3394" r="4608" b="3552">classification</wd>

<space/>

<wd l="4661" t="3394" r="5088" b="3552">tasks</wd>

</ln>

</para>

<table l="1548" t="3840" r="5710" b="6835" alignment="left" li="108" ri="180" spaceBefore="10" spaceAfter="158">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>1265</gridCol>

<gridCol>1051</gridCol>

<gridCol>907</gridCol>

<gridCol>939</gridCol>

<gridRow>278</gridRow>

<gridRow>255</gridRow>

<gridRow>269</gridRow>

<gridRow>268</gridRow>

<gridRow>274</gridRow>

<gridRow>269</gridRow>

<gridRow>273</gridRow>

<gridRow>269</gridRow>

<gridRow>274</gridRow>

<gridRow>269</gridRow>

<gridRow>297</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="1675" t="3878" r="2693" b="4080" alignment="centered" spaceAfter="18" lsp="exactly" lspExact="246" language="en">

<ln l="1675" t="3878" r="2693" b="4080" baseLine="4027" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1675" t="3878" r="2208" b="4080">Entity</wd>

<space/>

<wd l="2266" t="3883" r="2693" b="4080">Type</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="2933" t="3878" r="3749" b="4037" alignment="centered" spaceAfter="18" lsp="exactly" lspExact="246" language="en">

<ln l="2933" t="3878" r="3749" b="4037" baseLine="4027" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2933" t="3878" r="3749" b="4037">Precision</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4042" t="3878" r="4598" b="4037" alignment="centered" spaceAfter="18" lsp="exactly" lspExact="246" language="en">

<ln l="4042" t="3878" r="4598" b="4037" baseLine="4027" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4042" t="3878" r="4598" b="4037">Recall</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5117" t="3883" r="5328" b="4032" alignment="centered" spaceAfter="18" lsp="exactly" lspExact="246" language="en">

<ln l="5117" t="3883" r="5328" b="4032" baseLine="4027" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">

<wd l="5117" t="3883" r="5328" b="4032">F1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="1790" t="4166" r="2582" b="4358" alignment="centered" lsp="exactly" lspExact="245" language="en">

<ln l="1790" t="4166" r="2582" b="4358" baseLine="4306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1790" t="4210" r="2582" b="4358">company</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="3005" t="4162" r="3667" b="4315" alignment="left" lsp="exactly" lspExact="245" language="en">

<tabs position="3005"/>

<ln l="3005" t="4162" r="3667" b="4315" baseLine="4306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3005" t="4162" r="3667" b="4315">41.82%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="3989" t="4157" r="4646" b="4315" alignment="left" lsp="exactly" lspExact="245" language="en">

<tabs position="3989"/>

<ln l="3989" t="4157" r="4646" b="4315" baseLine="4306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3989" t="4157" r="4646" b="4315">58.97%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="decimal" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<para l="4896" t="4162" r="5558" b="4315" alignment="left" lsp="exactly" lspExact="245" language="en">

<tabs position="4896"/>

<ln l="4896" t="4162" r="5558" b="4315" baseLine="4306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4896" t="4162" r="5558" b="4315">48.94%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<para l="1877" t="4430" r="2491" b="4632" alignment="centered" lsp="exactly" lspExact="263" language="en">

<ln l="1877" t="4430" r="2491" b="4632" baseLine="4579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1877" t="4430" r="2491" b="4632">facility</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<para l="3010" t="4430" r="3667" b="4589" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="3010"/>

<ln l="3010" t="4430" r="3667" b="4589" baseLine="4579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3010" t="4430" r="3667" b="4589">50.00%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<para l="3989" t="4430" r="4646" b="4589" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="3989"/>

<ln l="3989" t="4430" r="4646" b="4589" baseLine="4579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3989" t="4430" r="4646" b="4589">26.32%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<para l="4901" t="4435" r="5558" b="4589" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="4901"/>

<ln l="4901" t="4435" r="5558" b="4589" baseLine="4579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4901" t="4435" r="5558" b="4589">34.48%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<para l="1862" t="4699" r="2506" b="4901" alignment="centered" lsp="exactly" lspExact="254" language="en">

<ln l="1862" t="4699" r="2506" b="4901" baseLine="4848" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1862" t="4699" r="2506" b="4901">geo-loc</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<para l="3010" t="4699" r="3667" b="4858" alignment="left" lsp="exactly" lspExact="254" language="en">

<tabs position="3010"/>

<ln l="3010" t="4699" r="3667" b="4858" baseLine="4848" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3010" t="4699" r="3667" b="4858">57.59%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<para l="3984" t="4699" r="4646" b="4858" alignment="left" lsp="exactly" lspExact="254" language="en">

<tabs position="3984"/>

<ln l="3984" t="4699" r="4646" b="4858" baseLine="4848" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3984" t="4699" r="4646" b="4858">78.45%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<para l="4901" t="4699" r="5558" b="4858" alignment="left" lsp="exactly" lspExact="254" language="en">

<tabs position="4901"/>

<ln l="4901" t="4699" r="5558" b="4858" baseLine="4848" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4901" t="4699" r="5558" b="4858">66.42%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<para l="1915" t="4968" r="2458" b="5126" alignment="centered" spaceAfter="3" lsp="exactly" lspExact="271" language="en">

<ln l="1915" t="4968" r="2458" b="5126" baseLine="5122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1915" t="4968" r="2458" b="5126">movie</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<para l="3010" t="4968" r="3667" b="5126" alignment="left" spaceAfter="3" lsp="exactly" lspExact="271" language="en">

<tabs position="3010"/>

<ln l="3010" t="4968" r="3667" b="5126" baseLine="5122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3010" t="4968" r="3667" b="5126">66.67%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<para l="3984" t="4973" r="4646" b="5126" alignment="left" spaceAfter="3" lsp="exactly" lspExact="271" language="en">

<tabs position="3984"/>

<ln l="3984" t="4973" r="4646" b="5126" baseLine="5122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3984" t="4973" r="4646" b="5126">40.00%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<para l="4901" t="4968" r="5558" b="5126" alignment="left" spaceAfter="3" lsp="exactly" lspExact="271" language="en">

<tabs position="4901"/>

<ln l="4901" t="4968" r="5558" b="5126" baseLine="5122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4901" t="4968" r="5558" b="5126">50.00%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<para l="1709" t="5242" r="2664" b="5400" alignment="centered" lsp="exactly" lspExact="259" language="en">

<ln l="1709" t="5242" r="2664" b="5400" baseLine="5390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1709" t="5242" r="2664" b="5400">musicartist</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<para l="3005" t="5246" r="3667" b="5400" alignment="left" lsp="exactly" lspExact="259" language="en">

<tabs position="3005"/>

<ln l="3005" t="5246" r="3667" b="5400" baseLine="5390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3005" t="5246" r="3667" b="5400">70.00%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<para l="3989" t="5242" r="4646" b="5400" alignment="left" lsp="exactly" lspExact="259" language="en">

<tabs position="3989"/>

<ln l="3989" t="5242" r="4646" b="5400" baseLine="5390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3989" t="5242" r="4646" b="5400">34.15%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<para l="4896" t="5242" r="5558" b="5400" alignment="left" lsp="exactly" lspExact="259" language="en">

<tabs position="4896"/>

<ln l="4896" t="5242" r="5558" b="5400" baseLine="5390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4896" t="5242" r="5558" b="5400">45.90%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="6" gridRowTill="6" alignment="left" verticalAlignment="middle">

<para l="1968" t="5510" r="2414" b="5669" alignment="centered" lsp="exactly" lspExact="263" language="en">

<ln l="1968" t="5510" r="2414" b="5669" baseLine="5664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1968" t="5510" r="2414" b="5669">other</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="6" gridRowTill="6" alignment="decimal" verticalAlignment="middle">

<para l="3005" t="5510" r="3667" b="5669" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="3005"/>

<ln l="3005" t="5510" r="3667" b="5669" baseLine="5664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3005" t="5510" r="3667" b="5669">47.06%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="6" gridRowTill="6" alignment="decimal" verticalAlignment="middle">

<para l="3984" t="5515" r="4646" b="5669" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="3984"/>

<ln l="3984" t="5515" r="4646" b="5669" baseLine="5664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3984" t="5515" r="4646" b="5669">42.42%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="6" gridRowTill="6" alignment="decimal" verticalAlignment="middle">

<para l="4896" t="5510" r="5558" b="5669" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="4896"/>

<ln l="4896" t="5510" r="5558" b="5669" baseLine="5664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4896" t="5510" r="5558" b="5669">44.62%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="7" gridRowTill="7" alignment="left" verticalAlignment="middle">

<para l="1896" t="5789" r="2477" b="5986" alignment="centered" lsp="exactly" lspExact="264" language="en">

<ln l="1896" t="5789" r="2477" b="5986" baseLine="5933" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1896" t="5837" r="2477" b="5986">person</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="7" gridRowTill="7" alignment="decimal" verticalAlignment="middle">

<para l="3005" t="5789" r="3667" b="5942" alignment="left" lsp="exactly" lspExact="264" language="en">

<tabs position="3005"/>

<ln l="3005" t="5789" r="3667" b="5942" baseLine="5933" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3005" t="5789" r="3667" b="5942">70.97%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="7" gridRowTill="7" alignment="decimal" verticalAlignment="middle">

<para l="3984" t="5789" r="4651" b="5942" alignment="left" lsp="exactly" lspExact="264" language="en">

<tabs position="3984"/>

<ln l="3984" t="5789" r="4651" b="5942" baseLine="5933" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3984" t="5789" r="4651" b="5942">77.19%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="7" gridRowTill="7" alignment="decimal" verticalAlignment="middle">

<para l="4896" t="5784" r="5558" b="5942" alignment="left" lsp="exactly" lspExact="264" language="en">

<tabs position="4896"/>

<ln l="4896" t="5784" r="5558" b="5942" baseLine="5933" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4896" t="5784" r="5558" b="5942">73.95%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="8" gridRowTill="8" alignment="left" verticalAlignment="middle">

<para l="1853" t="6053" r="2520" b="6254" alignment="centered" lsp="exactly" lspExact="269" language="en">

<ln l="1853" t="6053" r="2520" b="6254" baseLine="6206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1853" t="6053" r="2520" b="6254">product</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="8" gridRowTill="8" alignment="decimal" verticalAlignment="middle">

<para l="3010" t="6058" r="3667" b="6211" alignment="left" lsp="exactly" lspExact="269" language="en">

<tabs position="3010"/>

<ln l="3010" t="6058" r="3667" b="6211" baseLine="6206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3010" t="6058" r="3667" b="6211">34.78%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="8" gridRowTill="8" alignment="decimal" verticalAlignment="middle">

<para l="3989" t="6053" r="4646" b="6211" alignment="left" lsp="exactly" lspExact="269" language="en">

<tabs position="3989"/>

<ln l="3989" t="6053" r="4646" b="6211" baseLine="6206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3989" t="6053" r="4646" b="6211">21.62%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="8" gridRowTill="8" alignment="decimal" verticalAlignment="middle">

<para l="4901" t="6053" r="5558" b="6211" alignment="left" lsp="exactly" lspExact="269" language="en">

<tabs position="4901"/>

<ln l="4901" t="6053" r="5558" b="6211" baseLine="6206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4901" t="6053" r="5558" b="6211">26.67%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="9" gridRowTill="9" alignment="left" verticalAlignment="middle">

<para l="1723" t="6331" r="2659" b="6528" alignment="centered" spaceAfter="3" lsp="exactly" lspExact="265" language="en">

<ln l="1723" t="6331" r="2659" b="6528" baseLine="6475" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1723" t="6350" r="2659" b="6528">sportsteam</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="9" gridRowTill="9" alignment="decimal" verticalAlignment="middle">

<para l="3010" t="6326" r="3667" b="6485" alignment="left" spaceAfter="3" lsp="exactly" lspExact="265" language="en">

<tabs position="3010"/>

<ln l="3010" t="6326" r="3667" b="6485" baseLine="6475" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3010" t="6326" r="3667" b="6485">66.67%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="9" gridRowTill="9" alignment="decimal" verticalAlignment="middle">

<para l="3989" t="6331" r="4646" b="6485" alignment="left" spaceAfter="3" lsp="exactly" lspExact="265" language="en">

<tabs position="3989"/>

<ln l="3989" t="6331" r="4646" b="6485" baseLine="6475" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="3989" t="6331" r="4646" b="6485">34.29%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="9" gridRowTill="9" alignment="decimal" verticalAlignment="middle">

<para l="4896" t="6326" r="5558" b="6485" alignment="left" spaceAfter="3" lsp="exactly" lspExact="265" language="en">

<tabs position="4896"/>

<ln l="4896" t="6326" r="5558" b="6485" baseLine="6475" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4896" t="6326" r="5558" b="6485">45.28%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="10" gridRowTill="10" alignment="left" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="1872" t="6595" r="2496" b="6754" alignment="centered" spaceAfter="17" lsp="exactly" lspExact="270" language="en">

<ln l="1872" t="6595" r="2496" b="6754" baseLine="6749" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1872" t="6595" r="2496" b="6754">tvshow</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="10" gridRowTill="10" alignment="decimal" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="3029" t="6600" r="3667" b="6754" alignment="left" spaceAfter="17" lsp="exactly" lspExact="270" language="en">

<tabs position="3029"/>

<ln l="3029" t="6600" r="3667" b="6754" baseLine="6749" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="3029" t="6600" r="3667" b="6754">14.29%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="10" gridRowTill="10" alignment="decimal" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="3989" t="6595" r="4651" b="6754" alignment="left" spaceAfter="17" lsp="exactly" lspExact="270" language="en">

<tabs position="3989"/>

<ln l="3989" t="6595" r="4651" b="6754" baseLine="6749" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3989" t="6595" r="4651" b="6754">50.00%</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="10" gridRowTill="10" alignment="decimal" verticalAlignment="middle">

<bottomBorder type="single" width="10"/>

<para l="4901" t="6600" r="5558" b="6754" alignment="left" spaceAfter="17" lsp="exactly" lspExact="270" language="en">

<tabs position="4901"/>

<ln l="4901" t="6600" r="5558" b="6754" baseLine="6749" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4901" t="6600" r="5558" b="6754">22.22%</wd>

</ln>

</para>

</cell>

</table>

<para l="1440" t="7051" r="5803" b="7795" alignment="justified" ri="72" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="7051" r="5794" b="7253" baseLine="7205" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="7051" r="1920" b="7210">Table</wd>

<space/>

<wd l="1997" t="7056" r="2146" b="7210">3:</wd>

<space/>

<wd l="2266" t="7051" r="3379" b="7210">Performance</wd>

<space/>

<wd l="3461" t="7051" r="3653" b="7210">of</wd>

<space/>

<wd l="3715" t="7104" r="4003" b="7210">our</wd>

<space/>

<wd l="4085" t="7075" r="4685" b="7253">system</wd>

<space/>

<wd l="4757" t="7075" r="4910" b="7210">at</wd>

<space/>

<wd l="4982" t="7051" r="5371" b="7210">both</wd>

<space/>

<wd l="5453" t="7104" r="5794" b="7253">seg-</wd>

</ln>

<ln l="1440" t="7325" r="5803" b="7526" baseLine="7474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="7325" r="2314" b="7483">mentation</wd>

<space/>

<wd l="2366" t="7325" r="2678" b="7483">and</wd>

<space/>

<wd l="2731" t="7325" r="3869" b="7483">classification</wd>

<space/>

<wd l="3917" t="7325" r="4344" b="7483">tasks</wd>

<space/>

<wd l="4406" t="7325" r="5011" b="7483">broken</wd>

<space/>

<wd l="5064" t="7325" r="5539" b="7483">down</wd>

<space/>

<wd l="5587" t="7325" r="5803" b="7526">by</wd>

<space/>

</ln>

<ln l="1445" t="7594" r="2443" b="7795" baseLine="7747" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="7594" r="1934" b="7795">entity</wd>

<space/>

<wd l="1992" t="7618" r="2443" b="7795">types</wd>

</ln>

</para>

<para l="1440" t="8246" r="3029" b="8419" alignment="left" ri="72" spaceBefore="397" lsp="exactly" lspExact="273" language="en">

<ln l="1440" t="8246" r="3029" b="8419" baseLine="8414" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="12">

<wd l="1440" t="8246" r="1555" b="8414">4</wd>

<space/>

<wd l="1810" t="8246" r="3029" b="8419">Conclusions</wd>

</ln>

</para>

<para l="1440" t="8683" r="5808" b="10738" alignment="justified" ri="72" spaceBefore="151" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="8683" r="5808" b="8885" baseLine="8832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="8688" r="1622" b="8837">In</wd>

<space/>

<wd l="1718" t="8683" r="2026" b="8842">this</wd>

<space/>

<wd l="2136" t="8736" r="2654" b="8885">paper,</wd>

<space/>

<wd l="2774" t="8736" r="3029" b="8842">we</wd>

<space/>

<wd l="3130" t="8683" r="3926" b="8885">proposed</wd>

<space/>

<wd l="4032" t="8736" r="4128" b="8842">a</wd>

<space/>

<wd l="4219" t="8683" r="4694" b="8842">novel</wd>

<space/>

<wd l="4800" t="8683" r="5453" b="8842">method</wd>

<space/>

<wd l="5549" t="8683" r="5808" b="8842">for</wd>

<space/>

</ln>

<ln l="1440" t="8957" r="5803" b="9115" baseLine="9106" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="8957" r="1704" b="9115">the</wd>

<space/>

<wd l="1838" t="8957" r="2467" b="9115">Twitter</wd>

<space/>

<wd l="2597" t="8962" r="3029" b="9115">NER</wd>

<space/>

<wd l="3163" t="8957" r="3557" b="9115">task.</wd>

<space/>

<wd l="3869" t="8962" r="4152" b="9115">We</wd>

<space/>

<wd l="4296" t="8957" r="4949" b="9115">showed</wd>

<space/>

<wd l="5078" t="8957" r="5410" b="9115">that</wd>

<space/>

<wd l="5539" t="8957" r="5803" b="9115">the</wd>

<space/>

</ln>

<ln l="1445" t="9226" r="5794" b="9427" baseLine="9374" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="9226" r="1810" b="9384">data</wd>

<space/>

<wd l="1896" t="9226" r="2664" b="9384">retrieved</wd>

<space/>

<wd l="2760" t="9226" r="3187" b="9384">from</wd>

<space/>

<wd l="3283" t="9278" r="3706" b="9427">open</wd>

<space/>

<wd l="3797" t="9226" r="4747" b="9427">knowledge</wd>

<space/>

<wd l="4843" t="9226" r="5309" b="9384">bases</wd>

<space/>

<wd l="5419" t="9226" r="5794" b="9422">(i.e.,</wd>

<space/>

</ln>

<ln l="1440" t="9494" r="5803" b="9696" baseLine="9648" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="9494" r="2386" b="9696">Wikipedia,</wd>

<space/>

<wd l="2491" t="9494" r="3307" b="9696">DBpedia,</wd>

<space/>

<wd l="3413" t="9494" r="4253" b="9691">Freebase)</wd>

<space/>

<wd l="4354" t="9547" r="4646" b="9653">can</wd>

<space/>

<wd l="4738" t="9494" r="4944" b="9653">be</wd>

<space/>

<wd l="5030" t="9494" r="5803" b="9696">naturally</wd>

<space/>

</ln>

<ln l="1440" t="9768" r="5794" b="9970" baseLine="9917">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="9768" r="2280" b="9970">leveraged</wd>

<space/>

<wd l="2376" t="9792" r="2544" b="9926">to</wd>

<space/>

<wd l="2650" t="9768" r="3360" b="9926">enhance</wd>

<space/>

<wd l="3456" t="9773" r="3893" b="9926">NER</wd>

<space/>

<wd l="3994" t="9768" r="4459" b="9970">using</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4565" t="9778" r="5045" b="9970">entity</wd>

<space/>

</run>

<wd l="5150" t="9768" r="5794" b="9970"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">linking</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="1440" t="10037" r="5794" b="10238" baseLine="10190" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="10037" r="2573" b="10224">Furthermore,</wd>

<space/>

<wd l="2650" t="10037" r="2957" b="10195">this</wd>

<space/>

<wd l="3034" t="10037" r="3394" b="10195">data</wd>

<space/>

<wd l="3456" t="10090" r="4114" b="10238">appears</wd>

<space/>

<wd l="4181" t="10061" r="4349" b="10195">to</wd>

<space/>

<wd l="4416" t="10037" r="4618" b="10195">be</wd>

<space/>

<wd l="4680" t="10037" r="5237" b="10238">highly</wd>

<space/>

<wd l="5309" t="10037" r="5794" b="10195">effec-</wd>

</ln>

<ln l="1440" t="10310" r="5794" b="10512" baseLine="10459">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="10310" r="1757" b="10469">tive</wd>

<space/>

<wd l="1834" t="10310" r="2093" b="10469">for</wd>

<space/>

<wd l="2160" t="10310" r="2549" b="10469">both</wd>

<space/>

<wd l="2621" t="10310" r="2890" b="10469">the</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2962" t="10320" r="4114" b="10512">segmentation</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4195" t="10310" r="4507" b="10469">and</wd>

<space/>

<wd l="4579" t="10310" r="4848" b="10469">the</wd>

<space/>

</run>

<wd l="4925" t="10310" r="5794" b="10512" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">classifica-</wd>

</ln>

<ln l="1445" t="10579" r="2314" b="10738" baseLine="10733">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="10589" r="1776" b="10738">tion</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1834" t="10579" r="2314" b="10738">tasks.</wd>

</run>

</ln>

</para>

<para l="1445" t="11299" r="2544" b="11472" alignment="left" ri="72" spaceBefore="456" lsp="exactly" lspExact="273" language="en">

<ln l="1445" t="11299" r="2544" b="11472" baseLine="11462" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="11299" r="2544" b="11472">References</wd>

</ln>

</para>

<para l="1445" t="11683" r="5798" b="12528" alignment="justified" li="216" ri="72" spaceBefore="127" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1445" t="11683" r="5798" b="11870" baseLine="11821" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="11683" r="1906" b="11827">Sören</wd>

<space/>

<wd l="1987" t="11688" r="2424" b="11851">Auer,</wd>

<space/>

<wd l="2525" t="11683" r="3250" b="11827">Christian</wd>

<space/>

<wd l="3336" t="11683" r="3802" b="11851">Bizer,</wd>

<space/>

<wd l="3907" t="11683" r="4450" b="11870">Georgi</wd>

<space/>

<wd l="4541" t="11683" r="5362" b="11851">Kobilarov,</wd>

<space/>

<wd l="5462" t="11688" r="5798" b="11827">Jens</wd>

<space/>

</ln>

<ln l="1656" t="11904" r="5794" b="12091" baseLine="12038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="11904" r="2453" b="12072">Lehmann,</wd>

<space/>

<wd l="2587" t="11904" r="3216" b="12048">Richard</wd>

<space/>

<wd l="3331" t="11904" r="4133" b="12091">Cyganiak,</wd>

<space/>

<wd l="4272" t="11904" r="4555" b="12048">and</wd>

<space/>

<wd l="4666" t="11904" r="5314" b="12091">Zachary</wd>

<space/>

<wd l="5429" t="11909" r="5794" b="12048">Ives.</wd>

<space/>

</ln>

<ln l="1661" t="12125" r="5794" b="12307" baseLine="12259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="12125" r="2093" b="12269">2007.</wd>

<space/>

<wd l="2222" t="12125" r="2971" b="12307">DBpedia:</wd>

<space/>

<wd l="3082" t="12168" r="3168" b="12269">a</wd>

<space/>

<wd l="3226" t="12125" r="3830" b="12269">nucleus</wd>

<space/>

<wd l="3898" t="12125" r="4133" b="12269">for</wd>

<space/>

<wd l="4200" t="12168" r="4286" b="12269">a</wd>

<space/>

<wd l="4349" t="12125" r="4675" b="12269">web</wd>

<space/>

<wd l="4747" t="12125" r="4920" b="12269">of</wd>

<space/>

<wd l="4978" t="12168" r="5362" b="12307">open</wd>

<space/>

<wd l="5429" t="12125" r="5794" b="12269">data.</wd>

<space/>

</ln>

<ln l="1666" t="12341" r="4464" b="12528" baseLine="12480">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1666" t="12341" r="1954" b="12485">The</wd>

<space/>

<wd l="2006" t="12346" r="2736" b="12485">Semantic</wd>

<space/>

</run>

<wd l="2798" t="12341" r="3168" b="12509"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Web</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3221" t="12384" r="3672" b="12528">pages</wd>

<space/>

<wd l="3725" t="12341" r="4464" b="12485">722–735.</wd>

</run>

</ln>

</para>

<para l="1440" t="12744" r="5813" b="14237" alignment="justified" li="216" ri="72" spaceBefore="178" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="12744" r="5798" b="12931" baseLine="12883" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12744" r="2117" b="12931">Timothy</wd>

<space/>

<wd l="2261" t="12744" r="2981" b="12912">Baldwin,</wd>

<space/>

<wd l="3154" t="12744" r="3624" b="12888">Marie</wd>

<space/>

<wd l="3778" t="12744" r="4546" b="12888">Catherine</wd>

<space/>

<wd l="4694" t="12744" r="4877" b="12888">de</wd>

<space/>

<wd l="5021" t="12744" r="5798" b="12912">Marneffe,</wd>

<space/>

</ln>

<ln l="1656" t="12965" r="5803" b="13152" baseLine="13099" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="12970" r="1886" b="13109">Bo</wd>

<space/>

<wd l="1982" t="12970" r="2357" b="13133">Han,</wd>

<space/>

<wd l="2462" t="12970" r="3442" b="13152">Young-Bum</wd>

<space/>

<wd l="3533" t="12965" r="3926" b="13133">Kim,</wd>

<space/>

<wd l="4037" t="12965" r="4421" b="13109">Alan</wd>

<space/>

<wd l="4512" t="12965" r="5002" b="13133">Ritter,</wd>

<space/>

<wd l="5117" t="12965" r="5400" b="13109">and</wd>

<space/>

<wd l="5491" t="12965" r="5803" b="13109">Wei</wd>

<space/>

</ln>

<ln l="1656" t="13186" r="5808" b="13368" baseLine="13320" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="13190" r="1939" b="13330">Xu.</wd>

<space/>

<wd l="2083" t="13186" r="2515" b="13330">2015.</wd>

<space/>

<wd l="2664" t="13186" r="3211" b="13330">Shared</wd>

<space/>

<wd l="3278" t="13186" r="3672" b="13330">tasks</wd>

<space/>

<wd l="3749" t="13186" r="3922" b="13330">of</wd>

<space/>

<wd l="3979" t="13186" r="4219" b="13330">the</wd>

<space/>

<wd l="4291" t="13186" r="4680" b="13330">2015</wd>

<space/>

<wd l="4757" t="13186" r="5534" b="13368">workshop</wd>

<space/>

<wd l="5611" t="13229" r="5808" b="13330">on</wd>

<space/>

</ln>

<ln l="1656" t="13402" r="5798" b="13589" baseLine="13541" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="13402" r="2088" b="13589">noisy</wd>

<space/>

<wd l="2174" t="13402" r="3346" b="13589">user-generated</wd>

<space/>

<wd l="3427" t="13421" r="3763" b="13546">text:</wd>

<space/>

<wd l="3907" t="13402" r="4478" b="13546">Twitter</wd>

<space/>

<wd l="4565" t="13402" r="5088" b="13546">lexical</wd>

<space/>

<wd l="5174" t="13402" r="5798" b="13546">normal-</wd>

</ln>

<ln l="1656" t="13622" r="5798" b="13810" baseLine="13757">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="13622" r="2203" b="13766">ization</wd>

<space/>

<wd l="2275" t="13622" r="2558" b="13766">and</wd>

<space/>

<wd l="2630" t="13622" r="3163" b="13766">named</wd>

<space/>

<wd l="3235" t="13622" r="3682" b="13810">entity</wd>

<space/>

<wd l="3754" t="13622" r="4699" b="13810">recognition.</wd>

<space/>

<wd l="4848" t="13627" r="5016" b="13762">In</wd>

<space/>

</run>

<wd l="5083" t="13622" r="5798" b="13766" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Proceed-</wd>

</ln>

<ln l="1666" t="13843" r="5813" b="14026" baseLine="13978" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1666" t="13848" r="1992" b="14026">ings</wd>

<space/>

<wd l="2054" t="13843" r="2237" b="14026">of</wd>

<space/>

<wd l="2266" t="13843" r="2506" b="13987">the</wd>

<space/>

<wd l="2573" t="13843" r="3350" b="14026">Workshop</wd>

<space/>

<wd l="3418" t="13891" r="3610" b="13987">on</wd>

<space/>

<wd l="3667" t="13848" r="4123" b="14026">Noisy</wd>

<space/>

<wd l="4205" t="13843" r="5434" b="14026">User-generated</wd>

<space/>

<wd l="5496" t="13848" r="5813" b="13987">Text</wd>

<space/>

</ln>

<ln l="1661" t="14059" r="2832" b="14237" baseLine="14198">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="14064" r="2299" b="14237">(WNUT</wd>

<space/>

</run>

<wd l="2328" t="14059" r="2832" b="14237"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1445" t="14462" r="5818" b="15307" alignment="justified" li="216" ri="72" spaceBefore="181" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1445" t="14462" r="5808" b="14630" baseLine="14602" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="14467" r="1805" b="14606">Kurt</wd>

<space/>

<wd l="1891" t="14462" r="2698" b="14630">Bollacker,</wd>

<space/>

<wd l="2808" t="14462" r="3245" b="14606">Colin</wd>

<space/>

<wd l="3331" t="14467" r="3859" b="14630">Evans,</wd>

<space/>

<wd l="3960" t="14467" r="4598" b="14606">Praveen</wd>

<space/>

<wd l="4685" t="14462" r="5376" b="14630">Paritosh,</wd>

<space/>

<wd l="5482" t="14462" r="5808" b="14602">Tim</wd>

<space/>

</ln>

<ln l="1661" t="14683" r="5798" b="14870" baseLine="14818" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1661" t="14683" r="2218" b="14870">Sturge,</wd>

<space/>

<wd l="2304" t="14683" r="2587" b="14827">and</wd>

<space/>

<wd l="2659" t="14683" r="3120" b="14827">Jamie</wd>

<space/>

<wd l="3192" t="14683" r="3734" b="14870">Taylor.</wd>

<space/>

<wd l="3888" t="14683" r="4320" b="14827">2008.</wd>

<space/>

<wd l="4469" t="14683" r="5218" b="14827">Freebase:</wd>

<space/>

<wd l="5342" t="14726" r="5429" b="14827">a</wd>

<space/>

<wd l="5501" t="14683" r="5798" b="14827">col-</wd>

</ln>

<ln l="1656" t="14899" r="5803" b="15086" baseLine="15038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="14899" r="2597" b="15086">laboratively</wd>

<space/>

<wd l="2683" t="14899" r="3259" b="15043">created</wd>

<space/>

<wd l="3341" t="14899" r="3787" b="15086">graph</wd>

<space/>

<wd l="3874" t="14899" r="4550" b="15043">database</wd>

<space/>

<wd l="4632" t="14899" r="4862" b="15043">for</wd>

<space/>

<wd l="4954" t="14899" r="5803" b="15086">structuring</wd>

<space/>

</ln>

<ln l="1656" t="15120" r="5818" b="15307" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1656" t="15120" r="2203" b="15264">human</wd>

<space/>

<wd l="2242" t="15120" r="3149" b="15307">knowledge.</wd>

<space/>

<wd l="3235" t="15125" r="3403" b="15259">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="3442" t="15120" r="4426" b="15302">Proceedings</wd>

<space/>

<wd l="4474" t="15120" r="4656" b="15302">of</wd>

<space/>

<wd l="4670" t="15120" r="4906" b="15264">the</wd>

<space/>

<wd l="4949" t="15120" r="5352" b="15264">2008</wd>

<space/>

<wd l="5376" t="15125" r="5818" b="15264">ACM</wd>

</run>

</ln>

</para>

</column>

<column l="6120" t="1252" r="10570" b="14576">

<para l="6365" t="1334" r="10517" b="1742" alignment="justified" li="216" ri="72" spaceBefore="53" lsp="exactly" lspExact="220" language="en">

<ln l="6365" t="1334" r="10517" b="1517" baseLine="1474" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="1339" r="7128" b="1478">SIGMOD</wd>

<space/>

<wd l="7166" t="1334" r="8227" b="1478">International</wd>

<space/>

<wd l="8280" t="1334" r="9182" b="1517">Conference</wd>

<space/>

<wd l="9235" t="1382" r="9422" b="1478">on</wd>

<space/>

<wd l="9470" t="1339" r="10517" b="1517">Management</wd>

<space/>

</ln>

<ln l="6370" t="1555" r="9768" b="1742" baseLine="1694">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6370" t="1555" r="6552" b="1738">of</wd>

<space/>

<wd l="6562" t="1560" r="6965" b="1699">Data</wd>

<space/>

<wd l="7022" t="1560" r="7848" b="1733">(SIGMOD</wd>

<space/>

</run>

<wd l="7925" t="1555" r="8270" b="1733"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">’08)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="8328" t="1598" r="8774" b="1742">pages</wd>

<space/>

<wd l="8851" t="1555" r="9768" b="1699">1247–1250.</wd>

</run>

</ln>

</para>

<para l="6144" t="1954" r="10512" b="3019" alignment="justified" li="216" ri="72" spaceBefore="174" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="1954" r="10512" b="2136" baseLine="2093" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1954" r="6792" b="2098">William</wd>

<space/>

<wd l="6931" t="1958" r="7138" b="2098">W.</wd>

<space/>

<wd l="7296" t="1954" r="7853" b="2122">Cohen,</wd>

<space/>

<wd l="8021" t="1954" r="8659" b="2136">Pradeep</wd>

<space/>

<wd l="8803" t="1958" r="8986" b="2098">D.</wd>

<space/>

<wd l="9139" t="1954" r="10056" b="2122">Ravikumar,</wd>

<space/>

<wd l="10229" t="1954" r="10512" b="2098">and</wd>

<space/>

</ln>

<ln l="6370" t="2174" r="10507" b="2362" baseLine="2309" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="2174" r="7008" b="2357">Stephen</wd>

<space/>

<wd l="7061" t="2179" r="7219" b="2318">E.</wd>

<space/>

<wd l="7286" t="2174" r="8026" b="2362">Fienberg.</wd>

<space/>

<wd l="8126" t="2174" r="8558" b="2318">2003.</wd>

<space/>

<wd l="8654" t="2179" r="8798" b="2314">A</wd>

<space/>

<wd l="8861" t="2174" r="9782" b="2357">comparison</wd>

<space/>

<wd l="9840" t="2174" r="10013" b="2318">of</wd>

<space/>

<wd l="10066" t="2174" r="10507" b="2362">string</wd>

<space/>

</ln>

<ln l="6370" t="2390" r="10502" b="2578" baseLine="2530">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="2390" r="7013" b="2534">distance</wd>

<space/>

<wd l="7085" t="2390" r="7666" b="2534">metrics</wd>

<space/>

<wd l="7738" t="2390" r="7973" b="2534">for</wd>

<space/>

<wd l="8040" t="2390" r="9274" b="2578">name-matching</wd>

<space/>

<wd l="9346" t="2390" r="9782" b="2534">tasks.</wd>

<space/>

<wd l="9922" t="2395" r="10090" b="2530">In</wd>

<space/>

</run>

<wd l="10157" t="2395" r="10502" b="2534" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Pro-</wd>

</ln>

<ln l="6370" t="2611" r="10502" b="2794" baseLine="2750" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="2611" r="7061" b="2794">ceedings</wd>

<space/>

<wd l="7128" t="2611" r="7310" b="2794">of</wd>

<space/>

<wd l="7339" t="2611" r="8078" b="2755">IJCAI-03</wd>

<space/>

<wd l="8155" t="2611" r="8933" b="2794">Workshop</wd>

<space/>

<wd l="9005" t="2659" r="9197" b="2755">on</wd>

<space/>

<wd l="9259" t="2611" r="10210" b="2794">Information</wd>

<space/>

<wd l="10272" t="2616" r="10502" b="2755">In-</wd>

</ln>

<ln l="6370" t="2832" r="9149" b="3019" baseLine="2966">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="2837" r="7080" b="3014">tegration</wd>

<space/>

<wd l="7138" t="2880" r="7330" b="2976">on</wd>

<space/>

<wd l="7387" t="2832" r="7622" b="2976">the</wd>

<space/>

</run>

<wd l="7685" t="2832" r="8054" b="3000"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Web</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8112" t="2875" r="8558" b="3019">pages</wd>

<space/>

<wd l="8616" t="2832" r="9149" b="2976">73–78.</wd>

</run>

</ln>

</para>

<para l="6144" t="3230" r="10512" b="4507" alignment="justified" li="216" ri="72" spaceBefore="176" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="3230" r="10502" b="3418" baseLine="3365" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3235" r="6557" b="3374">Leon</wd>

<space/>

<wd l="6648" t="3230" r="7598" b="3418">Derczynski,</wd>

<space/>

<wd l="7709" t="3230" r="8189" b="3374">Diana</wd>

<space/>

<wd l="8280" t="3230" r="9038" b="3418">Maynard,</wd>

<space/>

<wd l="9154" t="3230" r="9902" b="3413">Giuseppe</wd>

<space/>

<wd l="9998" t="3230" r="10502" b="3398">Rizzo,</wd>

<space/>

</ln>

<ln l="6365" t="3451" r="10507" b="3638" baseLine="3586" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="3451" r="7022" b="3595">Marieke</wd>

<space/>

<wd l="7166" t="3494" r="7445" b="3595">van</wd>

<space/>

<wd l="7589" t="3456" r="7920" b="3634">Erp,</wd>

<space/>

<wd l="8093" t="3451" r="8928" b="3595">Genevieve</wd>

<space/>

<wd l="9072" t="3451" r="9686" b="3619">Gorrell,</wd>

<space/>

<wd l="9859" t="3451" r="10507" b="3638">Raphaël</wd>

<space/>

</ln>

<ln l="6365" t="3667" r="10498" b="3854" baseLine="3806" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="3672" r="6960" b="3854">Troncy,</wd>

<space/>

<wd l="7118" t="3667" r="7685" b="3811">Johann</wd>

<space/>

<wd l="7819" t="3667" r="8371" b="3835">Petrak,</wd>

<space/>

<wd l="8539" t="3667" r="8822" b="3811">and</wd>

<space/>

<wd l="8957" t="3667" r="9490" b="3811">Kalina</wd>

<space/>

<wd l="9619" t="3667" r="10498" b="3811">Bontcheva.</wd>

<space/>

</ln>

<ln l="6370" t="3888" r="10512" b="4075" baseLine="4022" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="3888" r="6802" b="4032">2015.</wd>

<space/>

<wd l="7013" t="3888" r="7704" b="4075">Analysis</wd>

<space/>

<wd l="7805" t="3888" r="7978" b="4032">of</wd>

<space/>

<wd l="8059" t="3888" r="8592" b="4032">named</wd>

<space/>

<wd l="8683" t="3888" r="9130" b="4075">entity</wd>

<space/>

<wd l="9226" t="3888" r="10133" b="4075">recognition</wd>

<space/>

<wd l="10229" t="3888" r="10512" b="4032">and</wd>

<space/>

</ln>

<ln l="6365" t="4104" r="10502" b="4291" baseLine="4243">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="4104" r="6926" b="4291">linking</wd>

<space/>

<wd l="6984" t="4104" r="7219" b="4248">for</wd>

<space/>

<wd l="7272" t="4123" r="7819" b="4248">tweets.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7920" t="4104" r="8875" b="4286">Information</wd>

<space/>

<wd l="8933" t="4109" r="9806" b="4286">Processing</wd>

<space/>

<wd l="9883" t="4109" r="10013" b="4248">&amp;</wd>

<space/>

<wd l="10075" t="4109" r="10502" b="4248">Man-</wd>

</run>

</ln>

<ln l="6365" t="4325" r="8160" b="4507" baseLine="4464">

<wd l="6365" t="4354" r="7080" b="4507"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">agement</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7138" t="4325" r="8160" b="4502">51(2):32–49.</wd>

</run>

</ln>

</para>

<para l="6149" t="4723" r="10507" b="6446" alignment="justified" li="216" ri="72" spaceBefore="171" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6149" t="4723" r="10502" b="4906" baseLine="4862" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="4723" r="6624" b="4867">Kevin</wd>

<space/>

<wd l="6686" t="4723" r="7325" b="4906">Gimpel,</wd>

<space/>

<wd l="7392" t="4723" r="7963" b="4867">Nathan</wd>

<space/>

<wd l="8030" t="4723" r="8856" b="4891">Schneider,</wd>

<space/>

<wd l="8928" t="4723" r="9600" b="4867">Brendan</wd>

<space/>

<wd l="9667" t="4723" r="10502" b="4891">O’Connor,</wd>

<space/>

</ln>

<ln l="6365" t="4944" r="10502" b="5131" baseLine="5078" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="4944" r="7090" b="5131">Dipanjan</wd>

<space/>

<wd l="7234" t="4949" r="7584" b="5112">Das,</wd>

<space/>

<wd l="7752" t="4944" r="8280" b="5088">Daniel</wd>

<space/>

<wd l="8419" t="4944" r="8885" b="5112">Mills,</wd>

<space/>

<wd l="9053" t="4944" r="9499" b="5088">Jacob</wd>

<space/>

<wd l="9643" t="4944" r="10502" b="5112">Eisenstein,</wd>

<space/>

</ln>

<ln l="6365" t="5160" r="10502" b="5347" baseLine="5299" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="5160" r="7013" b="5304">Michael</wd>

<space/>

<wd l="7061" t="5160" r="7790" b="5328">Heilman,</wd>

<space/>

<wd l="7848" t="5160" r="8232" b="5304">Dani</wd>

<space/>

<wd l="8280" t="5165" r="9120" b="5347">Yogatama,</wd>

<space/>

<wd l="9173" t="5160" r="9715" b="5347">Jeffrey</wd>

<space/>

<wd l="9763" t="5160" r="10502" b="5347">Flanigan,</wd>

<space/>

</ln>

<ln l="6370" t="5381" r="10507" b="5568" baseLine="5520" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="5381" r="6653" b="5525">and</wd>

<space/>

<wd l="6720" t="5381" r="7152" b="5525">Noah</wd>

<space/>

<wd l="7224" t="5386" r="7368" b="5520">A</wd>

<space/>

<wd l="7440" t="5381" r="7954" b="5525">Smith.</wd>

<space/>

<wd l="8102" t="5381" r="8534" b="5525">2011.</wd>

<space/>

<wd l="8683" t="5381" r="9845" b="5563">Part-of-speech</wd>

<space/>

<wd l="9912" t="5381" r="10507" b="5568">tagging</wd>

<space/>

</ln>

<ln l="6365" t="5602" r="10498" b="5784" baseLine="5736" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="5602" r="6595" b="5746">for</wd>

<space/>

<wd l="6667" t="5602" r="7277" b="5746">Twitter:</wd>

<space/>

<wd l="7406" t="5602" r="8285" b="5770">annotation,</wd>

<space/>

<wd l="8371" t="5602" r="9043" b="5770">features,</wd>

<space/>

<wd l="9134" t="5602" r="9418" b="5746">and</wd>

<space/>

<wd l="9494" t="5602" r="10498" b="5784">experiments.</wd>

<space/>

</ln>

<ln l="6365" t="5818" r="10507" b="6000" baseLine="5957">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="5822" r="6533" b="5957">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6605" t="5818" r="7594" b="6000">Proceedings</wd>

<space/>

<wd l="7675" t="5818" r="7858" b="6000">of</wd>

<space/>

<wd l="7906" t="5818" r="8146" b="5962">the</wd>

<space/>

<wd l="8222" t="5818" r="8573" b="5962">49th</wd>

<space/>

<wd l="8640" t="5818" r="9230" b="5962">Annual</wd>

<space/>

<wd l="9302" t="5822" r="9955" b="6000">Meeting</wd>

<space/>

<wd l="10042" t="5818" r="10224" b="6000">of</wd>

<space/>

<wd l="10272" t="5818" r="10507" b="5962">the</wd>

<space/>

</run>

</ln>

<ln l="6350" t="6038" r="10507" b="6221" baseLine="6178" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6350" t="6043" r="7291" b="6182">Association</wd>

<space/>

<wd l="7320" t="6038" r="7594" b="6221">for</wd>

<space/>

<wd l="7656" t="6038" r="8842" b="6221">Computational</wd>

<space/>

<wd l="8894" t="6043" r="9835" b="6221">Linguistics:</wd>

<space/>

<wd l="9922" t="6043" r="10507" b="6182">Human</wd>

<space/>

</ln>

<ln l="6360" t="6259" r="10243" b="6446" baseLine="6394">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6360" t="6264" r="7157" b="6442">Language</wd>

<space/>

<wd l="7214" t="6259" r="8246" b="6442">Technologies</wd>

<space/>

<wd l="8299" t="6264" r="8741" b="6437">(HLT</wd>

<space/>

</run>

<wd l="8803" t="6259" r="9149" b="6437"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">’11)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="9206" t="6302" r="9653" b="6446">pages</wd>

<space/>

<wd l="9710" t="6259" r="10243" b="6403">42–47.</wd>

</run>

</ln>

</para>

<para l="6149" t="6658" r="10512" b="8117" alignment="justified" li="216" ri="72" spaceBefore="172" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6149" t="6658" r="10498" b="6845" baseLine="6792" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="6658" r="6787" b="6840">Stephen</wd>

<space/>

<wd l="6874" t="6658" r="7253" b="6826">Guo,</wd>

<space/>

<wd l="7349" t="6658" r="8160" b="6845">Ming-Wei</wd>

<space/>

<wd l="8246" t="6658" r="8803" b="6845">Chang,</wd>

<space/>

<wd l="8904" t="6658" r="9187" b="6802">and</wd>

<space/>

<wd l="9264" t="6662" r="9691" b="6802">Emre</wd>

<space/>

<wd l="9778" t="6658" r="10498" b="6802">Kiciman.</wd>

<space/>

</ln>

<ln l="6370" t="6874" r="10512" b="7061" baseLine="7013" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="6874" r="6802" b="7018">2013.</wd>

<space/>

<wd l="6907" t="6878" r="7109" b="7018">To</wd>

<space/>

<wd l="7166" t="6874" r="7478" b="7013">link</wd>

<space/>

<wd l="7536" t="6917" r="7699" b="7018">or</wd>

<space/>

<wd l="7757" t="6893" r="8011" b="7018">not</wd>

<space/>

<wd l="8069" t="6893" r="8218" b="7018">to</wd>

<space/>

<wd l="8280" t="6874" r="8674" b="7018">link?</wd>

<space/>

<wd l="8765" t="6917" r="8851" b="7018">a</wd>

<space/>

<wd l="8914" t="6874" r="9331" b="7061">study</wd>

<space/>

<wd l="9398" t="6917" r="9590" b="7018">on</wd>

<space/>

<wd l="9653" t="6874" r="10512" b="7018">end-to-end</wd>

<space/>

</ln>

<ln l="6365" t="7094" r="10507" b="7282" baseLine="7234">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="7099" r="6850" b="7238">Tweet</wd>

<space/>

<wd l="6931" t="7094" r="7378" b="7282">entity</wd>

<space/>

<wd l="7459" t="7094" r="8064" b="7282">linking.</wd>

<space/>

<wd l="8242" t="7099" r="8410" b="7234">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8486" t="7094" r="9475" b="7277">Proceedings</wd>

<space/>

<wd l="9557" t="7094" r="9739" b="7277">of</wd>

<space/>

<wd l="9792" t="7094" r="10032" b="7238">the</wd>

<space/>

<wd l="10114" t="7094" r="10507" b="7238">2013</wd>

<space/>

</run>

</ln>

<ln l="6374" t="7315" r="10507" b="7498" baseLine="7450" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="7315" r="7272" b="7498">Conference</wd>

<space/>

<wd l="7358" t="7315" r="7541" b="7498">of</wd>

<space/>

<wd l="7589" t="7315" r="7829" b="7459">the</wd>

<space/>

<wd l="7901" t="7315" r="8371" b="7459">North</wd>

<space/>

<wd l="8438" t="7320" r="9221" b="7459">American</wd>

<space/>

<wd l="9312" t="7315" r="9965" b="7498">Chapter</wd>

<space/>

<wd l="10037" t="7315" r="10219" b="7498">of</wd>

<space/>

<wd l="10272" t="7315" r="10507" b="7459">the</wd>

<space/>

</ln>

<ln l="6350" t="7531" r="10507" b="7714" baseLine="7670" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6350" t="7536" r="7291" b="7675">Association</wd>

<space/>

<wd l="7320" t="7531" r="7594" b="7714">for</wd>

<space/>

<wd l="7656" t="7531" r="8842" b="7714">Computational</wd>

<space/>

<wd l="8894" t="7536" r="9835" b="7714">Linguistics:</wd>

<space/>

<wd l="9922" t="7536" r="10507" b="7675">Human</wd>

<space/>

</ln>

<ln l="6360" t="7752" r="10507" b="7939" baseLine="7891">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6360" t="7757" r="7157" b="7934">Language</wd>

<space/>

<wd l="7258" t="7752" r="8285" b="7934">Technologies</wd>

<space/>

<wd l="8386" t="7757" r="9499" b="7930">(NAACL-HLT</wd>

<space/>

</run>

<wd l="9600" t="7752" r="9950" b="7930"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">’13)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="10056" t="7795" r="10507" b="7939">pages</wd>

<space/>

</run>

</ln>

<ln l="6384" t="7973" r="7301" b="8117" baseLine="8107" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="7973" r="7301" b="8117">1020–1030.</wd>

</ln>

</para>

<para l="6144" t="8371" r="10507" b="9389" alignment="justified" li="216" ri="72" spaceBefore="177" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="8371" r="10498" b="8558" baseLine="8506" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="8371" r="6619" b="8558">Edgar</wd>

<space/>

<wd l="6672" t="8371" r="7090" b="8558">Meij,</wd>

<space/>

<wd l="7147" t="8376" r="7733" b="8515">Wouter</wd>

<space/>

<wd l="7781" t="8371" r="8683" b="8554">Weerkamp,</wd>

<space/>

<wd l="8746" t="8371" r="9029" b="8515">and</wd>

<space/>

<wd l="9077" t="8376" r="9744" b="8515">Maarten</wd>

<space/>

<wd l="9797" t="8371" r="9979" b="8515">de</wd>

<space/>

<wd l="10032" t="8371" r="10498" b="8558">Rijke.</wd>

<space/>

</ln>

<ln l="6370" t="8587" r="10502" b="8774" baseLine="8726">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6370" t="8587" r="6802" b="8731">2012.</wd>

<space/>

<wd l="6883" t="8587" r="7478" b="8774">Adding</wd>

<space/>

<wd l="7536" t="8587" r="8304" b="8731">semantics</wd>

<space/>

<wd l="8352" t="8606" r="8506" b="8731">to</wd>

<space/>

<wd l="8554" t="8587" r="9370" b="8774">microblog</wd>

<space/>

<wd l="9413" t="8606" r="9859" b="8770">posts.</wd>

<space/>

<wd l="9946" t="8592" r="10114" b="8726">In</wd>

<space/>

</run>

<wd l="10157" t="8592" r="10502" b="8731" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">Pro-</wd>

</ln>

<ln l="6370" t="8808" r="10507" b="8990" baseLine="8947" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6370" t="8808" r="7061" b="8990">ceedings</wd>

<space/>

<wd l="7114" t="8808" r="7296" b="8990">of</wd>

<space/>

<wd l="7320" t="8808" r="7555" b="8952">the</wd>

<space/>

<wd l="7608" t="8808" r="7982" b="8990">Fifth</wd>

<space/>

<wd l="8021" t="8813" r="8462" b="8952">ACM</wd>

<space/>

<wd l="8496" t="8808" r="9552" b="8952">International</wd>

<space/>

<wd l="9610" t="8808" r="10507" b="8990">Conference</wd>

<space/>

</ln>

<ln l="6370" t="9029" r="10507" b="9216" baseLine="9163">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6370" t="9077" r="6562" b="9173">on</wd>

<space/>

<wd l="6614" t="9029" r="6936" b="9173">Web</wd>

<space/>

<wd l="6979" t="9029" r="7517" b="9173">Search</wd>

<space/>

<wd l="7560" t="9029" r="7867" b="9173">and</wd>

<space/>

<wd l="7896" t="9034" r="8294" b="9173">Data</wd>

<space/>

<wd l="8333" t="9034" r="8909" b="9211">Mining</wd>

<space/>

<wd l="8957" t="9034" r="9605" b="9206">(WSDM</wd>

<space/>

</run>

<wd l="9662" t="9029" r="10008" b="9206"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">’12)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="10056" t="9072" r="10507" b="9216">pages</wd>

<space/>

</run>

</ln>

<ln l="6370" t="9245" r="7099" b="9389" baseLine="9384" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6370" t="9245" r="7099" b="9389">563–572.</wd>

</ln>

</para>

<para l="6144" t="9643" r="10512" b="10709" alignment="justified" li="216" ri="72" spaceBefore="177" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="9643" r="10507" b="9830" baseLine="9782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="9643" r="6686" b="9830">Jeffrey</wd>

<space/>

<wd l="6734" t="9643" r="7685" b="9830">Pennington,</wd>

<space/>

<wd l="7738" t="9643" r="8366" b="9787">Richard</wd>

<space/>

<wd l="8414" t="9643" r="9000" b="9811">Socher,</wd>

<space/>

<wd l="9058" t="9643" r="9341" b="9787">and</wd>

<space/>

<wd l="9389" t="9643" r="10325" b="9826">Christopher</wd>

<space/>

<wd l="10368" t="9648" r="10507" b="9782">D</wd>

<space/>

</ln>

<ln l="6365" t="9864" r="10512" b="10051" baseLine="10003" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6365" t="9864" r="7123" b="10051">Manning.</wd>

<space/>

<wd l="7282" t="9864" r="7714" b="10008">2014.</wd>

<space/>

<wd l="7872" t="9864" r="8414" b="10008">GloVe:</wd>

<space/>

<wd l="8544" t="9864" r="9082" b="10008">Global</wd>

<space/>

<wd l="9154" t="9883" r="9720" b="10008">vectors</wd>

<space/>

<wd l="9797" t="9864" r="10032" b="10008">for</wd>

<space/>

<wd l="10104" t="9864" r="10512" b="10008">word</wd>

<space/>

</ln>

<ln l="6365" t="10085" r="10502" b="10267" baseLine="10219">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6365" t="10085" r="7531" b="10267">representation.</wd>

<space/>

<wd l="7733" t="10090" r="7896" b="10224">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7982" t="10085" r="8971" b="10267">Proceedings</wd>

<space/>

<wd l="9062" t="10085" r="9245" b="10267">of</wd>

<space/>

<wd l="9302" t="10085" r="9538" b="10229">the</wd>

<space/>

<wd l="9629" t="10085" r="10022" b="10229">2014</wd>

<space/>

<wd l="10123" t="10090" r="10502" b="10229">Con-</wd>

</run>

</ln>

<ln l="6331" t="10301" r="10507" b="10483" baseLine="10440" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6331" t="10301" r="6941" b="10483">ference</wd>

<space/>

<wd l="7003" t="10349" r="7190" b="10445">on</wd>

<space/>

<wd l="7243" t="10301" r="8050" b="10483">Empirical</wd>

<space/>

<wd l="8093" t="10301" r="8784" b="10445">Methods</wd>

<space/>

<wd l="8846" t="10306" r="8990" b="10445">in</wd>

<space/>

<wd l="9043" t="10301" r="9667" b="10445">Natural</wd>

<space/>

<wd l="9715" t="10306" r="10507" b="10483">Language</wd>

<space/>

</ln>

<ln l="6365" t="10522" r="9931" b="10709" baseLine="10661">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6365" t="10526" r="7238" b="10704">Processing</wd>

<space/>

<wd l="7296" t="10526" r="8011" b="10699">(EMNLP</wd>

<space/>

</run>

<wd l="8088" t="10522" r="8434" b="10699"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">’14)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="8491" t="10565" r="8938" b="10709">pages</wd>

<space/>

<wd l="9014" t="10522" r="9931" b="10666">1532–1543.</wd>

</run>

</ln>

</para>

<para l="6144" t="10920" r="10507" b="11765" alignment="justified" li="216" ri="72" spaceBefore="176" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="10920" r="10498" b="11064" baseLine="11059" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10925" r="6629" b="11064">Lance</wd>

<space/>

<wd l="6720" t="10925" r="6902" b="11064">A.</wd>

<space/>

<wd l="6998" t="10920" r="7776" b="11064">Ramshaw</wd>

<space/>

<wd l="7872" t="10920" r="8155" b="11064">and</wd>

<space/>

<wd l="8242" t="10920" r="8914" b="11064">Mitchell</wd>

<space/>

<wd l="9005" t="10925" r="9130" b="11064">P.</wd>

<space/>

<wd l="9226" t="10925" r="9864" b="11064">Marcus.</wd>

<space/>

<wd l="10080" t="10920" r="10498" b="11064">1995.</wd>

<space/>

</ln>

<ln l="6365" t="11141" r="10498" b="11328" baseLine="11275" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="11146" r="6715" b="11285">Text</wd>

<space/>

<wd l="6773" t="11141" r="7507" b="11328">chunking</wd>

<space/>

<wd l="7570" t="11141" r="7997" b="11328">using</wd>

<space/>

<wd l="8059" t="11141" r="9754" b="11285">transformation-based</wd>

<space/>

<wd l="9806" t="11141" r="10498" b="11328">learning.</wd>

<space/>

</ln>

<ln l="6365" t="11357" r="10507" b="11539" baseLine="11496">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="11362" r="6533" b="11496">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6629" t="11357" r="7618" b="11539">Proceedings</wd>

<space/>

<wd l="7723" t="11357" r="7906" b="11539">of</wd>

<space/>

<wd l="7958" t="11362" r="8338" b="11501">ACL</wd>

<space/>

<wd l="8443" t="11357" r="8875" b="11501">Third</wd>

<space/>

<wd l="8976" t="11357" r="9754" b="11539">Workshop</wd>

<space/>

<wd l="9864" t="11405" r="10051" b="11501">on</wd>

<space/>

<wd l="10171" t="11362" r="10507" b="11539">Very</wd>

<space/>

</run>

</ln>

<ln l="6360" t="11578" r="8702" b="11765" baseLine="11717">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6360" t="11582" r="6830" b="11760">Large</wd>

<space/>

</run>

<wd l="6888" t="11582" r="7608" b="11760"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Corpora</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7666" t="11621" r="8112" b="11765">pages</wd>

<space/>

<wd l="8174" t="11578" r="8702" b="11722">82–94.</wd>

</run>

</ln>

</para>

<para l="6149" t="11976" r="10512" b="13474" alignment="justified" li="216" ri="72" spaceBefore="173" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6149" t="11976" r="10502" b="12158" baseLine="12115" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="11976" r="6898" b="12158">Giuseppe</wd>

<space/>

<wd l="7027" t="11976" r="7531" b="12144">Rizzo,</wd>

<space/>

<wd l="7685" t="11981" r="8333" b="12158">Amparo</wd>

<space/>

<wd l="8467" t="11976" r="9221" b="12120">Elizabeth</wd>

<space/>

<wd l="9350" t="11976" r="9763" b="12120">Cano</wd>

<space/>

<wd l="9893" t="11981" r="10502" b="12144">Basave,</wd>

<space/>

</ln>

<ln l="6365" t="12197" r="10502" b="12384" baseLine="12331" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="12197" r="6922" b="12341">Bianca</wd>

<space/>

<wd l="6979" t="12197" r="7584" b="12365">Pereira,</wd>

<space/>

<wd l="7656" t="12197" r="8246" b="12341">Andrea</wd>

<space/>

<wd l="8304" t="12202" r="8803" b="12384">Varga,</wd>

<space/>

<wd l="8875" t="12197" r="9576" b="12341">Matthew</wd>

<space/>

<wd l="9638" t="12202" r="10142" b="12365">Rowe,</wd>

<space/>

<wd l="10214" t="12197" r="10502" b="12336">Mi-</wd>

</ln>

<ln l="6365" t="12413" r="10507" b="12600" baseLine="12552" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="12413" r="6605" b="12557">lan</wd>

<space/>

<wd l="6667" t="12413" r="7498" b="12581">Stankovic,</wd>

<space/>

<wd l="7565" t="12413" r="7848" b="12557">and</wd>

<space/>

<wd l="7901" t="12413" r="8602" b="12557">Aba-Sah</wd>

<space/>

<wd l="8654" t="12413" r="9254" b="12557">Dadzie.</wd>

<space/>

<wd l="9360" t="12413" r="9792" b="12557">2015.</wd>

<space/>

<wd l="9893" t="12413" r="10507" b="12600">Making</wd>

<space/>

</ln>

<ln l="6374" t="12634" r="10502" b="12816" baseLine="12773" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="12677" r="6792" b="12778">sense</wd>

<space/>

<wd l="6874" t="12634" r="7046" b="12778">of</wd>

<space/>

<wd l="7104" t="12634" r="7973" b="12816">microposts</wd>

<space/>

<wd l="8064" t="12634" r="9571" b="12816">(#Microposts2015)</wd>

<space/>

<wd l="9653" t="12634" r="10186" b="12778">named</wd>

<space/>

<wd l="10262" t="12677" r="10502" b="12778">en-</wd>

</ln>

<ln l="6365" t="12854" r="10512" b="13042" baseLine="12989" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="12854" r="6624" b="13042">tity</wd>

<space/>

<wd l="6701" t="12854" r="7608" b="13042">recognition</wd>

<space/>

<wd l="7685" t="12854" r="7968" b="12998">and</wd>

<space/>

<wd l="8040" t="12854" r="8602" b="13042">linking</wd>

<space/>

<wd l="8688" t="12854" r="9307" b="13032">(NEEL)</wd>

<space/>

<wd l="9394" t="12854" r="10190" b="13042">challenge.</wd>

<space/>

<wd l="10344" t="12859" r="10512" b="12994">In</wd>

<space/>

</ln>

<ln l="6365" t="13070" r="10502" b="13253" baseLine="13210" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="13070" r="6614" b="13214">5th</wd>

<space/>

<wd l="6677" t="13070" r="7454" b="13253">Workshop</wd>

<space/>

<wd l="7512" t="13118" r="7704" b="13214">on</wd>

<space/>

<wd l="7752" t="13070" r="8362" b="13253">Making</wd>

<space/>

<wd l="8414" t="13075" r="8866" b="13214">Sense</wd>

<space/>

<wd l="8918" t="13070" r="9101" b="13253">of</wd>

<space/>

<wd l="9115" t="13075" r="10008" b="13253">Microposts</wd>

<space/>

<wd l="10061" t="13070" r="10502" b="13248">(#Mi-</wd>

</ln>

<ln l="6370" t="13291" r="7531" b="13474" baseLine="13430">

<wd l="6370" t="13291" r="7531" b="13474"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">croposts2015)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="13690" r="10541" b="14530" alignment="justified" li="216" ri="72" spaceBefore="176" spaceAfter="35" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="13690" r="10502" b="13877" baseLine="13829" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13690" r="6600" b="13877">Ikuya</wd>

<space/>

<wd l="6667" t="13690" r="7354" b="13858">Yamada,</wd>

<space/>

<wd l="7435" t="13690" r="8059" b="13834">Hideaki</wd>

<space/>

<wd l="8131" t="13690" r="8741" b="13858">Takeda,</wd>

<space/>

<wd l="8827" t="13690" r="9110" b="13834">and</wd>

<space/>

<wd l="9178" t="13690" r="9994" b="13877">Yoshiyasu</wd>

<space/>

<wd l="10066" t="13690" r="10502" b="13834">Take-</wd>

</ln>

<ln l="6365" t="13910" r="10512" b="14098" baseLine="14045" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="13910" r="6677" b="14098">fuji.</wd>

<space/>

<wd l="6821" t="13910" r="7253" b="14054">2015.</wd>

<space/>

<wd l="7387" t="13915" r="7632" b="14050">An</wd>

<space/>

<wd l="7704" t="13910" r="8563" b="14054">end-to-end</wd>

<space/>

<wd l="8635" t="13910" r="9082" b="14098">entity</wd>

<space/>

<wd l="9149" t="13910" r="9710" b="14098">linking</wd>

<space/>

<wd l="9787" t="13910" r="10512" b="14093">approach</wd>

<space/>

</ln>

<ln l="6365" t="14126" r="10541" b="14309" baseLine="14266">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="14126" r="6595" b="14270">for</wd>

<space/>

<wd l="6672" t="14131" r="7267" b="14270">Tweets.</wd>

<space/>

<wd l="7435" t="14131" r="7598" b="14266">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7675" t="14126" r="7925" b="14270">5th</wd>

<space/>

<wd l="8016" t="14126" r="8789" b="14309">Workshop</wd>

<space/>

<wd l="8875" t="14174" r="9062" b="14270">on</wd>

<space/>

<wd l="9139" t="14126" r="9749" b="14309">Making</wd>

<space/>

<wd l="9826" t="14131" r="10277" b="14270">Sense</wd>

<space/>

<wd l="10358" t="14126" r="10541" b="14309">of</wd>

<space/>

</run>

</ln>

<ln l="6360" t="14347" r="8909" b="14530" baseLine="14486">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6360" t="14352" r="7253" b="14530">Microposts</wd>

<space/>

<wd l="7306" t="14347" r="8352" b="14530">(#Microposts</wd>

<space/>

</run>

<wd l="8405" t="14347" r="8909" b="14525"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<dd l="5738" t="15746" r="6233" b="15975">

<para l="5771" t="15792" r="6200" b="15946" alignment="left" lsp="exactly" lspExact="223" language="en">

<ln l="5837" t="15792" r="6134" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="15">

<wd l="5837" t="15792" r="6134" b="15946">140</wd>

</ln>

</para>

</dd>

</body>

</page>

</document>

