<?xml version="1.0" encoding="UTF-16"?>

<!--XML document generated using OCR technology from Nuance Communications, Inc.-->

<document xmlns="http://www.scansoft.com/omnipage/xml/ssdoc-schema3.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4310.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1433" marginTop="1360" marginRight="1378" marginBottom="358" offsetX="-26" offsetY="-18" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1433" t="1360" r="10531" b="4092">

<column l="1433" t="1360" r="10531" b="4092">

<para l="1906" t="1435" r="10046" b="2016" alignment="centered" spaceBefore="34" lsp="exactly" lspExact="317" language="en">

<ln l="1906" t="1435" r="10046" b="1699" baseLine="1632" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="1906" t="1440" r="2880" b="1699">Hallym:</wd>

<space/>

<wd l="2990" t="1440" r="3864" b="1646">Named</wd>

<space/>

<wd l="3941" t="1435" r="4704" b="1699">Entity</wd>

<space/>

<wd l="4781" t="1435" r="6245" b="1699">Recognition</wd>

<space/>

<wd l="6322" t="1498" r="6619" b="1642">on</wd>

<space/>

<wd l="6696" t="1435" r="7594" b="1642">Twitter</wd>

<space/>

<wd l="7670" t="1435" r="8203" b="1642">with</wd>

<space/>

<wd l="8285" t="1440" r="9278" b="1642">Induced</wd>

<space/>

<wd l="9360" t="1440" r="10046" b="1642">Word
</wd>

</ln>

<ln l="5050" t="1752" r="6902" b="2016" baseLine="1949" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="5050" t="1752" r="6902" b="2016">Representation</wd>

</ln>

</para>

<para l="3240" t="2510" r="8650" b="2731" alignment="centered" li="1800" spaceBefore="432" lsp="exactly" lspExact="274" language="en">

<tabs position="3240"/>

<ln l="3240" t="2510" r="8650" b="2731" baseLine="2672" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3240" t="2510" r="4147" b="2683">Eun-Suk</wd>

<space/>

<wd l="4205" t="2515" r="4728" b="2731">Yang</wd>

<tab position="4728"/>

<wd l="7286" t="2510" r="8136" b="2731">Yu-Seop</wd>

<space/>

<wd l="8203" t="2510" r="8650" b="2678">Kim</wd>

</ln>

</para>

<para l="3096" t="2798" r="8851" b="3014" alignment="centered" li="1656" spaceBefore="8" lsp="exactly" lspExact="278" language="en">

<tabs position="3096"/>

<ln l="3096" t="2798" r="8851" b="3014" baseLine="2953" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3096" t="2798" r="3816" b="3014">Hallym</wd>

<space/>

<wd l="3874" t="2798" r="4867" b="3014">University</wd>

<tab position="4867"/>

<wd l="7080" t="2798" r="7795" b="3014">Hallym</wd>

<space/>

<wd l="7858" t="2798" r="8851" b="3014">University</wd>

</ln>

</para>

<para l="2635" t="3086" r="9389" b="3288" alignment="centered" li="1152" spaceBefore="15" spaceAfter="801" lsp="exactly" lspExact="253" language="en">

<tabs position="2635"/>

<ln l="2635" t="3086" r="9389" b="3288" baseLine="3232" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="-1">

<wd l="2635" t="3086" r="5347" b="3288">esyang219@gmail.com</wd>

<tab position="5347"/>

<wd l="6542" t="3086" r="9389" b="3288">yskim01@hallym.ac.kr</wd>

</ln>

</para>

</column>

</section>

<section l="1433" t="4092" r="10531" b="15336">

<column l="1433" t="4092" r="5820" b="15336">

<para l="3178" t="4142" r="4070" b="4315" alignment="centered" spaceBefore="3" lsp="exactly" lspExact="274" language="en">

<ln l="3178" t="4142" r="4070" b="4315" baseLine="4306" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3178" t="4142" r="4070" b="4315">Abstract</wd>

</ln>

</para>

<para l="1781" t="4622" r="5467" b="9158" alignment="justified" li="288" ri="360" spaceBefore="203" lsp="exactly" lspExact="270" language="en">

<ln l="1781" t="4622" r="5453" b="4824" baseLine="4771" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="4622" r="2410" b="4781">Twitter</wd>

<space/>

<wd l="2467" t="4622" r="2606" b="4781">is</wd>

<space/>

<wd l="2683" t="4675" r="2779" b="4781">a</wd>

<space/>

<wd l="2837" t="4646" r="3211" b="4824">type</wd>

<space/>

<wd l="3278" t="4622" r="3470" b="4781">of</wd>

<space/>

<wd l="3528" t="4622" r="4027" b="4781">social</wd>

<space/>

<wd l="4090" t="4622" r="4627" b="4781">media</wd>

<space/>

<wd l="4690" t="4622" r="5016" b="4781">that</wd>

<space/>

<wd l="5083" t="4675" r="5453" b="4781">con-</wd>

</ln>

<ln l="1781" t="4891" r="5453" b="5093" baseLine="5045" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="4891" r="2184" b="5050">tains</wd>

<space/>

<wd l="2275" t="4891" r="2890" b="5050">diverse</wd>

<space/>

<wd l="2971" t="4891" r="4253" b="5093">user-generated</wd>

<space/>

<wd l="4325" t="4915" r="4781" b="5050">texts.</wd>

<space/>

<wd l="4930" t="4891" r="5453" b="5050">Tradi-</wd>

</ln>

<ln l="1781" t="5165" r="5467" b="5366" baseLine="5314" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="5165" r="2275" b="5323">tional</wd>

<space/>

<wd l="2357" t="5165" r="2981" b="5323">models</wd>

<space/>

<wd l="3072" t="5218" r="3331" b="5323">are</wd>

<space/>

<wd l="3413" t="5189" r="3691" b="5323">not</wd>

<space/>

<wd l="3773" t="5165" r="4666" b="5366">applicable</wd>

<space/>

<wd l="4742" t="5189" r="4910" b="5323">to</wd>

<space/>

<wd l="4992" t="5189" r="5467" b="5323">tweet</wd>

<space/>

</ln>

<ln l="1786" t="5434" r="5453" b="5635" baseLine="5587" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="5434" r="2146" b="5592">data</wd>

<space/>

<wd l="2208" t="5434" r="2894" b="5592">because</wd>

<space/>

<wd l="2962" t="5434" r="3226" b="5592">the</wd>

<space/>

<wd l="3288" t="5458" r="3614" b="5592">text</wd>

<space/>

<wd l="3686" t="5434" r="4085" b="5635">style</wd>

<space/>

<wd l="4152" t="5434" r="4286" b="5592">is</wd>

<space/>

<wd l="4358" t="5458" r="4637" b="5592">not</wd>

<space/>

<wd l="4704" t="5486" r="4872" b="5592">as</wd>

<space/>

<wd l="4949" t="5486" r="5453" b="5635">gram-</wd>

</ln>

<ln l="1781" t="5707" r="5458" b="5866" baseLine="5856" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="5707" r="2789" b="5866">maticalized</wd>

<space/>

<wd l="2880" t="5760" r="3048" b="5866">as</wd>

<space/>

<wd l="3144" t="5707" r="3470" b="5866">that</wd>

<space/>

<wd l="3562" t="5707" r="3754" b="5866">of</wd>

<space/>

<wd l="3826" t="5707" r="4704" b="5866">newswire.</wd>

<space/>

<wd l="4882" t="5712" r="5064" b="5861">In</wd>

<space/>

<wd l="5150" t="5707" r="5458" b="5866">this</wd>

<space/>

</ln>

<ln l="1781" t="5976" r="5467" b="6178" baseLine="6125" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="6029" r="2299" b="6178">paper,</wd>

<space/>

<wd l="2381" t="6029" r="2635" b="6134">we</wd>

<space/>

<wd l="2707" t="6000" r="3504" b="6134">construct</wd>

<space/>

<wd l="3566" t="5976" r="4013" b="6134">word</wd>

<space/>

<wd l="4085" t="5976" r="5126" b="6178">embeddings</wd>

<space/>

<wd l="5198" t="5976" r="5467" b="6134">via</wd>

<space/>

</ln>

<ln l="1786" t="6245" r="5467" b="6446" baseLine="6398" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="6245" r="2611" b="6403">canonical</wd>

<space/>

<wd l="2717" t="6245" r="3658" b="6403">correlation</wd>

<space/>

<wd l="3758" t="6245" r="4450" b="6446">analysis</wd>

<space/>

<wd l="4565" t="6250" r="5141" b="6442">(CCA)</wd>

<space/>

<wd l="5251" t="6298" r="5467" b="6403">on</wd>

<space/>

</ln>

<ln l="1786" t="6518" r="5467" b="6677" baseLine="6667" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="6571" r="1882" b="6677">a</wd>

<space/>

<wd l="1963" t="6518" r="3062" b="6677">considerable</wd>

<space/>

<wd l="3149" t="6542" r="3802" b="6677">amount</wd>

<space/>

<wd l="3888" t="6518" r="4080" b="6677">of</wd>

<space/>

<wd l="4147" t="6542" r="4622" b="6677">tweet</wd>

<space/>

<wd l="4709" t="6518" r="5069" b="6677">data</wd>

<space/>

<wd l="5155" t="6518" r="5467" b="6677">and</wd>

<space/>

</ln>

<ln l="1790" t="6787" r="5453" b="6989" baseLine="6941" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1790" t="6787" r="2232" b="6946">show</wd>

<space/>

<wd l="2309" t="6787" r="2573" b="6946">the</wd>

<space/>

<wd l="2654" t="6787" r="3326" b="6989">efficacy</wd>

<space/>

<wd l="3408" t="6787" r="3595" b="6946">of</wd>

<space/>

<wd l="3658" t="6787" r="4104" b="6946">word</wd>

<space/>

<wd l="4176" t="6787" r="5453" b="6989">representation.</wd>

<space/>

</ln>

<ln l="1781" t="7061" r="5453" b="7262" baseLine="7210" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="7061" r="2453" b="7219">Besides</wd>

<space/>

<wd l="2573" t="7061" r="3019" b="7219">word</wd>

<space/>

<wd l="3134" t="7061" r="4142" b="7262">embedding,</wd>

<space/>

<wd l="4282" t="7114" r="4536" b="7219">we</wd>

<space/>

<wd l="4651" t="7114" r="4939" b="7219">use</wd>

<space/>

<wd l="5054" t="7085" r="5453" b="7262">part-</wd>

</ln>

<ln l="1786" t="7330" r="5467" b="7531" baseLine="7483" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="7330" r="2630" b="7531">of-speech</wd>

<space/>

<wd l="2707" t="7334" r="3230" b="7526">(POS)</wd>

<space/>

<wd l="3307" t="7354" r="3706" b="7531">tags,</wd>

<space/>

<wd l="3792" t="7330" r="4450" b="7517">chunks,</wd>

<space/>

<wd l="4536" t="7330" r="4848" b="7488">and</wd>

<space/>

<wd l="4915" t="7330" r="5467" b="7488">brown</wd>

<space/>

</ln>

<ln l="1786" t="7603" r="5453" b="7805" baseLine="7752" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="7603" r="2438" b="7762">clusters</wd>

<space/>

<wd l="2544" t="7603" r="3235" b="7762">induced</wd>

<space/>

<wd l="3331" t="7603" r="3758" b="7762">from</wd>

<space/>

<wd l="3850" t="7603" r="4757" b="7805">Wikipedia</wd>

<space/>

<wd l="4853" t="7656" r="5021" b="7762">as</wd>

<space/>

<wd l="5126" t="7603" r="5453" b="7762">fea-</wd>

</ln>

<ln l="1781" t="7872" r="5467" b="8074" baseLine="8026" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="7896" r="2246" b="8030">tures.</wd>

<space/>

<wd l="2395" t="7877" r="2866" b="8059">Here,</wd>

<space/>

<wd l="2962" t="7925" r="3211" b="8030">we</wd>

<space/>

<wd l="3298" t="7872" r="4018" b="8030">describe</wd>

<space/>

<wd l="4104" t="7925" r="4392" b="8030">our</wd>

<space/>

<wd l="4474" t="7896" r="5074" b="8074">system</wd>

<space/>

<wd l="5155" t="7872" r="5467" b="8030">and</wd>

<space/>

</ln>

<ln l="1781" t="8146" r="5467" b="8347" baseLine="8294" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="8170" r="2414" b="8347">present</wd>

<space/>

<wd l="2506" t="8146" r="2770" b="8304">the</wd>

<space/>

<wd l="2866" t="8146" r="3250" b="8304">final</wd>

<space/>

<wd l="3346" t="8146" r="3907" b="8304">results</wd>

<space/>

<wd l="4013" t="8146" r="4488" b="8347">along</wd>

<space/>

<wd l="4584" t="8146" r="4973" b="8304">with</wd>

<space/>

<wd l="5064" t="8146" r="5467" b="8304">their</wd>

<space/>

</ln>

<ln l="1786" t="8414" r="5462" b="8616" baseLine="8568" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="8414" r="2525" b="8616">analysis.</wd>

<space/>

<wd l="2635" t="8419" r="2971" b="8573">Our</wd>

<space/>

<wd l="3029" t="8414" r="3571" b="8573">model</wd>

<space/>

<wd l="3643" t="8414" r="4373" b="8573">achieves</wd>

<space/>

<wd l="4450" t="8467" r="4646" b="8573">an</wd>

<space/>

<wd l="4714" t="8419" r="4920" b="8568">F1</wd>

<space/>

<wd l="5016" t="8467" r="5462" b="8573">score</wd>

<space/>

</ln>

<ln l="1786" t="8688" r="5453" b="8890" baseLine="8837" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="8688" r="1978" b="8846">of</wd>

<space/>

<wd l="2069" t="8693" r="2726" b="8846">37.21%</wd>

<space/>

<wd l="2837" t="8688" r="3230" b="8846">with</wd>

<space/>

<wd l="3331" t="8688" r="3821" b="8890">entity</wd>

<space/>

<wd l="3926" t="8712" r="4382" b="8890">types</wd>

<space/>

<wd l="4498" t="8688" r="4805" b="8846">and</wd>

<space/>

<wd l="4910" t="8688" r="5453" b="8846">distin-</wd>

</ln>

<ln l="1786" t="8957" r="5328" b="9158" baseLine="9106" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="8957" r="2429" b="9158">guishes</wd>

<space/>

<wd l="2496" t="8957" r="3154" b="9115">53.01%</wd>

<space/>

<wd l="3221" t="8957" r="3413" b="9115">of</wd>

<space/>

<wd l="3451" t="8957" r="3720" b="9115">the</wd>

<space/>

<wd l="3778" t="8957" r="4267" b="9158">entity</wd>

<space/>

<wd l="4325" t="8957" r="5328" b="9115">boundaries.</wd>

</ln>

</para>

<para l="1454" t="9413" r="3091" b="9586" alignment="left" spaceBefore="208" lsp="exactly" lspExact="274" language="en">

<ln l="1454" t="9413" r="3091" b="9586" baseLine="9581" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="1454" t="9413" r="1550" b="9581">1</wd>

<space/>

<wd l="1805" t="9413" r="3091" b="9586">Introduction</wd>

</ln>

</para>

<para l="1440" t="9845" r="5803" b="11126" alignment="justified" spaceBefore="145" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="9845" r="5794" b="10046" baseLine="9998" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="9845" r="2074" b="10003">Named</wd>

<space/>

<wd l="2136" t="9845" r="2621" b="10046">entity</wd>

<space/>

<wd l="2688" t="9845" r="3682" b="10046">recognition</wd>

<space/>

<wd l="3749" t="9850" r="4310" b="10042">(NER)</wd>

<space/>

<wd l="4382" t="9845" r="4517" b="10003">is</wd>

<space/>

<wd l="4589" t="9898" r="4685" b="10003">a</wd>

<space/>

<wd l="4742" t="9845" r="5093" b="10003">task</wd>

<space/>

<wd l="5155" t="9845" r="5347" b="10003">of</wd>

<space/>

<wd l="5400" t="9845" r="5794" b="10003">find-</wd>

</ln>

<ln l="1440" t="10118" r="5794" b="10320" baseLine="10267" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10118" r="1714" b="10320">ing</wd>

<space/>

<wd l="1795" t="10118" r="2107" b="10277">and</wd>

<space/>

<wd l="2179" t="10118" r="3115" b="10320">classifying</wd>

<space/>

<wd l="3192" t="10171" r="3739" b="10277">names</wd>

<space/>

<wd l="3826" t="10118" r="4018" b="10277">of</wd>

<space/>

<wd l="4070" t="10118" r="4651" b="10320">things,</wd>

<space/>

<wd l="4747" t="10118" r="5136" b="10277">such</wd>

<space/>

<wd l="5213" t="10171" r="5381" b="10277">as</wd>

<space/>

<wd l="5458" t="10171" r="5794" b="10320">per-</wd>

</ln>

<ln l="1450" t="10387" r="5803" b="10589" baseLine="10541" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1450" t="10440" r="1786" b="10574">son,</wd>

<space/>

<wd l="1872" t="10387" r="2616" b="10574">location,</wd>

<space/>

<wd l="2702" t="10387" r="3014" b="10546">and</wd>

<space/>

<wd l="3086" t="10387" r="4214" b="10589">organization,</wd>

<space/>

<wd l="4301" t="10387" r="4771" b="10589">given</wd>

<space/>

<wd l="4843" t="10440" r="4939" b="10546">a</wd>

<space/>

<wd l="5016" t="10440" r="5803" b="10589">sequence</wd>

<space/>

</ln>

<ln l="1445" t="10661" r="5794" b="10862" baseLine="10810" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="10661" r="1637" b="10819">of</wd>

<space/>

<wd l="1685" t="10661" r="2261" b="10819">words.</wd>

<space/>

<wd l="2366" t="10666" r="2803" b="10819">NER</wd>

<space/>

<wd l="2866" t="10661" r="3005" b="10819">is</wd>

<space/>

<wd l="3082" t="10714" r="3178" b="10819">a</wd>

<space/>

<wd l="3240" t="10714" r="3619" b="10862">very</wd>

<space/>

<wd l="3686" t="10661" r="4536" b="10862">important</wd>

<space/>

<wd l="4608" t="10661" r="5256" b="10819">subtask</wd>

<space/>

<wd l="5323" t="10661" r="5515" b="10819">of</wd>

<space/>

<wd l="5563" t="10661" r="5794" b="10814">in-</wd>

</ln>

<ln l="1440" t="10930" r="3672" b="11126" baseLine="11083" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10930" r="2304" b="11088">formation</wd>

<space/>

<wd l="2362" t="10930" r="3226" b="11088">extraction</wd>

<space/>

<wd l="3288" t="10934" r="3672" b="11126">(IE).</wd>

</ln>

</para>

<para l="1440" t="11203" r="5808" b="14107" alignment="justified" spaceBefore="11" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="11203" r="5803" b="11405" baseLine="11352" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11203" r="1867" b="11362">With</wd>

<space/>

<wd l="1987" t="11203" r="2251" b="11362">the</wd>

<space/>

<wd l="2376" t="11203" r="3494" b="11405">development</wd>

<space/>

<wd l="3614" t="11203" r="3806" b="11362">of</wd>

<space/>

<wd l="3912" t="11203" r="4176" b="11362">the</wd>

<space/>

<wd l="4296" t="11208" r="5021" b="11390">Internet,</wd>

<space/>

<wd l="5170" t="11256" r="5266" b="11362">a</wd>

<space/>

<wd l="5381" t="11203" r="5803" b="11405">huge</wd>

<space/>

</ln>

<ln l="1445" t="11472" r="5803" b="11674" baseLine="11621" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="11496" r="2098" b="11630">amount</wd>

<space/>

<wd l="2222" t="11472" r="2410" b="11630">of</wd>

<space/>

<wd l="2520" t="11472" r="3552" b="11630">information</wd>

<space/>

<wd l="3672" t="11472" r="3955" b="11630">has</wd>

<space/>

<wd l="4085" t="11472" r="4498" b="11630">been</wd>

<space/>

<wd l="4622" t="11472" r="5467" b="11674">generated</wd>

<space/>

<wd l="5587" t="11472" r="5803" b="11674">by</wd>

<space/>

</ln>

<ln l="1440" t="11746" r="5794" b="11947" baseLine="11894" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11798" r="1930" b="11904">users.</wd>

<space/>

<wd l="2136" t="11746" r="2477" b="11904">The</wd>

<space/>

<wd l="2573" t="11746" r="3605" b="11904">information</wd>

<space/>

<wd l="3706" t="11746" r="4550" b="11947">generated</wd>

<space/>

<wd l="4651" t="11798" r="4867" b="11904">on</wd>

<space/>

<wd l="4963" t="11746" r="5227" b="11904">the</wd>

<space/>

<wd l="5323" t="11750" r="5794" b="11904">Inter-</wd>

</ln>

<ln l="1440" t="12014" r="5808" b="12216" baseLine="12163" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="12038" r="1752" b="12202">net,</wd>

<space/>

<wd l="1819" t="12014" r="2822" b="12216">particularly</wd>

<space/>

<wd l="2885" t="12067" r="3101" b="12173">on</wd>

<space/>

<wd l="3163" t="12014" r="3662" b="12173">social</wd>

<space/>

<wd l="3720" t="12014" r="4258" b="12173">media</wd>

<space/>

<wd l="4320" t="12019" r="4742" b="12216">(e.g.,</wd>

<space/>

<wd l="4810" t="12014" r="5438" b="12173">Twitter</wd>

<space/>

<wd l="5496" t="12014" r="5808" b="12173">and</wd>

<space/>

</ln>

<ln l="1440" t="12283" r="5794" b="12485" baseLine="12437" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="12283" r="2400" b="12480">Facebook),</wd>

<space/>

<wd l="2482" t="12283" r="3202" b="12442">includes</wd>

<space/>

<wd l="3278" t="12336" r="3658" b="12485">very</wd>

<space/>

<wd l="3734" t="12283" r="4349" b="12442">diverse</wd>

<space/>

<wd l="4426" t="12283" r="4738" b="12442">and</wd>

<space/>

<wd l="4800" t="12283" r="5270" b="12485">noisy</wd>

<space/>

<wd l="5342" t="12307" r="5794" b="12442">texts.</wd>

<space/>

</ln>

<ln l="1440" t="12557" r="5794" b="12758" baseLine="12706" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="12557" r="1781" b="12715">The</wd>

<space/>

<wd l="1843" t="12557" r="2491" b="12715">volume</wd>

<space/>

<wd l="2558" t="12557" r="2750" b="12715">of</wd>

<space/>

<wd l="2798" t="12557" r="3427" b="12715">Twitter</wd>

<space/>

<wd l="3490" t="12557" r="3850" b="12715">data</wd>

<space/>

<wd l="3907" t="12557" r="4190" b="12715">has</wd>

<space/>

<wd l="4262" t="12557" r="5088" b="12715">increased</wd>

<space/>

<wd l="5146" t="12557" r="5794" b="12758">rapidly,</wd>

<space/>

</ln>

<ln l="1445" t="12792" r="5794" b="13027" baseLine="12977">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="12826" r="1757" b="12984">and</wd>

<space/>

<wd l="1848" t="12826" r="2328" b="12984">about</wd>

<space/>

<wd l="2419" t="12826" r="2736" b="12984">500</wd>

<space/>

<wd l="2827" t="12826" r="3461" b="12984">million</wd>

<space/>

<wd l="3547" t="12850" r="4094" b="12984">tweets</wd>

<space/>

<wd l="4195" t="12878" r="4454" b="12984">are</wd>

<space/>

<wd l="4550" t="12850" r="4896" b="12984">sent</wd>

<space/>

<wd l="4982" t="12878" r="5266" b="13027">per</wd>

<space/>

</run>

<wd l="5352" t="12792" r="5794" b="13027"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">day</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">1</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

</ln>

<ln l="1440" t="13099" r="5808" b="13301" baseLine="13248" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13104" r="1622" b="13253">In</wd>

<space/>

<wd l="1718" t="13123" r="2256" b="13258">recent</wd>

<space/>

<wd l="2352" t="13152" r="2856" b="13301">years,</wd>

<space/>

<wd l="2976" t="13099" r="3605" b="13258">Twitter</wd>

<space/>

<wd l="3706" t="13099" r="4066" b="13258">data</wd>

<space/>

<wd l="4162" t="13099" r="4565" b="13258">have</wd>

<space/>

<wd l="4670" t="13099" r="5611" b="13258">considered</wd>

<space/>

<wd l="5712" t="13152" r="5808" b="13258">a</wd>

<space/>

</ln>

<ln l="1440" t="13368" r="5803" b="13570" baseLine="13522" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13421" r="1795" b="13526">new</wd>

<space/>

<wd l="1886" t="13421" r="2448" b="13526">source</wd>

<space/>

<wd l="2530" t="13368" r="2702" b="13522">in</wd>

<space/>

<wd l="2779" t="13392" r="3326" b="13526">nature</wd>

<space/>

<wd l="3413" t="13368" r="3725" b="13526">and</wd>

<space/>

<wd l="3802" t="13368" r="4776" b="13526">researchers</wd>

<space/>

<wd l="4867" t="13421" r="5131" b="13526">are</wd>

<space/>

<wd l="5213" t="13368" r="5803" b="13570">paying</wd>

<space/>

</ln>

<ln l="1440" t="13642" r="5794" b="13838" baseLine="13790" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13642" r="2266" b="13800">increased</wd>

<space/>

<wd l="2352" t="13642" r="3115" b="13800">attention</wd>

<space/>

<wd l="3197" t="13666" r="3360" b="13800">to</wd>

<space/>

<wd l="3451" t="13642" r="3888" b="13800">them</wd>

<space/>

<wd l="3979" t="13642" r="4627" b="13838">(Bollen</wd>

<space/>

<wd l="4714" t="13666" r="4867" b="13800">et</wd>

<space/>

<wd l="4954" t="13642" r="5208" b="13829">al.,</wd>

<space/>

<wd l="5314" t="13646" r="5794" b="13829">2011;</wd>

<space/>

</ln>

<ln l="1440" t="13910" r="4382" b="14107" baseLine="14064" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13910" r="2630" b="14069">Mathioudakis</wd>

<space/>

<wd l="2698" t="13910" r="3010" b="14069">and</wd>

<space/>

<wd l="3067" t="13910" r="3768" b="14098">Koudas,</wd>

<space/>

<wd l="3835" t="13915" r="4382" b="14107">2010).</wd>

</ln>

</para>

<para l="1440" t="14184" r="5808" b="14928" alignment="justified" spaceBefore="1" spaceAfter="102" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="14184" r="5808" b="14386" baseLine="14333" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="14184" r="2069" b="14342">Twitter</wd>

<space/>

<wd l="2107" t="14184" r="2246" b="14342">is</wd>

<space/>

<wd l="2299" t="14237" r="2395" b="14342">a</wd>

<space/>

<wd l="2434" t="14208" r="2808" b="14386">type</wd>

<space/>

<wd l="2856" t="14184" r="3048" b="14342">of</wd>

<space/>

<wd l="3072" t="14184" r="4354" b="14386">microblogging</wd>

<space/>

<wd l="4411" t="14184" r="5016" b="14342">service</wd>

<space/>

<wd l="5059" t="14184" r="5232" b="14338">in</wd>

<space/>

<wd l="5270" t="14184" r="5808" b="14342">which</wd>

<space/>

</ln>

<ln l="1440" t="14453" r="5803" b="14654" baseLine="14602" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="14506" r="1882" b="14611">users</wd>

<space/>

<wd l="1973" t="14506" r="2237" b="14611">are</wd>

<space/>

<wd l="2323" t="14453" r="3005" b="14611">allowed</wd>

<space/>

<wd l="3082" t="14477" r="3250" b="14611">to</wd>

<space/>

<wd l="3336" t="14477" r="3701" b="14654">post</wd>

<space/>

<wd l="3782" t="14477" r="4498" b="14611">contents</wd>

<space/>

<wd l="4598" t="14453" r="4992" b="14611">such</wd>

<space/>

<wd l="5074" t="14506" r="5242" b="14611">as</wd>

<space/>

<wd l="5342" t="14453" r="5803" b="14611">small</wd>

<space/>

</ln>

<ln l="1440" t="14726" r="5803" b="14928" baseLine="14875" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="14779" r="2309" b="14928">messages,</wd>

<space/>

<wd l="2429" t="14726" r="3307" b="14885">individual</wd>

<space/>

<wd l="3408" t="14726" r="4070" b="14928">images,</wd>

<space/>

<wd l="4195" t="14779" r="4378" b="14885">or</wd>

<space/>

<wd l="4474" t="14726" r="5083" b="14885">videos.</wd>

<space/>

<wd l="5294" t="14726" r="5803" b="14885">There</wd>

</ln>

</para>

<rulerline l="1433" t="15048" r="2640" b="15048" type="single" width="10" color="000000"/>

<para l="1704" t="15101" r="5794" b="15302" alignment="right" spaceBefore="59" spaceAfter="31" lsp="exactly" lspExact="204" language="en">

<ln l="1704" t="15101" r="5794" b="15302" baseLine="15257">

<wd l="1704" t="15101" r="2021" b="15264"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">See</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2074" t="15134" r="5794" b="15302">“http://www.internetlivestats.com/twitter-statistics/”</wd>

</run>

</ln>

</para>

</column>

<column l="6144" t="4092" r="10531" b="15336">

<para l="6144" t="4157" r="10517" b="5443" alignment="justified" spaceBefore="4" lsp="exactly" lspExact="270" language="en">

<ln l="6149" t="4157" r="10502" b="4358" baseLine="4306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="4210" r="6413" b="4315">are</wd>

<space/>

<wd l="6470" t="4210" r="6566" b="4315">a</wd>

<space/>

<wd l="6619" t="4157" r="7286" b="4315">number</wd>

<space/>

<wd l="7344" t="4157" r="7531" b="4315">of</wd>

<space/>

<wd l="7574" t="4157" r="8856" b="4358">microblogging</wd>

<space/>

<wd l="8923" t="4157" r="9293" b="4315">sites</wd>

<space/>

<wd l="9365" t="4157" r="9754" b="4315">such</wd>

<space/>

<wd l="9811" t="4210" r="9979" b="4315">as</wd>

<space/>

<wd l="10042" t="4157" r="10502" b="4315">Twit-</wd>

</ln>

<ln l="6144" t="4426" r="10502" b="4613" baseLine="4579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4450" r="6408" b="4613">ter,</wd>

<space/>

<wd l="6485" t="4426" r="7166" b="4613">Tumblr,</wd>

<space/>

<wd l="7238" t="4426" r="7714" b="4584">Plurk</wd>

<space/>

<wd l="7781" t="4426" r="8093" b="4584">and</wd>

<space/>

<wd l="8150" t="4426" r="8942" b="4584">identi.ca.</wd>

<space/>

<wd l="9043" t="4426" r="9480" b="4584">Each</wd>

<space/>

<wd l="9552" t="4426" r="10157" b="4584">service</wd>

<space/>

<wd l="10219" t="4426" r="10502" b="4584">has</wd>

<space/>

</ln>

<ln l="6144" t="4699" r="10517" b="4901" baseLine="4848" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4699" r="6346" b="4858">its</wd>

<space/>

<wd l="6427" t="4752" r="6792" b="4858">own</wd>

<space/>

<wd l="6864" t="4699" r="8150" b="4858">characteristics.</wd>

<space/>

<wd l="8275" t="4704" r="8582" b="4858">For</wd>

<space/>

<wd l="8650" t="4699" r="9427" b="4901">example,</wd>

<space/>

<wd l="9509" t="4699" r="9984" b="4858">Plurk</wd>

<space/>

<wd l="10051" t="4699" r="10334" b="4858">has</wd>

<space/>

<wd l="10421" t="4752" r="10517" b="4858">a</wd>

<space/>

</ln>

<ln l="6144" t="4968" r="10517" b="5170" baseLine="5122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4968" r="6859" b="5126">timeline</wd>

<space/>

<wd l="6917" t="4968" r="7334" b="5126">view</wd>

<space/>

<wd l="7397" t="4968" r="7656" b="5126">for</wd>

<space/>

<wd l="7709" t="4968" r="8270" b="5126">videos</wd>

<space/>

<wd l="8342" t="4968" r="8654" b="5126">and</wd>

<space/>

<wd l="8707" t="4968" r="9442" b="5170">pictures,</wd>

<space/>

<wd l="9518" t="4968" r="9830" b="5126">and</wd>

<space/>

<wd l="9888" t="4968" r="10517" b="5126">Twitter</wd>

<space/>

</ln>

<ln l="6144" t="5242" r="7934" b="5443" baseLine="5390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5242" r="6427" b="5400">has</wd>

<space/>

<wd l="6494" t="5246" r="7075" b="5400">“status</wd>

<space/>

<wd l="7138" t="5242" r="7934" b="5443">updates.”</wd>

</ln>

</para>

<para l="6144" t="5510" r="10512" b="7603" alignment="justified" spaceBefore="10" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="5510" r="10512" b="5712" baseLine="5664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5510" r="6485" b="5669">The</wd>

<space/>

<wd l="6542" t="5510" r="7694" b="5669">characteristic</wd>

<space/>

<wd l="7757" t="5510" r="7949" b="5669">of</wd>

<space/>

<wd l="7992" t="5515" r="8573" b="5669">“status</wd>

<space/>

<wd l="8630" t="5510" r="9389" b="5712">updates”</wd>

<space/>

<wd l="9446" t="5510" r="9586" b="5669">is</wd>

<space/>

<wd l="9648" t="5563" r="9960" b="5669">one</wd>

<space/>

<wd l="10018" t="5510" r="10205" b="5669">of</wd>

<space/>

<wd l="10243" t="5510" r="10512" b="5669">the</wd>

<space/>

</ln>

<ln l="6144" t="5784" r="10502" b="5942" baseLine="5933" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5784" r="6830" b="5942">features</wd>

<space/>

<wd l="6883" t="5784" r="7214" b="5942">that</wd>

<space/>

<wd l="7262" t="5784" r="7810" b="5942">makes</wd>

<space/>

<wd l="7867" t="5784" r="8131" b="5942">the</wd>

<space/>

<wd l="8189" t="5784" r="9322" b="5942">classification</wd>

<space/>

<wd l="9374" t="5784" r="9566" b="5942">of</wd>

<space/>

<wd l="9600" t="5784" r="10186" b="5942">named</wd>

<space/>

<wd l="10238" t="5837" r="10502" b="5942">en-</wd>

</ln>

<ln l="6144" t="6053" r="10512" b="6240" baseLine="6206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="6053" r="6562" b="6211">tities</wd>

<space/>

<wd l="6619" t="6053" r="6792" b="6206">in</wd>

<space/>

<wd l="6840" t="6053" r="7469" b="6211">Twitter</wd>

<space/>

<wd l="7517" t="6053" r="8242" b="6211">difficult.</wd>

<space/>

<wd l="8318" t="6058" r="8501" b="6206">In</wd>

<space/>

<wd l="8549" t="6053" r="9211" b="6240">Twitter,</wd>

<space/>

<wd l="9274" t="6053" r="9706" b="6211">there</wd>

<space/>

<wd l="9758" t="6053" r="9893" b="6211">is</wd>

<space/>

<wd l="9955" t="6106" r="10051" b="6211">a</wd>

<space/>

<wd l="10099" t="6053" r="10512" b="6211">limit</wd>

<space/>

</ln>

<ln l="6144" t="6326" r="10512" b="6528" baseLine="6475" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="6326" r="6403" b="6485">for</wd>

<space/>

<wd l="6466" t="6326" r="6734" b="6485">the</wd>

<space/>

<wd l="6802" t="6326" r="7474" b="6485">number</wd>

<space/>

<wd l="7541" t="6326" r="7728" b="6485">of</wd>

<space/>

<wd l="7786" t="6326" r="8659" b="6485">characters</wd>

<space/>

<wd l="8736" t="6326" r="9062" b="6485">that</wd>

<space/>

<wd l="9130" t="6326" r="9710" b="6528">people</wd>

<space/>

<wd l="9782" t="6379" r="10075" b="6485">can</wd>

<space/>

<wd l="10147" t="6350" r="10512" b="6528">post</wd>

<space/>

</ln>

<ln l="6149" t="6595" r="10512" b="6797" baseLine="6749" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="6619" r="6307" b="6754">at</wd>

<space/>

<wd l="6389" t="6648" r="6840" b="6754">once.</wd>

<space/>

<wd l="6998" t="6595" r="7589" b="6797">People</wd>

<space/>

<wd l="7670" t="6619" r="8035" b="6797">post</wd>

<space/>

<wd l="8117" t="6595" r="8520" b="6754">their</wd>

<space/>

<wd l="8597" t="6595" r="9341" b="6797">thoughts</wd>

<space/>

<wd l="9427" t="6595" r="9816" b="6754">with</wd>

<space/>

<wd l="9902" t="6648" r="9998" b="6754">a</wd>

<space/>

<wd l="10085" t="6595" r="10512" b="6754">short</wd>

<space/>

</ln>

<ln l="6154" t="6869" r="10507" b="7070" baseLine="7018" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6154" t="6893" r="6946" b="7056">sentence;</wd>

<space/>

<wd l="7027" t="6869" r="7334" b="7027">this</wd>

<space/>

<wd l="7406" t="6869" r="7848" b="7027">leads</wd>

<space/>

<wd l="7920" t="6893" r="8088" b="7027">to</wd>

<space/>

<wd l="8155" t="6869" r="8419" b="7027">the</wd>

<space/>

<wd l="8486" t="6869" r="9216" b="7070">problem</wd>

<space/>

<wd l="9278" t="6869" r="9610" b="7027">that</wd>

<space/>

<wd l="9672" t="6893" r="10219" b="7027">tweets</wd>

<space/>

<wd l="10296" t="6869" r="10507" b="7027">do</wd>

<space/>

</ln>

<ln l="6144" t="7138" r="10502" b="7334" baseLine="7286" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="7162" r="6427" b="7296">not</wd>

<space/>

<wd l="6485" t="7138" r="7128" b="7296">contain</wd>

<space/>

<wd l="7190" t="7138" r="7992" b="7296">sufficient</wd>

<space/>

<wd l="8050" t="7138" r="8952" b="7296">contextual</wd>

<space/>

<wd l="9010" t="7138" r="10042" b="7296">information</wd>

<space/>

<wd l="10109" t="7138" r="10502" b="7334">(Rit-</wd>

</ln>

<ln l="6144" t="7406" r="7517" b="7603" baseLine="7560" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="7430" r="6379" b="7565">ter</wd>

<space/>

<wd l="6437" t="7430" r="6590" b="7565">et</wd>

<space/>

<wd l="6648" t="7406" r="6898" b="7594">al.,</wd>

<space/>

<wd l="6970" t="7411" r="7517" b="7603">2011).</wd>

</ln>

</para>

<para l="6144" t="7680" r="10517" b="11362" alignment="justified" spaceBefore="12" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="7680" r="10512" b="7838" baseLine="7829" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7680" r="6485" b="7838">The</wd>

<space/>

<wd l="6571" t="7680" r="7133" b="7838">shared</wd>

<space/>

<wd l="7210" t="7680" r="7560" b="7838">task</wd>

<space/>

<wd l="7642" t="7680" r="7834" b="7838">of</wd>

<space/>

<wd l="7896" t="7685" r="8323" b="7838">ACL</wd>

<space/>

<wd l="8400" t="7685" r="9110" b="7838">W-NUT</wd>

<space/>

<wd l="9192" t="7680" r="9614" b="7838">2015</wd>

<space/>

<wd l="9701" t="7680" r="9840" b="7838">is</wd>

<space/>

<wd l="9926" t="7704" r="10090" b="7838">to</wd>

<space/>

<wd l="10176" t="7680" r="10512" b="7838">find</wd>

<space/>

</ln>

<ln l="6144" t="7949" r="10502" b="8136" baseLine="8102" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7949" r="6730" b="8107">named</wd>

<space/>

<wd l="6845" t="7949" r="7464" b="8107">entities</wd>

<space/>

<wd l="7589" t="8002" r="7805" b="8107">on</wd>

<space/>

<wd l="7915" t="7949" r="8573" b="8107">Twitter.</wd>

<space/>

<wd l="8827" t="7954" r="9298" b="8136">Here,</wd>

<space/>

<wd l="9437" t="8002" r="9691" b="8107">we</wd>

<space/>

<wd l="9802" t="7949" r="10133" b="8107">will</wd>

<space/>

<wd l="10258" t="7949" r="10502" b="8107">fo-</wd>

</ln>

<ln l="6149" t="8222" r="10502" b="8424" baseLine="8371" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="8275" r="6427" b="8381">cus</wd>

<space/>

<wd l="6514" t="8275" r="6725" b="8381">on</wd>

<space/>

<wd l="6797" t="8246" r="7066" b="8381">ten</wd>

<space/>

<wd l="7133" t="8246" r="7584" b="8424">types</wd>

<space/>

<wd l="7670" t="8222" r="7858" b="8381">of</wd>

<space/>

<wd l="7915" t="8222" r="8501" b="8381">named</wd>

<space/>

<wd l="8573" t="8222" r="9240" b="8381">entities:</wd>

<space/>

<wd l="9365" t="8275" r="10186" b="8424">company,</wd>

<space/>

<wd l="10272" t="8222" r="10502" b="8381">fa-</wd>

</ln>

<ln l="6149" t="8491" r="10498" b="8693" baseLine="8645" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="8491" r="6624" b="8693">cility,</wd>

<space/>

<wd l="6725" t="8491" r="7416" b="8693">geo-loc,</wd>

<space/>

<wd l="7517" t="8491" r="8102" b="8678">movie,</wd>

<space/>

<wd l="8198" t="8491" r="9197" b="8678">musicartist,</wd>

<space/>

<wd l="9298" t="8491" r="9778" b="8678">other,</wd>

<space/>

<wd l="9874" t="8544" r="10498" b="8693">person,</wd>

<space/>

</ln>

<ln l="6144" t="8765" r="10512" b="8966" baseLine="8914" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8765" r="6854" b="8966">product,</wd>

<space/>

<wd l="6984" t="8789" r="7963" b="8966">sportsteam,</wd>

<space/>

<wd l="8088" t="8765" r="8400" b="8923">and</wd>

<space/>

<wd l="8496" t="8765" r="9149" b="8923">tvshow.</wd>

<space/>

<wd l="9360" t="8770" r="9643" b="8923">We</wd>

<space/>

<wd l="9744" t="8765" r="10147" b="8923">have</wd>

<space/>

<wd l="10243" t="8765" r="10512" b="8923">the</wd>

<space/>

</ln>

<ln l="6144" t="9034" r="10498" b="9235" baseLine="9187" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="9034" r="6821" b="9235">training</wd>

<space/>

<wd l="6898" t="9034" r="7210" b="9192">and</wd>

<space/>

<wd l="7282" t="9034" r="8395" b="9235">development</wd>

<space/>

<wd l="8467" t="9034" r="8832" b="9192">data</wd>

<space/>

<wd l="8894" t="9034" r="9154" b="9192">for</wd>

<space/>

<wd l="9216" t="9034" r="9845" b="9192">Twitter</wd>

<space/>

<wd l="9912" t="9034" r="10224" b="9192">and</wd>

<space/>

<wd l="10296" t="9034" r="10498" b="9192">53</wd>

<space/>

</ln>

<ln l="6149" t="9307" r="10382" b="9509" baseLine="9456" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="9331" r="7008" b="9509">gazetteers</wd>

<space/>

<wd l="7070" t="9307" r="7498" b="9466">from</wd>

<space/>

<wd l="7550" t="9307" r="7814" b="9466">the</wd>

<space/>

<wd l="7877" t="9307" r="9307" b="9466">abovementioned</wd>

<space/>

<wd l="9370" t="9307" r="9931" b="9466">shared</wd>

<space/>

<wd l="9984" t="9307" r="10382" b="9466">task.</wd>

<space/>

</ln>

<ln l="6144" t="9576" r="10507" b="9778" baseLine="9730" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="9581" r="6326" b="9730">In</wd>

<space/>

<wd l="6379" t="9576" r="6686" b="9734">this</wd>

<space/>

<wd l="6744" t="9629" r="7267" b="9778">paper,</wd>

<space/>

<wd l="7330" t="9629" r="7584" b="9734">we</wd>

<space/>

<wd l="7642" t="9576" r="8362" b="9734">describe</wd>

<space/>

<wd l="8414" t="9576" r="8678" b="9734">the</wd>

<space/>

<wd l="8736" t="9576" r="9413" b="9734">datasets</wd>

<space/>

<wd l="9475" t="9576" r="9643" b="9730">in</wd>

<space/>

<wd l="9701" t="9576" r="10354" b="9734">Section</wd>

<space/>

<wd l="10406" t="9581" r="10507" b="9730">2</wd>

<space/>

</ln>

<ln l="6149" t="9850" r="10512" b="10051" baseLine="9998" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="9850" r="6461" b="10008">and</wd>

<space/>

<wd l="6523" t="9874" r="7152" b="10051">present</wd>

<space/>

<wd l="7214" t="9850" r="7478" b="10008">the</wd>

<space/>

<wd l="7541" t="9850" r="8083" b="10008">model</wd>

<space/>

<wd l="8146" t="9850" r="8477" b="10008">that</wd>

<space/>

<wd l="8534" t="9902" r="8789" b="10008">we</wd>

<space/>

<wd l="8851" t="9902" r="9139" b="10008">use</wd>

<space/>

<wd l="9202" t="9850" r="9374" b="10003">in</wd>

<space/>

<wd l="9432" t="9850" r="9739" b="10008">this</wd>

<space/>

<wd l="9816" t="9850" r="10277" b="10051">study</wd>

<space/>

<wd l="10339" t="9850" r="10512" b="10003">in</wd>

<space/>

</ln>

<ln l="6149" t="10118" r="10502" b="10306" baseLine="10267" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="10118" r="6802" b="10277">Section</wd>

<space/>

<wd l="6883" t="10123" r="7032" b="10277">3.</wd>

<space/>

<wd l="7186" t="10123" r="7368" b="10272">In</wd>

<space/>

<wd l="7450" t="10118" r="8102" b="10277">Section</wd>

<space/>

<wd l="8179" t="10123" r="8333" b="10306">4,</wd>

<space/>

<wd l="8429" t="10171" r="8683" b="10277">we</wd>

<space/>

<wd l="8770" t="10118" r="9389" b="10277">discuss</wd>

<space/>

<wd l="9475" t="10118" r="9739" b="10277">the</wd>

<space/>

<wd l="9821" t="10118" r="10502" b="10277">features</wd>

<space/>

</ln>

<ln l="6144" t="10392" r="10512" b="10594" baseLine="10541" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10392" r="6547" b="10550">used</wd>

<space/>

<wd l="6638" t="10392" r="6950" b="10550">and</wd>

<space/>

<wd l="7037" t="10392" r="7306" b="10550">the</wd>

<space/>

<wd l="7392" t="10392" r="8126" b="10550">methods</wd>

<space/>

<wd l="8222" t="10392" r="8621" b="10550">used</wd>

<space/>

<wd l="8712" t="10392" r="8966" b="10550">for</wd>

<space/>

<wd l="9058" t="10392" r="9970" b="10594">generating</wd>

<space/>

<wd l="10061" t="10392" r="10512" b="10550">these</wd>

<space/>

</ln>

<ln l="6144" t="10661" r="10512" b="10862" baseLine="10810" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10661" r="6878" b="10819">features.</wd>

<space/>

<wd l="7022" t="10666" r="7306" b="10819">We</wd>

<space/>

<wd l="7382" t="10685" r="8016" b="10862">present</wd>

<space/>

<wd l="8093" t="10714" r="8381" b="10819">our</wd>

<space/>

<wd l="8458" t="10661" r="8837" b="10819">final</wd>

<space/>

<wd l="8918" t="10661" r="9480" b="10819">results</wd>

<space/>

<wd l="9566" t="10661" r="10046" b="10862">along</wd>

<space/>

<wd l="10123" t="10661" r="10512" b="10819">with</wd>

<space/>

</ln>

<ln l="6144" t="10930" r="10517" b="11131" baseLine="11083" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10930" r="6552" b="11088">their</wd>

<space/>

<wd l="6605" t="10930" r="7296" b="11131">analysis</wd>

<space/>

<wd l="7354" t="10930" r="7526" b="11083">in</wd>

<space/>

<wd l="7584" t="10930" r="8232" b="11088">Section</wd>

<space/>

<wd l="8290" t="10930" r="8381" b="11088">5</wd>

<space/>

<wd l="8453" t="10930" r="8765" b="11088">and</wd>

<space/>

<wd l="8822" t="10930" r="9605" b="11088">conclude</wd>

<space/>

<wd l="9658" t="10930" r="9965" b="11088">this</wd>

<space/>

<wd l="10027" t="10982" r="10517" b="11131">paper</wd>

<space/>

</ln>

<ln l="6144" t="11203" r="7234" b="11362" baseLine="11352" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11203" r="6317" b="11357">in</wd>

<space/>

<wd l="6374" t="11203" r="7027" b="11362">Section</wd>

<space/>

<wd l="7085" t="11203" r="7234" b="11362">6.</wd>

</ln>

</para>

<para l="6144" t="11678" r="8170" b="11851" alignment="left" spaceBefore="223" lsp="exactly" lspExact="274" language="en">

<ln l="6144" t="11678" r="8170" b="11851" baseLine="11842" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">

<wd l="6144" t="11678" r="6259" b="11846">2</wd>

<space/>

<wd l="6504" t="11683" r="6998" b="11851">Data</wd>

<space/>

<wd l="7061" t="11683" r="7435" b="11851">and</wd>

<space/>

<wd l="7502" t="11683" r="8170" b="11851">Labels</wd>

</ln>

</para>

<para l="6144" t="12120" r="10512" b="13133" alignment="justified" spaceBefore="156" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="12120" r="10512" b="12307" baseLine="12269" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12125" r="6326" b="12274">In</wd>

<space/>

<wd l="6475" t="12120" r="6782" b="12278">this</wd>

<space/>

<wd l="6946" t="12120" r="7598" b="12307">section,</wd>

<space/>

<wd l="7781" t="12173" r="8035" b="12278">we</wd>

<space/>

<wd l="8179" t="12120" r="9005" b="12278">introduce</wd>

<space/>

<wd l="9154" t="12120" r="9418" b="12278">the</wd>

<space/>

<wd l="9571" t="12120" r="10512" b="12278">considered</wd>

<space/>

</ln>

<ln l="6149" t="12389" r="10512" b="12547" baseLine="12542" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="12389" r="6830" b="12547">datasets</wd>

<space/>

<wd l="6926" t="12389" r="7238" b="12547">and</wd>

<space/>

<wd l="7330" t="12389" r="8050" b="12547">describe</wd>

<space/>

<wd l="8136" t="12389" r="8405" b="12547">the</wd>

<space/>

<wd l="8496" t="12389" r="8856" b="12547">data</wd>

<space/>

<wd l="8942" t="12389" r="9523" b="12547">format</wd>

<space/>

<wd l="9610" t="12389" r="10051" b="12547">used.</wd>

<space/>

<wd l="10224" t="12394" r="10512" b="12547">We</wd>

<space/>

</ln>

<ln l="6149" t="12662" r="10512" b="12864" baseLine="12811" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="12662" r="6494" b="12821">also</wd>

<space/>

<wd l="6547" t="12662" r="6816" b="12821">list</wd>

<space/>

<wd l="6859" t="12662" r="7128" b="12821">the</wd>

<space/>

<wd l="7181" t="12662" r="8419" b="12821">characteristics</wd>

<space/>

<wd l="8477" t="12662" r="8669" b="12821">of</wd>

<space/>

<wd l="8707" t="12662" r="9106" b="12821">each</wd>

<space/>

<wd l="9158" t="12662" r="9648" b="12864">entity</wd>

<space/>

<wd l="9701" t="12686" r="10075" b="12864">type</wd>

<space/>

<wd l="10123" t="12662" r="10512" b="12821">with</wd>

<space/>

</ln>

<ln l="6154" t="12931" r="7526" b="13133" baseLine="13085" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="12984" r="6605" b="13090">some</wd>

<space/>

<wd l="6667" t="12931" r="7526" b="13133">examples.</wd>

</ln>

</para>

<para l="6144" t="13392" r="7085" b="13550" alignment="left" spaceBefore="211" lsp="exactly" lspExact="254" language="en">

<ln l="6144" t="13392" r="7085" b="13550" baseLine="13546" bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="13">

<wd l="6144" t="13392" r="6408" b="13550">2.1</wd>

<space/>

<wd l="6638" t="13397" r="7085" b="13550">Data</wd>

</ln>

</para>

<para l="6144" t="13752" r="10526" b="15307" alignment="justified" spaceBefore="89" spaceAfter="21" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="13752" r="10507" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="13752" r="6485" b="13910">The</wd>

<space/>

<wd l="6610" t="13752" r="7286" b="13910">datasets</wd>

<space/>

<wd l="7416" t="13752" r="8189" b="13954">provided</wd>

<space/>

<wd l="8304" t="13752" r="8520" b="13954">by</wd>

<space/>

<wd l="8654" t="13752" r="9211" b="13910">shared</wd>

<space/>

<wd l="9331" t="13752" r="9682" b="13910">task</wd>

<space/>

<wd l="9806" t="13805" r="10066" b="13910">are</wd>

<space/>

<wd l="10186" t="13805" r="10507" b="13910">raw</wd>

<space/>

</ln>

<ln l="6144" t="14021" r="10526" b="14179" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="14045" r="6744" b="14179">tweets.</wd>

<space/>

<wd l="6840" t="14021" r="7320" b="14179">Table</wd>

<space/>

<wd l="7406" t="14026" r="7469" b="14174">1</wd>

<space/>

<wd l="7560" t="14021" r="8083" b="14179">shows</wd>

<space/>

<wd l="8155" t="14074" r="8352" b="14179">an</wd>

<space/>

<wd l="8419" t="14021" r="9211" b="14179">overview</wd>

<space/>

<wd l="9283" t="14021" r="9470" b="14179">of</wd>

<space/>

<wd l="9518" t="14021" r="9782" b="14179">the</wd>

<space/>

<wd l="9854" t="14021" r="10262" b="14179">sizes</wd>

<space/>

<wd l="10334" t="14021" r="10526" b="14179">of</wd>

<space/>

</ln>

<ln l="6144" t="14294" r="10502" b="14482" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="14294" r="6595" b="14453">these</wd>

<space/>

<wd l="6643" t="14294" r="7373" b="14453">datasets.</wd>

<space/>

<wd l="7450" t="14299" r="7632" b="14448">In</wd>

<space/>

<wd l="7680" t="14347" r="7776" b="14453">a</wd>

<space/>

<wd l="7819" t="14318" r="8333" b="14482">tweet,</wd>

<space/>

<wd l="8395" t="14294" r="8794" b="14453">each</wd>

<space/>

<wd l="8837" t="14294" r="9163" b="14453">line</wd>

<space/>

<wd l="9211" t="14294" r="9926" b="14453">contains</wd>

<space/>

<wd l="9979" t="14294" r="10502" b="14453">words</wd>

<space/>

</ln>

<ln l="6149" t="14563" r="10512" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="14563" r="6461" b="14722">and</wd>

<space/>

<wd l="6518" t="14563" r="6715" b="14722">its</wd>

<space/>

<wd l="6782" t="14563" r="7205" b="14722">label</wd>

<space/>

<wd l="7267" t="14563" r="7406" b="14722">is</wd>

<space/>

<wd l="7478" t="14563" r="8294" b="14765">separated</wd>

<space/>

<wd l="8352" t="14563" r="8568" b="14765">by</wd>

<space/>

<wd l="8635" t="14616" r="8731" b="14722">a</wd>

<space/>

<wd l="8784" t="14563" r="9048" b="14722">tab</wd>

<space/>

<wd l="9115" t="14563" r="9427" b="14722">and</wd>

<space/>

<wd l="9490" t="14616" r="9586" b="14722">a</wd>

<space/>

<wd l="9638" t="14563" r="10128" b="14722">blank</wd>

<space/>

<wd l="10186" t="14563" r="10512" b="14722">line</wd>

<space/>

</ln>

<ln l="6144" t="14837" r="10507" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="14837" r="6475" b="14995">that</wd>

<space/>

<wd l="6528" t="14837" r="7032" b="14995">forms</wd>

<space/>

<wd l="7099" t="14890" r="7195" b="14995">a</wd>

<space/>

<wd l="7258" t="14861" r="7997" b="14995">sentence</wd>

<space/>

<wd l="8054" t="14837" r="8904" b="15038">boundary.</wd>

<space/>

<wd l="8990" t="14837" r="9259" b="14990">All</wd>

<space/>

<wd l="9322" t="14837" r="9883" b="14995">tokens</wd>

<space/>

<wd l="9946" t="14837" r="10507" b="14995">follow</wd>

<space/>

</ln>

<ln l="6144" t="15106" r="10502" b="15307" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="15106" r="6413" b="15264">the</wd>

<space/>

<wd l="6485" t="15110" r="6850" b="15264">IOB</wd>

<space/>

<wd l="6936" t="15106" r="7560" b="15264">format.</wd>

<space/>

<wd l="7694" t="15106" r="8035" b="15264">The</wd>

<space/>

<wd l="8107" t="15106" r="8592" b="15264">token</wd>

<space/>

<wd l="8664" t="15106" r="9053" b="15264">with</wd>

<space/>

<wd l="9134" t="15158" r="9230" b="15264">a</wd>

<space/>

<wd l="9298" t="15106" r="10022" b="15307">B-prefix</wd>

<space/>

<wd l="10099" t="15106" r="10502" b="15264">indi-</wd>

</run>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<section l="1433" t="15336" r="10531" b="16480">

<column l="1433" t="15336" r="10531" b="16480">

<para l="5800" t="15787" r="6148" b="15946" alignment="centered" spaceBefore="386" lsp="exactly" lspExact="270" language="en">

<ln l="5866" t="15787" r="6082" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="42">

<wd l="5866" t="15792" r="6082" b="15946">72</wd>

</ln>

</para>

<para l="2918" t="16133" r="8981" b="16469" alignment="centered" spaceBefore="140" lsp="exactly" lspExact="170" language="en">

<ln l="2918" t="16133" r="8981" b="16301" baseLine="16253" forcedEOF="true">

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2918" t="16133" r="3802" b="16296">Proceedings</wd>

<space/>

<wd l="3854" t="16133" r="4018" b="16296">of</wd>

<space/>

<wd l="4037" t="16133" r="4248" b="16262">the</wd>

<space/>

<wd l="4286" t="16138" r="4622" b="16262">ACL</wd>

<space/>

<wd l="4666" t="16133" r="5026" b="16262">2015</wd>

<space/>

<wd l="5078" t="16133" r="5779" b="16296">Workshop</wd>

<space/>

<wd l="5832" t="16176" r="6000" b="16262">on</wd>

<space/>

<wd l="6043" t="16138" r="6456" b="16296">Noisy</wd>

<space/>

<wd l="6518" t="16133" r="7627" b="16296">User-generated</wd>

<space/>

</run>

<wd l="7675" t="16138" r="7992" b="16286"><run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Text</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8045" t="16171" r="8443" b="16301">pages</wd>

<space/>

<wd l="8496" t="16133" r="8981" b="16286">72–77,
</wd>

</run>

</ln>

<ln l="3029" t="16296" r="8870" b="16469" baseLine="16425" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3029" t="16301" r="3595" b="16469">Beijing,</wd>

<space/>

<wd l="3653" t="16301" r="4114" b="16454">China,</wd>

<space/>

<wd l="4166" t="16301" r="4459" b="16469">July</wd>

<space/>

<wd l="4512" t="16301" r="4723" b="16454">31,</wd>

<space/>

<wd l="4781" t="16301" r="5170" b="16430">2015.</wd>

<space/>

</run>

<wd l="5246" t="16296" r="5770" b="16469"><run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">c</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">�</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5822" t="16301" r="6672" b="16430">Association</wd>

<space/>

<wd l="6715" t="16301" r="6926" b="16430">for</wd>

<space/>

<wd l="6974" t="16301" r="8035" b="16469">Computational</wd>

<space/>

<wd l="8078" t="16301" r="8870" b="16469">Linguistics</wd>

</run>

</ln>

</para>

</column>

</section>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4310.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1430" marginTop="1260" marginRight="1381" marginBottom="1302" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1430" t="1260" r="10528" b="15307">

<column l="1430" t="1260" r="5817" b="15307">

<para l="1440" t="1320" r="5808" b="2606" alignment="justified" spaceAfter="266" lsp="exactly" lspExact="270" language="en">

<ln l="1445" t="1320" r="5794" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="1344" r="1867" b="1478">cates</wd>

<space/>

<wd l="1944" t="1320" r="2208" b="1478">the</wd>

<space/>

<wd l="2280" t="1320" r="3144" b="1522">beginning</wd>

<space/>

<wd l="3221" t="1320" r="3413" b="1478">of</wd>

<space/>

<wd l="3470" t="1373" r="3566" b="1478">a</wd>

<space/>

<wd l="3629" t="1320" r="4214" b="1478">named</wd>

<space/>

<wd l="4286" t="1320" r="4776" b="1522">entity</wd>

<space/>

<wd l="4848" t="1320" r="5160" b="1478">and</wd>

<space/>

<wd l="5227" t="1320" r="5496" b="1478">the</wd>

<space/>

<wd l="5563" t="1344" r="5794" b="1478">to-</wd>

</ln>

<ln l="1440" t="1594" r="5808" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="1594" r="1752" b="1752">ken</wd>

<space/>

<wd l="1795" t="1594" r="2184" b="1752">with</wd>

<space/>

<wd l="2232" t="1646" r="2429" b="1752">an</wd>

<space/>

<wd l="2472" t="1594" r="3125" b="1795">I-prefix</wd>

<space/>

<wd l="3168" t="1594" r="3936" b="1752">indicates</wd>

<space/>

<wd l="3989" t="1594" r="4253" b="1752">the</wd>

<space/>

<wd l="4296" t="1594" r="4819" b="1752">inside</wd>

<space/>

<wd l="4867" t="1594" r="5054" b="1752">of</wd>

<space/>

<wd l="5088" t="1646" r="5184" b="1752">a</wd>

<space/>

<wd l="5222" t="1594" r="5808" b="1752">named</wd>

<space/>

</ln>

<ln l="1445" t="1862" r="5808" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="1862" r="1968" b="2064">entity.</wd>

<space/>

<wd l="2059" t="1867" r="2328" b="2016">An</wd>

<space/>

<wd l="2386" t="1862" r="3038" b="2064">I-prefix</wd>

<space/>

<wd l="3106" t="1862" r="3485" b="2064">only</wd>

<space/>

<wd l="3552" t="1862" r="4190" b="2021">follows</wd>

<space/>

<wd l="4262" t="1862" r="4661" b="2021">after</wd>

<space/>

<wd l="4723" t="1915" r="4819" b="2021">a</wd>

<space/>

<wd l="4877" t="1862" r="5357" b="2021">token</wd>

<space/>

<wd l="5419" t="1862" r="5808" b="2021">with</wd>

<space/>

</ln>

<ln l="1445" t="2136" r="5798" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="2189" r="1541" b="2294">a</wd>

<space/>

<wd l="1613" t="2136" r="2381" b="2338">B-prefix.</wd>

<space/>

<wd l="2515" t="2141" r="2784" b="2290">An</wd>

<space/>

<wd l="2861" t="2141" r="3010" b="2294">O</wd>

<space/>

<wd l="3086" t="2160" r="3350" b="2338">tag</wd>

<space/>

<wd l="3427" t="2136" r="4195" b="2294">indicates</wd>

<space/>

<wd l="4277" t="2136" r="4608" b="2294">that</wd>

<space/>

<wd l="4685" t="2189" r="4781" b="2294">a</wd>

<space/>

<wd l="4848" t="2136" r="5333" b="2294">token</wd>

<space/>

<wd l="5410" t="2136" r="5798" b="2294">does</wd>

<space/>

</ln>

<ln l="1440" t="2405" r="4680" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="2429" r="1718" b="2563">not</wd>

<space/>

<wd l="1771" t="2405" r="2362" b="2606">belong</wd>

<space/>

<wd l="2424" t="2429" r="2587" b="2563">to</wd>

<space/>

<wd l="2650" t="2458" r="2746" b="2563">a</wd>

<space/>

<wd l="2808" t="2405" r="3461" b="2606">specific</wd>

<space/>

<wd l="3518" t="2405" r="4104" b="2563">named</wd>

<space/>

<wd l="4162" t="2405" r="4680" b="2606">entity.</wd>

</ln>

</para>

<table l="2386" t="2890" r="4853" b="3768" alignment="left" li="956" ri="964" spaceBefore="10" spaceAfter="251">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>696</gridCol>

<gridCol>874</gridCol>

<gridCol>897</gridCol>

<gridRow>302</gridRow>

<gridRow>274</gridRow>

<gridRow>302</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="2510" t="2942" r="2962" b="3096" alignment="centered" spaceAfter="37" lsp="exactly" lspExact="251" language="en">

<ln l="2510" t="2942" r="2962" b="3096" baseLine="3086" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2510" t="2942" r="2962" b="3096">Data</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3206" t="2942" r="3835" b="3096" alignment="centered" spaceAfter="37" lsp="exactly" lspExact="251" language="en">

<ln l="3206" t="2942" r="3835" b="3096" baseLine="3086" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="3206" t="2942" r="3835" b="3096">Tweets</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4080" t="2942" r="4728" b="3096" alignment="centered" spaceAfter="37" lsp="exactly" lspExact="251" language="en">

<ln l="4080" t="2942" r="4728" b="3096" baseLine="3086" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="4080" t="2942" r="4728" b="3096">Tokens</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="2534" t="3254" r="2938" b="3413" alignment="centered" lsp="exactly" lspExact="264" language="en">

<ln l="2534" t="3254" r="2938" b="3413" baseLine="3403" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2534" t="3254" r="2938" b="3413">train</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<para l="3298" t="3254" r="3749" b="3442" alignment="centered" lsp="exactly" lspExact="264" language="en">

<ln l="3298" t="3254" r="3749" b="3442" baseLine="3403" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">

<wd l="3298" t="3254" r="3749" b="3442">1,795</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4109" t="3259" r="4694" b="3442" alignment="centered" lsp="exactly" lspExact="264" language="en">

<ln l="4109" t="3259" r="4694" b="3442" baseLine="3403" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4109" t="3259" r="4694" b="3442">37,899</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="2582" t="3533" r="2890" b="3682" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="267" language="en">

<ln l="2582" t="3533" r="2890" b="3682" baseLine="3677" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2582" t="3547" r="2890" b="3682">test</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3298" t="3528" r="3758" b="3710" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="267" language="en">

<ln l="3298" t="3528" r="3758" b="3710" baseLine="3677" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="3298" t="3528" r="3758" b="3710">1,000</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4128" t="3523" r="4680" b="3710" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="267" language="en">

<ln l="4128" t="3523" r="4680" b="3710" baseLine="3677" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">

<wd l="4128" t="3523" r="4680" b="3710">16,261</wd>

</ln>

</para>

</cell>

</table>

<para l="2160" t="4080" r="5074" b="4238" alignment="centered" lsp="exactly" lspExact="271" language="en">

<ln l="2160" t="4080" r="5074" b="4238" baseLine="4234" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2160" t="4080" r="2635" b="4238">Table</wd>

<space/>

<wd l="2717" t="4085" r="2846" b="4238">1:</wd>

<space/>

<wd l="2928" t="4085" r="3197" b="4234">An</wd>

<space/>

<wd l="3254" t="4080" r="4046" b="4238">overview</wd>

<space/>

<wd l="4109" t="4080" r="4301" b="4238">of</wd>

<space/>

<wd l="4349" t="4080" r="5074" b="4238">datasets.</wd>

</ln>

</para>

<para l="1440" t="4824" r="2544" b="4982" alignment="left" spaceBefore="496" lsp="exactly" lspExact="251" language="en">

<ln l="1440" t="4824" r="2544" b="4982" baseLine="4978" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="13">

<wd l="1440" t="4824" r="1709" b="4982">2.2</wd>

<space/>

<wd l="1930" t="4829" r="2544" b="4982">Labels</wd>

</ln>

</para>

<para l="1440" t="5218" r="5798" b="5650" alignment="justified" spaceBefore="117" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="5218" r="5798" b="5419" baseLine="5371" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5222" r="1622" b="5371">In</wd>

<space/>

<wd l="1675" t="5218" r="1939" b="5376">the</wd>

<space/>

<wd l="2002" t="5242" r="2645" b="5419">system,</wd>

<space/>

<wd l="2707" t="5270" r="2962" b="5376">we</wd>

<space/>

<wd l="3014" t="5218" r="3480" b="5376">focus</wd>

<space/>

<wd l="3542" t="5270" r="3758" b="5376">on</wd>

<space/>

<wd l="3811" t="5218" r="4075" b="5376">the</wd>

<space/>

<wd l="4128" t="5218" r="4968" b="5419">following</wd>

<space/>

<wd l="5026" t="5242" r="5294" b="5376">ten</wd>

<space/>

<wd l="5347" t="5242" r="5798" b="5419">types</wd>

<space/>

</ln>

<ln l="1445" t="5491" r="2986" b="5650" baseLine="5640" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="5491" r="1637" b="5650">of</wd>

<space/>

<wd l="1675" t="5491" r="2261" b="5650">named</wd>

<space/>

<wd l="2318" t="5491" r="2986" b="5650">entities:</wd>

</ln>

</para>

<para l="1454" t="6029" r="5443" b="6504" alignment="left" li="432" ri="360" spaceBefore="269" fli="-432" lsp="exactly" lspExact="271" language="en">

<ln l="1454" t="6029" r="5443" b="6230" baseLine="6182">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1454" t="6077" r="2294" b="6230">company</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2400" t="6029" r="2736" b="6187">The</wd>

<space/>

<wd l="2794" t="6082" r="3264" b="6187">name</wd>

<space/>

<wd l="3322" t="6029" r="3514" b="6187">of</wd>

<space/>

<wd l="3562" t="6082" r="3658" b="6187">a</wd>

<space/>

<wd l="3710" t="6082" r="4498" b="6230">company</wd>

<space/>

<wd l="4560" t="6082" r="4742" b="6187">or</wd>

<space/>

<wd l="4800" t="6082" r="4896" b="6187">a</wd>

<space/>

<wd l="4944" t="6029" r="5443" b="6187">brand</wd>

<space/>

</run>

</ln>

<ln l="1882" t="6302" r="5150" b="6504" baseLine="6451" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="6355" r="2237" b="6504">e.g.,</wd>

<space/>

<wd l="2304" t="6302" r="3144" b="6504">Snapchat,</wd>

<space/>

<wd l="3211" t="6302" r="3869" b="6490">Twitter,</wd>

<space/>

<wd l="3941" t="6302" r="4253" b="6461">and</wd>

<space/>

<wd l="4306" t="6302" r="5150" b="6461">Facebook</wd>

</ln>

</para>

<para l="1450" t="6874" r="5794" b="7330" alignment="justified" li="432" spaceBefore="303" fli="-432" lsp="exactly" lspExact="270" language="en">

<ln l="1450" t="6874" r="5794" b="7075" baseLine="7022">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="6874" r="2088" b="7075">facility</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2194" t="6874" r="2530" b="7032">The</wd>

<space/>

<wd l="2592" t="6926" r="3067" b="7032">name</wd>

<space/>

<wd l="3134" t="6874" r="3322" b="7032">of</wd>

<space/>

<wd l="3379" t="6926" r="3576" b="7032">an</wd>

<space/>

<wd l="3638" t="6874" r="4526" b="7032">institution</wd>

<space/>

<wd l="4598" t="6874" r="4987" b="7032">such</wd>

<space/>

<wd l="5054" t="6926" r="5222" b="7032">as</wd>

<space/>

<wd l="5299" t="6926" r="5395" b="7032">a</wd>

<space/>

<wd l="5453" t="6926" r="5794" b="7032">mu-</wd>

</run>

</ln>

<ln l="1886" t="7147" r="4478" b="7330" baseLine="7296" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1886" t="7195" r="2381" b="7330">seum,</wd>

<space/>

<wd l="2453" t="7195" r="2549" b="7301">a</wd>

<space/>

<wd l="2602" t="7166" r="3163" b="7330">center,</wd>

<space/>

<wd l="3235" t="7195" r="3418" b="7301">or</wd>

<space/>

<wd l="3470" t="7195" r="3566" b="7301">a</wd>

<space/>

<wd l="3619" t="7166" r="4478" b="7301">restaurant</wd>

</ln>

</para>

<para l="1882" t="7416" r="5285" b="7618" alignment="left" li="432" lsp="exactly" lspExact="270" language="en">

<ln l="1882" t="7416" r="5285" b="7618" baseLine="7565" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1882" t="7469" r="2237" b="7618">e.g.,</wd>

<space/>

<wd l="2299" t="7421" r="2731" b="7574">Iowa</wd>

<space/>

<wd l="2789" t="7416" r="3158" b="7618">City</wd>

<space/>

<wd l="3226" t="7416" r="3859" b="7574">schools</wd>

<space/>

<wd l="3926" t="7416" r="4238" b="7574">and</wd>

<space/>

<wd l="4291" t="7416" r="5285" b="7618">Disneyland</wd>

</ln>

</para>

<para l="1454" t="7963" r="4795" b="8438" alignment="left" li="432" ri="1008" spaceBefore="279" fli="-432" lsp="exactly" lspExact="271" language="en">

<ln l="1454" t="7963" r="4795" b="8165" baseLine="8117">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1454" t="7968" r="2102" b="8165">geo-loc</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2203" t="7963" r="2544" b="8122">The</wd>

<space/>

<wd l="2597" t="8016" r="3067" b="8122">name</wd>

<space/>

<wd l="3130" t="7963" r="3322" b="8122">of</wd>

<space/>

<wd l="3365" t="8016" r="3461" b="8122">a</wd>

<space/>

<wd l="3518" t="7963" r="3835" b="8165">city</wd>

<space/>

<wd l="3898" t="8016" r="4080" b="8122">or</wd>

<space/>

<wd l="4133" t="7987" r="4795" b="8165">country</wd>

<space/>

</run>

</ln>

<ln l="1882" t="8237" r="4037" b="8438" baseLine="8386" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="8290" r="2237" b="8438">e.g.,</wd>

<space/>

<wd l="2304" t="8237" r="3024" b="8438">Chicago</wd>

<space/>

<wd l="3086" t="8237" r="3398" b="8395">and</wd>

<space/>

<wd l="3451" t="8237" r="4037" b="8395">Russia</wd>

</ln>

</para>

<para l="1450" t="8784" r="3821" b="8942" alignment="left" spaceBefore="279" lsp="exactly" lspExact="270" language="en">

<ln l="1450" t="8784" r="3821" b="8942" baseLine="8933">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="8784" r="2002" b="8942">movie</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2102" t="8784" r="2443" b="8942">The</wd>

<space/>

<wd l="2496" t="8784" r="2837" b="8942">title</wd>

<space/>

<wd l="2899" t="8784" r="3086" b="8942">of</wd>

<space/>

<wd l="3134" t="8837" r="3230" b="8942">a</wd>

<space/>

<wd l="3278" t="8784" r="3821" b="8942">movie</wd>

</run>

</ln>

</para>

<para l="1882" t="9053" r="4498" b="9254" alignment="left" li="432" lsp="exactly" lspExact="271" language="en">

<ln l="1882" t="9053" r="4498" b="9254" baseLine="9206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="9106" r="2237" b="9254">e.g.,</wd>

<space/>

<wd l="2299" t="9053" r="3250" b="9211">Interstellar</wd>

<space/>

<wd l="3307" t="9053" r="3614" b="9211">and</wd>

<space/>

<wd l="3672" t="9053" r="4498" b="9254">Inception</wd>

</ln>

</para>

<para l="1450" t="9605" r="5798" b="10075" alignment="justified" li="432" spaceBefore="279" fli="-432" lsp="exactly" lspExact="270" language="en">

<ln l="1450" t="9605" r="5798" b="9806" baseLine="9754">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="9605" r="2496" b="9763">musicartist</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2592" t="9605" r="2928" b="9763">The</wd>

<space/>

<wd l="3024" t="9658" r="3499" b="9763">name</wd>

<space/>

<wd l="3600" t="9605" r="3787" b="9763">of</wd>

<space/>

<wd l="3869" t="9605" r="4387" b="9763">music</wd>

<space/>

<wd l="4493" t="9658" r="5074" b="9806">groups</wd>

<space/>

<wd l="5179" t="9658" r="5362" b="9763">or</wd>

<space/>

<wd l="5458" t="9605" r="5798" b="9763">disc</wd>

<space/>

</run>

</ln>

<ln l="1858" t="9874" r="3053" b="10075" baseLine="10027" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1858" t="9874" r="2530" b="10075">jockeys</wd>

<space/>

<wd l="2602" t="9878" r="3053" b="10070">(DJs)</wd>

</ln>

</para>

<para l="1882" t="10147" r="4781" b="10349" alignment="left" li="432" lsp="exactly" lspExact="270" language="en">

<ln l="1882" t="10147" r="4781" b="10349" baseLine="10296" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1882" t="10200" r="2237" b="10349">e.g.,</wd>

<space/>

<wd l="2299" t="10147" r="2870" b="10349">Taylor</wd>

<space/>

<wd l="2923" t="10147" r="3394" b="10306">Swift</wd>

<space/>

<wd l="3451" t="10147" r="3763" b="10306">and</wd>

<space/>

<wd l="3816" t="10147" r="4262" b="10349">Lady</wd>

<space/>

<wd l="4325" t="10152" r="4781" b="10349">Gaga</wd>

</ln>

</para>

<para l="1454" t="10694" r="5808" b="11438" alignment="justified" li="432" spaceBefore="277" fli="-432" lsp="exactly" lspExact="271" language="en">

<ln l="1454" t="10694" r="5798" b="10896" baseLine="10848">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1454" t="10699" r="1944" b="10853">other</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2045" t="10699" r="2203" b="10848">A</wd>

<space/>

<wd l="2256" t="10694" r="2822" b="10896">phrase</wd>

<space/>

<wd l="2875" t="10694" r="3202" b="10853">that</wd>

<space/>

<wd l="3254" t="10747" r="3552" b="10853">can</wd>

<space/>

<wd l="3605" t="10694" r="3811" b="10853">be</wd>

<space/>

<wd l="3859" t="10694" r="4262" b="10853">used</wd>

<space/>

<wd l="4315" t="10694" r="5122" b="10896">generally</wd>

<space/>

<wd l="5184" t="10694" r="5573" b="10853">such</wd>

<space/>

<wd l="5630" t="10747" r="5798" b="10853">as</wd>

<space/>

</run>

</ln>

<ln l="1877" t="10968" r="5808" b="11170" baseLine="11117" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="10968" r="2141" b="11126">the</wd>

<space/>

<wd l="2198" t="11021" r="2669" b="11126">name</wd>

<space/>

<wd l="2731" t="10968" r="2918" b="11126">of</wd>

<space/>

<wd l="2966" t="11021" r="3062" b="11126">a</wd>

<space/>

<wd l="3115" t="11021" r="3965" b="11170">ceremony</wd>

<space/>

<wd l="4027" t="11021" r="4210" b="11126">or</wd>

<space/>

<wd l="4262" t="11021" r="4464" b="11126">an</wd>

<space/>

<wd l="4526" t="10968" r="5558" b="11170">anniversary,</wd>

<space/>

<wd l="5630" t="11021" r="5808" b="11126">or</wd>

<space/>

</ln>

<ln l="1877" t="11237" r="3389" b="11438" baseLine="11386" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="11237" r="2141" b="11395">the</wd>

<space/>

<wd l="2198" t="11237" r="2534" b="11395">title</wd>

<space/>

<wd l="2597" t="11237" r="2789" b="11395">of</wd>

<space/>

<wd l="2832" t="11290" r="2928" b="11395">a</wd>

<space/>

<wd l="2990" t="11290" r="3389" b="11438">song</wd>

</ln>

</para>

<para l="1882" t="11510" r="4517" b="11712" alignment="left" li="432" spaceBefore="2" lsp="exactly" lspExact="271" language="en">

<ln l="1882" t="11510" r="4517" b="11712" baseLine="11659" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1882" t="11563" r="2237" b="11712">e.g.,</wd>

<space/>

<wd l="2299" t="11515" r="2875" b="11669">X-mas</wd>

<space/>

<wd l="2942" t="11510" r="3254" b="11669">and</wd>

<space/>

<wd l="3307" t="11510" r="4147" b="11712">Murphy’s</wd>

<space/>

<wd l="4210" t="11510" r="4517" b="11669">law</wd>

</ln>

</para>

<para l="1450" t="12058" r="5794" b="12802" alignment="left" li="432" spaceBefore="277" fli="-432" lsp="exactly" lspExact="271" language="en">

<ln l="1450" t="12058" r="5794" b="12259" baseLine="12206">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="12106" r="2078" b="12259">person</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2179" t="12058" r="2520" b="12216">The</wd>

<space/>

<wd l="2592" t="12110" r="3062" b="12216">name</wd>

<space/>

<wd l="3139" t="12058" r="3331" b="12216">of</wd>

<space/>

<wd l="3394" t="12110" r="3490" b="12216">a</wd>

<space/>

<wd l="3557" t="12110" r="4186" b="12259">person;</wd>

<space/>

<wd l="4277" t="12058" r="4402" b="12216">it</wd>

<space/>

<wd l="4474" t="12110" r="4766" b="12216">can</wd>

<space/>

<wd l="4843" t="12058" r="5050" b="12216">be</wd>

<space/>

<wd l="5122" t="12058" r="5386" b="12216">the</wd>

<space/>

<wd l="5458" t="12110" r="5794" b="12259">per-</wd>

</run>

</ln>

<ln l="1886" t="12326" r="5362" b="12514" baseLine="12480" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1886" t="12331" r="2318" b="12485">son’s</wd>

<space/>

<wd l="2381" t="12326" r="2674" b="12485">full</wd>

<space/>

<wd l="2736" t="12379" r="3254" b="12514">name,</wd>

<space/>

<wd l="3317" t="12326" r="3624" b="12485">last</wd>

<space/>

<wd l="3677" t="12379" r="4190" b="12514">name,</wd>

<space/>

<wd l="4262" t="12379" r="4445" b="12485">or</wd>

<space/>

<wd l="4498" t="12326" r="4834" b="12485">first</wd>

<space/>

<wd l="4886" t="12379" r="5362" b="12485">name</wd>

<space/>

</ln>

<ln l="1882" t="12600" r="4152" b="12802" baseLine="12749" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="12653" r="2237" b="12802">e.g.,</wd>

<space/>

<wd l="2304" t="12605" r="2774" b="12758">Steve</wd>

<space/>

<wd l="2837" t="12600" r="3264" b="12802">King</wd>

<space/>

<wd l="3326" t="12600" r="3638" b="12758">and</wd>

<space/>

<wd l="3691" t="12600" r="4152" b="12758">Ellen</wd>

</ln>

</para>

<para l="1450" t="13147" r="4262" b="13622" alignment="left" li="432" ri="1584" spaceBefore="279" fli="-432" lsp="exactly" lspExact="271" language="en">

<ln l="1450" t="13147" r="4262" b="13349" baseLine="13301">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1450" t="13152" r="2189" b="13349">product</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="2285" t="13147" r="2621" b="13306">The</wd>

<space/>

<wd l="2678" t="13200" r="3149" b="13306">name</wd>

<space/>

<wd l="3211" t="13147" r="3403" b="13306">of</wd>

<space/>

<wd l="3446" t="13200" r="3542" b="13306">a</wd>

<space/>

<wd l="3595" t="13147" r="4262" b="13349">product</wd>

<space/>

</run>

</ln>

<ln l="1882" t="13421" r="4205" b="13622" baseLine="13570" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1882" t="13474" r="2237" b="13622">e.g.,</wd>

<space/>

<wd l="2299" t="13421" r="2837" b="13579">Nokia</wd>

<space/>

<wd l="2894" t="13421" r="3322" b="13579">5800</wd>

<space/>

<wd l="3384" t="13421" r="3696" b="13579">and</wd>

<space/>

<wd l="3754" t="13421" r="4205" b="13579">Coke</wd>

</ln>

</para>

<para l="1454" t="13968" r="4891" b="14438" alignment="left" li="432" ri="936" spaceBefore="278" fli="-432" lsp="exactly" lspExact="271" language="en">

<ln l="1454" t="13968" r="4891" b="14170" baseLine="14117">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1454" t="13982" r="2482" b="14170">sportsteam</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2578" t="13968" r="2918" b="14126">The</wd>

<space/>

<wd l="2971" t="14021" r="3446" b="14126">name</wd>

<space/>

<wd l="3504" t="13968" r="3696" b="14126">of</wd>

<space/>

<wd l="3739" t="14021" r="3835" b="14126">a</wd>

<space/>

<wd l="3898" t="13997" r="4402" b="14170">sports</wd>

<space/>

<wd l="4464" t="13992" r="4891" b="14126">team</wd>

<space/>

</run>

</ln>

<ln l="1882" t="14237" r="4315" b="14438" baseLine="14390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="14290" r="2237" b="14438">e.g.,</wd>

<space/>

<wd l="2299" t="14237" r="2976" b="14395">Arsenal</wd>

<space/>

<wd l="3038" t="14237" r="3350" b="14395">and</wd>

<space/>

<wd l="3403" t="14242" r="3835" b="14395">West</wd>

<space/>

<wd l="3888" t="14242" r="4315" b="14395">Ham</wd>

</ln>

</para>

<para l="1450" t="14789" r="5606" b="15259" alignment="left" li="432" ri="216" spaceBefore="279" spaceAfter="25" fli="-432" lsp="exactly" lspExact="271" language="en">

<ln l="1450" t="14789" r="5218" b="14986" baseLine="14938">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1450" t="14794" r="2102" b="14947">tvshow</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2203" t="14789" r="2539" b="14947">The</wd>

<space/>

<wd l="2597" t="14789" r="2933" b="14947">title</wd>

<space/>

<wd l="2995" t="14789" r="3187" b="14947">of</wd>

<space/>

<wd l="3230" t="14842" r="3326" b="14947">a</wd>

<space/>

<wd l="3379" t="14789" r="4219" b="14947">television</wd>

<space/>

<wd l="4286" t="14794" r="4699" b="14986">(TV)</wd>

<space/>

<wd l="4776" t="14789" r="5218" b="14947">show</wd>

<space/>

</run>

</ln>

<ln l="1882" t="15058" r="5606" b="15259" baseLine="15211" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="15110" r="2237" b="15259">e.g.,</wd>

<space/>

<wd l="2299" t="15058" r="2640" b="15216">The</wd>

<space/>

<wd l="2693" t="15058" r="3634" b="15216">Persuaders</wd>

<space/>

<wd l="3701" t="15058" r="4013" b="15216">and</wd>

<space/>

<wd l="4066" t="15062" r="4579" b="15259">Pretty</wd>

<space/>

<wd l="4642" t="15058" r="5112" b="15216">Little</wd>

<space/>

<wd l="5165" t="15058" r="5606" b="15216">Liars</wd>

</ln>

</para>

</column>

<column l="6141" t="1260" r="10528" b="15307">

<para l="6144" t="1306" r="7152" b="1478" alignment="left" spaceBefore="3" lsp="exactly" lspExact="273" language="en">

<ln l="6144" t="1306" r="7152" b="1478" baseLine="1474" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="21">

<wd l="6144" t="1306" r="6259" b="1478">3</wd>

<space/>

<wd l="6504" t="1310" r="7152" b="1478">Model</wd>

</ln>

</para>

<para l="6144" t="1738" r="10517" b="4608" alignment="justified" spaceBefore="137" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="1738" r="10512" b="1939" baseLine="1891" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="1738" r="7171" b="1896">Conditional</wd>

<space/>

<wd l="7258" t="1738" r="7997" b="1896">Random</wd>

<space/>

<wd l="8074" t="1738" r="8602" b="1896">Fields</wd>

<space/>

<wd l="8698" t="1742" r="9322" b="1934">(CRFs)</wd>

<space/>

<wd l="9499" t="1738" r="10272" b="1939">(Lafferty</wd>

<space/>

<wd l="10358" t="1762" r="10512" b="1896">et</wd>

<space/>

</ln>

<ln l="6149" t="2011" r="10507" b="2213" baseLine="2160" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="2011" r="6403" b="2198">al.,</wd>

<space/>

<wd l="6494" t="2016" r="6984" b="2208">2001)</wd>

<space/>

<wd l="7070" t="2011" r="7382" b="2170">and</wd>

<space/>

<wd l="7454" t="2011" r="7651" b="2170">its</wd>

<space/>

<wd l="7728" t="2011" r="8410" b="2170">variants</wd>

<space/>

<wd l="8486" t="2011" r="8890" b="2170">have</wd>

<space/>

<wd l="8962" t="2011" r="9374" b="2170">been</wd>

<space/>

<wd l="9456" t="2011" r="10507" b="2213">successfully</wd>

<space/>

</ln>

<ln l="6149" t="2280" r="10512" b="2482" baseLine="2434" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="2280" r="6787" b="2482">applied</wd>

<space/>

<wd l="6830" t="2304" r="6994" b="2438">to</wd>

<space/>

<wd l="7042" t="2280" r="7670" b="2438">various</wd>

<space/>

<wd l="7728" t="2333" r="8520" b="2482">sequence</wd>

<space/>

<wd l="8563" t="2280" r="9259" b="2482">labeling</wd>

<space/>

<wd l="9307" t="2280" r="9734" b="2438">tasks</wd>

<space/>

<wd l="9792" t="2285" r="10512" b="2477">(Maaten</wd>

<space/>

</ln>

<ln l="6149" t="2554" r="10498" b="2741" baseLine="2702" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="2578" r="6307" b="2712">et</wd>

<space/>

<wd l="6408" t="2554" r="6658" b="2741">al.,</wd>

<space/>

<wd l="6787" t="2558" r="7262" b="2741">2011;</wd>

<space/>

<wd l="7406" t="2554" r="8074" b="2741">Collins,</wd>

<space/>

<wd l="8198" t="2558" r="8678" b="2741">2002;</wd>

<space/>

<wd l="8813" t="2554" r="9749" b="2712">McCallum</wd>

<space/>

<wd l="9854" t="2554" r="10166" b="2712">and</wd>

<space/>

<wd l="10262" t="2554" r="10498" b="2741">Li,</wd>

<space/>

</ln>

<ln l="6149" t="2822" r="10498" b="3024" baseLine="2971" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="2827" r="6629" b="3010">2003;</wd>

<space/>

<wd l="6725" t="2822" r="7114" b="2976">Kim</wd>

<space/>

<wd l="7186" t="2822" r="7498" b="2981">and</wd>

<space/>

<wd l="7570" t="2822" r="8213" b="3024">Snyder,</wd>

<space/>

<wd l="8304" t="2827" r="8784" b="3010">2012;</wd>

<space/>

<wd l="8880" t="2822" r="9269" b="2976">Kim</wd>

<space/>

<wd l="9341" t="2846" r="9494" b="2981">et</wd>

<space/>

<wd l="9566" t="2822" r="9821" b="3010">al.,</wd>

<space/>

<wd l="9912" t="2822" r="10498" b="3010">2015b;</wd>

<space/>

</ln>

<ln l="6149" t="3096" r="10512" b="3298" baseLine="3245" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="3096" r="6538" b="3250">Kim</wd>

<space/>

<wd l="6610" t="3120" r="6768" b="3254">et</wd>

<space/>

<wd l="6840" t="3096" r="7094" b="3283">al.,</wd>

<space/>

<wd l="7186" t="3096" r="7762" b="3283">2015a;</wd>

<space/>

<wd l="7862" t="3096" r="8251" b="3250">Kim</wd>

<space/>

<wd l="8323" t="3096" r="8635" b="3254">and</wd>

<space/>

<wd l="8712" t="3096" r="9355" b="3298">Snyder,</wd>

<space/>

<wd l="9451" t="3101" r="10027" b="3283">2013a;</wd>

<space/>

<wd l="10128" t="3096" r="10512" b="3250">Kim</wd>

<space/>

</ln>

<ln l="6149" t="3365" r="10517" b="3566" baseLine="3514" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="3365" r="6461" b="3523">and</wd>

<space/>

<wd l="6552" t="3365" r="7200" b="3566">Snyder,</wd>

<space/>

<wd l="7310" t="3365" r="7968" b="3562">2013b).</wd>

<space/>

<wd l="8146" t="3365" r="8486" b="3523">The</wd>

<space/>

<wd l="8573" t="3370" r="9010" b="3523">NER</wd>

<space/>

<wd l="9101" t="3365" r="9451" b="3523">task</wd>

<space/>

<wd l="9538" t="3365" r="10320" b="3566">produces</wd>

<space/>

<wd l="10421" t="3418" r="10517" b="3523">a</wd>

<space/>

</ln>

<ln l="6154" t="3619" r="10498" b="3845" baseLine="3789">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6154" t="3686" r="6946" b="3835">sequence</wd>

<space/>

<wd l="7032" t="3634" r="7224" b="3792">of</wd>

<space/>

<wd l="7291" t="3634" r="7877" b="3792">named</wd>

<space/>

<wd l="7958" t="3634" r="8448" b="3835">entity</wd>

<space/>

<wd l="8534" t="3658" r="8928" b="3835">tags,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9034" t="3686" r="9139" b="3835">y</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9264" t="3706" r="9413" b="3758">=</wd>

<space/>

</run>

<wd l="9557" t="3619" r="9802" b="3845"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">y</run>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9874" t="3763" r="10099" b="3787">...</wd>

<space/>

</run>

<wd l="10157" t="3619" r="10498" b="3845"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">y</run>

<run underlined="none" subsuperscript="subscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">n</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="6149" t="3893" r="10512" b="4118" baseLine="4058">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="3907" r="6624" b="4109">given</wd>

<space/>

<wd l="6696" t="3960" r="6792" b="4066">a</wd>

<space/>

<wd l="6869" t="3960" r="7656" b="4109">sequence</wd>

<space/>

<wd l="7733" t="3907" r="7920" b="4066">of</wd>

<space/>

<wd l="7978" t="3907" r="8554" b="4094">words,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8640" t="3960" r="8750" b="4066">x</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8856" t="3979" r="9005" b="4032">=</wd>

<space/>

</run>

<wd l="9125" t="3893" r="9389" b="4118"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">x</run>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">1</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9461" t="4037" r="9682" b="4061">...</wd>

<space/>

</run>

<wd l="9744" t="3893" r="10104" b="4118"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">x</run>

<run underlined="none" subsuperscript="subscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">n</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="10224" t="3912" r="10512" b="4066">We</wd>

<space/>

</run>

</ln>

<ln l="6144" t="4162" r="10507" b="4387" baseLine="4330">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="4176" r="6686" b="4334">model</wd>

<space/>

<wd l="6763" t="4176" r="7027" b="4334">the</wd>

<space/>

<wd l="7104" t="4176" r="8078" b="4334">conditional</wd>

<space/>

<wd l="8155" t="4176" r="9106" b="4378">probability</wd>

<space/>

</run>

<wd l="9173" t="4162" r="9720" b="4387"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">p</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">y</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">|</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">x</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">;</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="9778" t="4162" r="9950" b="4387"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">θ</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10037" t="4176" r="10507" b="4378">using</wd>

<space/>

</run>

</ln>

<ln l="6144" t="4450" r="7776" b="4608" baseLine="4598" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4450" r="7186" b="4608">linear-chain</wd>

<space/>

<wd l="7243" t="4454" r="7776" b="4608">CRFs:</wd>

</ln>

</para>

<para l="8155" t="4829" r="9566" b="5054" alignment="left" li="2016" spaceBefore="139" lsp="exactly" lspExact="192" language="en">

<ln l="8155" t="4829" r="9566" b="5054" baseLine="4992">

<wd l="8155" t="4829" r="8669" b="5054"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">exp(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">θ</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="3"><wd l="8741" t="4930" r="8770" b="4958">·</wd>

<space/>

</run>

<wd l="8842" t="4829" r="9250" b="5054"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">Φ(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">x,</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3"><space/>

</run>

<wd l="9302" t="4829" r="9566" b="5054"><run italic="true" underlined="single" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">y</run>

<run italic="true" underlined="single" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">))</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6571" t="4906" r="7584" b="5203" alignment="left" li="432" lsp="exactly" lspExact="163" language="en">

<ln l="6571" t="4906" r="7584" b="5203" baseLine="5141">

<wd l="6571" t="4978" r="7118" b="5203"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">p</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">y</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="4">|</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">x</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">;</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4"><space/>

</run>

<wd l="7176" t="4978" r="7349" b="5203"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">θ</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">)</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4"><space/>

<wd l="7435" t="5064" r="7584" b="5117">=</wd>

</run>

</ln>

</para>

<para l="7690" t="5107" r="10037" b="5400" alignment="left" li="1512" lsp="exactly" lspExact="386" language="en">

<ln l="7690" t="5107" r="10037" b="5400" baseLine="5299">

<wd l="7690" t="5131" r="8506" b="5400"><run italic="true" underlined="none" subsuperscript="none" fontSize="1500" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="6">Σ</run>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="6">y</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="600" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="6">&apos;</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="600" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="6">∈Y</run>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="6">(x)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="6"><space/>

</run>

<wd l="8568" t="5126" r="9082" b="5352"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">exp(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">θ</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="6"><wd l="9154" t="5227" r="9182" b="5256">·</wd>

<space/>

</run>

<wd l="9259" t="5126" r="9662" b="5352"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">Φ(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">x,</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6"><space/>

</run>

<wd l="9720" t="5126" r="10037" b="5352"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">y</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="600" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="6">&apos;</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">))</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="5621" r="10512" b="8035" alignment="justified" spaceBefore="74" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="5621" r="10507" b="5827" baseLine="5774">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="5626" r="6677" b="5784">where</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6773" t="5621" r="6869" b="5784">θ</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6974" t="5626" r="7627" b="5784">denotes</wd>

<space/>

<wd l="7733" t="5678" r="7829" b="5784">a</wd>

<space/>

<wd l="7925" t="5650" r="8160" b="5784">set</wd>

<space/>

<wd l="8251" t="5626" r="8443" b="5784">of</wd>

<space/>

<wd l="8520" t="5626" r="9062" b="5784">model</wd>

<space/>

<wd l="9158" t="5650" r="10157" b="5827">parameters.</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="10354" t="5626" r="10507" b="5813">Y</wd>

<space/>

</run>

</ln>

<ln l="6144" t="5894" r="10502" b="6096" baseLine="6048">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="5918" r="6744" b="6053">returns</wd>

<space/>

<wd l="6840" t="5894" r="7051" b="6053">all</wd>

<space/>

<wd l="7138" t="5894" r="7853" b="6096">possible</wd>

<space/>

<wd l="7939" t="5894" r="8362" b="6053">label</wd>

<space/>

<wd l="8458" t="5947" r="9322" b="6096">sequences</wd>

<space/>

<wd l="9422" t="5894" r="9610" b="6053">of</wd>

<space/>

</run>

<wd l="9686" t="5947" r="9850" b="6082"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">x</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9960" t="5894" r="10272" b="6053">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10363" t="5894" r="10502" b="6048">Φ</wd>

<space/>

</run>

</ln>

<ln l="6144" t="6154" r="10502" b="6379" baseLine="6317">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="6221" r="6600" b="6370">maps</wd>

<space/>

</run>

<wd l="6730" t="6154" r="6970" b="6379"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">x,</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="7022" t="6154" r="7200" b="6379"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">y</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7320" t="6168" r="7656" b="6326">into</wd>

<space/>

<wd l="7771" t="6221" r="7867" b="6326">a</wd>

<space/>

<wd l="7968" t="6168" r="8573" b="6326">feature</wd>

<space/>

<wd l="8678" t="6192" r="9226" b="6326">vector</wd>

<space/>

<wd l="9326" t="6168" r="9653" b="6326">that</wd>

<space/>

<wd l="9758" t="6168" r="9893" b="6326">is</wd>

<space/>

<wd l="10013" t="6221" r="10109" b="6326">a</wd>

<space/>

<wd l="10210" t="6168" r="10502" b="6322">lin-</wd>

</run>

</ln>

<ln l="6149" t="6422" r="10498" b="6648" baseLine="6590">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="6490" r="6418" b="6595">ear</wd>

<space/>

<wd l="6504" t="6490" r="6864" b="6595">sum</wd>

<space/>

<wd l="6946" t="6437" r="7138" b="6595">of</wd>

<space/>

<wd l="7205" t="6437" r="7474" b="6595">the</wd>

<space/>

<wd l="7555" t="6437" r="7978" b="6595">local</wd>

<space/>

<wd l="8064" t="6437" r="8669" b="6595">feature</wd>

<space/>

<wd l="8750" t="6461" r="9422" b="6595">vectors:</wd>

<space/>

</run>

<wd l="9576" t="6422" r="9979" b="6648"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Φ(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">x,</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="10032" t="6422" r="10210" b="6648"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">y</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="10349" t="6509" r="10498" b="6562">=</wd>

<space/>

</run>

</ln>

<ln l="6154" t="6648" r="10512" b="6960" baseLine="6859">

<wd l="6154" t="6691" r="6475" b="6922"><run italic="true" underlined="none" subsuperscript="none" fontSize="1500" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">Σ</run>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">n</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

<wd l="6370" t="6816" r="6658" b="6960">j=1</wd>

<space/>

</run>

<wd l="6725" t="6696" r="7104" b="6922"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">φ</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">x,</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7147" t="6715" r="7291" b="6912">j,</wd>

<space/>

</run>

<wd l="7344" t="6763" r="7800" b="6926"><run italic="true" underlined="none" subsuperscript="subscript" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">y</run>

<run underlined="none" subsuperscript="subscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">j</run>

<run italic="true" underlined="none" subsuperscript="subscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">−</run>

<run underlined="none" subsuperscript="subscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">1</run>

<run italic="true" underlined="none" subsuperscript="subscript" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="7853" t="6696" r="8170" b="6926"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">y</run>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">j</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8386" t="6710" r="8909" b="6869">Given</wd>

<space/>

<wd l="9005" t="6710" r="9269" b="6869">the</wd>

<space/>

<wd l="9370" t="6710" r="9778" b="6912">fully</wd>

<space/>

<wd l="9878" t="6710" r="10512" b="6869">labeled</wd>

<space/>

</run>

</ln>

<ln l="6154" t="6979" r="10512" b="7243" baseLine="7168">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6154" t="7075" r="7022" b="7224">sequences</wd>

<space/>

</run>

<wd l="7142" t="6979" r="7694" b="7234"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">{</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">x</run>

<run underlined="none" subsuperscript="superscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">(i)</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="7752" t="6979" r="8582" b="7243"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">y</run>

<run underlined="none" subsuperscript="superscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">(i)</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">}</run>

<run underlined="none" subsuperscript="superscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">N</run>

<run underlined="none" subsuperscript="subscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">i=1</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8702" t="7022" r="8971" b="7181">the</wd>

<space/>

<wd l="9077" t="7022" r="9859" b="7224">objective</wd>

<space/>

<wd l="9965" t="7022" r="10157" b="7181">of</wd>

<space/>

<wd l="10243" t="7022" r="10512" b="7181">the</wd>

<space/>

</run>

</ln>

<ln l="6144" t="7291" r="10502" b="7498" baseLine="7445">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="7296" r="6821" b="7498">training</wd>

<space/>

<wd l="6902" t="7296" r="7042" b="7454">is</wd>

<space/>

<wd l="7128" t="7320" r="7291" b="7454">to</wd>

<space/>

<wd l="7382" t="7296" r="7718" b="7454">find</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7800" t="7291" r="7896" b="7454">θ</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7982" t="7296" r="8309" b="7454">that</wd>

<space/>

<wd l="8386" t="7296" r="9322" b="7454">maximizes</wd>

<space/>

<wd l="9413" t="7296" r="9677" b="7454">the</wd>

<space/>

<wd l="9754" t="7296" r="10032" b="7498">log</wd>

<space/>

<wd l="10114" t="7296" r="10502" b="7454">like-</wd>

</run>

</ln>

<ln l="6144" t="7565" r="10512" b="7766" baseLine="7714" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7565" r="6706" b="7723">lihood</wd>

<space/>

<wd l="6787" t="7565" r="6974" b="7723">of</wd>

<space/>

<wd l="7042" t="7565" r="7306" b="7723">the</wd>

<space/>

<wd l="7382" t="7565" r="8059" b="7766">training</wd>

<space/>

<wd l="8146" t="7565" r="8506" b="7723">data</wd>

<space/>

<wd l="8582" t="7565" r="9082" b="7723">under</wd>

<space/>

<wd l="9154" t="7565" r="9422" b="7723">the</wd>

<space/>

<wd l="9499" t="7565" r="10042" b="7723">model</wd>

<space/>

<wd l="10123" t="7565" r="10512" b="7723">with</wd>

<space/>

</ln>

<ln l="6154" t="7834" r="7632" b="8035" baseLine="7988">

<wd l="6154" t="7834" r="7632" b="8035"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">l</run>

<run underlined="none" subsuperscript="none" fontSize="950" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">-regularization:</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="8376" t="8458" r="9859" b="8726" alignment="left" spaceBefore="387" spaceAfter="144" lsp="exactly" lspExact="292" language="en" id="_1_2_146">

<ln l="8376" t="8458" r="9859" b="8726" baseLine="8638">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8376" t="8515" r="8654" b="8717">log</wd>

<space/>

</run>

<wd l="8683" t="8458" r="9629" b="8726"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">p</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">y</run>

<run underlined="none" subsuperscript="superscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">(i)</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">|</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">x</run>

<run underlined="none" subsuperscript="superscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">(i)</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">;</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="9686" t="8501" r="9859" b="8726"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">θ</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="8900" t="9029" r="9859" b="9480" alignment="left" li="2736" spaceBefore="146" lsp="exactly" lspExact="451" language="en">

<ln l="8966" t="9029" r="9859" b="9480" baseLine="9310">

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-7"><wd l="8966" t="9269" r="9106" b="9283">−</wd>

<space/>

</run>

<wd l="9154" t="9029" r="9264" b="9480"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">λ</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">2</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><space/>

</run>

<wd l="9355" t="9120" r="9758" b="9389"><run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-7">||</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">θ</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-7">||</run>

<run underlined="none" subsuperscript="superscript" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-7">2</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><space/>

<wd l="9830" t="9307" r="9859" b="9331">.</wd>

</run>

</ln>

</para>

<para l="6144" t="9706" r="7378" b="9878" alignment="left" spaceBefore="178" lsp="exactly" lspExact="273" language="en">

<ln l="6144" t="9706" r="7378" b="9878" baseLine="9869" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="14">

<wd l="6144" t="9706" r="6259" b="9874">4</wd>

<space/>

<wd l="6504" t="9710" r="7378" b="9878">Features</wd>

</ln>

</para>

<para l="6144" t="10138" r="10512" b="12461" alignment="justified" spaceBefore="142" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="10138" r="10502" b="10339" baseLine="10286" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="10142" r="6326" b="10291">In</wd>

<space/>

<wd l="6408" t="10138" r="6715" b="10296">this</wd>

<space/>

<wd l="6811" t="10138" r="7464" b="10325">section,</wd>

<space/>

<wd l="7560" t="10190" r="7814" b="10296">we</wd>

<space/>

<wd l="7901" t="10138" r="8621" b="10296">describe</wd>

<space/>

<wd l="8707" t="10190" r="8803" b="10296">a</wd>

<space/>

<wd l="8880" t="10138" r="9475" b="10339">variety</wd>

<space/>

<wd l="9562" t="10138" r="9754" b="10296">of</wd>

<space/>

<wd l="9821" t="10138" r="10502" b="10296">features</wd>

<space/>

</ln>

<ln l="6144" t="10406" r="10512" b="10608" baseLine="10560" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="10406" r="6475" b="10565">that</wd>

<space/>

<wd l="6566" t="10459" r="6821" b="10565">we</wd>

<space/>

<wd l="6917" t="10406" r="7320" b="10565">have</wd>

<space/>

<wd l="7416" t="10406" r="7814" b="10565">used</wd>

<space/>

<wd l="7910" t="10406" r="8083" b="10560">in</wd>

<space/>

<wd l="8174" t="10406" r="8482" b="10565">this</wd>

<space/>

<wd l="8592" t="10406" r="9086" b="10608">study.</wd>

<space/>

<wd l="9283" t="10411" r="9571" b="10565">We</wd>

<space/>

<wd l="9672" t="10406" r="10013" b="10565">also</wd>

<space/>

<wd l="10109" t="10406" r="10512" b="10565">used</wd>

<space/>

</ln>

<ln l="6149" t="10642" r="10507" b="10882" baseLine="10825">

<wd l="6149" t="10642" r="7046" b="10838"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">CRFsuite</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">2</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="7104" t="10680" r="7795" b="10838">because</wd>

<space/>

<wd l="7838" t="10680" r="7963" b="10838">it</wd>

<space/>

<wd l="8002" t="10680" r="8549" b="10838">makes</wd>

<space/>

<wd l="8602" t="10680" r="8870" b="10838">the</wd>

<space/>

<wd l="8918" t="10680" r="9883" b="10882">application</wd>

<space/>

<wd l="9931" t="10680" r="10123" b="10838">of</wd>

<space/>

<wd l="10152" t="10733" r="10507" b="10838">new</wd>

<space/>

</run>

</ln>

<ln l="6144" t="10949" r="10512" b="11150" baseLine="11098" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="10949" r="6830" b="11107">features</wd>

<space/>

<wd l="6926" t="11002" r="7339" b="11150">easy.</wd>

<space/>

<wd l="7507" t="10954" r="8006" b="11150">Apart</wd>

<space/>

<wd l="8088" t="10949" r="8515" b="11107">from</wd>

<space/>

<wd l="8597" t="10949" r="8861" b="11107">the</wd>

<space/>

<wd l="8947" t="10949" r="9336" b="11107">base</wd>

<space/>

<wd l="9422" t="10949" r="10104" b="11107">features</wd>

<space/>

<wd l="10200" t="10949" r="10512" b="11107">and</wd>

<space/>

</ln>

<ln l="6149" t="11222" r="10512" b="11424" baseLine="11371" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="11246" r="6936" b="11424">gazetteer</wd>

<space/>

<wd l="7003" t="11222" r="7685" b="11381">features</wd>

<space/>

<wd l="7762" t="11222" r="8534" b="11424">provided</wd>

<space/>

<wd l="8602" t="11222" r="8818" b="11424">by</wd>

<space/>

<wd l="8890" t="11222" r="9154" b="11381">the</wd>

<space/>

<wd l="9230" t="11222" r="10171" b="11424">organizers,</wd>

<space/>

<wd l="10258" t="11275" r="10512" b="11381">we</wd>

<space/>

</ln>

<ln l="6144" t="11491" r="10498" b="11693" baseLine="11640" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="11491" r="6547" b="11650">have</wd>

<space/>

<wd l="6624" t="11491" r="7022" b="11650">used</wd>

<space/>

<wd l="7094" t="11491" r="7358" b="11650">the</wd>

<space/>

<wd l="7435" t="11491" r="8270" b="11693">following</wd>

<space/>

<wd l="8347" t="11544" r="8702" b="11650">new</wd>

<space/>

<wd l="8779" t="11491" r="9514" b="11650">features:</wd>

<space/>

<wd l="9634" t="11496" r="10022" b="11650">POS</wd>

<space/>

<wd l="10104" t="11515" r="10498" b="11693">tags,</wd>

<space/>

</ln>

<ln l="6149" t="11760" r="10502" b="11962" baseLine="11914" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="11760" r="6806" b="11947">chunks,</wd>

<space/>

<wd l="6922" t="11760" r="7478" b="11918">brown</wd>

<space/>

<wd l="7574" t="11760" r="8472" b="11962">clustering,</wd>

<space/>

<wd l="8597" t="11760" r="8909" b="11918">and</wd>

<space/>

<wd l="9000" t="11760" r="9446" b="11918">word</wd>

<space/>

<wd l="9542" t="11784" r="10502" b="11962">representa-</wd>

</ln>

<ln l="6144" t="12034" r="10502" b="12235" baseLine="12182" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="12034" r="6528" b="12192">tion.</wd>

<space/>

<wd l="6610" t="12038" r="6950" b="12192">Our</wd>

<space/>

<wd l="6998" t="12034" r="7541" b="12192">model</wd>

<space/>

<wd l="7594" t="12034" r="7733" b="12192">is</wd>

<space/>

<wd l="7795" t="12034" r="8678" b="12235">composed</wd>

<space/>

<wd l="8731" t="12034" r="8923" b="12192">of</wd>

<space/>

<wd l="8962" t="12034" r="9226" b="12192">the</wd>

<space/>

<wd l="9278" t="12034" r="10118" b="12235">following</wd>

<space/>

<wd l="10171" t="12034" r="10502" b="12192">fea-</wd>

</ln>

<ln l="6144" t="12312" r="6614" b="12461" baseLine="12456" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="12326" r="6614" b="12461">tures:</wd>

</ln>

</para>

<para l="6144" t="12749" r="7872" b="12907" alignment="left" spaceBefore="198" lsp="exactly" lspExact="251" language="en">

<ln l="6144" t="12749" r="7872" b="12907" baseLine="12902" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">

<wd l="6144" t="12749" r="6408" b="12907">4.1</wd>

<space/>

<wd l="6638" t="12754" r="7070" b="12907">Base</wd>

<space/>

<wd l="7128" t="12749" r="7872" b="12907">features</wd>

</ln>

</para>

<para l="6144" t="13099" r="10512" b="14928" alignment="justified" spaceBefore="73" spaceAfter="102" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="13099" r="10512" b="13301" baseLine="13248" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="13104" r="6571" b="13258">Base</wd>

<space/>

<wd l="6662" t="13099" r="7344" b="13258">features</wd>

<space/>

<wd l="7445" t="13099" r="8083" b="13258">include</wd>

<space/>

<wd l="8179" t="13099" r="8443" b="13258">the</wd>

<space/>

<wd l="8539" t="13123" r="9326" b="13301">gazetteer</wd>

<space/>

<wd l="9413" t="13099" r="10094" b="13258">features</wd>

<space/>

<wd l="10200" t="13099" r="10512" b="13258">and</wd>

<space/>

</ln>

<ln l="6149" t="13373" r="10512" b="13574" baseLine="13522" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="13373" r="7253" b="13574">orthographic</wd>

<space/>

<wd l="7349" t="13373" r="8083" b="13531">features.</wd>

<space/>

<wd l="8256" t="13378" r="8438" b="13526">In</wd>

<space/>

<wd l="8525" t="13373" r="8794" b="13531">the</wd>

<space/>

<wd l="8880" t="13378" r="9312" b="13531">NER</wd>

<space/>

<wd l="9403" t="13373" r="9797" b="13560">task,</wd>

<space/>

<wd l="9907" t="13426" r="10003" b="13531">a</wd>

<space/>

<wd l="10085" t="13373" r="10512" b="13574">huge</wd>

<space/>

</ln>

<ln l="6149" t="13642" r="10502" b="13800" baseLine="13790" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="13666" r="6802" b="13800">amount</wd>

<space/>

<wd l="6883" t="13642" r="7075" b="13800">of</wd>

<space/>

<wd l="7138" t="13642" r="7987" b="13800">unlabeled</wd>

<space/>

<wd l="8069" t="13642" r="8429" b="13800">data</wd>

<space/>

<wd l="8506" t="13642" r="8640" b="13800">is</wd>

<space/>

<wd l="8731" t="13642" r="9178" b="13800">often</wd>

<space/>

<wd l="9254" t="13642" r="9653" b="13800">used</wd>

<space/>

<wd l="9730" t="13642" r="9989" b="13800">for</wd>

<space/>

<wd l="10061" t="13642" r="10502" b="13800">iden-</wd>

</ln>

<ln l="6144" t="13910" r="10498" b="14112" baseLine="14064" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="13910" r="6725" b="14112">tifying</wd>

<space/>

<wd l="6845" t="13963" r="7454" b="14069">unseen</wd>

<space/>

<wd l="7574" t="13910" r="8246" b="14069">entities.</wd>

<space/>

<wd l="8520" t="13910" r="9024" b="14069">There</wd>

<space/>

<wd l="9149" t="13963" r="9413" b="14069">are</wd>

<space/>

<wd l="9538" t="13910" r="10171" b="14112">already</wd>

<space/>

<wd l="10296" t="13910" r="10498" b="14069">53</wd>

<space/>

</ln>

<ln l="6149" t="14184" r="10512" b="14386" baseLine="14333" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="14208" r="7008" b="14386">gazetteers</wd>

<space/>

<wd l="7085" t="14184" r="7258" b="14338">in</wd>

<space/>

<wd l="7325" t="14184" r="7589" b="14342">the</wd>

<space/>

<wd l="7661" t="14184" r="8376" b="14342">baseline</wd>

<space/>

<wd l="8453" t="14208" r="9096" b="14386">system.</wd>

<space/>

<wd l="9216" t="14184" r="9557" b="14342">The</wd>

<space/>

<wd l="9624" t="14184" r="10512" b="14342">maximum</wd>

<space/>

</ln>

<ln l="6144" t="14453" r="10512" b="14654" baseLine="14606" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="14453" r="6840" b="14611">window</wd>

<space/>

<wd l="6941" t="14453" r="7267" b="14611">size</wd>

<space/>

<wd l="7358" t="14453" r="7618" b="14611">for</wd>

<space/>

<wd l="7704" t="14477" r="8491" b="14654">gazetteer</wd>

<space/>

<wd l="8573" t="14453" r="9254" b="14611">features</wd>

<space/>

<wd l="9350" t="14453" r="9490" b="14611">is</wd>

<space/>

<wd l="9586" t="14453" r="9734" b="14640">6,</wd>

<space/>

<wd l="9845" t="14453" r="10157" b="14611">and</wd>

<space/>

<wd l="10243" t="14453" r="10512" b="14611">the</wd>

<space/>

</ln>

<ln l="6144" t="14726" r="10512" b="14928" baseLine="14875" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="14726" r="6686" b="14885">model</wd>

<space/>

<wd l="6754" t="14726" r="7090" b="14885">will</wd>

<space/>

<wd l="7152" t="14726" r="7584" b="14885">learn</wd>

<space/>

<wd l="7651" t="14726" r="7915" b="14885">the</wd>

<space/>

<wd l="7978" t="14726" r="8558" b="14885">named</wd>

<space/>

<wd l="8626" t="14726" r="9115" b="14928">entity</wd>

<space/>

<wd l="9178" t="14750" r="9552" b="14928">type</wd>

<space/>

<wd l="9619" t="14726" r="10512" b="14885">associated</wd>

</ln>

</para>

<rulerline l="6141" t="15048" r="7344" b="15048" type="single" width="10" color="000000"/>

<para l="6398" t="15101" r="9514" b="15302" alignment="left" li="216" spaceBefore="59" lsp="exactly" lspExact="191" language="en">

<ln l="6398" t="15101" r="9514" b="15302" baseLine="15257">

<wd l="6398" t="15101" r="9514" b="15302"><run underlined="none" subsuperscript="none" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">http://www.chokkan.org/software/crfsuite/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<dd l="6141" t="8163" r="8376" b="9190" anchorTo="toPage" refTo="_1_2_146">

<dd l="6141" t="8163" r="8001" b="9190" anchorTo="toPage" refTo="_1_2_146">

<para l="6787" t="8501" r="7987" b="8717" alignment="right" spaceBefore="292" lsp="exactly" lspExact="253" language="en">

<ln l="6787" t="8501" r="7987" b="8717" baseLine="8649">

<wd l="6787" t="8501" r="6965" b="8674"><run italic="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="17">θ</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="600" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="17">∗</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="600" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="17"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="17"><wd l="7056" t="8587" r="7205" b="8640">=</wd>

<space/>

<wd l="7282" t="8568" r="7987" b="8717">argmax</wd>

</run>

</ln>

</para>

<para l="7594" t="8693" r="7666" b="8861" alignment="right" ri="252" spaceAfter="289" lsp="exactly" lspExact="190" language="en">

<ln l="7594" t="8693" r="7666" b="8861" baseLine="8856" underlined="none" subsuperscript="none" fontSize="950" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">

<wd l="7594" t="8741" r="7666" b="8861">θ</wd>

</ln>

</para>

</dd>

<dd l="8001" t="8163" r="8376" b="9190" anchorTo="toPage" refTo="_1_2_146">

<para l="8001" t="8285" r="8370" b="8933" alignment="left" spaceAfter="217" lsp="exactly" lspExact="403" language="en">

<ln l="8107" t="8285" r="8251" b="8395" baseLine="8390" underlined="none" subsuperscript="none" fontSize="950" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="36">

<wd l="8107" t="8285" r="8251" b="8395">N</wd>

<space/>

</ln>

<ln l="8040" t="8774" r="8304" b="8933" baseLine="8928" underlined="none" subsuperscript="none" fontSize="950" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="36">

<wd l="8040" t="8818" r="8304" b="8933">i=1</wd>

</ln>

</para>

</dd>

</dd>

<dd l="1430" t="15736" r="10528" b="15977">

<para l="5800" t="15792" r="6138" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5866" t="15792" r="6072" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="39">

<wd l="5866" t="15792" r="6072" b="15946">73</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4310.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1437" marginTop="1260" marginRight="1378" marginBottom="1302" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1437" t="1260" r="10531" b="15333">

<column l="1437" t="1260" r="5824" b="15333">

<para l="1440" t="1320" r="5803" b="2338" alignment="justified" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="1320" r="5803" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1320" r="1829" b="1478">with</wd>

<space/>

<wd l="1886" t="1373" r="1982" b="1478">a</wd>

<space/>

<wd l="2040" t="1320" r="2688" b="1522">specific</wd>

<space/>

<wd l="2746" t="1320" r="3360" b="1522">phrase,</wd>

<space/>

<wd l="3422" t="1320" r="3571" b="1474">if</wd>

<space/>

<wd l="3610" t="1320" r="3734" b="1478">it</wd>

<space/>

<wd l="3782" t="1320" r="3922" b="1478">is</wd>

<space/>

<wd l="3979" t="1320" r="4152" b="1474">in</wd>

<space/>

<wd l="4210" t="1373" r="4517" b="1478">one</wd>

<space/>

<wd l="4574" t="1373" r="4757" b="1478">or</wd>

<space/>

<wd l="4805" t="1373" r="5251" b="1478">more</wd>

<space/>

<wd l="5309" t="1320" r="5501" b="1478">of</wd>

<space/>

<wd l="5539" t="1320" r="5803" b="1478">the</wd>

<space/>

</ln>

<ln l="1445" t="1594" r="5803" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="1618" r="2232" b="1795">gazetteer</wd>

<space/>

<wd l="2304" t="1594" r="3072" b="1752">lexicons.</wd>

<space/>

<wd l="3221" t="1594" r="4373" b="1795">Orthographic</wd>

<space/>

<wd l="4454" t="1594" r="5136" b="1752">features</wd>

<space/>

<wd l="5227" t="1646" r="5520" b="1752">can</wd>

<space/>

<wd l="5602" t="1594" r="5803" b="1752">be</wd>

<space/>

</ln>

<ln l="1445" t="1862" r="5803" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="1862" r="2093" b="2021">divided</wd>

<space/>

<wd l="2160" t="1862" r="2496" b="2021">into</wd>

<space/>

<wd l="2578" t="1862" r="2890" b="2021">five</wd>

<space/>

<wd l="2966" t="1886" r="3470" b="2064">types.</wd>

<space/>

<wd l="3600" t="1862" r="3941" b="2021">The</wd>

<space/>

<wd l="4018" t="1862" r="5122" b="2064">orthographic</wd>

<space/>

<wd l="5198" t="1862" r="5803" b="2021">feature</wd>

<space/>

</ln>

<ln l="1440" t="2136" r="3581" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2136" r="2270" b="2338">templates</wd>

<space/>

<wd l="2338" t="2189" r="2597" b="2294">are</wd>

<space/>

<wd l="2654" t="2189" r="2827" b="2294">as</wd>

<space/>

<wd l="2890" t="2136" r="3581" b="2294">follows:</wd>

</ln>

</para>

<para l="1675" t="2678" r="5818" b="3446" alignment="justified" li="432" spaceBefore="300" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="2678" r="5818" b="2904" baseLine="2847">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1675" t="2746" r="1882" b="2846">•</wd>

<tab position="1731"/>

<wd l="1882" t="2746" r="2573" b="2894">n-gram:</wd>

<space/>

</run>

<wd l="2688" t="2746" r="2890" b="2885"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">w</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">i</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2971" t="2693" r="3230" b="2851">for</wd>

<space/>

<wd l="3298" t="2698" r="3360" b="2851">i</wd>

<space/>

<wd l="3437" t="2693" r="3610" b="2846">in</wd>

<space/>

</run>

<wd l="3686" t="2678" r="4445" b="2904"><run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">{</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">-1,0,1</run>

<run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">}</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4531" t="2693" r="5558" b="2894">conjunction</wd>

<space/>

<wd l="5630" t="2693" r="5818" b="2851">of</wd>

<space/>

</run>

</ln>

<ln l="1877" t="2938" r="5808" b="3178" baseLine="3118">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1877" t="2966" r="2616" b="3168">previous</wd>

<space/>

<wd l="2683" t="2966" r="3134" b="3125">word</wd>

<space/>

<wd l="3202" t="2966" r="3509" b="3125">and</wd>

<space/>

<wd l="3576" t="2990" r="4190" b="3125">current</wd>

<space/>

<wd l="4253" t="2966" r="4699" b="3125">word</wd>

<space/>

</run>

<wd l="4766" t="2952" r="5472" b="3178"><run underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">w</run>

<run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">i</run>

<run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">−</run>

<run underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">|</run>

<run underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">w</run>

<run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">i</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5549" t="2966" r="5808" b="3125">for</wd>

<space/>

</run>

</ln>

<ln l="1882" t="3221" r="2837" b="3446" baseLine="3389">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1882" t="3240" r="1944" b="3394">i</wd>

<space/>

<wd l="2006" t="3235" r="2179" b="3389">in</wd>

<space/>

</run>

<wd l="2246" t="3221" r="2837" b="3446"><run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">{</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">-1,0</run>

<run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">}</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1675" t="3797" r="5808" b="4267" alignment="justified" li="432" spaceBefore="279" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="3797" r="5808" b="3989" baseLine="3946">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1675" t="3802" r="1877" b="3946">•</wd>

<tab position="1756"/>

<wd l="1877" t="3797" r="2554" b="3955">Affixes:</wd>

<space/>

<wd l="2645" t="3797" r="3336" b="3955">Prefixes</wd>

<space/>

<wd l="3408" t="3797" r="3720" b="3955">and</wd>

<space/>

<wd l="3787" t="3797" r="4440" b="3955">suffixes</wd>

<space/>

<wd l="4507" t="3797" r="4699" b="3955">of</wd>

<space/>

</run>

<wd l="4747" t="3850" r="4978" b="3989"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">x</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-1">i</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="5069" t="3797" r="5405" b="3955">The</wd>

<space/>

<wd l="5472" t="3797" r="5808" b="3955">first</wd>

<space/>

</run>

</ln>

<ln l="1882" t="4066" r="5467" b="4267" baseLine="4219" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1882" t="4066" r="2194" b="4224">and</wd>

<space/>

<wd l="2246" t="4066" r="2549" b="4224">last</wd>

<space/>

<wd l="2606" t="4118" r="2726" b="4224">n</wd>

<space/>

<wd l="2794" t="4066" r="3667" b="4224">characters</wd>

<space/>

<wd l="3730" t="4066" r="4392" b="4267">ranging</wd>

<space/>

<wd l="4450" t="4066" r="4877" b="4224">from</wd>

<space/>

<wd l="4954" t="4070" r="5016" b="4219">1</wd>

<space/>

<wd l="5093" t="4090" r="5256" b="4224">to</wd>

<space/>

<wd l="5318" t="4070" r="5467" b="4224">3.</wd>

</ln>

</para>

<para l="1675" t="4627" r="5803" b="5640" alignment="justified" li="432" spaceBefore="289" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="4627" r="5794" b="4829" baseLine="4776" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1675" t="4632" r="1882" b="4776">•</wd>

<tab position="1756"/>

<wd l="1882" t="4627" r="3144" b="4829">Capitalization:</wd>

<space/>

<wd l="3226" t="4627" r="3734" b="4786">There</wd>

<space/>

<wd l="3787" t="4680" r="4046" b="4786">are</wd>

<space/>

<wd l="4094" t="4651" r="4416" b="4786">two</wd>

<space/>

<wd l="4464" t="4651" r="5146" b="4829">patterns</wd>

<space/>

<wd l="5208" t="4627" r="5395" b="4786">of</wd>

<space/>

<wd l="5434" t="4680" r="5794" b="4829">cap-</wd>

</ln>

<ln l="1877" t="4901" r="5794" b="5102" baseLine="5050" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="4901" r="2794" b="5059">italization:</wd>

<space/>

<wd l="2904" t="4906" r="3259" b="5059">One</wd>

<space/>

<wd l="3326" t="4901" r="3466" b="5059">is</wd>

<space/>

<wd l="3542" t="4954" r="3739" b="5059">an</wd>

<space/>

<wd l="3811" t="4901" r="4589" b="5059">indicator</wd>

<space/>

<wd l="4656" t="4901" r="4843" b="5059">of</wd>

<space/>

<wd l="4901" t="4901" r="5794" b="5102">capitaliza-</wd>

</ln>

<ln l="1877" t="5170" r="5803" b="5357" baseLine="5318" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="5170" r="2218" b="5328">tion</wd>

<space/>

<wd l="2270" t="5170" r="2530" b="5328">for</wd>

<space/>

<wd l="2582" t="5170" r="2846" b="5328">the</wd>

<space/>

<wd l="2909" t="5170" r="3245" b="5328">first</wd>

<space/>

<wd l="3302" t="5170" r="4133" b="5357">character,</wd>

<space/>

<wd l="4205" t="5170" r="4517" b="5328">and</wd>

<space/>

<wd l="4570" t="5170" r="4838" b="5328">the</wd>

<space/>

<wd l="4901" t="5170" r="5347" b="5328">other</wd>

<space/>

<wd l="5400" t="5170" r="5534" b="5328">is</wd>

<space/>

<wd l="5606" t="5222" r="5803" b="5328">an</wd>

<space/>

</ln>

<ln l="1877" t="5438" r="5683" b="5640" baseLine="5592" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="5438" r="2654" b="5597">indicator</wd>

<space/>

<wd l="2712" t="5438" r="2904" b="5597">of</wd>

<space/>

<wd l="2947" t="5438" r="4118" b="5640">capitalization</wd>

<space/>

<wd l="4171" t="5438" r="4430" b="5597">for</wd>

<space/>

<wd l="4488" t="5438" r="4699" b="5597">all</wd>

<space/>

<wd l="4762" t="5438" r="5683" b="5597">characters.</wd>

</ln>

</para>

<para l="1675" t="6000" r="5808" b="7013" alignment="justified" li="432" spaceBefore="289" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="6000" r="5789" b="6202" baseLine="6149" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1675" t="6005" r="1877" b="6149">•</wd>

<tab position="1756"/>

<wd l="1877" t="6000" r="2366" b="6202">Digit:</wd>

<space/>

<wd l="2486" t="6000" r="2995" b="6158">There</wd>

<space/>

<wd l="3067" t="6053" r="3331" b="6158">are</wd>

<space/>

<wd l="3403" t="6000" r="3835" b="6158">three</wd>

<space/>

<wd l="3907" t="6024" r="4589" b="6202">patterns</wd>

<space/>

<wd l="4670" t="6000" r="4925" b="6158">for</wd>

<space/>

<wd l="4992" t="6000" r="5789" b="6158">numbers:</wd>

<space/>

</ln>

<ln l="1877" t="6274" r="5794" b="6475" baseLine="6422" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1877" t="6274" r="2002" b="6470">i)</wd>

<space/>

<wd l="2093" t="6274" r="2851" b="6432">Whether</wd>

<space/>

<wd l="2928" t="6274" r="3192" b="6432">the</wd>

<space/>

<wd l="3283" t="6298" r="3898" b="6432">current</wd>

<space/>

<wd l="3979" t="6274" r="4430" b="6432">word</wd>

<space/>

<wd l="4512" t="6274" r="4795" b="6432">has</wd>

<space/>

<wd l="4891" t="6326" r="4987" b="6432">a</wd>

<space/>

<wd l="5069" t="6274" r="5510" b="6475">digit,</wd>

<space/>

<wd l="5611" t="6274" r="5794" b="6470">ii)</wd>

<space/>

</ln>

<ln l="1877" t="6542" r="5808" b="6744" baseLine="6691" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1877" t="6542" r="2582" b="6701">whether</wd>

<space/>

<wd l="2626" t="6542" r="2890" b="6701">the</wd>

<space/>

<wd l="2942" t="6566" r="3557" b="6701">current</wd>

<space/>

<wd l="3600" t="6542" r="4046" b="6701">word</wd>

<space/>

<wd l="4090" t="6542" r="4229" b="6701">is</wd>

<space/>

<wd l="4286" t="6595" r="4382" b="6701">a</wd>

<space/>

<wd l="4430" t="6542" r="4944" b="6744">single</wd>

<space/>

<wd l="4992" t="6542" r="5434" b="6744">digit,</wd>

<space/>

<wd l="5496" t="6542" r="5808" b="6701">and</wd>

<space/>

</ln>

<ln l="1877" t="6811" r="5693" b="7013" baseLine="6965" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1877" t="6811" r="2122" b="7008">iii)</wd>

<space/>

<wd l="2184" t="6811" r="2894" b="6970">whether</wd>

<space/>

<wd l="2942" t="6811" r="3206" b="6970">the</wd>

<space/>

<wd l="3269" t="6835" r="3883" b="6970">current</wd>

<space/>

<wd l="3936" t="6811" r="4382" b="6970">word</wd>

<space/>

<wd l="4435" t="6811" r="4718" b="6970">has</wd>

<space/>

<wd l="4781" t="6835" r="5102" b="6970">two</wd>

<space/>

<wd l="5165" t="6811" r="5693" b="7013">digits.</wd>

</ln>

</para>

<para l="1675" t="7373" r="5808" b="9202" alignment="justified" li="432" spaceBefore="287" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="7373" r="5808" b="7574" baseLine="7522" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="7378" r="1877" b="7522">•</wd>

<tab position="1756"/>

<wd l="1877" t="7373" r="3106" b="7574">Non-alphabet:</wd>

<space/>

<wd l="3341" t="7373" r="4094" b="7531">Whether</wd>

<space/>

<wd l="4219" t="7373" r="4483" b="7531">the</wd>

<space/>

<wd l="4618" t="7397" r="5232" b="7531">current</wd>

<space/>

<wd l="5362" t="7373" r="5808" b="7531">word</wd>

<space/>

</ln>

<ln l="1882" t="7646" r="5808" b="7848" baseLine="7795" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="7646" r="2597" b="7805">contains</wd>

<space/>

<wd l="2741" t="7699" r="2837" b="7805">a</wd>

<space/>

<wd l="2966" t="7646" r="3610" b="7848">hyphen</wd>

<space/>

<wd l="3749" t="7646" r="4061" b="7805">and</wd>

<space/>

<wd l="4200" t="7646" r="4646" b="7805">other</wd>

<space/>

<wd l="4776" t="7646" r="5808" b="7848">punctuation</wd>

<space/>

</ln>

<ln l="1877" t="7915" r="5798" b="8117" baseLine="8064" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="7915" r="2453" b="8074">marks.</wd>

<space/>

<wd l="2582" t="7920" r="3235" b="8117">Among</wd>

<space/>

<wd l="3312" t="7915" r="3576" b="8074">the</wd>

<space/>

<wd l="3653" t="7915" r="4104" b="8074">other</wd>

<space/>

<wd l="4171" t="7915" r="5203" b="8117">punctuation</wd>

<space/>

<wd l="5270" t="7915" r="5798" b="8074">marks</wd>

<space/>

</ln>

<ln l="1877" t="8184" r="5798" b="8386" baseLine="8338" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="8184" r="2016" b="8342">is</wd>

<space/>

<wd l="2136" t="8184" r="2400" b="8342">the</wd>

<space/>

<wd l="2520" t="8184" r="3250" b="8381">colon(:).</wd>

<space/>

<wd l="3499" t="8189" r="3686" b="8338">In</wd>

<space/>

<wd l="3802" t="8184" r="4483" b="8386">general,</wd>

<space/>

<wd l="4618" t="8184" r="5045" b="8342">what</wd>

<space/>

<wd l="5155" t="8184" r="5798" b="8342">follows</wd>

<space/>

</ln>

<ln l="1877" t="8458" r="5803" b="8659" baseLine="8606" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="8458" r="2290" b="8659">right</wd>

<space/>

<wd l="2366" t="8458" r="2765" b="8616">after</wd>

<space/>

<wd l="2837" t="8510" r="2933" b="8616">a</wd>

<space/>

<wd l="3005" t="8458" r="3485" b="8616">colon</wd>

<space/>

<wd l="3557" t="8458" r="4003" b="8616">mark</wd>

<space/>

<wd l="4075" t="8482" r="4954" b="8659">represents</wd>

<space/>

<wd l="5035" t="8510" r="5131" b="8616">a</wd>

<space/>

<wd l="5198" t="8458" r="5803" b="8616">feature</wd>

<space/>

</ln>

<ln l="1877" t="8726" r="5794" b="8928" baseLine="8880" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="8726" r="2515" b="8928">weight.</wd>

<space/>

<wd l="2659" t="8731" r="2880" b="8885">To</wd>

<space/>

<wd l="2962" t="8726" r="3432" b="8885">make</wd>

<space/>

<wd l="3509" t="8726" r="3778" b="8885">the</wd>

<space/>

<wd l="3854" t="8726" r="4397" b="8885">model</wd>

<space/>

<wd l="4478" t="8726" r="4910" b="8885">learn</wd>

<space/>

<wd l="4997" t="8726" r="5794" b="8928">correctly,</wd>

<space/>

</ln>

<ln l="1877" t="9000" r="4906" b="9202" baseLine="9149" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="9053" r="2131" b="9158">we</wd>

<space/>

<wd l="2184" t="9000" r="3058" b="9158">normalize</wd>

<space/>

<wd l="3115" t="9000" r="3499" b="9202">only</wd>

<space/>

<wd l="3557" t="9000" r="3821" b="9158">the</wd>

<space/>

<wd l="3883" t="9000" r="4363" b="9158">colon</wd>

<space/>

<wd l="4416" t="9000" r="4906" b="9158">mark.</wd>

</ln>

</para>

<para l="1440" t="9557" r="3912" b="9758" alignment="left" spaceBefore="312" lsp="exactly" lspExact="250" language="en">

<ln l="1440" t="9557" r="3912" b="9758" baseLine="9710" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">

<wd l="1440" t="9557" r="1709" b="9715">4.2</wd>

<space/>

<wd l="1930" t="9557" r="2347" b="9715">POS</wd>

<space/>

<wd l="2410" t="9571" r="2784" b="9758">tags</wd>

<space/>

<wd l="2846" t="9562" r="3192" b="9715">and</wd>

<space/>

<wd l="3250" t="9562" r="3912" b="9715">chunks</wd>

</ln>

</para>

<para l="1440" t="9965" r="5808" b="12830" alignment="justified" spaceBefore="134" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="9965" r="5808" b="10166" baseLine="10114" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="9970" r="1622" b="10118">In</wd>

<space/>

<wd l="1714" t="9965" r="1978" b="10123">the</wd>

<space/>

<wd l="2074" t="9970" r="2506" b="10123">NER</wd>

<space/>

<wd l="2602" t="9965" r="2995" b="10152">task,</wd>

<space/>

<wd l="3110" t="9970" r="3499" b="10123">POS</wd>

<space/>

<wd l="3600" t="9989" r="3946" b="10166">tags</wd>

<space/>

<wd l="4051" t="9965" r="4363" b="10123">and</wd>

<space/>

<wd l="4459" t="9965" r="5064" b="10123">chunks</wd>

<space/>

<wd l="5170" t="9965" r="5808" b="10123">contain</wd>

<space/>

</ln>

<ln l="1440" t="10234" r="5803" b="10435" baseLine="10382" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10286" r="1819" b="10435">very</wd>

<space/>

<wd l="1872" t="10234" r="2400" b="10392">useful</wd>

<space/>

<wd l="2453" t="10234" r="3485" b="10392">information</wd>

<space/>

<wd l="3528" t="10234" r="3787" b="10392">for</wd>

<space/>

<wd l="3835" t="10234" r="4445" b="10435">finding</wd>

<space/>

<wd l="4502" t="10234" r="4814" b="10392">and</wd>

<space/>

<wd l="4867" t="10234" r="5803" b="10435">classifying</wd>

<space/>

</ln>

<ln l="1440" t="10502" r="5798" b="10704" baseLine="10656" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10502" r="2021" b="10661">named</wd>

<space/>

<wd l="2098" t="10502" r="2765" b="10661">entities.</wd>

<space/>

<wd l="2885" t="10507" r="3168" b="10661">We</wd>

<space/>

<wd l="3240" t="10502" r="3850" b="10704">predict</wd>

<space/>

<wd l="3917" t="10507" r="4306" b="10661">POS</wd>

<space/>

<wd l="4382" t="10526" r="4728" b="10704">tags</wd>

<space/>

<wd l="4810" t="10502" r="5122" b="10661">and</wd>

<space/>

<wd l="5194" t="10502" r="5798" b="10661">chunks</wd>

<space/>

</ln>

<ln l="1440" t="10776" r="5808" b="10978" baseLine="10925" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10776" r="1656" b="10978">by</wd>

<space/>

<wd l="1738" t="10776" r="2208" b="10978">using</wd>

<space/>

<wd l="2294" t="10829" r="2390" b="10934">a</wd>

<space/>

<wd l="2467" t="10776" r="3010" b="10934">model</wd>

<space/>

<wd l="3091" t="10776" r="3696" b="10934">trained</wd>

<space/>

<wd l="3773" t="10776" r="4166" b="10934">with</wd>

<space/>

<wd l="4243" t="10776" r="4872" b="10934">Twitter</wd>

<space/>

<wd l="4949" t="10776" r="5352" b="10934">data.</wd>

<space/>

<wd l="5506" t="10781" r="5808" b="10934">For</wd>

<space/>

</ln>

<ln l="1440" t="11045" r="5808" b="11246" baseLine="11198" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11050" r="1829" b="11203">POS</wd>

<space/>

<wd l="1915" t="11069" r="2309" b="11246">tags,</wd>

<space/>

<wd l="2400" t="11098" r="2654" b="11203">we</wd>

<space/>

<wd l="2731" t="11098" r="3019" b="11203">use</wd>

<space/>

<wd l="3101" t="11098" r="3197" b="11203">a</wd>

<space/>

<wd l="3264" t="11045" r="3806" b="11203">model</wd>

<space/>

<wd l="3883" t="11045" r="4493" b="11203">trained</wd>

<space/>

<wd l="4565" t="11045" r="4954" b="11203">with</wd>

<space/>

<wd l="5030" t="11045" r="5294" b="11203">the</wd>

<space/>

<wd l="5371" t="11050" r="5808" b="11203">Penn</wd>

<space/>

</ln>

<ln l="1440" t="11318" r="5808" b="11520" baseLine="11467" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11318" r="2741" b="11520">Treebank-style</wd>

<space/>

<wd l="2832" t="11342" r="3341" b="11520">tagset</wd>

<space/>

<wd l="3437" t="11318" r="4003" b="11515">(Ritter</wd>

<space/>

<wd l="4094" t="11342" r="4248" b="11477">et</wd>

<space/>

<wd l="4339" t="11318" r="4589" b="11506">al.,</wd>

<space/>

<wd l="4704" t="11323" r="5251" b="11515">2011).</wd>

<space/>

<wd l="5438" t="11323" r="5621" b="11472">In</wd>

<space/>

<wd l="5712" t="11371" r="5808" b="11477">a</wd>

<space/>

</ln>

<ln l="1440" t="11587" r="5803" b="11789" baseLine="11741" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11587" r="2030" b="11774">model,</wd>

<space/>

<wd l="2155" t="11640" r="2606" b="11746">some</wd>

<space/>

<wd l="2702" t="11587" r="4056" b="11789">Twitter-specific</wd>

<space/>

<wd l="4162" t="11611" r="4502" b="11789">tags</wd>

<space/>

<wd l="4613" t="11640" r="4872" b="11746">are</wd>

<space/>

<wd l="4973" t="11587" r="5491" b="11746">added</wd>

<space/>

<wd l="5587" t="11587" r="5803" b="11789">by</wd>

<space/>

</ln>

<ln l="1440" t="11861" r="5794" b="12058" baseLine="12010" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11861" r="1939" b="12019">Ritter</wd>

<space/>

<wd l="1992" t="11885" r="2146" b="12019">et</wd>

<space/>

<wd l="2198" t="11861" r="2395" b="12019">al.</wd>

<space/>

<wd l="2467" t="11866" r="3082" b="12058">(2011):</wd>

<space/>

<wd l="3163" t="11885" r="3936" b="12048">retweets,</wd>

<space/>

<wd l="4022" t="11866" r="5160" b="12048">@usernames,</wd>

<space/>

<wd l="5222" t="11861" r="5794" b="12019">#hash-</wd>

</ln>

<ln l="1440" t="12130" r="5803" b="12331" baseLine="12283" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="12154" r="1834" b="12331">tags,</wd>

<space/>

<wd l="1910" t="12130" r="2222" b="12288">and</wd>

<space/>

<wd l="2285" t="12130" r="2654" b="12288">urls.</wd>

<space/>

<wd l="2750" t="12134" r="3053" b="12288">For</wd>

<space/>

<wd l="3115" t="12130" r="3773" b="12317">chunks,</wd>

<space/>

<wd l="3845" t="12182" r="4099" b="12288">we</wd>

<space/>

<wd l="4157" t="12182" r="4450" b="12288">use</wd>

<space/>

<wd l="4512" t="12182" r="4608" b="12288">a</wd>

<space/>

<wd l="4666" t="12130" r="5251" b="12288">named</wd>

<space/>

<wd l="5314" t="12130" r="5803" b="12331">entity</wd>

<space/>

</ln>

<ln l="1440" t="12365" r="5803" b="12605" baseLine="12549">

<wd l="1440" t="12365" r="2059" b="12605"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">tagger</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">3</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="2141" t="12403" r="2357" b="12605">by</wd>

<space/>

<wd l="2424" t="12403" r="2928" b="12562">Ritter</wd>

<space/>

<wd l="2995" t="12427" r="3149" b="12562">et</wd>

<space/>

<wd l="3216" t="12403" r="3413" b="12562">al.</wd>

<space/>

<wd l="3499" t="12408" r="4118" b="12600">(2012).</wd>

<space/>

<wd l="4229" t="12403" r="5054" b="12562">Predicted</wd>

<space/>

<wd l="5122" t="12427" r="5462" b="12605">tags</wd>

<space/>

<wd l="5544" t="12456" r="5803" b="12562">are</wd>

<space/>

</run>

</ln>

<ln l="1440" t="12672" r="3806" b="12830" baseLine="12826" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="12672" r="1843" b="12830">used</wd>

<space/>

<wd l="1901" t="12725" r="2069" b="12830">as</wd>

<space/>

<wd l="2131" t="12672" r="2813" b="12830">features</wd>

<space/>

<wd l="2880" t="12725" r="3048" b="12830">as</wd>

<space/>

<wd l="3110" t="12672" r="3806" b="12830">follows:</wd>

</ln>

</para>

<para l="1675" t="13234" r="5794" b="13714" alignment="justified" li="432" spaceBefore="298" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="13234" r="5794" b="13435" baseLine="13382" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="13238" r="1877" b="13382">•</wd>

<tab position="1756"/>

<wd l="1877" t="13238" r="2266" b="13392">POS</wd>

<space/>

<wd l="2342" t="13258" r="2650" b="13435">tag:</wd>

<space/>

<wd l="2760" t="13286" r="2856" b="13392">a</wd>

<space/>

<wd l="2918" t="13234" r="3946" b="13435">conjunction</wd>

<space/>

<wd l="4008" t="13234" r="4613" b="13392">feature</wd>

<space/>

<wd l="4675" t="13234" r="5064" b="13392">with</wd>

<space/>

<wd l="5126" t="13234" r="5395" b="13392">the</wd>

<space/>

<wd l="5462" t="13286" r="5794" b="13392">cur-</wd>

</ln>

<ln l="1877" t="13488" r="5467" b="13714" baseLine="13657">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1877" t="13526" r="2218" b="13661">rent</wd>

<space/>

<wd l="2270" t="13502" r="2717" b="13661">word</wd>

<space/>

<wd l="2774" t="13502" r="3086" b="13661">and</wd>

<space/>

<wd l="3139" t="13502" r="3408" b="13661">the</wd>

<space/>

<wd l="3466" t="13526" r="4080" b="13661">current</wd>

<space/>

<wd l="4133" t="13507" r="4522" b="13661">POS</wd>

<space/>

<wd l="4589" t="13526" r="4853" b="13704">tag</wd>

<space/>

</run>

<wd l="4915" t="13488" r="5467" b="13714"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">w</run>

<run underlined="none" subsuperscript="none" fontSize="750" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">0</run>

<run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">|</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">p</run>

<run underlined="none" subsuperscript="none" fontSize="750" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">0</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1675" t="14059" r="5808" b="14818" alignment="justified" li="432" spaceBefore="287" spaceAfter="210" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="14064" r="5803" b="14266" baseLine="14213" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="14069" r="1882" b="14213">•</wd>

<tab position="1756"/>

<wd l="1882" t="14064" r="2458" b="14222">Chunk</wd>

<space/>

<wd l="2530" t="14088" r="2842" b="14266">tag:</wd>

<space/>

<wd l="2966" t="14117" r="3062" b="14222">a</wd>

<space/>

<wd l="3130" t="14064" r="3859" b="14266">unigram</wd>

<space/>

<wd l="3931" t="14064" r="4536" b="14222">feature</wd>

<space/>

<wd l="4608" t="14064" r="4867" b="14222">for</wd>

<space/>

<wd l="4939" t="14064" r="5467" b="14222">chunk</wd>

<space/>

<wd l="5539" t="14088" r="5803" b="14266">tag</wd>

<space/>

</ln>

<ln l="1882" t="14333" r="5808" b="14534" baseLine="14487">

<wd l="1882" t="14386" r="2054" b="14525"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">c</run>

<run underlined="none" subsuperscript="none" fontSize="750" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">0</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="750" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2131" t="14333" r="2443" b="14491">and</wd>

<space/>

<wd l="2506" t="14386" r="2602" b="14491">a</wd>

<space/>

<wd l="2664" t="14333" r="3691" b="14534">conjunction</wd>

<space/>

<wd l="3749" t="14333" r="4354" b="14491">feature</wd>

<space/>

<wd l="4411" t="14333" r="4800" b="14491">with</wd>

<space/>

<wd l="4862" t="14333" r="5126" b="14491">the</wd>

<space/>

<wd l="5194" t="14357" r="5808" b="14491">current</wd>

<space/>

</run>

</ln>

<ln l="1877" t="14592" r="5194" b="14818" baseLine="14756">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1877" t="14606" r="2323" b="14765">word</wd>

<space/>

<wd l="2381" t="14606" r="2693" b="14765">and</wd>

<space/>

<wd l="2746" t="14606" r="3014" b="14765">the</wd>

<space/>

<wd l="3072" t="14630" r="3686" b="14765">current</wd>

<space/>

<wd l="3744" t="14606" r="4277" b="14765">chunk</wd>

<space/>

<wd l="4330" t="14630" r="4594" b="14808">tag</wd>

<space/>

</run>

<wd l="4656" t="14592" r="5194" b="14818"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">w</run>

<run underlined="none" subsuperscript="none" fontSize="750" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">0</run>

<run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">|</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">c</run>

<run underlined="none" subsuperscript="none" fontSize="750" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">0</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<rulerline l="1437" t="15048" r="2640" b="15048" type="single" width="10" color="000000"/>

<para l="1699" t="15101" r="4354" b="15302" alignment="left" li="216" spaceBefore="58" spaceAfter="14" lsp="exactly" lspExact="207" language="en">

<ln l="1699" t="15101" r="4354" b="15302" baseLine="15257">

<wd l="1699" t="15101" r="4066" b="15302"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">3</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">https://github.com/aritter/twitter</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4128" t="15134" r="4354" b="15302">nlp</wd>

</run>

</ln>

</para>

</column>

<column l="6144" t="1260" r="10531" b="15333">

<para l="6144" t="1320" r="8232" b="1522" alignment="left" spaceBefore="22" lsp="exactly" lspExact="250" language="en">

<ln l="6144" t="1320" r="8232" b="1522" baseLine="1474" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">

<wd l="6144" t="1320" r="6413" b="1478">4.3</wd>

<space/>

<wd l="6638" t="1325" r="7258" b="1478">Brown</wd>

<space/>

<wd l="7320" t="1320" r="8232" b="1522">clustering</wd>

</ln>

</para>

<para l="6144" t="1670" r="10526" b="3187" alignment="justified" spaceBefore="77" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="1670" r="10507" b="1872" baseLine="1824" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1675" r="6734" b="1829">Brown</wd>

<space/>

<wd l="6898" t="1670" r="7747" b="1872">clustering</wd>

<space/>

<wd l="7910" t="1670" r="8045" b="1829">is</wd>

<space/>

<wd l="8213" t="1723" r="8309" b="1829">a</wd>

<space/>

<wd l="8462" t="1670" r="9490" b="1829">hierarchical</wd>

<space/>

<wd l="9658" t="1670" r="10507" b="1872">clustering</wd>

<space/>

</ln>

<ln l="6144" t="1944" r="10526" b="2146" baseLine="2093" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1944" r="6802" b="2102">method</wd>

<space/>

<wd l="6893" t="1944" r="7224" b="2102">that</wd>

<space/>

<wd l="7320" t="1997" r="7901" b="2146">groups</wd>

<space/>

<wd l="8006" t="1944" r="8530" b="2102">words</wd>

<space/>

<wd l="8630" t="1944" r="8966" b="2102">into</wd>

<space/>

<wd l="9067" t="1997" r="9163" b="2102">a</wd>

<space/>

<wd l="9254" t="1944" r="9811" b="2146">binary</wd>

<space/>

<wd l="9907" t="1968" r="10234" b="2102">tree</wd>

<space/>

<wd l="10334" t="1944" r="10526" b="2102">of</wd>

<space/>

</ln>

<ln l="6149" t="2213" r="10517" b="2410" baseLine="2366" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="2213" r="6744" b="2371">classes</wd>

<space/>

<wd l="6845" t="2218" r="7498" b="2410">(Brown</wd>

<space/>

<wd l="7584" t="2237" r="7738" b="2371">et</wd>

<space/>

<wd l="7829" t="2213" r="8078" b="2400">al.,</wd>

<space/>

<wd l="8203" t="2218" r="8731" b="2410">1992).</wd>

<space/>

<wd l="8899" t="2218" r="9182" b="2371">We</wd>

<space/>

<wd l="9274" t="2213" r="10330" b="2371">downloaded</wd>

<space/>

<wd l="10421" t="2266" r="10517" b="2371">a</wd>

<space/>

</ln>

<ln l="6144" t="2448" r="10507" b="2688" baseLine="2631">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="2486" r="6701" b="2645">brown</wd>

<space/>

</run>

<wd l="6744" t="2448" r="7680" b="2688"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">clustering</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">4</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7733" t="2486" r="8232" b="2645">based</wd>

<space/>

<wd l="8280" t="2539" r="8491" b="2645">on</wd>

<space/>

<wd l="8534" t="2486" r="9437" b="2688">Wikipedia</wd>

<space/>

<wd l="9475" t="2486" r="10253" b="2688">provided</wd>

<space/>

<wd l="10291" t="2486" r="10507" b="2688">by</wd>

<space/>

</run>

</ln>

<ln l="6144" t="2755" r="10526" b="2957" baseLine="2904" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2755" r="6715" b="2914">Turian</wd>

<space/>

<wd l="6792" t="2779" r="6946" b="2914">et</wd>

<space/>

<wd l="7018" t="2755" r="7214" b="2914">al.</wd>

<space/>

<wd l="7301" t="2760" r="7920" b="2952">(2010).</wd>

<space/>

<wd l="8040" t="2760" r="8323" b="2914">We</wd>

<space/>

<wd l="8395" t="2755" r="8794" b="2914">used</wd>

<space/>

<wd l="8861" t="2755" r="9394" b="2914">whole</wd>

<space/>

<wd l="9466" t="2755" r="9696" b="2914">bit</wd>

<space/>

<wd l="9773" t="2755" r="10258" b="2957">string</wd>

<space/>

<wd l="10334" t="2755" r="10526" b="2914">of</wd>

<space/>

</ln>

<ln l="6144" t="3029" r="7627" b="3187" baseLine="3178" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3029" r="6413" b="3187">the</wd>

<space/>

<wd l="6470" t="3053" r="7085" b="3187">current</wd>

<space/>

<wd l="7138" t="3029" r="7627" b="3187">word.</wd>

</ln>

</para>

<para l="6144" t="3470" r="8568" b="3672" alignment="left" spaceBefore="197" lsp="exactly" lspExact="250" language="en">

<ln l="6144" t="3470" r="8568" b="3672" baseLine="3624" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">

<wd l="6144" t="3470" r="6413" b="3629">4.4</wd>

<space/>

<wd l="6638" t="3475" r="7166" b="3629">Word</wd>

<space/>

<wd l="7224" t="3470" r="8568" b="3672">representation</wd>

</ln>

</para>

<para l="6144" t="3821" r="10512" b="9715" alignment="justified" spaceBefore="75" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="3821" r="10507" b="4022" baseLine="3970" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="3826" r="6379" b="3979">As</wd>

<space/>

<wd l="6461" t="3874" r="6557" b="3979">a</wd>

<space/>

<wd l="6614" t="3874" r="6970" b="3979">new</wd>

<space/>

<wd l="7051" t="3874" r="7651" b="4008">source,</wd>

<space/>

<wd l="7733" t="3845" r="8208" b="3979">tweet</wd>

<space/>

<wd l="8275" t="3821" r="8640" b="3979">data</wd>

<space/>

<wd l="8707" t="3874" r="8966" b="3979">are</wd>

<space/>

<wd l="9034" t="3845" r="9312" b="3979">not</wd>

<space/>

<wd l="9384" t="3821" r="10277" b="4022">applicable</wd>

<space/>

<wd l="10339" t="3845" r="10507" b="3979">to</wd>

<space/>

</ln>

<ln l="6144" t="4094" r="10512" b="4253" baseLine="4243" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="4094" r="6413" b="4253">the</wd>

<space/>

<wd l="6475" t="4094" r="7368" b="4253">traditional</wd>

<space/>

<wd l="7435" t="4094" r="7978" b="4253">model</wd>

<space/>

<wd l="8045" t="4094" r="8736" b="4253">because</wd>

<space/>

<wd l="8808" t="4094" r="8995" b="4253">of</wd>

<space/>

<wd l="9048" t="4094" r="9312" b="4253">the</wd>

<space/>

<wd l="9384" t="4094" r="10123" b="4253">different</wd>

<space/>

<wd l="10186" t="4118" r="10512" b="4253">text</wd>

<space/>

</ln>

<ln l="6154" t="4363" r="10512" b="4550" baseLine="4512" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="4387" r="6950" b="4522">structure.</wd>

<space/>

<wd l="7128" t="4368" r="7430" b="4522">For</wd>

<space/>

<wd l="7517" t="4416" r="7613" b="4522">a</wd>

<space/>

<wd l="7694" t="4416" r="8050" b="4522">new</wd>

<space/>

<wd l="8141" t="4363" r="8726" b="4550">model,</wd>

<space/>

<wd l="8832" t="4363" r="8957" b="4522">it</wd>

<space/>

<wd l="9038" t="4363" r="9178" b="4522">is</wd>

<space/>

<wd l="9274" t="4363" r="9874" b="4522">natural</wd>

<space/>

<wd l="9965" t="4387" r="10133" b="4522">to</wd>

<space/>

<wd l="10219" t="4416" r="10512" b="4522">use</wd>

<space/>

</ln>

<ln l="6149" t="4632" r="10512" b="4819" baseLine="4786" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="4632" r="6994" b="4790">annotated</wd>

<space/>

<wd l="7080" t="4632" r="7478" b="4790">data.</wd>

<space/>

<wd l="7632" t="4637" r="8453" b="4819">However,</wd>

<space/>

<wd l="8549" t="4632" r="8674" b="4790">it</wd>

<space/>

<wd l="8750" t="4632" r="8890" b="4790">is</wd>

<space/>

<wd l="8981" t="4632" r="9662" b="4790">difficult</wd>

<space/>

<wd l="9739" t="4656" r="9907" b="4790">to</wd>

<space/>

<wd l="9994" t="4656" r="10512" b="4790">create</wd>

<space/>

</ln>

<ln l="6144" t="4906" r="10498" b="5107" baseLine="5054" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="4958" r="6499" b="5064">new</wd>

<space/>

<wd l="6566" t="4906" r="7195" b="5064">labeled</wd>

<space/>

<wd l="7262" t="4906" r="7627" b="5064">data</wd>

<space/>

<wd l="7685" t="4906" r="7944" b="5064">for</wd>

<space/>

<wd l="8006" t="4958" r="8102" b="5064">a</wd>

<space/>

<wd l="8160" t="4906" r="8611" b="5107">rapid</wd>

<space/>

<wd l="8678" t="4906" r="9595" b="5107">generation</wd>

<space/>

<wd l="9658" t="4906" r="9850" b="5064">of</wd>

<space/>

<wd l="9898" t="4930" r="10498" b="5064">tweets.</wd>

<space/>

</ln>

<ln l="6144" t="5174" r="10502" b="5376" baseLine="5328" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="5174" r="6778" b="5333">Instead</wd>

<space/>

<wd l="6850" t="5174" r="7042" b="5333">of</wd>

<space/>

<wd l="7099" t="5174" r="7987" b="5376">constantly</wd>

<space/>

<wd l="8064" t="5198" r="8798" b="5333">annotate</wd>

<space/>

<wd l="8870" t="5227" r="9226" b="5333">new</wd>

<space/>

<wd l="9302" t="5174" r="9706" b="5362">data,</wd>

<space/>

<wd l="9787" t="5174" r="10051" b="5333">the</wd>

<space/>

<wd l="10128" t="5227" r="10502" b="5376">gen-</wd>

</ln>

<ln l="6149" t="5448" r="10502" b="5650" baseLine="5597" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="5448" r="6470" b="5606">eral</wd>

<space/>

<wd l="6547" t="5448" r="7238" b="5606">solution</wd>

<space/>

<wd l="7301" t="5448" r="7440" b="5606">is</wd>

<space/>

<wd l="7517" t="5448" r="8213" b="5650">creating</wd>

<space/>

<wd l="8280" t="5448" r="8971" b="5606">induced</wd>

<space/>

<wd l="9034" t="5448" r="9480" b="5606">word</wd>

<space/>

<wd l="9542" t="5472" r="10502" b="5650">representa-</wd>

</ln>

<ln l="6144" t="5717" r="10507" b="5918" baseLine="5870" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="5717" r="6562" b="5875">tions</wd>

<space/>

<wd l="6614" t="5717" r="7042" b="5875">from</wd>

<space/>

<wd l="7085" t="5770" r="7181" b="5875">a</wd>

<space/>

<wd l="7219" t="5717" r="7651" b="5918">large</wd>

<space/>

<wd l="7694" t="5717" r="8126" b="5918">body</wd>

<space/>

<wd l="8174" t="5717" r="8366" b="5875">of</wd>

<space/>

<wd l="8395" t="5717" r="9245" b="5875">unlabeled</wd>

<space/>

<wd l="9293" t="5717" r="9653" b="5875">data</wd>

<space/>

<wd l="9701" t="5717" r="10507" b="5914">(Mikolov</wd>

<space/>

</ln>

<ln l="6149" t="5990" r="10498" b="6192" baseLine="6139" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="6014" r="6307" b="6149">et</wd>

<space/>

<wd l="6384" t="5990" r="6634" b="6178">al.,</wd>

<space/>

<wd l="6734" t="5995" r="7210" b="6178">2013;</wd>

<space/>

<wd l="7310" t="5990" r="8309" b="6192">Pennington</wd>

<space/>

<wd l="8386" t="6014" r="8539" b="6149">et</wd>

<space/>

<wd l="8621" t="5990" r="8870" b="6178">al.,</wd>

<space/>

<wd l="8966" t="5995" r="9446" b="6178">2014;</wd>

<space/>

<wd l="9552" t="5990" r="9936" b="6144">Kim</wd>

<space/>

<wd l="10018" t="6014" r="10171" b="6149">et</wd>

<space/>

<wd l="10248" t="5990" r="10498" b="6178">al.,</wd>

<space/>

</ln>

<ln l="6149" t="6259" r="10502" b="6461" baseLine="6413" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="6264" r="6629" b="6446">2014;</wd>

<space/>

<wd l="6734" t="6259" r="7814" b="6418">Anastasakos</wd>

<space/>

<wd l="7906" t="6283" r="8059" b="6418">et</wd>

<space/>

<wd l="8141" t="6259" r="8390" b="6446">al.,</wd>

<space/>

<wd l="8491" t="6264" r="9038" b="6456">2014).</wd>

<space/>

<wd l="9192" t="6264" r="9350" b="6413">A</wd>

<space/>

<wd l="9427" t="6259" r="9658" b="6418">lot</wd>

<space/>

<wd l="9739" t="6259" r="9931" b="6418">of</wd>

<space/>

<wd l="9994" t="6259" r="10502" b="6461">previ-</wd>

</ln>

<ln l="6149" t="6533" r="10502" b="6734" baseLine="6682" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="6586" r="6442" b="6691">ous</wd>

<space/>

<wd l="6518" t="6533" r="6970" b="6691">work</wd>

<space/>

<wd l="7037" t="6533" r="7440" b="6691">have</wd>

<space/>

<wd l="7512" t="6533" r="7915" b="6691">used</wd>

<space/>

<wd l="7987" t="6538" r="8434" b="6691">CCA</wd>

<space/>

<wd l="8506" t="6533" r="9192" b="6691">because</wd>

<space/>

<wd l="9269" t="6533" r="9461" b="6691">of</wd>

<space/>

<wd l="9518" t="6533" r="9715" b="6691">its</wd>

<space/>

<wd l="9806" t="6533" r="10502" b="6734">simplic-</wd>

</ln>

<ln l="6144" t="6802" r="10498" b="7003" baseLine="6950" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="6802" r="6374" b="7003">ity</wd>

<space/>

<wd l="6451" t="6802" r="6763" b="6960">and</wd>

<space/>

<wd l="6840" t="6802" r="7704" b="7003">generality</wd>

<space/>

<wd l="7786" t="6802" r="8242" b="6998">(Kim</wd>

<space/>

<wd l="8314" t="6826" r="8472" b="6960">et</wd>

<space/>

<wd l="8544" t="6802" r="8794" b="6989">al.,</wd>

<space/>

<wd l="8885" t="6802" r="9461" b="6989">2015c;</wd>

<space/>

<wd l="9562" t="6802" r="9946" b="6955">Kim</wd>

<space/>

<wd l="10022" t="6826" r="10176" b="6960">et</wd>

<space/>

<wd l="10248" t="6802" r="10498" b="6989">al.,</wd>

<space/>

</ln>

<ln l="6149" t="7075" r="10512" b="7272" baseLine="7224" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="7075" r="6739" b="7262">2015d;</wd>

<space/>

<wd l="6806" t="7080" r="7402" b="7234">Stratos</wd>

<space/>

<wd l="7464" t="7099" r="7618" b="7234">et</wd>

<space/>

<wd l="7670" t="7075" r="7920" b="7262">al.,</wd>

<space/>

<wd l="7987" t="7080" r="8462" b="7262">2014;</wd>

<space/>

<wd l="8534" t="7075" r="8918" b="7229">Kim</wd>

<space/>

<wd l="8971" t="7099" r="9125" b="7234">et</wd>

<space/>

<wd l="9178" t="7075" r="9427" b="7262">al.,</wd>

<space/>

<wd l="9494" t="7075" r="10147" b="7272">2015b).</wd>

<space/>

<wd l="10224" t="7080" r="10512" b="7234">We</wd>

<space/>

</ln>

<ln l="6149" t="7344" r="10502" b="7546" baseLine="7493" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="7368" r="6667" b="7502">create</wd>

<space/>

<wd l="6744" t="7397" r="6840" b="7502">a</wd>

<space/>

<wd l="6912" t="7344" r="7358" b="7502">word</wd>

<space/>

<wd l="7430" t="7344" r="8669" b="7546">representation</wd>

<space/>

<wd l="8741" t="7344" r="8952" b="7546">by</wd>

<space/>

<wd l="9029" t="7344" r="9499" b="7546">using</wd>

<space/>

<wd l="9576" t="7344" r="9845" b="7502">the</wd>

<space/>

<wd l="9922" t="7397" r="10502" b="7502">canon-</wd>

</ln>

<ln l="6144" t="7613" r="10502" b="7814" baseLine="7766" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="7613" r="6456" b="7771">ical</wd>

<space/>

<wd l="6552" t="7613" r="7493" b="7771">correlation</wd>

<space/>

<wd l="7584" t="7613" r="8275" b="7814">analysis</wd>

<space/>

<wd l="8376" t="7613" r="9307" b="7814">(Hotelling,</wd>

<space/>

<wd l="9437" t="7613" r="9965" b="7810">1936).</wd>

<space/>

<wd l="10138" t="7618" r="10502" b="7771">Fur-</wd>

</ln>

<ln l="6144" t="7886" r="10498" b="8088" baseLine="8035" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="7886" r="6974" b="8074">thermore,</wd>

<space/>

<wd l="7061" t="7886" r="7507" b="8045">word</wd>

<space/>

<wd l="7584" t="7886" r="8626" b="8088">embeddings</wd>

<space/>

<wd l="8707" t="7939" r="8966" b="8045">are</wd>

<space/>

<wd l="9038" t="7886" r="9730" b="8045">induced</wd>

<space/>

<wd l="9797" t="7886" r="10224" b="8045">from</wd>

<space/>

<wd l="10315" t="7891" r="10498" b="8045">13</wd>

<space/>

</ln>

<ln l="6144" t="8155" r="10512" b="8357" baseLine="8309" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="8155" r="6778" b="8314">million</wd>

<space/>

<wd l="6830" t="8179" r="7378" b="8314">tweets</wd>

<space/>

<wd l="7445" t="8155" r="8357" b="8357">containing</wd>

<space/>

<wd l="8419" t="8160" r="8741" b="8314">270</wd>

<space/>

<wd l="8798" t="8155" r="9432" b="8314">million</wd>

<space/>

<wd l="9480" t="8155" r="10094" b="8314">tokens.</wd>

<space/>

<wd l="10171" t="8155" r="10512" b="8314">The</wd>

<space/>

</ln>

<ln l="6149" t="8429" r="10512" b="8630" baseLine="8578" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="8429" r="7056" b="8587">dimension</wd>

<space/>

<wd l="7104" t="8429" r="7296" b="8587">of</wd>

<space/>

<wd l="7330" t="8429" r="7776" b="8587">word</wd>

<space/>

<wd l="7824" t="8429" r="8866" b="8630">embeddings</wd>

<space/>

<wd l="8923" t="8482" r="9173" b="8587">we</wd>

<space/>

<wd l="9221" t="8429" r="9624" b="8587">used</wd>

<space/>

<wd l="9667" t="8429" r="9806" b="8587">is</wd>

<space/>

<wd l="9864" t="8429" r="10075" b="8587">50</wd>

<space/>

<wd l="10123" t="8429" r="10512" b="8587">with</wd>

<space/>

</ln>

<ln l="6144" t="8693" r="10512" b="8899" baseLine="8851" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="8698" r="6667" b="8856">words</wd>

<space/>

<wd l="6734" t="8698" r="7565" b="8899">occurring</wd>

<space/>

<wd l="7622" t="8750" r="8069" b="8856">more</wd>

<space/>

<wd l="8126" t="8698" r="8501" b="8856">than</wd>

<space/>

<wd l="8558" t="8698" r="9029" b="8856">twice</wd>

<space/>

<wd l="9082" t="8698" r="9254" b="8851">in</wd>

<space/>

<wd l="9307" t="8698" r="9576" b="8856">the</wd>

<space/>

<wd l="9634" t="8698" r="10090" b="8856">data.</wd>

<space/>

<wd l="10171" t="8698" r="10512" b="8856">The</wd>

<space/>

</ln>

<ln l="6144" t="8971" r="10493" b="9130" baseLine="9120" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="8971" r="6840" b="9130">window</wd>

<space/>

<wd l="6931" t="8971" r="7262" b="9130">size</wd>

<space/>

<wd l="7339" t="8971" r="7598" b="9130">for</wd>

<space/>

<wd l="7675" t="8971" r="7939" b="9130">the</wd>

<space/>

<wd l="8026" t="8971" r="8923" b="9130">contextual</wd>

<space/>

<wd l="9005" t="8971" r="10037" b="9130">information</wd>

<space/>

<wd l="10118" t="8971" r="10253" b="9130">is</wd>

<space/>

<wd l="10344" t="8976" r="10493" b="9130">3:</wd>

<space/>

</ln>

<ln l="6144" t="9240" r="10512" b="9398" baseLine="9394" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="9240" r="6413" b="9398">the</wd>

<space/>

<wd l="6504" t="9264" r="7118" b="9398">current</wd>

<space/>

<wd l="7205" t="9240" r="7651" b="9398">word</wd>

<space/>

<wd l="7742" t="9240" r="8054" b="9398">and</wd>

<space/>

<wd l="8146" t="9293" r="8242" b="9398">a</wd>

<space/>

<wd l="8323" t="9240" r="8770" b="9398">word</wd>

<space/>

<wd l="8856" t="9264" r="9019" b="9398">to</wd>

<space/>

<wd l="9110" t="9240" r="9379" b="9398">the</wd>

<space/>

<wd l="9466" t="9240" r="9758" b="9398">left</wd>

<space/>

<wd l="9850" t="9240" r="10157" b="9398">and</wd>

<space/>

<wd l="10243" t="9240" r="10512" b="9398">the</wd>

<space/>

</ln>

<ln l="6144" t="9514" r="8333" b="9715" baseLine="9662" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="9514" r="6562" b="9715">right</wd>

<space/>

<wd l="6619" t="9514" r="6806" b="9672">of</wd>

<space/>

<wd l="6850" t="9514" r="7114" b="9672">the</wd>

<space/>

<wd l="7176" t="9538" r="7790" b="9672">current</wd>

<space/>

<wd l="7843" t="9514" r="8333" b="9672">word.</wd>

</ln>

</para>

<para l="6149" t="9974" r="7243" b="10142" alignment="left" spaceBefore="203" lsp="exactly" lspExact="273" language="en">

<ln l="6149" t="9974" r="7243" b="10142" baseLine="10133" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="16">

<wd l="6149" t="9974" r="6259" b="10142">5</wd>

<space/>

<wd l="6509" t="9974" r="7243" b="10142">Results</wd>

</ln>

</para>

<para l="6149" t="10402" r="7968" b="10603" alignment="left" spaceBefore="163" lsp="exactly" lspExact="250" language="en">

<ln l="6149" t="10402" r="7968" b="10603" baseLine="10550" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">

<wd l="6149" t="10402" r="6408" b="10560">5.1</wd>

<space/>

<wd l="6638" t="10406" r="7176" b="10560">Error</wd>

<space/>

<wd l="7238" t="10402" r="7968" b="10603">analysis</wd>

</ln>

</para>

<para l="6144" t="10752" r="10512" b="12533" alignment="justified" spaceBefore="80" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="10752" r="10512" b="10954" baseLine="10901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="10752" r="6773" b="10910">Twitter</wd>

<space/>

<wd l="6826" t="10752" r="7541" b="10910">contains</wd>

<space/>

<wd l="7603" t="10752" r="8074" b="10954">noisy</wd>

<space/>

<wd l="8131" t="10752" r="8443" b="10910">and</wd>

<space/>

<wd l="8496" t="10752" r="9245" b="10910">informal</wd>

<space/>

<wd l="9307" t="10752" r="9710" b="10954">style</wd>

<space/>

<wd l="9763" t="10776" r="10133" b="10939">text,</wd>

<space/>

<wd l="10200" t="10752" r="10512" b="10910">and</wd>

<space/>

</ln>

<ln l="6144" t="11021" r="10512" b="11222" baseLine="11170" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="11045" r="6571" b="11179">most</wd>

<space/>

<wd l="6643" t="11021" r="6830" b="11179">of</wd>

<space/>

<wd l="6888" t="11021" r="7152" b="11179">the</wd>

<space/>

<wd l="7229" t="11021" r="8179" b="11179">state-of-art</wd>

<space/>

<wd l="8246" t="11021" r="9288" b="11222">applications</wd>

<space/>

<wd l="9374" t="11021" r="9816" b="11179">show</wd>

<space/>

<wd l="9893" t="11074" r="9989" b="11179">a</wd>

<space/>

<wd l="10051" t="11021" r="10512" b="11179">weak</wd>

<space/>

</ln>

<ln l="6144" t="11290" r="10498" b="11491" baseLine="11443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="11290" r="7248" b="11491">performance</wd>

<space/>

<wd l="7325" t="11342" r="7536" b="11448">on</wd>

<space/>

<wd l="7608" t="11290" r="8237" b="11448">Twitter</wd>

<space/>

<wd l="8309" t="11290" r="8669" b="11448">data</wd>

<space/>

<wd l="8746" t="11290" r="9312" b="11486">(Ritter</wd>

<space/>

<wd l="9384" t="11314" r="9538" b="11448">et</wd>

<space/>

<wd l="9610" t="11290" r="9859" b="11477">al.,</wd>

<space/>

<wd l="9950" t="11294" r="10498" b="11486">2011).</wd>

<space/>

</ln>

<ln l="6144" t="11563" r="10512" b="11765" baseLine="11712" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="11568" r="6326" b="11717">In</wd>

<space/>

<wd l="6394" t="11563" r="6701" b="11722">this</wd>

<space/>

<wd l="6787" t="11563" r="7440" b="11750">section,</wd>

<space/>

<wd l="7522" t="11616" r="7771" b="11722">we</wd>

<space/>

<wd l="7843" t="11563" r="8352" b="11722">check</wd>

<space/>

<wd l="8414" t="11563" r="8683" b="11722">the</wd>

<space/>

<wd l="8755" t="11616" r="9250" b="11722">errors</wd>

<space/>

<wd l="9326" t="11563" r="9586" b="11722">for</wd>

<space/>

<wd l="9648" t="11563" r="10118" b="11765">noisy</wd>

<space/>

<wd l="10186" t="11587" r="10512" b="11722">text</wd>

<space/>

</ln>

<ln l="6144" t="11832" r="10512" b="12034" baseLine="11986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="11832" r="6571" b="11990">from</wd>

<space/>

<wd l="6610" t="11832" r="6878" b="11990">the</wd>

<space/>

<wd l="6922" t="11832" r="7632" b="11990">baseline</wd>

<space/>

<wd l="7685" t="11856" r="8285" b="12034">system</wd>

<space/>

<wd l="8328" t="11832" r="8640" b="11990">and</wd>

<space/>

<wd l="8688" t="11832" r="9576" b="12034">categorize</wd>

<space/>

<wd l="9619" t="11832" r="10099" b="11990">them.</wd>

<space/>

<wd l="10171" t="11832" r="10512" b="11990">The</wd>

<space/>

</ln>

<ln l="6144" t="12106" r="10502" b="12307" baseLine="12254" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="12106" r="6451" b="12264">last</wd>

<space/>

<wd l="6523" t="12130" r="6845" b="12264">two</wd>

<space/>

<wd l="6926" t="12158" r="7421" b="12264">errors</wd>

<space/>

<wd l="7507" t="12158" r="7766" b="12264">are</wd>

<space/>

<wd l="7838" t="12106" r="8434" b="12264">related</wd>

<space/>

<wd l="8506" t="12130" r="8674" b="12264">to</wd>

<space/>

<wd l="8750" t="12106" r="10032" b="12307">user-generated</wd>

<space/>

<wd l="10104" t="12130" r="10502" b="12264">texts</wd>

<space/>

</ln>

<ln l="6154" t="12374" r="7925" b="12533" baseLine="12528" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6154" t="12374" r="6547" b="12533">such</wd>

<space/>

<wd l="6605" t="12427" r="6773" b="12533">as</wd>

<space/>

<wd l="6835" t="12374" r="7464" b="12533">Twitter</wd>

<space/>

<wd l="7522" t="12374" r="7925" b="12533">data.</wd>

</ln>

</para>

<para l="6154" t="12830" r="10512" b="14928" alignment="justified" li="432" spaceBefore="184" spaceAfter="96" fli="-432" lsp="exactly" lspExact="271" language="en">

<ln l="6154" t="12830" r="10502" b="13032" baseLine="12979">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6154" t="12835" r="6830" b="12989">Unseen</wd>

<space/>

<wd l="6893" t="12835" r="7368" b="12989">word</wd>

<space/>

<wd l="7430" t="12878" r="8405" b="13032">sequences:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="8520" t="12830" r="8856" b="12989">The</wd>

<space/>

<wd l="8918" t="12830" r="9355" b="12989">main</wd>

<space/>

<wd l="9418" t="12883" r="9898" b="12989">cause</wd>

<space/>

<wd l="9960" t="12830" r="10152" b="12989">of</wd>

<space/>

<wd l="10195" t="12830" r="10502" b="12989">this</wd>

<space/>

</run>

</ln>

<ln l="6586" t="13104" r="10512" b="13306" baseLine="13253" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6586" t="13157" r="7008" b="13262">error</wd>

<space/>

<wd l="7080" t="13104" r="7214" b="13262">is</wd>

<space/>

<wd l="7296" t="13104" r="7469" b="13258">in</wd>

<space/>

<wd l="7546" t="13157" r="7642" b="13262">a</wd>

<space/>

<wd l="7709" t="13104" r="8621" b="13306">previously</wd>

<space/>

<wd l="8698" t="13157" r="9307" b="13262">unseen</wd>

<space/>

<wd l="9384" t="13157" r="10219" b="13306">sequence.</wd>

<space/>

<wd l="10354" t="13109" r="10512" b="13258">A</wd>

<space/>

</ln>

<ln l="6581" t="13373" r="10502" b="13574" baseLine="13522" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="13373" r="7003" b="13574">huge</wd>

<space/>

<wd l="7090" t="13373" r="7762" b="13531">number</wd>

<space/>

<wd l="7843" t="13373" r="8035" b="13531">of</wd>

<space/>

<wd l="8102" t="13397" r="8650" b="13531">tweets</wd>

<space/>

<wd l="8746" t="13426" r="9010" b="13531">are</wd>

<space/>

<wd l="9091" t="13373" r="9662" b="13574">posted</wd>

<space/>

<wd l="9749" t="13426" r="9965" b="13531">on</wd>

<space/>

<wd l="10042" t="13373" r="10502" b="13531">Twit-</wd>

</ln>

<ln l="6581" t="13642" r="10502" b="13843" baseLine="13795" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="13666" r="6816" b="13800">ter</wd>

<space/>

<wd l="6878" t="13694" r="7349" b="13843">every</wd>

<space/>

<wd l="7416" t="13642" r="7723" b="13843">day</wd>

<space/>

<wd l="7795" t="13642" r="8107" b="13800">and</wd>

<space/>

<wd l="8170" t="13642" r="8539" b="13843">they</wd>

<space/>

<wd l="8611" t="13642" r="9250" b="13800">contain</wd>

<space/>

<wd l="9307" t="13642" r="10205" b="13843">up-to-date</wd>

<space/>

<wd l="10267" t="13642" r="10502" b="13795">in-</wd>

</ln>

<ln l="6581" t="13915" r="10502" b="14074" baseLine="14064" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="13915" r="7445" b="14074">formation</wd>

<space/>

<wd l="7517" t="13968" r="7733" b="14074">on</wd>

<space/>

<wd l="7805" t="13939" r="8390" b="14074">events.</wd>

<space/>

<wd l="8515" t="13915" r="8851" b="14074">The</wd>

<space/>

<wd l="8923" t="13939" r="9350" b="14074">most</wd>

<space/>

<wd l="9418" t="13939" r="9950" b="14074">recent</wd>

<space/>

<wd l="10018" t="13915" r="10502" b="14074">infor-</wd>

</ln>

<ln l="6581" t="14184" r="10507" b="14386" baseLine="14338" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="14184" r="7190" b="14342">mation</wd>

<space/>

<wd l="7262" t="14184" r="7651" b="14342">such</wd>

<space/>

<wd l="7718" t="14237" r="7891" b="14342">as</wd>

<space/>

<wd l="7963" t="14237" r="8314" b="14342">new</wd>

<space/>

<wd l="8386" t="14184" r="9053" b="14386">product</wd>

<space/>

<wd l="9115" t="14184" r="10147" b="14342">information</wd>

<space/>

<wd l="10214" t="14237" r="10507" b="14342">can</wd>

<space/>

</ln>

<ln l="6581" t="14458" r="10512" b="14659" baseLine="14606" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="14458" r="6946" b="14616">lead</wd>

<space/>

<wd l="7008" t="14482" r="7171" b="14616">to</wd>

<space/>

<wd l="7238" t="14458" r="7502" b="14616">the</wd>

<space/>

<wd l="7565" t="14458" r="8429" b="14616">formation</wd>

<space/>

<wd l="8491" t="14458" r="8683" b="14616">of</wd>

<space/>

<wd l="8731" t="14458" r="10003" b="14659">unprecedented</wd>

<space/>

<wd l="10066" t="14458" r="10512" b="14616">word</wd>

<space/>

</ln>

<ln l="6590" t="14726" r="10512" b="14928" baseLine="14880" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6590" t="14779" r="7512" b="14928">sequences.</wd>

<space/>

<wd l="7589" t="14726" r="8107" b="14885">These</wd>

<space/>

<wd l="8174" t="14779" r="9038" b="14928">sequences</wd>

<space/>

<wd l="9106" t="14726" r="9317" b="14885">do</wd>

<space/>

<wd l="9374" t="14750" r="9653" b="14885">not</wd>

<space/>

<wd l="9710" t="14779" r="10291" b="14928">appear</wd>

<space/>

<wd l="10339" t="14726" r="10512" b="14880">in</wd>

</ln>

</para>

<rulerline l="6144" t="15048" r="7344" b="15048" type="single" width="10" color="000000"/>

<para l="6398" t="15101" r="9672" b="15302" alignment="left" li="216" spaceBefore="59" spaceAfter="13" lsp="exactly" lspExact="207" language="en">

<ln l="6398" t="15101" r="9672" b="15302" baseLine="15257">

<wd l="6398" t="15101" r="9672" b="15302"><run underlined="none" subsuperscript="none" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">4</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">http://metaoptimize.com/projects/wordreprs/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<dd l="1437" t="15736" r="10531" b="15977">

<para l="5800" t="15787" r="6148" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5866" t="15787" r="6082" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="43">

<wd l="5866" t="15792" r="6082" b="15946">74</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4310.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1437" marginTop="1240" marginRight="1369" marginBottom="1302" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1437" t="1240" r="10540" b="6503">

<column l="1437" t="1240" r="10540" b="6503">

<table l="2894" t="1258" r="9053" b="4819" alignment="left" li="1457" ri="1487" spaceBefore="18" spaceAfter="186">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<gridTable>

<gridCol>1286</gridCol>

<gridCol>1460</gridCol>

<gridCol>729</gridCol>

<gridCol>1459</gridCol>

<gridCol>730</gridCol>

<gridCol>495</gridCol>

<gridRow>283</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>254</gridRow>

<gridRow>269</gridRow>

<gridRow>269</gridRow>

<gridRow>274</gridRow>

<gridRow>273</gridRow>

<gridRow>269</gridRow>

<gridRow>269</gridRow>

<gridRow>273</gridRow>

<gridRow>269</gridRow>

<gridRow>302</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="2894" t="1258" r="4180" b="1541" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4646" t="1301" r="5890" b="1522" alignment="centered" lsp="exactly" lspExact="270" language="en">

<ln l="4646" t="1301" r="5890" b="1522" baseLine="1485">

<wd l="4646" t="1301" r="5890" b="1522"><run italic="true" underlined="none" subsuperscript="none" fontSize="1400" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="8">M</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="750" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="8">noEmbedding</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="750" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="8"><nl orig="true"/>

</run>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="4" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6931" t="1301" r="7987" b="1522" alignment="centered" lsp="exactly" lspExact="270" language="en">

<ln l="6931" t="1301" r="7987" b="1522" baseLine="1484">

<wd l="6931" t="1301" r="7987" b="1522"><run italic="true" underlined="none" subsuperscript="none" fontSize="1400" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="7">M</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="750" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="7">Embedding</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="750" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="7"><nl orig="true"/>

</run>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8683" t="1301" r="8923" b="1459" alignment="centered" spaceAfter="32" lsp="exactly" lspExact="250" language="en">

<ln l="8683" t="1301" r="8923" b="1459" baseLine="1450" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="8683" t="1306" r="8923" b="1459">+/-</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3312" t="1584" r="3763" b="1781" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="248" language="en">

<ln l="3312" t="1584" r="3763" b="1781" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="3312" t="1584" r="3763" b="1781">Type</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4478" t="1584" r="5352" b="1733" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="248" language="en">

<tabs position="4478"/>

<ln l="4478" t="1584" r="5352" b="1733" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-73">

<wd l="4478" t="1584" r="4613" b="1733">P</wd>

<tab position="4613"/>

<wd l="5198" t="1584" r="5352" b="1733">R</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5880" t="1579" r="6115" b="1733" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="248" language="en">

<ln l="5880" t="1579" r="6115" b="1733" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5880" t="1579" r="6115" b="1733">F1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6667" t="1584" r="7541" b="1733" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="248" language="en">

<tabs position="6667"/>

<ln l="6667" t="1584" r="7541" b="1733" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-73">

<wd l="6667" t="1584" r="6802" b="1733">P</wd>

<tab position="6802"/>

<wd l="7387" t="1584" r="7541" b="1733">R</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8074" t="1579" r="8304" b="1733" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="248" language="en">

<ln l="8074" t="1579" r="8304" b="1733" baseLine="1728" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="8074" t="1579" r="8304" b="1733">F1</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8558" t="1541" r="9053" b="1820" language="en">

<ln l="0" t="0" r="0" b="0" baseLine="0" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable">

<nl orig="true"/>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3192" t="1858" r="3883" b="2016" alignment="centered" spaceAfter="16" lsp="exactly" lspExact="252" language="en">

<ln l="3192" t="1858" r="3883" b="2016" baseLine="2011" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="3192" t="1858" r="3883" b="2016">Overall</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4301" t="1858" r="5515" b="2016" alignment="right" ri="125" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="4301"/>

<ln l="4301" t="1858" r="5515" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4301" t="1858" r="4776" b="2016">35.95</wd>

<tab position="4776"/>

<wd l="5030" t="1862" r="5515" b="2016">31.92</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5765" t="1862" r="6226" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="5765"/>

<ln l="5765" t="1862" r="6226" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="5765" t="1862" r="6226" b="2016">33.81</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6494" t="1858" r="7704" b="2016" alignment="right" ri="124" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="6494"/>

<ln l="6494" t="1858" r="7704" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6494" t="1858" r="6970" b="2016">39.59</wd>

<tab position="6970"/>

<wd l="7224" t="1858" r="7704" b="2016">35.10</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="7954" t="1862" r="8414" b="2016" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="7954"/>

<ln l="7954" t="1862" r="8414" b="2016" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="7954" t="1862" r="8414" b="2016">37.21</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8750" t="1862" r="8866" b="2011" alignment="centered" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="8750" t="1862" r="8866" b="2011" baseLine="2011" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8750" t="1901" r="8866" b="2011">+</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="3120" t="2141" r="3960" b="2338" alignment="centered" lsp="exactly" lspExact="249" language="en">

<ln l="3120" t="2141" r="3960" b="2338" baseLine="2290" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3120" t="2184" r="3960" b="2338">company</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4301" t="2136" r="5496" b="2294" alignment="right" ri="125" lsp="exactly" lspExact="249" language="en">

<tabs position="4301"/>

<ln l="4301" t="2136" r="5496" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4301" t="2136" r="4781" b="2294">27.59</wd>

<tab position="4781"/>

<wd l="5030" t="2136" r="5496" b="2294">20.51</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5765" t="2136" r="6235" b="2294" alignment="left" lsp="exactly" lspExact="249" language="en">

<tabs position="5765"/>

<ln l="5765" t="2136" r="6235" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="5765" t="2136" r="6235" b="2294">23.53</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="6494" t="2141" r="7699" b="2294" alignment="right" ri="124" lsp="exactly" lspExact="249" language="en">

<tabs position="6494"/>

<ln l="6494" t="2141" r="7699" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6494" t="2141" r="6974" b="2294">32.14</wd>

<tab position="6974"/>

<wd l="7224" t="2141" r="7699" b="2294">23.08</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="3" gridRowTill="3" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="7954" t="2136" r="8429" b="2294" alignment="left" lsp="exactly" lspExact="249" language="en">

<tabs position="7954"/>

<ln l="7954" t="2136" r="8429" b="2294" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7954" t="2136" r="8429" b="2294">26.87</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<topBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8750" t="2141" r="8866" b="2290" alignment="centered" lsp="exactly" lspExact="249" language="en">

<ln l="8750" t="2141" r="8866" b="2290" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8750" t="2179" r="8866" b="2290">+</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="3216" t="2410" r="3854" b="2611" alignment="centered" spaceAfter="1" lsp="exactly" lspExact="253" language="en">

<ln l="3216" t="2410" r="3854" b="2611" baseLine="2558" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3216" t="2410" r="3854" b="2611">facility</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4301" t="2414" r="5515" b="2568" alignment="right" ri="125" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<tabs position="4301"/>

<ln l="4301" t="2414" r="5515" b="2568" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4301" t="2414" r="4786" b="2568">24.14</wd>

<tab position="4786"/>

<wd l="5050" t="2414" r="5515" b="2568">18.42</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5765" t="2414" r="6245" b="2568" alignment="left" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<tabs position="5765"/>

<ln l="5765" t="2414" r="6245" b="2568" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5765" t="2414" r="6245" b="2568">20.90</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="6494" t="2410" r="7694" b="2568" alignment="right" ri="124" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<tabs position="6494"/>

<ln l="6494" t="2410" r="7694" b="2568" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6494" t="2414" r="6974" b="2568">32.00</wd>

<tab position="6974"/>

<wd l="7224" t="2410" r="7694" b="2568">21.05</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="7954" t="2410" r="8434" b="2568" alignment="left" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<tabs position="7954"/>

<ln l="7954" t="2410" r="8434" b="2568" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="7954" t="2410" r="8434" b="2568">25.40</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8750" t="2414" r="8866" b="2563" alignment="centered" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<ln l="8750" t="2414" r="8866" b="2563" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8750" t="2453" r="8866" b="2563">+</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="3216" t="2683" r="3864" b="2880" alignment="centered" lsp="exactly" lspExact="240" language="en">

<ln l="3216" t="2683" r="3864" b="2880" baseLine="2832" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3216" t="2683" r="3864" b="2880">geo-loc</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4296" t="2678" r="5510" b="2837" alignment="right" ri="125" lsp="exactly" lspExact="259" language="en">

<tabs position="4296"/>

<ln l="4296" t="2678" r="5510" b="2837" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4296" t="2678" r="4786" b="2837">42.66</wd>

<tab position="4786"/>

<wd l="5030" t="2678" r="5510" b="2837">52.59</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5760" t="2683" r="6245" b="2837" alignment="left" lsp="exactly" lspExact="259" language="en">

<tabs position="5760"/>

<ln l="5760" t="2683" r="6245" b="2837" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="5760" t="2683" r="6245" b="2837">47.10</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="6490" t="2678" r="7699" b="2837" alignment="right" ri="124" lsp="exactly" lspExact="259" language="en">

<tabs position="6490"/>

<ln l="6490" t="2678" r="7699" b="2837" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6490" t="2678" r="6974" b="2837">46.00</wd>

<tab position="6974"/>

<wd l="7224" t="2678" r="7699" b="2837">59.48</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="7954" t="2678" r="8429" b="2837" alignment="left" lsp="exactly" lspExact="259" language="en">

<tabs position="7954"/>

<ln l="7954" t="2678" r="8429" b="2837" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="7954" t="2678" r="8429" b="2837">51.88</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8750" t="2683" r="8866" b="2832" alignment="centered" lsp="exactly" lspExact="259" language="en">

<ln l="8750" t="2683" r="8866" b="2832" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8750" t="2722" r="8866" b="2832">+</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="6" gridRowTill="6" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="3259" t="2952" r="3816" b="3110" alignment="centered" lsp="exactly" lspExact="244" language="en">

<ln l="3259" t="2952" r="3816" b="3110" baseLine="3101" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3259" t="2952" r="3816" b="3110">movie</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="6" gridRowTill="6" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4320" t="2952" r="5458" b="3110" alignment="right" ri="125" lsp="exactly" lspExact="263" language="en">

<tabs position="4320"/>

<ln l="4320" t="2952" r="5458" b="3110" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4320" t="2957" r="4781" b="3110">14.29</wd>

<tab position="4781"/>

<wd l="5088" t="2952" r="5458" b="3110">6.67</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="6" gridRowTill="6" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5818" t="2957" r="6187" b="3110" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="5818"/>

<ln l="5818" t="2957" r="6187" b="3110" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5818" t="2957" r="6187" b="3110">9.09</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="6" gridRowTill="6" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="6552" t="2952" r="7646" b="3110" alignment="right" ri="124" lsp="exactly" lspExact="263" language="en">

<tabs position="6552"/>

<ln l="6552" t="2952" r="7646" b="3110" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6552" t="2957" r="6912" b="3110">8.33</wd>

<tab position="6912"/>

<wd l="7277" t="2952" r="7646" b="3110">6.67</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="6" gridRowTill="6" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8002" t="2957" r="8362" b="3110" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="8002"/>

<ln l="8002" t="2957" r="8362" b="3110" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="8002" t="2957" r="8362" b="3110">7.41</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="6" gridRowTill="6" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8774" t="2952" r="8832" b="3101" alignment="centered" lsp="exactly" lspExact="263" language="en">

<ln l="8774" t="2952" r="8832" b="3101" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8774" t="3048" r="8832" b="3067">-</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="7" gridRowTill="7" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="3014" t="3221" r="4061" b="3379" alignment="centered" lsp="exactly" lspExact="245" language="en">

<ln l="3014" t="3221" r="4061" b="3379" baseLine="3374" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3014" t="3221" r="4061" b="3379">musicartist</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="7" gridRowTill="7" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4358" t="3226" r="5462" b="3379" alignment="right" ri="125" lsp="exactly" lspExact="263" language="en">

<tabs position="4358"/>

<ln l="4358" t="3226" r="5462" b="3379" baseLine="3374" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4358" t="3226" r="4733" b="3379">0.00</wd>

<tab position="4733"/>

<wd l="5088" t="3226" r="5462" b="3379">0.00</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="7" gridRowTill="7" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5818" t="3226" r="6192" b="3379" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="5818"/>

<ln l="5818" t="3226" r="6192" b="3379" baseLine="3374" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5818" t="3226" r="6192" b="3379">0.00</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="7" gridRowTill="7" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="6542" t="3221" r="7651" b="3379" alignment="right" ri="124" lsp="exactly" lspExact="263" language="en">

<tabs position="6542"/>

<ln l="6542" t="3221" r="7651" b="3379" baseLine="3374" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6542" t="3221" r="6917" b="3379">7.69</wd>

<tab position="6917"/>

<wd l="7277" t="3226" r="7651" b="3379">2.44</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="7" gridRowTill="7" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8006" t="3226" r="8381" b="3379" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="8006"/>

<ln l="8006" t="3226" r="8381" b="3379" baseLine="3374" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="8006" t="3226" r="8381" b="3379">3.70</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="7" gridRowTill="7" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8750" t="3226" r="8866" b="3374" alignment="centered" lsp="exactly" lspExact="263" language="en">

<ln l="8750" t="3226" r="8866" b="3374" baseLine="3374" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8750" t="3264" r="8866" b="3374">+</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="8" gridRowTill="8" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="3293" t="3499" r="3787" b="3653" alignment="centered" lsp="exactly" lspExact="249" language="en">

<ln l="3293" t="3499" r="3787" b="3653" baseLine="3643" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3293" t="3499" r="3787" b="3653">other</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="8" gridRowTill="8" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4320" t="3494" r="5510" b="3653" alignment="right" ri="125" lsp="exactly" lspExact="263" language="en">

<tabs position="4320"/>

<ln l="4320" t="3494" r="5510" b="3653" baseLine="3643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4320" t="3499" r="4776" b="3653">18.33</wd>

<tab position="4776"/>

<wd l="5050" t="3494" r="5510" b="3653">16.67</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="8" gridRowTill="8" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5784" t="3494" r="6245" b="3653" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="5784"/>

<ln l="5784" t="3494" r="6245" b="3653" baseLine="3643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="5784" t="3494" r="6245" b="3653">17.46</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="8" gridRowTill="8" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="6494" t="3499" r="7704" b="3653" alignment="right" ri="124" lsp="exactly" lspExact="263" language="en">

<tabs position="6494"/>

<ln l="6494" t="3499" r="7704" b="3653" baseLine="3643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6494" t="3499" r="6970" b="3653">20.49</wd>

<tab position="6970"/>

<wd l="7243" t="3499" r="7704" b="3653">18.94</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="8" gridRowTill="8" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="7973" t="3494" r="8429" b="3653" alignment="left" lsp="exactly" lspExact="263" language="en">

<tabs position="7973"/>

<ln l="7973" t="3494" r="8429" b="3653" baseLine="3643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">

<wd l="7973" t="3494" r="8429" b="3653">19.69</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="8" gridRowTill="8" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8750" t="3499" r="8866" b="3648" alignment="centered" lsp="exactly" lspExact="263" language="en">

<ln l="8750" t="3499" r="8866" b="3648" baseLine="3643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8750" t="3538" r="8866" b="3648">+</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="9" gridRowTill="9" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="3221" t="3768" r="3850" b="3965" alignment="centered" spaceAfter="1" lsp="exactly" lspExact="253" language="en">

<ln l="3221" t="3768" r="3850" b="3965" baseLine="3912" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3221" t="3811" r="3850" b="3965">person</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="9" gridRowTill="9" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4301" t="3763" r="5510" b="3922" alignment="right" ri="125" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<tabs position="4301"/>

<ln l="4301" t="3763" r="5510" b="3922" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4301" t="3763" r="4781" b="3922">53.27</wd>

<tab position="4781"/>

<wd l="5030" t="3763" r="5510" b="3922">61.99</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="9" gridRowTill="9" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5765" t="3763" r="6245" b="3922" alignment="left" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<tabs position="5765"/>

<ln l="5765" t="3763" r="6245" b="3922" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5765" t="3763" r="6245" b="3922">57.30</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="9" gridRowTill="9" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="6494" t="3763" r="7694" b="3922" alignment="right" ri="124" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<tabs position="6494"/>

<ln l="6494" t="3763" r="7694" b="3922" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6494" t="3763" r="6970" b="3922">56.99</wd>

<tab position="6970"/>

<wd l="7224" t="3763" r="7694" b="3922">64.33</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="9" gridRowTill="9" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="7954" t="3763" r="8434" b="3922" alignment="left" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<tabs position="7954"/>

<ln l="7954" t="3763" r="8434" b="3922" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="7954" t="3763" r="8434" b="3922">60.44</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="9" gridRowTill="9" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8750" t="3768" r="8866" b="3917" alignment="centered" spaceAfter="4" lsp="exactly" lspExact="264" language="en">

<ln l="8750" t="3768" r="8866" b="3917" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8750" t="3806" r="8866" b="3917">+</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="10" gridRowTill="10" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="3168" t="4042" r="3907" b="4238" alignment="centered" spaceAfter="1" lsp="exactly" lspExact="253" language="en">

<ln l="3168" t="4042" r="3907" b="4238" baseLine="4186" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3168" t="4042" r="3907" b="4238">product</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="10" gridRowTill="10" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4358" t="4037" r="5462" b="4195" alignment="right" ri="125" spaceAfter="4" lsp="exactly" lspExact="269" language="en">

<tabs position="4358"/>

<ln l="4358" t="4037" r="5462" b="4195" baseLine="4186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4358" t="4037" r="4728" b="4195">3.57</wd>

<tab position="4728"/>

<wd l="5088" t="4042" r="5462" b="4195">2.70</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="10" gridRowTill="10" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5818" t="4042" r="6187" b="4195" alignment="left" spaceAfter="4" lsp="exactly" lspExact="269" language="en">

<tabs position="5818"/>

<ln l="5818" t="4042" r="6187" b="4195" baseLine="4186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5818" t="4042" r="6187" b="4195">3.08</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="10" gridRowTill="10" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="6514" t="4042" r="7632" b="4195" alignment="right" ri="124" spaceAfter="4" lsp="exactly" lspExact="269" language="en">

<tabs position="6514"/>

<ln l="6514" t="4042" r="7632" b="4195" baseLine="4186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6514" t="4042" r="6970" b="4195">14.29</wd>

<tab position="6970"/>

<wd l="7282" t="4042" r="7632" b="4195">8.11</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="10" gridRowTill="10" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="7973" t="4042" r="8434" b="4195" alignment="left" spaceAfter="4" lsp="exactly" lspExact="269" language="en">

<tabs position="7973"/>

<ln l="7973" t="4042" r="8434" b="4195" baseLine="4186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="7973" t="4042" r="8434" b="4195">10.34</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="10" gridRowTill="10" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8750" t="4042" r="8866" b="4190" alignment="centered" spaceAfter="4" lsp="exactly" lspExact="269" language="en">

<ln l="8750" t="4042" r="8866" b="4190" baseLine="4186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8750" t="4080" r="8866" b="4190">+</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="11" gridRowTill="11" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="3029" t="4310" r="4051" b="4507" alignment="centered" lsp="exactly" lspExact="245" language="en">

<ln l="3029" t="4310" r="4051" b="4507" baseLine="4454" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3029" t="4320" r="4051" b="4507">sportsteam</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="11" gridRowTill="11" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="4301" t="4306" r="5462" b="4464" alignment="right" ri="125" lsp="exactly" lspExact="259" language="en">

<tabs position="4301"/>

<ln l="4301" t="4306" r="5462" b="4464" baseLine="4454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4301" t="4306" r="4786" b="4464">62.50</wd>

<tab position="4786"/>

<wd l="5083" t="4310" r="5462" b="4464">7.14</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="11" gridRowTill="11" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="5784" t="4310" r="6245" b="4464" alignment="left" lsp="exactly" lspExact="259" language="en">

<tabs position="5784"/>

<ln l="5784" t="4310" r="6245" b="4464" baseLine="4454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="5784" t="4310" r="6245" b="4464">12.82</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="11" gridRowTill="11" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="6494" t="4306" r="7646" b="4464" alignment="right" ri="124" lsp="exactly" lspExact="259" language="en">

<tabs position="6494"/>

<ln l="6494" t="4306" r="7646" b="4464" baseLine="4454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6494" t="4306" r="6965" b="4464">54.55</wd>

<tab position="6965"/>

<wd l="7282" t="4306" r="7646" b="4464">8.57</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="11" gridRowTill="11" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="7973" t="4310" r="8414" b="4464" alignment="left" lsp="exactly" lspExact="259" language="en">

<tabs position="7973"/>

<ln l="7973" t="4310" r="8414" b="4464" baseLine="4454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-9">

<wd l="7973" t="4310" r="8414" b="4464">14.81</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="11" gridRowTill="11" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<para l="8750" t="4310" r="8866" b="4459" alignment="centered" lsp="exactly" lspExact="259" language="en">

<ln l="8750" t="4310" r="8866" b="4459" baseLine="4454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8750" t="4349" r="8866" b="4459">+</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="12" gridRowTill="12" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="3211" t="4579" r="3864" b="4733" alignment="centered" spaceAfter="20" lsp="exactly" lspExact="253" language="en">

<ln l="3211" t="4579" r="3864" b="4733" baseLine="4728" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3211" t="4579" r="3864" b="4733">tvshow</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="12" gridRowTill="12" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="4358" t="4579" r="5462" b="4733" alignment="right" ri="125" spaceAfter="23" lsp="exactly" lspExact="269" language="en">

<tabs position="4358"/>

<ln l="4358" t="4579" r="5462" b="4733" baseLine="4728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4358" t="4579" r="4733" b="4733">0.00</wd>

<tab position="4733"/>

<wd l="5088" t="4579" r="5462" b="4733">0.00</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="12" gridRowTill="12" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="5818" t="4579" r="6192" b="4733" alignment="left" spaceAfter="23" lsp="exactly" lspExact="269" language="en">

<tabs position="5818"/>

<ln l="5818" t="4579" r="6192" b="4733" baseLine="4728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5818" t="4579" r="6192" b="4733">0.00</wd>

</ln>

</para>

</cell>

<cell gridColFrom="3" gridColTill="3" gridRowFrom="12" gridRowTill="12" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="6547" t="4579" r="7651" b="4733" alignment="right" ri="124" spaceAfter="23" lsp="exactly" lspExact="269" language="en">

<tabs position="6547"/>

<ln l="6547" t="4579" r="7651" b="4733" baseLine="4728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6547" t="4579" r="6922" b="4733">0.00</wd>

<tab position="6922"/>

<wd l="7277" t="4579" r="7651" b="4733">0.00</wd>

</ln>

</para>

</cell>

<cell gridColFrom="4" gridColTill="4" gridRowFrom="12" gridRowTill="12" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8006" t="4579" r="8381" b="4733" alignment="left" spaceAfter="23" lsp="exactly" lspExact="269" language="en">

<tabs position="8006"/>

<ln l="8006" t="4579" r="8381" b="4733" baseLine="4728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="8006" t="4579" r="8381" b="4733">0.00</wd>

</ln>

</para>

</cell>

<cell gridColFrom="5" gridColTill="5" gridRowFrom="12" gridRowTill="12" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="10"/>

<rightBorder type="single" width="10"/>

<bottomBorder type="single" width="10"/>

<para l="8794" t="4584" r="8822" b="4733" alignment="centered" spaceAfter="23" lsp="exactly" lspExact="269" language="en">

<ln l="8794" t="4584" r="8822" b="4733" baseLine="4728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="8794" t="4704" r="8822" b="4733">.</wd>

</ln>

</para>

</cell>

</table>

<para l="1440" t="5136" r="10517" b="6106" alignment="justified" spaceBefore="69" spaceAfter="340" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="5136" r="10512" b="5357" baseLine="5292">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="5136" r="1920" b="5294">Table</wd>

<space/>

<wd l="1973" t="5141" r="2122" b="5294">2:</wd>

<space/>

<wd l="2203" t="5136" r="2842" b="5294">Results</wd>

<space/>

<wd l="2899" t="5136" r="3158" b="5294">for</wd>

<space/>

<wd l="3202" t="5136" r="3744" b="5294">model</wd>

<space/>

<wd l="3797" t="5136" r="4190" b="5294">with</wd>

<space/>

<wd l="4243" t="5136" r="4555" b="5294">and</wd>

<space/>

<wd l="4603" t="5136" r="5270" b="5294">without</wd>

<space/>

<wd l="5318" t="5136" r="5770" b="5294">word</wd>

<space/>

<wd l="5822" t="5136" r="6830" b="5338">embedding.</wd>

<space/>

</run>

<wd l="6912" t="5136" r="8155" b="5357"><run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">M</run>

<run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">noEmbedding</run>

</wd>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8222" t="5136" r="8534" b="5294">and</wd>

</run>

<run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="8587" t="5136" r="9648" b="5357"><run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">M</run>

<run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">Embedding</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9710" t="5160" r="10512" b="5338">represent</wd>

<space/>

</run>

</ln>

<ln l="1440" t="5405" r="10517" b="5606" baseLine="5554" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5405" r="1704" b="5563">the</wd>

<space/>

<wd l="1762" t="5405" r="2304" b="5563">model</wd>

<space/>

<wd l="2362" t="5405" r="2750" b="5563">with</wd>

<space/>

<wd l="2803" t="5405" r="3115" b="5563">and</wd>

<space/>

<wd l="3168" t="5405" r="3840" b="5563">without</wd>

<space/>

<wd l="3888" t="5405" r="4339" b="5563">word</wd>

<space/>

<wd l="4392" t="5405" r="5400" b="5606">embedding,</wd>

<space/>

<wd l="5467" t="5405" r="6542" b="5606">respectively.</wd>

<space/>

<wd l="6619" t="5405" r="6960" b="5563">The</wd>

<space/>

<wd l="7013" t="5405" r="7853" b="5606">rightmost</wd>

<space/>

<wd l="7906" t="5405" r="8558" b="5563">column</wd>

<space/>

<wd l="8621" t="5405" r="9144" b="5563">shows</wd>

<space/>

<wd l="9206" t="5405" r="9470" b="5563">the</wd>

<space/>

<wd l="9528" t="5405" r="10277" b="5563">decrease</wd>

<space/>

<wd l="10334" t="5458" r="10517" b="5563">or</wd>

<space/>

</ln>

<ln l="1440" t="5674" r="10517" b="5899" baseLine="5830">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="5674" r="2155" b="5832">increase</wd>

<space/>

<wd l="2222" t="5674" r="2395" b="5827">in</wd>

<space/>

<wd l="2462" t="5674" r="2726" b="5832">the</wd>

<space/>

<wd l="2798" t="5678" r="3005" b="5827">F1</wd>

<space/>

<wd l="3106" t="5726" r="3557" b="5832">score</wd>

<space/>

<wd l="3624" t="5674" r="4013" b="5832">with</wd>

<space/>

<wd l="4080" t="5698" r="4699" b="5875">respect</wd>

<space/>

<wd l="4766" t="5698" r="4934" b="5832">to</wd>

<space/>

<wd l="5006" t="5674" r="5270" b="5832">the</wd>

<space/>

<wd l="5342" t="5674" r="5885" b="5832">model</wd>

<space/>

<wd l="5957" t="5674" r="6624" b="5832">without</wd>

<space/>

<wd l="6691" t="5674" r="7138" b="5832">word</wd>

<space/>

<wd l="7210" t="5674" r="8218" b="5875">embedding.</wd>

<space/>

</run>

<wd l="8342" t="5674" r="9403" b="5899"><run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">M</run>

<run italic="true" underlined="none" subsuperscript="subscript" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">Embedding</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9490" t="5674" r="10142" b="5832">denotes</wd>

<space/>

<wd l="10224" t="5726" r="10517" b="5832">our</wd>

<space/>

</run>

</ln>

<ln l="1445" t="5947" r="2472" b="6106" baseLine="6096" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="5947" r="1824" b="6106">final</wd>

<space/>

<wd l="1882" t="5947" r="2472" b="6106">model.</wd>

</ln>

</para>

</column>

</section>

<section l="1437" t="6503" r="10531" b="15317">

<column l="1437" t="6503" r="5824" b="15317">

<para l="1877" t="6566" r="5803" b="6998" alignment="justified" li="432" spaceBefore="4" lsp="exactly" lspExact="270" language="en">

<ln l="1877" t="6566" r="5803" b="6768" baseLine="6715" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="6566" r="2141" b="6725">the</wd>

<space/>

<wd l="2198" t="6566" r="2870" b="6768">training</wd>

<space/>

<wd l="2933" t="6566" r="3298" b="6725">data</wd>

<space/>

<wd l="3350" t="6566" r="3662" b="6725">and</wd>

<space/>

<wd l="3720" t="6590" r="4632" b="6768">gazetteers,</wd>

<space/>

<wd l="4704" t="6566" r="5011" b="6725">and</wd>

<space/>

<wd l="5064" t="6566" r="5472" b="6754">thus,</wd>

<space/>

<wd l="5539" t="6566" r="5803" b="6725">the</wd>

<space/>

</ln>

<ln l="1877" t="6840" r="4085" b="6998" baseLine="6989" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="6840" r="2419" b="6998">model</wd>

<space/>

<wd l="2482" t="6864" r="3058" b="6998">cannot</wd>

<space/>

<wd l="3110" t="6840" r="3547" b="6998">learn</wd>

<space/>

<wd l="3605" t="6840" r="4085" b="6998">them.</wd>

</ln>

</para>

<para l="1450" t="7243" r="5808" b="9614" alignment="justified" li="432" spaceBefore="143" fli="-432" lsp="exactly" lspExact="270" language="en">

<ln l="1450" t="7243" r="5803" b="7445" baseLine="7397">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1450" t="7243" r="2165" b="7445">Foreign</wd>

<space/>

<wd l="2222" t="7248" r="3202" b="7445">languages:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="3317" t="7243" r="3696" b="7402">This</wd>

<space/>

<wd l="3888" t="7296" r="4310" b="7402">error</wd>

<space/>

<wd l="4488" t="7243" r="4627" b="7402">is</wd>

<space/>

<wd l="4819" t="7243" r="5410" b="7402">caused</wd>

<space/>

<wd l="5587" t="7243" r="5803" b="7445">by</wd>

<space/>

</run>

</ln>

<ln l="1877" t="7517" r="5794" b="7718" baseLine="7666" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1877" t="7541" r="2424" b="7675">tweets</wd>

<space/>

<wd l="2530" t="7517" r="3149" b="7675">written</wd>

<space/>

<wd l="3245" t="7517" r="3413" b="7670">in</wd>

<space/>

<wd l="3509" t="7517" r="4373" b="7718">languages</wd>

<space/>

<wd l="4478" t="7517" r="4930" b="7675">other</wd>

<space/>

<wd l="5021" t="7517" r="5390" b="7675">than</wd>

<space/>

<wd l="5491" t="7522" r="5794" b="7670">En-</wd>

</ln>

<ln l="1882" t="7786" r="5798" b="7987" baseLine="7939" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1882" t="7786" r="2342" b="7987">glish.</wd>

<space/>

<wd l="2554" t="7786" r="3110" b="7944">Words</wd>

<space/>

<wd l="3221" t="7786" r="3840" b="7944">written</wd>

<space/>

<wd l="3936" t="7786" r="4109" b="7939">in</wd>

<space/>

<wd l="4205" t="7786" r="4834" b="7987">foreign</wd>

<space/>

<wd l="4934" t="7786" r="5798" b="7987">languages</wd>

<space/>

</ln>

<ln l="1882" t="8059" r="5808" b="8261" baseLine="8208" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1882" t="8112" r="2141" b="8218">are</wd>

<space/>

<wd l="2213" t="8059" r="3058" b="8218">annotated</wd>

<space/>

<wd l="3120" t="8059" r="3331" b="8261">by</wd>

<space/>

<wd l="3398" t="8059" r="3667" b="8218">the</wd>

<space/>

<wd l="3734" t="8064" r="3883" b="8218">O</wd>

<space/>

<wd l="3950" t="8083" r="4214" b="8261">tag</wd>

<space/>

<wd l="4286" t="8059" r="4598" b="8218">and</wd>

<space/>

<wd l="4661" t="8083" r="4939" b="8218">not</wd>

<space/>

<wd l="5002" t="8059" r="5645" b="8218">include</wd>

<space/>

<wd l="5712" t="8112" r="5808" b="8218">a</wd>

<space/>

</ln>

<ln l="1877" t="8328" r="5803" b="8530" baseLine="8482" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1877" t="8328" r="2458" b="8486">named</wd>

<space/>

<wd l="2510" t="8328" r="3034" b="8530">entity.</wd>

<space/>

<wd l="3110" t="8333" r="3931" b="8515">However,</wd>

<space/>

<wd l="4003" t="8381" r="4454" b="8486">some</wd>

<space/>

<wd l="4502" t="8328" r="5026" b="8486">words</wd>

<space/>

<wd l="5083" t="8328" r="5486" b="8486">have</wd>

<space/>

<wd l="5539" t="8328" r="5803" b="8486">the</wd>

<space/>

</ln>

<ln l="1886" t="8602" r="5794" b="8803" baseLine="8750" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1886" t="8654" r="2323" b="8760">same</wd>

<space/>

<wd l="2414" t="8602" r="3091" b="8803">spelling</wd>

<space/>

<wd l="3178" t="8654" r="3350" b="8760">as</wd>

<space/>

<wd l="3442" t="8654" r="3638" b="8760">an</wd>

<space/>

<wd l="3720" t="8602" r="4387" b="8803">English</wd>

<space/>

<wd l="4469" t="8602" r="4915" b="8760">word</wd>

<space/>

<wd l="4997" t="8602" r="5309" b="8760">and</wd>

<space/>

<wd l="5386" t="8602" r="5794" b="8789">thus,</wd>

<space/>

</ln>

<ln l="1882" t="8870" r="5808" b="9072" baseLine="9024" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1882" t="8870" r="2544" b="9029">activate</wd>

<space/>

<wd l="2606" t="8870" r="2875" b="9029">the</wd>

<space/>

<wd l="2942" t="8894" r="3730" b="9072">gazetteer</wd>

<space/>

<wd l="3787" t="8870" r="4522" b="9029">features.</wd>

<space/>

<wd l="4627" t="8870" r="5006" b="9029">This</wd>

<space/>

<wd l="5078" t="8870" r="5808" b="9072">problem</wd>

<space/>

</ln>

<ln l="1877" t="9144" r="5808" b="9346" baseLine="9293" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1877" t="9144" r="2318" b="9302">leads</wd>

<space/>

<wd l="2376" t="9168" r="2544" b="9302">to</wd>

<space/>

<wd l="2597" t="9144" r="3120" b="9302">words</wd>

<space/>

<wd l="3178" t="9144" r="3566" b="9302">with</wd>

<space/>

<wd l="3614" t="9144" r="3883" b="9302">the</wd>

<space/>

<wd l="3936" t="9149" r="4085" b="9302">O</wd>

<space/>

<wd l="4142" t="9168" r="4406" b="9346">tag</wd>

<space/>

<wd l="4459" t="9144" r="4939" b="9346">being</wd>

<space/>

<wd l="4992" t="9144" r="5808" b="9346">predicted</wd>

<space/>

</ln>

<ln l="1882" t="9413" r="3869" b="9614" baseLine="9562" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1882" t="9466" r="2050" b="9571">as</wd>

<space/>

<wd l="2117" t="9466" r="2213" b="9571">a</wd>

<space/>

<wd l="2266" t="9413" r="2846" b="9571">named</wd>

<space/>

<wd l="2904" t="9413" r="3394" b="9614">entity</wd>

<space/>

<wd l="3451" t="9437" r="3869" b="9614">type.</wd>

</ln>

</para>

<para l="1454" t="9821" r="5808" b="14088" alignment="justified" li="432" spaceBefore="155" fli="-432" lsp="exactly" lspExact="270" language="en">

<ln l="1454" t="9821" r="5798" b="10022" baseLine="9970">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1454" t="9826" r="1906" b="10022">Type</wd>

<space/>

<wd l="1963" t="9821" r="3461" b="10022">disambiguation:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="3576" t="9821" r="4085" b="9979">There</wd>

<space/>

<wd l="4243" t="9874" r="4502" b="9979">are</wd>

<space/>

<wd l="4670" t="9874" r="5117" b="9979">some</wd>

<space/>

<wd l="5275" t="9821" r="5798" b="9979">words</wd>

<space/>

</run>

</ln>

<ln l="1877" t="10090" r="5794" b="10291" baseLine="10243" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1877" t="10090" r="2203" b="10248">that</wd>

<space/>

<wd l="2261" t="10090" r="2664" b="10248">have</wd>

<space/>

<wd l="2717" t="10090" r="2986" b="10248">the</wd>

<space/>

<wd l="3048" t="10142" r="3485" b="10248">same</wd>

<space/>

<wd l="3552" t="10090" r="4229" b="10291">spelling</wd>

<space/>

<wd l="4286" t="10090" r="4565" b="10248">but</wd>

<space/>

<wd l="4618" t="10090" r="5208" b="10291">belong</wd>

<space/>

<wd l="5266" t="10114" r="5434" b="10248">to</wd>

<space/>

<wd l="5496" t="10090" r="5794" b="10248">dif-</wd>

</ln>

<ln l="1877" t="10363" r="5794" b="10565" baseLine="10512" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1877" t="10363" r="2386" b="10522">ferent</wd>

<space/>

<wd l="2472" t="10387" r="2923" b="10565">types</wd>

<space/>

<wd l="3024" t="10363" r="3874" b="10565">according</wd>

<space/>

<wd l="3965" t="10387" r="4128" b="10522">to</wd>

<space/>

<wd l="4219" t="10363" r="4483" b="10522">the</wd>

<space/>

<wd l="4574" t="10363" r="5472" b="10522">contextual</wd>

<space/>

<wd l="5563" t="10363" r="5794" b="10517">in-</wd>

</ln>

<ln l="1877" t="10632" r="5808" b="10790" baseLine="10786" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1877" t="10632" r="2779" b="10790">formation.</wd>

<space/>

<wd l="2947" t="10632" r="3326" b="10790">This</wd>

<space/>

<wd l="3422" t="10685" r="3845" b="10790">error</wd>

<space/>

<wd l="3922" t="10632" r="4061" b="10790">is</wd>

<space/>

<wd l="4157" t="10632" r="4603" b="10790">often</wd>

<space/>

<wd l="4690" t="10632" r="5467" b="10790">observed</wd>

<space/>

<wd l="5549" t="10632" r="5808" b="10790">for</wd>

<space/>

</ln>

<ln l="1877" t="10906" r="5794" b="11107" baseLine="11054">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1877" t="10906" r="2458" b="11064">named</wd>

<space/>

<wd l="2525" t="10906" r="3144" b="11064">entities</wd>

<space/>

<wd l="3226" t="10906" r="3614" b="11064">such</wd>

<space/>

<wd l="3682" t="10958" r="3850" b="11064">as</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="3922" t="10939" r="4877" b="11107">sportsteam</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="4949" t="10906" r="5261" b="11064">and</wd>

<space/>

</run>

<wd l="5318" t="10915" r="5794" b="11064" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">musi-</wd>

</ln>

<ln l="1882" t="11174" r="5808" b="11376" baseLine="11328">

<wd l="1882" t="11184" r="2477" b="11333"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">cartist</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="2626" t="11174" r="2962" b="11333">The</wd>

<space/>

<wd l="3038" t="11174" r="3490" b="11333">word</wd>

<space/>

<wd l="3571" t="11227" r="4440" b="11376">sequences</wd>

<space/>

<wd l="4526" t="11174" r="4915" b="11333">with</wd>

<space/>

<wd l="4987" t="11174" r="5294" b="11333">this</wd>

<space/>

<wd l="5386" t="11227" r="5808" b="11333">error</wd>

<space/>

</run>

</ln>

<ln l="1877" t="11448" r="5794" b="11650" baseLine="11597" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1877" t="11448" r="2280" b="11606">have</wd>

<space/>

<wd l="2362" t="11501" r="2458" b="11606">a</wd>

<space/>

<wd l="2530" t="11448" r="3298" b="11650">correctly</wd>

<space/>

<wd l="3384" t="11448" r="4541" b="11650">distinguished</wd>

<space/>

<wd l="4622" t="11448" r="5107" b="11650">entity</wd>

<space/>

<wd l="5189" t="11448" r="5794" b="11606">bound-</wd>

</ln>

<ln l="1882" t="11717" r="5794" b="11918" baseLine="11870" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1882" t="11770" r="2150" b="11918">ary</wd>

<space/>

<wd l="2208" t="11717" r="2486" b="11875">but</wd>

<space/>

<wd l="2539" t="11717" r="3144" b="11918">predict</wd>

<space/>

<wd l="3197" t="11717" r="3461" b="11875">the</wd>

<space/>

<wd l="3518" t="11770" r="4070" b="11918">wrong</wd>

<space/>

<wd l="4133" t="11717" r="4622" b="11918">entity</wd>

<space/>

<wd l="4680" t="11741" r="5098" b="11918">type.</wd>

<space/>

<wd l="5174" t="11722" r="5482" b="11875">For</wd>

<space/>

<wd l="5534" t="11770" r="5794" b="11875">ex-</wd>

</ln>

<ln l="1882" t="11990" r="5798" b="12192" baseLine="12139">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1882" t="11990" r="2453" b="12192">ample,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="2520" t="12000" r="3091" b="12192">Tampa</wd>

<space/>

<wd l="3134" t="12000" r="3480" b="12192">Bay</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="3523" t="11990" r="3691" b="12144">in</wd>

<space/>

<wd l="3739" t="11990" r="4435" b="12192">“Losing</wd>

<space/>

<wd l="4483" t="12014" r="4646" b="12149">to</wd>

<space/>

<wd l="4694" t="11990" r="4963" b="12149">the</wd>

<space/>

<wd l="5006" t="11990" r="5798" b="12192">Penguins</wd>

<space/>

</run>

</ln>

<ln l="1882" t="12259" r="5803" b="12461" baseLine="12408" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1882" t="12259" r="2861" b="12461">quasi-AHL</wd>

<space/>

<wd l="2899" t="12259" r="3442" b="12461">lineup</wd>

<space/>

<wd l="3490" t="12259" r="3662" b="12413">in</wd>

<space/>

<wd l="3701" t="12259" r="4603" b="12418">December</wd>

<space/>

<wd l="4642" t="12259" r="4781" b="12418">is</wd>

<space/>

<wd l="4834" t="12312" r="4930" b="12418">a</wd>

<space/>

<wd l="4968" t="12259" r="5803" b="12418">non-issue</wd>

<space/>

</ln>

<ln l="1877" t="12533" r="5794" b="12734" baseLine="12682">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1877" t="12533" r="2136" b="12691">for</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="2218" t="12542" r="2789" b="12734">Tampa</wd>

<space/>

</run>

<wd l="2866" t="12538" r="3302" b="12734"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">Bay</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">”</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="3384" t="12533" r="3518" b="12691">is</wd>

<space/>

<wd l="3610" t="12586" r="3806" b="12691">an</wd>

<space/>

<wd l="3893" t="12533" r="4382" b="12734">entity</wd>

<space/>

<wd l="4464" t="12533" r="4718" b="12691">for</wd>

<space/>

</run>

<wd l="4795" t="12566" r="5794" b="12734"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">sportsteam</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

</run>

</ln>

<ln l="1877" t="12802" r="5808" b="13003" baseLine="12950">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1877" t="12802" r="2150" b="12960">but</wd>

<space/>

<wd l="2218" t="12802" r="2486" b="12960">the</wd>

<space/>

<wd l="2554" t="12802" r="3096" b="12960">model</wd>

<space/>

<wd l="3173" t="12802" r="3950" b="12960">classifies</wd>

<space/>

<wd l="4027" t="12802" r="4147" b="12960">it</wd>

<space/>

<wd l="4219" t="12854" r="4392" b="12960">as</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="4464" t="12802" r="5117" b="13003">geo-loc</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="5189" t="12802" r="5808" b="12960">instead</wd>

<space/>

</run>

</ln>

<ln l="1882" t="13070" r="5798" b="13272" baseLine="13224">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1882" t="13070" r="2074" b="13229">of</wd>

<space/>

</run>

<wd l="2102" t="13104" r="3101" b="13272"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">sportsteam</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="3178" t="13075" r="3360" b="13224">In</wd>

<space/>

<wd l="3408" t="13070" r="4061" b="13229">another</wd>

<space/>

<wd l="4104" t="13070" r="4882" b="13272">example,</wd>

<space/>

<wd l="4939" t="13070" r="5203" b="13229">the</wd>

<space/>

<wd l="5246" t="13123" r="5798" b="13229">names</wd>

<space/>

</run>

</ln>

<ln l="1882" t="13344" r="5808" b="13517" baseLine="13493">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1882" t="13344" r="2074" b="13502">of</wd>

<space/>

<wd l="2126" t="13368" r="2448" b="13502">two</wd>

<space/>

<wd l="2520" t="13344" r="3034" b="13502">music</wd>

<space/>

<wd l="3110" t="13344" r="3619" b="13502">artists</wd>

<space/>

<wd l="3696" t="13344" r="3869" b="13498">in</wd>

<space/>

<wd l="3941" t="13344" r="4406" b="13502">“Will</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="4478" t="13344" r="5054" b="13502">Shawn</wd>

<space/>

<wd l="5122" t="13344" r="5808" b="13517">Mendez</wd>

<space/>

</run>

</ln>

<ln l="1877" t="13613" r="5808" b="13814" baseLine="13766">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1877" t="13613" r="2083" b="13771">be</wd>

<space/>

<wd l="2141" t="13613" r="2837" b="13814">opening</wd>

<space/>

<wd l="2890" t="13666" r="3106" b="13814">up</wd>

<space/>

<wd l="3163" t="13613" r="3422" b="13771">for</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="3480" t="13613" r="4037" b="13814">Taylor</wd>

<space/>

</run>

<wd l="4085" t="13618" r="4618" b="13814"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">Swift</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">”</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="4680" t="13666" r="4939" b="13771">are</wd>

<space/>

<wd l="4992" t="13613" r="5808" b="13814">predicted</wd>

<space/>

</run>

</ln>

<ln l="1882" t="13886" r="4709" b="14088" baseLine="14035">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1882" t="13939" r="2050" b="14045">as</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="2093" t="13939" r="2702" b="14088">person</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="2765" t="13886" r="3077" b="14045">and</wd>

<space/>

<wd l="3130" t="13910" r="3408" b="14045">not</wd>

<space/>

<wd l="3466" t="13939" r="3634" b="14045">as</wd>

<space/>

</run>

<wd l="3696" t="13896" r="4709" b="14045"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">musicartist</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1450" t="14294" r="5803" b="15264" alignment="justified" li="432" spaceBefore="142" fli="-432" lsp="exactly" lspExact="267" language="en">

<ln l="1450" t="14294" r="5798" b="14453" baseLine="14443">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="14294" r="2275" b="14453">Informal</wd>

<space/>

<wd l="2333" t="14342" r="2842" b="14453">name</wd>

<space/>

<wd l="2904" t="14342" r="3106" b="14453">or</wd>

<space/>

<wd l="3163" t="14294" r="4478" b="14453">abbreviations:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4594" t="14294" r="5222" b="14453">Twitter</wd>

<space/>

<wd l="5357" t="14347" r="5798" b="14453">users</wd>

<space/>

</run>

</ln>

<ln l="1882" t="14563" r="5803" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="14616" r="2693" b="14765">compress</wd>

<space/>

<wd l="2770" t="14563" r="3197" b="14722">what</wd>

<space/>

<wd l="3264" t="14563" r="3634" b="14765">they</wd>

<space/>

<wd l="3710" t="14587" r="4133" b="14722">want</wd>

<space/>

<wd l="4200" t="14587" r="4368" b="14722">to</wd>

<space/>

<wd l="4450" t="14616" r="4728" b="14765">say</wd>

<space/>

<wd l="4805" t="14587" r="4968" b="14722">to</wd>

<space/>

<wd l="5045" t="14587" r="5472" b="14722">meet</wd>

<space/>

<wd l="5539" t="14563" r="5803" b="14722">the</wd>

<space/>

</ln>

<ln l="1877" t="14837" r="5794" b="14995" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="14837" r="2290" b="14995">limit</wd>

<space/>

<wd l="2395" t="14837" r="2587" b="14995">of</wd>

<space/>

<wd l="2698" t="14842" r="3000" b="14995">140</wd>

<space/>

<wd l="3110" t="14837" r="4032" b="14995">characters.</wd>

<space/>

<wd l="4253" t="14837" r="4632" b="14995">This</wd>

<space/>

<wd l="4742" t="14837" r="5184" b="14995">leads</wd>

<space/>

<wd l="5290" t="14861" r="5458" b="14995">to</wd>

<space/>

<wd l="5563" t="14837" r="5794" b="14990">in-</wd>

</ln>

<ln l="1877" t="15106" r="5803" b="15264" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="15106" r="2453" b="15264">formal</wd>

<space/>

<wd l="2554" t="15130" r="2957" b="15264">texts</wd>

<space/>

<wd l="3058" t="15106" r="3600" b="15264">unlike</wd>

<space/>

<wd l="3701" t="15106" r="3869" b="15259">in</wd>

<space/>

<wd l="3965" t="15158" r="4402" b="15264">news</wd>

<space/>

<wd l="4507" t="15106" r="5179" b="15264">articles.</wd>

<space/>

<wd l="5381" t="15110" r="5803" b="15264">Note</wd>

</ln>

</para>

</column>

<column l="6144" t="6503" r="10531" b="15317">

<para l="6576" t="6566" r="10526" b="10022" alignment="justified" li="432" spaceBefore="15" lsp="exactly" lspExact="270" language="en">

<ln l="6581" t="6566" r="10502" b="6725" baseLine="6715" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6581" t="6566" r="6912" b="6725">that</wd>

<space/>

<wd l="6970" t="6566" r="8126" b="6725">abbreviations</wd>

<space/>

<wd l="8194" t="6566" r="8405" b="6725">do</wd>

<space/>

<wd l="8462" t="6590" r="8741" b="6725">not</wd>

<space/>

<wd l="8794" t="6566" r="9485" b="6725">indicate</wd>

<space/>

<wd l="9547" t="6566" r="10152" b="6725">official</wd>

<space/>

<wd l="10210" t="6566" r="10502" b="6725">full</wd>

<space/>

</ln>

<ln l="6581" t="6840" r="10502" b="7042" baseLine="6989" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6581" t="6840" r="7085" b="6998">forms</wd>

<space/>

<wd l="7171" t="6840" r="7565" b="6998">such</wd>

<space/>

<wd l="7642" t="6893" r="7810" b="6998">as</wd>

<space/>

<wd l="7896" t="6840" r="8549" b="7042">airports</wd>

<space/>

<wd l="8635" t="6893" r="8818" b="6998">or</wd>

<space/>

<wd l="8890" t="6840" r="9730" b="6998">countries.</wd>

<space/>

<wd l="9864" t="6845" r="10166" b="6998">For</wd>

<space/>

<wd l="10238" t="6893" r="10502" b="6998">ex-</wd>

</ln>

<ln l="6586" t="7109" r="10512" b="7310" baseLine="7258">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6586" t="7109" r="7157" b="7310">ample,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7224" t="7109" r="7872" b="7267">Southie</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7934" t="7109" r="8107" b="7262">in</wd>

<space/>

<wd l="8165" t="7109" r="8779" b="7267">“Proud</wd>

<space/>

<wd l="8832" t="7109" r="9158" b="7267">that</wd>

<space/>

<wd l="9211" t="7109" r="9480" b="7267">the</wd>

<space/>

<wd l="9557" t="7114" r="9792" b="7267">1st</wd>

<space/>

<wd l="9845" t="7109" r="10512" b="7267">modern</wd>

<space/>

</run>

</ln>

<ln l="6586" t="7378" r="10502" b="7579" baseLine="7531" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6586" t="7378" r="7339" b="7579">Olympic</wd>

<space/>

<wd l="7430" t="7378" r="8338" b="7579">Champion</wd>

<space/>

<wd l="8414" t="7378" r="8554" b="7536">is</wd>

<space/>

<wd l="8640" t="7382" r="9168" b="7536">James</wd>

<space/>

<wd l="9254" t="7378" r="9989" b="7536">Brendan</wd>

<space/>

<wd l="10080" t="7382" r="10502" b="7536">Con-</wd>

</ln>

<ln l="6581" t="7651" r="10526" b="7853" baseLine="7800">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6581" t="7651" r="7027" b="7853">nolly</wd>

<space/>

<wd l="7109" t="7651" r="7301" b="7810">of</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7358" t="7651" r="8117" b="7810">#Southie</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8213" t="7656" r="8328" b="7810">.”</wd>

<space/>

<wd l="8458" t="7651" r="8597" b="7810">is</wd>

<space/>

<wd l="8683" t="7704" r="8880" b="7810">an</wd>

<space/>

<wd l="8957" t="7651" r="9706" b="7810">informal</wd>

<space/>

<wd l="9782" t="7704" r="10253" b="7810">name</wd>

<space/>

<wd l="10334" t="7651" r="10526" b="7810">of</wd>

<space/>

</run>

</ln>

<ln l="6581" t="7920" r="10517" b="8122" baseLine="8074">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6581" t="7920" r="7075" b="8078">South</wd>

<space/>

</run>

<wd l="7138" t="7930" r="7790" b="8107"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">Boston</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="7872" t="7920" r="8179" b="8078">and</wd>

<space/>

<wd l="8242" t="7920" r="8549" b="8078">this</wd>

<space/>

<wd l="8621" t="7920" r="9067" b="8078">word</wd>

<space/>

<wd l="9130" t="7920" r="9518" b="8078">does</wd>

<space/>

<wd l="9590" t="7944" r="9869" b="8078">not</wd>

<space/>

<wd l="9936" t="7973" r="10517" b="8122">appear</wd>

<space/>

</run>

</ln>

<ln l="6581" t="8194" r="10502" b="8395" baseLine="8342" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6581" t="8194" r="6754" b="8347">in</wd>

<space/>

<wd l="6835" t="8194" r="7099" b="8352">the</wd>

<space/>

<wd l="7186" t="8194" r="7862" b="8395">training</wd>

<space/>

<wd l="7958" t="8218" r="8194" b="8352">set</wd>

<space/>

<wd l="8280" t="8194" r="8592" b="8352">and</wd>

<space/>

<wd l="8678" t="8218" r="9590" b="8395">gazetteers.</wd>

<space/>

<wd l="9758" t="8194" r="10186" b="8352">With</wd>

<space/>

<wd l="10267" t="8246" r="10502" b="8352">re-</wd>

</ln>

<ln l="6590" t="8462" r="10502" b="8664" baseLine="8616" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6590" t="8486" r="7032" b="8664">spect</wd>

<space/>

<wd l="7094" t="8486" r="7262" b="8621">to</wd>

<space/>

<wd l="7339" t="8462" r="8544" b="8650">abbreviations,</wd>

<space/>

<wd l="8626" t="8462" r="9206" b="8664">people</wd>

<space/>

<wd l="9274" t="8515" r="9566" b="8621">use</wd>

<space/>

<wd l="9638" t="8462" r="10502" b="8621">abbreviat-</wd>

</ln>

<ln l="6581" t="8736" r="10502" b="8938" baseLine="8885" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6581" t="8736" r="6998" b="8894">tions</wd>

<space/>

<wd l="7061" t="8736" r="7320" b="8894">for</wd>

<space/>

<wd l="7368" t="8736" r="8242" b="8938">indicating</wd>

<space/>

<wd l="8304" t="8789" r="8400" b="8894">a</wd>

<space/>

<wd l="8453" t="8736" r="8760" b="8938">day</wd>

<space/>

<wd l="8822" t="8789" r="9005" b="8894">or</wd>

<space/>

<wd l="9062" t="8789" r="9158" b="8894">a</wd>

<space/>

<wd l="9206" t="8736" r="9806" b="8923">month,</wd>

<space/>

<wd l="9883" t="8736" r="10277" b="8894">such</wd>

<space/>

<wd l="10334" t="8789" r="10502" b="8894">as</wd>

<space/>

</ln>

<ln l="6576" t="9005" r="10512" b="9206" baseLine="9158">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6576" t="9014" r="6979" b="9163">Mon</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7042" t="9005" r="7301" b="9163">for</wd>

<space/>

<wd l="7354" t="9005" r="8078" b="9206">Monday</wd>

<space/>

<wd l="8146" t="9005" r="8458" b="9163">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8506" t="9014" r="8818" b="9163">Jan</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8880" t="9005" r="9139" b="9163">for</wd>

<space/>

<wd l="9192" t="9010" r="9898" b="9206">January.</wd>

<space/>

<wd l="9989" t="9005" r="10512" b="9163">These</wd>

<space/>

</run>

</ln>

<ln l="6581" t="9278" r="10512" b="9480" baseLine="9427" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6581" t="9278" r="7104" b="9437">words</wd>

<space/>

<wd l="7162" t="9331" r="7421" b="9437">are</wd>

<space/>

<wd l="7469" t="9278" r="8314" b="9437">contained</wd>

<space/>

<wd l="8357" t="9278" r="8530" b="9432">in</wd>

<space/>

<wd l="8578" t="9302" r="9432" b="9480">gazetteers</wd>

<space/>

<wd l="9490" t="9278" r="9802" b="9437">and</wd>

<space/>

<wd l="9850" t="9278" r="10512" b="9437">activate</wd>

<space/>

</ln>

<ln l="6581" t="9547" r="10502" b="9749" baseLine="9696" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6581" t="9547" r="6850" b="9706">the</wd>

<space/>

<wd l="6912" t="9571" r="7694" b="9749">gazetteer</wd>

<space/>

<wd l="7752" t="9547" r="8482" b="9706">features.</wd>

<space/>

<wd l="8573" t="9552" r="8731" b="9701">A</wd>

<space/>

<wd l="8789" t="9547" r="9331" b="9706">model</wd>

<space/>

<wd l="9389" t="9547" r="9936" b="9706">makes</wd>

<space/>

<wd l="10008" t="9600" r="10502" b="9706">errors</wd>

<space/>

</ln>

<ln l="6581" t="9821" r="9830" b="10022" baseLine="9970" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6581" t="9821" r="6797" b="10022">by</wd>

<space/>

<wd l="6854" t="9821" r="7738" b="10022">predicting</wd>

<space/>

<wd l="7795" t="9821" r="8232" b="9979">them</wd>

<space/>

<wd l="8290" t="9874" r="8458" b="9979">as</wd>

<space/>

<wd l="8520" t="9821" r="9106" b="9979">named</wd>

<space/>

<wd l="9163" t="9821" r="9830" b="9979">entities.</wd>

</ln>

</para>

<para l="6154" t="10258" r="10512" b="12355" alignment="justified" li="432" spaceBefore="172" fli="-432" lsp="exactly" lspExact="270" language="en">

<ln l="6154" t="10258" r="10507" b="10459" baseLine="10406">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6154" t="10262" r="6989" b="10459">Hashtag:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7104" t="10262" r="7262" b="10411">A</wd>

<space/>

<wd l="7330" t="10258" r="7997" b="10459">hashtag</wd>

<space/>

<wd l="8069" t="10258" r="8208" b="10416">is</wd>

<space/>

<wd l="8290" t="10310" r="8386" b="10416">a</wd>

<space/>

<wd l="8458" t="10258" r="9547" b="10416">combination</wd>

<space/>

<wd l="9624" t="10258" r="9811" b="10416">of</wd>

<space/>

<wd l="9869" t="10258" r="10138" b="10416">the</wd>

<space/>

<wd l="10214" t="10262" r="10507" b="10411">“#”</wd>

<space/>

</run>

</ln>

<ln l="6590" t="10526" r="10512" b="10728" baseLine="10675" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6590" t="10526" r="6946" b="10728">sign</wd>

<space/>

<wd l="6998" t="10526" r="7310" b="10685">and</wd>

<space/>

<wd l="7363" t="10579" r="7814" b="10685">some</wd>

<space/>

<wd l="7862" t="10526" r="8736" b="10685">characters</wd>

<space/>

<wd l="8789" t="10526" r="9048" b="10685">for</wd>

<space/>

<wd l="9096" t="10526" r="10018" b="10728">organizing</wd>

<space/>

<wd l="10066" t="10526" r="10512" b="10685">word</wd>

<space/>

</ln>

<ln l="6590" t="10795" r="10512" b="10997" baseLine="10949" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6590" t="10848" r="7459" b="10997">sequences</wd>

<space/>

<wd l="7526" t="10848" r="7694" b="10954">as</wd>

<space/>

<wd l="7766" t="10795" r="8678" b="10954">searchable</wd>

<space/>

<wd l="8731" t="10795" r="9149" b="10954">links</wd>

<space/>

<wd l="9211" t="10795" r="9384" b="10949">in</wd>

<space/>

<wd l="9437" t="10795" r="10094" b="10954">Twitter.</wd>

<space/>

<wd l="10171" t="10795" r="10512" b="10954">The</wd>

<space/>

</ln>

<ln l="6581" t="11069" r="10502" b="11270" baseLine="11218" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6581" t="11069" r="6922" b="11227">rule</wd>

<space/>

<wd l="6974" t="11069" r="7109" b="11227">is</wd>

<space/>

<wd l="7171" t="11093" r="7339" b="11227">to</wd>

<space/>

<wd l="7392" t="11093" r="7675" b="11227">not</wd>

<space/>

<wd l="7723" t="11122" r="8016" b="11227">use</wd>

<space/>

<wd l="8074" t="11122" r="8376" b="11270">any</wd>

<space/>

<wd l="8443" t="11122" r="8914" b="11270">space</wd>

<space/>

<wd l="8971" t="11069" r="9696" b="11227">between</wd>

<space/>

<wd l="9749" t="11069" r="10013" b="11227">the</wd>

<space/>

<wd l="10070" t="11069" r="10502" b="11227">char-</wd>

</ln>

<ln l="6586" t="11338" r="10512" b="11539" baseLine="11491" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6586" t="11362" r="7085" b="11496">acters</wd>

<space/>

<wd l="7157" t="11338" r="7325" b="11491">in</wd>

<space/>

<wd l="7387" t="11338" r="7656" b="11496">the</wd>

<space/>

<wd l="7718" t="11338" r="8429" b="11539">hashtag.</wd>

<space/>

<wd l="8534" t="11342" r="8837" b="11496">For</wd>

<space/>

<wd l="8899" t="11338" r="9658" b="11525">instance,</wd>

<space/>

<wd l="9734" t="11338" r="9998" b="11496">the</wd>

<space/>

<wd l="10066" t="11338" r="10512" b="11496">word</wd>

<space/>

</ln>

<ln l="6576" t="11611" r="10507" b="11770" baseLine="11760">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6576" t="11621" r="6965" b="11770">New</wd>

<space/>

<wd l="7070" t="11611" r="7555" b="11770">Delhi</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7670" t="11611" r="7805" b="11770">is</wd>

<space/>

<wd l="7920" t="11611" r="8976" b="11770">transformed</wd>

<space/>

<wd l="9086" t="11611" r="9422" b="11770">into</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="9533" t="11611" r="10507" b="11770">#NewDelhi</wd>

<space/>

</run>

</ln>

<ln l="6586" t="11880" r="10512" b="12082" baseLine="12034" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6586" t="11933" r="6754" b="12038">as</wd>

<space/>

<wd l="6859" t="11933" r="6955" b="12038">a</wd>

<space/>

<wd l="7046" t="11880" r="7757" b="12082">hashtag,</wd>

<space/>

<wd l="7877" t="11933" r="8059" b="12038">so</wd>

<space/>

<wd l="8155" t="11880" r="8275" b="12038">it</wd>

<space/>

<wd l="8366" t="11880" r="8506" b="12038">is</wd>

<space/>

<wd l="8611" t="11880" r="9293" b="12038">difficult</wd>

<space/>

<wd l="9384" t="11904" r="9547" b="12038">to</wd>

<space/>

<wd l="9648" t="11880" r="10152" b="12038">check</wd>

<space/>

<wd l="10243" t="11880" r="10512" b="12038">the</wd>

<space/>

</ln>

<ln l="6586" t="12154" r="9331" b="12355" baseLine="12302" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6586" t="12178" r="7373" b="12355">gazetteer</wd>

<space/>

<wd l="7421" t="12154" r="8141" b="12312">lexicons</wd>

<space/>

<wd l="8203" t="12154" r="8458" b="12312">for</wd>

<space/>

<wd l="8520" t="12154" r="8914" b="12312">such</wd>

<space/>

<wd l="8966" t="12178" r="9331" b="12312">text.</wd>

</ln>

</para>

<para l="6149" t="12590" r="10070" b="12792" alignment="left" spaceBefore="187" lsp="exactly" lspExact="253" language="en">

<ln l="6149" t="12590" r="10070" b="12792" baseLine="12739" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">

<wd l="6149" t="12590" r="6413" b="12749">5.2</wd>

<space/>

<wd l="6643" t="12595" r="6998" b="12749">The</wd>

<space/>

<wd l="7061" t="12590" r="8208" b="12749">effectiveness</wd>

<space/>

<wd l="8275" t="12590" r="8462" b="12749">of</wd>

<space/>

<wd l="8510" t="12595" r="8986" b="12749">word</wd>

<space/>

<wd l="9048" t="12590" r="10070" b="12792">embedding</wd>

</ln>

</para>

<para l="6144" t="12941" r="10512" b="14496" alignment="justified" spaceBefore="81" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="12941" r="10502" b="13128" baseLine="13090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12946" r="6326" b="13094">In</wd>

<space/>

<wd l="6413" t="12941" r="6720" b="13099">this</wd>

<space/>

<wd l="6821" t="12941" r="7776" b="13128">subsection,</wd>

<space/>

<wd l="7882" t="12994" r="8136" b="13099">we</wd>

<space/>

<wd l="8227" t="12941" r="8947" b="13099">describe</wd>

<space/>

<wd l="9034" t="12941" r="9302" b="13099">the</wd>

<space/>

<wd l="9389" t="12941" r="10502" b="13099">effectiveness</wd>

<space/>

</ln>

<ln l="6149" t="13210" r="10502" b="13411" baseLine="13358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13210" r="6341" b="13368">of</wd>

<space/>

<wd l="6470" t="13210" r="6917" b="13368">word</wd>

<space/>

<wd l="7066" t="13210" r="8030" b="13411">embedding</wd>

<space/>

<wd l="8174" t="13210" r="8390" b="13411">by</wd>

<space/>

<wd l="8544" t="13210" r="9384" b="13411">analyzing</wd>

<space/>

<wd l="9533" t="13210" r="9797" b="13368">the</wd>

<space/>

<wd l="9941" t="13210" r="10502" b="13368">results</wd>

<space/>

</ln>

<ln l="6149" t="13478" r="10512" b="13680" baseLine="13632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13478" r="6898" b="13637">obtained</wd>

<space/>

<wd l="7003" t="13478" r="7219" b="13680">by</wd>

<space/>

<wd l="7325" t="13478" r="7795" b="13680">using</wd>

<space/>

<wd l="7906" t="13478" r="8170" b="13637">the</wd>

<space/>

<wd l="8280" t="13478" r="8822" b="13637">model</wd>

<space/>

<wd l="8928" t="13478" r="9317" b="13637">with</wd>

<space/>

<wd l="9427" t="13478" r="9739" b="13637">and</wd>

<space/>

<wd l="9845" t="13478" r="10512" b="13637">without</wd>

<space/>

</ln>

<ln l="6144" t="13752" r="10512" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13752" r="6595" b="13910">word</wd>

<space/>

<wd l="6691" t="13752" r="7699" b="13954">embedding.</wd>

<space/>

<wd l="7896" t="13752" r="8232" b="13910">The</wd>

<space/>

<wd l="8333" t="13752" r="8712" b="13954">only</wd>

<space/>

<wd l="8818" t="13752" r="9691" b="13910">difference</wd>

<space/>

<wd l="9782" t="13752" r="10512" b="13910">between</wd>

<space/>

</ln>

<ln l="6144" t="14021" r="10512" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14021" r="6533" b="14179">both</wd>

<space/>

<wd l="6586" t="14021" r="6850" b="14179">the</wd>

<space/>

<wd l="6902" t="14021" r="7526" b="14179">models</wd>

<space/>

<wd l="7589" t="14021" r="7723" b="14179">is</wd>

<space/>

<wd l="7786" t="14021" r="8050" b="14179">the</wd>

<space/>

<wd l="8102" t="14074" r="8390" b="14179">use</wd>

<space/>

<wd l="8453" t="14021" r="8640" b="14179">of</wd>

<space/>

<wd l="8678" t="14021" r="9230" b="14179">brown</wd>

<space/>

<wd l="9288" t="14021" r="10142" b="14222">clustering</wd>

<space/>

<wd l="10200" t="14021" r="10512" b="14179">and</wd>

<space/>

</ln>

<ln l="6144" t="14294" r="9576" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14294" r="6413" b="14453">the</wd>

<space/>

<wd l="6466" t="14294" r="6912" b="14453">word</wd>

<space/>

<wd l="6970" t="14294" r="8203" b="14496">representation</wd>

<space/>

<wd l="8256" t="14294" r="8755" b="14453">based</wd>

<space/>

<wd l="8813" t="14347" r="9029" b="14453">on</wd>

<space/>

<wd l="9086" t="14299" r="9576" b="14453">CCA.</wd>

</ln>

</para>

<para l="6144" t="14563" r="10512" b="15307" alignment="justified" spaceBefore="6" lsp="exactly" lspExact="266" language="en">

<ln l="6144" t="14563" r="10502" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14568" r="6326" b="14717">In</wd>

<space/>

<wd l="6413" t="14563" r="6677" b="14722">the</wd>

<space/>

<wd l="6763" t="14568" r="7200" b="14722">NER</wd>

<space/>

<wd l="7286" t="14563" r="7680" b="14750">task,</wd>

<space/>

<wd l="7786" t="14563" r="8050" b="14722">the</wd>

<space/>

<wd l="8136" t="14568" r="8342" b="14717">F1</wd>

<space/>

<wd l="8462" t="14616" r="8909" b="14722">score</wd>

<space/>

<wd l="8995" t="14563" r="9134" b="14722">is</wd>

<space/>

<wd l="9230" t="14616" r="9326" b="14722">a</wd>

<space/>

<wd l="9408" t="14616" r="9854" b="14722">more</wd>

<space/>

<wd l="9946" t="14616" r="10502" b="14765">appro-</wd>

</ln>

<ln l="6144" t="14837" r="10512" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14837" r="6643" b="15038">priate</wd>

<space/>

<wd l="6706" t="14837" r="7258" b="14995">metric</wd>

<space/>

<wd l="7330" t="14837" r="7699" b="14995">than</wd>

<space/>

<wd l="7771" t="14890" r="8568" b="15038">accuracy.</wd>

<space/>

<wd l="8678" t="14842" r="9130" b="14995">Most</wd>

<space/>

<wd l="9197" t="14837" r="9384" b="14995">of</wd>

<space/>

<wd l="9437" t="14837" r="9701" b="14995">the</wd>

<space/>

<wd l="9768" t="14837" r="10267" b="14995">labels</wd>

<space/>

<wd l="10339" t="14837" r="10512" b="14990">in</wd>

<space/>

</ln>

<ln l="6144" t="15106" r="10512" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="15106" r="6413" b="15264">the</wd>

<space/>

<wd l="6499" t="15110" r="6936" b="15264">NER</wd>

<space/>

<wd l="7027" t="15106" r="7392" b="15264">data</wd>

<space/>

<wd l="7478" t="15106" r="8122" b="15264">contain</wd>

<space/>

<wd l="8208" t="15106" r="8472" b="15264">the</wd>

<space/>

<wd l="8563" t="15110" r="8712" b="15264">O</wd>

<space/>

<wd l="8808" t="15130" r="9115" b="15307">tag,</wd>

<space/>

<wd l="9221" t="15106" r="10094" b="15307">indicating</wd>

<space/>

<wd l="10186" t="15106" r="10512" b="15264">that</wd>

</ln>

</para>

</column>

</section>

<dd l="1437" t="15736" r="10540" b="15977">

<para l="5800" t="15787" r="6138" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5866" t="15787" r="6072" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="39">

<wd l="5866" t="15787" r="6072" b="15946">75</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4310.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1427" marginTop="1263" marginRight="1363" marginBottom="1302" offsetX="-32" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1427" t="1263" r="10546" b="15315">

<column l="1427" t="1263" r="5829" b="15315">

<para l="1440" t="1320" r="5808" b="2294" alignment="justified" spaceBefore="1" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="1320" r="5808" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="1320" r="1810" b="1522">they</wd>

<space/>

<wd l="1906" t="1373" r="2170" b="1478">are</wd>

<space/>

<wd l="2261" t="1344" r="2539" b="1478">not</wd>

<space/>

<wd l="2635" t="1373" r="2832" b="1478">an</wd>

<space/>

<wd l="2928" t="1320" r="3451" b="1522">entity.</wd>

<space/>

<wd l="3643" t="1320" r="4123" b="1478">Since</wd>

<space/>

<wd l="4214" t="1320" r="4522" b="1478">this</wd>

<space/>

<wd l="4618" t="1320" r="5059" b="1478">leads</wd>

<space/>

<wd l="5155" t="1344" r="5323" b="1478">to</wd>

<space/>

<wd l="5419" t="1320" r="5808" b="1522">high</wd>

<space/>

</ln>

<ln l="1445" t="1594" r="5803" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="1646" r="2242" b="1795">accuracy,</wd>

<space/>

<wd l="2309" t="1594" r="2525" b="1795">by</wd>

<space/>

<wd l="2582" t="1594" r="3053" b="1795">using</wd>

<space/>

<wd l="3110" t="1594" r="3379" b="1752">the</wd>

<space/>

<wd l="3437" t="1598" r="3643" b="1747">F1</wd>

<space/>

<wd l="3730" t="1646" r="4224" b="1781">score,</wd>

<space/>

<wd l="4291" t="1646" r="4546" b="1752">we</wd>

<space/>

<wd l="4608" t="1594" r="5150" b="1752">obtain</wd>

<space/>

<wd l="5208" t="1646" r="5304" b="1752">a</wd>

<space/>

<wd l="5357" t="1646" r="5803" b="1752">more</wd>

<space/>

</ln>

<ln l="1440" t="1862" r="5808" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="1862" r="2371" b="2021">reasonable</wd>

<space/>

<wd l="2424" t="1862" r="3245" b="2021">harmonic</wd>

<space/>

<wd l="3302" t="1862" r="4032" b="2021">function</wd>

<space/>

<wd l="4090" t="1862" r="4277" b="2021">of</wd>

<space/>

<wd l="4320" t="1862" r="4584" b="2021">the</wd>

<space/>

<wd l="4637" t="1862" r="5438" b="2064">precision</wd>

<space/>

<wd l="5496" t="1862" r="5808" b="2021">and</wd>

<space/>

</ln>

<ln l="1440" t="2136" r="2290" b="2294" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="2136" r="1704" b="2294">the</wd>

<space/>

<wd l="1762" t="2136" r="2290" b="2294">recall.</wd>

</ln>

</para>

<para l="1435" t="2405" r="5818" b="10195" alignment="justified" spaceBefore="28" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="2405" r="5803" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="2405" r="1920" b="2563">Table</wd>

<space/>

<wd l="2059" t="2410" r="2160" b="2558">2</wd>

<space/>

<wd l="2314" t="2405" r="2832" b="2563">shows</wd>

<space/>

<wd l="2981" t="2405" r="3245" b="2563">the</wd>

<space/>

<wd l="3384" t="2405" r="3946" b="2563">results</wd>

<space/>

<wd l="4094" t="2405" r="4843" b="2563">obtained</wd>

<space/>

<wd l="4978" t="2405" r="5194" b="2606">by</wd>

<space/>

<wd l="5333" t="2405" r="5803" b="2606">using</wd>

<space/>

</ln>

<ln l="1440" t="2678" r="5798" b="2880" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="2678" r="2064" b="2837">models</wd>

<space/>

<wd l="2165" t="2678" r="2554" b="2837">with</wd>

<space/>

<wd l="2650" t="2678" r="2962" b="2837">and</wd>

<space/>

<wd l="3053" t="2678" r="3725" b="2837">without</wd>

<space/>

<wd l="3816" t="2678" r="4262" b="2837">word</wd>

<space/>

<wd l="4358" t="2678" r="5366" b="2880">embedding.</wd>

<space/>

<wd l="5563" t="2683" r="5798" b="2837">As</wd>

<space/>

</ln>

<ln l="1450" t="2947" r="5808" b="3149" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1450" t="2947" r="2006" b="3106">shown</wd>

<space/>

<wd l="2126" t="2947" r="2299" b="3101">in</wd>

<space/>

<wd l="2419" t="2947" r="2842" b="3106">table</wd>

<space/>

<wd l="2966" t="2952" r="3115" b="3134">2,</wd>

<space/>

<wd l="3264" t="2947" r="3821" b="3106">brown</wd>

<space/>

<wd l="3946" t="2947" r="4795" b="3149">clustering</wd>

<space/>

<wd l="4925" t="2947" r="5237" b="3106">and</wd>

<space/>

<wd l="5362" t="2947" r="5808" b="3106">word</wd>

<space/>

</ln>

<ln l="1445" t="3221" r="5794" b="3422" baseLine="3370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="3221" r="2405" b="3422">embedding</wd>

<space/>

<wd l="2510" t="3221" r="2914" b="3379">have</wd>

<space/>

<wd l="3014" t="3274" r="3110" b="3379">a</wd>

<space/>

<wd l="3211" t="3221" r="3643" b="3422">good</wd>

<space/>

<wd l="3749" t="3221" r="4234" b="3379">effect</wd>

<space/>

<wd l="4334" t="3274" r="4550" b="3379">on</wd>

<space/>

<wd l="4646" t="3221" r="5794" b="3422">performance.</wd>

<space/>

</ln>

<ln l="1440" t="3490" r="5808" b="3691" baseLine="3638">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="3490" r="1709" b="3643">All</wd>

<space/>

<wd l="1838" t="3514" r="2294" b="3691">types</wd>

<space/>

<wd l="2429" t="3490" r="2616" b="3648">of</wd>

<space/>

<wd l="2731" t="3490" r="3346" b="3648">entities</wd>

<space/>

<wd l="3480" t="3514" r="4046" b="3691">except</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="4166" t="3499" r="4680" b="3648">movie</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="4814" t="3490" r="5256" b="3648">show</wd>

<space/>

<wd l="5386" t="3542" r="5808" b="3648">error</wd>

<space/>

</run>

</ln>

<ln l="1440" t="3763" r="5808" b="3965" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="3763" r="2309" b="3922">reduction.</wd>

<space/>

<wd l="2467" t="3768" r="2770" b="3922">For</wd>

<space/>

<wd l="2851" t="3763" r="3898" b="3965">determining</wd>

<space/>

<wd l="3984" t="3763" r="4248" b="3922">the</wd>

<space/>

<wd l="4339" t="3763" r="5011" b="3965">efficacy</wd>

<space/>

<wd l="5102" t="3763" r="5290" b="3922">of</wd>

<space/>

<wd l="5362" t="3763" r="5808" b="3922">word</wd>

<space/>

</ln>

<ln l="1445" t="4032" r="5803" b="4234" baseLine="4181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="4032" r="2453" b="4234">embedding,</wd>

<space/>

<wd l="2568" t="4085" r="2822" b="4190">we</wd>

<space/>

<wd l="2918" t="4085" r="3662" b="4234">compare</wd>

<space/>

<wd l="3758" t="4032" r="4022" b="4190">the</wd>

<space/>

<wd l="4123" t="4085" r="4618" b="4190">errors</wd>

<space/>

<wd l="4718" t="4032" r="5448" b="4190">between</wd>

<space/>

<wd l="5539" t="4032" r="5803" b="4190">the</wd>

<space/>

</ln>

<ln l="1440" t="4301" r="5808" b="4502" baseLine="4454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="4301" r="2064" b="4459">models</wd>

<space/>

<wd l="2155" t="4301" r="2822" b="4459">without</wd>

<space/>

<wd l="2904" t="4301" r="3350" b="4459">word</wd>

<space/>

<wd l="3442" t="4301" r="4402" b="4502">embedding</wd>

<space/>

<wd l="4493" t="4301" r="4805" b="4459">and</wd>

<space/>

<wd l="4886" t="4301" r="5275" b="4459">with</wd>

<space/>

<wd l="5362" t="4301" r="5808" b="4459">word</wd>

<space/>

</ln>

<ln l="1445" t="4574" r="5798" b="4776" baseLine="4723" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="4574" r="2453" b="4776">embedding.</wd>

<space/>

<wd l="2597" t="4579" r="2880" b="4733">We</wd>

<space/>

<wd l="2962" t="4574" r="3298" b="4733">find</wd>

<space/>

<wd l="3374" t="4574" r="3701" b="4733">that</wd>

<space/>

<wd l="3778" t="4574" r="4224" b="4733">word</wd>

<space/>

<wd l="4306" t="4574" r="5266" b="4776">embedding</wd>

<space/>

<wd l="5347" t="4574" r="5798" b="4776">plays</wd>

<space/>

</ln>

<ln l="1445" t="4843" r="5818" b="5045" baseLine="4997" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="4896" r="1642" b="5002">an</wd>

<space/>

<wd l="1762" t="4843" r="2611" b="5045">important</wd>

<space/>

<wd l="2726" t="4843" r="3067" b="5002">role</wd>

<space/>

<wd l="3182" t="4843" r="3355" b="4997">in</wd>

<space/>

<wd l="3470" t="4843" r="4277" b="5045">resolving</wd>

<space/>

<wd l="4397" t="4843" r="4661" b="5002">the</wd>

<space/>

<wd l="4781" t="4843" r="5510" b="5045">problem</wd>

<space/>

<wd l="5630" t="4843" r="5818" b="5002">of</wd>

<space/>

</ln>

<ln l="1440" t="5117" r="5803" b="5318" baseLine="5266" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="5170" r="2050" b="5275">unseen</wd>

<space/>

<wd l="2126" t="5117" r="2573" b="5275">word</wd>

<space/>

<wd l="2664" t="5170" r="3528" b="5318">sequences</wd>

<space/>

<wd l="3624" t="5117" r="3936" b="5275">and</wd>

<space/>

<wd l="4013" t="5117" r="4277" b="5275">the</wd>

<space/>

<wd l="4358" t="5117" r="5088" b="5318">problem</wd>

<space/>

<wd l="5174" t="5117" r="5362" b="5275">of</wd>

<space/>

<wd l="5429" t="5141" r="5803" b="5318">type</wd>

<space/>

</ln>

<ln l="1445" t="5386" r="5808" b="5587" baseLine="5539" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="5386" r="2827" b="5587">disambiguation.</wd>

<space/>

<wd l="3034" t="5386" r="3475" b="5573">First,</wd>

<space/>

<wd l="3590" t="5386" r="3859" b="5544">the</wd>

<space/>

<wd l="3955" t="5386" r="4498" b="5544">model</wd>

<space/>

<wd l="4598" t="5386" r="5266" b="5544">without</wd>

<space/>

<wd l="5362" t="5386" r="5808" b="5544">word</wd>

<space/>

</ln>

<ln l="1445" t="5659" r="5813" b="5861" baseLine="5808">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1445" t="5659" r="2405" b="5861">embedding</wd>

<space/>

<wd l="2515" t="5659" r="2904" b="5818">does</wd>

<space/>

<wd l="3010" t="5683" r="3293" b="5818">not</wd>

<space/>

<wd l="3389" t="5659" r="3826" b="5818">learn</wd>

<space/>

<wd l="3931" t="5659" r="4416" b="5818">about</wd>

<space/>

<wd l="4517" t="5712" r="4714" b="5818">an</wd>

<space/>

<wd l="4824" t="5659" r="5314" b="5861">entity</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="5429" t="5659" r="5813" b="5861">ipad</wd>

<space/>

</run>

</ln>

<ln l="1435" t="5928" r="5803" b="6130" baseLine="6082">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1435" t="5938" r="1848" b="6086">Mini</wd>

<space/>

<wd l="1939" t="5938" r="2510" b="6086">Retina</wd>

<space/>

<wd l="2606" t="5928" r="2938" b="6086">2nd</wd>

<space/>

<wd l="3034" t="5933" r="4013" b="6086">Generation</wd>

<space/>

<wd l="4118" t="5928" r="4613" b="6086">16GB</wd>

<space/>

<wd l="4709" t="5933" r="5026" b="6130">wifi</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="5117" t="5928" r="5803" b="6086">because</wd>

<space/>

</run>

</ln>

<ln l="1450" t="6202" r="5803" b="6403" baseLine="6350" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1450" t="6254" r="1901" b="6360">some</wd>

<space/>

<wd l="1987" t="6202" r="2179" b="6360">of</wd>

<space/>

<wd l="2246" t="6202" r="2510" b="6360">the</wd>

<space/>

<wd l="2592" t="6202" r="3115" b="6360">words</wd>

<space/>

<wd l="3211" t="6202" r="3422" b="6360">do</wd>

<space/>

<wd l="3504" t="6226" r="3787" b="6360">not</wd>

<space/>

<wd l="3869" t="6254" r="4450" b="6403">appear</wd>

<space/>

<wd l="4526" t="6202" r="4699" b="6355">in</wd>

<space/>

<wd l="4781" t="6202" r="5045" b="6360">the</wd>

<space/>

<wd l="5126" t="6202" r="5803" b="6403">training</wd>

<space/>

</ln>

<ln l="1445" t="6470" r="5803" b="6672" baseLine="6624" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="6470" r="1848" b="6629">data.</wd>

<space/>

<wd l="1978" t="6475" r="2160" b="6624">In</wd>

<space/>

<wd l="2232" t="6494" r="2962" b="6658">contrast,</wd>

<space/>

<wd l="3048" t="6470" r="3317" b="6629">the</wd>

<space/>

<wd l="3389" t="6470" r="3931" b="6629">model</wd>

<space/>

<wd l="4003" t="6470" r="4392" b="6629">with</wd>

<space/>

<wd l="4469" t="6470" r="5429" b="6672">embedding</wd>

<space/>

<wd l="5506" t="6523" r="5803" b="6629">can</wd>

<space/>

</ln>

<ln l="1440" t="6744" r="5794" b="6946" baseLine="6893" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="6744" r="1872" b="6902">learn</wd>

<space/>

<wd l="1939" t="6797" r="2549" b="6902">unseen</wd>

<space/>

<wd l="2611" t="6744" r="3130" b="6902">words</wd>

<space/>

<wd l="3202" t="6744" r="3629" b="6902">from</wd>

<space/>

<wd l="3691" t="6744" r="3955" b="6902">the</wd>

<space/>

<wd l="4022" t="6744" r="4714" b="6902">induced</wd>

<space/>

<wd l="4776" t="6744" r="5222" b="6902">word</wd>

<space/>

<wd l="5285" t="6797" r="5794" b="6946">repre-</wd>

</ln>

<ln l="1450" t="7013" r="5803" b="7214" baseLine="7162" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1450" t="7013" r="2270" b="7171">sentation.</wd>

<space/>

<wd l="2362" t="7013" r="2741" b="7171">This</wd>

<space/>

<wd l="2808" t="7013" r="3264" b="7214">helps</wd>

<space/>

<wd l="3331" t="7013" r="3595" b="7171">the</wd>

<space/>

<wd l="3653" t="7013" r="4195" b="7171">model</wd>

<space/>

<wd l="4258" t="7037" r="4426" b="7171">to</wd>

<space/>

<wd l="4488" t="7013" r="5098" b="7214">predict</wd>

<space/>

<wd l="5150" t="7013" r="5482" b="7171">that</wd>

<space/>

<wd l="5539" t="7013" r="5803" b="7171">the</wd>

<space/>

</ln>

<ln l="1445" t="7282" r="5794" b="7483" baseLine="7435" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="7282" r="2875" b="7440">abovementioned</wd>

<space/>

<wd l="2952" t="7282" r="3442" b="7483">entity</wd>

<space/>

<wd l="3518" t="7282" r="4286" b="7440">indicates</wd>

<space/>

<wd l="4373" t="7334" r="4469" b="7440">a</wd>

<space/>

<wd l="4541" t="7282" r="5208" b="7483">product</wd>

<space/>

<wd l="5280" t="7334" r="5794" b="7440">name.</wd>

<space/>

</ln>

<ln l="1440" t="7555" r="5798" b="7757" baseLine="7704" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="7555" r="1781" b="7714">The</wd>

<space/>

<wd l="1906" t="7555" r="2448" b="7714">model</wd>

<space/>

<wd l="2578" t="7555" r="3245" b="7714">without</wd>

<space/>

<wd l="3370" t="7555" r="3816" b="7714">word</wd>

<space/>

<wd l="3946" t="7555" r="4906" b="7757">embedding</wd>

<space/>

<wd l="5040" t="7555" r="5386" b="7714">also</wd>

<space/>

<wd l="5515" t="7555" r="5798" b="7714">has</wd>

<space/>

</ln>

<ln l="1440" t="7824" r="5803" b="8026" baseLine="7978">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="7824" r="1704" b="7982">the</wd>

<space/>

<wd l="1781" t="7824" r="2510" b="8026">problem</wd>

<space/>

<wd l="2587" t="7824" r="2774" b="7982">of</wd>

<space/>

<wd l="2842" t="7824" r="4181" b="8026">disambiguation</wd>

<space/>

<wd l="4258" t="7824" r="4450" b="7982">of</wd>

<space/>

<wd l="4517" t="7877" r="4613" b="7982">a</wd>

<space/>

<wd l="4680" t="7824" r="5126" b="7982">word</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="5194" t="7824" r="5803" b="7982">Edison</wd>

<space/>

</run>

</ln>

<ln l="1440" t="8098" r="5808" b="8299" baseLine="8246" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="8098" r="2131" b="8256">because</wd>

<space/>

<wd l="2198" t="8098" r="2467" b="8256">the</wd>

<space/>

<wd l="2534" t="8098" r="3077" b="8256">model</wd>

<space/>

<wd l="3154" t="8098" r="3533" b="8299">only</wd>

<space/>

<wd l="3610" t="8098" r="4118" b="8256">learns</wd>

<space/>

<wd l="4195" t="8098" r="4526" b="8256">that</wd>

<space/>

<wd l="4594" t="8098" r="4901" b="8256">this</wd>

<space/>

<wd l="4978" t="8098" r="5424" b="8256">word</wd>

<space/>

<wd l="5496" t="8098" r="5630" b="8256">is</wd>

<space/>

<wd l="5712" t="8150" r="5808" b="8256">a</wd>

<space/>

</ln>

<ln l="1440" t="8366" r="5808" b="8568" baseLine="8520" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="8371" r="2160" b="8568">person’s</wd>

<space/>

<wd l="2246" t="8419" r="2717" b="8525">name</wd>

<space/>

<wd l="2798" t="8366" r="3226" b="8525">from</wd>

<space/>

<wd l="3302" t="8366" r="3571" b="8525">the</wd>

<space/>

<wd l="3653" t="8390" r="4565" b="8568">gazetteers.</wd>

<space/>

<wd l="4718" t="8371" r="5539" b="8554">However,</wd>

<space/>

<wd l="5635" t="8366" r="5808" b="8520">in</wd>

<space/>

</ln>

<ln l="1440" t="8640" r="5803" b="8842" baseLine="8789" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="8640" r="1704" b="8798">the</wd>

<space/>

<wd l="1781" t="8640" r="2232" b="8798">word</wd>

<space/>

<wd l="2314" t="8693" r="3101" b="8842">sequence</wd>

<space/>

<wd l="3182" t="8640" r="3883" b="8798">“Edison</wd>

<space/>

<wd l="3960" t="8640" r="4762" b="8798">#weather</wd>

<space/>

<wd l="4838" t="8693" r="5054" b="8798">on</wd>

<space/>

<wd l="5126" t="8645" r="5803" b="8842">January</wd>

<space/>

</ln>

<ln l="1464" t="8909" r="5794" b="9110" baseLine="9062">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1464" t="8909" r="1656" b="9067">16</wd>

<space/>

<wd l="1718" t="9038" r="1752" b="9096">,</wd>

<space/>

<wd l="1814" t="8909" r="2386" b="9096">2015”,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="2443" t="8909" r="3053" b="9067">Edison</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="3101" t="8909" r="3869" b="9067">indicates</wd>

<space/>

<wd l="3931" t="8962" r="4027" b="9067">a</wd>

<space/>

<wd l="4070" t="8933" r="4502" b="9067">town</wd>

<space/>

<wd l="4550" t="8909" r="4723" b="9062">in</wd>

<space/>

<wd l="4766" t="8914" r="5170" b="9067">New</wd>

<space/>

<wd l="5222" t="8914" r="5794" b="9110">Jersey.</wd>

<space/>

</run>

</ln>

<ln l="1440" t="9182" r="5808" b="9384" baseLine="9331" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9182" r="1781" b="9341">The</wd>

<space/>

<wd l="1906" t="9182" r="2448" b="9341">model</wd>

<space/>

<wd l="2578" t="9182" r="2966" b="9341">with</wd>

<space/>

<wd l="3091" t="9182" r="3538" b="9341">word</wd>

<space/>

<wd l="3672" t="9182" r="4632" b="9384">embedding</wd>

<space/>

<wd l="4762" t="9182" r="4901" b="9341">is</wd>

<space/>

<wd l="5035" t="9182" r="5808" b="9384">provided</wd>

<space/>

</ln>

<ln l="1445" t="9451" r="5803" b="9653" baseLine="9605" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="9451" r="2309" b="9610">additional</wd>

<space/>

<wd l="2424" t="9451" r="3456" b="9610">information</wd>

<space/>

<wd l="3566" t="9451" r="3782" b="9653">by</wd>

<space/>

<wd l="3898" t="9451" r="4166" b="9610">the</wd>

<space/>

<wd l="4277" t="9451" r="4723" b="9610">word</wd>

<space/>

<wd l="4838" t="9451" r="5803" b="9653">embedding</wd>

<space/>

</ln>

<ln l="1440" t="9725" r="5798" b="9926" baseLine="9874" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="9778" r="2088" b="9926">process</wd>

<space/>

<wd l="2160" t="9725" r="2472" b="9883">and</wd>

<space/>

<wd l="2534" t="9725" r="3216" b="9926">predicts</wd>

<space/>

<wd l="3288" t="9725" r="3552" b="9883">the</wd>

<space/>

<wd l="3624" t="9725" r="5054" b="9883">abovementioned</wd>

<space/>

<wd l="5117" t="9725" r="5563" b="9883">word</wd>

<space/>

<wd l="5630" t="9778" r="5798" b="9883">as</wd>

<space/>

</ln>

<ln l="1440" t="9994" r="2952" b="10195" baseLine="10142">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="9994" r="2093" b="10195">geo-loc</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="2150" t="9994" r="2952" b="10195">correctly.</wd>

</run>

</ln>

</para>

<para l="1445" t="10709" r="2938" b="10882" alignment="left" spaceBefore="464" lsp="exactly" lspExact="273" language="en">

<ln l="1445" t="10709" r="2938" b="10882" baseLine="10877" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="12">

<wd l="1445" t="10709" r="1555" b="10882">6</wd>

<space/>

<wd l="1810" t="10709" r="2938" b="10882">Conclusion</wd>

</ln>

</para>

<para l="1440" t="11126" r="5808" b="13229" alignment="justified" spaceBefore="136" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="11126" r="5798" b="11328" baseLine="11280" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11131" r="1622" b="11280">In</wd>

<space/>

<wd l="1699" t="11126" r="2006" b="11285">this</wd>

<space/>

<wd l="2088" t="11179" r="2606" b="11328">paper,</wd>

<space/>

<wd l="2702" t="11179" r="2952" b="11285">we</wd>

<space/>

<wd l="3034" t="11126" r="3869" b="11285">described</wd>

<space/>

<wd l="3941" t="11126" r="4210" b="11285">the</wd>

<space/>

<wd l="4291" t="11126" r="4651" b="11285">data</wd>

<space/>

<wd l="4728" t="11126" r="5040" b="11285">and</wd>

<space/>

<wd l="5117" t="11126" r="5798" b="11285">features</wd>

<space/>

</ln>

<ln l="1440" t="11400" r="5798" b="11602" baseLine="11549" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11400" r="1843" b="11558">used</wd>

<space/>

<wd l="1901" t="11400" r="2160" b="11558">for</wd>

<space/>

<wd l="2222" t="11400" r="3139" b="11602">generating</wd>

<space/>

<wd l="3206" t="11453" r="3499" b="11558">our</wd>

<space/>

<wd l="3557" t="11400" r="4147" b="11558">model.</wd>

<space/>

<wd l="4248" t="11400" r="4920" b="11558">Besides</wd>

<space/>

<wd l="4992" t="11405" r="5381" b="11558">POS</wd>

<space/>

<wd l="5453" t="11424" r="5798" b="11602">tags</wd>

<space/>

</ln>

<ln l="1445" t="11669" r="5808" b="11870" baseLine="11822" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="11669" r="1757" b="11827">and</wd>

<space/>

<wd l="1858" t="11669" r="2386" b="11827">chunk</wd>

<space/>

<wd l="2477" t="11693" r="2875" b="11870">tags,</wd>

<space/>

<wd l="2990" t="11722" r="3245" b="11827">we</wd>

<space/>

<wd l="3341" t="11669" r="3744" b="11827">used</wd>

<space/>

<wd l="3840" t="11722" r="3936" b="11827">a</wd>

<space/>

<wd l="4027" t="11669" r="4474" b="11827">word</wd>

<space/>

<wd l="4570" t="11669" r="5808" b="11870">representation</wd>

<space/>

</ln>

<ln l="1440" t="11942" r="5794" b="12144" baseLine="12091" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11942" r="1939" b="12101">based</wd>

<space/>

<wd l="2011" t="11995" r="2227" b="12101">on</wd>

<space/>

<wd l="2299" t="11947" r="2741" b="12101">CCA</wd>

<space/>

<wd l="2813" t="11942" r="3067" b="12101">for</wd>

<space/>

<wd l="3134" t="11942" r="4037" b="12144">improving</wd>

<space/>

<wd l="4109" t="11942" r="4373" b="12101">the</wd>

<space/>

<wd l="4445" t="11942" r="5126" b="12101">model’s</wd>

<space/>

<wd l="5203" t="11942" r="5794" b="12144">perfor-</wd>

</ln>

<ln l="1440" t="12211" r="5794" b="12370" baseLine="12365" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12264" r="2054" b="12370">mance.</wd>

<space/>

<wd l="2251" t="12216" r="2592" b="12370">Our</wd>

<space/>

<wd l="2683" t="12211" r="3062" b="12370">final</wd>

<space/>

<wd l="3158" t="12211" r="3701" b="12370">model</wd>

<space/>

<wd l="3806" t="12211" r="4330" b="12370">shows</wd>

<space/>

<wd l="4435" t="12264" r="4637" b="12370">an</wd>

<space/>

<wd l="4738" t="12264" r="5160" b="12370">error</wd>

<space/>

<wd l="5246" t="12211" r="5794" b="12370">reduc-</wd>

</ln>

<ln l="1440" t="12485" r="5803" b="12686" baseLine="12634" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12485" r="1781" b="12643">tion</wd>

<space/>

<wd l="1843" t="12485" r="2030" b="12643">of</wd>

<space/>

<wd l="2098" t="12490" r="2736" b="12643">14.08%</wd>

<space/>

<wd l="2803" t="12485" r="3230" b="12643">from</wd>

<space/>

<wd l="3283" t="12485" r="3547" b="12643">the</wd>

<space/>

<wd l="3605" t="12485" r="4320" b="12643">baseline</wd>

<space/>

<wd l="4387" t="12509" r="5026" b="12686">system.</wd>

<space/>

<wd l="5112" t="12490" r="5395" b="12643">We</wd>

<space/>

<wd l="5458" t="12485" r="5803" b="12643">also</wd>

<space/>

</ln>

<ln l="1440" t="12754" r="5794" b="12955" baseLine="12907" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12754" r="2275" b="12955">presented</wd>

<space/>

<wd l="2333" t="12806" r="2784" b="12912">some</wd>

<space/>

<wd l="2827" t="12754" r="3518" b="12955">primary</wd>

<space/>

<wd l="3571" t="12754" r="3883" b="12912">and</wd>

<space/>

<wd l="3926" t="12754" r="5280" b="12955">Twitter-specific</wd>

<space/>

<wd l="5333" t="12754" r="5794" b="12955">prob-</wd>

</ln>

<ln l="1440" t="13027" r="3859" b="13229" baseLine="13176" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13027" r="1843" b="13186">lems</wd>

<space/>

<wd l="1906" t="13027" r="2122" b="13229">by</wd>

<space/>

<wd l="2184" t="13027" r="3250" b="13229">categorizing</wd>

<space/>

<wd l="3312" t="13080" r="3859" b="13186">errors.</wd>

</ln>

</para>

<para l="1445" t="13728" r="2544" b="13901" alignment="left" spaceBefore="445" lsp="exactly" lspExact="273" language="en">

<ln l="1445" t="13728" r="2544" b="13901" baseLine="13891" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="13728" r="2544" b="13901">References</wd>

</ln>

</para>

<para l="1440" t="14093" r="5803" b="14938" alignment="justified" li="216" spaceBefore="110" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="14093" r="5798" b="14280" baseLine="14232" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="14098" r="1882" b="14237">Tasos</wd>

<space/>

<wd l="1934" t="14093" r="2971" b="14261">Anastasakos,</wd>

<space/>

<wd l="3024" t="14098" r="3998" b="14280">Young-Bum</wd>

<space/>

<wd l="4046" t="14093" r="4435" b="14261">Kim,</wd>

<space/>

<wd l="4493" t="14093" r="4776" b="14237">and</wd>

<space/>

<wd l="4819" t="14098" r="5362" b="14275">Anoop</wd>

<space/>

<wd l="5405" t="14098" r="5798" b="14237">Deo-</wd>

</ln>

<ln l="1656" t="14314" r="5798" b="14496" baseLine="14453" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="14357" r="1930" b="14458">ras.</wd>

<space/>

<wd l="2040" t="14314" r="2472" b="14458">2014.</wd>

<space/>

<wd l="2578" t="14314" r="2947" b="14458">Task</wd>

<space/>

<wd l="3014" t="14314" r="3610" b="14496">specific</wd>

<space/>

<wd l="3672" t="14314" r="4536" b="14458">continuous</wd>

<space/>

<wd l="4598" t="14314" r="5011" b="14458">word</wd>

<space/>

<wd l="5064" t="14357" r="5798" b="14496">represen-</wd>

</ln>

<ln l="1656" t="14534" r="5803" b="14722" baseLine="14669" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="14534" r="2184" b="14678">tations</wd>

<space/>

<wd l="2242" t="14534" r="2477" b="14678">for</wd>

<space/>

<wd l="2530" t="14578" r="2981" b="14678">mono</wd>

<space/>

<wd l="3038" t="14534" r="3326" b="14678">and</wd>

<space/>

<wd l="3374" t="14534" r="4416" b="14722">multi-lingual</wd>

<space/>

<wd l="4478" t="14534" r="5035" b="14717">spoken</wd>

<space/>

<wd l="5088" t="14534" r="5803" b="14722">language</wd>

<space/>

</ln>

<ln l="1656" t="14750" r="5794" b="14938" baseLine="14890">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1656" t="14750" r="2827" b="14938">understanding.</wd>

<space/>

<wd l="2909" t="14755" r="3077" b="14890">In</wd>

<space/>

</run>

<wd l="3110" t="14755" r="3802" b="14918"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">ICASSP</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="3845" t="14794" r="4296" b="14938">pages</wd>

<space/>

<wd l="4344" t="14750" r="5275" b="14894">3246–3250.</wd>

<space/>

<wd l="5323" t="14755" r="5794" b="14894">IEEE.</wd>

</run>

</ln>

</para>

<para l="1440" t="15120" r="5794" b="15307" alignment="justified" spaceBefore="142" lsp="exactly" lspExact="222" language="en">

<ln l="1440" t="15120" r="5794" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1440" t="15120" r="1901" b="15264">Johan</wd>

<space/>

<wd l="1978" t="15120" r="2549" b="15288">Bollen,</wd>

<space/>

<wd l="2635" t="15120" r="3125" b="15264">Huina</wd>

<space/>

<wd l="3192" t="15125" r="3600" b="15288">Mao,</wd>

<space/>

<wd l="3691" t="15120" r="3974" b="15264">and</wd>

<space/>

<wd l="4042" t="15120" r="4685" b="15307">Xiaojun</wd>

<space/>

<wd l="4757" t="15125" r="5203" b="15307">Zeng.</wd>

<space/>

<wd l="5362" t="15120" r="5794" b="15264">2011.</wd>

</ln>

</para>

</column>

<column l="6144" t="1263" r="10546" b="15315">

<para l="6365" t="1334" r="10541" b="1738" alignment="justified" li="216" spaceBefore="44" lsp="exactly" lspExact="220" language="en">

<ln l="6365" t="1334" r="10541" b="1517" baseLine="1474">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="1334" r="6936" b="1478">Twitter</wd>

<space/>

<wd l="6994" t="1334" r="7450" b="1478">mood</wd>

<space/>

<wd l="7507" t="1334" r="8131" b="1517">predicts</wd>

<space/>

<wd l="8198" t="1334" r="8438" b="1478">the</wd>

<space/>

<wd l="8510" t="1334" r="8923" b="1478">stock</wd>

<space/>

<wd l="8981" t="1334" r="9571" b="1478">market.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9677" t="1334" r="10301" b="1478">Journal</wd>

<space/>

<wd l="10358" t="1334" r="10541" b="1517">of</wd>

<space/>

</run>

</ln>

<ln l="6374" t="1555" r="9043" b="1738" baseLine="1694">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="1555" r="7560" b="1738">Computational</wd>

<space/>

</run>

<wd l="7608" t="1560" r="8261" b="1723"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Science</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8323" t="1555" r="9043" b="1733">2(1):1–8.</wd>

</run>

</ln>

</para>

<para l="6144" t="2011" r="10502" b="2851" alignment="justified" li="216" spaceBefore="229" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="2011" r="10502" b="2179" baseLine="2146" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2016" r="6557" b="2155">Peter</wd>

<space/>

<wd l="6638" t="2016" r="6749" b="2150">F</wd>

<space/>

<wd l="6835" t="2016" r="7416" b="2179">Brown,</wd>

<space/>

<wd l="7512" t="2016" r="7925" b="2155">Peter</wd>

<space/>

<wd l="8006" t="2016" r="8146" b="2155">V</wd>

<space/>

<wd l="8232" t="2016" r="8962" b="2179">Desouza,</wd>

<space/>

<wd l="9062" t="2011" r="9605" b="2155">Robert</wd>

<space/>

<wd l="9686" t="2016" r="9806" b="2150">L</wd>

<space/>

<wd l="9893" t="2016" r="10502" b="2179">Mercer,</wd>

<space/>

</ln>

<ln l="6365" t="2232" r="10498" b="2400" baseLine="2366" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="2232" r="6984" b="2376">Vincent</wd>

<space/>

<wd l="7066" t="2237" r="7142" b="2376">J</wd>

<space/>

<wd l="7229" t="2232" r="7661" b="2376">Della</wd>

<space/>

<wd l="7742" t="2232" r="8251" b="2400">Pietra,</wd>

<space/>

<wd l="8357" t="2232" r="8640" b="2376">and</wd>

<space/>

<wd l="8722" t="2232" r="9264" b="2376">Jenifer</wd>

<space/>

<wd l="9355" t="2232" r="9480" b="2376">C</wd>

<space/>

<wd l="9566" t="2232" r="9869" b="2376">Lai.</wd>

<space/>

<wd l="10080" t="2232" r="10498" b="2376">1992.</wd>

<space/>

</ln>

<ln l="6370" t="2448" r="10498" b="2635" baseLine="2587" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="2448" r="7315" b="2592">Class-based</wd>

<space/>

<wd l="7426" t="2491" r="8006" b="2635">n-gram</wd>

<space/>

<wd l="8112" t="2448" r="8683" b="2592">models</wd>

<space/>

<wd l="8803" t="2448" r="8976" b="2592">of</wd>

<space/>

<wd l="9077" t="2448" r="9629" b="2592">natural</wd>

<space/>

<wd l="9744" t="2448" r="10498" b="2635">language.</wd>

<space/>

</ln>

<ln l="6374" t="2669" r="9749" b="2851" baseLine="2803">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="2669" r="7560" b="2851">Computational</wd>

<space/>

</run>

<wd l="7613" t="2669" r="8472" b="2851"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">linguistics</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8549" t="2669" r="9749" b="2846">18(4):467–479.</wd>

</run>

</ln>

</para>

<para l="6144" t="3125" r="10512" b="4406" alignment="justified" li="216" spaceBefore="231" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="3125" r="10502" b="3312" baseLine="3259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3125" r="6797" b="3269">Michael</wd>

<space/>

<wd l="6864" t="3125" r="7474" b="3269">Collins.</wd>

<space/>

<wd l="7589" t="3125" r="8021" b="3269">2002.</wd>

<space/>

<wd l="8131" t="3125" r="9307" b="3269">Discriminative</wd>

<space/>

<wd l="9370" t="3125" r="9984" b="3312">training</wd>

<space/>

<wd l="10046" t="3125" r="10502" b="3269">meth-</wd>

</ln>

<ln l="6370" t="3341" r="10502" b="3528" baseLine="3480" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="3341" r="6634" b="3485">ods</wd>

<space/>

<wd l="6706" t="3341" r="6941" b="3485">for</wd>

<space/>

<wd l="7008" t="3341" r="7550" b="3485">hidden</wd>

<space/>

<wd l="7618" t="3341" r="8218" b="3485">markov</wd>

<space/>

<wd l="8285" t="3341" r="8899" b="3485">models:</wd>

<space/>

<wd l="9014" t="3341" r="9586" b="3528">Theory</wd>

<space/>

<wd l="9658" t="3341" r="9946" b="3485">and</wd>

<space/>

<wd l="10013" t="3384" r="10502" b="3523">exper-</wd>

</ln>

<ln l="6365" t="3562" r="10512" b="3749" baseLine="3696">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="3562" r="6888" b="3706">iments</wd>

<space/>

<wd l="6955" t="3562" r="7310" b="3706">with</wd>

<space/>

<wd l="7373" t="3581" r="8227" b="3744">perceptron</wd>

<space/>

<wd l="8290" t="3562" r="9178" b="3749">algorithms.</wd>

<space/>

<wd l="9298" t="3566" r="9466" b="3701">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9523" t="3562" r="10512" b="3744">Proceedings</wd>

<space/>

</run>

</ln>

<ln l="6370" t="3782" r="10507" b="3965" baseLine="3917" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="3782" r="6552" b="3965">of</wd>

<space/>

<wd l="6586" t="3782" r="6826" b="3926">the</wd>

<space/>

<wd l="6874" t="3782" r="7507" b="3926">ACL-02</wd>

<space/>

<wd l="7579" t="3782" r="8443" b="3965">conference</wd>

<space/>

<wd l="8510" t="3830" r="8702" b="3926">on</wd>

<space/>

<wd l="8765" t="3782" r="9566" b="3965">Empirical</wd>

<space/>

<wd l="9629" t="3782" r="10291" b="3926">methods</wd>

<space/>

<wd l="10363" t="3787" r="10507" b="3926">in</wd>

<space/>

</ln>

<ln l="6365" t="3998" r="10498" b="4186" baseLine="4138">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="3998" r="6950" b="4142">natural</wd>

<space/>

<wd l="7003" t="3998" r="7738" b="4181">language</wd>

<space/>

<wd l="7771" t="3998" r="9298" b="4181">processing-Volume</wd>

<space/>

</run>

<wd l="9360" t="3998" r="9595" b="4166"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">10</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9658" t="4042" r="10104" b="4186">pages</wd>

<space/>

<wd l="10181" t="3998" r="10498" b="4142">1–8.</wd>

<space/>

</run>

</ln>

<ln l="6365" t="4219" r="9797" b="4406" baseLine="4354" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="4219" r="7306" b="4363">Association</wd>

<space/>

<wd l="7354" t="4219" r="7589" b="4363">for</wd>

<space/>

<wd l="7642" t="4219" r="8818" b="4402">Computational</wd>

<space/>

<wd l="8870" t="4219" r="9797" b="4406">Linguistics.</wd>

</ln>

</para>

<para l="6144" t="4675" r="10522" b="5078" alignment="justified" li="216" spaceBefore="236" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="4675" r="10522" b="4862" baseLine="4810" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4675" r="6701" b="4819">Harold</wd>

<space/>

<wd l="6749" t="4675" r="7536" b="4862">Hotelling.</wd>

<space/>

<wd l="7642" t="4675" r="8059" b="4819">1936.</wd>

<space/>

<wd l="8141" t="4675" r="8890" b="4819">Relations</wd>

<space/>

<wd l="8942" t="4675" r="9605" b="4819">between</wd>

<space/>

<wd l="9653" t="4694" r="9946" b="4819">two</wd>

<space/>

<wd l="10008" t="4694" r="10291" b="4819">sets</wd>

<space/>

<wd l="10349" t="4675" r="10522" b="4819">of</wd>

<space/>

</ln>

<ln l="6365" t="4891" r="9326" b="5078" baseLine="5030">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="4891" r="7018" b="5035">variates.</wd>

<space/>

</run>

<wd l="7094" t="4891" r="8030" b="5059"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Biometrika</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8083" t="4934" r="8534" b="5078">pages</wd>

<space/>

<wd l="8592" t="4891" r="9326" b="5035">321–377.</wd>

</run>

</ln>

</para>

<para l="6144" t="5347" r="10512" b="6192" alignment="justified" li="216" spaceBefore="229" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="5347" r="10502" b="5534" baseLine="5482" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5352" r="7123" b="5534">Young-Bum</wd>

<space/>

<wd l="7166" t="5347" r="7522" b="5486">Kim</wd>

<space/>

<wd l="7565" t="5347" r="7848" b="5491">and</wd>

<space/>

<wd l="7891" t="5347" r="8669" b="5534">Benjamin</wd>

<space/>

<wd l="8712" t="5347" r="9298" b="5534">Snyder.</wd>

<space/>

<wd l="9389" t="5347" r="9821" b="5491">2012.</wd>

<space/>

<wd l="9902" t="5347" r="10502" b="5491">Univer-</wd>

</ln>

<ln l="6374" t="5568" r="10502" b="5755" baseLine="5702" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6374" t="5568" r="6581" b="5712">sal</wd>

<space/>

<wd l="6672" t="5568" r="8467" b="5755">grapheme-to-phoneme</wd>

<space/>

<wd l="8549" t="5568" r="9360" b="5750">prediction</wd>

<space/>

<wd l="9442" t="5611" r="9787" b="5712">over</wd>

<space/>

<wd l="9864" t="5568" r="10224" b="5712">latin</wd>

<space/>

<wd l="10306" t="5568" r="10502" b="5712">al-</wd>

</ln>

<ln l="6365" t="5784" r="10512" b="5971" baseLine="5923">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="5784" r="7013" b="5966">phabets.</wd>

<space/>

<wd l="7186" t="5789" r="7354" b="5923">In</wd>

<space/>

</run>

<wd l="7426" t="5789" r="8126" b="5952"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">EMNLP</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="8213" t="5827" r="8659" b="5971">pages</wd>

<space/>

<wd l="8750" t="5784" r="9480" b="5928">332–343.</wd>

<space/>

<wd l="9571" t="5784" r="10512" b="5928">Association</wd>

<space/>

</run>

</ln>

<ln l="6365" t="6005" r="8803" b="6192" baseLine="6139" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="6005" r="6595" b="6149">for</wd>

<space/>

<wd l="6653" t="6005" r="7829" b="6187">Computational</wd>

<space/>

<wd l="7882" t="6005" r="8803" b="6192">Linguistics.</wd>

</ln>

</para>

<para l="6144" t="6461" r="10507" b="7478" alignment="justified" li="216" spaceBefore="235" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="6461" r="10502" b="6648" baseLine="6595" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6466" r="7123" b="6648">Young-Bum</wd>

<space/>

<wd l="7181" t="6461" r="7536" b="6600">Kim</wd>

<space/>

<wd l="7594" t="6461" r="7877" b="6605">and</wd>

<space/>

<wd l="7934" t="6461" r="8707" b="6648">Benjamin</wd>

<space/>

<wd l="8770" t="6461" r="9355" b="6648">Snyder.</wd>

<space/>

<wd l="9466" t="6461" r="9984" b="6605">2013a.</wd>

<space/>

<wd l="10094" t="6461" r="10502" b="6643">Opti-</wd>

</ln>

<ln l="6365" t="6677" r="10502" b="6864" baseLine="6816" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="6677" r="6662" b="6821">mal</wd>

<space/>

<wd l="6720" t="6677" r="7051" b="6821">data</wd>

<space/>

<wd l="7114" t="6696" r="7325" b="6821">set</wd>

<space/>

<wd l="7387" t="6677" r="8126" b="6821">selection:</wd>

<space/>

<wd l="8213" t="6682" r="8458" b="6816">An</wd>

<space/>

<wd l="8515" t="6677" r="9398" b="6859">application</wd>

<space/>

<wd l="9451" t="6696" r="9600" b="6821">to</wd>

<space/>

<wd l="9662" t="6677" r="10502" b="6864">grapheme-</wd>

</ln>

<ln l="6365" t="6898" r="10507" b="7085" baseLine="7032">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="6898" r="7315" b="7080">to-phoneme</wd>

<space/>

<wd l="7430" t="6898" r="8328" b="7042">conversion.</wd>

<space/>

<wd l="8602" t="6902" r="8770" b="7037">In</wd>

<space/>

</run>

<wd l="8870" t="6902" r="9941" b="7066"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">HLT-NAACL</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="10056" t="6941" r="10507" b="7085">pages</wd>

<space/>

</run>

</ln>

<ln l="6384" t="7118" r="10502" b="7306" baseLine="7253" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="7118" r="7301" b="7262">1196–1205.</wd>

<space/>

<wd l="7354" t="7118" r="8294" b="7262">Association</wd>

<space/>

<wd l="8333" t="7118" r="8568" b="7262">for</wd>

<space/>

<wd l="8616" t="7118" r="9792" b="7301">Computational</wd>

<space/>

<wd l="9835" t="7118" r="10502" b="7306">Linguis-</wd>

</ln>

<ln l="6365" t="7334" r="6677" b="7478" baseLine="7474" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="7334" r="6677" b="7478">tics.</wd>

</ln>

</para>

<para l="6144" t="7790" r="10507" b="8414" alignment="justified" li="216" spaceBefore="232" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="7790" r="10502" b="7978" baseLine="7925" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="7795" r="7123" b="7978">Young-Bum</wd>

<space/>

<wd l="7176" t="7790" r="7526" b="7930">Kim</wd>

<space/>

<wd l="7579" t="7790" r="7862" b="7934">and</wd>

<space/>

<wd l="7910" t="7790" r="8688" b="7978">Benjamin</wd>

<space/>

<wd l="8741" t="7790" r="9326" b="7978">Snyder.</wd>

<space/>

<wd l="9418" t="7790" r="9941" b="7934">2013b.</wd>

<space/>

<wd l="10022" t="7795" r="10502" b="7934">Unsu-</wd>

</ln>

<ln l="6365" t="8011" r="10507" b="8194" baseLine="8146" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6365" t="8011" r="7042" b="8194">pervised</wd>

<space/>

<wd l="7104" t="8011" r="8448" b="8155">consonant-vowel</wd>

<space/>

<wd l="8506" t="8011" r="9317" b="8194">prediction</wd>

<space/>

<wd l="9379" t="8054" r="9725" b="8155">over</wd>

<space/>

<wd l="9782" t="8011" r="10507" b="8155">hundreds</wd>

<space/>

</ln>

<ln l="6370" t="8227" r="9893" b="8414" baseLine="8366">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6370" t="8227" r="6542" b="8371">of</wd>

<space/>

<wd l="6581" t="8227" r="7416" b="8414">languages.</wd>

<space/>

<wd l="7498" t="8232" r="7666" b="8366">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7699" t="8232" r="8078" b="8371">ACL</wd>

<space/>

</run>

<wd l="8126" t="8227" r="8400" b="8405"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">(1)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="8453" t="8270" r="8904" b="8414">pages</wd>

<space/>

<wd l="8976" t="8227" r="9893" b="8371">1527–1536.</wd>

</run>

</ln>

</para>

<para l="6144" t="8683" r="10507" b="9749" alignment="justified" li="216" spaceBefore="230" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="8683" r="10502" b="8870" baseLine="8818" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8688" r="7123" b="8870">Young-Bum</wd>

<space/>

<wd l="7195" t="8683" r="7589" b="8851">Kim,</wd>

<space/>

<wd l="7675" t="8688" r="8453" b="8827">Heemoon</wd>

<space/>

<wd l="8530" t="8683" r="8976" b="8851">Chae,</wd>

<space/>

<wd l="9058" t="8683" r="9835" b="8870">Benjamin</wd>

<space/>

<wd l="9912" t="8683" r="10502" b="8870">Snyder,</wd>

<space/>

</ln>

<ln l="6370" t="8904" r="10507" b="9091" baseLine="9038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="8904" r="6653" b="9048">and</wd>

<space/>

<wd l="6739" t="8904" r="7421" b="9086">Yu-Seop</wd>

<space/>

<wd l="7517" t="8904" r="7906" b="9048">Kim.</wd>

<space/>

<wd l="8112" t="8904" r="8544" b="9048">2014.</wd>

<space/>

<wd l="8746" t="8904" r="9418" b="9091">Training</wd>

<space/>

<wd l="9514" t="8947" r="9600" b="9048">a</wd>

<space/>

<wd l="9686" t="8904" r="10219" b="9048">korean</wd>

<space/>

<wd l="10320" t="8904" r="10507" b="9048">srl</wd>

<space/>

</ln>

<ln l="6374" t="9120" r="10502" b="9307" baseLine="9259">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="9139" r="6922" b="9307">system</wd>

<space/>

<wd l="6989" t="9120" r="7344" b="9264">with</wd>

<space/>

<wd l="7416" t="9120" r="7728" b="9264">rich</wd>

<space/>

<wd l="7800" t="9120" r="8962" b="9307">morphological</wd>

<space/>

<wd l="9034" t="9120" r="9706" b="9264">features.</wd>

<space/>

<wd l="9864" t="9125" r="10032" b="9259">In</wd>

<space/>

</run>

<wd l="10090" t="9125" r="10502" b="9288"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ACL</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="6365" t="9341" r="10502" b="9528" baseLine="9475" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="9384" r="6811" b="9528">pages</wd>

<space/>

<wd l="6874" t="9341" r="7603" b="9485">637–642.</wd>

<space/>

<wd l="7661" t="9341" r="8606" b="9485">Association</wd>

<space/>

<wd l="8654" t="9341" r="8885" b="9485">for</wd>

<space/>

<wd l="8938" t="9341" r="10118" b="9523">Computational</wd>

<space/>

<wd l="10166" t="9341" r="10502" b="9480">Lin-</wd>

</ln>

<ln l="6370" t="9562" r="7013" b="9749" baseLine="9696" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="9562" r="7013" b="9749">guistics.</wd>

</ln>

</para>

<para l="6144" t="10013" r="10512" b="11078" alignment="justified" li="216" spaceBefore="230" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="10013" r="10512" b="10200" baseLine="10152" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10018" r="7123" b="10200">Young-Bum</wd>

<space/>

<wd l="7214" t="10013" r="7603" b="10181">Kim,</wd>

<space/>

<wd l="7709" t="10013" r="8376" b="10157">Minwoo</wd>

<space/>

<wd l="8467" t="10018" r="8976" b="10200">Jeong,</wd>

<space/>

<wd l="9086" t="10013" r="9432" b="10157">Karl</wd>

<space/>

<wd l="9528" t="10013" r="10118" b="10181">Stratos,</wd>

<space/>

<wd l="10229" t="10013" r="10512" b="10157">and</wd>

<space/>

</ln>

<ln l="6365" t="10234" r="10512" b="10421" baseLine="10368" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="10234" r="6749" b="10378">Ruhi</wd>

<space/>

<wd l="6854" t="10234" r="7584" b="10421">Sarikaya.</wd>

<space/>

<wd l="7819" t="10234" r="8342" b="10378">2015a.</wd>

<space/>

<wd l="8573" t="10234" r="9173" b="10421">Weakly</wd>

<space/>

<wd l="9283" t="10234" r="10128" b="10416">supervised</wd>

<space/>

<wd l="10234" t="10234" r="10512" b="10378">slot</wd>

<space/>

</ln>

<ln l="6365" t="10454" r="10507" b="10642" baseLine="10589" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="10454" r="6960" b="10642">tagging</wd>

<space/>

<wd l="7032" t="10454" r="7387" b="10598">with</wd>

<space/>

<wd l="7459" t="10454" r="8117" b="10642">partially</wd>

<space/>

<wd l="8194" t="10454" r="8770" b="10598">labeled</wd>

<space/>

<wd l="8851" t="10498" r="9643" b="10637">sequences</wd>

<space/>

<wd l="9720" t="10454" r="10109" b="10598">from</wd>

<space/>

<wd l="10181" t="10454" r="10507" b="10598">web</wd>

<space/>

</ln>

<ln l="6374" t="10670" r="10502" b="10858" baseLine="10810">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="10670" r="6874" b="10814">search</wd>

<space/>

<wd l="6922" t="10670" r="7306" b="10814">click</wd>

<space/>

<wd l="7349" t="10670" r="7718" b="10858">logs.</wd>

<space/>

<wd l="7805" t="10675" r="7973" b="10810">In</wd>

<space/>

</run>

<wd l="8011" t="10675" r="9082" b="10838"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">HLT-NAACL</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9130" t="10714" r="9581" b="10858">pages</wd>

<space/>

<wd l="9638" t="10670" r="10166" b="10814">84–92.</wd>

<space/>

<wd l="10224" t="10675" r="10502" b="10814">As-</wd>

</run>

</ln>

<ln l="6374" t="10891" r="9576" b="11078" baseLine="11026" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="10891" r="7085" b="11035">sociation</wd>

<space/>

<wd l="7133" t="10891" r="7368" b="11035">for</wd>

<space/>

<wd l="7421" t="10891" r="8597" b="11074">Computational</wd>

<space/>

<wd l="8650" t="10891" r="9576" b="11078">Linguistics.</wd>

</ln>

</para>

<para l="6144" t="11347" r="10512" b="12192" alignment="justified" li="216" spaceBefore="233" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="11347" r="10507" b="11534" baseLine="11482" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11352" r="7123" b="11534">Young-Bum</wd>

<space/>

<wd l="7186" t="11347" r="7579" b="11515">Kim,</wd>

<space/>

<wd l="7656" t="11347" r="8002" b="11491">Karl</wd>

<space/>

<wd l="8069" t="11347" r="8664" b="11515">Stratos,</wd>

<space/>

<wd l="8736" t="11347" r="9317" b="11491">Xiaohu</wd>

<space/>

<wd l="9384" t="11347" r="9701" b="11515">Liu,</wd>

<space/>

<wd l="9778" t="11347" r="10061" b="11491">and</wd>

<space/>

<wd l="10123" t="11347" r="10507" b="11491">Ruhi</wd>

<space/>

</ln>

<ln l="6370" t="11563" r="10512" b="11750" baseLine="11702" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="11563" r="7099" b="11750">Sarikaya.</wd>

<space/>

<wd l="7258" t="11563" r="7781" b="11707">2015b.</wd>

<space/>

<wd l="7934" t="11563" r="8654" b="11746">Compact</wd>

<space/>

<wd l="8722" t="11563" r="9307" b="11707">lexicon</wd>

<space/>

<wd l="9389" t="11563" r="10085" b="11707">selection</wd>

<space/>

<wd l="10157" t="11563" r="10512" b="11707">with</wd>

<space/>

</ln>

<ln l="6374" t="11784" r="10502" b="11966" baseLine="11918">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="11784" r="6979" b="11966">spectral</wd>

<space/>

<wd l="7042" t="11784" r="7757" b="11928">methods.</wd>

<space/>

<wd l="7872" t="11789" r="8040" b="11923">In</wd>

<space/>

</run>

<wd l="8083" t="11789" r="8496" b="11928"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ACL</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8563" t="11784" r="9509" b="11928">Association</wd>

<space/>

<wd l="9566" t="11784" r="9797" b="11928">for</wd>

<space/>

<wd l="9864" t="11784" r="10502" b="11966">Compu-</wd>

</run>

</ln>

<ln l="6365" t="12005" r="7934" b="12192" baseLine="12139" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="12005" r="6960" b="12149">tational</wd>

<space/>

<wd l="7013" t="12005" r="7934" b="12192">Linguistics.</wd>

</ln>

</para>

<para l="6144" t="12456" r="10498" b="13085" alignment="justified" li="216" spaceBefore="233" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="12456" r="10498" b="12643" baseLine="12595" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12461" r="7123" b="12643">Young-Bum</wd>

<space/>

<wd l="7224" t="12456" r="7613" b="12624">Kim,</wd>

<space/>

<wd l="7733" t="12456" r="8083" b="12600">Karl</wd>

<space/>

<wd l="8189" t="12456" r="8779" b="12624">Stratos,</wd>

<space/>

<wd l="8899" t="12456" r="9182" b="12600">and</wd>

<space/>

<wd l="9278" t="12456" r="9662" b="12600">Ruhi</wd>

<space/>

<wd l="9768" t="12456" r="10498" b="12643">Sarikaya.</wd>

<space/>

</ln>

<ln l="6370" t="12677" r="10498" b="12864" baseLine="12811">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="12677" r="6888" b="12821">2015c.</wd>

<space/>

<wd l="7066" t="12677" r="8016" b="12864">Pre-training</wd>

<space/>

<wd l="8102" t="12677" r="8275" b="12821">of</wd>

<space/>

<wd l="8342" t="12677" r="9264" b="12821">hidden-unit</wd>

<space/>

<wd l="9346" t="12677" r="9677" b="12821">crfs.</wd>

<space/>

<wd l="9854" t="12682" r="10022" b="12816">In</wd>

<space/>

</run>

<wd l="10090" t="12682" r="10498" b="12821"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ACL</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="6365" t="12898" r="9797" b="13085" baseLine="13032" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="12898" r="7306" b="13042">Association</wd>

<space/>

<wd l="7354" t="12898" r="7589" b="13042">for</wd>

<space/>

<wd l="7642" t="12898" r="8818" b="13080">Computational</wd>

<space/>

<wd l="8870" t="12898" r="9797" b="13085">Linguistics.</wd>

</ln>

</para>

<para l="6144" t="13349" r="10512" b="14194" alignment="justified" li="216" spaceBefore="234" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="13349" r="10512" b="13536" baseLine="13488" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13354" r="7123" b="13536">Young-Bum</wd>

<space/>

<wd l="7219" t="13349" r="7613" b="13517">Kim,</wd>

<space/>

<wd l="7733" t="13349" r="8078" b="13493">Karl</wd>

<space/>

<wd l="8179" t="13349" r="8774" b="13517">Stratos,</wd>

<space/>

<wd l="8885" t="13349" r="9274" b="13493">Ruhi</wd>

<space/>

<wd l="9374" t="13349" r="10109" b="13536">Sarikaya,</wd>

<space/>

<wd l="10229" t="13349" r="10512" b="13493">and</wd>

<space/>

</ln>

<ln l="6365" t="13570" r="10502" b="13757" baseLine="13704" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="13570" r="7032" b="13714">Minwoo</wd>

<space/>

<wd l="7090" t="13574" r="7594" b="13757">Jeong.</wd>

<space/>

<wd l="7694" t="13570" r="8227" b="13714">2015d.</wd>

<space/>

<wd l="8318" t="13574" r="8688" b="13714">New</wd>

<space/>

<wd l="8746" t="13570" r="9355" b="13714">transfer</wd>

<space/>

<wd l="9408" t="13570" r="10056" b="13757">learning</wd>

<space/>

<wd l="10114" t="13570" r="10502" b="13714">tech-</wd>

</ln>

<ln l="6365" t="13790" r="10512" b="13973" baseLine="13925">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="13790" r="6878" b="13973">niques</wd>

<space/>

<wd l="6941" t="13790" r="7171" b="13934">for</wd>

<space/>

<wd l="7234" t="13790" r="7944" b="13973">disparate</wd>

<space/>

<wd l="8002" t="13790" r="8386" b="13934">label</wd>

<space/>

<wd l="8453" t="13810" r="8784" b="13934">sets.</wd>

<space/>

<wd l="8885" t="13795" r="9053" b="13930">In</wd>

<space/>

</run>

<wd l="9091" t="13795" r="9504" b="13934"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ACL</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9571" t="13790" r="10512" b="13934">Association</wd>

<space/>

</run>

</ln>

<ln l="6365" t="14006" r="8803" b="14194" baseLine="14146" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="14006" r="6595" b="14150">for</wd>

<space/>

<wd l="6653" t="14006" r="7829" b="14189">Computational</wd>

<space/>

<wd l="7882" t="14006" r="8803" b="14194">Linguistics.</wd>

</ln>

</para>

<para l="6144" t="14462" r="10512" b="15302" alignment="justified" li="216" spaceBefore="237" fli="-216" lsp="exactly" lspExact="217" language="en">

<ln l="6144" t="14462" r="10512" b="14650" baseLine="14602" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14462" r="6523" b="14606">John</wd>

<space/>

<wd l="6595" t="14462" r="7272" b="14650">Lafferty,</wd>

<space/>

<wd l="7358" t="14462" r="7992" b="14606">Andrew</wd>

<space/>

<wd l="8069" t="14462" r="8962" b="14630">McCallum,</wd>

<space/>

<wd l="9053" t="14462" r="9336" b="14606">and</wd>

<space/>

<wd l="9408" t="14462" r="10157" b="14606">Fernando</wd>

<space/>

<wd l="10238" t="14462" r="10512" b="14606">CN</wd>

<space/>

</ln>

<ln l="6365" t="14683" r="10502" b="14827" baseLine="14818" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="14683" r="6965" b="14827">Pereira.</wd>

<space/>

<wd l="7147" t="14683" r="7579" b="14827">2001.</wd>

<space/>

<wd l="7757" t="14683" r="8693" b="14827">Conditional</wd>

<space/>

<wd l="8774" t="14683" r="9384" b="14827">random</wd>

<space/>

<wd l="9466" t="14683" r="9931" b="14827">fields:</wd>

<space/>

<wd l="10070" t="14683" r="10502" b="14827">Prob-</wd>

</ln>

<ln l="6370" t="14899" r="10502" b="15086" baseLine="15038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="14899" r="6994" b="15043">abilistic</wd>

<space/>

<wd l="7099" t="14899" r="7670" b="15043">models</wd>

<space/>

<wd l="7781" t="14899" r="8016" b="15043">for</wd>

<space/>

<wd l="8126" t="14899" r="9029" b="15086">segmenting</wd>

<space/>

<wd l="9144" t="14899" r="9427" b="15043">and</wd>

<space/>

<wd l="9533" t="14899" r="10171" b="15086">labeling</wd>

<space/>

<wd l="10286" t="14942" r="10502" b="15043">se-</wd>

</ln>

<ln l="6370" t="15120" r="7349" b="15302" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="15163" r="6926" b="15302">quence</wd>

<space/>

<wd l="6984" t="15120" r="7349" b="15264">data.</wd>

</ln>

</para>

</column>

</section>

<dd l="1427" t="15736" r="10546" b="15977">

<para l="5800" t="15787" r="6148" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5866" t="15787" r="6082" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="43">

<wd l="5866" t="15787" r="6082" b="15946">76</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4310.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1280" marginRight="6089" marginBottom="858" offsetX="8" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1280" r="5820" b="15980">

<column l="1440" t="1280" r="5820" b="15980">

<para l="1440" t="1334" r="5813" b="2136" alignment="justified" li="216" spaceBefore="24" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="1334" r="5794" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1339" r="2078" b="1478">Laurens</wd>

<space/>

<wd l="2141" t="1339" r="2779" b="1502">Maaten,</wd>

<space/>

<wd l="2851" t="1339" r="3211" b="1478">Max</wd>

<space/>

<wd l="3274" t="1334" r="3941" b="1522">Welling,</wd>

<space/>

<wd l="4018" t="1334" r="4301" b="1478">and</wd>

<space/>

<wd l="4358" t="1339" r="5136" b="1478">Lawrence</wd>

<space/>

<wd l="5203" t="1339" r="5342" b="1474">K</wd>

<space/>

<wd l="5405" t="1334" r="5794" b="1478">Saul.</wd>

<space/>

</ln>

<ln l="1661" t="1555" r="5798" b="1699" baseLine="1694">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="1555" r="2093" b="1699">2011.</wd>

<space/>

<wd l="2179" t="1555" r="3144" b="1699">Hidden-unit</wd>

<space/>

<wd l="3197" t="1555" r="4090" b="1699">conditional</wd>

<space/>

<wd l="4142" t="1555" r="4752" b="1699">random</wd>

<space/>

<wd l="4805" t="1555" r="5270" b="1699">fields.</wd>

<space/>

<wd l="5357" t="1560" r="5525" b="1694">In</wd>

<space/>

</run>

<wd l="5568" t="1560" r="5798" b="1699" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">In-</wd>

</ln>

<ln l="1661" t="1776" r="5813" b="1958" baseLine="1910" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="1776" r="2544" b="1920">ternational</wd>

<space/>

<wd l="2597" t="1776" r="3494" b="1958">Conference</wd>

<space/>

<wd l="3542" t="1824" r="3734" b="1920">on</wd>

<space/>

<wd l="3763" t="1776" r="4488" b="1958">Artificial</wd>

<space/>

<wd l="4522" t="1776" r="5462" b="1958">Intelligence</wd>

<space/>

<wd l="5506" t="1776" r="5813" b="1920">and</wd>

<space/>

</ln>

<ln l="1656" t="1997" r="2414" b="2136" baseLine="2131">

<wd l="1656" t="1997" r="2414" b="2136"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Statistics</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="2390" r="5798" b="3413" alignment="justified" li="216" spaceBefore="175" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="2390" r="5798" b="2534" baseLine="2530" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2390" r="2088" b="2534">Michael</wd>

<space/>

<wd l="2150" t="2390" r="3240" b="2534">Mathioudakis</wd>

<space/>

<wd l="3307" t="2390" r="3590" b="2534">and</wd>

<space/>

<wd l="3648" t="2390" r="4037" b="2534">Nick</wd>

<space/>

<wd l="4094" t="2390" r="4733" b="2534">Koudas.</wd>

<space/>

<wd l="4843" t="2390" r="5275" b="2534">2010.</wd>

<space/>

<wd l="5381" t="2390" r="5798" b="2534">Twit-</wd>

</ln>

<ln l="1656" t="2611" r="5794" b="2755" baseLine="2750" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="2611" r="2539" b="2755">termonitor:</wd>

<space/>

<wd l="2645" t="2611" r="3058" b="2755">trend</wd>

<space/>

<wd l="3125" t="2611" r="3854" b="2755">detection</wd>

<space/>

<wd l="3922" t="2654" r="4267" b="2755">over</wd>

<space/>

<wd l="4330" t="2611" r="4570" b="2755">the</wd>

<space/>

<wd l="4637" t="2611" r="5160" b="2755">twitter</wd>

<space/>

<wd l="5232" t="2630" r="5794" b="2755">stream.</wd>

<space/>

</ln>

<ln l="1656" t="2832" r="5798" b="3014" baseLine="2966">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="2837" r="1824" b="2971">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1906" t="2832" r="2890" b="3014">Proceedings</wd>

<space/>

<wd l="2981" t="2832" r="3158" b="3014">of</wd>

<space/>

<wd l="3216" t="2832" r="3451" b="2976">the</wd>

<space/>

<wd l="3533" t="2832" r="3936" b="2976">2010</wd>

<space/>

<wd l="3998" t="2837" r="4440" b="2976">ACM</wd>

<space/>

<wd l="4512" t="2837" r="5275" b="2976">SIGMOD</wd>

<space/>

<wd l="5352" t="2837" r="5798" b="2976">Inter-</wd>

</run>

</ln>

<ln l="1656" t="3048" r="5798" b="3235" baseLine="3187">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="3048" r="2323" b="3192">national</wd>

<space/>

<wd l="2386" t="3048" r="3283" b="3230">Conference</wd>

<space/>

<wd l="3346" t="3096" r="3538" b="3192">on</wd>

<space/>

<wd l="3590" t="3053" r="4637" b="3230">Management</wd>

<space/>

<wd l="4690" t="3048" r="4872" b="3230">of</wd>

<space/>

</run>

<wd l="4891" t="3048" r="5290" b="3216"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">data</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5352" t="3091" r="5798" b="3235">pages</wd>

<space/>

</run>

</ln>

<ln l="1675" t="3269" r="3139" b="3413" baseLine="3408" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1675" t="3269" r="2592" b="3413">1155–1158.</wd>

<space/>

<wd l="2654" t="3269" r="3139" b="3413">ACM.</wd>

</ln>

</para>

<para l="1440" t="3667" r="5808" b="4733" alignment="justified" li="216" spaceBefore="174" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="3667" r="5798" b="3854" baseLine="3806" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="3667" r="2074" b="3811">Andrew</wd>

<space/>

<wd l="2150" t="3667" r="3005" b="3811">McCallum</wd>

<space/>

<wd l="3077" t="3667" r="3360" b="3811">and</wd>

<space/>

<wd l="3432" t="3667" r="3744" b="3811">Wei</wd>

<space/>

<wd l="3821" t="3667" r="4037" b="3811">Li.</wd>

<space/>

<wd l="4195" t="3667" r="4627" b="3811">2003.</wd>

<space/>

<wd l="4781" t="3667" r="5208" b="3854">Early</wd>

<space/>

<wd l="5285" t="3667" r="5798" b="3811">results</wd>

<space/>

</ln>

<ln l="1656" t="3888" r="5798" b="4075" baseLine="4022" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="3888" r="1891" b="4032">for</wd>

<space/>

<wd l="1968" t="3888" r="2496" b="4032">named</wd>

<space/>

<wd l="2578" t="3888" r="3024" b="4075">entity</wd>

<space/>

<wd l="3101" t="3888" r="4008" b="4075">recognition</wd>

<space/>

<wd l="4085" t="3888" r="4440" b="4032">with</wd>

<space/>

<wd l="4517" t="3888" r="5405" b="4032">conditional</wd>

<space/>

<wd l="5486" t="3931" r="5798" b="4032">ran-</wd>

</ln>

<ln l="1661" t="4104" r="5798" b="4272" baseLine="4243" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1661" t="4104" r="2016" b="4248">dom</wd>

<space/>

<wd l="2059" t="4104" r="2530" b="4272">fields,</wd>

<space/>

<wd l="2582" t="4104" r="3134" b="4248">feature</wd>

<space/>

<wd l="3178" t="4104" r="3931" b="4248">induction</wd>

<space/>

<wd l="3979" t="4104" r="4262" b="4248">and</wd>

<space/>

<wd l="4306" t="4104" r="5458" b="4248">web-enhanced</wd>

<space/>

<wd l="5501" t="4104" r="5798" b="4248">lex-</wd>

</ln>

<ln l="1656" t="4325" r="5808" b="4512" baseLine="4464">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1656" t="4325" r="2117" b="4469">icons.</wd>

<space/>

<wd l="2213" t="4330" r="2381" b="4464">In</wd>

<space/>

</run>

<wd l="2429" t="4330" r="3494" b="4493"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">HLT-NAACL</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="3557" t="4368" r="4003" b="4512">pages</wd>

<space/>

<wd l="4085" t="4325" r="4800" b="4469">188–191.</wd>

<space/>

<wd l="4862" t="4325" r="5808" b="4469">Association</wd>

<space/>

</run>

</ln>

<ln l="1656" t="4546" r="4099" b="4733" baseLine="4680" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="4546" r="1891" b="4690">for</wd>

<space/>

<wd l="1944" t="4546" r="3120" b="4728">Computational</wd>

<space/>

<wd l="3173" t="4546" r="4099" b="4733">Linguistics.</wd>

</ln>

</para>

<para l="1440" t="4944" r="5803" b="6005" alignment="justified" li="216" spaceBefore="177" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="4944" r="5798" b="5131" baseLine="5078" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="4949" r="1963" b="5088">Tomas</wd>

<space/>

<wd l="2011" t="4944" r="2722" b="5112">Mikolov,</wd>

<space/>

<wd l="2779" t="4944" r="3091" b="5131">Ilya</wd>

<space/>

<wd l="3139" t="4944" r="3946" b="5112">Sutskever,</wd>

<space/>

<wd l="4003" t="4944" r="4282" b="5088">Kai</wd>

<space/>

<wd l="4334" t="4944" r="4795" b="5112">Chen,</wd>

<space/>

<wd l="4853" t="4944" r="5237" b="5131">Greg</wd>

<space/>

<wd l="5294" t="4944" r="5390" b="5088">S</wd>

<space/>

<wd l="5448" t="4944" r="5798" b="5088">Cor-</wd>

</ln>

<ln l="1656" t="5160" r="5798" b="5342" baseLine="5299" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="5160" r="2054" b="5328">rado,</wd>

<space/>

<wd l="2131" t="5160" r="2414" b="5304">and</wd>

<space/>

<wd l="2477" t="5160" r="2779" b="5304">Jeff</wd>

<space/>

<wd l="2832" t="5165" r="3288" b="5304">Dean.</wd>

<space/>

<wd l="3413" t="5160" r="3845" b="5304">2013.</wd>

<space/>

<wd l="3965" t="5160" r="4862" b="5304">Distributed</wd>

<space/>

<wd l="4920" t="5179" r="5798" b="5342">representa-</wd>

</ln>

<ln l="1656" t="5381" r="5798" b="5563" baseLine="5520" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="5381" r="2040" b="5525">tions</wd>

<space/>

<wd l="2102" t="5381" r="2275" b="5525">of</wd>

<space/>

<wd l="2318" t="5381" r="2798" b="5525">words</wd>

<space/>

<wd l="2861" t="5381" r="3144" b="5525">and</wd>

<space/>

<wd l="3197" t="5381" r="3792" b="5563">phrases</wd>

<space/>

<wd l="3854" t="5381" r="4138" b="5525">and</wd>

<space/>

<wd l="4190" t="5381" r="4555" b="5525">their</wd>

<space/>

<wd l="4613" t="5381" r="5798" b="5563">compositional-</wd>

</ln>

<ln l="1656" t="5602" r="5803" b="5789" baseLine="5736">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1656" t="5602" r="1896" b="5789">ity.</wd>

<space/>

<wd l="2050" t="5606" r="2218" b="5741">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2270" t="5602" r="3048" b="5746">Advances</wd>

<space/>

<wd l="3130" t="5606" r="3274" b="5746">in</wd>

<space/>

<wd l="3350" t="5602" r="3869" b="5746">neural</wd>

<space/>

<wd l="3946" t="5602" r="4877" b="5784">information</wd>

<space/>

<wd l="4930" t="5606" r="5803" b="5784">processing</wd>

<space/>

</run>

</ln>

<ln l="1656" t="5818" r="3806" b="6005" baseLine="5957">

<wd l="1656" t="5846" r="2309" b="6000"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">systems</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="2366" t="5861" r="2813" b="6005">pages</wd>

<space/>

<wd l="2875" t="5818" r="3806" b="5962">3111–3119.</wd>

</run>

</ln>

</para>

<para l="1440" t="6221" r="5808" b="7272" alignment="justified" li="216" spaceBefore="177" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="6221" r="5798" b="6408" baseLine="6355" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6221" r="1982" b="6408">Jeffrey</wd>

<space/>

<wd l="2030" t="6221" r="2981" b="6408">Pennington,</wd>

<space/>

<wd l="3034" t="6221" r="3662" b="6365">Richard</wd>

<space/>

<wd l="3710" t="6221" r="4296" b="6389">Socher,</wd>

<space/>

<wd l="4349" t="6221" r="4637" b="6365">and</wd>

<space/>

<wd l="4680" t="6221" r="5621" b="6403">Christopher</wd>

<space/>

<wd l="5659" t="6226" r="5798" b="6360">D</wd>

<space/>

</ln>

<ln l="1656" t="6437" r="5808" b="6624" baseLine="6576" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="6437" r="2414" b="6624">Manning.</wd>

<space/>

<wd l="2731" t="6437" r="3163" b="6581">2014.</wd>

<space/>

<wd l="3480" t="6437" r="3994" b="6581">Glove:</wd>

<space/>

<wd l="4219" t="6437" r="4757" b="6581">Global</wd>

<space/>

<wd l="4882" t="6456" r="5448" b="6581">vectors</wd>

<space/>

<wd l="5573" t="6437" r="5808" b="6581">for</wd>

<space/>

</ln>

<ln l="1656" t="6658" r="5808" b="6840" baseLine="6792">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="6658" r="2069" b="6802">word</wd>

<space/>

<wd l="2122" t="6658" r="3288" b="6840">representation.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3398" t="6658" r="4382" b="6840">Proceedings</wd>

<space/>

<wd l="4445" t="6658" r="4627" b="6840">of</wd>

<space/>

<wd l="4656" t="6658" r="4896" b="6802">the</wd>

<space/>

<wd l="4949" t="6658" r="5808" b="6840">Empiricial</wd>

<space/>

</run>

</ln>

<ln l="1651" t="6874" r="5808" b="7056" baseLine="7013" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="6874" r="2342" b="7018">Methods</wd>

<space/>

<wd l="2414" t="6878" r="2554" b="7018">in</wd>

<space/>

<wd l="2616" t="6874" r="3240" b="7018">Natural</wd>

<space/>

<wd l="3293" t="6878" r="4090" b="7056">Language</wd>

<space/>

<wd l="4147" t="6878" r="5021" b="7056">Processing</wd>

<space/>

<wd l="5093" t="6878" r="5808" b="7051">(EMNLP</wd>

<space/>

</ln>

<ln l="1656" t="7094" r="3413" b="7272" baseLine="7234">

<wd l="1656" t="7094" r="2165" b="7272"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2014)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2242" t="7094" r="3413" b="7238">12:1532–1543.</wd>

</run>

</ln>

</para>

<para l="1440" t="7493" r="5803" b="8731" alignment="justified" li="216" spaceBefore="170" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="7493" r="5794" b="7661" baseLine="7632" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="7493" r="1824" b="7637">Alan</wd>

<space/>

<wd l="1915" t="7493" r="2405" b="7661">Ritter,</wd>

<space/>

<wd l="2510" t="7493" r="2866" b="7637">Sam</wd>

<space/>

<wd l="2952" t="7493" r="3432" b="7661">Clark,</wd>

<space/>

<wd l="3542" t="7493" r="3936" b="7637">Oren</wd>

<space/>

<wd l="4022" t="7493" r="4642" b="7661">Etzioni,</wd>

<space/>

<wd l="4747" t="7512" r="4886" b="7637">et</wd>

<space/>

<wd l="4978" t="7493" r="5155" b="7637">al.</wd>

<space/>

<wd l="5362" t="7493" r="5794" b="7637">2011.</wd>

<space/>

</ln>

<ln l="1656" t="7714" r="5803" b="7901" baseLine="7848" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="7714" r="2237" b="7858">Named</wd>

<space/>

<wd l="2280" t="7714" r="2726" b="7901">entity</wd>

<space/>

<wd l="2770" t="7714" r="3682" b="7901">recognition</wd>

<space/>

<wd l="3720" t="7714" r="3874" b="7853">in</wd>

<space/>

<wd l="3917" t="7733" r="4464" b="7858">tweets:</wd>

<space/>

<wd l="4541" t="7757" r="4723" b="7858">an</wd>

<space/>

<wd l="4771" t="7714" r="5803" b="7896">experimental</wd>

<space/>

</ln>

<ln l="1666" t="7930" r="5798" b="8117" baseLine="8069">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1666" t="7930" r="2117" b="8117">study.</wd>

<space/>

<wd l="2208" t="7934" r="2376" b="8069">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="2424" t="7930" r="3413" b="8112">Proceedings</wd>

<space/>

<wd l="3470" t="7930" r="3653" b="8112">of</wd>

<space/>

<wd l="3677" t="7930" r="3917" b="8074">the</wd>

<space/>

<wd l="3979" t="7930" r="4877" b="8112">Conference</wd>

<space/>

<wd l="4939" t="7978" r="5131" b="8074">on</wd>

<space/>

<wd l="5179" t="7934" r="5798" b="8112">Empiri-</wd>

</run>

</ln>

<ln l="1661" t="8150" r="5798" b="8338" baseLine="8290">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1661" t="8150" r="1906" b="8294">cal</wd>

<space/>

<wd l="1944" t="8150" r="2630" b="8294">Methods</wd>

<space/>

<wd l="2688" t="8155" r="2832" b="8294">in</wd>

<space/>

<wd l="2875" t="8150" r="3499" b="8294">Natural</wd>

<space/>

<wd l="3538" t="8155" r="4330" b="8333">Language</wd>

<space/>

</run>

<wd l="4378" t="8155" r="5299" b="8333"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">Processing</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="5352" t="8194" r="5798" b="8338">pages</wd>

<space/>

</run>

</ln>

<ln l="1675" t="8371" r="5798" b="8558" baseLine="8506" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1675" t="8371" r="2592" b="8515">1524–1534.</wd>

<space/>

<wd l="2645" t="8371" r="3590" b="8515">Association</wd>

<space/>

<wd l="3629" t="8371" r="3864" b="8515">for</wd>

<space/>

<wd l="3907" t="8371" r="5083" b="8554">Computational</wd>

<space/>

<wd l="5131" t="8371" r="5798" b="8558">Linguis-</wd>

</ln>

<ln l="1656" t="8587" r="1973" b="8731" baseLine="8726" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="8587" r="1973" b="8731">tics.</wd>

</ln>

</para>

<para l="1440" t="8990" r="5794" b="9571" alignment="justified" li="216" spaceBefore="178" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="8990" r="5794" b="9158" baseLine="9125" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="8990" r="1824" b="9134">Alan</wd>

<space/>

<wd l="1910" t="8990" r="2395" b="9158">Ritter,</wd>

<space/>

<wd l="2491" t="8995" r="3221" b="9158">Mausam,</wd>

<space/>

<wd l="3322" t="8990" r="3715" b="9134">Oren</wd>

<space/>

<wd l="3797" t="8990" r="4416" b="9158">Etzioni,</wd>

<space/>

<wd l="4512" t="8990" r="4800" b="9134">and</wd>

<space/>

<wd l="4882" t="8990" r="5237" b="9134">Sam</wd>

<space/>

<wd l="5318" t="8990" r="5794" b="9134">Clark.</wd>

<space/>

</ln>

<ln l="1661" t="9206" r="5794" b="9389" baseLine="9346" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="9206" r="2093" b="9350">2012.</wd>

<space/>

<wd l="2256" t="9206" r="2683" b="9389">Open</wd>

<space/>

<wd l="2760" t="9206" r="3355" b="9350">domain</wd>

<space/>

<wd l="3427" t="9226" r="3850" b="9350">event</wd>

<space/>

<wd l="3926" t="9206" r="4714" b="9350">extraction</wd>

<space/>

<wd l="4786" t="9206" r="5179" b="9350">from</wd>

<space/>

<wd l="5246" t="9206" r="5794" b="9350">twitter.</wd>

<space/>

</ln>

<ln l="1656" t="9432" r="2333" b="9571" baseLine="9562">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="9432" r="1824" b="9566">In</wd>

<space/>

</run>

<wd l="1872" t="9432" r="2333" b="9571"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">KDD</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1445" t="9826" r="5808" b="10627" alignment="justified" li="216" spaceBefore="176" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1445" t="9826" r="5808" b="10013" baseLine="9960" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="9826" r="1790" b="9970">Karl</wd>

<space/>

<wd l="1906" t="9826" r="2496" b="9994">Stratos,</wd>

<space/>

<wd l="2621" t="9826" r="3389" b="10013">Do-kyum</wd>

<space/>

<wd l="3494" t="9826" r="3888" b="9994">Kim,</wd>

<space/>

<wd l="4013" t="9826" r="4666" b="9970">Michael</wd>

<space/>

<wd l="4776" t="9826" r="5390" b="9994">Collins,</wd>

<space/>

<wd l="5525" t="9826" r="5808" b="9970">and</wd>

<space/>

</ln>

<ln l="1656" t="10046" r="5803" b="10234" baseLine="10181" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="10046" r="2189" b="10190">Daniel</wd>

<space/>

<wd l="2237" t="10051" r="2597" b="10190">Hsu.</wd>

<space/>

<wd l="2683" t="10046" r="3115" b="10190">2014.</wd>

<space/>

<wd l="3197" t="10051" r="3341" b="10186">A</wd>

<space/>

<wd l="3398" t="10046" r="4003" b="10229">spectral</wd>

<space/>

<wd l="4061" t="10046" r="4834" b="10234">algorithm</wd>

<space/>

<wd l="4877" t="10046" r="5107" b="10190">for</wd>

<space/>

<wd l="5150" t="10046" r="5803" b="10234">learning</wd>

<space/>

</ln>

<ln l="1661" t="10262" r="5808" b="10450" baseLine="10402">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="10262" r="2568" b="10406">class-based</wd>

<space/>

</run>

<wd l="2630" t="10306" r="3226" b="10450"><run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">n</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">-gram</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3283" t="10262" r="3854" b="10406">models</wd>

<space/>

<wd l="3926" t="10262" r="4099" b="10406">of</wd>

<space/>

<wd l="4147" t="10262" r="4699" b="10406">natural</wd>

<space/>

<wd l="4762" t="10262" r="5520" b="10450">language.</wd>

<space/>

<wd l="5640" t="10267" r="5808" b="10402">In</wd>

<space/>

</run>

</ln>

<ln l="1675" t="10488" r="2021" b="10627" baseLine="10618">

<wd l="1675" t="10488" r="2021" b="10627"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">UAI</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="10882" r="5808" b="12163" alignment="justified" li="216" spaceBefore="175" spaceAfter="3803" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="10882" r="5794" b="11069" baseLine="11016" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10882" r="1982" b="11064">Joseph</wd>

<space/>

<wd l="2026" t="10882" r="2592" b="11050">Turian,</wd>

<space/>

<wd l="2640" t="10886" r="2942" b="11026">Lev</wd>

<space/>

<wd l="2990" t="10882" r="3648" b="11050">Ratinov,</wd>

<space/>

<wd l="3706" t="10882" r="3989" b="11026">and</wd>

<space/>

<wd l="4027" t="10882" r="4618" b="11026">Yoshua</wd>

<space/>

<wd l="4661" t="10882" r="5270" b="11069">Bengio.</wd>

<space/>

<wd l="5362" t="10882" r="5794" b="11026">2010.</wd>

<space/>

</ln>

<ln l="1656" t="11102" r="5808" b="11290" baseLine="11237" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="11102" r="2098" b="11246">Word</wd>

<space/>

<wd l="2150" t="11102" r="3398" b="11285">representations:</wd>

<space/>

<wd l="3494" t="11146" r="3581" b="11246">a</wd>

<space/>

<wd l="3643" t="11102" r="4162" b="11285">simple</wd>

<space/>

<wd l="4224" t="11102" r="4512" b="11246">and</wd>

<space/>

<wd l="4570" t="11102" r="5150" b="11290">general</wd>

<space/>

<wd l="5208" t="11102" r="5808" b="11246">method</wd>

<space/>

</ln>

<ln l="1656" t="11318" r="5803" b="11506" baseLine="11458">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1656" t="11318" r="1891" b="11462">for</wd>

<space/>

<wd l="1954" t="11318" r="3240" b="11501">semi-supervised</wd>

<space/>

<wd l="3298" t="11318" r="3989" b="11506">learning.</wd>

<space/>

<wd l="4090" t="11323" r="4253" b="11458">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="4310" t="11318" r="5294" b="11501">Proceedings</wd>

<space/>

<wd l="5357" t="11318" r="5539" b="11501">of</wd>

<space/>

<wd l="5568" t="11318" r="5803" b="11462">the</wd>

<space/>

</run>

</ln>

<ln l="1656" t="11539" r="5798" b="11722" baseLine="11674" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="11539" r="2011" b="11683">48th</wd>

<space/>

<wd l="2078" t="11539" r="2635" b="11683">annual</wd>

<space/>

<wd l="2702" t="11544" r="3326" b="11722">meeting</wd>

<space/>

<wd l="3403" t="11539" r="3586" b="11722">of</wd>

<space/>

<wd l="3629" t="11539" r="3864" b="11683">the</wd>

<space/>

<wd l="3931" t="11544" r="4838" b="11683">association</wd>

<space/>

<wd l="4872" t="11539" r="5150" b="11722">for</wd>

<space/>

<wd l="5213" t="11587" r="5798" b="11722">compu-</wd>

</ln>

<ln l="1661" t="11760" r="5808" b="11947" baseLine="11894">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1661" t="11760" r="2280" b="11904">tational</wd>

<space/>

</run>

<wd l="2338" t="11760" r="3197" b="11942"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">linguistics</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="3264" t="11803" r="3710" b="11947">pages</wd>

<space/>

<wd l="3778" t="11760" r="4507" b="11904">384–394.</wd>

<space/>

<wd l="4574" t="11760" r="5520" b="11904">Association</wd>

<space/>

<wd l="5573" t="11760" r="5808" b="11904">for</wd>

<space/>

</run>

</ln>

<ln l="1661" t="11976" r="3816" b="12163" baseLine="12115" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1661" t="11976" r="2842" b="12158">Computational</wd>

<space/>

<wd l="2894" t="11976" r="3816" b="12163">Linguistics.</wd>

</ln>

</para>

</column>

</section>

<dd l="5820" t="15726" r="6176" b="15980">

<para l="5820" t="15792" r="6143" b="15946" alignment="left" spaceBefore="12" lsp="exactly" lspExact="231" language="en">

<ln l="5866" t="15792" r="6077" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="4">

<wd l="5866" t="15792" r="6077" b="15946">77</wd>

</ln>

</para>

</dd>

</body>

</page>

</document>

