<?xml version="1.0" encoding="UTF-16"?>

<!--XML document generated using OCR technology from Nuance Communications, Inc.-->

<document xmlns="http://www.scansoft.com/omnipage/xml/ssdoc-schema3.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4301.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1433" marginTop="1180" marginRight="1378" marginBottom="358" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1433" t="1180" r="10531" b="4092">

<column l="1433" t="1180" r="10531" b="4092">

<para l="1459" t="1253" r="10488" b="1517" alignment="left" spaceBefore="17" lsp="exactly" lspExact="326" language="en">

<ln l="1459" t="1253" r="10488" b="1517" baseLine="1450" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1459" t="1253" r="2554" b="1517">Minority</wd>

<space/>

<wd l="2635" t="1258" r="3840" b="1517">Language</wd>

<space/>

<wd l="3917" t="1253" r="4886" b="1459">Twitter:</wd>

<space/>

<wd l="5002" t="1253" r="6826" b="1517">Part-of-Speech</wd>

<space/>

<wd l="6907" t="1253" r="7877" b="1517">Tagging</wd>

<space/>

<wd l="7954" t="1258" r="8410" b="1459">and</wd>

<space/>

<wd l="8486" t="1253" r="9514" b="1517">Analysis</wd>

<space/>

<wd l="9600" t="1253" r="9850" b="1459">of</wd>

<space/>

<wd l="9907" t="1253" r="10488" b="1459">Irish</wd>

</ln>

</para>

<para l="5558" t="1574" r="6389" b="1776" alignment="centered" lsp="exactly" lspExact="327" language="en">

<ln l="5558" t="1574" r="6389" b="1776" baseLine="1771" bold="true" underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="5558" t="1574" r="6389" b="1776">Tweets</wd>

</ln>

</para>

<para l="2160" t="1992" r="9797" b="3926" alignment="centered" spaceBefore="120" spaceAfter="159" lsp="exactly" lspExact="280" language="en">

<ln l="3154" t="1992" r="8779" b="2242" baseLine="2174" forcedEOF="true">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3154" t="2026" r="3816" b="2194">Teresa</wd>

<space/>

</run>

<wd l="3874" t="1992" r="4690" b="2242"><run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Lynn</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&apos;</run>

<run underlined="none" subsuperscript="superscript" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">,3</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4757" t="2021" r="5352" b="2194">Kevin</wd>

<space/>

</run>

<wd l="5419" t="1992" r="6432" b="2232"><run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Scannell</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&apos;</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6557" t="2026" r="6898" b="2194">and</wd>

<space/>

</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7018" t="2021" r="7771" b="2194">Eimear</wd>

<space/>

</run>

<wd l="7834" t="1992" r="8779" b="2242"><run bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Maguire</run>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&apos;
</run>

</wd>

</ln>

<ln l="2563" t="2270" r="9403" b="2520" baseLine="2460" forcedEOF="true">

<wd l="2563" t="2270" r="3427" b="2467"><run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&apos;</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ADAPT</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3494" t="2304" r="4176" b="2501">Centre,</wd>

<space/>

<wd l="4258" t="2304" r="4906" b="2472">School</wd>

<space/>

<wd l="4978" t="2304" r="5189" b="2472">of</wd>

<space/>

<wd l="5237" t="2304" r="6355" b="2520">Computing,</wd>

<space/>

<wd l="6427" t="2304" r="7090" b="2472">Dublin</wd>

<space/>

<wd l="7157" t="2304" r="7555" b="2520">City</wd>

<space/>

<wd l="7622" t="2304" r="8654" b="2520">University,</wd>

<space/>

<wd l="8726" t="2304" r="9403" b="2472">Ireland
</wd>

</run>

</ln>

<ln l="2160" t="2549" r="9797" b="2798" baseLine="2739" forcedEOF="true">

<wd l="2160" t="2549" r="3379" b="2798"><run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&apos;</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Department</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3442" t="2582" r="3653" b="2750">of</wd>

<space/>

<wd l="3696" t="2582" r="4925" b="2750">Mathematics</wd>

<space/>

<wd l="4997" t="2582" r="5338" b="2750">and</wd>

<space/>

<wd l="5400" t="2582" r="6355" b="2798">Computer</wd>

<space/>

<wd l="6422" t="2582" r="7205" b="2779">Science,</wd>

<space/>

<wd l="7286" t="2582" r="7517" b="2750">St.</wd>

<space/>

<wd l="7608" t="2582" r="8146" b="2750">Louis</wd>

<space/>

<wd l="8213" t="2582" r="9245" b="2798">University,</wd>

<space/>

<wd l="9317" t="2582" r="9797" b="2750">USA
</wd>

</run>

</ln>

<ln l="2669" t="2827" r="9288" b="3077" baseLine="3022" forcedEOF="true">

<wd l="2669" t="2827" r="3893" b="3077"><run underlined="none" subsuperscript="superscript" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">3</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Department</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="3955" t="2861" r="4166" b="3029">of</wd>

<space/>

<wd l="4214" t="2861" r="5333" b="3077">Computing,</wd>

<space/>

<wd l="5405" t="2861" r="6427" b="3077">Macquarie</wd>

<space/>

<wd l="6485" t="2861" r="7517" b="3077">University,</wd>

<space/>

<wd l="7598" t="2861" r="8338" b="3077">Sydney,</wd>

<space/>

<wd l="8410" t="2861" r="9288" b="3029">Australia
</wd>

</run>

</ln>

<ln l="3600" t="3106" r="8347" b="3365" baseLine="3299" forcedEOF="true">

<wd l="3600" t="3106" r="8347" b="3365">&apos;{tlynn,emaguire}@computing.dcu.ie
</wd>

</ln>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&apos;</run>

<run underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">{</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">tlynn,emaguire</run>

<run underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">}</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">@computing.dcu.ie
</run>

<ln l="4594" t="3384" r="7363" b="3643" baseLine="3576" forcedEOF="true">

<wd l="4594" t="3384" r="7363" b="3643">&apos;{kscanne}@gmail.com
</wd>

</ln>

<run underlined="none" subsuperscript="none" fontSize="800" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&apos;</run>

<run underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">{</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">kscanne</run>

<run underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">}</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">@gmail.com
</run>

<ln l="4277" t="3662" r="7666" b="3926" baseLine="3855" forcedEOF="true">

<wd l="4277" t="3662" r="7666" b="3926"><run underlined="none" subsuperscript="superscript" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">3</run>

<run underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">{</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">teresa.lynn</run>

<run underlined="none" subsuperscript="none" fontSize="1450" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">}</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="0">@mq.edu.au</run>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</column>

</section>

<section l="1433" t="4092" r="10531" b="15318">

<column l="1433" t="4092" r="5820" b="15318">

<para l="3178" t="4142" r="4070" b="4315" alignment="centered" spaceBefore="3" lsp="exactly" lspExact="273" language="en">

<ln l="3178" t="4142" r="4070" b="4315" baseLine="4306" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3178" t="4142" r="4070" b="4315">Abstract</wd>

</ln>

</para>

<para l="1781" t="4546" r="5477" b="8813" alignment="justified" li="288" ri="360" spaceBefore="119" lsp="exactly" lspExact="271" language="en">

<ln l="1781" t="4546" r="5458" b="4747" baseLine="4699" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="4546" r="2299" b="4747">Noisy</wd>

<space/>

<wd l="2366" t="4546" r="3648" b="4747">user-generated</wd>

<space/>

<wd l="3715" t="4570" r="4037" b="4704">text</wd>

<space/>

<wd l="4104" t="4598" r="4579" b="4747">poses</wd>

<space/>

<wd l="4651" t="4546" r="5458" b="4747">problems</wd>

<space/>

</ln>

<ln l="1781" t="4819" r="5458" b="5021" baseLine="4968" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="4819" r="2040" b="4978">for</wd>

<space/>

<wd l="2126" t="4819" r="2731" b="4978">natural</wd>

<space/>

<wd l="2827" t="4819" r="3614" b="5021">language</wd>

<space/>

<wd l="3706" t="4819" r="4685" b="5021">processing.</wd>

<space/>

<wd l="4877" t="4824" r="5059" b="4973">In</wd>

<space/>

<wd l="5150" t="4819" r="5458" b="4978">this</wd>

<space/>

</ln>

<ln l="1781" t="5088" r="5462" b="5290" baseLine="5242" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="5141" r="2299" b="5290">paper,</wd>

<space/>

<wd l="2424" t="5141" r="2678" b="5246">we</wd>

<space/>

<wd l="2789" t="5088" r="3230" b="5246">show</wd>

<space/>

<wd l="3331" t="5088" r="3662" b="5246">that</wd>

<space/>

<wd l="3763" t="5088" r="4070" b="5246">this</wd>

<space/>

<wd l="4186" t="5112" r="5016" b="5246">statement</wd>

<space/>

<wd l="5117" t="5088" r="5462" b="5246">also</wd>

<space/>

</ln>

<ln l="1781" t="5362" r="5467" b="5563" baseLine="5510" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="5362" r="2246" b="5520">holds</wd>

<space/>

<wd l="2352" t="5386" r="2693" b="5520">true</wd>

<space/>

<wd l="2794" t="5362" r="3053" b="5520">for</wd>

<space/>

<wd l="3149" t="5362" r="3413" b="5520">the</wd>

<space/>

<wd l="3518" t="5362" r="3917" b="5520">Irish</wd>

<space/>

<wd l="4018" t="5362" r="4848" b="5563">language.</wd>

<space/>

<wd l="5064" t="5362" r="5467" b="5520">Irish</wd>

<space/>

</ln>

<ln l="1781" t="5630" r="5453" b="5832" baseLine="5784" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="5630" r="1920" b="5789">is</wd>

<space/>

<wd l="2011" t="5630" r="2770" b="5832">regarded</wd>

<space/>

<wd l="2856" t="5683" r="3024" b="5789">as</wd>

<space/>

<wd l="3120" t="5683" r="3216" b="5789">a</wd>

<space/>

<wd l="3298" t="5630" r="4541" b="5789">low-resourced</wd>

<space/>

<wd l="4622" t="5630" r="5453" b="5832">language,</wd>

<space/>

</ln>

<ln l="1781" t="5904" r="5462" b="6106" baseLine="6053" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="5904" r="2170" b="6062">with</wd>

<space/>

<wd l="2266" t="5904" r="2885" b="6062">limited</wd>

<space/>

<wd l="2986" t="5904" r="3830" b="6062">annotated</wd>

<space/>

<wd l="3931" t="5957" r="4594" b="6106">corpora</wd>

<space/>

<wd l="4694" t="5904" r="5462" b="6062">available</wd>

<space/>

</ln>

<ln l="1781" t="6173" r="5462" b="6374" baseLine="6326" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="6197" r="1949" b="6331">to</wd>

<space/>

<wd l="2030" t="6178" r="2443" b="6331">NLP</wd>

<space/>

<wd l="2525" t="6173" r="3499" b="6331">researchers</wd>

<space/>

<wd l="3590" t="6173" r="3902" b="6331">and</wd>

<space/>

<wd l="3984" t="6173" r="4714" b="6374">linguists</wd>

<space/>

<wd l="4805" t="6197" r="4968" b="6331">to</wd>

<space/>

<wd l="5054" t="6173" r="5462" b="6374">fully</wd>

<space/>

</ln>

<ln l="1786" t="6446" r="5462" b="6648" baseLine="6595" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="6446" r="2434" b="6648">analyse</wd>

<space/>

<wd l="2496" t="6446" r="2760" b="6605">the</wd>

<space/>

<wd l="2822" t="6446" r="3629" b="6648">linguistic</wd>

<space/>

<wd l="3696" t="6470" r="4378" b="6648">patterns</wd>

<space/>

<wd l="4445" t="6446" r="4618" b="6600">in</wd>

<space/>

<wd l="4680" t="6446" r="5462" b="6648">language</wd>

<space/>

</ln>

<ln l="1781" t="6715" r="5453" b="6874" baseLine="6864" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="6768" r="2069" b="6874">use</wd>

<space/>

<wd l="2141" t="6715" r="2314" b="6869">in</wd>

<space/>

<wd l="2395" t="6715" r="2890" b="6874">social</wd>

<space/>

<wd l="2966" t="6715" r="3542" b="6874">media.</wd>

<space/>

<wd l="3672" t="6720" r="3955" b="6874">We</wd>

<space/>

<wd l="4032" t="6715" r="4910" b="6874">contribute</wd>

<space/>

<wd l="4982" t="6739" r="5146" b="6874">to</wd>

<space/>

<wd l="5222" t="6768" r="5453" b="6874">re-</wd>

</ln>

<ln l="1786" t="6989" r="5462" b="7190" baseLine="7138" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="7013" r="2146" b="7147">cent</wd>

<space/>

<wd l="2227" t="6989" r="3010" b="7147">advances</wd>

<space/>

<wd l="3096" t="6989" r="3269" b="7142">in</wd>

<space/>

<wd l="3346" t="6989" r="3653" b="7147">this</wd>

<space/>

<wd l="3744" t="7042" r="4104" b="7147">area</wd>

<space/>

<wd l="4186" t="6989" r="4378" b="7147">of</wd>

<space/>

<wd l="4440" t="6989" r="5170" b="7147">research</wd>

<space/>

<wd l="5246" t="6989" r="5462" b="7190">by</wd>

<space/>

</ln>

<ln l="1781" t="7258" r="5453" b="7459" baseLine="7406" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="7258" r="2578" b="7459">reporting</wd>

<space/>

<wd l="2674" t="7310" r="2885" b="7416">on</wd>

<space/>

<wd l="2971" t="7258" r="3240" b="7416">the</wd>

<space/>

<wd l="3331" t="7258" r="4445" b="7459">development</wd>

<space/>

<wd l="4536" t="7258" r="4728" b="7416">of</wd>

<space/>

<wd l="4800" t="7258" r="5453" b="7459">part-of-</wd>

</ln>

<ln l="1790" t="7526" r="5467" b="7728" baseLine="7680" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1790" t="7526" r="2376" b="7728">speech</wd>

<space/>

<wd l="2467" t="7526" r="3384" b="7685">annotation</wd>

<space/>

<wd l="3480" t="7526" r="4123" b="7685">scheme</wd>

<space/>

<wd l="4219" t="7526" r="4531" b="7685">and</wd>

<space/>

<wd l="4622" t="7526" r="5467" b="7685">annotated</wd>

<space/>

</ln>

<ln l="1786" t="7800" r="5462" b="8002" baseLine="7949" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1786" t="7853" r="2352" b="8002">corpus</wd>

<space/>

<wd l="2424" t="7800" r="2683" b="7958">for</wd>

<space/>

<wd l="2746" t="7800" r="3144" b="7958">Irish</wd>

<space/>

<wd l="3206" t="7800" r="3994" b="8002">language</wd>

<space/>

<wd l="4056" t="7824" r="4661" b="7958">tweets.</wd>

<space/>

<wd l="4766" t="7805" r="5050" b="7958">We</wd>

<space/>

<wd l="5117" t="7800" r="5462" b="7958">also</wd>

<space/>

</ln>

<ln l="1781" t="8069" r="5477" b="8270" baseLine="8222" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="8098" r="2304" b="8270">report</wd>

<space/>

<wd l="2357" t="8122" r="2568" b="8227">on</wd>

<space/>

<wd l="2626" t="8069" r="3917" b="8227">state-of-the-art</wd>

<space/>

<wd l="3960" t="8069" r="4613" b="8270">tagging</wd>

<space/>

<wd l="4666" t="8069" r="5227" b="8227">results</wd>

<space/>

<wd l="5290" t="8069" r="5477" b="8227">of</wd>

<space/>

</ln>

<ln l="1781" t="8342" r="5453" b="8544" baseLine="8491" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="8342" r="2458" b="8544">training</wd>

<space/>

<wd l="2568" t="8342" r="2880" b="8501">and</wd>

<space/>

<wd l="2981" t="8342" r="3557" b="8544">testing</wd>

<space/>

<wd l="3662" t="8342" r="4099" b="8501">three</wd>

<space/>

<wd l="4205" t="8342" r="4886" b="8544">existing</wd>

<space/>

<wd l="4992" t="8347" r="5453" b="8501">POS-</wd>

</ln>

<ln l="1781" t="8611" r="4142" b="8813" baseLine="8765" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1781" t="8635" r="2400" b="8813">taggers</wd>

<space/>

<wd l="2472" t="8664" r="2683" b="8770">on</wd>

<space/>

<wd l="2741" t="8664" r="3034" b="8770">our</wd>

<space/>

<wd l="3082" t="8664" r="3437" b="8770">new</wd>

<space/>

<wd l="3499" t="8611" r="4142" b="8770">dataset.</wd>

</ln>

</para>

<para l="1454" t="8995" r="3091" b="9168" alignment="left" spaceBefore="129" lsp="exactly" lspExact="273" language="en">

<ln l="1454" t="8995" r="3091" b="9168" baseLine="9163" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="1454" t="8995" r="1550" b="9163">1</wd>

<space/>

<wd l="1805" t="8995" r="3091" b="9168">Introduction</wd>

</ln>

</para>

<para l="1440" t="9418" r="5808" b="14765" alignment="justified" spaceBefore="130" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="9418" r="5808" b="9619" baseLine="9566" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9418" r="1781" b="9576">The</wd>

<space/>

<wd l="1834" t="9418" r="2621" b="9619">language</wd>

<space/>

<wd l="2688" t="9418" r="3091" b="9619">style</wd>

<space/>

<wd l="3149" t="9418" r="3922" b="9576">variation</wd>

<space/>

<wd l="3974" t="9418" r="4378" b="9576">used</wd>

<space/>

<wd l="4435" t="9470" r="4651" b="9576">on</wd>

<space/>

<wd l="4718" t="9418" r="5213" b="9576">social</wd>

<space/>

<wd l="5270" t="9418" r="5808" b="9576">media</wd>

<space/>

</ln>

<ln l="1440" t="9686" r="5808" b="9888" baseLine="9835" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9686" r="2318" b="9888">platforms,</wd>

<space/>

<wd l="2438" t="9686" r="2827" b="9845">such</wd>

<space/>

<wd l="2918" t="9739" r="3086" b="9845">as</wd>

<space/>

<wd l="3182" t="9686" r="3811" b="9845">Twitter</wd>

<space/>

<wd l="3898" t="9686" r="4157" b="9845">for</wd>

<space/>

<wd l="4243" t="9686" r="5016" b="9888">example,</wd>

<space/>

<wd l="5126" t="9686" r="5261" b="9845">is</wd>

<space/>

<wd l="5362" t="9686" r="5808" b="9845">often</wd>

<space/>

</ln>

<ln l="1440" t="9960" r="5798" b="10162" baseLine="10109" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9960" r="2131" b="10118">referred</wd>

<space/>

<wd l="2213" t="9984" r="2381" b="10118">to</wd>

<space/>

<wd l="2472" t="10013" r="2645" b="10118">as</wd>

<space/>

<wd l="2736" t="9960" r="3206" b="10162">noisy</wd>

<space/>

<wd l="3293" t="9960" r="4574" b="10162">user-generated</wd>

<space/>

<wd l="4656" t="9984" r="5026" b="10118">text.</wd>

<space/>

<wd l="5194" t="9965" r="5798" b="10118">Tweets</wd>

<space/>

</ln>

<ln l="1445" t="10229" r="5794" b="10430" baseLine="10378" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="10282" r="1738" b="10387">can</wd>

<space/>

<wd l="1814" t="10229" r="2453" b="10387">contain</wd>

<space/>

<wd l="2515" t="10229" r="3715" b="10430">typographical</wd>

<space/>

<wd l="3787" t="10282" r="4282" b="10387">errors</wd>

<space/>

<wd l="4363" t="10229" r="4675" b="10387">and</wd>

<space/>

<wd l="4738" t="10253" r="5794" b="10430">ungrammat-</wd>

</ln>

<ln l="1440" t="10498" r="5794" b="10699" baseLine="10651" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10498" r="1752" b="10656">ical</wd>

<space/>

<wd l="1862" t="10522" r="2693" b="10656">structures</wd>

<space/>

<wd l="2794" t="10498" r="3125" b="10656">that</wd>

<space/>

<wd l="3216" t="10550" r="3614" b="10699">pose</wd>

<space/>

<wd l="3715" t="10498" r="4627" b="10699">challenges</wd>

<space/>

<wd l="4728" t="10498" r="4987" b="10656">for</wd>

<space/>

<wd l="5078" t="10550" r="5794" b="10699">process-</wd>

</ln>

<ln l="1440" t="10771" r="5794" b="10973" baseLine="10920" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10771" r="1714" b="10973">ing</wd>

<space/>

<wd l="1829" t="10771" r="2246" b="10930">tools</wd>

<space/>

<wd l="2362" t="10771" r="2693" b="10930">that</wd>

<space/>

<wd l="2803" t="10771" r="3206" b="10930">have</wd>

<space/>

<wd l="3317" t="10771" r="3730" b="10930">been</wd>

<space/>

<wd l="3845" t="10771" r="4618" b="10973">designed</wd>

<space/>

<wd l="4723" t="10771" r="4982" b="10930">for</wd>

<space/>

<wd l="5093" t="10771" r="5405" b="10930">and</wd>

<space/>

<wd l="5515" t="10771" r="5794" b="10930">tai-</wd>

</ln>

<ln l="1440" t="11040" r="5808" b="11242" baseLine="11194" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11040" r="1891" b="11198">lored</wd>

<space/>

<wd l="1949" t="11064" r="2117" b="11198">to</wd>

<space/>

<wd l="2184" t="11040" r="2573" b="11242">high</wd>

<space/>

<wd l="2635" t="11040" r="3269" b="11242">quality,</wd>

<space/>

<wd l="3341" t="11040" r="4325" b="11198">well-edited</wd>

<space/>

<wd l="4387" t="11064" r="4714" b="11198">text</wd>

<space/>

<wd l="4781" t="11040" r="5174" b="11198">such</wd>

<space/>

<wd l="5242" t="11093" r="5410" b="11198">as</wd>

<space/>

<wd l="5477" t="11040" r="5808" b="11198">that</wd>

<space/>

</ln>

<ln l="1440" t="11314" r="5794" b="11501" baseLine="11462" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11314" r="1949" b="11472">found</wd>

<space/>

<wd l="2045" t="11314" r="2218" b="11467">in</wd>

<space/>

<wd l="2314" t="11314" r="3187" b="11501">newswire,</wd>

<space/>

<wd l="3302" t="11314" r="4090" b="11472">literature</wd>

<space/>

<wd l="4195" t="11314" r="4502" b="11472">and</wd>

<space/>

<wd l="4603" t="11314" r="5208" b="11472">official</wd>

<space/>

<wd l="5314" t="11314" r="5794" b="11472">docu-</wd>

</ln>

<ln l="1440" t="11582" r="5808" b="11779" baseLine="11736" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11606" r="2006" b="11741">ments.</wd>

<space/>

<wd l="2136" t="11582" r="2890" b="11741">Previous</wd>

<space/>

<wd l="2976" t="11582" r="3619" b="11770">studies,</wd>

<space/>

<wd l="3706" t="11587" r="4253" b="11741">Foster</wd>

<space/>

<wd l="4325" t="11606" r="4478" b="11741">et</wd>

<space/>

<wd l="4555" t="11582" r="4752" b="11741">al.</wd>

<space/>

<wd l="4848" t="11587" r="5410" b="11779">(2011)</wd>

<space/>

<wd l="5496" t="11582" r="5808" b="11741">and</wd>

<space/>

</ln>

<ln l="1440" t="11856" r="5803" b="12058" baseLine="12005" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11861" r="2002" b="12014">Petrov</wd>

<space/>

<wd l="2098" t="11856" r="2410" b="12014">and</wd>

<space/>

<wd l="2491" t="11856" r="3427" b="12014">McDonald</wd>

<space/>

<wd l="3518" t="11861" r="4080" b="12053">(2012)</wd>

<space/>

<wd l="4176" t="11856" r="4435" b="12014">for</wd>

<space/>

<wd l="4522" t="11856" r="5294" b="12058">example,</wd>

<space/>

<wd l="5400" t="11856" r="5803" b="12014">have</wd>

<space/>

</ln>

<ln l="1445" t="12125" r="5808" b="12326" baseLine="12278" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="12125" r="2203" b="12326">explored</wd>

<space/>

<wd l="2261" t="12125" r="2525" b="12283">the</wd>

<space/>

<wd l="2592" t="12125" r="3077" b="12283">effect</wd>

<space/>

<wd l="3134" t="12125" r="3466" b="12283">that</wd>

<space/>

<wd l="3523" t="12125" r="3787" b="12283">the</wd>

<space/>

<wd l="3854" t="12125" r="4258" b="12326">style</wd>

<space/>

<wd l="4325" t="12125" r="4512" b="12283">of</wd>

<space/>

<wd l="4560" t="12125" r="5347" b="12326">language</wd>

<space/>

<wd l="5405" t="12125" r="5808" b="12283">used</wd>

<space/>

</ln>

<ln l="1440" t="12398" r="5803" b="12600" baseLine="12547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12398" r="1613" b="12552">in</wd>

<space/>

<wd l="1675" t="12398" r="2957" b="12600">user-generated</wd>

<space/>

<wd l="3024" t="12422" r="3667" b="12557">content</wd>

<space/>

<wd l="3730" t="12398" r="4013" b="12557">has</wd>

<space/>

<wd l="4090" t="12451" r="4306" b="12557">on</wd>

<space/>

<wd l="4373" t="12398" r="4637" b="12557">the</wd>

<space/>

<wd l="4704" t="12398" r="5803" b="12600">performance</wd>

<space/>

</ln>

<ln l="1445" t="12667" r="5803" b="12869" baseLine="12816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="12667" r="1637" b="12826">of</wd>

<space/>

<wd l="1704" t="12667" r="2438" b="12826">standard</wd>

<space/>

<wd l="2510" t="12672" r="2923" b="12826">NLP</wd>

<space/>

<wd l="3000" t="12667" r="3466" b="12826">tools.</wd>

<space/>

<wd l="3610" t="12667" r="4104" b="12826">Other</wd>

<space/>

<wd l="4186" t="12667" r="4776" b="12826">studies</wd>

<space/>

<wd l="4858" t="12667" r="5074" b="12869">by</wd>

<space/>

<wd l="5155" t="12667" r="5803" b="12869">Gimpel</wd>

<space/>

</ln>

<ln l="1445" t="12941" r="5808" b="13142" baseLine="13090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="12965" r="1598" b="13099">et</wd>

<space/>

<wd l="1680" t="12941" r="1872" b="13099">al.</wd>

<space/>

<wd l="1973" t="12946" r="2587" b="13138">(2011),</wd>

<space/>

<wd l="2683" t="12941" r="3437" b="13142">Owoputi</wd>

<space/>

<wd l="3523" t="12965" r="3677" b="13099">et</wd>

<space/>

<wd l="3754" t="12941" r="3950" b="13099">al.</wd>

<space/>

<wd l="4046" t="12946" r="4666" b="13138">(2013),</wd>

<space/>

<wd l="4757" t="12946" r="5578" b="13099">Avontuur</wd>

<space/>

<wd l="5654" t="12965" r="5808" b="13099">et</wd>

<space/>

</ln>

<ln l="1445" t="13210" r="5794" b="13411" baseLine="13358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="13210" r="1642" b="13368">al.</wd>

<space/>

<wd l="1738" t="13214" r="2352" b="13406">(2012),</wd>

<space/>

<wd l="2443" t="13210" r="3173" b="13368">Rehbein</wd>

<space/>

<wd l="3254" t="13214" r="3816" b="13406">(2013)</wd>

<space/>

<wd l="3907" t="13210" r="4219" b="13368">and</wd>

<space/>

<wd l="4291" t="13210" r="5285" b="13411">Derczynski</wd>

<space/>

<wd l="5366" t="13234" r="5520" b="13368">et</wd>

<space/>

<wd l="5597" t="13210" r="5794" b="13368">al.</wd>

<space/>

</ln>

<ln l="1450" t="13478" r="5808" b="13680" baseLine="13632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="13483" r="2011" b="13675">(2013)</wd>

<space/>

<wd l="2088" t="13478" r="3398" b="13680">(POS-tagging),</wd>

<space/>

<wd l="3466" t="13478" r="3970" b="13637">Ritter</wd>

<space/>

<wd l="4027" t="13502" r="4181" b="13637">et</wd>

<space/>

<wd l="4243" t="13478" r="4440" b="13637">al.</wd>

<space/>

<wd l="4522" t="13483" r="5083" b="13675">(2011)</wd>

<space/>

<wd l="5160" t="13478" r="5808" b="13675">(named</wd>

<space/>

</ln>

<ln l="1445" t="13752" r="5808" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="13752" r="1934" b="13954">entity</wd>

<space/>

<wd l="1987" t="13752" r="3096" b="13954">recognition),</wd>

<space/>

<wd l="3168" t="13757" r="3634" b="13954">Kong</wd>

<space/>

<wd l="3696" t="13776" r="3850" b="13910">et</wd>

<space/>

<wd l="3902" t="13752" r="4099" b="13910">al.</wd>

<space/>

<wd l="4171" t="13757" r="4733" b="13949">(2014)</wd>

<space/>

<wd l="4800" t="13752" r="5112" b="13910">and</wd>

<space/>

<wd l="5170" t="13752" r="5808" b="13910">Seddah</wd>

<space/>

</ln>

<ln l="1445" t="14021" r="5798" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="14045" r="1598" b="14179">et</wd>

<space/>

<wd l="1666" t="14021" r="1862" b="14179">al.</wd>

<space/>

<wd l="1944" t="14026" r="2506" b="14218">(2012)</wd>

<space/>

<wd l="2587" t="14021" r="3355" b="14222">(parsing)</wd>

<space/>

<wd l="3427" t="14021" r="3830" b="14179">have</wd>

<space/>

<wd l="3902" t="14021" r="4459" b="14179">shown</wd>

<space/>

<wd l="4517" t="14021" r="4848" b="14179">that</wd>

<space/>

<wd l="4906" t="14026" r="5318" b="14179">NLP</wd>

<space/>

<wd l="5381" t="14021" r="5798" b="14179">tools</wd>

<space/>

</ln>

<ln l="1445" t="14294" r="5803" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="14294" r="1757" b="14453">and</wd>

<space/>

<wd l="1829" t="14347" r="2645" b="14453">resources</wd>

<space/>

<wd l="2722" t="14294" r="3134" b="14453">need</wd>

<space/>

<wd l="3206" t="14318" r="3374" b="14453">to</wd>

<space/>

<wd l="3446" t="14294" r="3653" b="14453">be</wd>

<space/>

<wd l="3730" t="14294" r="4406" b="14496">adapted</wd>

<space/>

<wd l="4474" t="14318" r="4642" b="14453">to</wd>

<space/>

<wd l="4723" t="14318" r="5146" b="14453">cater</wd>

<space/>

<wd l="5213" t="14294" r="5472" b="14453">for</wd>

<space/>

<wd l="5539" t="14294" r="5803" b="14453">the</wd>

<space/>

</ln>

<ln l="1440" t="14563" r="5054" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="14563" r="2246" b="14765">linguistic</wd>

<space/>

<wd l="2314" t="14563" r="3264" b="14722">differences</wd>

<space/>

<wd l="3326" t="14587" r="3955" b="14765">present</wd>

<space/>

<wd l="4008" t="14563" r="4181" b="14717">in</wd>

<space/>

<wd l="4243" t="14563" r="4637" b="14722">such</wd>

<space/>

<wd l="4690" t="14587" r="5054" b="14722">text.</wd>

</ln>

</para>

<para l="1445" t="14837" r="5808" b="15307" alignment="justified" fli="216" lsp="exactly" lspExact="266" language="en">

<ln l="1656" t="14837" r="5808" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="14837" r="2179" b="14995">When</wd>

<space/>

<wd l="2227" t="14837" r="3235" b="15038">considering</wd>

<space/>

<wd l="3288" t="14837" r="4267" b="14995">data-driven</wd>

<space/>

<wd l="4310" t="14842" r="4723" b="14995">NLP</wd>

<space/>

<wd l="4766" t="14837" r="5246" b="15024">tasks,</wd>

<space/>

<wd l="5309" t="14890" r="5405" b="14995">a</wd>

<space/>

<wd l="5443" t="14837" r="5808" b="14995">lack</wd>

<space/>

</ln>

<ln l="1445" t="15106" r="5794" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="15106" r="1637" b="15264">of</wd>

<space/>

<wd l="1738" t="15158" r="2554" b="15264">resources</wd>

<space/>

<wd l="2683" t="15158" r="2976" b="15264">can</wd>

<space/>

<wd l="3101" t="15106" r="3442" b="15264">also</wd>

<space/>

<wd l="3562" t="15106" r="4262" b="15307">produce</wd>

<space/>

<wd l="4387" t="15106" r="5251" b="15264">additional</wd>

<space/>

<wd l="5376" t="15106" r="5794" b="15264">chal-</wd>

</ln>

<ln l="0" t="0" r="0" b="0" baseLine="0" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<space/>

</ln>

</para>

</column>

<column l="6144" t="4092" r="10531" b="15318">

<para l="6144" t="4157" r="10517" b="5712" alignment="justified" spaceBefore="4" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="4157" r="10507" b="4358" baseLine="4306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4157" r="6744" b="4358">lenges.</wd>

<space/>

<wd l="6835" t="4162" r="7123" b="4315">We</wd>

<space/>

<wd l="7181" t="4157" r="7968" b="4315">therefore</wd>

<space/>

<wd l="8030" t="4157" r="8760" b="4315">examine</wd>

<space/>

<wd l="8822" t="4157" r="9086" b="4315">the</wd>

<space/>

<wd l="9144" t="4157" r="9739" b="4358">impact</wd>

<space/>

<wd l="9802" t="4157" r="9994" b="4315">of</wd>

<space/>

<wd l="10037" t="4157" r="10507" b="4358">noisy</wd>

<space/>

</ln>

<ln l="6144" t="4426" r="10517" b="4627" baseLine="4579" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4426" r="7426" b="4627">user-generated</wd>

<space/>

<wd l="7512" t="4450" r="7838" b="4584">text</wd>

<space/>

<wd l="7925" t="4478" r="8141" b="4584">on</wd>

<space/>

<wd l="8222" t="4426" r="8486" b="4584">the</wd>

<space/>

<wd l="8578" t="4426" r="9259" b="4627">existing</wd>

<space/>

<wd l="9346" t="4478" r="10162" b="4584">resources</wd>

<space/>

<wd l="10258" t="4426" r="10517" b="4584">for</wd>

<space/>

</ln>

<ln l="6144" t="4699" r="10512" b="4901" baseLine="4848" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4699" r="6590" b="4886">Irish,</wd>

<space/>

<wd l="6677" t="4752" r="6773" b="4858">a</wd>

<space/>

<wd l="6835" t="4699" r="8078" b="4858">low-resourced</wd>

<space/>

<wd l="8141" t="4699" r="8976" b="4901">language.</wd>

<space/>

<wd l="9091" t="4704" r="9374" b="4858">We</wd>

<space/>

<wd l="9446" t="4699" r="9792" b="4858">also</wd>

<space/>

<wd l="9864" t="4699" r="10512" b="4901">explore</wd>

<space/>

</ln>

<ln l="6149" t="4968" r="10507" b="5170" baseLine="5122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="4968" r="6782" b="5170">options</wd>

<space/>

<wd l="6864" t="4968" r="7123" b="5126">for</wd>

<space/>

<wd l="7195" t="4968" r="8102" b="5170">leveraging</wd>

<space/>

<wd l="8179" t="4968" r="8606" b="5126">from</wd>

<space/>

<wd l="8683" t="4968" r="9365" b="5170">existing</wd>

<space/>

<wd l="9442" t="5021" r="10258" b="5126">resources</wd>

<space/>

<wd l="10339" t="4992" r="10507" b="5126">to</wd>

<space/>

</ln>

<ln l="6144" t="5242" r="10517" b="5443" baseLine="5390" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5242" r="6850" b="5443">produce</wd>

<space/>

<wd l="6960" t="5294" r="7056" b="5400">a</wd>

<space/>

<wd l="7157" t="5294" r="7512" b="5400">new</wd>

<space/>

<wd l="7627" t="5242" r="9029" b="5443">domain-adapted</wd>

<space/>

<wd l="9134" t="5246" r="10157" b="5443">POS-tagger</wd>

<space/>

<wd l="10258" t="5242" r="10517" b="5400">for</wd>

<space/>

</ln>

<ln l="6144" t="5510" r="10435" b="5712" baseLine="5664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5510" r="7075" b="5712">processing</wd>

<space/>

<wd l="7133" t="5510" r="7536" b="5669">Irish</wd>

<space/>

<wd l="7589" t="5510" r="8218" b="5669">Twitter</wd>

<space/>

<wd l="8270" t="5510" r="8674" b="5669">data.</wd>

<space/>

<wd l="8755" t="5515" r="9038" b="5669">We</wd>

<space/>

<wd l="9096" t="5510" r="9749" b="5669">achieve</wd>

<space/>

<wd l="9806" t="5510" r="10114" b="5669">this</wd>

<space/>

<wd l="10176" t="5510" r="10435" b="5712">by:</wd>

</ln>

</para>

<para l="6384" t="5942" r="10248" b="6149" alignment="left" li="432" spaceBefore="161" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="5947" r="10248" b="6149" baseLine="6096" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6384" t="5947" r="6586" b="6096">•</wd>

<tab position="6467"/>

<wd l="6586" t="5947" r="7296" b="6149">defining</wd>

<space/>

<wd l="7358" t="6000" r="7454" b="6106">a</wd>

<space/>

<wd l="7502" t="6000" r="7858" b="6106">new</wd>

<space/>

<wd l="7915" t="5952" r="8304" b="6106">POS</wd>

<space/>

<wd l="8371" t="5971" r="8880" b="6149">tagset</wd>

<space/>

<wd l="8933" t="5947" r="9192" b="6106">for</wd>

<space/>

<wd l="9245" t="5947" r="9643" b="6106">Irish</wd>

<space/>

<wd l="9696" t="5971" r="10248" b="6106">tweets</wd>

</ln>

</para>

<para l="6384" t="6389" r="10512" b="6864" alignment="justified" li="432" spaceBefore="173" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="6394" r="10512" b="6595" baseLine="6542" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="6446" r="6581" b="6542">•</wd>

<tab position="6438"/>

<wd l="6581" t="6394" r="7426" b="6595">providing</wd>

<space/>

<wd l="7483" t="6446" r="7579" b="6552">a</wd>

<space/>

<wd l="7627" t="6394" r="8390" b="6595">mapping</wd>

<space/>

<wd l="8443" t="6394" r="8870" b="6552">from</wd>

<space/>

<wd l="8918" t="6394" r="9187" b="6552">the</wd>

<space/>

<wd l="9240" t="6398" r="10061" b="6552">PAROLE</wd>

<space/>

<wd l="10109" t="6394" r="10512" b="6552">Irish</wd>

<space/>

</ln>

<ln l="6581" t="6662" r="8938" b="6864" baseLine="6811" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="6667" r="7565" b="6864">POS-tagset</wd>

<space/>

<wd l="7618" t="6686" r="7786" b="6821">to</wd>

<space/>

<wd l="7843" t="6662" r="8150" b="6821">this</wd>

<space/>

<wd l="8213" t="6715" r="8568" b="6821">new</wd>

<space/>

<wd l="8630" t="6715" r="8938" b="6821">one</wd>

</ln>

</para>

<para l="6384" t="7109" r="10512" b="7536" alignment="justified" li="432" spaceBefore="173" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="7109" r="10512" b="7310" baseLine="7258">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6384" t="7162" r="6581" b="7258">•</wd>

<tab position="6438"/>

<wd l="6581" t="7109" r="7392" b="7310">manually</wd>

<space/>

<wd l="7483" t="7109" r="8395" b="7310">annotating</wd>

<space/>

<wd l="8486" t="7162" r="8582" b="7267">a</wd>

<space/>

<wd l="8669" t="7162" r="9235" b="7310">corpus</wd>

<space/>

<wd l="9331" t="7109" r="9523" b="7267">of</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="9610" t="7114" r="10027" b="7267">1537</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10109" t="7109" r="10512" b="7267">Irish</wd>

<space/>

</run>

</ln>

<ln l="6581" t="7387" r="7133" b="7536" baseLine="7526" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6581" t="7402" r="7133" b="7536">tweets</wd>

</ln>

</para>

<para l="6384" t="7824" r="10517" b="8294" alignment="justified" li="432" spaceBefore="174" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="6384" t="7824" r="10517" b="8026" baseLine="7973" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6384" t="7848" r="6581" b="7973">•</wd>

<tab position="6454"/>

<wd l="6581" t="7824" r="7258" b="8026">training</wd>

<space/>

<wd l="7344" t="7824" r="7776" b="7982">three</wd>

<space/>

<wd l="7867" t="7824" r="8678" b="7982">statistical</wd>

<space/>

<wd l="8765" t="7848" r="9389" b="8026">taggers</wd>

<space/>

<wd l="9480" t="7877" r="9696" b="7982">on</wd>

<space/>

<wd l="9782" t="7877" r="10070" b="7982">our</wd>

<space/>

<wd l="10152" t="7824" r="10517" b="7982">data</wd>

<space/>

</ln>

<ln l="6586" t="8093" r="8366" b="8294" baseLine="8242" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6586" t="8093" r="6898" b="8251">and</wd>

<space/>

<wd l="6950" t="8093" r="7747" b="8294">reporting</wd>

<space/>

<wd l="7805" t="8093" r="8366" b="8251">results</wd>

</ln>

</para>

<para l="6144" t="8530" r="10512" b="10896" alignment="justified" spaceBefore="167" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="8530" r="10507" b="8731" baseLine="8678" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="8530" r="6744" b="8688">This</wd>

<space/>

<wd l="6859" t="8582" r="7349" b="8731">paper</wd>

<space/>

<wd l="7454" t="8530" r="7589" b="8688">is</wd>

<space/>

<wd l="7714" t="8530" r="8357" b="8688">divided</wd>

<space/>

<wd l="8467" t="8582" r="8640" b="8688">as</wd>

<space/>

<wd l="8755" t="8530" r="9446" b="8688">follows:</wd>

<space/>

<wd l="9643" t="8530" r="10296" b="8688">Section</wd>

<space/>

<wd l="10406" t="8534" r="10507" b="8683">2</wd>

<space/>

</ln>

<ln l="6149" t="8798" r="10507" b="9000" baseLine="8947" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="8798" r="6590" b="9000">gives</wd>

<space/>

<wd l="6701" t="8851" r="6797" b="8957">a</wd>

<space/>

<wd l="6902" t="8851" r="7699" b="9000">summary</wd>

<space/>

<wd l="7810" t="8798" r="8002" b="8957">of</wd>

<space/>

<wd l="8083" t="8798" r="8717" b="8957">Twitter</wd>

<space/>

<wd l="8813" t="8798" r="9125" b="8957">and</wd>

<space/>

<wd l="9226" t="8798" r="9739" b="8957">issues</wd>

<space/>

<wd l="9854" t="8798" r="10507" b="9000">specific</wd>

<space/>

</ln>

<ln l="6144" t="9072" r="10512" b="9230" baseLine="9221" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9096" r="6312" b="9230">to</wd>

<space/>

<wd l="6389" t="9072" r="6653" b="9230">the</wd>

<space/>

<wd l="6730" t="9072" r="7133" b="9230">Irish</wd>

<space/>

<wd l="7205" t="9072" r="7834" b="9230">Twitter</wd>

<space/>

<wd l="7906" t="9072" r="8309" b="9230">data.</wd>

<space/>

<wd l="8453" t="9072" r="9101" b="9230">Section</wd>

<space/>

<wd l="9182" t="9077" r="9274" b="9230">3</wd>

<space/>

<wd l="9365" t="9072" r="10162" b="9230">discusses</wd>

<space/>

<wd l="10243" t="9072" r="10512" b="9230">the</wd>

<space/>

</ln>

<ln l="6144" t="9341" r="10498" b="9542" baseLine="9490" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9394" r="6499" b="9499">new</wd>

<space/>

<wd l="6566" t="9341" r="7829" b="9542">part-of-speech</wd>

<space/>

<wd l="7896" t="9341" r="8477" b="9542">tagged</wd>

<space/>

<wd l="8544" t="9394" r="9115" b="9542">corpus</wd>

<space/>

<wd l="9192" t="9341" r="9384" b="9499">of</wd>

<space/>

<wd l="9432" t="9341" r="9835" b="9499">Irish</wd>

<space/>

<wd l="9898" t="9365" r="10498" b="9499">tweets.</wd>

<space/>

</ln>

<ln l="6149" t="9610" r="10512" b="9811" baseLine="9763" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="9610" r="6802" b="9768">Section</wd>

<space/>

<wd l="6859" t="9614" r="6965" b="9763">4</wd>

<space/>

<wd l="7032" t="9610" r="7834" b="9768">discusses</wd>

<space/>

<wd l="7906" t="9662" r="8194" b="9768">our</wd>

<space/>

<wd l="8251" t="9610" r="9547" b="9768">inter-annotator</wd>

<space/>

<wd l="9605" t="9634" r="10512" b="9811">agreement</wd>

<space/>

</ln>

<ln l="6154" t="9883" r="10502" b="10085" baseLine="10032" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="9883" r="6614" b="10085">study</wd>

<space/>

<wd l="6696" t="9883" r="7008" b="10042">and</wd>

<space/>

<wd l="7080" t="9883" r="7344" b="10042">the</wd>

<space/>

<wd l="7421" t="9883" r="8506" b="10042">observations</wd>

<space/>

<wd l="8587" t="9936" r="8842" b="10042">we</wd>

<space/>

<wd l="8914" t="9907" r="9288" b="10042">note</wd>

<space/>

<wd l="9360" t="9883" r="9787" b="10042">from</wd>

<space/>

<wd l="9859" t="9907" r="10502" b="10042">annota-</wd>

</ln>

<ln l="6144" t="10152" r="10507" b="10354" baseLine="10306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10176" r="6394" b="10310">tor</wd>

<space/>

<wd l="6466" t="10152" r="7757" b="10354">disagreements.</wd>

<space/>

<wd l="7901" t="10152" r="8554" b="10310">Section</wd>

<space/>

<wd l="8630" t="10152" r="8722" b="10310">5</wd>

<space/>

<wd l="8808" t="10181" r="9408" b="10354">reports</wd>

<space/>

<wd l="9494" t="10205" r="9787" b="10310">our</wd>

<space/>

<wd l="9854" t="10152" r="10507" b="10354">tagging</wd>

<space/>

</ln>

<ln l="6149" t="10426" r="10507" b="10627" baseLine="10574" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="10478" r="6912" b="10627">accuracy</wd>

<space/>

<wd l="6970" t="10426" r="7531" b="10584">results</wd>

<space/>

<wd l="7594" t="10478" r="7805" b="10584">on</wd>

<space/>

<wd l="7853" t="10426" r="8290" b="10584">three</wd>

<space/>

<wd l="8352" t="10426" r="9638" b="10584">state-of-the-art</wd>

<space/>

<wd l="9696" t="10426" r="10507" b="10584">statistical</wd>

<space/>

</ln>

<ln l="6144" t="10704" r="6821" b="10896" baseLine="10848" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10718" r="6821" b="10896">taggers.</wd>

</ln>

</para>

<para l="6144" t="11155" r="7747" b="11328" alignment="left" spaceBefore="201" lsp="exactly" lspExact="273" language="en">

<ln l="6144" t="11155" r="7747" b="11328" baseLine="11318" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">

<wd l="6144" t="11155" r="6259" b="11323">2</wd>

<space/>

<wd l="6509" t="11155" r="6994" b="11328">Irish</wd>

<space/>

<wd l="7061" t="11160" r="7747" b="11328">Tweets</wd>

</ln>

</para>

<para l="6144" t="11582" r="10526" b="15307" alignment="justified" spaceBefore="144" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="11582" r="10498" b="11784" baseLine="11736" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="11582" r="6590" b="11770">Irish,</wd>

<space/>

<wd l="6653" t="11582" r="6922" b="11741">the</wd>

<space/>

<wd l="6979" t="11582" r="7584" b="11741">official</wd>

<space/>

<wd l="7642" t="11582" r="7954" b="11741">and</wd>

<space/>

<wd l="8006" t="11582" r="8707" b="11741">national</wd>

<space/>

<wd l="8765" t="11582" r="9552" b="11784">language</wd>

<space/>

<wd l="9610" t="11582" r="9802" b="11741">of</wd>

<space/>

<wd l="9840" t="11582" r="10498" b="11770">Ireland,</wd>

<space/>

</ln>

<ln l="6144" t="11856" r="10502" b="12058" baseLine="12005" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="11856" r="6283" b="12014">is</wd>

<space/>

<wd l="6365" t="11909" r="6461" b="12014">a</wd>

<space/>

<wd l="6533" t="11856" r="7277" b="12058">minority</wd>

<space/>

<wd l="7354" t="11856" r="8184" b="12058">language.</wd>

<space/>

<wd l="8314" t="11856" r="8846" b="12014">While</wd>

<space/>

<wd l="8918" t="11856" r="9038" b="12014">it</wd>

<space/>

<wd l="9110" t="11856" r="9250" b="12014">is</wd>

<space/>

<wd l="9331" t="11909" r="9427" b="12014">a</wd>

<space/>

<wd l="9504" t="11856" r="10104" b="12014">second</wd>

<space/>

<wd l="10171" t="11856" r="10502" b="12014">lan-</wd>

</ln>

<ln l="6149" t="12125" r="10526" b="12326" baseLine="12278" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="12178" r="6667" b="12326">guage</wd>

<space/>

<wd l="6734" t="12125" r="6994" b="12283">for</wd>

<space/>

<wd l="7056" t="12149" r="7478" b="12283">most</wd>

<space/>

<wd l="7555" t="12125" r="8338" b="12326">speakers,</wd>

<space/>

<wd l="8424" t="12125" r="9206" b="12326">everyday</wd>

<space/>

<wd l="9274" t="12178" r="9566" b="12283">use</wd>

<space/>

<wd l="9638" t="12125" r="10262" b="12283">outside</wd>

<space/>

<wd l="10334" t="12125" r="10526" b="12283">of</wd>

<space/>

</ln>

<ln l="6149" t="12398" r="10502" b="12557" baseLine="12547" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="12398" r="6965" b="12557">academic</wd>

<space/>

<wd l="7066" t="12398" r="8232" b="12557">environments</wd>

<space/>

<wd l="8333" t="12398" r="8616" b="12557">has</wd>

<space/>

<wd l="8722" t="12451" r="9101" b="12557">seen</wd>

<space/>

<wd l="9197" t="12451" r="9293" b="12557">a</wd>

<space/>

<wd l="9384" t="12422" r="9917" b="12557">recent</wd>

<space/>

<wd l="10008" t="12451" r="10502" b="12557">resur-</wd>

</ln>

<ln l="6149" t="12667" r="10512" b="12869" baseLine="12816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="12720" r="6653" b="12869">gence</wd>

<space/>

<wd l="6710" t="12667" r="6878" b="12821">in</wd>

<space/>

<wd l="6941" t="12667" r="7440" b="12826">social</wd>

<space/>

<wd l="7498" t="12667" r="8035" b="12826">media</wd>

<space/>

<wd l="8083" t="12667" r="8914" b="12869">platforms</wd>

<space/>

<wd l="8986" t="12667" r="9374" b="12826">such</wd>

<space/>

<wd l="9437" t="12720" r="9605" b="12826">as</wd>

<space/>

<wd l="9667" t="12667" r="10512" b="12826">Facebook</wd>

<space/>

</ln>

<ln l="6149" t="12941" r="10512" b="13142" baseLine="13090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="12941" r="6461" b="13099">and</wd>

<space/>

<wd l="6523" t="12941" r="7181" b="13099">Twitter.</wd>

<space/>

<wd l="7282" t="12941" r="7910" b="13099">Twitter</wd>

<space/>

<wd l="7973" t="12941" r="8107" b="13099">is</wd>

<space/>

<wd l="8184" t="12994" r="8280" b="13099">a</wd>

<space/>

<wd l="8338" t="12941" r="9691" b="13142">micro-blogging</wd>

<space/>

<wd l="9758" t="12941" r="10512" b="13142">platform</wd>

<space/>

</ln>

<ln l="6144" t="13210" r="10507" b="13406" baseLine="13358">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6144" t="13210" r="6682" b="13368">which</wd>

<space/>

<wd l="6778" t="13210" r="7330" b="13368">allows</wd>

<space/>

<wd l="7430" t="13262" r="7872" b="13368">users</wd>

<space/>

</run>

<wd l="7982" t="13214" r="8832" b="13406"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">(</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">tweeters</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="8933" t="13234" r="9101" b="13368">to</wd>

<space/>

<wd l="9202" t="13234" r="9720" b="13368">create</wd>

<space/>

<wd l="9816" t="13262" r="9912" b="13368">a</wd>

<space/>

<wd l="10013" t="13210" r="10507" b="13368">social</wd>

<space/>

</run>

</ln>

<ln l="6144" t="13478" r="10502" b="13680" baseLine="13632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="13478" r="6859" b="13637">network</wd>

<space/>

<wd l="6922" t="13478" r="7598" b="13680">through</wd>

<space/>

<wd l="7670" t="13478" r="8299" b="13680">sharing</wd>

<space/>

<wd l="8366" t="13531" r="8549" b="13637">or</wd>

<space/>

<wd l="8611" t="13478" r="9696" b="13680">commenting</wd>

<space/>

<wd l="9763" t="13531" r="9979" b="13637">on</wd>

<space/>

<wd l="10037" t="13478" r="10502" b="13637">items</wd>

<space/>

</ln>

<ln l="6149" t="13752" r="10502" b="13954" baseLine="13901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="13752" r="6341" b="13910">of</wd>

<space/>

<wd l="6418" t="13752" r="6917" b="13910">social</wd>

<space/>

<wd l="7003" t="13752" r="7646" b="13910">interest</wd>

<space/>

<wd l="7738" t="13752" r="8126" b="13910">such</wd>

<space/>

<wd l="8213" t="13805" r="8381" b="13910">as</wd>

<space/>

<wd l="8472" t="13752" r="8966" b="13939">ideas,</wd>

<space/>

<wd l="9072" t="13752" r="9859" b="13954">opinions,</wd>

<space/>

<wd l="9965" t="13776" r="10502" b="13910">events</wd>

<space/>

</ln>

<ln l="6149" t="14021" r="10512" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="14021" r="6461" b="14179">and</wd>

<space/>

<wd l="6504" t="14074" r="6989" b="14179">news.</wd>

<space/>

<wd l="7066" t="14026" r="7838" b="14179">Tweeters</wd>

<space/>

<wd l="7896" t="14074" r="8189" b="14179">can</wd>

<space/>

<wd l="8237" t="14045" r="8602" b="14222">post</wd>

<space/>

<wd l="8654" t="14021" r="9082" b="14179">short</wd>

<space/>

<wd l="9125" t="14074" r="9941" b="14222">messages</wd>

<space/>

<wd l="9994" t="14021" r="10512" b="14179">called</wd>

<space/>

</ln>

<ln l="6149" t="14294" r="10507" b="14496" baseLine="14443">

<wd l="6149" t="14328" r="6734" b="14482"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">tweets</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="6816" t="14294" r="7008" b="14453">of</wd>

<space/>

<wd l="7056" t="14347" r="7272" b="14496">up</wd>

<space/>

<wd l="7339" t="14318" r="7507" b="14453">to</wd>

<space/>

<wd l="7598" t="14299" r="7901" b="14453">140</wd>

<space/>

<wd l="7973" t="14294" r="8842" b="14453">characters</wd>

<space/>

<wd l="8914" t="14294" r="9086" b="14448">in</wd>

<space/>

<wd l="9149" t="14294" r="9739" b="14496">length,</wd>

<space/>

<wd l="9816" t="14294" r="10147" b="14453">that</wd>

<space/>

<wd l="10214" t="14347" r="10507" b="14453">can</wd>

<space/>

</run>

</ln>

<ln l="6144" t="14563" r="10502" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="14563" r="6907" b="14765">typically</wd>

<space/>

<wd l="7003" t="14563" r="7210" b="14722">be</wd>

<space/>

<wd l="7310" t="14616" r="7690" b="14722">seen</wd>

<space/>

<wd l="7781" t="14563" r="7997" b="14765">by</wd>

<space/>

<wd l="8093" t="14563" r="8362" b="14722">the</wd>

<space/>

<wd l="8458" t="14563" r="9091" b="14765">general</wd>

<space/>

<wd l="9192" t="14563" r="9778" b="14765">public,</wd>

<space/>

<wd l="9893" t="14563" r="10502" b="14722">includ-</wd>

</ln>

<ln l="6144" t="14837" r="10512" b="15038" baseLine="14986">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6144" t="14837" r="6422" b="15038">ing</wd>

<space/>

<wd l="6494" t="14837" r="6758" b="14995">the</wd>

<space/>

<wd l="6826" t="14842" r="7330" b="14995">user’s</wd>

<space/>

</run>

<wd l="7368" t="14837" r="8256" b="15038"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">followers</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="8376" t="14842" r="8981" b="14995">Tweets</wd>

<space/>

<wd l="9058" t="14890" r="9355" b="14995">can</wd>

<space/>

<wd l="9427" t="14837" r="9629" b="14995">be</wd>

<space/>

<wd l="9706" t="14837" r="10512" b="14995">classified</wd>

<space/>

</run>

</ln>

<ln l="6144" t="15106" r="10502" b="15307" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6144" t="15106" r="6360" b="15307">by</wd>

<space/>

<wd l="6432" t="15106" r="6864" b="15307">topic</wd>

<space/>

<wd l="6936" t="15106" r="7152" b="15307">by</wd>

<space/>

<wd l="7224" t="15106" r="7694" b="15307">using</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="7766" t="15106" r="8539" b="15307">hashtags</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="8621" t="15110" r="8986" b="15307">(e.g.</wd>

<space/>

<wd l="9110" t="15110" r="10502" b="15307">#categoryname)</wd>

</run>

</ln>

</para>

</column>

</section>

<section l="1433" t="15318" r="10531" b="16480">

<column l="1433" t="15318" r="10531" b="16480">

<para l="5881" t="15792" r="6076" b="15941" alignment="centered" spaceBefore="405" lsp="exactly" lspExact="271" language="en">

<ln l="5947" t="15792" r="6010" b="15941" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="5947" t="15792" r="6010" b="15941">1</wd>

</ln>

</para>

<para l="3005" t="16133" r="8894" b="16469" alignment="centered" spaceBefore="138" lsp="exactly" lspExact="170" language="en">

<ln l="3005" t="16133" r="8894" b="16301" baseLine="16253" forcedEOF="true">

<run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3005" t="16133" r="3893" b="16296">Proceedings</wd>

<space/>

<wd l="3946" t="16133" r="4104" b="16296">of</wd>

<space/>

<wd l="4128" t="16133" r="4339" b="16262">the</wd>

<space/>

<wd l="4378" t="16138" r="4714" b="16262">ACL</wd>

<space/>

<wd l="4757" t="16133" r="5117" b="16262">2015</wd>

<space/>

<wd l="5170" t="16133" r="5866" b="16296">Workshop</wd>

<space/>

<wd l="5918" t="16176" r="6091" b="16262">on</wd>

<space/>

<wd l="6134" t="16138" r="6542" b="16296">Noisy</wd>

<space/>

<wd l="6605" t="16133" r="7714" b="16296">User-generated</wd>

<space/>

</run>

<wd l="7762" t="16138" r="8083" b="16286"><run italic="true" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Text</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8131" t="16171" r="8534" b="16301">pages</wd>

<space/>

<wd l="8606" t="16133" r="8894" b="16286">1–8,
</wd>

</run>

</ln>

<ln l="3029" t="16296" r="8870" b="16469" baseLine="16425" forcedEOF="true">

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3029" t="16301" r="3595" b="16469">Beijing,</wd>

<space/>

<wd l="3653" t="16301" r="4114" b="16454">China,</wd>

<space/>

<wd l="4166" t="16301" r="4459" b="16469">July</wd>

<space/>

<wd l="4512" t="16301" r="4723" b="16454">31,</wd>

<space/>

<wd l="4781" t="16301" r="5170" b="16430">2015.</wd>

<space/>

</run>

<wd l="5246" t="16296" r="5770" b="16469"><run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">c</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">�</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2015</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5822" t="16301" r="6672" b="16430">Association</wd>

<space/>

<wd l="6715" t="16301" r="6926" b="16430">for</wd>

<space/>

<wd l="6974" t="16301" r="8035" b="16469">Computational</wd>

<space/>

<wd l="8078" t="16301" r="8870" b="16469">Linguistics</wd>

</run>

</ln>

</para>

</column>

</section>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4301.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1432" marginTop="1227" marginRight="1379" marginBottom="1302" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1432" t="1227" r="10530" b="15324">

<column l="1432" t="1227" r="5819" b="15324">

<para l="1440" t="1320" r="5794" b="1795" alignment="justified" spaceBefore="31" lsp="exactly" lspExact="271" language="en">

<ln l="1445" t="1320" r="5794" b="1522" baseLine="1474">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="1320" r="1757" b="1478">and</wd>

<space/>

<wd l="1810" t="1320" r="2357" b="1478">linked</wd>

<space/>

<wd l="2410" t="1344" r="2578" b="1478">to</wd>

<space/>

<wd l="2640" t="1320" r="3086" b="1478">other</wd>

<space/>

<wd l="3139" t="1344" r="3859" b="1478">tweeters</wd>

<space/>

<wd l="3922" t="1320" r="4603" b="1522">through</wd>

<space/>

<wd l="4656" t="1320" r="4925" b="1478">the</wd>

<space/>

<wd l="4978" t="1373" r="5270" b="1478">use</wd>

<space/>

<wd l="5328" t="1320" r="5520" b="1478">of</wd>

<space/>

</run>

<wd l="5563" t="1354" r="5794" b="1478" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">at-</wd>

</ln>

<ln l="1440" t="1598" r="3893" b="1795" baseLine="1742">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="1603" r="2222" b="1752">mentions</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2294" t="1598" r="2659" b="1795">(e.g.</wd>

<space/>

<wd l="2760" t="1598" r="3893" b="1790">@username).</wd>

</run>

</ln>

</para>

<para l="1440" t="1867" r="5808" b="2837" alignment="justified" spaceBefore="1" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="1867" r="5808" b="2069" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="1867" r="1997" b="2026">The</wd>

<space/>

<wd l="2064" t="1867" r="2400" b="2026">first</wd>

<space/>

<wd l="2458" t="1891" r="3010" b="2026">tweets</wd>

<space/>

<wd l="3077" t="1867" r="3250" b="2021">in</wd>

<space/>

<wd l="3307" t="1867" r="3710" b="2026">Irish</wd>

<space/>

<wd l="3773" t="1867" r="4555" b="2069">appeared</wd>

<space/>

<wd l="4618" t="1891" r="4896" b="2026">not</wd>

<space/>

<wd l="4958" t="1867" r="5342" b="2069">long</wd>

<space/>

<wd l="5410" t="1867" r="5808" b="2026">after</wd>

<space/>

</ln>

<ln l="1440" t="2136" r="5808" b="2323" baseLine="2290" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2136" r="1704" b="2294">the</wd>

<space/>

<wd l="1762" t="2136" r="2342" b="2294">launch</wd>

<space/>

<wd l="2400" t="2136" r="2592" b="2294">of</wd>

<space/>

<wd l="2630" t="2136" r="3259" b="2294">Twitter</wd>

<space/>

<wd l="3307" t="2136" r="3480" b="2290">in</wd>

<space/>

<wd l="3538" t="2136" r="4013" b="2323">2006,</wd>

<space/>

<wd l="4080" t="2136" r="4392" b="2294">and</wd>

<space/>

<wd l="4445" t="2136" r="4882" b="2294">there</wd>

<space/>

<wd l="4934" t="2136" r="5338" b="2294">have</wd>

<space/>

<wd l="5395" t="2136" r="5808" b="2294">been</wd>

<space/>

</ln>

<ln l="1440" t="2410" r="5803" b="2611" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2462" r="1886" b="2568">more</wd>

<space/>

<wd l="1954" t="2410" r="2333" b="2568">than</wd>

<space/>

<wd l="2400" t="2462" r="2496" b="2568">a</wd>

<space/>

<wd l="2558" t="2410" r="3187" b="2568">million</wd>

<space/>

<wd l="3254" t="2434" r="3802" b="2568">tweets</wd>

<space/>

<wd l="3874" t="2410" r="4046" b="2563">in</wd>

<space/>

<wd l="4109" t="2410" r="4512" b="2568">Irish</wd>

<space/>

<wd l="4584" t="2410" r="5021" b="2568">since</wd>

<space/>

<wd l="5088" t="2410" r="5510" b="2597">then,</wd>

<space/>

<wd l="5587" t="2410" r="5803" b="2611">by</wd>

<space/>

</ln>

<ln l="1445" t="2645" r="4210" b="2837" baseLine="2829">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="2731" r="1824" b="2837">over</wd>

<space/>

<wd l="1886" t="2683" r="2309" b="2837">8000</wd>

<space/>

<wd l="2366" t="2702" r="3086" b="2837">tweeters</wd>

<space/>

</run>

<wd l="3149" t="2645" r="4210" b="2837"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">worldwide</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="2952" r="5808" b="5050" alignment="justified" spaceBefore="6" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="2952" r="5803" b="3110" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="2952" r="1997" b="3110">The</wd>

<space/>

<wd l="2064" t="2952" r="2558" b="3110">social</wd>

<space/>

<wd l="2616" t="2976" r="3163" b="3110">nature</wd>

<space/>

<wd l="3221" t="2952" r="3413" b="3110">of</wd>

<space/>

<wd l="3456" t="2976" r="4003" b="3110">tweets</wd>

<space/>

<wd l="4075" t="3005" r="4368" b="3110">can</wd>

<space/>

<wd l="4426" t="2952" r="4915" b="3110">result</wd>

<space/>

<wd l="4968" t="2952" r="5136" b="3106">in</wd>

<space/>

<wd l="5194" t="2952" r="5458" b="3110">the</wd>

<space/>

<wd l="5515" t="3005" r="5803" b="3110">use</wd>

<space/>

</ln>

<ln l="1445" t="3226" r="5803" b="3427" baseLine="3374" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="3226" r="1637" b="3384">of</wd>

<space/>

<wd l="1714" t="3226" r="2462" b="3384">informal</wd>

<space/>

<wd l="2558" t="3250" r="2928" b="3413">text,</wd>

<space/>

<wd l="3038" t="3226" r="4133" b="3384">unstructured</wd>

<space/>

<wd l="4229" t="3278" r="4406" b="3384">or</wd>

<space/>

<wd l="4498" t="3226" r="5803" b="3427">ungrammatical</wd>

<space/>

</ln>

<ln l="1440" t="3494" r="5803" b="3696" baseLine="3643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="3494" r="2136" b="3696">phrases,</wd>

<space/>

<wd l="2203" t="3494" r="2515" b="3653">and</wd>

<space/>

<wd l="2568" t="3547" r="2664" b="3653">a</wd>

<space/>

<wd l="2707" t="3494" r="3307" b="3696">variety</wd>

<space/>

<wd l="3365" t="3494" r="3552" b="3653">of</wd>

<space/>

<wd l="3590" t="3494" r="4786" b="3696">typographical</wd>

<space/>

<wd l="4843" t="3547" r="5390" b="3653">errors.</wd>

<space/>

<wd l="5467" t="3494" r="5803" b="3653">The</wd>

<space/>

</ln>

<ln l="1464" t="3763" r="5794" b="3922" baseLine="3917" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1464" t="3768" r="1762" b="3922">140</wd>

<space/>

<wd l="1838" t="3763" r="2640" b="3922">character</wd>

<space/>

<wd l="2702" t="3763" r="3115" b="3922">limit</wd>

<space/>

<wd l="3187" t="3816" r="3480" b="3922">can</wd>

<space/>

<wd l="3557" t="3763" r="3898" b="3922">also</wd>

<space/>

<wd l="3970" t="3763" r="4334" b="3922">lead</wd>

<space/>

<wd l="4397" t="3787" r="4565" b="3922">to</wd>

<space/>

<wd l="4642" t="3763" r="5448" b="3922">truncated</wd>

<space/>

<wd l="5515" t="3816" r="5794" b="3922">un-</wd>

</ln>

<ln l="1445" t="4037" r="5808" b="4238" baseLine="4186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="4037" r="2530" b="4238">grammatical</wd>

<space/>

<wd l="2621" t="4061" r="3490" b="4224">sentences,</wd>

<space/>

<wd l="3590" t="4037" r="4493" b="4195">innovative</wd>

<space/>

<wd l="4584" t="4037" r="5390" b="4238">spellings,</wd>

<space/>

<wd l="5496" t="4037" r="5808" b="4195">and</wd>

<space/>

</ln>

<ln l="1440" t="4306" r="5808" b="4507" baseLine="4459" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="4306" r="1886" b="4464">word</wd>

<space/>

<wd l="1958" t="4306" r="2362" b="4507">play,</wd>

<space/>

<wd l="2462" t="4306" r="2851" b="4464">such</wd>

<space/>

<wd l="2928" t="4358" r="3096" b="4464">as</wd>

<space/>

<wd l="3178" t="4306" r="3638" b="4464">those</wd>

<space/>

<wd l="3715" t="4306" r="4546" b="4464">discussed</wd>

<space/>

<wd l="4618" t="4306" r="4834" b="4507">by</wd>

<space/>

<wd l="4910" t="4306" r="5808" b="4464">Eisenstein</wd>

<space/>

</ln>

<ln l="1450" t="4579" r="5794" b="4781" baseLine="4728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1450" t="4584" r="2011" b="4776">(2013)</wd>

<space/>

<wd l="2098" t="4579" r="2357" b="4738">for</wd>

<space/>

<wd l="2424" t="4579" r="3134" b="4781">English.</wd>

<space/>

<wd l="3278" t="4584" r="3754" b="4738">From</wd>

<space/>

<wd l="3830" t="4632" r="4118" b="4738">our</wd>

<space/>

<wd l="4195" t="4579" r="4934" b="4781">analysis,</wd>

<space/>

<wd l="5026" t="4579" r="5333" b="4738">this</wd>

<space/>

<wd l="5419" t="4579" r="5794" b="4781">phe-</wd>

</ln>

<ln l="1440" t="4848" r="5568" b="5050" baseLine="5002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="4901" r="2251" b="5006">nomenon</wd>

<space/>

<wd l="2314" t="4901" r="2966" b="5050">appears</wd>

<space/>

<wd l="3029" t="4872" r="3192" b="5006">to</wd>

<space/>

<wd l="3254" t="4848" r="3830" b="5006">extend</wd>

<space/>

<wd l="3888" t="4848" r="4234" b="5006">also</wd>

<space/>

<wd l="4291" t="4872" r="4459" b="5006">to</wd>

<space/>

<wd l="4517" t="4848" r="4915" b="5006">Irish</wd>

<space/>

<wd l="4968" t="4872" r="5568" b="5006">tweets.</wd>

</ln>

</para>

<para l="1440" t="5122" r="5808" b="5597" alignment="justified" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="5122" r="5808" b="5323" baseLine="5275" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="5126" r="1843" b="5275">In</wd>

<space/>

<wd l="1906" t="5122" r="2472" b="5323">Figure</wd>

<space/>

<wd l="2563" t="5126" r="2693" b="5309">1,</wd>

<space/>

<wd l="2770" t="5174" r="3024" b="5280">we</wd>

<space/>

<wd l="3091" t="5122" r="3754" b="5323">provide</wd>

<space/>

<wd l="3821" t="5174" r="4018" b="5280">an</wd>

<space/>

<wd l="4094" t="5122" r="4824" b="5323">example</wd>

<space/>

<wd l="4891" t="5122" r="5083" b="5280">of</wd>

<space/>

<wd l="5141" t="5174" r="5338" b="5280">an</wd>

<space/>

<wd l="5405" t="5122" r="5808" b="5280">Irish</wd>

<space/>

</ln>

<ln l="1440" t="5395" r="5789" b="5597" baseLine="5544" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="5419" r="1915" b="5554">tweet</wd>

<space/>

<wd l="1963" t="5395" r="2294" b="5554">that</wd>

<space/>

<wd l="2347" t="5395" r="3062" b="5554">contains</wd>

<space/>

<wd l="3130" t="5448" r="3581" b="5554">some</wd>

<space/>

<wd l="3634" t="5395" r="3826" b="5554">of</wd>

<space/>

<wd l="3864" t="5395" r="4310" b="5554">these</wd>

<space/>

<wd l="4363" t="5400" r="4771" b="5554">NLP</wd>

<space/>

<wd l="4829" t="5395" r="5789" b="5597">challenges:</wd>

</ln>

</para>

<para l="1440" t="5832" r="5717" b="6576" alignment="left" ri="72" spaceBefore="171" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="5832" r="5429" b="6034" baseLine="5986">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><wd l="1440" t="5842" r="2194" b="6034">Freezing</wd>

<space/>

<wd l="2261" t="5842" r="2309" b="5990">i</wd>

<space/>

<wd l="2366" t="5832" r="2770" b="5990">dTra</wd>

<space/>

<wd l="2822" t="5837" r="3720" b="6014">Li,Ciarrai</wd>

<space/>

<wd l="3778" t="5832" r="4190" b="5990">chun</wd>

<space/>

<wd l="4253" t="5842" r="4618" b="5990">cinn</wd>

<space/>

<wd l="4680" t="5832" r="4829" b="5990">le</wd>

<space/>

</run>

<wd l="4896" t="5832" r="5429" b="5990"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">cuilin</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><space/>

</run>

</ln>

<ln l="1440" t="6096" r="5717" b="6307" baseLine="6254">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><wd l="1440" t="6106" r="2198" b="6307">Freezing</wd>

<space/>

<wd l="2256" t="6106" r="2314" b="6259">i</wd>

<space/>

</run>

<wd l="2376" t="6096" r="2789" b="6264"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">dTr</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">´a</run>

</wd>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><wd l="2846" t="6110" r="3082" b="6293">L´ı,</wd>

<space/>

</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><wd l="3149" t="6096" r="3331" b="6264">t´a</wd>

<space/>

</run>

<wd l="3389" t="6101" r="4469" b="6264"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">Ciarra</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">i</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">chun</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><space/>

<wd l="4526" t="6106" r="4901" b="6264">cinn</wd>

<space/>

<wd l="4954" t="6106" r="5112" b="6264">le</wd>

<space/>

</run>

<wd l="5170" t="6101" r="5717" b="6264"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">c</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">´u</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">il</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">i</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">n.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7"><space/>

</run>

</ln>

<ln l="1464" t="6374" r="5640" b="6576" baseLine="6528" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">

<wd l="1464" t="6374" r="2270" b="6576">‘Freezing</wd>

<space/>

<wd l="2333" t="6374" r="2501" b="6528">in</wd>

<space/>

<wd l="2554" t="6374" r="3149" b="6562">Tralee,</wd>

<space/>

<wd l="3221" t="6379" r="3715" b="6576">Kerry</wd>

<space/>

<wd l="3782" t="6374" r="4051" b="6571">(is)</wd>

<space/>

<wd l="4123" t="6374" r="4627" b="6533">ahead</wd>

<space/>

<wd l="4680" t="6374" r="4896" b="6576">by</wd>

<space/>

<wd l="4958" t="6427" r="5054" b="6533">a</wd>

<space/>

<wd l="5102" t="6374" r="5640" b="6576">point.’</wd>

</ln>

</para>

<para l="1930" t="7118" r="5314" b="7320" alignment="centered" spaceBefore="468" lsp="exactly" lspExact="271" language="en">

<ln l="1930" t="7118" r="5314" b="7320" baseLine="7267" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1930" t="7118" r="2501" b="7320">Figure</wd>

<space/>

<wd l="2578" t="7123" r="2707" b="7277">1:</wd>

<space/>

<wd l="2794" t="7118" r="3566" b="7320">Example</wd>

<space/>

<wd l="3629" t="7118" r="3821" b="7277">of</wd>

<space/>

<wd l="3859" t="7118" r="4330" b="7320">noisy</wd>

<space/>

<wd l="4387" t="7118" r="4790" b="7277">Irish</wd>

<space/>

<wd l="4843" t="7142" r="5314" b="7277">tweet</wd>

</ln>

</para>

<para l="1440" t="7786" r="5813" b="11510" alignment="justified" spaceBefore="397" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="7786" r="5794" b="7987" baseLine="7934">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1440" t="7786" r="2333" b="7944">Diacritics</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="2554" t="7786" r="3000" b="7973">Irish,</wd>

<space/>

<wd l="3168" t="7786" r="3341" b="7939">in</wd>

<space/>

<wd l="3475" t="7786" r="3677" b="7944">its</wd>

<space/>

<wd l="3830" t="7786" r="4565" b="7944">standard</wd>

<space/>

<wd l="4704" t="7786" r="5794" b="7987">orthography,</wd>

<space/>

</run>

</ln>

<ln l="1440" t="8054" r="5808" b="8256" baseLine="8203" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="8054" r="1963" b="8213">marks</wd>

<space/>

<wd l="2040" t="8054" r="2424" b="8256">long</wd>

<space/>

<wd l="2491" t="8054" r="3091" b="8213">vowels</wd>

<space/>

<wd l="3163" t="8054" r="3552" b="8213">with</wd>

<space/>

<wd l="3619" t="8054" r="4406" b="8213">diacritics</wd>

<space/>

<wd l="4488" t="8059" r="5357" b="8251">(´a,´ej,´o,´u).</wd>

<space/>

<wd l="5472" t="8059" r="5808" b="8213">Our</wd>

<space/>

</ln>

<ln l="1445" t="8328" r="5794" b="8530" baseLine="8477" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="8328" r="2136" b="8530">analysis</wd>

<space/>

<wd l="2203" t="8328" r="2395" b="8486">of</wd>

<space/>

<wd l="2434" t="8328" r="2837" b="8486">Irish</wd>

<space/>

<wd l="2890" t="8352" r="3442" b="8486">tweets</wd>

<space/>

<wd l="3504" t="8328" r="4234" b="8486">revealed</wd>

<space/>

<wd l="4291" t="8328" r="4618" b="8486">that</wd>

<space/>

<wd l="4670" t="8328" r="5117" b="8486">these</wd>

<space/>

<wd l="5179" t="8328" r="5794" b="8486">diacrit-</wd>

</ln>

<ln l="1440" t="8597" r="5798" b="8798" baseLine="8746" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="8597" r="1675" b="8755">ics</wd>

<space/>

<wd l="1771" t="8650" r="2035" b="8755">are</wd>

<space/>

<wd l="2122" t="8597" r="2568" b="8755">often</wd>

<space/>

<wd l="2654" t="8597" r="3394" b="8798">replaced</wd>

<space/>

<wd l="3475" t="8597" r="3864" b="8755">with</wd>

<space/>

<wd l="3950" t="8597" r="5112" b="8755">non-accented</wd>

<space/>

<wd l="5198" t="8597" r="5798" b="8755">vowels</wd>

<space/>

</ln>

<ln l="1450" t="8866" r="5808" b="9062" baseLine="9019">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1450" t="8866" r="2011" b="9062">(c´uil´ın</wd>

<space/>

</run>

<wd l="2098" t="8899" r="2410" b="9029"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">=</run>

<run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-4">&gt;</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-4"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="2506" t="8866" r="3115" b="9062">cuilin).</wd>

<space/>

<wd l="3259" t="8866" r="3768" b="9024">There</wd>

<space/>

<wd l="3850" t="8918" r="4109" b="9024">are</wd>

<space/>

<wd l="4190" t="8918" r="4286" b="9024">a</wd>

<space/>

<wd l="4358" t="8866" r="5030" b="9024">number</wd>

<space/>

<wd l="5107" t="8866" r="5294" b="9024">of</wd>

<space/>

<wd l="5357" t="8866" r="5808" b="9024">word</wd>

<space/>

</run>

</ln>

<ln l="1440" t="9139" r="5803" b="9341" baseLine="9288" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="9139" r="1858" b="9341">pairs</wd>

<space/>

<wd l="1944" t="9139" r="2270" b="9298">that</wd>

<space/>

<wd l="2352" t="9192" r="2611" b="9298">are</wd>

<space/>

<wd l="2693" t="9139" r="3859" b="9298">differentiated</wd>

<space/>

<wd l="3941" t="9139" r="4320" b="9341">only</wd>

<space/>

<wd l="4402" t="9139" r="4618" b="9341">by</wd>

<space/>

<wd l="4699" t="9139" r="4963" b="9298">the</wd>

<space/>

<wd l="5040" t="9192" r="5803" b="9341">presence</wd>

<space/>

</ln>

<ln l="1445" t="9408" r="5813" b="9610" baseLine="9562">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1445" t="9461" r="1627" b="9566">or</wd>

<space/>

<wd l="1704" t="9408" r="2386" b="9566">absence</wd>

<space/>

<wd l="2467" t="9408" r="2659" b="9566">of</wd>

<space/>

<wd l="2722" t="9408" r="3168" b="9566">these</wd>

<space/>

<wd l="3250" t="9408" r="4037" b="9566">diacritics</wd>

<space/>

<wd l="4128" t="9408" r="4450" b="9605">(for</wd>

<space/>

<wd l="4526" t="9408" r="5299" b="9610">example,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="5400" t="9408" r="5813" b="9566">cead</wd>

<space/>

</run>

</ln>

<ln l="1464" t="9682" r="5803" b="9883" baseLine="9830">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1464" t="9682" r="2520" b="9883">‘permission’</wd>

<space/>

<wd l="2630" t="9734" r="2659" b="9840">:</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="2794" t="9682" r="3206" b="9840">c´ead</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="3307" t="9682" r="4258" b="9878">‘hundred’).</wd>

<space/>

<wd l="4397" t="9682" r="4906" b="9840">There</wd>

<space/>

<wd l="4987" t="9734" r="5246" b="9840">are</wd>

<space/>

<wd l="5323" t="9734" r="5803" b="9883">many</wd>

<space/>

</run>

</ln>

<ln l="1440" t="9950" r="5803" b="10152" baseLine="10104" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="9950" r="2155" b="10152">possible</wd>

<space/>

<wd l="2218" t="10003" r="2866" b="10109">reasons</wd>

<space/>

<wd l="2938" t="9950" r="3197" b="10109">for</wd>

<space/>

<wd l="3259" t="9950" r="3994" b="10152">omitting</wd>

<space/>

<wd l="4066" t="9950" r="4906" b="10138">diacritics,</wd>

<space/>

<wd l="4982" t="9950" r="5803" b="10152">including</wd>

<space/>

</ln>

<ln l="1450" t="10224" r="5808" b="10426" baseLine="10373" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1450" t="10224" r="2357" b="10426">shortening</wd>

<space/>

<wd l="2443" t="10224" r="2707" b="10382">the</wd>

<space/>

<wd l="2789" t="10224" r="3173" b="10382">time</wd>

<space/>

<wd l="3254" t="10224" r="3984" b="10426">required</wd>

<space/>

<wd l="4061" t="10248" r="4229" b="10382">to</wd>

<space/>

<wd l="4310" t="10248" r="4786" b="10382">tweet</wd>

<space/>

<wd l="4877" t="10224" r="5246" b="10421">(this</wd>

<space/>

<wd l="5333" t="10248" r="5808" b="10382">tweet</wd>

<space/>

</ln>

<ln l="1440" t="10493" r="5794" b="10694" baseLine="10646" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="10493" r="1579" b="10651">is</wd>

<space/>

<wd l="1675" t="10493" r="2102" b="10651">from</wd>

<space/>

<wd l="2189" t="10546" r="2285" b="10651">a</wd>

<space/>

<wd l="2381" t="10517" r="3163" b="10694">spectator</wd>

<space/>

<wd l="3250" t="10517" r="3403" b="10651">at</wd>

<space/>

<wd l="3494" t="10546" r="3590" b="10651">a</wd>

<space/>

<wd l="3682" t="10493" r="4238" b="10651">Gaelic</wd>

<space/>

<wd l="4334" t="10493" r="5054" b="10651">Football</wd>

<space/>

<wd l="5146" t="10493" r="5794" b="10690">match),</wd>

<space/>

</ln>

<ln l="1445" t="10766" r="5808" b="10968" baseLine="10915" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="10819" r="1541" b="10925">a</wd>

<space/>

<wd l="1608" t="10766" r="1973" b="10925">lack</wd>

<space/>

<wd l="2050" t="10766" r="2242" b="10925">of</wd>

<space/>

<wd l="2299" t="10766" r="3250" b="10968">knowledge</wd>

<space/>

<wd l="3331" t="10819" r="3547" b="10925">on</wd>

<space/>

<wd l="3614" t="10766" r="3984" b="10925">how</wd>

<space/>

<wd l="4061" t="10790" r="4224" b="10925">to</wd>

<space/>

<wd l="4306" t="10766" r="4642" b="10925">find</wd>

<space/>

<wd l="4718" t="10766" r="5506" b="10925">diacritics</wd>

<space/>

<wd l="5592" t="10819" r="5808" b="10925">on</wd>

<space/>

</ln>

<ln l="1445" t="11035" r="5803" b="11237" baseLine="11184" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="11088" r="1541" b="11194">a</wd>

<space/>

<wd l="1622" t="11035" r="2318" b="11194">device’s</wd>

<space/>

<wd l="2405" t="11035" r="3254" b="11237">keyboard,</wd>

<space/>

<wd l="3360" t="11035" r="4464" b="11222">carelessness,</wd>

<space/>

<wd l="4565" t="11088" r="4747" b="11194">or</wd>

<space/>

<wd l="4824" t="11035" r="5803" b="11237">uncertainty</wd>

<space/>

</ln>

<ln l="1445" t="11309" r="3696" b="11510" baseLine="11458" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="11309" r="1925" b="11467">about</wd>

<space/>

<wd l="1978" t="11309" r="2246" b="11467">the</wd>

<space/>

<wd l="2304" t="11333" r="2909" b="11467">correct</wd>

<space/>

<wd l="2971" t="11309" r="3696" b="11510">spelling.</wd>

</ln>

</para>

<para l="1440" t="11731" r="5808" b="14914" alignment="justified" spaceBefore="156" spaceAfter="110" lsp="exactly" lspExact="271" language="en">

<ln l="1450" t="11731" r="5808" b="11933" baseLine="11885">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1450" t="11731" r="2880" b="11933">Code-switching</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="3101" t="11731" r="4090" b="11933">Alternating</wd>

<space/>

<wd l="4253" t="11731" r="4982" b="11890">between</wd>

<space/>

<wd l="5141" t="11731" r="5808" b="11933">English</wd>

<space/>

</run>

</ln>

<ln l="1445" t="12005" r="5794" b="12163" baseLine="12154" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="12005" r="1757" b="12163">and</wd>

<space/>

<wd l="1838" t="12005" r="2237" b="12163">Irish</wd>

<space/>

<wd l="2318" t="12005" r="2453" b="12163">is</wd>

<space/>

<wd l="2549" t="12058" r="3307" b="12163">common</wd>

<space/>

<wd l="3389" t="12005" r="3562" b="12158">in</wd>

<space/>

<wd l="3643" t="12058" r="3936" b="12163">our</wd>

<space/>

<wd l="4018" t="12005" r="4661" b="12163">dataset.</wd>

<space/>

<wd l="4819" t="12005" r="5198" b="12163">This</wd>

<space/>

<wd l="5290" t="12005" r="5424" b="12163">is</wd>

<space/>

<wd l="5515" t="12058" r="5794" b="12163">un-</wd>

</ln>

<ln l="1450" t="12274" r="5808" b="12475" baseLine="12427" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1450" t="12274" r="2309" b="12475">surprising</wd>

<space/>

<wd l="2381" t="12326" r="2549" b="12432">as</wd>

<space/>

<wd l="2621" t="12274" r="3355" b="12475">virtually</wd>

<space/>

<wd l="3427" t="12274" r="3638" b="12432">all</wd>

<space/>

<wd l="3706" t="12274" r="4104" b="12432">Irish</wd>

<space/>

<wd l="4176" t="12274" r="4906" b="12475">speakers</wd>

<space/>

<wd l="4982" t="12326" r="5246" b="12432">are</wd>

<space/>

<wd l="5314" t="12274" r="5808" b="12432">fluent</wd>

<space/>

</ln>

<ln l="1440" t="12547" r="5808" b="12749" baseLine="12696" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="12547" r="2107" b="12749">English</wd>

<space/>

<wd l="2194" t="12547" r="2976" b="12749">speakers,</wd>

<space/>

<wd l="3082" t="12547" r="3389" b="12706">and</wd>

<space/>

<wd l="3470" t="12600" r="3946" b="12749">many</wd>

<space/>

<wd l="4027" t="12600" r="4320" b="12706">use</wd>

<space/>

<wd l="4397" t="12547" r="5069" b="12749">English</wd>

<space/>

<wd l="5150" t="12600" r="5318" b="12706">as</wd>

<space/>

<wd l="5405" t="12547" r="5808" b="12706">their</wd>

<space/>

</ln>

<ln l="1445" t="12816" r="5794" b="13018" baseLine="12965" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="12816" r="1781" b="12974">first</wd>

<space/>

<wd l="1867" t="12816" r="2654" b="13018">language</wd>

<space/>

<wd l="2746" t="12816" r="2914" b="12970">in</wd>

<space/>

<wd l="3000" t="12816" r="3403" b="12974">their</wd>

<space/>

<wd l="3494" t="12816" r="3922" b="13018">daily</wd>

<space/>

<wd l="4013" t="12816" r="4459" b="12974">lives.</wd>

<space/>

<wd l="4637" t="12821" r="4824" b="12970">In</wd>

<space/>

<wd l="4910" t="12816" r="5174" b="12974">the</wd>

<space/>

<wd l="5270" t="12869" r="5794" b="12974">exam-</wd>

</ln>

<ln l="1440" t="13090" r="5794" b="13291" baseLine="13238" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="13090" r="1704" b="13291">ple</wd>

<space/>

<wd l="1771" t="13090" r="2285" b="13291">given,</wd>

<space/>

<wd l="2357" t="13090" r="2794" b="13248">there</wd>

<space/>

<wd l="2856" t="13090" r="2990" b="13248">is</wd>

<space/>

<wd l="3062" t="13142" r="3274" b="13248">no</wd>

<space/>

<wd l="3346" t="13090" r="4018" b="13248">obvious</wd>

<space/>

<wd l="4085" t="13142" r="4656" b="13248">reason</wd>

<space/>

<wd l="4718" t="13090" r="5088" b="13291">why</wd>

<space/>

<wd l="5155" t="13094" r="5794" b="13248">“Freez-</wd>

</ln>

<ln l="1440" t="13358" r="5808" b="13560" baseLine="13507" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="13358" r="1810" b="13560">ing”</wd>

<space/>

<wd l="1906" t="13411" r="2237" b="13517">was</wd>

<space/>

<wd l="2333" t="13358" r="2736" b="13517">used</wd>

<space/>

<wd l="2822" t="13358" r="2995" b="13512">in</wd>

<space/>

<wd l="3086" t="13358" r="3542" b="13560">place</wd>

<space/>

<wd l="3643" t="13358" r="3830" b="13517">of</wd>

<space/>

<wd l="3907" t="13358" r="4536" b="13517">various</wd>

<space/>

<wd l="4646" t="13358" r="5314" b="13517">suitable</wd>

<space/>

<wd l="5405" t="13358" r="5808" b="13517">Irish</wd>

<space/>

</ln>

<ln l="1440" t="13627" r="5794" b="13829" baseLine="13781">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="1440" t="13627" r="1963" b="13786">words</wd>

<space/>

<wd l="2064" t="13632" r="2429" b="13829">(e.g.</wd>

<space/>

</run>

<wd l="2587" t="13627" r="3499" b="13824"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">Préachta</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">),</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="3605" t="13627" r="4051" b="13786">other</wd>

<space/>

<wd l="4128" t="13627" r="4507" b="13786">than</wd>

<space/>

<wd l="4584" t="13627" r="5256" b="13829">perhaps</wd>

<space/>

<wd l="5357" t="13627" r="5794" b="13786">seek-</wd>

</run>

</ln>

<ln l="1440" t="13901" r="5794" b="14102" baseLine="14050" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="13901" r="1714" b="14102">ing</wd>

<space/>

<wd l="1829" t="13954" r="1925" b="14059">a</wd>

<space/>

<wd l="2026" t="13954" r="2477" b="14059">more</wd>

<space/>

<wd l="2587" t="13901" r="3341" b="14059">dramatic</wd>

<space/>

<wd l="3456" t="13901" r="3984" b="14059">effect.</wd>

<space/>

<wd l="4224" t="13901" r="5232" b="14088">Sometimes,</wd>

<space/>

<wd l="5362" t="13901" r="5794" b="14059">how-</wd>

</ln>

<ln l="1445" t="14170" r="5803" b="14371" baseLine="14323" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="14222" r="1843" b="14357">ever,</wd>

<space/>

<wd l="1939" t="14170" r="2611" b="14371">English</wd>

<space/>

<wd l="2688" t="14170" r="2827" b="14328">is</wd>

<space/>

<wd l="2918" t="14170" r="4248" b="14371">understandably</wd>

<space/>

<wd l="4334" t="14170" r="4733" b="14328">used</wd>

<space/>

<wd l="4814" t="14170" r="5290" b="14328">when</wd>

<space/>

<wd l="5371" t="14170" r="5803" b="14328">there</wd>

<space/>

</ln>

<ln l="1440" t="14443" r="5803" b="14645" baseLine="14592" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="14443" r="1579" b="14602">is</wd>

<space/>

<wd l="1651" t="14496" r="1867" b="14602">no</wd>

<space/>

<wd l="1944" t="14443" r="2611" b="14602">suitable</wd>

<space/>

<wd l="2678" t="14443" r="3082" b="14602">Irish</wd>

<space/>

<wd l="3144" t="14467" r="3547" b="14602">term</wd>

<space/>

<wd l="3610" t="14443" r="3782" b="14597">in</wd>

<space/>

<wd l="3845" t="14443" r="4267" b="14602">wide</wd>

<space/>

<wd l="4334" t="14496" r="4670" b="14630">use,</wd>

<space/>

<wd l="4747" t="14443" r="5006" b="14602">for</wd>

<space/>

<wd l="5074" t="14443" r="5803" b="14645">example</wd>

<space/>

</ln>

<ln l="1464" t="14712" r="5803" b="14914" baseLine="14866" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1464" t="14712" r="2155" b="14870">‘hoodie’</wd>

<space/>

<wd l="2251" t="14765" r="2434" b="14870">or</wd>

<space/>

<wd l="2520" t="14712" r="3782" b="14870">‘rodeo-clown’.</wd>

<space/>

<wd l="3902" t="14712" r="4411" b="14870">Aside</wd>

<space/>

<wd l="4478" t="14712" r="4906" b="14870">from</wd>

<space/>

<wd l="4973" t="14712" r="5803" b="14914">occurring</wd>

</ln>

</para>

<rulerline l="1432" t="15048" r="2640" b="15048" type="single" width="10" color="000000"/>

<para l="1704" t="15101" r="5083" b="15293" alignment="centered" spaceBefore="59" spaceAfter="26" lsp="exactly" lspExact="194" language="en">

<ln l="1704" t="15101" r="5083" b="15293" baseLine="15256">

<wd l="1704" t="15101" r="5083" b="15293"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">1</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">http://indigenoustweets.com/ga/</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

</column>

<column l="6143" t="1227" r="10530" b="15324">

<para l="6144" t="1320" r="10517" b="3149" alignment="justified" spaceBefore="30" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="1320" r="10507" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="1344" r="6307" b="1478">at</wd>

<space/>

<wd l="6394" t="1373" r="6590" b="1478">an</wd>

<space/>

<wd l="6682" t="1320" r="7987" b="1478">intra-sentential</wd>

<space/>

<wd l="8078" t="1320" r="8534" b="1507">level,</wd>

<space/>

<wd l="8645" t="1320" r="9970" b="1522">code-switching</wd>

<space/>

<wd l="10066" t="1344" r="10219" b="1478">at</wd>

<space/>

<wd l="10310" t="1373" r="10507" b="1478">an</wd>

<space/>

</ln>

<ln l="6144" t="1594" r="10502" b="1752" baseLine="1742">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="1594" r="7445" b="1752">inter-sentential</wd>

<space/>

<wd l="7498" t="1594" r="7910" b="1752">level</wd>

<space/>

<wd l="7963" t="1594" r="8098" b="1752">is</wd>

<space/>

<wd l="8160" t="1594" r="8506" b="1752">also</wd>

<space/>

<wd l="8558" t="1646" r="9322" b="1752">common</wd>

<space/>

<wd l="9370" t="1594" r="9538" b="1747">in</wd>

<space/>

<wd l="9586" t="1594" r="10027" b="1752">Irish:</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="10109" t="1646" r="10325" b="1752">an</wd>

<space/>

<wd l="10382" t="1627" r="10502" b="1752">t-</wd>

</run>

</ln>

<ln l="6144" t="1862" r="10507" b="2064" baseLine="2016" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="1915" r="6408" b="2021">am</wd>

<space/>

<wd l="6470" t="1915" r="6758" b="2021">seo</wd>

<space/>

<wd l="6826" t="1915" r="7037" b="2021">an</wd>

<space/>

<wd l="7109" t="1867" r="7546" b="2021">t7ain</wd>

<space/>

<wd l="7608" t="1915" r="7896" b="2021">seo</wd>

<space/>

<wd l="7968" t="1862" r="8765" b="2064">chugainn</wd>

<space/>

<wd l="8837" t="1862" r="9096" b="2021">bei</wd>

<space/>

<wd l="9158" t="1867" r="9259" b="2016">2</wd>

<space/>

<wd l="9326" t="1915" r="9538" b="2064">ag</wd>

<space/>

<wd l="9581" t="1862" r="10296" b="2064">partyáil</wd>

<space/>

<wd l="10358" t="1862" r="10507" b="2021">le</wd>

<space/>

</ln>

<ln l="6144" t="2136" r="10517" b="2338" baseLine="2285" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2146" r="6797" b="2294">muintir</wd>

<space/>

<wd l="6840" t="2136" r="7258" b="2294">Ráth</wd>

<space/>

<wd l="7310" t="2141" r="8098" b="2338">Daingin!</wd>

<space/>

<wd l="8179" t="2146" r="8650" b="2338">Hope</wd>

<space/>

<wd l="8707" t="2189" r="9197" b="2338">youre</wd>

<space/>

<wd l="9264" t="2170" r="9547" b="2294">not</wd>

<space/>

<wd l="9605" t="2170" r="9874" b="2294">too</wd>

<space/>

<wd l="9936" t="2136" r="10517" b="2294">scared</wd>

<space/>

</ln>

<ln l="6144" t="2405" r="10517" b="2606" baseLine="2558">

<wd l="6144" t="2405" r="7368" b="2606"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">#upthevillage</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="7493" t="2410" r="7675" b="2558">In</wd>

<space/>

<wd l="7742" t="2405" r="8174" b="2592">total,</wd>

<space/>

<wd l="8266" t="2405" r="8458" b="2563">of</wd>

<space/>

<wd l="8510" t="2405" r="8779" b="2563">the</wd>

<space/>

<wd l="8866" t="2410" r="9283" b="2563">1537</wd>

<space/>

<wd l="9355" t="2429" r="9902" b="2563">tweets</wd>

<space/>

<wd l="9979" t="2405" r="10152" b="2558">in</wd>

<space/>

<wd l="10224" t="2458" r="10517" b="2563">our</wd>

<space/>

</run>

</ln>

<ln l="6149" t="2664" r="10512" b="2880" baseLine="2827">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="2678" r="7349" b="2880">gold-standard</wd>

<space/>

<wd l="7397" t="2731" r="8016" b="2880">corpus,</wd>

<space/>

<wd l="8083" t="2683" r="8395" b="2837">326</wd>

<space/>

</run>

<wd l="8462" t="2664" r="9158" b="2875"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">(21</run>

<run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">.</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">2%)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="9221" t="2678" r="9859" b="2837">contain</wd>

<space/>

<wd l="9912" t="2702" r="10066" b="2837">at</wd>

<space/>

<wd l="10109" t="2678" r="10512" b="2837">least</wd>

<space/>

</run>

</ln>

<ln l="6149" t="2914" r="9110" b="3149" baseLine="3098">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="3000" r="6461" b="3106">one</wd>

<space/>

<wd l="6514" t="2947" r="7186" b="3149">English</wd>

<space/>

<wd l="7238" t="2947" r="7685" b="3106">word</wd>

<space/>

<wd l="7738" t="2947" r="8126" b="3106">with</wd>

<space/>

<wd l="8179" t="2947" r="8443" b="3106">the</wd>

<space/>

<wd l="8501" t="2971" r="8765" b="3149">tag</wd>

<space/>

</run>

<wd l="8827" t="2914" r="9110" b="3106"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">G</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">2</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="3374" r="10512" b="4661" alignment="justified" spaceBefore="156" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="3374" r="10512" b="3576" baseLine="3523">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="3379" r="6590" b="3533">Verb</wd>

<space/>

<wd l="6672" t="3379" r="7104" b="3576">drop</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7330" t="3379" r="7613" b="3533">We</wd>

<space/>

<wd l="7690" t="3427" r="7987" b="3533">can</wd>

<space/>

<wd l="8069" t="3427" r="8338" b="3533">see</wd>

<space/>

<wd l="8410" t="3374" r="8582" b="3528">in</wd>

<space/>

<wd l="8650" t="3374" r="8957" b="3533">this</wd>

<space/>

<wd l="9043" t="3374" r="9773" b="3576">example</wd>

<space/>

<wd l="9845" t="3374" r="10176" b="3533">that</wd>

<space/>

<wd l="10243" t="3374" r="10512" b="3533">the</wd>

<space/>

</run>

</ln>

<ln l="6144" t="3643" r="10512" b="3845" baseLine="3797">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="3643" r="6528" b="3802">verb</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6605" t="3653" r="6768" b="3802">tá</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6859" t="3643" r="7104" b="3802">‘is’</wd>

<space/>

<wd l="7195" t="3643" r="7478" b="3802">has</wd>

<space/>

<wd l="7555" t="3643" r="7968" b="3802">been</wd>

<space/>

<wd l="8040" t="3643" r="8794" b="3845">dropped.</wd>

<space/>

<wd l="8914" t="3643" r="9293" b="3802">This</wd>

<space/>

<wd l="9370" t="3643" r="9504" b="3802">is</wd>

<space/>

<wd l="9586" t="3696" r="9682" b="3802">a</wd>

<space/>

<wd l="9754" t="3696" r="10512" b="3802">common</wd>

<space/>

</run>

</ln>

<ln l="6144" t="3917" r="10507" b="4118" baseLine="4066" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="3917" r="7272" b="4118">phenomenon</wd>

<space/>

<wd l="7354" t="3917" r="7526" b="4070">in</wd>

<space/>

<wd l="7608" t="3917" r="8890" b="4118">user-generated</wd>

<space/>

<wd l="8971" t="3941" r="9614" b="4075">content</wd>

<space/>

<wd l="9691" t="3917" r="9950" b="4075">for</wd>

<space/>

<wd l="10027" t="3970" r="10507" b="4118">many</wd>

<space/>

</ln>

<ln l="6144" t="4186" r="10507" b="4387" baseLine="4339" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="4186" r="7061" b="4387">languages.</wd>

<space/>

<wd l="7138" t="4186" r="7478" b="4344">The</wd>

<space/>

<wd l="7526" t="4186" r="7906" b="4344">verb</wd>

<space/>

<wd l="7958" t="4186" r="8093" b="4344">is</wd>

<space/>

<wd l="8150" t="4186" r="8779" b="4387">usually</wd>

<space/>

<wd l="8827" t="4186" r="9797" b="4344">understood</wd>

<space/>

<wd l="9850" t="4186" r="10162" b="4344">and</wd>

<space/>

<wd l="10214" t="4238" r="10507" b="4344">can</wd>

<space/>

</ln>

<ln l="6144" t="4459" r="10229" b="4661" baseLine="4608" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="4459" r="6350" b="4618">be</wd>

<space/>

<wd l="6408" t="4459" r="7354" b="4661">interpreted</wd>

<space/>

<wd l="7406" t="4459" r="8088" b="4661">through</wd>

<space/>

<wd l="8141" t="4459" r="8405" b="4618">the</wd>

<space/>

<wd l="8467" t="4483" r="9101" b="4618">context</wd>

<space/>

<wd l="9158" t="4459" r="9350" b="4618">of</wd>

<space/>

<wd l="9389" t="4459" r="9658" b="4618">the</wd>

<space/>

<wd l="9710" t="4483" r="10229" b="4618">tweet.</wd>

</ln>

</para>

<para l="6144" t="4886" r="10517" b="6154" alignment="justified" spaceBefore="164" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="4886" r="10502" b="5088" baseLine="5035">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="4886" r="6883" b="5088">Spacing</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7109" t="4886" r="7805" b="5088">Spacing</wd>

<space/>

<wd l="7858" t="4886" r="8256" b="5045">after</wd>

<space/>

<wd l="8299" t="4886" r="9331" b="5088">punctuation</wd>

<space/>

<wd l="9374" t="4886" r="9514" b="5045">is</wd>

<space/>

<wd l="9571" t="4886" r="10018" b="5045">often</wd>

<space/>

<wd l="10066" t="4939" r="10502" b="5045">over-</wd>

</run>

</ln>

<ln l="6144" t="5155" r="10517" b="5357" baseLine="5304" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5155" r="6739" b="5314">looked</wd>

<space/>

<wd l="6835" t="5155" r="7022" b="5352">(i)</wd>

<space/>

<wd l="7123" t="5155" r="7296" b="5309">in</wd>

<space/>

<wd l="7387" t="5208" r="7584" b="5314">an</wd>

<space/>

<wd l="7685" t="5179" r="8333" b="5357">attempt</wd>

<space/>

<wd l="8424" t="5179" r="8587" b="5314">to</wd>

<space/>

<wd l="8693" t="5155" r="9326" b="5314">shorten</wd>

<space/>

<wd l="9418" t="5208" r="10234" b="5357">messages</wd>

<space/>

<wd l="10334" t="5208" r="10517" b="5314">or</wd>

<space/>

</ln>

<ln l="6154" t="5429" r="10498" b="5630" baseLine="5578" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="5429" r="6403" b="5626">(ii)</wd>

<space/>

<wd l="6523" t="5429" r="7200" b="5630">through</wd>

<space/>

<wd l="7315" t="5429" r="8419" b="5587">carelessness.</wd>

<space/>

<wd l="8664" t="5434" r="8846" b="5582">In</wd>

<space/>

<wd l="8957" t="5429" r="9547" b="5587">certain</wd>

<space/>

<wd l="9658" t="5429" r="10498" b="5616">instances,</wd>

<space/>

</ln>

<ln l="6144" t="5698" r="10498" b="5899" baseLine="5846" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5698" r="6451" b="5856">this</wd>

<space/>

<wd l="6538" t="5750" r="6835" b="5856">can</wd>

<space/>

<wd l="6917" t="5750" r="7397" b="5856">cause</wd>

<space/>

<wd l="7469" t="5698" r="8270" b="5899">problems</wd>

<space/>

<wd l="8352" t="5698" r="8827" b="5856">when</wd>

<space/>

<wd l="8899" t="5698" r="9816" b="5899">tokenizing</wd>

<space/>

<wd l="9893" t="5722" r="10498" b="5885">tweets;</wd>

<space/>

</ln>

<ln l="6144" t="5966" r="8400" b="6154" baseLine="6120">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="5966" r="6998" b="6154">Li,Ciarrai</wd>

<space/>

</run>

<wd l="7066" t="6000" r="7378" b="6130"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">=</run>

<run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">&gt;</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1250" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7450" t="5966" r="7685" b="6154">Li,</wd>

<space/>

<wd l="7757" t="5966" r="8400" b="6125">Ciarrai.</wd>

</run>

</ln>

</para>

<para l="6144" t="6394" r="10517" b="9029" alignment="justified" spaceBefore="150" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="6394" r="10512" b="6595" baseLine="6547">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6144" t="6394" r="6955" b="6552">Phonetic</wd>

<space/>

<wd l="7056" t="6394" r="7762" b="6595">spelling</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7982" t="6394" r="8861" b="6595">Linguistic</wd>

<space/>

<wd l="8962" t="6394" r="9960" b="6552">innovations</wd>

<space/>

<wd l="10066" t="6394" r="10512" b="6552">often</wd>

<space/>

</run>

</ln>

<ln l="6144" t="6667" r="10507" b="6869" baseLine="6816" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="6667" r="6634" b="6826">result</wd>

<space/>

<wd l="6677" t="6667" r="7104" b="6826">from</wd>

<space/>

<wd l="7147" t="6691" r="7867" b="6826">tweeters</wd>

<space/>

<wd l="7925" t="6667" r="8443" b="6869">trying</wd>

<space/>

<wd l="8491" t="6691" r="8659" b="6826">to</wd>

<space/>

<wd l="8712" t="6667" r="8894" b="6826">fit</wd>

<space/>

<wd l="8938" t="6667" r="9341" b="6826">their</wd>

<space/>

<wd l="9384" t="6720" r="10123" b="6869">message</wd>

<space/>

<wd l="10171" t="6667" r="10507" b="6826">into</wd>

<space/>

</ln>

<ln l="6144" t="6936" r="10512" b="7094" baseLine="7090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="6936" r="6413" b="7094">the</wd>

<space/>

<wd l="6490" t="6941" r="6787" b="7094">140</wd>

<space/>

<wd l="6845" t="6936" r="7646" b="7094">character</wd>

<space/>

<wd l="7690" t="6936" r="8146" b="7094">limit.</wd>

<space/>

<wd l="8232" t="6941" r="8568" b="7094">Our</wd>

<space/>

<wd l="8621" t="6936" r="9221" b="7094">dataset</wd>

<space/>

<wd l="9278" t="6936" r="9994" b="7094">contains</wd>

<space/>

<wd l="10061" t="6989" r="10512" b="7094">some</wd>

<space/>

</ln>

<ln l="6144" t="7210" r="10502" b="7411" baseLine="7358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="7210" r="7066" b="7411">interesting</wd>

<space/>

<wd l="7162" t="7210" r="7968" b="7411">examples</wd>

<space/>

<wd l="8069" t="7210" r="8261" b="7368">of</wd>

<space/>

<wd l="8338" t="7210" r="8645" b="7368">this</wd>

<space/>

<wd l="8741" t="7210" r="9869" b="7411">phenomenon</wd>

<space/>

<wd l="9965" t="7262" r="10502" b="7368">occur-</wd>

</ln>

<ln l="6144" t="7478" r="10502" b="7680" baseLine="7627">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6144" t="7478" r="6494" b="7680">ring</wd>

<space/>

<wd l="6547" t="7478" r="6720" b="7632">in</wd>

<space/>

<wd l="6768" t="7478" r="7210" b="7637">Irish.</wd>

<space/>

<wd l="7291" t="7483" r="7594" b="7637">For</wd>

<space/>

<wd l="7646" t="7478" r="8376" b="7680">example</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="8429" t="7483" r="8870" b="7637">t7ain</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="8923" t="7478" r="9062" b="7637">is</wd>

<space/>

<wd l="9125" t="7531" r="9221" b="7637">a</wd>

<space/>

<wd l="9278" t="7478" r="10118" b="7637">shortened</wd>

<space/>

<wd l="10166" t="7531" r="10502" b="7637">ver-</wd>

</run>

</ln>

<ln l="6154" t="7752" r="10517" b="7910" baseLine="7901">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6154" t="7752" r="6509" b="7910">sion</wd>

<space/>

<wd l="6590" t="7752" r="6778" b="7910">of</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6845" t="7752" r="7728" b="7910">tseachtain</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7834" t="7752" r="8458" b="7910">‘week’.</wd>

<space/>

<wd l="8597" t="7757" r="9019" b="7910">Here</wd>

<space/>

<wd l="9096" t="7752" r="9360" b="7910">the</wd>

<space/>

<wd l="9437" t="7752" r="9883" b="7910">word</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="9955" t="7752" r="10517" b="7910">seacht</wd>

<space/>

</run>

</ln>

<ln l="6168" t="8021" r="10512" b="8179" baseLine="8170" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6168" t="8026" r="6754" b="8179">‘seven’</wd>

<space/>

<wd l="6859" t="8021" r="6998" b="8179">is</wd>

<space/>

<wd l="7094" t="8021" r="7934" b="8179">shortened</wd>

<space/>

<wd l="8011" t="8045" r="8179" b="8179">to</wd>

<space/>

<wd l="8266" t="8021" r="8462" b="8179">its</wd>

<space/>

<wd l="8549" t="8021" r="9259" b="8179">numeral</wd>

<space/>

<wd l="9346" t="8021" r="9773" b="8179">form</wd>

<space/>

<wd l="9854" t="8021" r="10166" b="8179">and</wd>

<space/>

<wd l="10243" t="8021" r="10512" b="8179">the</wd>

<space/>

</ln>

<ln l="6144" t="8290" r="10502" b="8448" baseLine="8443">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6144" t="8290" r="6653" b="8448">initial</wd>

<space/>

<wd l="6730" t="8290" r="7507" b="8448">mutation</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7584" t="8323" r="7646" b="8448">t</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7718" t="8290" r="8405" b="8448">remains</wd>

<space/>

<wd l="8491" t="8290" r="9254" b="8448">attached.</wd>

<space/>

<wd l="9403" t="8290" r="9898" b="8448">Other</wd>

<space/>

<wd l="9974" t="8342" r="10502" b="8448">exam-</wd>

</run>

</ln>

<ln l="6144" t="8563" r="10512" b="8765" baseLine="8712">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6144" t="8563" r="6490" b="8765">ples</wd>

<space/>

<wd l="6605" t="8616" r="6869" b="8722">are</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6970" t="8563" r="7459" b="8765">gowil</wd>

<space/>

<wd l="7565" t="8568" r="7848" b="8765">(go</wd>

<space/>

<wd l="7958" t="8563" r="8573" b="8765">bhfuil),</wd>

<space/>

<wd l="8712" t="8563" r="9235" b="8722">beidir</wd>

<space/>

<wd l="9341" t="8563" r="10277" b="8765">(b’fh´eidir),</wd>

<space/>

<wd l="10416" t="8616" r="10512" b="8722">v</wd>

<space/>

</run>

</ln>

<ln l="6149" t="8832" r="6614" b="9029" baseLine="8986">

<wd l="6149" t="8832" r="6614" b="9029"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">(bh´ı)</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="9259" r="10512" b="10814" alignment="justified" spaceBefore="153" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="9259" r="10502" b="9461" baseLine="9413">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="9259" r="7454" b="9418">Abbreviations</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7675" t="9259" r="8078" b="9418">Irish</wd>

<space/>

<wd l="8160" t="9259" r="9442" b="9461">user-generated</wd>

<space/>

<wd l="9523" t="9283" r="9850" b="9418">text</wd>

<space/>

<wd l="9931" t="9259" r="10214" b="9418">has</wd>

<space/>

<wd l="10306" t="9259" r="10502" b="9418">its</wd>

<space/>

</run>

</ln>

<ln l="6149" t="9533" r="10512" b="9734" baseLine="9682" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="9586" r="6518" b="9691">own</wd>

<space/>

<wd l="6586" t="9557" r="6821" b="9691">set</wd>

<space/>

<wd l="6883" t="9533" r="7075" b="9691">of</wd>

<space/>

<wd l="7123" t="9533" r="8016" b="9734">frequently</wd>

<space/>

<wd l="8078" t="9533" r="8482" b="9691">used</wd>

<space/>

<wd l="8539" t="9533" r="9110" b="9734">phrase</wd>

<space/>

<wd l="9178" t="9533" r="10334" b="9691">abbreviations</wd>

<space/>

<wd l="10402" t="9629" r="10512" b="9643">–</wd>

<space/>

</ln>

<ln l="6144" t="9802" r="10512" b="10003" baseLine="9950" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9802" r="6835" b="9960">referred</wd>

<space/>

<wd l="6907" t="9826" r="7075" b="9960">to</wd>

<space/>

<wd l="7162" t="9802" r="8078" b="9960">sometimes</wd>

<space/>

<wd l="8165" t="9854" r="8333" b="9960">as</wd>

<space/>

<wd l="8414" t="9802" r="9350" b="10003">text-speak.</wd>

<space/>

<wd l="9485" t="9806" r="10032" b="9960">Forms</wd>

<space/>

<wd l="10118" t="9802" r="10512" b="9960">such</wd>

<space/>

</ln>

<ln l="6149" t="10075" r="10507" b="10277" baseLine="10224">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="10128" r="6322" b="10234">as</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6398" t="10075" r="7291" b="10277">mgl:maith</wd>

<space/>

<wd l="7368" t="10128" r="7584" b="10277">go</wd>

<space/>

</run>

<wd l="7661" t="10075" r="8054" b="10262"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">leor</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="8165" t="10075" r="8520" b="10234">‘fair</wd>

<space/>

<wd l="8592" t="10075" r="9274" b="10277">enough’</wd>

<space/>

<wd l="9379" t="10075" r="9691" b="10234">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="9758" t="10128" r="10507" b="10277">grma:go</wd>

<space/>

</run>

</ln>

<ln l="6154" t="10344" r="10507" b="10546" baseLine="10493">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6154" t="10344" r="6610" b="10502">raibh</wd>

<space/>

<wd l="6706" t="10344" r="7200" b="10502">maith</wd>

<space/>

<wd l="7296" t="10378" r="7690" b="10546">agat</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7800" t="10344" r="8338" b="10502">‘thank</wd>

<space/>

<wd l="8424" t="10349" r="8803" b="10546">you’</wd>

<space/>

<wd l="8918" t="10344" r="9322" b="10502">have</wd>

<space/>

<wd l="9413" t="10344" r="9826" b="10502">been</wd>

<space/>

<wd l="9917" t="10344" r="10507" b="10546">widely</wd>

<space/>

</run>

</ln>

<ln l="6149" t="10613" r="9806" b="10814" baseLine="10766" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="10613" r="6840" b="10814">adopted</wd>

<space/>

<wd l="6893" t="10613" r="7104" b="10814">by</wd>

<space/>

<wd l="7162" t="10613" r="7430" b="10771">the</wd>

<space/>

<wd l="7483" t="10613" r="7886" b="10771">Irish</wd>

<space/>

<wd l="7939" t="10613" r="8726" b="10814">language</wd>

<space/>

<wd l="8784" t="10613" r="9806" b="10814">community.</wd>

</ln>

</para>

<para l="6144" t="11160" r="10512" b="12672" alignment="justified" spaceBefore="275" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="11160" r="10512" b="11362" baseLine="11309" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="11160" r="6701" b="11318">The</wd>

<space/>

<wd l="6778" t="11160" r="7584" b="11362">linguistic</wd>

<space/>

<wd l="7666" t="11160" r="8438" b="11318">variation</wd>

<space/>

<wd l="8515" t="11160" r="8707" b="11318">of</wd>

<space/>

<wd l="8770" t="11160" r="9168" b="11318">Irish</wd>

<space/>

<wd l="9245" t="11160" r="9571" b="11318">that</wd>

<space/>

<wd l="9643" t="11160" r="9782" b="11318">is</wd>

<space/>

<wd l="9864" t="11160" r="10267" b="11318">used</wd>

<space/>

<wd l="10339" t="11160" r="10512" b="11314">in</wd>

<space/>

</ln>

<ln l="6154" t="11429" r="10512" b="11630" baseLine="11582" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="11429" r="6653" b="11587">social</wd>

<space/>

<wd l="6725" t="11429" r="7262" b="11587">media</wd>

<space/>

<wd l="7330" t="11429" r="7464" b="11587">is</wd>

<space/>

<wd l="7541" t="11429" r="8357" b="11630">relatively</wd>

<space/>

<wd l="8429" t="11429" r="9451" b="11630">unexplored,</wd>

<space/>

<wd l="9538" t="11453" r="9696" b="11587">at</wd>

<space/>

<wd l="9763" t="11429" r="10166" b="11587">least</wd>

<space/>

<wd l="10234" t="11453" r="10512" b="11587">not</wd>

<space/>

</ln>

<ln l="6144" t="11702" r="10512" b="11904" baseLine="11851" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11702" r="6317" b="11856">in</wd>

<space/>

<wd l="6379" t="11755" r="6682" b="11904">any</wd>

<space/>

<wd l="6754" t="11702" r="7526" b="11861">scientific</wd>

<space/>

<wd l="7594" t="11755" r="8275" b="11861">manner.</wd>

<space/>

<wd l="8366" t="11707" r="8654" b="11861">We</wd>

<space/>

<wd l="8717" t="11726" r="9278" b="11904">expect</wd>

<space/>

<wd l="9336" t="11702" r="10123" b="11861">therefore</wd>

<space/>

<wd l="10186" t="11702" r="10512" b="11861">that</wd>

<space/>

</ln>

<ln l="6144" t="11971" r="10512" b="12173" baseLine="12125" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11971" r="6413" b="12130">the</wd>

<space/>

<wd l="6480" t="11971" r="7742" b="12173">part-of-speech</wd>

<space/>

<wd l="7805" t="11971" r="8390" b="12173">tagged</wd>

<space/>

<wd l="8462" t="12024" r="9029" b="12173">corpus</wd>

<space/>

<wd l="9110" t="11971" r="9422" b="12130">and</wd>

<space/>

<wd l="9485" t="11995" r="10109" b="12173">taggers</wd>

<space/>

<wd l="10186" t="11971" r="10512" b="12130">that</wd>

<space/>

</ln>

<ln l="6144" t="12245" r="10502" b="12446" baseLine="12394" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12298" r="6398" b="12403">we</wd>

<space/>

<wd l="6470" t="12245" r="6874" b="12403">have</wd>

<space/>

<wd l="6946" t="12245" r="7829" b="12446">developed</wd>

<space/>

<wd l="7896" t="12245" r="8155" b="12403">for</wd>

<space/>

<wd l="8222" t="12245" r="8621" b="12403">Irish</wd>

<space/>

<wd l="8688" t="12245" r="9475" b="12446">language</wd>

<space/>

<wd l="9547" t="12269" r="10094" b="12403">tweets</wd>

<space/>

<wd l="10171" t="12245" r="10502" b="12403">will</wd>

<space/>

</ln>

<ln l="6149" t="12514" r="9734" b="12672" baseLine="12667" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="12514" r="7027" b="12672">contribute</wd>

<space/>

<wd l="7080" t="12538" r="7248" b="12672">to</wd>

<space/>

<wd l="7306" t="12514" r="7901" b="12672">further</wd>

<space/>

<wd l="7954" t="12514" r="8683" b="12672">research</wd>

<space/>

<wd l="8736" t="12514" r="8904" b="12667">in</wd>

<space/>

<wd l="8957" t="12514" r="9264" b="12672">this</wd>

<space/>

<wd l="9331" t="12566" r="9734" b="12672">area.</wd>

</ln>

</para>

<para l="6144" t="12984" r="10200" b="13435" alignment="justified" li="360" ri="288" spaceBefore="212" fli="-360" lsp="exactly" lspExact="279" language="en">

<ln l="6144" t="12984" r="10200" b="13205" baseLine="13147" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12984" r="6259" b="13157">3</wd>

<space/>

<wd l="6504" t="12984" r="7382" b="13205">Building</wd>

<space/>

<wd l="7445" t="13037" r="7560" b="13157">a</wd>

<space/>

<wd l="7627" t="13037" r="8304" b="13205">corpus</wd>

<space/>

<wd l="8371" t="12984" r="8582" b="13157">of</wd>

<space/>

<wd l="8630" t="12989" r="9648" b="13157">annotated</wd>

<space/>

<wd l="9715" t="12984" r="10200" b="13157">Irish</wd>

<space/>

</ln>

<ln l="6509" t="13267" r="7133" b="13435" baseLine="13426" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6509" t="13277" r="7133" b="13435">tweets</wd>

</ln>

</para>

<para l="6144" t="13699" r="10512" b="14717" alignment="justified" spaceBefore="143" spaceAfter="111" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="13699" r="10512" b="13901" baseLine="13853" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13699" r="6734" b="13858">Unlike</wd>

<space/>

<wd l="6811" t="13699" r="7723" b="13858">rule-based</wd>

<space/>

<wd l="7810" t="13723" r="8534" b="13901">systems,</wd>

<space/>

<wd l="8635" t="13699" r="9446" b="13858">statistical</wd>

<space/>

<wd l="9533" t="13699" r="10512" b="13858">data-driven</wd>

<space/>

</ln>

<ln l="6144" t="13973" r="10507" b="14174" baseLine="14122" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13978" r="7238" b="14174">POS-taggers</wd>

<space/>

<wd l="7301" t="13973" r="7915" b="14174">require</wd>

<space/>

<wd l="7973" t="13973" r="8818" b="14131">annotated</wd>

<space/>

<wd l="8875" t="13973" r="9235" b="14131">data</wd>

<space/>

<wd l="9288" t="14026" r="9504" b="14131">on</wd>

<space/>

<wd l="9552" t="13973" r="10090" b="14131">which</wd>

<space/>

<wd l="10138" t="13973" r="10507" b="14174">they</wd>

<space/>

</ln>

<ln l="6149" t="14242" r="10502" b="14443" baseLine="14395" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="14294" r="6446" b="14400">can</wd>

<space/>

<wd l="6571" t="14242" r="6778" b="14400">be</wd>

<space/>

<wd l="6898" t="14242" r="7550" b="14400">trained.</wd>

<space/>

<wd l="7834" t="14242" r="8736" b="14429">Therefore,</wd>

<space/>

<wd l="8885" t="14294" r="9139" b="14400">we</wd>

<space/>

<wd l="9264" t="14242" r="9710" b="14400">build</wd>

<space/>

<wd l="9835" t="14294" r="9931" b="14400">a</wd>

<space/>

<wd l="10056" t="14242" r="10502" b="14443">gold-</wd>

</ln>

<ln l="6154" t="14515" r="10512" b="14717" baseLine="14664" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="14515" r="6888" b="14674">standard</wd>

<space/>

<wd l="6994" t="14568" r="7560" b="14717">corpus</wd>

<space/>

<wd l="7680" t="14515" r="7867" b="14674">of</wd>

<space/>

<wd l="7982" t="14515" r="8386" b="14674">1537</wd>

<space/>

<wd l="8501" t="14515" r="8899" b="14674">Irish</wd>

<space/>

<wd l="9000" t="14539" r="9552" b="14674">tweets</wd>

<space/>

<wd l="9667" t="14515" r="10512" b="14674">annotated</wd>

</ln>

</para>

<rulerline l="6143" t="14846" r="7344" b="14846" type="single" width="10" color="000000"/>

<para l="6149" t="14904" r="10502" b="15288" alignment="justified" spaceBefore="60" spaceAfter="15" fli="216" lsp="exactly" lspExact="203" language="en">

<ln l="6398" t="14904" r="10502" b="15106" baseLine="15056">

<wd l="6398" t="14904" r="6744" b="15067"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">The</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6787" t="14957" r="7003" b="15106">tag</wd>

<space/>

<wd l="7051" t="14938" r="7176" b="15067">G</wd>

<space/>

<wd l="7214" t="14938" r="7330" b="15067">is</wd>

<space/>

<wd l="7378" t="14938" r="7704" b="15067">used</wd>

<space/>

<wd l="7747" t="14938" r="7958" b="15067">for</wd>

<space/>

<wd l="7992" t="14938" r="8515" b="15106">foreign</wd>

<space/>

<wd l="8554" t="14938" r="9029" b="15091">words,</wd>

<space/>

<wd l="9082" t="14938" r="10075" b="15091">abbreviations,</wd>

<space/>

<wd l="10123" t="14938" r="10502" b="15067">items</wd>

<space/>

</run>

</ln>

<ln l="6149" t="15134" r="8722" b="15288" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="15134" r="6408" b="15264">and</wd>

<space/>

<wd l="6451" t="15134" r="7219" b="15288">unknowns,</wd>

<space/>

<wd l="7277" t="15173" r="7416" b="15264">as</wd>

<space/>

<wd l="7469" t="15134" r="7930" b="15264">shown</wd>

<space/>

<wd l="7973" t="15134" r="8117" b="15259">in</wd>

<space/>

<wd l="8160" t="15134" r="8549" b="15264">Table</wd>

<space/>

<wd l="8616" t="15134" r="8722" b="15264">1.</wd>

</ln>

</para>

</column>

</section>

<dd l="1432" t="15736" r="10530" b="15977">

<para l="5862" t="15792" r="6095" b="15941" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5928" t="15792" r="6029" b="15941" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="0">

<wd l="5928" t="15792" r="6029" b="15941">2</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4301.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1433" marginTop="1260" marginRight="1378" marginBottom="1302" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1433" t="1260" r="10531" b="15316">

<column l="1433" t="1260" r="5820" b="15316">

<para l="1440" t="1320" r="5794" b="1795" alignment="justified" lsp="exactly" lspExact="269" language="en">

<ln l="1440" t="1320" r="5794" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1320" r="1829" b="1478">with</wd>

<space/>

<wd l="1891" t="1373" r="1987" b="1478">a</wd>

<space/>

<wd l="2040" t="1320" r="2563" b="1522">newly</wd>

<space/>

<wd l="2626" t="1320" r="3264" b="1478">defined</wd>

<space/>

<wd l="3322" t="1320" r="3950" b="1478">Twitter</wd>

<space/>

<wd l="4003" t="1325" r="4392" b="1478">POS</wd>

<space/>

<wd l="4459" t="1344" r="5011" b="1522">tagset.</wd>

<space/>

<wd l="5093" t="1320" r="5434" b="1478">The</wd>

<space/>

<wd l="5491" t="1320" r="5794" b="1478">fol-</wd>

</ln>

<ln l="1440" t="1594" r="5203" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1594" r="2035" b="1795">lowing</wd>

<space/>

<wd l="2102" t="1594" r="2899" b="1752">describes</wd>

<space/>

<wd l="2962" t="1594" r="3269" b="1752">this</wd>

<space/>

<wd l="3336" t="1594" r="4450" b="1795">development</wd>

<space/>

<wd l="4502" t="1646" r="5203" b="1795">process.</wd>

</ln>

</para>

<para l="1440" t="2026" r="4670" b="2227" alignment="left" spaceBefore="183" lsp="exactly" lspExact="252" language="en">

<ln l="1440" t="2026" r="4670" b="2227" baseLine="2174" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">

<wd l="1440" t="2026" r="1704" b="2184">3.1</wd>

<space/>

<wd l="1930" t="2030" r="2342" b="2184">New</wd>

<space/>

<wd l="2395" t="2026" r="2846" b="2184">Irish</wd>

<space/>

<wd l="2904" t="2026" r="3586" b="2184">Twitter</wd>

<space/>

<wd l="3643" t="2026" r="4061" b="2184">POS</wd>

<space/>

<wd l="4118" t="2040" r="4670" b="2227">tagset</wd>

</ln>

</para>

<para l="1440" t="2371" r="5808" b="4742" alignment="justified" spaceBefore="74" lsp="exactly" lspExact="270" language="en">

<ln l="1440" t="2371" r="5794" b="2573" baseLine="2525" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="2371" r="1781" b="2530">The</wd>

<space/>

<wd l="1930" t="2371" r="2837" b="2530">rule-based</wd>

<space/>

<wd l="2986" t="2371" r="3384" b="2530">Irish</wd>

<space/>

<wd l="3533" t="2376" r="4555" b="2573">POS-tagger</wd>

<space/>

<wd l="4709" t="2376" r="4997" b="2568">(U´ı</wd>

<space/>

<wd l="5141" t="2371" r="5794" b="2530">Dhonn-</wd>

</ln>

<ln l="1445" t="2645" r="5808" b="2842" baseLine="2794" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="2645" r="2064" b="2803">chadha</wd>

<space/>

<wd l="2117" t="2645" r="2429" b="2803">and</wd>

<space/>

<wd l="2477" t="2698" r="2784" b="2803">van</wd>

<space/>

<wd l="2846" t="2645" r="3682" b="2832">Genabith,</wd>

<space/>

<wd l="3749" t="2645" r="4243" b="2842">2006)</wd>

<space/>

<wd l="4306" t="2645" r="4565" b="2803">for</wd>

<space/>

<wd l="4622" t="2645" r="5357" b="2803">standard</wd>

<space/>

<wd l="5405" t="2645" r="5808" b="2803">Irish</wd>

<space/>

</ln>

<ln l="1440" t="2914" r="5798" b="3115" baseLine="3067" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="2938" r="1766" b="3072">text</wd>

<space/>

<wd l="1867" t="2914" r="2006" b="3072">is</wd>

<space/>

<wd l="2117" t="2914" r="2611" b="3072">based</wd>

<space/>

<wd l="2722" t="2966" r="2933" b="3072">on</wd>

<space/>

<wd l="3034" t="2914" r="3302" b="3072">the</wd>

<space/>

<wd l="3403" t="2918" r="4224" b="3072">PAROLE</wd>

<space/>

<wd l="4325" t="2914" r="5798" b="3115">Morphosyntactic</wd>

<space/>

</ln>

<ln l="1440" t="3144" r="5798" b="3389" baseLine="3334" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="3192" r="2006" b="3389">Tagset</wd>

<space/>

<wd l="2112" t="3144" r="2558" b="3384">(IT´E,</wd>

<space/>

<wd l="2674" t="3192" r="3221" b="3384">2002).</wd>

<space/>

<wd l="3427" t="3192" r="3715" b="3346">We</wd>

<space/>

<wd l="3811" t="3187" r="4214" b="3346">used</wd>

<space/>

<wd l="4310" t="3187" r="4618" b="3346">this</wd>

<space/>

<wd l="4728" t="3240" r="4896" b="3346">as</wd>

<space/>

<wd l="5006" t="3187" r="5270" b="3346">the</wd>

<space/>

<wd l="5371" t="3187" r="5798" b="3346">basis</wd>

<space/>

</ln>

<ln l="1440" t="3456" r="5803" b="3658" baseLine="3610" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="3456" r="1699" b="3614">for</wd>

<space/>

<wd l="1786" t="3509" r="2078" b="3614">our</wd>

<space/>

<wd l="2160" t="3456" r="2558" b="3614">Irish</wd>

<space/>

<wd l="2645" t="3456" r="3274" b="3614">Twitter</wd>

<space/>

<wd l="3355" t="3461" r="3744" b="3614">POS</wd>

<space/>

<wd l="3845" t="3480" r="4397" b="3658">tagset.</wd>

<space/>

<wd l="4570" t="3461" r="4858" b="3614">We</wd>

<space/>

<wd l="4944" t="3509" r="5366" b="3614">were</wd>

<space/>

<wd l="5458" t="3456" r="5803" b="3614">also</wd>

<space/>

</ln>

<ln l="1440" t="3730" r="5808" b="3931" baseLine="3878" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="3730" r="2146" b="3931">inspired</wd>

<space/>

<wd l="2213" t="3730" r="2429" b="3931">by</wd>

<space/>

<wd l="2501" t="3730" r="2765" b="3888">the</wd>

<space/>

<wd l="2837" t="3730" r="4046" b="3931">English-tweet</wd>

<space/>

<wd l="4114" t="3734" r="4507" b="3888">POS</wd>

<space/>

<wd l="4584" t="3754" r="5098" b="3931">tagset</wd>

<space/>

<wd l="5170" t="3730" r="5808" b="3888">defined</wd>

<space/>

</ln>

<ln l="1440" t="3998" r="5803" b="4200" baseLine="4152" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="3998" r="1656" b="4200">by</wd>

<space/>

<wd l="1742" t="3998" r="2390" b="4200">Gimpel</wd>

<space/>

<wd l="2477" t="4022" r="2630" b="4157">et</wd>

<space/>

<wd l="2712" t="3998" r="2909" b="4157">al.</wd>

<space/>

<wd l="3005" t="4003" r="3619" b="4195">(2011),</wd>

<space/>

<wd l="3720" t="3998" r="4032" b="4157">and</wd>

<space/>

<wd l="4109" t="3998" r="4517" b="4157">have</wd>

<space/>

<wd l="4598" t="3998" r="5126" b="4157">aimed</wd>

<space/>

<wd l="5208" t="4022" r="5371" b="4157">to</wd>

<space/>

<wd l="5462" t="4022" r="5803" b="4200">stay</wd>

<space/>

</ln>

<ln l="1445" t="4272" r="5794" b="4474" baseLine="4421" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="4272" r="2054" b="4474">closely</wd>

<space/>

<wd l="2141" t="4272" r="2779" b="4474">aligned</wd>

<space/>

<wd l="2851" t="4296" r="3019" b="4430">to</wd>

<space/>

<wd l="3101" t="4272" r="3221" b="4430">it</wd>

<space/>

<wd l="3298" t="4272" r="3466" b="4426">in</wd>

<space/>

<wd l="3547" t="4272" r="4008" b="4430">order</wd>

<space/>

<wd l="4080" t="4296" r="4248" b="4430">to</wd>

<space/>

<wd l="4325" t="4272" r="5088" b="4430">facilitate</wd>

<space/>

<wd l="5170" t="4325" r="5472" b="4474">any</wd>

<space/>

<wd l="5549" t="4272" r="5794" b="4430">fu-</wd>

</ln>

<ln l="1440" t="4541" r="4440" b="4742" baseLine="4690" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="4565" r="1781" b="4699">ture</wd>

<space/>

<wd l="1834" t="4541" r="2280" b="4699">work</wd>

<space/>

<wd l="2338" t="4594" r="2554" b="4699">on</wd>

<space/>

<wd l="2611" t="4541" r="3730" b="4742">cross-lingual</wd>

<space/>

<wd l="3797" t="4541" r="4440" b="4699">studies.</wd>

</ln>

</para>

<para l="1440" t="4814" r="5808" b="7723" alignment="justified" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="4814" r="5803" b="5016" baseLine="4963" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1656" t="4819" r="1944" b="4973">We</wd>

<space/>

<wd l="2002" t="4814" r="2578" b="4973">started</wd>

<space/>

<wd l="2626" t="4814" r="2837" b="5016">by</wd>

<space/>

<wd l="2899" t="4814" r="3662" b="5016">selecting</wd>

<space/>

<wd l="3720" t="4867" r="3816" b="4973">a</wd>

<space/>

<wd l="3864" t="4814" r="4531" b="4973">random</wd>

<space/>

<wd l="4589" t="4814" r="5198" b="5016">sample</wd>

<space/>

<wd l="5251" t="4814" r="5443" b="4973">of</wd>

<space/>

<wd l="5482" t="4814" r="5803" b="4973">500</wd>

<space/>

</ln>

<ln l="1440" t="5083" r="5808" b="5285" baseLine="5232" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5083" r="1843" b="5242">Irish</wd>

<space/>

<wd l="1906" t="5107" r="2458" b="5242">tweets</wd>

<space/>

<wd l="2530" t="5107" r="2698" b="5242">to</wd>

<space/>

<wd l="2770" t="5136" r="3211" b="5285">carry</wd>

<space/>

<wd l="3283" t="5107" r="3562" b="5242">out</wd>

<space/>

<wd l="3629" t="5136" r="3826" b="5242">an</wd>

<space/>

<wd l="3898" t="5083" r="4402" b="5242">initial</wd>

<space/>

<wd l="4478" t="5083" r="5218" b="5285">analysis.</wd>

<space/>

<wd l="5333" t="5088" r="5808" b="5242">From</wd>

<space/>

</ln>

<ln l="1445" t="5352" r="5808" b="5554" baseLine="5506" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="5405" r="1733" b="5510">our</wd>

<space/>

<wd l="1786" t="5352" r="2477" b="5554">analysis</wd>

<space/>

<wd l="2544" t="5352" r="2731" b="5510">of</wd>

<space/>

<wd l="2770" t="5352" r="3221" b="5510">these</wd>

<space/>

<wd l="3274" t="5376" r="3821" b="5510">tweets</wd>

<space/>

<wd l="3878" t="5405" r="4133" b="5510">we</wd>

<space/>

<wd l="4190" t="5352" r="5083" b="5510">concluded</wd>

<space/>

<wd l="5136" t="5352" r="5462" b="5510">that</wd>

<space/>

<wd l="5520" t="5405" r="5808" b="5510">our</wd>

<space/>

</ln>

<ln l="1440" t="5626" r="5803" b="5827" baseLine="5774" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5678" r="1795" b="5784">new</wd>

<space/>

<wd l="1848" t="5626" r="3202" b="5827">Twitter-specific</wd>

<space/>

<wd l="3259" t="5630" r="3648" b="5784">POS</wd>

<space/>

<wd l="3706" t="5650" r="4219" b="5827">tagset</wd>

<space/>

<wd l="4267" t="5626" r="4810" b="5784">would</wd>

<space/>

<wd l="4858" t="5650" r="5141" b="5784">not</wd>

<space/>

<wd l="5189" t="5626" r="5803" b="5827">require</wd>

<space/>

</ln>

<ln l="1440" t="5894" r="5794" b="6096" baseLine="6048" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5894" r="1704" b="6053">the</wd>

<space/>

<wd l="1781" t="5894" r="2726" b="6096">granularity</wd>

<space/>

<wd l="2803" t="5894" r="2995" b="6053">of</wd>

<space/>

<wd l="3048" t="5894" r="3317" b="6053">the</wd>

<space/>

<wd l="3389" t="5894" r="4061" b="6096">original</wd>

<space/>

<wd l="4142" t="5894" r="4872" b="6053">standard</wd>

<space/>

<wd l="4939" t="5894" r="5338" b="6053">Irish</wd>

<space/>

<wd l="5405" t="5899" r="5794" b="6053">POS</wd>

<space/>

</ln>

<ln l="1450" t="6168" r="5803" b="6370" baseLine="6317" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1450" t="6192" r="1728" b="6326">set.</wd>

<space/>

<wd l="1862" t="6173" r="2165" b="6326">For</wd>

<space/>

<wd l="2242" t="6168" r="2971" b="6370">example</wd>

<space/>

<wd l="3043" t="6221" r="3298" b="6326">we</wd>

<space/>

<wd l="3379" t="6168" r="3586" b="6326">do</wd>

<space/>

<wd l="3662" t="6192" r="3946" b="6326">not</wd>

<space/>

<wd l="4018" t="6168" r="4430" b="6326">need</wd>

<space/>

<wd l="4502" t="6192" r="4666" b="6326">to</wd>

<space/>

<wd l="4747" t="6168" r="5803" b="6326">differentiate</wd>

<space/>

</ln>

<ln l="1440" t="6437" r="5794" b="6638" baseLine="6590" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="6437" r="2170" b="6595">between</wd>

<space/>

<wd l="2232" t="6490" r="2328" b="6595">a</wd>

<space/>

<wd l="2390" t="6437" r="3072" b="6595">locative</wd>

<space/>

<wd l="3139" t="6437" r="3720" b="6595">adverb</wd>

<space/>

<wd l="3792" t="6437" r="4104" b="6595">and</wd>

<space/>

<wd l="4166" t="6490" r="4262" b="6595">a</wd>

<space/>

<wd l="4325" t="6437" r="5093" b="6638">temporal</wd>

<space/>

<wd l="5165" t="6437" r="5794" b="6624">adverb,</wd>

<space/>

</ln>

<ln l="1445" t="6710" r="5794" b="6912" baseLine="6859" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="6763" r="1627" b="6869">or</wd>

<space/>

<wd l="1666" t="6710" r="2390" b="6869">between</wd>

<space/>

<wd l="2438" t="6763" r="2534" b="6869">a</wd>

<space/>

<wd l="2568" t="6710" r="3298" b="6869">vocative</wd>

<space/>

<wd l="3336" t="6710" r="3994" b="6912">particle</wd>

<space/>

<wd l="4037" t="6710" r="4349" b="6869">and</wd>

<space/>

<wd l="4397" t="6763" r="4594" b="6869">an</wd>

<space/>

<wd l="4637" t="6710" r="5414" b="6869">infinitive</wd>

<space/>

<wd l="5458" t="6763" r="5794" b="6912">par-</wd>

</ln>

<ln l="1440" t="6979" r="5808" b="7181" baseLine="7133" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="6979" r="1858" b="7138">ticle.</wd>

<space/>

<wd l="1939" t="6979" r="2472" b="7138">While</wd>

<space/>

<wd l="2534" t="7032" r="2822" b="7138">our</wd>

<space/>

<wd l="2875" t="7003" r="3384" b="7181">tagset</wd>

<space/>

<wd l="3437" t="6979" r="3576" b="7138">is</wd>

<space/>

<wd l="3643" t="6979" r="3989" b="7138">also</wd>

<space/>

<wd l="4051" t="6979" r="4661" b="7181">closely</wd>

<space/>

<wd l="4723" t="6979" r="5362" b="7181">aligned</wd>

<space/>

<wd l="5419" t="6979" r="5808" b="7138">with</wd>

<space/>

</ln>

<ln l="1440" t="7253" r="5803" b="7454" baseLine="7402" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="7253" r="1704" b="7411">the</wd>

<space/>

<wd l="1800" t="7253" r="3014" b="7454">English-tweet</wd>

<space/>

<wd l="3110" t="7258" r="3499" b="7411">POS</wd>

<space/>

<wd l="3605" t="7277" r="4157" b="7454">tagset,</wd>

<space/>

<wd l="4272" t="7306" r="4526" b="7411">we</wd>

<space/>

<wd l="4622" t="7253" r="5443" b="7411">introduce</wd>

<space/>

<wd l="5539" t="7253" r="5803" b="7411">the</wd>

<space/>

</ln>

<ln l="1440" t="7522" r="5587" b="7723" baseLine="7670" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="7522" r="2280" b="7723">following</wd>

<space/>

<wd l="2338" t="7546" r="2683" b="7723">tags</wd>

<space/>

<wd l="2746" t="7522" r="3072" b="7680">that</wd>

<space/>

<wd l="3125" t="7522" r="3394" b="7680">the</wd>

<space/>

<wd l="3446" t="7522" r="4114" b="7723">English</wd>

<space/>

<wd l="4176" t="7546" r="4411" b="7680">set</wd>

<space/>

<wd l="4469" t="7522" r="4858" b="7680">does</wd>

<space/>

<wd l="4920" t="7546" r="5198" b="7680">not</wd>

<space/>

<wd l="5251" t="7574" r="5587" b="7680">use:</wd>

</ln>

</para>

<para l="1675" t="7896" r="5808" b="9725" alignment="justified" li="432" spaceBefore="105" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="7896" r="5803" b="8098" baseLine="8050">

<wd l="1675" t="7920" r="1872" b="8050">•</wd>

<tab position="1748"/>

<wd l="1872" t="7920" r="2194" b="8054"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontPitch="fixed" spacing="0">VN</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2371" t="7901" r="2990" b="8054">Verbal</wd>

<space/>

<wd l="3154" t="7901" r="3662" b="8054">Noun</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3826" t="7896" r="4834" b="8098">Progressive</wd>

<space/>

<wd l="4997" t="7896" r="5803" b="8098">aspectual</wd>

<space/>

</run>

</ln>

<ln l="1877" t="8170" r="5794" b="8371" baseLine="8318" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="8170" r="2525" b="8371">phrases</wd>

<space/>

<wd l="2611" t="8170" r="2779" b="8323">in</wd>

<space/>

<wd l="2856" t="8170" r="3259" b="8328">Irish</wd>

<space/>

<wd l="3341" t="8222" r="3600" b="8328">are</wd>

<space/>

<wd l="3686" t="8170" r="4373" b="8328">denoted</wd>

<space/>

<wd l="4450" t="8170" r="4666" b="8371">by</wd>

<space/>

<wd l="4747" t="8170" r="5011" b="8328">the</wd>

<space/>

<wd l="5093" t="8170" r="5794" b="8371">preposi-</wd>

</ln>

<ln l="1877" t="8438" r="5803" b="8640" baseLine="8592">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1877" t="8438" r="2218" b="8597">tion</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2294" t="8491" r="2510" b="8640">ag</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2592" t="8438" r="3365" b="8597">followed</wd>

<space/>

<wd l="3442" t="8438" r="3658" b="8640">by</wd>

<space/>

<wd l="3744" t="8491" r="3840" b="8597">a</wd>

<space/>

<wd l="3917" t="8438" r="4459" b="8597">verbal</wd>

<space/>

<wd l="4541" t="8491" r="4978" b="8597">noun</wd>

<space/>

<wd l="5069" t="8443" r="5434" b="8640">(e.g.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5587" t="8491" r="5803" b="8640">ag</wd>

<space/>

</run>

</ln>

<ln l="1886" t="8712" r="5803" b="8914" baseLine="8861">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1886" t="8712" r="2189" b="8870">rith</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2309" t="8712" r="3221" b="8914">‘running’).</wd>

<space/>

<wd l="3413" t="8717" r="3696" b="8870">We</wd>

<space/>

<wd l="3792" t="8712" r="4392" b="8870">choose</wd>

<space/>

<wd l="4483" t="8736" r="4651" b="8870">to</wd>

<space/>

<wd l="4747" t="8712" r="5803" b="8870">differentiate</wd>

<space/>

</run>

</ln>

<ln l="1877" t="8981" r="5794" b="9182" baseLine="9130" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="8981" r="2606" b="9139">between</wd>

<space/>

<wd l="2674" t="8986" r="2832" b="9139">N</wd>

<space/>

<wd l="2909" t="8981" r="3221" b="9139">and</wd>

<space/>

<wd l="3293" t="8986" r="3610" b="9139">VN</wd>

<space/>

<wd l="3677" t="9005" r="3845" b="9139">to</wd>

<space/>

<wd l="3926" t="8981" r="4397" b="9139">avoid</wd>

<space/>

<wd l="4469" t="8981" r="4997" b="9182">losing</wd>

<space/>

<wd l="5074" t="8981" r="5381" b="9139">this</wd>

<space/>

<wd l="5462" t="9034" r="5794" b="9139">ver-</wd>

</ln>

<ln l="1877" t="9254" r="5808" b="9413" baseLine="9403" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="9254" r="2141" b="9413">bal</wd>

<space/>

<wd l="2194" t="9254" r="3226" b="9413">information</wd>

<space/>

<wd l="3274" t="9254" r="3442" b="9408">in</wd>

<space/>

<wd l="3490" t="9254" r="3917" b="9413">what</wd>

<space/>

<wd l="3965" t="9254" r="4507" b="9413">would</wd>

<space/>

<wd l="4560" t="9254" r="5405" b="9413">otherwise</wd>

<space/>

<wd l="5453" t="9254" r="5659" b="9413">be</wd>

<space/>

<wd l="5712" t="9307" r="5808" b="9413">a</wd>

<space/>

</ln>

<ln l="1877" t="9523" r="4354" b="9725" baseLine="9672" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="9523" r="2496" b="9725">regular</wd>

<space/>

<wd l="2544" t="9523" r="3682" b="9725">prepositional</wd>

<space/>

<wd l="3739" t="9523" r="4354" b="9725">phrase.</wd>

</ln>

</para>

<para l="1675" t="9941" r="5803" b="11496" alignment="justified" li="432" spaceBefore="145" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="9941" r="5794" b="10142" baseLine="10090">

<wd l="1675" t="9946" r="1886" b="10090">•</wd>

<tab position="1756"/>

<wd l="1886" t="9946" r="2458" b="10118"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontPitch="fixed" spacing="-2">#MWE</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">:</run>

</wd>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="2539" t="9941" r="3542" b="10099">Multiword</wd>

<space/>

<wd l="3614" t="9946" r="4339" b="10142">hashtag</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="4411" t="9941" r="4930" b="10099">These</wd>

<space/>

<wd l="5002" t="9994" r="5266" b="10099">are</wd>

<space/>

<wd l="5333" t="9941" r="5794" b="10099">hash-</wd>

</run>

</ln>

<ln l="1877" t="10210" r="5794" b="10411" baseLine="10358" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="10234" r="2218" b="10411">tags</wd>

<space/>

<wd l="2285" t="10210" r="3197" b="10411">containing</wd>

<space/>

<wd l="3264" t="10210" r="3830" b="10411">strings</wd>

<space/>

<wd l="3893" t="10210" r="4085" b="10368">of</wd>

<space/>

<wd l="4123" t="10210" r="4646" b="10368">words</wd>

<space/>

<wd l="4709" t="10210" r="5107" b="10368">used</wd>

<space/>

<wd l="5160" t="10234" r="5323" b="10368">to</wd>

<space/>

<wd l="5386" t="10234" r="5794" b="10368">cate-</wd>

</ln>

<ln l="1882" t="10483" r="5794" b="10685" baseLine="10632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="10483" r="2410" b="10685">gorise</wd>

<space/>

<wd l="2472" t="10536" r="2568" b="10642">a</wd>

<space/>

<wd l="2621" t="10507" r="2947" b="10642">text</wd>

<space/>

<wd l="3010" t="10488" r="3374" b="10685">(e.g.</wd>

<space/>

<wd l="3461" t="10483" r="4584" b="10685">#godhelpus).</wd>

<space/>

<wd l="4666" t="10488" r="4954" b="10642">We</wd>

<space/>

<wd l="5011" t="10483" r="5506" b="10642">retain</wd>

<space/>

<wd l="5563" t="10483" r="5794" b="10637">in-</wd>

</ln>

<ln l="1877" t="10752" r="5803" b="10910" baseLine="10901" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="10752" r="2736" b="10910">formation</wd>

<space/>

<wd l="2813" t="10805" r="3029" b="10910">on</wd>

<space/>

<wd l="3096" t="10752" r="3365" b="10910">the</wd>

<space/>

<wd l="3437" t="10752" r="4416" b="10910">multi-word</wd>

<space/>

<wd l="4488" t="10776" r="5030" b="10910">nature</wd>

<space/>

<wd l="5107" t="10752" r="5299" b="10910">of</wd>

<space/>

<wd l="5357" t="10752" r="5803" b="10910">these</wd>

<space/>

</ln>

<ln l="1877" t="11021" r="5798" b="11222" baseLine="11174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1877" t="11021" r="2621" b="11222">hashtags</wd>

<space/>

<wd l="2683" t="11021" r="2851" b="11174">in</wd>

<space/>

<wd l="2909" t="11021" r="3370" b="11179">order</wd>

<space/>

<wd l="3418" t="11045" r="3586" b="11179">to</wd>

<space/>

<wd l="3643" t="11021" r="4402" b="11179">facilitate</wd>

<space/>

<wd l="4454" t="11021" r="4978" b="11179">future</wd>

<space/>

<wd l="5040" t="11021" r="5798" b="11222">syntactic</wd>

<space/>

</ln>

<ln l="1882" t="11294" r="3240" b="11496" baseLine="11443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1882" t="11294" r="2573" b="11496">analysis</wd>

<space/>

<wd l="2640" t="11294" r="3240" b="11453">efforts.</wd>

</ln>

</para>

<para l="1440" t="11669" r="5794" b="12096" alignment="justified" spaceBefore="106" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="11669" r="5794" b="11870" baseLine="11818">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="11674" r="1944" b="11827">We</wd>

<space/>

<wd l="1997" t="11669" r="2338" b="11827">also</wd>

<space/>

<wd l="2395" t="11669" r="2866" b="11870">adapt</wd>

<space/>

<wd l="2914" t="11669" r="3178" b="11827">the</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3240" t="11698" r="3346" b="11822">T</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3408" t="11669" r="4061" b="11870">particle</wd>

<space/>

<wd l="4109" t="11693" r="4277" b="11827">to</wd>

<space/>

<wd l="4334" t="11669" r="4642" b="11827">suit</wd>

<space/>

<wd l="4690" t="11669" r="5093" b="11827">Irish</wd>

<space/>

<wd l="5141" t="11669" r="5794" b="11870">linguis-</wd>

</run>

</ln>

<ln l="1440" t="11938" r="2448" b="12096" baseLine="12091" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="11938" r="1651" b="12096">tic</wd>

<space/>

<wd l="1714" t="11938" r="2448" b="12096">features.</wd>

</ln>

</para>

<para l="1675" t="12298" r="5803" b="13862" alignment="justified" li="432" spaceBefore="93" fli="-216" lsp="exactly" lspExact="271" language="en">

<bullet type="bulleted" value="smallCircle" numChars="2">

</bullet>

<ln l="1675" t="12302" r="5803" b="12504" baseLine="12456">

<wd l="1675" t="12326" r="1882" b="12456">•</wd>

<tab position="1748"/>

<wd l="1882" t="12326" r="2064" b="12461"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontPitch="fixed" spacing="0">T</run>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">:</run>

</wd>

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2150" t="12302" r="2875" b="12461">Particle</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2947" t="12307" r="3230" b="12461">We</wd>

<space/>

<wd l="3307" t="12302" r="3883" b="12461">extend</wd>

<space/>

<wd l="3950" t="12302" r="4219" b="12461">the</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4301" t="12331" r="4406" b="12456">T</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4488" t="12326" r="4752" b="12504">tag</wd>

<space/>

<wd l="4829" t="12326" r="4992" b="12461">to</wd>

<space/>

<wd l="5069" t="12326" r="5347" b="12461">not</wd>

<space/>

<wd l="5424" t="12302" r="5803" b="12504">only</wd>

<space/>

</run>

</ln>

<ln l="1882" t="12576" r="5794" b="12778" baseLine="12725" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="12629" r="2357" b="12734">cover</wd>

<space/>

<wd l="2419" t="12576" r="2798" b="12734">verb</wd>

<space/>

<wd l="2870" t="12576" r="3653" b="12778">particles,</wd>

<space/>

<wd l="3730" t="12576" r="4008" b="12734">but</wd>

<space/>

<wd l="4075" t="12576" r="4286" b="12734">all</wd>

<space/>

<wd l="4358" t="12576" r="4805" b="12734">other</wd>

<space/>

<wd l="4867" t="12576" r="5270" b="12734">Irish</wd>

<space/>

<wd l="5333" t="12576" r="5794" b="12778">parti-</wd>

</ln>

<ln l="1882" t="12845" r="5794" b="13046" baseLine="12998" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="12845" r="2261" b="13003">cles:</wd>

<space/>

<wd l="2352" t="12845" r="2995" b="13003">relative</wd>

<space/>

<wd l="3058" t="12845" r="3840" b="13046">particles,</wd>

<space/>

<wd l="3922" t="12898" r="4651" b="13003">surname</wd>

<space/>

<wd l="4709" t="12845" r="5491" b="13046">particles,</wd>

<space/>

<wd l="5563" t="12845" r="5794" b="12998">in-</wd>

</ln>

<ln l="1882" t="13118" r="5794" b="13320" baseLine="13267" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="13118" r="2486" b="13277">finitive</wd>

<space/>

<wd l="2558" t="13118" r="3341" b="13320">particles,</wd>

<space/>

<wd l="3427" t="13118" r="4138" b="13277">numeric</wd>

<space/>

<wd l="4214" t="13118" r="4997" b="13320">particles,</wd>

<space/>

<wd l="5088" t="13171" r="5794" b="13320">compar-</wd>

</ln>

<ln l="1882" t="13387" r="5794" b="13589" baseLine="13536" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1882" t="13387" r="2290" b="13546">ative</wd>

<space/>

<wd l="2362" t="13387" r="3144" b="13589">particles,</wd>

<space/>

<wd l="3230" t="13387" r="3494" b="13546">the</wd>

<space/>

<wd l="3566" t="13387" r="4291" b="13546">vocative</wd>

<space/>

<wd l="4358" t="13387" r="5059" b="13589">particle,</wd>

<space/>

<wd l="5146" t="13387" r="5458" b="13546">and</wd>

<space/>

<wd l="5530" t="13387" r="5794" b="13546">ad-</wd>

</ln>

<ln l="1877" t="13661" r="3317" b="13862" baseLine="13810" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1877" t="13661" r="2477" b="13819">verbial</wd>

<space/>

<wd l="2534" t="13661" r="3317" b="13862">particles.</wd>

</ln>

</para>

<para l="1440" t="14021" r="5794" b="15307" alignment="justified" spaceBefore="94" lsp="exactly" lspExact="269" language="en">

<ln l="1440" t="14021" r="5794" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14026" r="1723" b="14179">We</wd>

<space/>

<wd l="1824" t="14021" r="2030" b="14179">do</wd>

<space/>

<wd l="2126" t="14045" r="2410" b="14179">not</wd>

<space/>

<wd l="2496" t="14074" r="2789" b="14179">use</wd>

<space/>

<wd l="2880" t="14021" r="3144" b="14179">the</wd>

<space/>

<wd l="3240" t="14021" r="4080" b="14222">following</wd>

<space/>

<wd l="4171" t="14045" r="4517" b="14222">tags</wd>

<space/>

<wd l="4618" t="14021" r="5045" b="14179">from</wd>

<space/>

<wd l="5131" t="14021" r="5400" b="14179">the</wd>

<space/>

<wd l="5491" t="14026" r="5794" b="14174">En-</wd>

</ln>

<ln l="1445" t="14294" r="5794" b="14496" baseLine="14443">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="14294" r="1867" b="14496">glish</wd>

<space/>

<wd l="1930" t="14318" r="2208" b="14453">set:</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2314" t="14318" r="2501" b="14482">S,</wd>

<space/>

<wd l="2707" t="14323" r="2894" b="14482">Z,</wd>

<space/>

<wd l="3091" t="14323" r="3288" b="14482">L,</wd>

<space/>

<wd l="3475" t="14323" r="3682" b="14482">M,</wd>

<space/>

<wd l="3869" t="14323" r="4075" b="14482">X,</wd>

<space/>

<wd l="4267" t="14323" r="4469" b="14482">Y,</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4584" t="14347" r="4752" b="14453">as</wd>

<space/>

<wd l="4814" t="14294" r="5083" b="14453">the</wd>

<space/>

<wd l="5141" t="14294" r="5794" b="14496">linguis-</wd>

</run>

</ln>

<ln l="1440" t="14563" r="5794" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14563" r="1651" b="14722">tic</wd>

<space/>

<wd l="1723" t="14616" r="2170" b="14722">cases</wd>

<space/>

<wd l="2237" t="14563" r="2606" b="14765">they</wd>

<space/>

<wd l="2674" t="14563" r="3149" b="14765">apply</wd>

<space/>

<wd l="3211" t="14587" r="3379" b="14722">to</wd>

<space/>

<wd l="3446" t="14563" r="3653" b="14722">do</wd>

<space/>

<wd l="3715" t="14587" r="3998" b="14722">not</wd>

<space/>

<wd l="4061" t="14616" r="4541" b="14722">occur</wd>

<space/>

<wd l="4598" t="14563" r="4766" b="14717">in</wd>

<space/>

<wd l="4829" t="14563" r="5328" b="14722">either</wd>

<space/>

<wd l="5390" t="14587" r="5794" b="14722">stan-</wd>

</ln>

<ln l="1445" t="14837" r="5784" b="14995" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="14837" r="1829" b="14995">dard</wd>

<space/>

<wd l="1925" t="14890" r="2107" b="14995">or</wd>

<space/>

<wd l="2194" t="14837" r="3336" b="14995">non-standard</wd>

<space/>

<wd l="3427" t="14837" r="3869" b="14995">Irish.</wd>

<space/>

<wd l="4066" t="14837" r="4402" b="14995">The</wd>

<space/>

<wd l="4502" t="14837" r="4882" b="14995">final</wd>

<space/>

<wd l="4987" t="14861" r="5222" b="14995">set</wd>

<space/>

<wd l="5318" t="14837" r="5510" b="14995">of</wd>

<space/>

<wd l="5592" t="14842" r="5784" b="14990">21</wd>

<space/>

</ln>

<ln l="1440" t="15106" r="4320" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="15110" r="2256" b="15307">POS-tags</wd>

<space/>

<wd l="2318" t="15106" r="2458" b="15264">is</wd>

<space/>

<wd l="2520" t="15106" r="3355" b="15307">presented</wd>

<space/>

<wd l="3408" t="15106" r="3581" b="15259">in</wd>

<space/>

<wd l="3634" t="15106" r="4114" b="15264">Table</wd>

<space/>

<wd l="4190" t="15110" r="4320" b="15264">1.</wd>

</ln>

</para>

</column>

<column l="6144" t="1260" r="10531" b="15316">

<para l="6144" t="1320" r="10526" b="5861" alignment="justified" spaceBefore="18" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="6365" t="1320" r="10512" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="1325" r="6816" b="1478">Most</wd>

<space/>

<wd l="6936" t="1320" r="7128" b="1478">of</wd>

<space/>

<wd l="7238" t="1320" r="7502" b="1478">the</wd>

<space/>

<wd l="7622" t="1344" r="7968" b="1522">tags</wd>

<space/>

<wd l="8098" t="1320" r="8266" b="1474">in</wd>

<space/>

<wd l="8386" t="1320" r="8654" b="1478">the</wd>

<space/>

<wd l="8774" t="1344" r="9283" b="1522">tagset</wd>

<space/>

<wd l="9408" t="1373" r="9672" b="1478">are</wd>

<space/>

<wd l="9792" t="1320" r="10512" b="1478">intuitive</wd>

<space/>

</ln>

<ln l="6144" t="1594" r="10512" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1618" r="6312" b="1752">to</wd>

<space/>

<wd l="6432" t="1646" r="6629" b="1752">an</wd>

<space/>

<wd l="6744" t="1594" r="7142" b="1752">Irish</wd>

<space/>

<wd l="7253" t="1594" r="8040" b="1795">language</wd>

<space/>

<wd l="8160" t="1594" r="8846" b="1795">speaker.</wd>

<space/>

<wd l="9096" t="1598" r="9912" b="1781">However,</wd>

<space/>

<wd l="10061" t="1646" r="10512" b="1752">some</wd>

<space/>

</ln>

<ln l="6144" t="1862" r="10502" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1886" r="6490" b="2064">tags</wd>

<space/>

<wd l="6619" t="1862" r="7234" b="2064">require</wd>

<space/>

<wd l="7363" t="1862" r="8016" b="2064">specific</wd>

<space/>

<wd l="8146" t="1862" r="9158" b="2064">explanation</wd>

<space/>

<wd l="9278" t="1862" r="9446" b="2016">in</wd>

<space/>

<wd l="9566" t="1862" r="9830" b="2021">the</wd>

<space/>

<wd l="9960" t="1862" r="10502" b="2064">guide-</wd>

</ln>

<ln l="6144" t="2136" r="10502" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2136" r="6600" b="2294">lines.</wd>

<space/>

<wd l="6720" t="2136" r="7512" b="2338">Hashtags</wd>

<space/>

<wd l="7594" t="2136" r="7906" b="2294">and</wd>

<space/>

<wd l="7978" t="2136" r="8995" b="2294">at-mentions</wd>

<space/>

<wd l="9077" t="2189" r="9370" b="2294">can</wd>

<space/>

<wd l="9442" t="2136" r="9648" b="2294">be</wd>

<space/>

<wd l="9720" t="2189" r="9816" b="2294">a</wd>

<space/>

<wd l="9893" t="2160" r="10502" b="2338">syntac-</wd>

</ln>

<ln l="6144" t="2405" r="10498" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2405" r="6360" b="2563">tic</wd>

<space/>

<wd l="6456" t="2434" r="6797" b="2606">part</wd>

<space/>

<wd l="6898" t="2405" r="7085" b="2563">of</wd>

<space/>

<wd l="7171" t="2458" r="7267" b="2563">a</wd>

<space/>

<wd l="7368" t="2429" r="8107" b="2563">sentence</wd>

<space/>

<wd l="8208" t="2458" r="8390" b="2563">or</wd>

<space/>

<wd l="8477" t="2405" r="9048" b="2606">phrase</wd>

<space/>

<wd l="9139" t="2405" r="9701" b="2563">within</wd>

<space/>

<wd l="9797" t="2458" r="9893" b="2563">a</wd>

<space/>

<wd l="9984" t="2429" r="10498" b="2563">tweet.</wd>

<space/>

</ln>

<ln l="6144" t="2678" r="10512" b="2880" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2678" r="6667" b="2837">When</wd>

<space/>

<wd l="6787" t="2678" r="7094" b="2837">this</wd>

<space/>

<wd l="7224" t="2678" r="7363" b="2837">is</wd>

<space/>

<wd l="7493" t="2678" r="7757" b="2837">the</wd>

<space/>

<wd l="7886" t="2731" r="8299" b="2866">case,</wd>

<space/>

<wd l="8448" t="2731" r="8702" b="2837">we</wd>

<space/>

<wd l="8827" t="2678" r="9307" b="2880">apply</wd>

<space/>

<wd l="9432" t="2678" r="9696" b="2837">the</wd>

<space/>

<wd l="9821" t="2678" r="10512" b="2837">relevant</wd>

<space/>

</ln>

<ln l="6154" t="2947" r="10517" b="3149" baseLine="3101">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6154" t="2947" r="6917" b="3149">syntactic</wd>

<space/>

<wd l="7022" t="2952" r="7411" b="3106">POS</wd>

<space/>

<wd l="7522" t="2971" r="7834" b="3149">tag.</wd>

<space/>

<wd l="8050" t="2952" r="8352" b="3106">For</wd>

<space/>

<wd l="8453" t="2947" r="9230" b="3149">example,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9346" t="2947" r="9859" b="3106">Beidh</wd>

<space/>

<wd l="9960" t="2957" r="10224" b="3106">mé</wd>

<space/>

<wd l="10315" t="3000" r="10517" b="3106">ar</wd>

<space/>

</run>

</ln>

<ln l="6149" t="3221" r="10507" b="3422" baseLine="3371">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="3221" r="6610" b="3379">chlár</wd>

<space/>

</run>

<wd l="6701" t="3221" r="8376" b="3422"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">@SplancNewstalk</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">∧</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8467" t="3221" r="9067" b="3379">anocht</wd>

<space/>

<wd l="9134" t="3274" r="9350" b="3422">ag</wd>

<space/>

<wd l="9432" t="3221" r="10138" b="3379">labhairt</wd>

<space/>

<wd l="10214" t="3221" r="10507" b="3379">leis</wd>

<space/>

</run>

</ln>

<ln l="6168" t="3490" r="10512" b="3691" baseLine="3641">

<wd l="6168" t="3490" r="7618" b="3682"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">@AnRonanEile</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">∧</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7656" t="3494" r="8026" b="3691">faoi</wd>

<space/>

</run>

<wd l="8083" t="3490" r="9638" b="3677"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">#neknomination</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">N</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9730" t="3494" r="9854" b="3643">‘I</wd>

<space/>

<wd l="9907" t="3490" r="10248" b="3648">will</wd>

<space/>

<wd l="10306" t="3490" r="10512" b="3648">be</wd>

<space/>

</run>

</ln>

<ln l="6149" t="3763" r="10502" b="3965" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="3816" r="6365" b="3922">on</wd>

<space/>

<wd l="6475" t="3763" r="8064" b="3965">@SplancNewstalk</wd>

<space/>

<wd l="8150" t="3763" r="8770" b="3965">tonight</wd>

<space/>

<wd l="8861" t="3763" r="9624" b="3965">speaking</wd>

<space/>

<wd l="9715" t="3787" r="9883" b="3922">to</wd>

<space/>

<wd l="9994" t="3768" r="10502" b="3922">@An-</wd>

</ln>

<ln l="6144" t="4032" r="10526" b="4190" baseLine="4181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4032" r="7066" b="4190">RonanEile</wd>

<space/>

<wd l="7152" t="4032" r="7632" b="4190">about</wd>

<space/>

<wd l="7714" t="4032" r="9245" b="4190">#neknomination’.</wd>

<space/>

<wd l="9408" t="4032" r="10296" b="4190">Otherwise</wd>

<space/>

<wd l="10378" t="4032" r="10526" b="4186">if</wd>

<space/>

</ln>

<ln l="6144" t="4301" r="10512" b="4502" baseLine="4454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4301" r="6514" b="4502">they</wd>

<space/>

<wd l="6600" t="4354" r="6859" b="4459">are</wd>

<space/>

<wd l="6936" t="4325" r="7214" b="4459">not</wd>

<space/>

<wd l="7286" t="4330" r="7627" b="4502">part</wd>

<space/>

<wd l="7704" t="4301" r="7896" b="4459">of</wd>

<space/>

<wd l="7958" t="4301" r="8222" b="4459">the</wd>

<space/>

<wd l="8309" t="4301" r="9067" b="4502">syntactic</wd>

<space/>

<wd l="9158" t="4325" r="9912" b="4459">structure</wd>

<space/>

<wd l="9994" t="4301" r="10186" b="4459">of</wd>

<space/>

<wd l="10243" t="4301" r="10512" b="4459">the</wd>

<space/>

</ln>

<ln l="6144" t="4574" r="10512" b="4776" baseLine="4723" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="4598" r="6619" b="4733">tweet</wd>

<space/>

<wd l="6744" t="4574" r="7565" b="4776">(typically</wd>

<space/>

<wd l="7690" t="4574" r="8525" b="4776">appended</wd>

<space/>

<wd l="8640" t="4627" r="8822" b="4733">or</wd>

<space/>

<wd l="8933" t="4574" r="9845" b="4776">prepended</wd>

<space/>

<wd l="9960" t="4598" r="10123" b="4733">to</wd>

<space/>

<wd l="10243" t="4574" r="10512" b="4733">the</wd>

<space/>

</ln>

<ln l="6144" t="4843" r="10517" b="5045" baseLine="4997">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="4843" r="6586" b="5002">main</wd>

<space/>

<wd l="6658" t="4867" r="7133" b="5002">tweet</wd>

<space/>

<wd l="7210" t="4848" r="7646" b="5040">text),</wd>

<space/>

<wd l="7742" t="4843" r="8112" b="5045">they</wd>

<space/>

<wd l="8194" t="4896" r="8458" b="5002">are</wd>

<space/>

<wd l="8534" t="4843" r="9115" b="5045">tagged</wd>

<space/>

<wd l="9197" t="4896" r="9365" b="5002">as</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9470" t="4858" r="9557" b="5011">@</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9662" t="4843" r="9974" b="5002">and</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10070" t="4853" r="10166" b="5011">#</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="10267" t="4848" r="10517" b="5040">(or</wd>

<space/>

</run>

</ln>

<ln l="6163" t="5098" r="10526" b="5318" baseLine="5266">

<wd l="6163" t="5122" r="6787" b="5314"><run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">#MWE</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6883" t="5122" r="7066" b="5270">In</wd>

<space/>

<wd l="7152" t="5170" r="7445" b="5275">our</wd>

<space/>

<wd l="7531" t="5117" r="7915" b="5318">gold</wd>

<space/>

<wd l="8006" t="5117" r="8741" b="5275">standard</wd>

<space/>

<wd l="8827" t="5170" r="9446" b="5318">corpus,</wd>

<space/>

<wd l="9557" t="5117" r="9874" b="5275">554</wd>

<space/>

<wd l="9970" t="5141" r="10243" b="5275">out</wd>

<space/>

<wd l="10334" t="5117" r="10526" b="5275">of</wd>

<space/>

</run>

</ln>

<ln l="6149" t="5371" r="10502" b="5587" baseLine="5539">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="5386" r="6461" b="5544">693</wd>

<space/>

<wd l="6552" t="5386" r="7296" b="5587">hashtags</wd>

<space/>

</run>

<wd l="7392" t="5371" r="8141" b="5582"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">79</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">.</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">9%</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">),</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8242" t="5386" r="8554" b="5544">and</wd>

<space/>

<wd l="8654" t="5386" r="9062" b="5544">1604</wd>

<space/>

<wd l="9154" t="5410" r="9427" b="5544">out</wd>

<space/>

<wd l="9509" t="5386" r="9701" b="5544">of</wd>

<space/>

<wd l="9787" t="5386" r="10200" b="5544">1946</wd>

<space/>

<wd l="10286" t="5410" r="10502" b="5544">at-</wd>

</run>

</ln>

<ln l="6144" t="5645" r="10344" b="5861" baseLine="5808">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="5659" r="6936" b="5818">mentions</wd>

<space/>

</run>

<wd l="7008" t="5645" r="7704" b="5856"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">82</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">.</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">4%</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7776" t="5712" r="8035" b="5818">are</wd>

<space/>

<wd l="8098" t="5659" r="8285" b="5818">of</wd>

<space/>

<wd l="8328" t="5659" r="8635" b="5818">this</wd>

<space/>

<wd l="8698" t="5659" r="9869" b="5861">non-syntactic</wd>

<space/>

<wd l="9926" t="5683" r="10344" b="5861">type.</wd>

</run>

</ln>

</para>

<para l="6144" t="5933" r="10517" b="7762" alignment="justified" spaceBefore="3" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="5933" r="10502" b="6120" baseLine="6086" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="5933" r="6792" b="6091">With</wd>

<space/>

<wd l="6888" t="5986" r="7339" b="6091">some</wd>

<space/>

<wd l="7426" t="5933" r="8054" b="6091">Twitter</wd>

<space/>

<wd l="8146" t="5933" r="8750" b="6120">clients,</wd>

<space/>

<wd l="8861" t="5933" r="9005" b="6086">if</wd>

<space/>

<wd l="9086" t="5986" r="9182" b="6091">a</wd>

<space/>

<wd l="9264" t="5957" r="9739" b="6091">tweet</wd>

<space/>

<wd l="9830" t="5933" r="10502" b="6091">exceeds</wd>

<space/>

</ln>

<ln l="6144" t="6206" r="10512" b="6394" baseLine="6355" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6206" r="6413" b="6365">the</wd>

<space/>

<wd l="6552" t="6211" r="6850" b="6365">140</wd>

<space/>

<wd l="6970" t="6206" r="7771" b="6365">character</wd>

<space/>

<wd l="7877" t="6206" r="8333" b="6394">limit,</wd>

<space/>

<wd l="8472" t="6206" r="8741" b="6365">the</wd>

<space/>

<wd l="8856" t="6230" r="9326" b="6365">tweet</wd>

<space/>

<wd l="9442" t="6206" r="9576" b="6365">is</wd>

<space/>

<wd l="9706" t="6206" r="10512" b="6365">truncated</wd>

<space/>

</ln>

<ln l="6149" t="6475" r="10512" b="6677" baseLine="6624" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="6475" r="6461" b="6634">and</wd>

<space/>

<wd l="6542" t="6528" r="6744" b="6634">an</wd>

<space/>

<wd l="6830" t="6475" r="7435" b="6677">ellipsis</wd>

<space/>

<wd l="7522" t="6475" r="7661" b="6634">is</wd>

<space/>

<wd l="7747" t="6475" r="8146" b="6634">used</wd>

<space/>

<wd l="8222" t="6499" r="8390" b="6634">to</wd>

<space/>

<wd l="8472" t="6475" r="9163" b="6634">indicate</wd>

<space/>

<wd l="9240" t="6475" r="9571" b="6634">that</wd>

<space/>

<wd l="9658" t="6528" r="10109" b="6634">some</wd>

<space/>

<wd l="10186" t="6499" r="10512" b="6634">text</wd>

<space/>

</ln>

<ln l="6144" t="6749" r="10502" b="6950" baseLine="6898" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6749" r="6283" b="6907">is</wd>

<space/>

<wd l="6398" t="6749" r="7118" b="6950">missing.</wd>

<space/>

<wd l="7354" t="6754" r="7637" b="6907">We</wd>

<space/>

<wd l="7747" t="6749" r="8198" b="6907">leave</wd>

<space/>

<wd l="8304" t="6749" r="8611" b="6907">this</wd>

<space/>

<wd l="8731" t="6749" r="9562" b="6950">appended</wd>

<space/>

<wd l="9667" t="6773" r="9835" b="6907">to</wd>

<space/>

<wd l="9946" t="6749" r="10210" b="6907">the</wd>

<space/>

<wd l="10320" t="6749" r="10502" b="6902">fi-</wd>

</ln>

<ln l="6144" t="7018" r="10517" b="7219" baseLine="7166" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7018" r="6408" b="7176">nal</wd>

<space/>

<wd l="6538" t="7018" r="7224" b="7219">(usually</wd>

<space/>

<wd l="7344" t="7018" r="7963" b="7219">partial)</wd>

<space/>

<wd l="8088" t="7018" r="8611" b="7205">token,</wd>

<space/>

<wd l="8755" t="7018" r="9288" b="7176">which</wd>

<space/>

<wd l="9398" t="7070" r="9730" b="7176">was</wd>

<space/>

<wd l="9854" t="7018" r="10301" b="7176">often</wd>

<space/>

<wd l="10421" t="7070" r="10517" b="7176">a</wd>

<space/>

</ln>

<ln l="6144" t="7286" r="10512" b="7488" baseLine="7440">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="7291" r="6624" b="7445">URL.</wd>

<space/>

<wd l="6715" t="7291" r="6998" b="7445">We</wd>

<space/>

<wd l="7080" t="7286" r="7733" b="7445">marked</wd>

<space/>

<wd l="7810" t="7286" r="8256" b="7445">these</wd>

<space/>

<wd l="8338" t="7339" r="8789" b="7445">cases</wd>

<space/>

<wd l="8880" t="7339" r="9048" b="7445">as</wd>

<space/>

</run>

<wd l="9144" t="7310" r="9307" b="7445"><run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">G</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9398" t="7291" r="9701" b="7445">For</wd>

<space/>

<wd l="9778" t="7286" r="10512" b="7488">example</wd>

<space/>

</run>

</ln>

<ln l="6144" t="7560" r="8410" b="7762" baseLine="7709">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="7560" r="8314" b="7762">http://t.co/2nvQsxaIa7...</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8381" t="7690" r="8410" b="7718">.</wd>

</run>

</ln>

</para>

<para l="6144" t="7834" r="10512" b="9350" alignment="justified" spaceBefore="4" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6370" t="7834" r="10502" b="8035" baseLine="7987" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="7838" r="6859" b="7992">Some</wd>

<space/>

<wd l="6912" t="7834" r="7478" b="8035">strings</wd>

<space/>

<wd l="7536" t="7834" r="7723" b="7992">of</wd>

<space/>

<wd l="7757" t="7886" r="8328" b="8035">proper</wd>

<space/>

<wd l="8366" t="7886" r="8880" b="7992">nouns</wd>

<space/>

<wd l="8938" t="7834" r="9576" b="7992">contain</wd>

<space/>

<wd l="9624" t="7834" r="10070" b="7992">other</wd>

<space/>

<wd l="10109" t="7838" r="10502" b="7992">POS</wd>

<space/>

</ln>

<ln l="6149" t="8107" r="10498" b="8294" baseLine="8256" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="8107" r="6965" b="8294">elements,</wd>

<space/>

<wd l="7032" t="8107" r="7426" b="8266">such</wd>

<space/>

<wd l="7474" t="8160" r="7642" b="8266">as</wd>

<space/>

<wd l="7699" t="8107" r="8717" b="8266">determiners</wd>

<space/>

<wd l="8774" t="8107" r="9082" b="8266">and</wd>

<space/>

<wd l="9130" t="8160" r="9893" b="8266">common</wd>

<space/>

<wd l="9936" t="8160" r="10498" b="8266">nouns.</wd>

<space/>

</ln>

<ln l="6144" t="8376" r="10498" b="8578" baseLine="8530" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8376" r="6811" b="8578">Despite</wd>

<space/>

<wd l="6878" t="8376" r="7358" b="8578">being</wd>

<space/>

<wd l="7435" t="8429" r="7531" b="8534">a</wd>

<space/>

<wd l="7594" t="8429" r="8165" b="8578">proper</wd>

<space/>

<wd l="8227" t="8429" r="8669" b="8534">noun</wd>

<space/>

<wd l="8731" t="8376" r="9302" b="8578">phrase</wd>

<space/>

<wd l="9379" t="8376" r="10498" b="8578">syntactically,</wd>

<space/>

</ln>

<ln l="6144" t="8650" r="10502" b="8851" baseLine="8798" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8702" r="6398" b="8808">we</wd>

<space/>

<wd l="6509" t="8674" r="6773" b="8851">tag</wd>

<space/>

<wd l="6893" t="8650" r="7291" b="8808">each</wd>

<space/>

<wd l="7402" t="8650" r="7882" b="8808">token</wd>

<space/>

<wd l="7997" t="8702" r="8165" b="8808">as</wd>

<space/>

<wd l="8285" t="8702" r="8568" b="8851">per</wd>

<space/>

<wd l="8674" t="8650" r="8875" b="8808">its</wd>

<space/>

<wd l="8990" t="8654" r="9437" b="8808">POS.</wd>

<space/>

<wd l="9557" t="8654" r="9864" b="8808">For</wd>

<space/>

<wd l="9974" t="8702" r="10502" b="8808">exam-</wd>

</ln>

<ln l="6144" t="8918" r="10512" b="9120" baseLine="9076">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="8918" r="6456" b="9120">ple,</wd>

<space/>

</run>

<wd l="6571" t="8923" r="6917" b="9110"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Cú</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">∧</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="7013" t="8971" r="7373" b="9106"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">na</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">D</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="7469" t="8918" r="8712" b="9110"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">mBaskerville</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">∧</run>

</wd>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8837" t="8918" r="9221" b="9077">‘The</wd>

<space/>

<wd l="9302" t="8918" r="9898" b="9077">Hound</wd>

<space/>

<wd l="9984" t="8918" r="10176" b="9077">of</wd>

<space/>

<wd l="10243" t="8918" r="10512" b="9077">the</wd>

<space/>

</run>

</ln>

<ln l="6144" t="9192" r="7339" b="9350" baseLine="9341" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="9192" r="7339" b="9350">Baskervilles’.</wd>

</ln>

</para>

<para l="6144" t="9653" r="9398" b="9854" alignment="left" spaceBefore="216" lsp="exactly" lspExact="252" language="en">

<ln l="6144" t="9653" r="9398" b="9854" baseLine="9806" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">

<wd l="6144" t="9653" r="6413" b="9811">3.2</wd>

<space/>

<wd l="6643" t="9658" r="7195" b="9811">Tweet</wd>

<space/>

<wd l="7243" t="9653" r="8602" b="9854">pre-processing</wd>

<space/>

<wd l="8659" t="9653" r="9398" b="9854">pipeline</wd>

</ln>

</para>

<para l="6144" t="10013" r="10517" b="12341" alignment="justified" spaceBefore="83" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="10013" r="10512" b="10214" baseLine="10162" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="10013" r="6691" b="10171">About</wd>

<space/>

<wd l="6758" t="10013" r="7459" b="10200">950,000</wd>

<space/>

<wd l="7526" t="10013" r="7925" b="10171">Irish</wd>

<space/>

<wd l="7987" t="10013" r="8774" b="10214">language</wd>

<space/>

<wd l="8837" t="10037" r="9384" b="10171">tweets</wd>

<space/>

<wd l="9456" t="10066" r="9878" b="10171">were</wd>

<space/>

<wd l="9941" t="10013" r="10512" b="10214">posted</wd>

<space/>

</ln>

<ln l="6144" t="10286" r="10517" b="10488" baseLine="10435" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="10286" r="6874" b="10445">between</wd>

<space/>

<wd l="6946" t="10286" r="7709" b="10445">Twitter’s</wd>

<space/>

<wd l="7786" t="10286" r="8371" b="10445">launch</wd>

<space/>

<wd l="8438" t="10286" r="8611" b="10440">in</wd>

<space/>

<wd l="8688" t="10286" r="9115" b="10445">2006</wd>

<space/>

<wd l="9197" t="10286" r="9509" b="10445">and</wd>

<space/>

<wd l="9581" t="10286" r="10517" b="10488">September</wd>

<space/>

</ln>

<ln l="6149" t="10555" r="10512" b="10757" baseLine="10704" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="10560" r="6581" b="10714">2014</wd>

<space/>

<wd l="6653" t="10555" r="6869" b="10757">by</wd>

<space/>

<wd l="6946" t="10555" r="8198" b="10757">approximately</wd>

<space/>

<wd l="8285" t="10560" r="8707" b="10714">8000</wd>

<space/>

<wd l="8779" t="10608" r="9221" b="10714">users</wd>

<space/>

<wd l="9302" t="10555" r="10128" b="10714">identified</wd>

<space/>

<wd l="10200" t="10555" r="10512" b="10714">and</wd>

<space/>

</ln>

<ln l="6144" t="10824" r="10502" b="11026" baseLine="10978" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="10824" r="6787" b="10982">tracked</wd>

<space/>

<wd l="6850" t="10824" r="7066" b="11026">by</wd>

<space/>

<wd l="7133" t="10824" r="7402" b="10982">the</wd>

<space/>

<wd l="7464" t="10824" r="8429" b="11026">Indigenous</wd>

<space/>

<wd l="8501" t="10829" r="9106" b="10982">Tweets</wd>

<space/>

<wd l="9178" t="10824" r="9538" b="10982">web</wd>

<space/>

<wd l="9614" t="10824" r="9950" b="10982">site.</wd>

<space/>

<wd l="10061" t="10829" r="10502" b="10982">Non-</wd>

</ln>

<ln l="6144" t="11098" r="10502" b="11256" baseLine="11246" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="11098" r="6547" b="11256">Irish</wd>

<space/>

<wd l="6610" t="11122" r="7157" b="11256">tweets</wd>

<space/>

<wd l="7229" t="11098" r="7656" b="11256">from</wd>

<space/>

<wd l="7714" t="11098" r="8160" b="11256">these</wd>

<space/>

<wd l="8227" t="11150" r="8664" b="11256">users</wd>

<space/>

<wd l="8736" t="11150" r="9158" b="11256">were</wd>

<space/>

<wd l="9226" t="11098" r="9840" b="11256">filtered</wd>

<space/>

<wd l="9907" t="11122" r="10186" b="11256">out</wd>

<space/>

<wd l="10243" t="11150" r="10502" b="11256">us-</wd>

</ln>

<ln l="6144" t="11366" r="10498" b="11568" baseLine="11520" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="11366" r="6422" b="11568">ing</wd>

<space/>

<wd l="6485" t="11419" r="6581" b="11525">a</wd>

<space/>

<wd l="6643" t="11366" r="7214" b="11568">simple</wd>

<space/>

<wd l="7277" t="11366" r="8784" b="11568">character-trigram</wd>

<space/>

<wd l="8837" t="11366" r="9624" b="11568">language</wd>

<space/>

<wd l="9682" t="11366" r="10498" b="11525">identifier.</wd>

<space/>

</ln>

<ln l="6144" t="11640" r="10512" b="11842" baseLine="11789" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="11645" r="6432" b="11798">We</wd>

<space/>

<wd l="6490" t="11640" r="7186" b="11798">selected</wd>

<space/>

<wd l="7238" t="11693" r="7334" b="11798">a</wd>

<space/>

<wd l="7378" t="11640" r="8050" b="11798">random</wd>

<space/>

<wd l="8102" t="11640" r="8712" b="11842">sample</wd>

<space/>

<wd l="8770" t="11640" r="8957" b="11798">of</wd>

<space/>

<wd l="9019" t="11640" r="9427" b="11798">1550</wd>

<space/>

<wd l="9480" t="11664" r="10027" b="11798">tweets</wd>

<space/>

<wd l="10085" t="11640" r="10512" b="11798">from</wd>

<space/>

</ln>

<ln l="6144" t="11909" r="10502" b="12110" baseLine="12062" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="11909" r="6595" b="12067">these</wd>

<space/>

<wd l="6677" t="11909" r="7378" b="12096">950,000</wd>

<space/>

<wd l="7459" t="11933" r="8006" b="12067">tweets</wd>

<space/>

<wd l="8098" t="11909" r="8410" b="12067">and</wd>

<space/>

<wd l="8486" t="11909" r="9346" b="12110">processed</wd>

<space/>

<wd l="9422" t="11909" r="9864" b="12067">them</wd>

<space/>

<wd l="9941" t="11962" r="10109" b="12067">as</wd>

<space/>

<wd l="10195" t="11909" r="10502" b="12067">fol-</wd>

</ln>

<ln l="6144" t="12182" r="6595" b="12341" baseLine="12331" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="12182" r="6595" b="12341">lows:</wd>

</ln>

</para>

<para l="6144" t="12456" r="10502" b="13426" alignment="justified" spaceBefore="6" fli="216" lsp="exactly" lspExact="271" language="en">

<bullet type="ordered" numChars="4">

</bullet>

<ln l="6374" t="12456" r="10498" b="12658" baseLine="12610" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="12461" r="6710" b="12610">(1)</wd>

<space/>

<wd l="6710" t="12461" r="6994" b="12614">We</wd>

<space/>

<wd l="7090" t="12456" r="7925" b="12614">tokenised</wd>

<space/>

<wd l="8016" t="12456" r="8285" b="12614">the</wd>

<space/>

<wd l="8386" t="12480" r="8621" b="12614">set</wd>

<space/>

<wd l="8712" t="12456" r="9101" b="12614">with</wd>

<space/>

<wd l="9197" t="12456" r="9950" b="12658">Owoputi</wd>

<space/>

<wd l="10051" t="12480" r="10210" b="12614">et</wd>

<space/>

<wd l="10306" t="12456" r="10498" b="12614">al.</wd>

<space/>

</ln>

<ln l="6154" t="12691" r="10502" b="12926" baseLine="12876">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6154" t="12734" r="6864" b="12926">(2013)’s</wd>

<space/>

<wd l="6955" t="12730" r="7598" b="12888">version</wd>

<space/>

<wd l="7685" t="12730" r="7877" b="12888">of</wd>

<space/>

</run>

<wd l="7954" t="12691" r="9259" b="12917"><run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">twokenise</run>

<run underlined="none" subsuperscript="superscript" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">3</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9360" t="12730" r="9898" b="12888">which</wd>

<space/>

<wd l="9979" t="12730" r="10502" b="12888">works</wd>

<space/>

</run>

</ln>

<ln l="6144" t="12998" r="10502" b="13157" baseLine="13147" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12998" r="6518" b="13157">well</wd>

<space/>

<wd l="6610" t="13051" r="6826" b="13157">on</wd>

<space/>

<wd l="6912" t="12998" r="7272" b="13157">web</wd>

<space/>

<wd l="7363" t="13022" r="8002" b="13157">content</wd>

<space/>

<wd l="8088" t="12998" r="8770" b="13157">features</wd>

<space/>

<wd l="8870" t="12998" r="9264" b="13157">such</wd>

<space/>

<wd l="9350" t="13051" r="9518" b="13157">as</wd>

<space/>

<wd l="9619" t="12998" r="10502" b="13157">emoticons</wd>

<space/>

</ln>

<ln l="6149" t="13267" r="7080" b="13426" baseLine="13421" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13267" r="6461" b="13426">and</wd>

<space/>

<wd l="6514" t="13272" r="7080" b="13426">URLs.</wd>

</ln>

</para>

<para l="6144" t="13546" r="10517" b="14290" alignment="justified" spaceBefore="1" spaceAfter="122" fli="216" lsp="exactly" lspExact="271" language="en">

<bullet type="ordered" numChars="4">

</bullet>

<ln l="6374" t="13546" r="10517" b="13747" baseLine="13694" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="13550" r="6725" b="13694">(2)</wd>

<space/>

<wd l="6725" t="13546" r="7243" b="13747">Using</wd>

<space/>

<wd l="7358" t="13598" r="7454" b="13704">a</wd>

<space/>

<wd l="7555" t="13546" r="7824" b="13704">list</wd>

<space/>

<wd l="7934" t="13546" r="8126" b="13704">of</wd>

<space/>

<wd l="8218" t="13546" r="9125" b="13704">multiword</wd>

<space/>

<wd l="9230" t="13546" r="9648" b="13704">units</wd>

<space/>

<wd l="9763" t="13546" r="10190" b="13704">from</wd>

<space/>

<wd l="10291" t="13550" r="10517" b="13704">Uí</wd>

<space/>

</ln>

<ln l="6144" t="13814" r="10502" b="14011" baseLine="13968" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13814" r="7363" b="13973">Dhonnchadha</wd>

<space/>

<wd l="7440" t="13819" r="8146" b="14011">(2009)’s</wd>

<space/>

<wd l="8227" t="13814" r="9134" b="13973">rule-based</wd>

<space/>

<wd l="9206" t="13819" r="9749" b="13973">Xerox</wd>

<space/>

<wd l="9821" t="13819" r="10195" b="13973">FST</wd>

<space/>

<wd l="10267" t="13838" r="10502" b="13973">to-</wd>

</ln>

<ln l="6144" t="14050" r="10512" b="14290" baseLine="14235">

<wd l="6144" t="14050" r="6907" b="14275"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">keniser</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">4</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7008" t="14141" r="7262" b="14246">we</wd>

<space/>

<wd l="7344" t="14088" r="8064" b="14290">rejoined</wd>

<space/>

<wd l="8146" t="14088" r="9053" b="14246">multiword</wd>

<space/>

<wd l="9134" t="14088" r="9696" b="14246">tokens</wd>

<space/>

<wd l="9787" t="14088" r="10114" b="14246">that</wd>

<space/>

<wd l="10195" t="14088" r="10512" b="14246">had</wd>

</run>

</ln>

</para>

<rulerline l="6144" t="14429" r="7344" b="14429" type="single" width="10" color="000000"/>

<para l="6158" t="14486" r="10469" b="14875" alignment="justified" spaceBefore="58" fli="216" lsp="exactly" lspExact="201" language="en">

<ln l="6403" t="14486" r="10469" b="14678" baseLine="14638">

<wd l="6403" t="14486" r="7147" b="14650"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">3</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Available</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7205" t="14539" r="7344" b="14650">to</wd>

<space/>

<wd l="7411" t="14520" r="8107" b="14650">download</wd>

<space/>

<wd l="8165" t="14520" r="8515" b="14650">from</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8578" t="14525" r="10469" b="14678">http://www.ark.cs.</wd>

<space/>

</run>

</ln>

<ln l="6158" t="14722" r="8390" b="14875" baseLine="14842" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6158" t="14722" r="8390" b="14875">cmu.edu/TweetNLP/#pos</wd>

</ln>

</para>

<para l="6158" t="14904" r="10469" b="15293" alignment="justified" spaceBefore="15" spaceAfter="7" fli="216" lsp="exactly" lspExact="201" language="en">

<ln l="6398" t="14904" r="10469" b="15096" baseLine="15056">

<wd l="6398" t="14904" r="7147" b="15067"><run underlined="none" subsuperscript="superscript" fontSize="600" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="20">4</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="20">Available</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="20"><space/>

<wd l="7286" t="14957" r="7426" b="15067">to</wd>

<space/>

<wd l="7570" t="14938" r="8270" b="15067">download</wd>

<space/>

<wd l="8410" t="14938" r="8755" b="15067">from</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="20"><wd l="8904" t="14942" r="10469" b="15096">https://github.</wd>

<space/>

</run>

</ln>

<ln l="6158" t="15139" r="10334" b="15293" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="20">

<wd l="6158" t="15139" r="10334" b="15293">com/stesh/apertium-gle/tree/master/dev/</wd>

</ln>

</para>

</column>

</section>

<dd l="1433" t="15736" r="10531" b="15977">

<para l="5862" t="15792" r="6085" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5928" t="15792" r="6019" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="0">

<wd l="5928" t="15792" r="6019" b="15946">3</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4301.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1430" marginTop="1253" marginRight="1381" marginBottom="1302" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1430" t="1253" r="10528" b="15358">

<column l="1430" t="1253" r="5817" b="15358">

<table l="1517" t="1258" r="5722" b="9298" alignment="left" li="87" ri="95" spaceBefore="5" spaceAfter="255">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<gridTable>

<gridCol>898</gridCol>

<gridCol>3307</gridCol>

<gridRow>283</gridRow>

<gridRow>547</gridRow>

<gridRow>552</gridRow>

<gridRow>548</gridRow>

<gridRow>283</gridRow>

<gridRow>278</gridRow>

<gridRow>547</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>552</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>552</gridRow>

<gridRow>278</gridRow>

<gridRow>279</gridRow>

<gridRow>552</gridRow>

<gridRow>278</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>278</gridRow>

<gridRow>279</gridRow>

<gridRow>283</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1651" t="1306" r="1987" b="1502" alignment="left" li="129" spaceAfter="33" lsp="exactly" lspExact="249" language="en">

<ln l="1651" t="1306" r="1987" b="1502" baseLine="1450" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-7">

<wd l="1651" t="1306" r="1987" b="1502">Tag</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="1301" r="5314" b="1502" alignment="left" li="119" spaceAfter="33" lsp="exactly" lspExact="249" language="en">

<ln l="2534" t="1301" r="5314" b="1502" baseLine="1450" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2534" t="1301" r="3614" b="1502">Description</wd>

<space/>

<wd l="3682" t="1301" r="4627" b="1493">(PAROLE</wd>

<space/>

<wd l="4690" t="1301" r="5314" b="1493">TAGS)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="1584" r="1805" b="1738" alignment="left" li="129" spaceAfter="304" lsp="exactly" lspExact="243" language="en">

<ln l="1646" t="1584" r="1805" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="1584" r="1805" b="1738">N</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2539" t="1584" r="3792" b="1738" alignment="left" li="72" lsp="exactly" lspExact="243" language="en">

<ln l="2539" t="1584" r="3792" b="1738" baseLine="1728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2539" t="1632" r="3302" b="1738">common</wd>

<space/>

<wd l="3355" t="1632" r="3792" b="1738">noun</wd>

</ln>

</para>

<para l="2544" t="1853" r="4642" b="2050" alignment="left" li="72" spaceBefore="2" spaceAfter="30" lsp="exactly" lspExact="272" language="en">

<ln l="2544" t="1853" r="4642" b="2050" baseLine="2002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2544" t="1858" r="3139" b="2050">(Noun,</wd>

<space/>

<wd l="3202" t="1858" r="3614" b="2011">Pron</wd>

<space/>

<wd l="3672" t="1853" r="4027" b="2040">Ref,</wd>

<space/>

<wd l="4099" t="1853" r="4642" b="2050">Subst)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1651" t="2136" r="1752" b="2323" alignment="left" li="129" spaceBefore="48" spaceAfter="267" lsp="exactly" lspExact="232" language="en">

<ln l="1651" t="2136" r="1752" b="2323" baseLine="2314" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">

<wd l="1651" t="2222" r="1752" b="2323">∧</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="2136" r="3624" b="2602" alignment="left" li="108" ri="2088" spaceAfter="25" lsp="exactly" lspExact="261" language="en">

<ln l="2534" t="2136" r="3600" b="2333" baseLine="2280" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2534" t="2184" r="3110" b="2333">proper</wd>

<space/>

<wd l="3158" t="2184" r="3600" b="2290">noun</wd>

<space/>

</ln>

<ln l="2544" t="2405" r="3624" b="2602" baseLine="2554" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2544" t="2405" r="3019" b="2602">(Prop</wd>

<space/>

<wd l="3077" t="2405" r="3624" b="2597">Noun)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1651" t="2683" r="1800" b="2837" alignment="left" li="129" spaceAfter="294" lsp="exactly" lspExact="248" language="en">

<ln l="1651" t="2683" r="1800" b="2837" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="2683" r="1800" b="2837">O</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="2678" r="5107" b="3149" alignment="left" li="108" ri="612" spaceAfter="25" lsp="exactly" lspExact="258" language="en">

<ln l="2534" t="2678" r="5107" b="2880" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2534" t="2731" r="3264" b="2880">pronoun</wd>

<space/>

<wd l="3326" t="2683" r="3806" b="2875">(Pron</wd>

<space/>

<wd l="3859" t="2683" r="4277" b="2866">Pers,</wd>

<space/>

<wd l="4344" t="2683" r="4757" b="2837">Pron</wd>

<space/>

<wd l="4810" t="2678" r="5107" b="2866">Idf,</wd>

<space/>

</ln>

<ln l="2534" t="2957" r="4224" b="3149" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2534" t="2957" r="2952" b="3110">Pron</wd>

<space/>

<wd l="3010" t="2957" r="3206" b="3149">Q,</wd>

<space/>

<wd l="3269" t="2957" r="3682" b="3110">Pron</wd>

<space/>

<wd l="3734" t="2957" r="4224" b="3149">Dem)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="3235" r="1963" b="3389" alignment="left" li="129" spaceAfter="35" lsp="exactly" lspExact="247" language="en">

<ln l="1646" t="3235" r="1963" b="3389" baseLine="3379" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="3235" r="1963" b="3389">VN</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="3230" r="4867" b="3427" alignment="left" li="119" spaceAfter="35" lsp="exactly" lspExact="247" language="en">

<ln l="2534" t="3230" r="4867" b="3427" baseLine="3379" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2534" t="3230" r="3077" b="3389">verbal</wd>

<space/>

<wd l="3134" t="3283" r="3571" b="3389">noun</wd>

<space/>

<wd l="3634" t="3230" r="4262" b="3427">(Verbal</wd>

<space/>

<wd l="4320" t="3235" r="4867" b="3427">Noun)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="3514" r="1800" b="3667" alignment="left" li="129" spaceAfter="30" lsp="exactly" lspExact="243" language="en">

<ln l="1646" t="3514" r="1800" b="3667" baseLine="3658" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="3514" r="1800" b="3667">V</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="3509" r="4104" b="3710" alignment="left" li="119" spaceAfter="30" lsp="exactly" lspExact="243" language="en">

<ln l="2534" t="3509" r="4104" b="3710" baseLine="3658" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2534" t="3509" r="2918" b="3667">verb</wd>

<space/>

<wd l="2986" t="3514" r="3456" b="3710">(Cop,</wd>

<space/>

<wd l="3523" t="3509" r="4104" b="3706">Verb*)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="6" gridRowTill="6" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="3792" r="1805" b="3941" alignment="left" li="129" spaceAfter="299" lsp="exactly" lspExact="243" language="en">

<ln l="1646" t="3792" r="1805" b="3941" baseLine="3936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="3792" r="1805" b="3941">A</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="6" gridRowTill="6" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="3787" r="4872" b="4262" alignment="left" li="108" ri="864" spaceAfter="25" lsp="exactly" lspExact="258" language="en">

<ln l="2539" t="3787" r="4872" b="3989" baseLine="3936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2539" t="3787" r="3317" b="3989">adjective</wd>

<space/>

<wd l="3379" t="3787" r="3811" b="3989">(Adj,</wd>

<space/>

<wd l="3878" t="3787" r="4445" b="3946">Verbal</wd>

<space/>

<wd l="4502" t="3787" r="4872" b="3989">Adj,</wd>

<space/>

</ln>

<ln l="2534" t="4061" r="3394" b="4262" baseLine="4210" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2534" t="4066" r="2947" b="4262">Prop</wd>

<space/>

<wd l="3005" t="4061" r="3394" b="4262">Adj)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="7" gridRowTill="7" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="4344" r="1790" b="4493" alignment="left" li="129" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="1646" t="4344" r="1790" b="4493" baseLine="4488" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="4344" r="1790" b="4493">R</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="7" gridRowTill="7" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2539" t="4339" r="3802" b="4536" alignment="left" li="119" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="2539" t="4339" r="3802" b="4536" baseLine="4488" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2539" t="4339" r="3125" b="4498">adverb</wd>

<space/>

<wd l="3192" t="4339" r="3802" b="4536">(Adv*)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="8" gridRowTill="8" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="4622" r="1800" b="4771" alignment="left" li="129" spaceAfter="30" lsp="exactly" lspExact="247" language="en">

<ln l="1646" t="4622" r="1800" b="4771" baseLine="4766" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="4622" r="1800" b="4771">D</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="8" gridRowTill="8" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2539" t="4618" r="4387" b="4814" alignment="left" li="119" spaceAfter="30" lsp="exactly" lspExact="247" language="en">

<ln l="2539" t="4618" r="4387" b="4814" baseLine="4766" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2539" t="4618" r="3485" b="4776">determiner</wd>

<space/>

<wd l="3547" t="4622" r="3941" b="4814">(Art,</wd>

<space/>

<wd l="4008" t="4622" r="4387" b="4814">Det)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="9" gridRowTill="9" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="4901" r="1766" b="5050" alignment="left" li="129" spaceAfter="299" lsp="exactly" lspExact="248" language="en">

<ln l="1646" t="4901" r="1766" b="5050" baseLine="5045" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="4901" r="1766" b="5050">P</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="9" gridRowTill="9" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="4896" r="4867" b="5366" alignment="left" li="108" ri="864" spaceAfter="26" lsp="exactly" lspExact="260" language="en">

<ln l="2534" t="4896" r="4867" b="5098" baseLine="5045" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2534" t="4896" r="3562" b="5098">preposition,</wd>

<space/>

<wd l="3629" t="4949" r="4061" b="5098">prep.</wd>

<space/>

<wd l="4138" t="4949" r="4867" b="5098">pronoun</wd>

<space/>

</ln>

<ln l="2544" t="5170" r="4157" b="5366" baseLine="5318" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2544" t="5170" r="3163" b="5366">(Prep*,</wd>

<space/>

<wd l="3226" t="5170" r="3643" b="5323">Pron</wd>

<space/>

<wd l="3696" t="5170" r="4157" b="5366">Prep)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="10" gridRowTill="10" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="5448" r="1776" b="5597" alignment="left" li="129" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="1646" t="5448" r="1776" b="5597" baseLine="5597" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="5448" r="1776" b="5597">T</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="10" gridRowTill="10" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="5443" r="3840" b="5645" alignment="left" li="119" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="2534" t="5443" r="3840" b="5645" baseLine="5597" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2534" t="5443" r="3192" b="5645">particle</wd>

<space/>

<wd l="3254" t="5448" r="3840" b="5640">(Part*)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="11" gridRowTill="11" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1656" t="5736" r="1690" b="5914" alignment="left" li="129" spaceAfter="30" lsp="exactly" lspExact="247" language="en">

<ln l="1656" t="5736" r="1690" b="5914" baseLine="5875" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="5856" r="1690" b="5914">,</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="11" gridRowTill="11" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="5726" r="4253" b="5928" alignment="left" li="119" spaceAfter="30" lsp="exactly" lspExact="247" language="en">

<ln l="2534" t="5726" r="4253" b="5928" baseLine="5875" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2534" t="5726" r="3566" b="5928">punctuation</wd>

<space/>

<wd l="3629" t="5731" r="4253" b="5923">(Punct)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="12" gridRowTill="12" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1651" t="6010" r="1814" b="6163" alignment="left" li="129" spaceAfter="298" lsp="exactly" lspExact="248" language="en">

<ln l="1651" t="6010" r="1814" b="6163" baseLine="6154" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="6010" r="1814" b="6163">&amp;</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="12" gridRowTill="12" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2539" t="6005" r="4762" b="6475" alignment="left" li="108" ri="972" spaceAfter="30" lsp="exactly" lspExact="258" language="en">

<ln l="2539" t="6005" r="4762" b="6206" baseLine="6154" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2539" t="6005" r="3566" b="6206">conjunction</wd>

<space/>

<wd l="3629" t="6005" r="4099" b="6206">(Conj</wd>

<space/>

<wd l="4176" t="6005" r="4762" b="6192">Coord,</wd>

<space/>

</ln>

<ln l="2539" t="6274" r="3710" b="6475" baseLine="6422" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="2539" t="6274" r="2942" b="6475">Conj</wd>

<space/>

<wd l="3019" t="6274" r="3710" b="6470">Subord)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="13" gridRowTill="13" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1656" t="6542" r="1747" b="6725" alignment="left" li="129" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="1656" t="6542" r="1747" b="6725" baseLine="6706" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="6542" r="1747" b="6725">$</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="13" gridRowTill="13" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="6552" r="4824" b="6754" alignment="left" li="119" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="2534" t="6552" r="4824" b="6754" baseLine="6706" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2534" t="6552" r="3293" b="6739">numeral,</wd>

<space/>

<wd l="3365" t="6552" r="4200" b="6754">quantifier</wd>

<space/>

<wd l="4262" t="6557" r="4824" b="6749">(Num)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="14" gridRowTill="14" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1670" t="6835" r="1699" b="6989" alignment="left" li="129" spaceAfter="30" lsp="exactly" lspExact="248" language="en">

<ln l="1670" t="6835" r="1699" b="6989" baseLine="6984" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1670" t="6835" r="1699" b="6989">!</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="14" gridRowTill="14" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="6830" r="3912" b="7032" alignment="left" li="119" spaceAfter="30" lsp="exactly" lspExact="248" language="en">

<ln l="2534" t="6830" r="3912" b="7032" baseLine="6984" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2534" t="6830" r="3533" b="7032">interjection</wd>

<space/>

<wd l="3595" t="6830" r="3912" b="7032">(Itj)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="15" gridRowTill="15" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1651" t="7114" r="1805" b="7267" alignment="left" li="129" spaceAfter="299" lsp="exactly" lspExact="247" language="en">

<ln l="1651" t="7114" r="1805" b="7267" baseLine="7262" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1651" t="7114" r="1805" b="7267">G</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="15" gridRowTill="15" alignment="left" verticalAlignment="top">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="7109" r="5530" b="7584" alignment="left" li="108" spaceAfter="30" lsp="exactly" lspExact="258" language="en">

<ln l="2534" t="7109" r="5530" b="7310" baseLine="7262" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2534" t="7109" r="3168" b="7310">foreign</wd>

<space/>

<wd l="3221" t="7109" r="3797" b="7296">words,</wd>

<space/>

<wd l="3864" t="7109" r="5074" b="7296">abbreviations,</wd>

<space/>

<wd l="5141" t="7109" r="5530" b="7267">item</wd>

<space/>

</ln>

<ln l="2544" t="7382" r="5261" b="7584" baseLine="7531" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2544" t="7382" r="3326" b="7584">(Foreign,</wd>

<space/>

<wd l="3394" t="7382" r="3768" b="7570">Abr,</wd>

<space/>

<wd l="3835" t="7387" r="4277" b="7570">Item,</wd>

<space/>

<wd l="4344" t="7382" r="5261" b="7579">Unknown)</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="16" gridRowTill="16" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1675" t="7680" r="1747" b="7810" alignment="left" li="129" spaceBefore="57" spaceAfter="35" lsp="exactly" lspExact="176" language="en">

<ln l="1675" t="7680" r="1747" b="7810" baseLine="7810" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Lucida Console" fontPitch="fixed" spacing="0">

<wd l="1675" t="7680" r="1747" b="7704">~</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="16" gridRowTill="16" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2539" t="7661" r="4037" b="7819" alignment="left" li="119" spaceAfter="25" lsp="exactly" lspExact="243" language="en">

<ln l="2539" t="7661" r="4037" b="7819" baseLine="7810" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2539" t="7661" r="3360" b="7819">discourse</wd>

<space/>

<wd l="3418" t="7661" r="4037" b="7819">marker</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="17" gridRowTill="17" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="7944" r="1757" b="8093" alignment="left" li="129" spaceAfter="30" lsp="exactly" lspExact="248" language="en">

<ln l="1646" t="7944" r="1757" b="8093" baseLine="8093" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="7944" r="1757" b="8093">#</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="17" gridRowTill="17" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="7939" r="3202" b="8141" alignment="left" li="119" spaceAfter="30" lsp="exactly" lspExact="248" language="en">

<ln l="2534" t="7939" r="3202" b="8141" baseLine="8093" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2534" t="7939" r="3202" b="8141">hashtag</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="18" gridRowTill="18" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="8222" r="2290" b="8376" alignment="left" li="129" spaceAfter="25" lsp="exactly" lspExact="247" language="en">

<ln l="1646" t="8222" r="2290" b="8376" baseLine="8371" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="8222" r="2290" b="8376">#MWE</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="18" gridRowTill="18" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="8218" r="4234" b="8419" alignment="left" li="119" spaceAfter="25" lsp="exactly" lspExact="247" language="en">

<ln l="2534" t="8218" r="4234" b="8419" baseLine="8371" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2534" t="8218" r="3518" b="8376">multi-word</wd>

<space/>

<wd l="3571" t="8218" r="4234" b="8419">hashtag</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="19" gridRowTill="19" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1670" t="8501" r="1824" b="8654" alignment="left" li="129" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="1670" t="8501" r="1824" b="8654" baseLine="8650" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1670" t="8501" r="1824" b="8654">@</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="19" gridRowTill="19" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2539" t="8496" r="3485" b="8654" alignment="left" li="119" spaceAfter="20" lsp="exactly" lspExact="248" language="en">

<ln l="2539" t="8496" r="3485" b="8654" baseLine="8650" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2539" t="8496" r="3485" b="8654">at-mention</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="20" gridRowTill="20" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="8779" r="1781" b="8928" alignment="left" li="129" spaceAfter="30" lsp="exactly" lspExact="248" language="en">

<ln l="1646" t="8779" r="1781" b="8928" baseLine="8928" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="8779" r="1781" b="8928">E</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="20" gridRowTill="20" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2539" t="8774" r="3350" b="8933" alignment="left" li="119" spaceAfter="30" lsp="exactly" lspExact="248" language="en">

<ln l="2539" t="8774" r="3350" b="8933" baseLine="8928" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2539" t="8774" r="3350" b="8933">emoticon</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="21" gridRowTill="21" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1646" t="9062" r="1805" b="9216" alignment="left" li="129" spaceAfter="26" lsp="exactly" lspExact="247" language="en">

<ln l="1646" t="9062" r="1805" b="9216" baseLine="9206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1646" t="9062" r="1805" b="9216">U</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="21" gridRowTill="21" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2534" t="9058" r="5357" b="9254" alignment="left" li="119" spaceAfter="26" lsp="exactly" lspExact="247" language="en">

<ln l="2534" t="9058" r="5357" b="9254" baseLine="9206" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="2534" t="9058" r="3514" b="9216">URL/email</wd>

<space/>

<wd l="3576" t="9058" r="4776" b="9216">address/XML</wd>

<space/>

<wd l="4838" t="9058" r="5357" b="9254">(Web)</wd>

</ln>

</para>

</cell>

</table>

<para l="1440" t="9614" r="5794" b="10358" alignment="justified" lsp="exactly" lspExact="269" language="en">

<ln l="1440" t="9614" r="5794" b="9816" baseLine="9763" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="9614" r="1920" b="9773">Table</wd>

<space/>

<wd l="2026" t="9619" r="2155" b="9773">1:</wd>

<space/>

<wd l="2299" t="9614" r="3082" b="9816">Mapping</wd>

<space/>

<wd l="3173" t="9614" r="3365" b="9773">of</wd>

<space/>

<wd l="3437" t="9614" r="3835" b="9773">Irish</wd>

<space/>

<wd l="3922" t="9614" r="4550" b="9773">Twitter</wd>

<space/>

<wd l="4627" t="9638" r="5141" b="9816">tagset</wd>

<space/>

<wd l="5222" t="9638" r="5386" b="9773">to</wd>

<space/>

<wd l="5472" t="9619" r="5794" b="9768">PA-</wd>

</ln>

<ln l="1440" t="9883" r="5794" b="10085" baseLine="10032" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="9888" r="2002" b="10042">ROLE</wd>

<space/>

<wd l="2083" t="9907" r="2635" b="10085">tagset.</wd>

<space/>

<wd l="2798" t="9888" r="2957" b="10080">(*</wd>

<space/>

<wd l="3053" t="9883" r="3821" b="10042">indicates</wd>

<space/>

<wd l="3912" t="9883" r="4123" b="10042">all</wd>

<space/>

<wd l="4205" t="9883" r="4709" b="10042">forms</wd>

<space/>

<wd l="4800" t="9883" r="4992" b="10042">of</wd>

<space/>

<wd l="5059" t="9883" r="5323" b="10042">the</wd>

<space/>

<wd l="5410" t="9883" r="5794" b="10042">fine-</wd>

</ln>

<ln l="1445" t="10157" r="3518" b="10358" baseLine="10306" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="10157" r="2098" b="10358">grained</wd>

<space/>

<wd l="2160" t="10181" r="2395" b="10315">set</wd>

<space/>

<wd l="2448" t="10157" r="2702" b="10315">for</wd>

<space/>

<wd l="2755" t="10157" r="3082" b="10315">that</wd>

<space/>

<wd l="3134" t="10162" r="3518" b="10358">tag.)</wd>

</ln>

</para>

<para l="1440" t="10848" r="5808" b="11323" alignment="justified" spaceBefore="421" lsp="exactly" lspExact="272" language="en">

<ln l="1440" t="10848" r="5808" b="11050" baseLine="11002" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="10848" r="1853" b="11006">been</wd>

<space/>

<wd l="1934" t="10848" r="2299" b="11050">split</wd>

<space/>

<wd l="2371" t="10848" r="2587" b="11050">by</wd>

<space/>

<wd l="2659" t="10848" r="2928" b="11006">the</wd>

<space/>

<wd l="3000" t="10848" r="4925" b="11050">language-independent</wd>

<space/>

<wd l="4997" t="10848" r="5808" b="11006">tokenizer</wd>

<space/>

</ln>

<ln l="1450" t="11122" r="4872" b="11323" baseLine="11270">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="11126" r="1814" b="11323">(e.g.</wd>

<space/>

<wd l="1896" t="11122" r="2160" b="11280">the</wd>

<space/>

<wd l="2222" t="11122" r="3139" b="11323">compound</wd>

<space/>

<wd l="3192" t="11122" r="4176" b="11323">preposition</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4229" t="11174" r="4445" b="11323">go</wd>

<space/>

</run>

<wd l="4526" t="11122" r="4872" b="11318"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">dtí)</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="11405" r="5803" b="12422" alignment="justified" spaceBefore="12" fli="216" lsp="exactly" lspExact="272" language="en">

<bullet type="ordered" numChars="4">

</bullet>

<ln l="1666" t="11405" r="5794" b="11606" baseLine="11558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1666" t="11410" r="1973" b="11558">(3)</wd>

<space/>

<wd l="1973" t="11405" r="2491" b="11606">Using</wd>

<space/>

<wd l="2558" t="11405" r="3178" b="11606">regular</wd>

<space/>

<wd l="3240" t="11405" r="4296" b="11606">expressions,</wd>

<space/>

<wd l="4368" t="11458" r="4622" b="11563">we</wd>

<space/>

<wd l="4685" t="11405" r="5064" b="11563">then</wd>

<space/>

<wd l="5136" t="11405" r="5501" b="11606">split</wd>

<space/>

<wd l="5563" t="11429" r="5794" b="11563">to-</wd>

</ln>

<ln l="1440" t="11678" r="5798" b="11875" baseLine="11827">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="11678" r="1829" b="11837">kens</wd>

<space/>

<wd l="1882" t="11678" r="2270" b="11837">with</wd>

<space/>

<wd l="2314" t="11678" r="2582" b="11837">the</wd>

<space/>

<wd l="2630" t="11678" r="3686" b="11837">contractions</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3744" t="11678" r="3912" b="11837">b’</wd>

<space/>

<wd l="3970" t="11678" r="4358" b="11875">(ba),</wd>

<space/>

<wd l="4426" t="11678" r="4603" b="11837">d’</wd>

<space/>

<wd l="4661" t="11678" r="5050" b="11875">(do),</wd>

<space/>

<wd l="5117" t="11683" r="5342" b="11837">m’</wd>

<space/>

<wd l="5400" t="11683" r="5798" b="11875">(mo)</wd>

<space/>

</run>

</ln>

<ln l="1440" t="11947" r="5803" b="12149" baseLine="12101">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="11947" r="2170" b="12149">prefixes.</wd>

<space/>

<wd l="2381" t="11952" r="2688" b="12106">For</wd>

<space/>

<wd l="2789" t="11947" r="3518" b="12149">example</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3619" t="11947" r="4387" b="12149">b’fhéidir</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4507" t="11947" r="5261" b="12149">‘maybe’;</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5395" t="11947" r="5803" b="12106">d’ith</wd>

<space/>

</run>

</ln>

<ln l="1464" t="12221" r="3696" b="12422" baseLine="12370">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1464" t="12226" r="1886" b="12408">‘ate’;</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1954" t="12226" r="2664" b="12422">m’aigne</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2750" t="12226" r="3072" b="12422">‘my</wd>

<space/>

<wd l="3130" t="12221" r="3696" b="12379">mind’.</wd>

</run>

</ln>

</para>

<para l="1440" t="12504" r="5803" b="13522" alignment="justified" spaceBefore="10" fli="216" lsp="exactly" lspExact="272" language="en">

<bullet type="ordered" numChars="4">

</bullet>

<ln l="1666" t="12504" r="5794" b="12706" baseLine="12658" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1666" t="12509" r="1992" b="12658">(4)</wd>

<space/>

<wd l="1992" t="12509" r="2275" b="12662">We</wd>

<space/>

<wd l="2357" t="12504" r="2746" b="12662">took</wd>

<space/>

<wd l="2827" t="12557" r="2923" b="12662">a</wd>

<space/>

<wd l="3000" t="12504" r="4195" b="12706">bootstrapping</wd>

<space/>

<wd l="4282" t="12504" r="5078" b="12706">approach</wd>

<space/>

<wd l="5155" t="12504" r="5371" b="12706">by</wd>

<space/>

<wd l="5453" t="12557" r="5794" b="12706">pre-</wd>

</ln>

<ln l="1440" t="12778" r="5794" b="12979" baseLine="12926" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12778" r="2093" b="12979">tagging</wd>

<space/>

<wd l="2189" t="12778" r="2501" b="12936">and</wd>

<space/>

<wd l="2587" t="12778" r="3662" b="12979">lemmatising</wd>

<space/>

<wd l="3754" t="12778" r="4022" b="12936">the</wd>

<space/>

<wd l="4114" t="12778" r="4478" b="12936">data</wd>

<space/>

<wd l="4560" t="12778" r="4949" b="12936">with</wd>

<space/>

<wd l="5040" t="12778" r="5304" b="12936">the</wd>

<space/>

<wd l="5395" t="12778" r="5794" b="12936">rule-</wd>

</ln>

<ln l="1440" t="13046" r="5803" b="13248" baseLine="13195" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13046" r="1939" b="13205">based</wd>

<space/>

<wd l="1997" t="13046" r="2395" b="13205">Irish</wd>

<space/>

<wd l="2453" t="13051" r="3475" b="13248">POS-tagger</wd>

<space/>

<wd l="3533" t="13046" r="3912" b="13234">first,</wd>

<space/>

<wd l="3989" t="13046" r="4301" b="13205">and</wd>

<space/>

<wd l="4354" t="13046" r="4733" b="13205">then</wd>

<space/>

<wd l="4790" t="13046" r="5482" b="13248">mapped</wd>

<space/>

<wd l="5539" t="13046" r="5803" b="13205">the</wd>

<space/>

</ln>

<ln l="1440" t="13320" r="4795" b="13522" baseLine="13469" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13344" r="1786" b="13522">tags</wd>

<space/>

<wd l="1848" t="13344" r="2011" b="13478">to</wd>

<space/>

<wd l="2074" t="13373" r="2366" b="13478">our</wd>

<space/>

<wd l="2414" t="13373" r="2770" b="13478">new</wd>

<space/>

<wd l="2827" t="13320" r="4181" b="13522">Twitter-specific</wd>

<space/>

<wd l="4243" t="13344" r="4795" b="13522">tagset.</wd>

</ln>

</para>

<para l="1440" t="13603" r="5808" b="14890" alignment="justified" spaceBefore="8" spaceAfter="169" fli="216" lsp="exactly" lspExact="272" language="en">

<bullet type="ordered" numChars="4">

</bullet>

<ln l="1666" t="13603" r="5803" b="13805" baseLine="13752" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1666" t="13603" r="1954" b="13752">(5)</wd>

<space/>

<wd l="1954" t="13608" r="2136" b="13757">In</wd>

<space/>

<wd l="2184" t="13656" r="2630" b="13762">cases</wd>

<space/>

<wd l="2678" t="13603" r="3211" b="13762">where</wd>

<space/>

<wd l="3254" t="13603" r="3518" b="13762">the</wd>

<space/>

<wd l="3562" t="13603" r="4474" b="13762">rule-based</wd>

<space/>

<wd l="4512" t="13627" r="5064" b="13805">tagger</wd>

<space/>

<wd l="5098" t="13603" r="5597" b="13762">failed</wd>

<space/>

<wd l="5635" t="13627" r="5803" b="13762">to</wd>

<space/>

</ln>

<ln l="1440" t="13877" r="5803" b="14078" baseLine="14026" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1440" t="13877" r="2141" b="14078">produce</wd>

<space/>

<wd l="2194" t="13930" r="2290" b="14035">a</wd>

<space/>

<wd l="2338" t="13877" r="2928" b="14078">unique</wd>

<space/>

<wd l="2976" t="13901" r="3288" b="14078">tag,</wd>

<space/>

<wd l="3346" t="13930" r="3600" b="14035">we</wd>

<space/>

<wd l="3648" t="13877" r="4051" b="14035">used</wd>

<space/>

<wd l="4104" t="13930" r="4200" b="14035">a</wd>

<space/>

<wd l="4253" t="13877" r="4824" b="14078">simple</wd>

<space/>

<wd l="4872" t="13877" r="5496" b="14078">bigram</wd>

<space/>

<wd l="5539" t="13901" r="5803" b="14078">tag</wd>

<space/>

</ln>

<ln l="1440" t="14146" r="5808" b="14347" baseLine="14294" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1440" t="14146" r="1982" b="14304">model</wd>

<space/>

<wd l="2074" t="14146" r="2746" b="14342">(trained</wd>

<space/>

<wd l="2832" t="14198" r="3043" b="14304">on</wd>

<space/>

<wd l="3125" t="14146" r="3389" b="14304">the</wd>

<space/>

<wd l="3475" t="14146" r="4670" b="14347">gold-standard</wd>

<space/>

<wd l="4752" t="14146" r="5808" b="14347">POS-tagged</wd>

<space/>

</ln>

<ln l="1445" t="14414" r="5794" b="14616" baseLine="14568" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1445" t="14467" r="2016" b="14616">corpus</wd>

<space/>

<wd l="2102" t="14414" r="2530" b="14573">from</wd>

<space/>

<wd l="2611" t="14414" r="4123" b="14573">UiDhonnchadha</wd>

<space/>

<wd l="4214" t="14419" r="4776" b="14611">(2009)</wd>

<space/>

<wd l="4867" t="14510" r="4978" b="14525">–</wd>

<space/>

<wd l="5069" t="14467" r="5333" b="14573">see</wd>

<space/>

<wd l="5424" t="14419" r="5794" b="14573">Sec-</wd>

</ln>

<ln l="1440" t="14688" r="5803" b="14890" baseLine="14837" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="1440" t="14688" r="1781" b="14846">tion</wd>

<space/>

<wd l="1834" t="14688" r="2165" b="14885">5.1)</wd>

<space/>

<wd l="2222" t="14712" r="2386" b="14846">to</wd>

<space/>

<wd l="2443" t="14688" r="3043" b="14846">choose</wd>

<space/>

<wd l="3096" t="14688" r="3360" b="14846">the</wd>

<space/>

<wd l="3408" t="14712" r="3835" b="14846">most</wd>

<space/>

<wd l="3883" t="14688" r="4373" b="14890">likely</wd>

<space/>

<wd l="4426" t="14712" r="4690" b="14890">tag</wd>

<space/>

<wd l="4738" t="14688" r="5165" b="14846">from</wd>

<space/>

<wd l="5218" t="14741" r="5803" b="14890">among</wd>

</ln>

</para>

<rulerline l="1430" t="15072" r="2640" b="15072" type="single" width="10" color="000000"/>

<para l="1454" t="15144" r="2285" b="15264" alignment="left" spaceBefore="78" spaceAfter="55" lsp="exactly" lspExact="151" language="en">

<ln l="1454" t="15144" r="2285" b="15264" baseLine="15259" underlined="none" subsuperscript="none" fontSize="850" fontFace="Lucida Console" fontPitch="fixed" spacing="1">

<wd l="1454" t="15144" r="2285" b="15264">irishfst</wd>

</ln>

</para>

</column>

<column l="6141" t="1253" r="10528" b="15358">

<para l="6144" t="1320" r="9408" b="1522" alignment="left" spaceBefore="5" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="1320" r="9408" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="1320" r="6605" b="1478">those</wd>

<space/>

<wd l="6667" t="1344" r="7219" b="1522">output</wd>

<space/>

<wd l="7272" t="1320" r="7488" b="1522">by</wd>

<space/>

<wd l="7546" t="1320" r="7810" b="1478">the</wd>

<space/>

<wd l="7867" t="1320" r="8779" b="1478">rule-based</wd>

<space/>

<wd l="8832" t="1344" r="9408" b="1522">tagger.</wd>

</ln>

</para>

<para l="6149" t="1594" r="10502" b="2069" alignment="justified" fli="216" lsp="exactly" lspExact="271" language="en">

<bullet type="ordered" numChars="4">

</bullet>

<ln l="6374" t="1594" r="10502" b="1795" baseLine="1747" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6374" t="1594" r="6667" b="1747">(6)</wd>

<space/>

<wd l="6667" t="1594" r="7315" b="1795">Finally,</wd>

<space/>

<wd l="7378" t="1646" r="7632" b="1752">we</wd>

<space/>

<wd l="7680" t="1594" r="8491" b="1795">manually</wd>

<space/>

<wd l="8549" t="1594" r="9355" b="1752">corrected</wd>

<space/>

<wd l="9403" t="1594" r="9797" b="1752">both</wd>

<space/>

<wd l="9845" t="1594" r="10109" b="1752">the</wd>

<space/>

<wd l="10162" t="1618" r="10502" b="1795">tags</wd>

<space/>

</ln>

<ln l="6149" t="1867" r="10080" b="2069" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="1867" r="6461" b="2026">and</wd>

<space/>

<wd l="6514" t="1867" r="7186" b="2026">lemmas</wd>

<space/>

<wd l="7248" t="1891" r="7416" b="2026">to</wd>

<space/>

<wd l="7478" t="1891" r="7992" b="2026">create</wd>

<space/>

<wd l="8054" t="1920" r="8150" b="2026">a</wd>

<space/>

<wd l="8203" t="1867" r="9398" b="2069">gold-standard</wd>

<space/>

<wd l="9461" t="1920" r="10080" b="2069">corpus.</wd>

</ln>

</para>

<para l="6144" t="2318" r="7690" b="2477" alignment="left" spaceBefore="203" lsp="exactly" lspExact="249" language="en">

<ln l="6144" t="2318" r="7690" b="2477" baseLine="2467" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="6144" t="2318" r="6413" b="2477">3.3</wd>

<space/>

<wd l="6638" t="2318" r="7690" b="2477">Annotation</wd>

</ln>

</para>

<para l="6144" t="2669" r="10517" b="6125" alignment="justified" spaceBefore="68" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="2669" r="10502" b="2827" baseLine="2822" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2669" r="6485" b="2827">The</wd>

<space/>

<wd l="6562" t="2669" r="7483" b="2827">annotation</wd>

<space/>

<wd l="7555" t="2669" r="7906" b="2827">task</wd>

<space/>

<wd l="7978" t="2722" r="8309" b="2827">was</wd>

<space/>

<wd l="8400" t="2669" r="8962" b="2827">shared</wd>

<space/>

<wd l="9034" t="2669" r="9763" b="2827">between</wd>

<space/>

<wd l="9835" t="2693" r="10157" b="2827">two</wd>

<space/>

<wd l="10238" t="2722" r="10502" b="2827">an-</wd>

</ln>

<ln l="6144" t="2942" r="10512" b="3101" baseLine="3091" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2966" r="6893" b="3101">notators.</wd>

<space/>

<wd l="6974" t="2942" r="7906" b="3101">Correction</wd>

<space/>

<wd l="7958" t="2942" r="8150" b="3101">of</wd>

<space/>

<wd l="8184" t="2942" r="8453" b="3101">the</wd>

<space/>

<wd l="8510" t="2942" r="8846" b="3101">first</wd>

<space/>

<wd l="8899" t="2942" r="9216" b="3101">500</wd>

<space/>

<wd l="9274" t="2966" r="9821" b="3101">tweets</wd>

<space/>

<wd l="9883" t="2942" r="10512" b="3101">formed</wd>

<space/>

</ln>

<ln l="6149" t="3211" r="10517" b="3413" baseLine="3360" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="3264" r="6245" b="3370">a</wd>

<space/>

<wd l="6312" t="3211" r="6739" b="3370">basis</wd>

<space/>

<wd l="6816" t="3211" r="7075" b="3370">for</wd>

<space/>

<wd l="7142" t="3211" r="7944" b="3413">assessing</wd>

<space/>

<wd l="8016" t="3211" r="8405" b="3370">both</wd>

<space/>

<wd l="8472" t="3211" r="8741" b="3370">the</wd>

<space/>

<wd l="8808" t="3211" r="9893" b="3370">intuitiveness</wd>

<space/>

<wd l="9974" t="3211" r="10166" b="3370">of</wd>

<space/>

<wd l="10224" t="3264" r="10517" b="3370">our</wd>

<space/>

</ln>

<ln l="6144" t="3485" r="10498" b="3686" baseLine="3634" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="3509" r="6658" b="3686">tagset</wd>

<space/>

<wd l="6744" t="3485" r="7056" b="3643">and</wd>

<space/>

<wd l="7138" t="3485" r="7406" b="3643">the</wd>

<space/>

<wd l="7488" t="3485" r="8237" b="3686">usability</wd>

<space/>

<wd l="8328" t="3485" r="8520" b="3643">of</wd>

<space/>

<wd l="8597" t="3538" r="8885" b="3643">our</wd>

<space/>

<wd l="8971" t="3485" r="9888" b="3643">annotation</wd>

<space/>

<wd l="9974" t="3485" r="10498" b="3686">guide.</wd>

<space/>

</ln>

<ln l="6149" t="3754" r="10512" b="3912" baseLine="3902" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="3754" r="6787" b="3912">Several</wd>

<space/>

<wd l="6845" t="3754" r="7829" b="3912">discussions</wd>

<space/>

<wd l="7891" t="3754" r="8203" b="3912">and</wd>

<space/>

<wd l="8251" t="3754" r="9024" b="3912">revisions</wd>

<space/>

<wd l="9082" t="3806" r="9504" b="3912">were</wd>

<space/>

<wd l="9557" t="3754" r="10306" b="3912">involved</wd>

<space/>

<wd l="10358" t="3778" r="10512" b="3912">at</wd>

<space/>

</ln>

<ln l="6144" t="4022" r="10512" b="4224" baseLine="4176" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4022" r="6451" b="4181">this</wd>

<space/>

<wd l="6557" t="4046" r="6994" b="4224">stage</wd>

<space/>

<wd l="7085" t="4022" r="7642" b="4181">before</wd>

<space/>

<wd l="7733" t="4022" r="8539" b="4224">finalising</wd>

<space/>

<wd l="8630" t="4022" r="8894" b="4181">the</wd>

<space/>

<wd l="8981" t="4046" r="9533" b="4224">tagset.</wd>

<space/>

<wd l="9710" t="4022" r="10051" b="4181">The</wd>

<space/>

<wd l="10138" t="4046" r="10512" b="4181">next</wd>

<space/>

</ln>

<ln l="6168" t="4296" r="10512" b="4454" baseLine="4445" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6168" t="4301" r="6581" b="4454">1000</wd>

<space/>

<wd l="6677" t="4320" r="7224" b="4454">tweets</wd>

<space/>

<wd l="7325" t="4349" r="7747" b="4454">were</wd>

<space/>

<wd l="7848" t="4296" r="8693" b="4454">annotated</wd>

<space/>

<wd l="8784" t="4296" r="8957" b="4450">in</wd>

<space/>

<wd l="9053" t="4296" r="10027" b="4454">accordance</wd>

<space/>

<wd l="10123" t="4296" r="10512" b="4454">with</wd>

<space/>

</ln>

<ln l="6144" t="4565" r="10502" b="4766" baseLine="4718" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4565" r="6413" b="4723">the</wd>

<space/>

<wd l="6490" t="4565" r="7426" b="4766">guidelines,</wd>

<space/>

<wd l="7517" t="4565" r="7997" b="4723">while</wd>

<space/>

<wd l="8074" t="4565" r="8544" b="4766">using</wd>

<space/>

<wd l="8621" t="4565" r="8885" b="4723">the</wd>

<space/>

<wd l="8962" t="4565" r="9298" b="4723">first</wd>

<space/>

<wd l="9374" t="4565" r="9696" b="4723">500</wd>

<space/>

<wd l="9778" t="4618" r="9946" b="4723">as</wd>

<space/>

<wd l="10032" t="4618" r="10128" b="4723">a</wd>

<space/>

<wd l="10195" t="4565" r="10502" b="4723">ref-</wd>

</ln>

<ln l="6149" t="4838" r="10517" b="5040" baseLine="4987" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="4891" r="6758" b="4997">erence.</wd>

<space/>

<wd l="6840" t="4843" r="7061" b="4997">At</wd>

<space/>

<wd l="7114" t="4838" r="7421" b="4997">this</wd>

<space/>

<wd l="7493" t="4862" r="7973" b="5040">stage,</wd>

<space/>

<wd l="8040" t="4891" r="8294" b="4997">we</wd>

<space/>

<wd l="8352" t="4838" r="9110" b="4997">removed</wd>

<space/>

<wd l="9168" t="4891" r="9264" b="4997">a</wd>

<space/>

<wd l="9326" t="4838" r="9787" b="4997">small</wd>

<space/>

<wd l="9845" t="4838" r="10517" b="4997">number</wd>

<space/>

</ln>

<ln l="6149" t="5107" r="10502" b="5309" baseLine="5261" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="5107" r="6341" b="5266">of</wd>

<space/>

<wd l="6379" t="5131" r="6931" b="5266">tweets</wd>

<space/>

<wd l="6989" t="5107" r="7320" b="5266">that</wd>

<space/>

<wd l="7378" t="5107" r="8218" b="5266">contained</wd>

<space/>

<wd l="8294" t="5112" r="8770" b="5266">100%</wd>

<space/>

<wd l="8832" t="5107" r="9499" b="5309">English</wd>

<space/>

<wd l="9552" t="5131" r="9878" b="5266">text</wd>

<space/>

<wd l="9941" t="5112" r="10502" b="5304">(errors</wd>

<space/>

</ln>

<ln l="6144" t="5381" r="10502" b="5582" baseLine="5530" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5381" r="6317" b="5534">in</wd>

<space/>

<wd l="6389" t="5381" r="6653" b="5539">the</wd>

<space/>

<wd l="6725" t="5381" r="7512" b="5582">language</wd>

<space/>

<wd l="7584" t="5381" r="8491" b="5578">identifier).</wd>

<space/>

<wd l="8621" t="5381" r="8899" b="5534">All</wd>

<space/>

<wd l="8976" t="5381" r="9427" b="5539">other</wd>

<space/>

<wd l="9494" t="5405" r="10042" b="5539">tweets</wd>

<space/>

<wd l="10128" t="5434" r="10502" b="5539">con-</wd>

</ln>

<ln l="6144" t="5650" r="10502" b="5851" baseLine="5803" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="5650" r="6749" b="5851">taining</wd>

<space/>

<wd l="6830" t="5650" r="7632" b="5808">non-Irish</wd>

<space/>

<wd l="7714" t="5674" r="8035" b="5808">text</wd>

<space/>

<wd l="8117" t="5650" r="9120" b="5851">represented</wd>

<space/>

<wd l="9202" t="5650" r="9634" b="5808">valid</wd>

<space/>

<wd l="9710" t="5650" r="10502" b="5808">instances</wd>

<space/>

</ln>

<ln l="6149" t="5923" r="7757" b="6125" baseLine="6072" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="5923" r="6341" b="6082">of</wd>

<space/>

<wd l="6389" t="5923" r="7757" b="6125">code-switching.</wd>

</ln>

</para>

<para l="6144" t="6192" r="10517" b="7752" alignment="justified" fli="216" lsp="exactly" lspExact="272" language="en">

<ln l="6365" t="6192" r="10512" b="6394" baseLine="6346" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="6192" r="6701" b="6350">The</wd>

<space/>

<wd l="6797" t="6216" r="7694" b="6350">annotators</wd>

<space/>

<wd l="7790" t="6245" r="8213" b="6350">were</wd>

<space/>

<wd l="8309" t="6192" r="8654" b="6350">also</wd>

<space/>

<wd l="8750" t="6192" r="9240" b="6350">asked</wd>

<space/>

<wd l="9331" t="6216" r="9494" b="6350">to</wd>

<space/>

<wd l="9590" t="6192" r="10104" b="6394">verify</wd>

<space/>

<wd l="10200" t="6192" r="10512" b="6350">and</wd>

<space/>

</ln>

<ln l="6149" t="6466" r="10502" b="6624" baseLine="6614" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="6490" r="6754" b="6624">correct</wd>

<space/>

<wd l="6826" t="6466" r="7090" b="6624">the</wd>

<space/>

<wd l="7166" t="6466" r="7766" b="6624">lemma</wd>

<space/>

<wd l="7838" t="6466" r="8266" b="6624">form</wd>

<space/>

<wd l="8338" t="6466" r="8482" b="6619">if</wd>

<space/>

<wd l="8549" t="6518" r="8746" b="6624">an</wd>

<space/>

<wd l="8822" t="6466" r="9600" b="6624">incorrect</wd>

<space/>

<wd l="9677" t="6466" r="10104" b="6624">form</wd>

<space/>

<wd l="10176" t="6518" r="10502" b="6624">was</wd>

<space/>

</ln>

<ln l="6154" t="6734" r="10502" b="6936" baseLine="6888" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="6734" r="7008" b="6936">suggested</wd>

<space/>

<wd l="7118" t="6734" r="7334" b="6936">by</wd>

<space/>

<wd l="7450" t="6734" r="7718" b="6893">the</wd>

<space/>

<wd l="7834" t="6734" r="9101" b="6936">morphological</wd>

<space/>

<wd l="9221" t="6734" r="9974" b="6936">analyser.</wd>

<space/>

<wd l="10234" t="6734" r="10502" b="6888">All</wd>

<space/>

</ln>

<ln l="6149" t="7008" r="10502" b="7210" baseLine="7157" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="7008" r="6600" b="7166">other</wd>

<space/>

<wd l="6672" t="7008" r="7474" b="7166">tokeniser</wd>

<space/>

<wd l="7550" t="7008" r="8117" b="7195">issues,</wd>

<space/>

<wd l="8218" t="7008" r="8664" b="7166">often</wd>

<space/>

<wd l="8741" t="7008" r="9562" b="7210">involving</wd>

<space/>

<wd l="9643" t="7008" r="10046" b="7166">Irish</wd>

<space/>

<wd l="10128" t="7061" r="10502" b="7166">con-</wd>

</ln>

<ln l="6144" t="7277" r="10517" b="7478" baseLine="7430" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7277" r="6941" b="7464">tractions,</wd>

<space/>

<wd l="7042" t="7330" r="7464" b="7435">were</wd>

<space/>

<wd l="7550" t="7277" r="7896" b="7435">also</wd>

<space/>

<wd l="7982" t="7277" r="8842" b="7435">addressed</wd>

<space/>

<wd l="8928" t="7301" r="9082" b="7435">at</wd>

<space/>

<wd l="9163" t="7277" r="9470" b="7435">this</wd>

<space/>

<wd l="9566" t="7301" r="10051" b="7478">stage.</wd>

<space/>

<wd l="10210" t="7282" r="10517" b="7435">For</wd>

<space/>

</ln>

<ln l="6149" t="7550" r="8405" b="7752" baseLine="7699">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6149" t="7550" r="6878" b="7752">example</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6946" t="7555" r="7344" b="7709">Tá’n</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="7416" t="7642" r="7555" b="7656">−</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="7646" t="7584" r="7786" b="7714">&gt;</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7867" t="7555" r="8088" b="7709">Tá</wd>

<space/>

</run>

<wd l="8141" t="7603" r="8405" b="7709"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">an</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="8016" r="9341" b="8237" alignment="left" spaceBefore="209" lsp="exactly" lspExact="279" language="en">

<ln l="6144" t="8016" r="9341" b="8237" baseLine="8179" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">

<wd l="6144" t="8016" r="6259" b="8184">4</wd>

<space/>

<wd l="6509" t="8016" r="8155" b="8189">Inter-Annotator</wd>

<space/>

<wd l="8218" t="8016" r="9341" b="8237">Agreement</wd>

</ln>

</para>

<para l="6144" t="8448" r="10512" b="11626" alignment="justified" spaceBefore="131" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="8448" r="10502" b="8650" baseLine="8602" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8453" r="7517" b="8606">Inter-Annotator</wd>

<space/>

<wd l="7584" t="8472" r="8491" b="8650">agreement</wd>

<space/>

<wd l="8568" t="8453" r="9082" b="8645">(IAA)</wd>

<space/>

<wd l="9173" t="8448" r="9763" b="8606">studies</wd>

<space/>

<wd l="9845" t="8501" r="10104" b="8606">are</wd>

<space/>

<wd l="10181" t="8501" r="10502" b="8606">car-</wd>

</ln>

<ln l="6144" t="8722" r="10502" b="8923" baseLine="8870" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="8722" r="6485" b="8880">ried</wd>

<space/>

<wd l="6562" t="8746" r="6835" b="8880">out</wd>

<space/>

<wd l="6912" t="8722" r="7474" b="8923">during</wd>

<space/>

<wd l="7550" t="8722" r="8472" b="8880">annotation</wd>

<space/>

<wd l="8539" t="8722" r="8966" b="8880">tasks</wd>

<space/>

<wd l="9048" t="8746" r="9216" b="8880">to</wd>

<space/>

<wd l="9293" t="8774" r="9811" b="8880">assess</wd>

<space/>

<wd l="9898" t="8722" r="10502" b="8880">consis-</wd>

</ln>

<ln l="6144" t="8990" r="10502" b="9192" baseLine="9144" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9014" r="6643" b="9192">tency,</wd>

<space/>

<wd l="6744" t="8990" r="7234" b="9149">levels</wd>

<space/>

<wd l="7330" t="8990" r="7517" b="9149">of</wd>

<space/>

<wd l="7584" t="8990" r="7982" b="9178">bias,</wd>

<space/>

<wd l="8083" t="8990" r="8395" b="9149">and</wd>

<space/>

<wd l="8477" t="8990" r="9322" b="9192">reliability</wd>

<space/>

<wd l="9408" t="8990" r="9600" b="9149">of</wd>

<space/>

<wd l="9667" t="8990" r="9931" b="9149">the</wd>

<space/>

<wd l="10018" t="9043" r="10502" b="9149">anno-</wd>

</ln>

<ln l="6144" t="9264" r="10512" b="9466" baseLine="9413" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9264" r="6571" b="9422">tated</wd>

<space/>

<wd l="6662" t="9264" r="7066" b="9422">data.</wd>

<space/>

<wd l="7238" t="9269" r="7546" b="9422">For</wd>

<space/>

<wd l="7632" t="9317" r="7920" b="9422">our</wd>

<space/>

<wd l="8016" t="9264" r="8506" b="9466">study,</wd>

<space/>

<wd l="8616" t="9317" r="8866" b="9422">we</wd>

<space/>

<wd l="8962" t="9264" r="9451" b="9422">chose</wd>

<space/>

<wd l="9542" t="9264" r="9754" b="9422">50</wd>

<space/>

<wd l="9845" t="9264" r="10512" b="9422">random</wd>

<space/>

</ln>

<ln l="6144" t="9533" r="10512" b="9734" baseLine="9686" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="9533" r="6547" b="9691">Irish</wd>

<space/>

<wd l="6629" t="9557" r="7229" b="9720">tweets,</wd>

<space/>

<wd l="7334" t="9533" r="7872" b="9691">which</wd>

<space/>

<wd l="7954" t="9533" r="8342" b="9691">both</wd>

<space/>

<wd l="8429" t="9557" r="9326" b="9691">annotators</wd>

<space/>

<wd l="9422" t="9533" r="10003" b="9734">tagged</wd>

<space/>

<wd l="10085" t="9533" r="10512" b="9691">from</wd>

<space/>

</ln>

<ln l="6154" t="9806" r="10502" b="9965" baseLine="9955" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6154" t="9806" r="6806" b="9965">scratch.</wd>

<space/>

<wd l="6950" t="9806" r="7330" b="9965">This</wd>

<space/>

<wd l="7421" t="9806" r="8102" b="9965">differed</wd>

<space/>

<wd l="8179" t="9806" r="8606" b="9965">from</wd>

<space/>

<wd l="8678" t="9806" r="8942" b="9965">the</wd>

<space/>

<wd l="9019" t="9830" r="9336" b="9965">rest</wd>

<space/>

<wd l="9418" t="9806" r="9610" b="9965">of</wd>

<space/>

<wd l="9672" t="9806" r="9936" b="9965">the</wd>

<space/>

<wd l="10018" t="9859" r="10502" b="9965">anno-</wd>

</ln>

<ln l="6144" t="10075" r="10502" b="10277" baseLine="10224" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="10075" r="6643" b="10234">tation</wd>

<space/>

<wd l="6706" t="10128" r="7402" b="10277">process,</wd>

<space/>

<wd l="7478" t="10075" r="8016" b="10234">which</wd>

<space/>

<wd l="8078" t="10128" r="8405" b="10234">was</wd>

<space/>

<wd l="8486" t="10075" r="9912" b="10234">semi-automated.</wd>

<space/>

<wd l="10018" t="10080" r="10502" b="10234">How-</wd>

</ln>

<ln l="6149" t="10349" r="10502" b="10550" baseLine="10498" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="10402" r="6547" b="10536">ever,</wd>

<space/>

<wd l="6624" t="10349" r="7613" b="10507">elimination</wd>

<space/>

<wd l="7675" t="10349" r="7867" b="10507">of</wd>

<space/>

<wd l="7910" t="10349" r="8626" b="10550">possible</wd>

<space/>

<wd l="8683" t="10349" r="9029" b="10507">bias</wd>

<space/>

<wd l="9091" t="10349" r="9768" b="10507">towards</wd>

<space/>

<wd l="9835" t="10349" r="10099" b="10507">the</wd>

<space/>

<wd l="10162" t="10402" r="10502" b="10550">pre-</wd>

</ln>

<ln l="6149" t="10618" r="10512" b="10819" baseLine="10766" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="10618" r="7070" b="10776">annotation</wd>

<space/>

<wd l="7147" t="10642" r="7699" b="10819">output</wd>

<space/>

<wd l="7776" t="10618" r="8458" b="10776">allowed</wd>

<space/>

<wd l="8530" t="10618" r="8789" b="10776">for</wd>

<space/>

<wd l="8866" t="10670" r="8962" b="10776">a</wd>

<space/>

<wd l="9029" t="10670" r="9480" b="10776">more</wd>

<space/>

<wd l="9557" t="10618" r="10512" b="10819">disciplined</wd>

<space/>

</ln>

<ln l="6149" t="10886" r="10502" b="11088" baseLine="11040" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="10910" r="7118" b="11045">assessment</wd>

<space/>

<wd l="7186" t="10886" r="7378" b="11045">of</wd>

<space/>

<wd l="7435" t="10910" r="8342" b="11088">agreement</wd>

<space/>

<wd l="8405" t="10886" r="8818" b="11045">level</wd>

<space/>

<wd l="8890" t="10886" r="9614" b="11045">between</wd>

<space/>

<wd l="9682" t="10886" r="9946" b="11045">the</wd>

<space/>

<wd l="10018" t="10939" r="10502" b="11045">anno-</wd>

</ln>

<ln l="6144" t="11160" r="10512" b="11362" baseLine="11309" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="11184" r="6672" b="11318">tators.</wd>

<space/>

<wd l="6754" t="11165" r="7037" b="11318">We</wd>

<space/>

<wd l="7094" t="11160" r="7858" b="11318">achieved</wd>

<space/>

<wd l="7915" t="11213" r="8112" b="11318">an</wd>

<space/>

<wd l="8174" t="11184" r="9077" b="11362">agreement</wd>

<space/>

<wd l="9130" t="11184" r="9456" b="11318">rate</wd>

<space/>

<wd l="9514" t="11160" r="9706" b="11318">of</wd>

<space/>

<wd l="9749" t="11165" r="10133" b="11318">90%</wd>

<space/>

<wd l="10200" t="11160" r="10512" b="11318">and</wd>

<space/>

</ln>

<ln l="6149" t="11429" r="8966" b="11626" baseLine="11582">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="11482" r="6245" b="11587">a</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><wd l="6307" t="11482" r="6418" b="11587">κ</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6485" t="11482" r="6936" b="11587">score</wd>

<space/>

<wd l="7003" t="11429" r="7680" b="11626">(Cohen,</wd>

<space/>

<wd l="7766" t="11429" r="8242" b="11626">1960)</wd>

<space/>

<wd l="8314" t="11429" r="8501" b="11587">of</wd>

<space/>

<wd l="8549" t="11434" r="8966" b="11587">0.89.</wd>

</run>

</ln>

</para>

<para l="6144" t="11702" r="10517" b="14299" alignment="justified" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6370" t="11702" r="10502" b="11904" baseLine="11851" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="11702" r="7046" b="11861">Smaller</wd>

<space/>

<wd l="7138" t="11726" r="7723" b="11904">tagsets</wd>

<space/>

<wd l="7829" t="11702" r="8299" b="11861">make</wd>

<space/>

<wd l="8400" t="11755" r="8597" b="11861">an</wd>

<space/>

<wd l="8702" t="11702" r="9619" b="11861">annotation</wd>

<space/>

<wd l="9710" t="11702" r="10066" b="11861">task</wd>

<space/>

<wd l="10166" t="11755" r="10502" b="11861">eas-</wd>

</ln>

<ln l="6144" t="11976" r="10507" b="12134" baseLine="12125" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="11976" r="6379" b="12134">ier</wd>

<space/>

<wd l="6470" t="11976" r="6778" b="12134">due</wd>

<space/>

<wd l="6869" t="12000" r="7032" b="12134">to</wd>

<space/>

<wd l="7123" t="11976" r="7392" b="12134">the</wd>

<space/>

<wd l="7483" t="11976" r="8342" b="12134">constraint</wd>

<space/>

<wd l="8434" t="12029" r="8645" b="12134">on</wd>

<space/>

<wd l="8736" t="11976" r="9379" b="12134">choices</wd>

<space/>

<wd l="9480" t="11976" r="10253" b="12134">available</wd>

<space/>

<wd l="10339" t="12000" r="10507" b="12134">to</wd>

<space/>

</ln>

<ln l="6144" t="12245" r="10517" b="12446" baseLine="12394" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12245" r="6413" b="12403">the</wd>

<space/>

<wd l="6490" t="12269" r="7344" b="12432">annotator,</wd>

<space/>

<wd l="7435" t="12245" r="7747" b="12403">and</wd>

<space/>

<wd l="7814" t="12245" r="7954" b="12403">is</wd>

<space/>

<wd l="8035" t="12245" r="8794" b="12446">certainly</wd>

<space/>

<wd l="8870" t="12298" r="9182" b="12403">one</wd>

<space/>

<wd l="9254" t="12298" r="9826" b="12403">reason</wd>

<space/>

<wd l="9893" t="12245" r="10152" b="12403">for</wd>

<space/>

<wd l="10224" t="12298" r="10517" b="12403">our</wd>

<space/>

</ln>

<ln l="6144" t="12514" r="10512" b="12715" baseLine="12667" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12514" r="6533" b="12715">high</wd>

<space/>

<wd l="6595" t="12518" r="6984" b="12667">IAA</wd>

<space/>

<wd l="7051" t="12566" r="7546" b="12672">score.</wd>

<space/>

<wd l="7646" t="12514" r="8026" b="12672">This</wd>

<space/>

<wd l="8098" t="12514" r="8582" b="12672">result</wd>

<space/>

<wd l="8645" t="12514" r="8990" b="12672">also</wd>

<space/>

<wd l="9062" t="12538" r="9787" b="12715">suggests</wd>

<space/>

<wd l="9854" t="12514" r="10186" b="12672">that</wd>

<space/>

<wd l="10243" t="12514" r="10512" b="12672">the</wd>

<space/>

</ln>

<ln l="6144" t="12787" r="10502" b="12989" baseLine="12936" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="12787" r="6797" b="12989">tagging</wd>

<space/>

<wd l="6878" t="12787" r="7766" b="12989">guidelines</wd>

<space/>

<wd l="7848" t="12840" r="8270" b="12946">were</wd>

<space/>

<wd l="8352" t="12787" r="8774" b="12946">clear</wd>

<space/>

<wd l="8851" t="12787" r="9163" b="12946">and</wd>

<space/>

<wd l="9240" t="12840" r="9624" b="12989">easy</wd>

<space/>

<wd l="9701" t="12811" r="9869" b="12946">to</wd>

<space/>

<wd l="9946" t="12787" r="10502" b="12946">under-</wd>

</ln>

<ln l="6154" t="13056" r="10512" b="13258" baseLine="13210" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="13056" r="6648" b="13214">stand.</wd>

<space/>

<wd l="6802" t="13061" r="6960" b="13210">A</wd>

<space/>

<wd l="7042" t="13056" r="7565" b="13214">closer</wd>

<space/>

<wd l="7642" t="13056" r="8659" b="13258">comparison</wd>

<space/>

<wd l="8741" t="13056" r="9432" b="13258">analysis</wd>

<space/>

<wd l="9523" t="13056" r="9710" b="13214">of</wd>

<space/>

<wd l="9778" t="13056" r="10042" b="13214">the</wd>

<space/>

<wd l="10123" t="13061" r="10512" b="13210">IAA</wd>

<space/>

</ln>

<ln l="6149" t="13330" r="10502" b="13531" baseLine="13478" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13330" r="6514" b="13488">data</wd>

<space/>

<wd l="6581" t="13330" r="7296" b="13531">explains</wd>

<space/>

<wd l="7382" t="13382" r="7829" b="13488">some</wd>

<space/>

<wd l="7906" t="13330" r="9192" b="13531">disagreements.</wd>

<space/>

<wd l="9317" t="13330" r="9653" b="13488">The</wd>

<space/>

<wd l="9725" t="13330" r="10502" b="13488">inconsis-</wd>

</ln>

<ln l="6144" t="13598" r="10502" b="13800" baseLine="13752" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13622" r="6610" b="13800">tency</wd>

<space/>

<wd l="6686" t="13598" r="6874" b="13757">of</wd>

<space/>

<wd l="6931" t="13598" r="7661" b="13757">conflicts</wd>

<space/>

<wd l="7742" t="13622" r="8462" b="13800">suggests</wd>

<space/>

<wd l="8539" t="13598" r="8866" b="13757">that</wd>

<space/>

<wd l="8933" t="13598" r="9197" b="13757">the</wd>

<space/>

<wd l="9269" t="13598" r="10502" b="13800">disagreements</wd>

<space/>

</ln>

<ln l="6149" t="13872" r="10512" b="14074" baseLine="14021" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13925" r="6605" b="14030">arose</wd>

<space/>

<wd l="6653" t="13872" r="7080" b="14030">from</wd>

<space/>

<wd l="7128" t="13872" r="7723" b="14030">human</wd>

<space/>

<wd l="7776" t="13925" r="8227" b="14030">error.</wd>

<space/>

<wd l="8309" t="13877" r="8798" b="14030">Some</wd>

<space/>

<wd l="8856" t="13872" r="9662" b="14074">examples</wd>

<space/>

<wd l="9725" t="13925" r="9984" b="14030">are</wd>

<space/>

<wd l="10042" t="13872" r="10512" b="14074">given</wd>

<space/>

</ln>

<ln l="6144" t="14141" r="6701" b="14299" baseLine="14294" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14141" r="6701" b="14299">below.</wd>

</ln>

</para>

<para l="6144" t="14563" r="10512" b="15307" alignment="justified" spaceBefore="149" spaceAfter="35" lsp="exactly" lspExact="272" language="en">

<ln l="6144" t="14563" r="10488" b="14765" baseLine="14717">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="14568" r="6653" b="14722">Noun</wd>

<space/>

<wd l="6701" t="14611" r="6888" b="14722">vs</wd>

<space/>

<wd l="6936" t="14568" r="7589" b="14765">Proper</wd>

<space/>

<wd l="7632" t="14568" r="8141" b="14722">Noun</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8357" t="14563" r="8698" b="14722">The</wd>

<space/>

<wd l="8741" t="14563" r="9192" b="14722">word</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9245" t="14563" r="9917" b="14765">Gaeilge</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9989" t="14563" r="10488" b="14722">‘Irish’</wd>

<space/>

</run>

</ln>

<ln l="6144" t="14837" r="10502" b="15038" baseLine="14986">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="14890" r="6475" b="14995">was</wd>

<space/>

<wd l="6600" t="14837" r="7181" b="15038">tagged</wd>

<space/>

<wd l="7301" t="14890" r="7517" b="14995">on</wd>

<space/>

<wd l="7632" t="14837" r="8395" b="14995">occasion</wd>

<space/>

<wd l="8510" t="14890" r="8683" b="14995">as</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontPitch="fixed" spacing="0"><wd l="8808" t="14866" r="8928" b="14990">N</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="9058" t="14842" r="9888" b="15034">(common</wd>

<space/>

<wd l="10003" t="14842" r="10502" b="15034">noun)</wd>

<space/>

</run>

</ln>

<ln l="6144" t="15106" r="10512" b="15307" baseLine="15259">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="15106" r="6763" b="15264">instead</wd>

<space/>

<wd l="6874" t="15106" r="7061" b="15264">of</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="7162" t="15125" r="7286" b="15269">^</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7411" t="15110" r="8045" b="15307">(proper</wd>

<space/>

<wd l="8146" t="15110" r="8698" b="15302">noun).</wd>

<space/>

<wd l="8923" t="15106" r="9302" b="15264">This</wd>

<space/>

<wd l="9418" t="15106" r="9763" b="15264">also</wd>

<space/>

<wd l="9874" t="15106" r="10512" b="15307">applied</wd>

</run>

</ln>

</para>

</column>

</section>

<dd l="1430" t="15736" r="10528" b="15977">

<para l="5857" t="15792" r="6095" b="15941" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5923" t="15792" r="6029" b="15941" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="0">

<wd l="5923" t="15792" r="6029" b="15941">4</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4301.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1217" marginRight="1385" marginBottom="1302" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1217" r="10524" b="15331">

<column l="1440" t="1217" r="5822" b="15331">

<para l="1440" t="1277" r="5818" b="2059" alignment="justified" spaceBefore="42" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="1277" r="5803" b="1522" baseLine="1472">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1440" t="1344" r="1608" b="1478">to</wd>

<space/>

<wd l="1738" t="1373" r="2189" b="1478">some</wd>

<space/>

<wd l="2304" t="1373" r="2880" b="1522">proper</wd>

<space/>

<wd l="2990" t="1373" r="3427" b="1478">noun</wd>

<space/>

<wd l="3557" t="1320" r="4118" b="1522">strings</wd>

<space/>

<wd l="4253" t="1320" r="4646" b="1478">such</wd>

<space/>

<wd l="4766" t="1373" r="4934" b="1478">as</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5045" t="1277" r="5467" b="1478">Áras</wd>

<space/>

<wd l="5587" t="1373" r="5803" b="1478">an</wd>

<space/>

</run>

</ln>

<ln l="1459" t="1594" r="5818" b="1790" baseLine="1742">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1459" t="1594" r="2438" b="1752">Uachtaráin</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2525" t="1594" r="2851" b="1790">(the</wd>

<space/>

<wd l="2928" t="1594" r="3533" b="1752">official</wd>

<space/>

<wd l="3605" t="1646" r="4080" b="1752">name</wd>

<space/>

<wd l="4157" t="1594" r="4344" b="1752">of</wd>

<space/>

<wd l="4402" t="1594" r="4670" b="1752">the</wd>

<space/>

<wd l="4742" t="1594" r="5554" b="1752">President</wd>

<space/>

<wd l="5630" t="1594" r="5818" b="1752">of</wd>

<space/>

</run>

</ln>

<ln l="1440" t="1862" r="3197" b="2059" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1862" r="2194" b="2021">Ireland’s</wd>

<space/>

<wd l="2256" t="1862" r="3197" b="2059">residence).</wd>

</ln>

</para>

<para l="1440" t="2299" r="5818" b="3581" alignment="justified" spaceBefore="162" lsp="exactly" lspExact="271" language="en">

<ln l="1445" t="2299" r="5794" b="2501" baseLine="2453">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="2299" r="2299" b="2501">Syntactic</wd>

<space/>

<wd l="2400" t="2299" r="3494" b="2458">at-mentions</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3715" t="2304" r="3874" b="2453">A</wd>

<space/>

<wd l="3979" t="2299" r="4440" b="2458">small</wd>

<space/>

<wd l="4536" t="2299" r="5208" b="2458">number</wd>

<space/>

<wd l="5304" t="2299" r="5496" b="2458">of</wd>

<space/>

<wd l="5582" t="2323" r="5794" b="2458">at-</wd>

</run>

</ln>

<ln l="1440" t="2573" r="5808" b="2774" baseLine="2722" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2573" r="2232" b="2731">mentions</wd>

<space/>

<wd l="2328" t="2573" r="2659" b="2731">that</wd>

<space/>

<wd l="2746" t="2626" r="3168" b="2731">were</wd>

<space/>

<wd l="3269" t="2573" r="4358" b="2774">syntactically</wd>

<space/>

<wd l="4450" t="2602" r="4790" b="2774">part</wd>

<space/>

<wd l="4882" t="2573" r="5074" b="2731">of</wd>

<space/>

<wd l="5150" t="2626" r="5246" b="2731">a</wd>

<space/>

<wd l="5333" t="2597" r="5808" b="2731">tweet</wd>

<space/>

</ln>

<ln l="1450" t="2842" r="5818" b="3043" baseLine="2995">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1450" t="2846" r="1814" b="3043">(e.g.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2016" t="2894" r="2371" b="3000">mar</wd>

<space/>

<wd l="2467" t="2842" r="2947" b="3000">chuid</wd>

<space/>

<wd l="3038" t="2842" r="3240" b="3000">de</wd>

<space/>

<wd l="3360" t="2842" r="4550" b="3043">@SnaGaeilge</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4675" t="2846" r="4896" b="3000">‘as</wd>

<space/>

<wd l="5002" t="2894" r="5098" b="3000">a</wd>

<space/>

<wd l="5189" t="2870" r="5530" b="3043">part</wd>

<space/>

<wd l="5630" t="2842" r="5818" b="3000">of</wd>

<space/>

</run>

</ln>

<ln l="1464" t="3115" r="5808" b="3317" baseLine="3264" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1464" t="3115" r="2784" b="3317">@SnaGaeilge’)</wd>

<space/>

<wd l="2846" t="3168" r="3269" b="3274">were</wd>

<space/>

<wd l="3322" t="3115" r="4262" b="3317">incorrectly</wd>

<space/>

<wd l="4320" t="3115" r="4906" b="3317">tagged</wd>

<space/>

<wd l="4958" t="3168" r="5131" b="3274">as</wd>

<space/>

<wd l="5189" t="3115" r="5808" b="3317">regular</wd>

<space/>

</ln>

<ln l="1445" t="3384" r="2846" b="3581" baseLine="3533">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="3384" r="2462" b="3542">at-mentions</wd>

<space/>

</run>

<wd l="2534" t="3389" r="2846" b="3581"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">@</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="3821" r="5803" b="4565" alignment="justified" spaceBefore="166" lsp="exactly" lspExact="271" language="en">

<ln l="1445" t="3821" r="5798" b="3979" baseLine="3970">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="3826" r="2194" b="3979">Retweet</wd>

<space/>

<wd l="2299" t="3826" r="2875" b="3979">colons</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3101" t="3826" r="3456" b="3979">One</wd>

<space/>

<wd l="3566" t="3845" r="4392" b="3979">annotator</wd>

<space/>

<wd l="4493" t="3821" r="5146" b="3979">marked</wd>

<space/>

<wd l="5275" t="3826" r="5429" b="3979">‘:’</wd>

<space/>

<wd l="5630" t="3874" r="5798" b="3979">as</wd>

<space/>

</run>

</ln>

<ln l="1440" t="4090" r="5803" b="4291" baseLine="4243" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="4090" r="2472" b="4291">punctuation</wd>

<space/>

<wd l="2525" t="4114" r="2678" b="4248">at</wd>

<space/>

<wd l="2731" t="4090" r="3398" b="4248">random</wd>

<space/>

<wd l="3456" t="4114" r="3970" b="4291">stages</wd>

<space/>

<wd l="4032" t="4090" r="4541" b="4248">rather</wd>

<space/>

<wd l="4589" t="4090" r="4968" b="4248">than</wd>

<space/>

<wd l="5016" t="4090" r="5486" b="4291">using</wd>

<space/>

<wd l="5539" t="4090" r="5803" b="4248">the</wd>

<space/>

</ln>

<ln l="1445" t="4363" r="2813" b="4565" baseLine="4512">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="4363" r="2266" b="4522">discourse</wd>

<space/>

<wd l="2318" t="4387" r="2582" b="4565">tag</wd>

<space/>

</run>

<wd l="2669" t="4382" r="2813" b="4522"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">~</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1445" t="4843" r="3096" b="5448" alignment="left" ri="2736" spaceBefore="66" lsp="exactly" lspExact="432" language="en">

<ln l="1445" t="4843" r="3096" b="5064" baseLine="5006" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="4848" r="1555" b="5016">5</wd>

<space/>

<wd l="1800" t="4843" r="3096" b="5064">Experiments</wd>

<space/>

</ln>

<ln l="1445" t="5285" r="2381" b="5448" baseLine="5438" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="5290" r="1704" b="5448">5.1</wd>

<space/>

<wd l="1930" t="5294" r="2381" b="5448">Data</wd>

</ln>

</para>

<para l="1440" t="5650" r="5808" b="7200" alignment="justified" spaceBefore="84" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="5650" r="5808" b="5851" baseLine="5798" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5654" r="1723" b="5808">We</wd>

<space/>

<wd l="1843" t="5650" r="2232" b="5808">took</wd>

<space/>

<wd l="2342" t="5650" r="2611" b="5808">the</wd>

<space/>

<wd l="2731" t="5650" r="3466" b="5808">finalised</wd>

<space/>

<wd l="3590" t="5674" r="3826" b="5808">set</wd>

<space/>

<wd l="3946" t="5650" r="4133" b="5808">of</wd>

<space/>

<wd l="4234" t="5650" r="4637" b="5808">Irish</wd>

<space/>

<wd l="4752" t="5650" r="5808" b="5851">POS-tagged</wd>

<space/>

</ln>

<ln l="1440" t="5918" r="5798" b="6115" baseLine="6067" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="5942" r="1987" b="6077">tweets</wd>

<space/>

<wd l="2131" t="5918" r="2443" b="6077">and</wd>

<space/>

<wd l="2573" t="5918" r="3221" b="6077">divided</wd>

<space/>

<wd l="3346" t="5918" r="3787" b="6077">them</wd>

<space/>

<wd l="3912" t="5918" r="4248" b="6077">into</wd>

<space/>

<wd l="4382" t="5971" r="4478" b="6077">a</wd>

<space/>

<wd l="4603" t="5942" r="4910" b="6077">test</wd>

<space/>

<wd l="5045" t="5942" r="5280" b="6077">set</wd>

<space/>

<wd l="5414" t="5923" r="5798" b="6115">(148</wd>

<space/>

</ln>

<ln l="1440" t="6187" r="5794" b="6389" baseLine="6341" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6192" r="2112" b="6384">tweets),</wd>

<space/>

<wd l="2218" t="6187" r="3336" b="6389">development</wd>

<space/>

<wd l="3427" t="6211" r="3658" b="6346">set</wd>

<space/>

<wd l="3749" t="6192" r="4133" b="6384">(147</wd>

<space/>

<wd l="4224" t="6192" r="4843" b="6384">tweets)</wd>

<space/>

<wd l="4939" t="6187" r="5251" b="6346">and</wd>

<space/>

<wd l="5333" t="6187" r="5794" b="6346">train-</wd>

</ln>

<ln l="1440" t="6461" r="5803" b="6662" baseLine="6610" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6461" r="1714" b="6662">ing</wd>

<space/>

<wd l="1800" t="6485" r="2035" b="6619">set</wd>

<space/>

<wd l="2117" t="6466" r="2616" b="6658">(1242</wd>

<space/>

<wd l="2693" t="6466" r="3365" b="6658">tweets).</wd>

<space/>

<wd l="3499" t="6461" r="4378" b="6619">Variations</wd>

<space/>

<wd l="4464" t="6461" r="4656" b="6619">of</wd>

<space/>

<wd l="4714" t="6461" r="5021" b="6619">this</wd>

<space/>

<wd l="5107" t="6461" r="5467" b="6619">data</wd>

<space/>

<wd l="5544" t="6514" r="5803" b="6619">are</wd>

<space/>

</ln>

<ln l="1440" t="6730" r="5794" b="6931" baseLine="6883" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="6730" r="1843" b="6888">used</wd>

<space/>

<wd l="1906" t="6730" r="2078" b="6883">in</wd>

<space/>

<wd l="2146" t="6782" r="2434" b="6888">our</wd>

<space/>

<wd l="2501" t="6730" r="3552" b="6931">experiments</wd>

<space/>

<wd l="3624" t="6730" r="4157" b="6888">where</wd>

<space/>

<wd l="4224" t="6782" r="4478" b="6888">we</wd>

<space/>

<wd l="4546" t="6730" r="5405" b="6888">normalise</wd>

<space/>

<wd l="5477" t="6782" r="5794" b="6888">cer-</wd>

</ln>

<ln l="1440" t="7003" r="5381" b="7200" baseLine="7152" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="7003" r="1766" b="7162">tain</wd>

<space/>

<wd l="1824" t="7003" r="2381" b="7162">tokens</wd>

<space/>

<wd l="2453" t="7003" r="3355" b="7200">(described</wd>

<space/>

<wd l="3408" t="7003" r="4003" b="7162">further</wd>

<space/>

<wd l="4056" t="7003" r="4229" b="7157">in</wd>

<space/>

<wd l="4286" t="7003" r="4934" b="7162">Section</wd>

<space/>

<wd l="4992" t="7003" r="5381" b="7200">5.2.)</wd>

</ln>

</para>

<para l="1440" t="7277" r="5808" b="12317" alignment="justified" spaceBefore="6" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="7277" r="5794" b="7478" baseLine="7429" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="7282" r="1944" b="7435">We</wd>

<space/>

<wd l="2064" t="7277" r="2410" b="7435">also</wd>

<space/>

<wd l="2534" t="7277" r="3715" b="7478">automatically</wd>

<space/>

<wd l="3840" t="7277" r="4685" b="7435">converted</wd>

<space/>

<wd l="4805" t="7282" r="5026" b="7435">Uí</wd>

<space/>

<wd l="5141" t="7277" r="5794" b="7435">Dhonn-</wd>

</ln>

<ln l="1445" t="7550" r="5794" b="7747" baseLine="7699" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="7550" r="2064" b="7709">chadha</wd>

<space/>

<wd l="2189" t="7555" r="2899" b="7747">(2009)’s</wd>

<space/>

<wd l="3034" t="7555" r="3456" b="7709">3198</wd>

<space/>

<wd l="3595" t="7574" r="4334" b="7709">sentence</wd>

<space/>

<wd l="4464" t="7550" r="5117" b="7747">(74,705</wd>

<space/>

<wd l="5251" t="7550" r="5794" b="7747">token)</wd>

<space/>

</ln>

<ln l="1445" t="7819" r="5794" b="8021" baseLine="7973" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="7819" r="2640" b="8021">gold-standard</wd>

<space/>

<wd l="2702" t="7819" r="3758" b="8021">POS-tagged</wd>

<space/>

<wd l="3826" t="7872" r="4397" b="8021">corpus</wd>

<space/>

<wd l="4469" t="7819" r="4934" b="8021">using</wd>

<space/>

<wd l="5006" t="7872" r="5299" b="7978">our</wd>

<space/>

<wd l="5357" t="7872" r="5794" b="8021">map-</wd>

</ln>

<ln l="1440" t="8093" r="5808" b="8294" baseLine="8242" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8093" r="1824" b="8294">ping</wd>

<space/>

<wd l="1882" t="8093" r="2573" b="8251">scheme.</wd>

<space/>

<wd l="2645" t="8093" r="3029" b="8251">This</wd>

<space/>

<wd l="3082" t="8117" r="3408" b="8251">text</wd>

<space/>

<wd l="3451" t="8093" r="3586" b="8251">is</wd>

<space/>

<wd l="3643" t="8093" r="4070" b="8251">from</wd>

<space/>

<wd l="4109" t="8093" r="4378" b="8251">the</wd>

<space/>

<wd l="4421" t="8098" r="4824" b="8251">New</wd>

<space/>

<wd l="4882" t="8098" r="5496" b="8294">Corpus</wd>

<space/>

<wd l="5549" t="8093" r="5808" b="8251">for</wd>

<space/>

</ln>

<ln l="1440" t="8328" r="5808" b="8549" baseLine="8513">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1440" t="8362" r="2059" b="8520">Ireland</wd>

<space/>

<wd l="2117" t="8458" r="2227" b="8472">–</wd>

<space/>

</run>

<wd l="2285" t="8328" r="2818" b="8549"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">Irish</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">5</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="2890" t="8362" r="3422" b="8520">which</wd>

<space/>

<wd l="3480" t="8362" r="3619" b="8520">is</wd>

<space/>

<wd l="3686" t="8414" r="3782" b="8520">a</wd>

<space/>

<wd l="3845" t="8362" r="4699" b="8520">collection</wd>

<space/>

<wd l="4762" t="8362" r="4954" b="8520">of</wd>

<space/>

<wd l="4997" t="8386" r="5323" b="8520">text</wd>

<space/>

<wd l="5381" t="8362" r="5808" b="8520">from</wd>

<space/>

</run>

</ln>

<ln l="1440" t="8635" r="5808" b="8837" baseLine="8784" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8635" r="2006" b="8822">books,</wd>

<space/>

<wd l="2179" t="8635" r="3053" b="8822">newswire,</wd>

<space/>

<wd l="3230" t="8659" r="4262" b="8837">government</wd>

<space/>

<wd l="4406" t="8635" r="5342" b="8794">documents</wd>

<space/>

<wd l="5496" t="8635" r="5808" b="8794">and</wd>

<space/>

</ln>

<ln l="1440" t="8904" r="5794" b="9091" baseLine="9053" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8904" r="2237" b="9062">websites.</wd>

<space/>

<wd l="2338" t="8904" r="2674" b="9062">The</wd>

<space/>

<wd l="2736" t="8928" r="3062" b="9062">text</wd>

<space/>

<wd l="3125" t="8904" r="3259" b="9062">is</wd>

<space/>

<wd l="3331" t="8904" r="4694" b="9091">well-structured,</wd>

<space/>

<wd l="4771" t="8904" r="5794" b="9091">well-edited,</wd>

<space/>

</ln>

<ln l="1445" t="9178" r="5794" b="9379" baseLine="9326" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="9178" r="1757" b="9336">and</wd>

<space/>

<wd l="1872" t="9178" r="3005" b="9379">grammatical,</wd>

<space/>

<wd l="3149" t="9178" r="3461" b="9336">and</wd>

<space/>

<wd l="3576" t="9178" r="3768" b="9336">of</wd>

<space/>

<wd l="3874" t="9230" r="4435" b="9336">course</wd>

<space/>

<wd l="4550" t="9178" r="4992" b="9336">lacks</wd>

<space/>

<wd l="5112" t="9178" r="5794" b="9336">Twitter-</wd>

</ln>

<ln l="1450" t="9446" r="5808" b="9648" baseLine="9595" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="9446" r="2102" b="9648">specific</wd>

<space/>

<wd l="2198" t="9446" r="2880" b="9605">features</wd>

<space/>

<wd l="2981" t="9446" r="3307" b="9605">like</wd>

<space/>

<wd l="3398" t="9446" r="4190" b="9648">hashtags,</wd>

<space/>

<wd l="4310" t="9446" r="5376" b="9634">at-mentions,</wd>

<space/>

<wd l="5496" t="9446" r="5808" b="9605">and</wd>

<space/>

</ln>

<ln l="1445" t="9715" r="5808" b="9917" baseLine="9869" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="9715" r="2381" b="9902">emoticons,</wd>

<space/>

<wd l="2448" t="9715" r="2808" b="9874">thus</wd>

<space/>

<wd l="2875" t="9715" r="3624" b="9917">differing</wd>

<space/>

<wd l="3691" t="9715" r="4291" b="9917">greatly</wd>

<space/>

<wd l="4349" t="9715" r="4776" b="9874">from</wd>

<space/>

<wd l="4838" t="9768" r="5126" b="9874">our</wd>

<space/>

<wd l="5179" t="9715" r="5808" b="9874">Twitter</wd>

<space/>

</ln>

<ln l="1445" t="9989" r="5798" b="10190" baseLine="10138" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="9989" r="1848" b="10147">data.</wd>

<space/>

<wd l="1987" t="9989" r="2323" b="10147">The</wd>

<space/>

<wd l="2405" t="10042" r="3067" b="10190">average</wd>

<space/>

<wd l="3154" t="10013" r="3893" b="10147">sentence</wd>

<space/>

<wd l="3970" t="9989" r="4517" b="10190">length</wd>

<space/>

<wd l="4589" t="9989" r="4762" b="10142">in</wd>

<space/>

<wd l="4834" t="9989" r="5141" b="10147">this</wd>

<space/>

<wd l="5227" t="10042" r="5798" b="10190">corpus</wd>

<space/>

</ln>

<ln l="1440" t="10258" r="5803" b="10459" baseLine="10411" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10258" r="1579" b="10416">is</wd>

<space/>

<wd l="1718" t="10262" r="1925" b="10416">27</wd>

<space/>

<wd l="2059" t="10258" r="2669" b="10445">tokens,</wd>

<space/>

<wd l="2832" t="10258" r="3648" b="10459">diverging</wd>

<space/>

<wd l="3787" t="10258" r="4858" b="10459">significantly</wd>

<space/>

<wd l="4987" t="10258" r="5414" b="10416">from</wd>

<space/>

<wd l="5539" t="10258" r="5803" b="10416">the</wd>

<space/>

</ln>

<ln l="1445" t="10531" r="5794" b="10733" baseLine="10680" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="10584" r="2112" b="10733">average</wd>

<space/>

<wd l="2170" t="10555" r="2645" b="10690">tweet</wd>

<space/>

<wd l="2707" t="10531" r="3254" b="10733">length</wd>

<space/>

<wd l="3317" t="10531" r="3509" b="10690">of</wd>

<space/>

<wd l="3581" t="10536" r="3936" b="10690">17.2</wd>

<space/>

<wd l="3998" t="10531" r="4608" b="10690">tokens.</wd>

<space/>

<wd l="4709" t="10531" r="5371" b="10733">Despite</wd>

<space/>

<wd l="5434" t="10531" r="5794" b="10718">this,</wd>

<space/>

</ln>

<ln l="1445" t="10800" r="5808" b="11002" baseLine="10954" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="10800" r="1757" b="10958">and</wd>

<space/>

<wd l="1843" t="10800" r="2458" b="11002">despite</wd>

<space/>

<wd l="2539" t="10800" r="2808" b="10958">the</wd>

<space/>

<wd l="2890" t="10800" r="3216" b="10958">fact</wd>

<space/>

<wd l="3302" t="10800" r="3566" b="10958">the</wd>

<space/>

<wd l="3658" t="10800" r="4502" b="10958">converted</wd>

<space/>

<wd l="4584" t="10824" r="4925" b="11002">tags</wd>

<space/>

<wd l="5021" t="10853" r="5443" b="10958">were</wd>

<space/>

<wd l="5525" t="10824" r="5808" b="10958">not</wd>

<space/>

</ln>

<ln l="1440" t="11074" r="5808" b="11275" baseLine="11222" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11074" r="2232" b="11232">reviewed</wd>

<space/>

<wd l="2338" t="11074" r="2597" b="11232">for</wd>

<space/>

<wd l="2702" t="11126" r="3499" b="11275">accuracy,</wd>

<space/>

<wd l="3629" t="11126" r="3883" b="11232">we</wd>

<space/>

<wd l="3994" t="11126" r="4416" b="11232">were</wd>

<space/>

<wd l="4531" t="11074" r="4848" b="11232">still</wd>

<space/>

<wd l="4958" t="11074" r="5808" b="11232">interested</wd>

<space/>

</ln>

<ln l="1440" t="11342" r="5803" b="11544" baseLine="11496" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11342" r="1613" b="11496">in</wd>

<space/>

<wd l="1709" t="11342" r="2534" b="11544">exploring</wd>

<space/>

<wd l="2635" t="11342" r="2899" b="11501">the</wd>

<space/>

<wd l="3005" t="11366" r="3533" b="11501">extent</wd>

<space/>

<wd l="3624" t="11366" r="3792" b="11501">to</wd>

<space/>

<wd l="3893" t="11342" r="4426" b="11501">which</wd>

<space/>

<wd l="4522" t="11342" r="4829" b="11501">this</wd>

<space/>

<wd l="4939" t="11342" r="5803" b="11501">additional</wd>

<space/>

</ln>

<ln l="1440" t="11616" r="5808" b="11818" baseLine="11765" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11616" r="2117" b="11818">training</wd>

<space/>

<wd l="2208" t="11616" r="2573" b="11774">data</wd>

<space/>

<wd l="2659" t="11616" r="3144" b="11774">could</wd>

<space/>

<wd l="3226" t="11616" r="3946" b="11818">improve</wd>

<space/>

<wd l="4032" t="11616" r="4301" b="11774">the</wd>

<space/>

<wd l="4392" t="11669" r="5155" b="11818">accuracy</wd>

<space/>

<wd l="5251" t="11616" r="5443" b="11774">of</wd>

<space/>

<wd l="5520" t="11669" r="5808" b="11774">our</wd>

<space/>

</ln>

<ln l="1440" t="11885" r="5798" b="12086" baseLine="12034" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11885" r="2842" b="12086">best-performing</wd>

<space/>

<wd l="2942" t="11885" r="3528" b="12043">model.</wd>

<space/>

<wd l="3730" t="11890" r="4013" b="12043">We</wd>

<space/>

<wd l="4109" t="11885" r="4522" b="12043">refer</wd>

<space/>

<wd l="4613" t="11909" r="4781" b="12043">to</wd>

<space/>

<wd l="4877" t="11885" r="5184" b="12043">this</wd>

<space/>

<wd l="5294" t="11909" r="5530" b="12043">set</wd>

<space/>

<wd l="5630" t="11938" r="5798" b="12043">as</wd>

<space/>

</ln>

<ln l="1445" t="12173" r="2611" b="12317" baseLine="12307">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1445" t="12182" r="1944" b="12317">NCII</wd>

<space/>

</run>

<wd l="2059" t="12173" r="2611" b="12317"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">3198</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1445" t="12893" r="2659" b="13094" alignment="left" spaceBefore="487" lsp="exactly" lspExact="252" language="en">

<ln l="1445" t="12893" r="2659" b="13094" baseLine="13042" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="1445" t="12893" r="1709" b="13051">5.2</wd>

<space/>

<wd l="1934" t="12898" r="2659" b="13094">Taggers</wd>

</ln>

</para>

<para l="1440" t="13253" r="5808" b="13997" alignment="justified" spaceBefore="85" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="13253" r="5808" b="13411" baseLine="13402" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13258" r="1723" b="13411">We</wd>

<space/>

<wd l="1848" t="13253" r="2453" b="13411">trained</wd>

<space/>

<wd l="2578" t="13253" r="2890" b="13411">and</wd>

<space/>

<wd l="3014" t="13253" r="3835" b="13411">evaluated</wd>

<space/>

<wd l="3950" t="13253" r="4387" b="13411">three</wd>

<space/>

<wd l="4517" t="13253" r="5808" b="13411">state-of-the-art</wd>

<space/>

</ln>

<ln l="1440" t="13522" r="5803" b="13723" baseLine="13675" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13526" r="2534" b="13723">POS-taggers</wd>

<space/>

<wd l="2616" t="13522" r="3005" b="13680">with</wd>

<space/>

<wd l="3082" t="13574" r="3370" b="13680">our</wd>

<space/>

<wd l="3442" t="13522" r="3845" b="13680">data.</wd>

<space/>

<wd l="3979" t="13522" r="4253" b="13675">All</wd>

<space/>

<wd l="4330" t="13522" r="4762" b="13680">three</wd>

<space/>

<wd l="4838" t="13546" r="5458" b="13723">taggers</wd>

<space/>

<wd l="5544" t="13574" r="5803" b="13680">are</wd>

<space/>

</ln>

<ln l="1445" t="13795" r="3029" b="13997" baseLine="13944" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="13848" r="2506" b="13997">open-source</wd>

<space/>

<wd l="2563" t="13795" r="3029" b="13954">tools.</wd>

</ln>

</para>

<para l="1440" t="14232" r="5794" b="14702" alignment="justified" spaceBefore="168" spaceAfter="122" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="14232" r="5794" b="14434" baseLine="14381">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1440" t="14232" r="2261" b="14390">Morfette</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2482" t="14237" r="2717" b="14390">As</wd>

<space/>

<wd l="2803" t="14232" r="3206" b="14390">Irish</wd>

<space/>

<wd l="3288" t="14232" r="3422" b="14390">is</wd>

<space/>

<wd l="3518" t="14285" r="3715" b="14390">an</wd>

<space/>

<wd l="3802" t="14232" r="4555" b="14390">inflected</wd>

<space/>

<wd l="4632" t="14232" r="5462" b="14434">language,</wd>

<space/>

<wd l="5563" t="14232" r="5794" b="14386">in-</wd>

</run>

</ln>

<ln l="1445" t="14501" r="5794" b="14702" baseLine="14654">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1445" t="14501" r="2074" b="14659">clusion</wd>

<space/>

<wd l="2131" t="14501" r="2318" b="14659">of</wd>

<space/>

<wd l="2362" t="14501" r="2626" b="14659">the</wd>

<space/>

<wd l="2683" t="14501" r="3278" b="14659">lemma</wd>

<space/>

<wd l="3336" t="14554" r="3504" b="14659">as</wd>

<space/>

<wd l="3571" t="14554" r="3667" b="14659">a</wd>

<space/>

<wd l="3720" t="14501" r="4397" b="14702">training</wd>

<space/>

<wd l="4454" t="14501" r="5059" b="14659">feature</wd>

<space/>

<wd l="5112" t="14501" r="5251" b="14659">is</wd>

<space/>

<wd l="5318" t="14501" r="5794" b="14659">desir-</wd>

</run>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>

</run>

</ln>

</para>

<rulerline l="1440" t="14846" r="2640" b="14846" type="single" width="10" color="000000"/>

<para l="1454" t="14899" r="5765" b="15264" alignment="justified" ri="72" spaceBefore="53" spaceAfter="22" fli="216" lsp="exactly" lspExact="203" language="en">

<ln l="1694" t="14899" r="5765" b="15106" baseLine="15056">

<wd l="1694" t="14899" r="2093" b="15067"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">5</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">New</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2141" t="14938" r="2645" b="15106">Corpus</wd>

<space/>

<wd l="2688" t="14938" r="2899" b="15067">for</wd>

<space/>

<wd l="2933" t="14938" r="3446" b="15067">Ireland</wd>

<space/>

<wd l="3485" t="14938" r="3941" b="15067">-Irish.</wd>

<space/>

<wd l="4008" t="14938" r="4258" b="15067">See</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4306" t="14942" r="5765" b="15096">http://corpas.</wd>

<space/>

</run>

</ln>

<ln l="1454" t="15144" r="2506" b="15264" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1454" t="15144" r="2506" b="15264">focloir.ie</wd>

</ln>

</para>

</column>

<column l="6142" t="1217" r="10524" b="15331">

<para l="6144" t="1315" r="10512" b="4502" alignment="justified" spaceBefore="41" lsp="exactly" lspExact="270" language="en">

<ln l="6149" t="1315" r="10502" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="1320" r="6509" b="1478">able</wd>

<space/>

<wd l="6566" t="1320" r="6734" b="1474">in</wd>

<space/>

<wd l="6797" t="1373" r="6994" b="1478">an</wd>

<space/>

<wd l="7056" t="1320" r="7531" b="1478">effort</wd>

<space/>

<wd l="7584" t="1344" r="7752" b="1478">to</wd>

<space/>

<wd l="7814" t="1373" r="8664" b="1478">overcome</wd>

<space/>

<wd l="8726" t="1320" r="9086" b="1478">data</wd>

<space/>

<wd l="9149" t="1320" r="9850" b="1522">sparsity.</wd>

<space/>

<wd l="9931" t="1320" r="10502" b="1478">There-</wd>

</ln>

<ln l="6144" t="1589" r="10498" b="1795" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="1594" r="6494" b="1752">fore</wd>

<space/>

<wd l="6571" t="1646" r="6826" b="1752">we</wd>

<space/>

<wd l="6902" t="1594" r="7507" b="1752">trained</wd>

<space/>

<wd l="7584" t="1594" r="8342" b="1752">Morfette</wd>

<space/>

<wd l="8429" t="1594" r="9298" b="1795">(Chrupala</wd>

<space/>

<wd l="9374" t="1618" r="9528" b="1752">et</wd>

<space/>

<wd l="9605" t="1594" r="9854" b="1781">al.,</wd>

<space/>

<wd l="9950" t="1598" r="10498" b="1790">2008),</wd>

<space/>

</ln>

<ln l="6149" t="1858" r="10502" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="1915" r="6245" b="2021">a</wd>

<space/>

<wd l="6322" t="1862" r="7574" b="2021">lemmatization</wd>

<space/>

<wd l="7651" t="1862" r="7987" b="2021">tool</wd>

<space/>

<wd l="8069" t="1862" r="8400" b="2021">that</wd>

<space/>

<wd l="8482" t="1862" r="8827" b="2021">also</wd>

<space/>

<wd l="8909" t="1862" r="9590" b="2064">predicts</wd>

<space/>

<wd l="9682" t="1867" r="10070" b="2021">POS</wd>

<space/>

<wd l="10162" t="1886" r="10502" b="2064">tags</wd>

<space/>

</ln>

<ln l="6149" t="2131" r="10502" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="2136" r="6461" b="2294">and</wd>

<space/>

<wd l="6528" t="2189" r="6898" b="2294">uses</wd>

<space/>

<wd l="6974" t="2136" r="7243" b="2294">the</wd>

<space/>

<wd l="7310" t="2136" r="7910" b="2294">lemma</wd>

<space/>

<wd l="7978" t="2189" r="8150" b="2294">as</wd>

<space/>

<wd l="8232" t="2189" r="8328" b="2294">a</wd>

<space/>

<wd l="8390" t="2136" r="9067" b="2338">training</wd>

<space/>

<wd l="9139" t="2136" r="9792" b="2294">feature.</wd>

<space/>

<wd l="9912" t="2141" r="10200" b="2294">We</wd>

<space/>

<wd l="10267" t="2189" r="10502" b="2294">re-</wd>

</ln>

<ln l="6144" t="2400" r="10502" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2434" r="6499" b="2606">port</wd>

<space/>

<wd l="6562" t="2458" r="6778" b="2563">on</wd>

<space/>

<wd l="6840" t="2405" r="7891" b="2606">experiments</wd>

<space/>

<wd l="7958" t="2405" r="8347" b="2563">both</wd>

<space/>

<wd l="8405" t="2405" r="8794" b="2563">with</wd>

<space/>

<wd l="8856" t="2405" r="9168" b="2563">and</wd>

<space/>

<wd l="9226" t="2405" r="9898" b="2563">without</wd>

<space/>

<wd l="9960" t="2458" r="10157" b="2563">an</wd>

<space/>

<wd l="10224" t="2458" r="10502" b="2606">op-</wd>

</ln>

<ln l="6144" t="2674" r="10512" b="2880" baseLine="2827">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6144" t="2678" r="6638" b="2837">tional</wd>

<space/>

<wd l="6691" t="2678" r="7565" b="2880">dictionary</wd>

<space/>

</run>

<wd l="7622" t="2683" r="8270" b="2875"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">(</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Dict</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="8323" t="2678" r="9398" b="2837">information.</wd>

<space/>

<wd l="9475" t="2683" r="9758" b="2837">We</wd>

<space/>

<wd l="9802" t="2678" r="10205" b="2837">used</wd>

<space/>

<wd l="10243" t="2678" r="10512" b="2837">the</wd>

<space/>

</run>

</ln>

<ln l="6149" t="2942" r="10502" b="3149" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="2947" r="7027" b="3149">dictionary</wd>

<space/>

<wd l="7109" t="2947" r="7536" b="3106">from</wd>

<space/>

<wd l="7622" t="2947" r="8357" b="3106">Scannell</wd>

<space/>

<wd l="8458" t="2952" r="9072" b="3144">(2003),</wd>

<space/>

<wd l="9168" t="2947" r="9706" b="3106">which</wd>

<space/>

<wd l="9787" t="2947" r="10502" b="3106">contains</wd>

<space/>

</ln>

<ln l="6149" t="3216" r="10512" b="3418" baseLine="3370">

<wd l="6149" t="3226" r="6888" b="3418"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">350</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2">418</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7008" t="3221" r="7622" b="3379">surface</wd>

<space/>

<wd l="7723" t="3221" r="8275" b="3379">forms.</wd>

<space/>

<wd l="8496" t="3226" r="8837" b="3379">Our</wd>

<space/>

<wd l="8933" t="3221" r="9648" b="3379">baseline</wd>

<space/>

<wd l="9749" t="3221" r="10512" b="3379">Morfette</wd>

<space/>

</run>

</ln>

<ln l="6149" t="3490" r="10512" b="3686" baseLine="3638">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6149" t="3490" r="6514" b="3648">data</wd>

<space/>

</run>

<wd l="6581" t="3494" r="7752" b="3686"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">(</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">BaseMorf</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="7829" t="3490" r="8544" b="3648">contains</wd>

<space/>

<wd l="8611" t="3490" r="8880" b="3648">the</wd>

<space/>

<wd l="8942" t="3490" r="9466" b="3677">token,</wd>

<space/>

<wd l="9542" t="3490" r="10138" b="3648">lemma</wd>

<space/>

<wd l="10200" t="3490" r="10512" b="3648">and</wd>

<space/>

</run>

</ln>

<ln l="6144" t="3763" r="10507" b="3965" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="3768" r="6926" b="3965">POS-tag.</wd>

<space/>

<wd l="7013" t="3763" r="7354" b="3922">The</wd>

<space/>

<wd l="7411" t="3763" r="8083" b="3922">lemmas</wd>

<space/>

<wd l="8150" t="3763" r="8342" b="3922">of</wd>

<space/>

<wd l="8386" t="3768" r="8899" b="3922">URLs</wd>

<space/>

<wd l="8966" t="3763" r="9278" b="3922">and</wd>

<space/>

<wd l="9336" t="3763" r="10507" b="3965">non-syntactic</wd>

<space/>

</ln>

<ln l="6144" t="4032" r="10512" b="4234" baseLine="4181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="4032" r="6888" b="4234">hashtags</wd>

<space/>

<wd l="6955" t="4032" r="7358" b="4190">have</wd>

<space/>

<wd l="7421" t="4032" r="7834" b="4190">been</wd>

<space/>

<wd l="7896" t="4032" r="8866" b="4190">normalised</wd>

<space/>

<wd l="8928" t="4085" r="9096" b="4190">as</wd>

<space/>

<wd l="9178" t="4066" r="9317" b="4195">&lt;</wd>

<space/>

<wd l="9422" t="4032" r="9893" b="4190">URL</wd>

<space/>

<wd l="9979" t="4066" r="10118" b="4195">&gt;</wd>

<space/>

<wd l="10200" t="4032" r="10512" b="4190">and</wd>

<space/>

</ln>

<ln l="6158" t="4301" r="7973" b="4502" baseLine="4454">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6158" t="4334" r="6298" b="4464">&lt;</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="-2"><wd l="6384" t="4301" r="6547" b="4498">#</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6634" t="4334" r="6830" b="4488">&gt;,</wd>

<space/>

<wd l="6898" t="4301" r="7973" b="4502">respectively.</wd>

</run>

</ln>

</para>

<para l="6144" t="4574" r="10517" b="5275" alignment="justified" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="4574" r="10502" b="4776" baseLine="4723" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="4579" r="6648" b="4733">We</wd>

<space/>

<wd l="6816" t="4574" r="7190" b="4733">then</wd>

<space/>

<wd l="7358" t="4574" r="8179" b="4733">evaluated</wd>

<space/>

<wd l="8342" t="4574" r="8611" b="4733">the</wd>

<space/>

<wd l="8774" t="4598" r="9326" b="4776">tagger</wd>

<space/>

<wd l="9485" t="4574" r="9874" b="4733">with</wd>

<space/>

<wd l="10046" t="4579" r="10502" b="4771">(non-</wd>

</ln>

<ln l="6154" t="4838" r="10493" b="5045" baseLine="4997">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6154" t="4843" r="6984" b="5045">syntactic)</wd>

<space/>

<wd l="7109" t="4877" r="7248" b="5006">&lt;</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="7421" t="4843" r="7584" b="5040">#</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7752" t="4877" r="7949" b="5030">&gt;,</wd>

<space/>

<wd l="8088" t="4877" r="8227" b="5006">&lt;</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="8400" t="4838" r="8549" b="5002">@</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8722" t="4877" r="8861" b="5006">&gt;</wd>

<space/>

<wd l="8981" t="4843" r="9293" b="5002">and</wd>

<space/>

<wd l="9403" t="4877" r="9542" b="5006">&lt;</wd>

<space/>

<wd l="9720" t="4843" r="10190" b="5002">URL</wd>

<space/>

<wd l="10354" t="4877" r="10493" b="5006">&gt;</wd>

<space/>

</run>

</ln>

<ln l="6144" t="5117" r="10517" b="5275" baseLine="5266" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5117" r="7349" b="5275">normalisation</wd>

<space/>

<wd l="7478" t="5117" r="7670" b="5275">of</wd>

<space/>

<wd l="7786" t="5117" r="8174" b="5275">both</wd>

<space/>

<wd l="8304" t="5117" r="8789" b="5275">token</wd>

<space/>

<wd l="8918" t="5117" r="9346" b="5275">form</wd>

<space/>

<wd l="9475" t="5117" r="9787" b="5275">and</wd>

<space/>

<wd l="9917" t="5117" r="10517" b="5275">lemma</wd>

</ln>

</para>

<para l="6144" t="5386" r="10507" b="6125" alignment="justified" spaceBefore="3" lsp="exactly" lspExact="271" language="en">

<tabs position="6144"/>

<ln l="6154" t="5386" r="10502" b="5587" baseLine="5539" forcedEOF="true">

<wd l="6154" t="5390" r="7382" b="5582"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">NormMorf</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><tab position="7382"/>

<wd l="7906" t="5386" r="8333" b="5544">Both</wd>

<space/>

<wd l="8539" t="5386" r="9590" b="5587">experiments</wd>

<space/>

<wd l="9806" t="5438" r="10066" b="5544">are</wd>

<space/>

</run>

<wd l="10267" t="5438" r="10502" b="5544"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">re-</run>

<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable">
</run>

</wd>

</ln>

<ln l="6144" t="5659" r="10507" b="5861" baseLine="5808" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">

<wd l="6144" t="5712" r="6437" b="5818">run</wd>

<space/>

<wd l="6648" t="5659" r="7037" b="5818">with</wd>

<space/>

<wd l="7243" t="5659" r="7512" b="5818">the</wd>

<space/>

<wd l="7723" t="5659" r="8525" b="5818">inclusion</wd>

<space/>

<wd l="8736" t="5659" r="8928" b="5818">of</wd>

<space/>

<wd l="9130" t="5712" r="9418" b="5818">our</wd>

<space/>

<wd l="9629" t="5659" r="10507" b="5861">dictionary</wd>

<space/>

</ln>

<ln l="6154" t="5933" r="9869" b="6125" baseLine="6082" forcedEOF="true">

<wd l="6154" t="5933" r="9869" b="6125"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">BaseMorf+Dict,NormMorf+Dict</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="6610" r="10512" b="9792" alignment="justified" spaceBefore="405" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="6610" r="10502" b="6768" baseLine="6758">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="6610" r="6629" b="6763">ARK</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6850" t="6614" r="7133" b="6768">We</wd>

<space/>

<wd l="7234" t="6610" r="7574" b="6768">also</wd>

<space/>

<wd l="7670" t="6610" r="8280" b="6768">trained</wd>

<space/>

<wd l="8371" t="6610" r="8635" b="6768">the</wd>

<space/>

<wd l="8736" t="6614" r="9230" b="6768">CMU</wd>

<space/>

<wd l="9322" t="6610" r="9950" b="6768">Twitter</wd>

<space/>

<wd l="10037" t="6614" r="10502" b="6768">POS-</wd>

</run>

</ln>

<ln l="6144" t="6878" r="10512" b="7080" baseLine="7032" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="6902" r="6696" b="7080">tagger</wd>

<space/>

<wd l="6782" t="6878" r="7603" b="7080">(Owoputi</wd>

<space/>

<wd l="7690" t="6902" r="7848" b="7037">et</wd>

<space/>

<wd l="7930" t="6878" r="8179" b="7066">al.,</wd>

<space/>

<wd l="8285" t="6883" r="8832" b="7075">2013),</wd>

<space/>

<wd l="8933" t="6878" r="9466" b="7037">which</wd>

<space/>

<wd l="9547" t="6878" r="9715" b="7032">in</wd>

<space/>

<wd l="9802" t="6878" r="10512" b="7037">addition</wd>

<space/>

</ln>

<ln l="6144" t="7152" r="10502" b="7354" baseLine="7301" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7176" r="6312" b="7310">to</wd>

<space/>

<wd l="6422" t="7152" r="7262" b="7354">providing</wd>

<space/>

<wd l="7373" t="7152" r="8333" b="7354">pre-trained</wd>

<space/>

<wd l="8434" t="7152" r="9110" b="7339">models,</wd>

<space/>

<wd l="9245" t="7152" r="9797" b="7310">allows</wd>

<space/>

<wd l="9907" t="7152" r="10166" b="7310">for</wd>

<space/>

<wd l="10267" t="7205" r="10502" b="7310">re-</wd>

</ln>

<ln l="6144" t="7421" r="10512" b="7622" baseLine="7574" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7421" r="6821" b="7622">training</wd>

<space/>

<wd l="6893" t="7421" r="7282" b="7579">with</wd>

<space/>

<wd l="7349" t="7474" r="7704" b="7579">new</wd>

<space/>

<wd l="7776" t="7421" r="8693" b="7622">languages.</wd>

<space/>

<wd l="8813" t="7421" r="9149" b="7579">The</wd>

<space/>

<wd l="9226" t="7445" r="9840" b="7579">current</wd>

<space/>

<wd l="9907" t="7421" r="10512" b="7579">release</wd>

<space/>

</ln>

<ln l="6149" t="7694" r="10502" b="7853" baseLine="7843" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="7694" r="6538" b="7853">does</wd>

<space/>

<wd l="6619" t="7718" r="6898" b="7853">not</wd>

<space/>

<wd l="6974" t="7694" r="7445" b="7853">allow</wd>

<space/>

<wd l="7526" t="7694" r="7781" b="7853">for</wd>

<space/>

<wd l="7853" t="7694" r="8117" b="7853">the</wd>

<space/>

<wd l="8194" t="7694" r="8995" b="7853">inclusion</wd>

<space/>

<wd l="9072" t="7694" r="9264" b="7853">of</wd>

<space/>

<wd l="9322" t="7694" r="9586" b="7853">the</wd>

<space/>

<wd l="9662" t="7694" r="10258" b="7853">lemma</wd>

<space/>

<wd l="10334" t="7747" r="10502" b="7853">as</wd>

<space/>

</ln>

<ln l="6149" t="7963" r="10502" b="8165" baseLine="8112" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="8016" r="6245" b="8122">a</wd>

<space/>

<wd l="6317" t="7963" r="6922" b="8122">feature</wd>

<space/>

<wd l="6998" t="7963" r="7171" b="8117">in</wd>

<space/>

<wd l="7243" t="7963" r="7968" b="8165">training,</wd>

<space/>

<wd l="8059" t="7963" r="8827" b="8122">however.</wd>

<space/>

<wd l="8966" t="7963" r="9643" b="8150">Instead,</wd>

<space/>

<wd l="9734" t="7963" r="9994" b="8122">for</wd>

<space/>

<wd l="10066" t="8016" r="10502" b="8122">com-</wd>

</ln>

<ln l="6144" t="8232" r="10502" b="8434" baseLine="8386" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8232" r="6787" b="8434">parison</wd>

<space/>

<wd l="6869" t="8285" r="7690" b="8434">purposes,</wd>

<space/>

<wd l="7790" t="8285" r="8045" b="8390">we</wd>

<space/>

<wd l="8126" t="8261" r="8650" b="8434">report</wd>

<space/>

<wd l="8736" t="8285" r="8952" b="8390">on</wd>

<space/>

<wd l="9029" t="8256" r="9350" b="8390">two</wd>

<space/>

<wd l="9446" t="8256" r="10152" b="8434">separate</wd>

<space/>

<wd l="10238" t="8285" r="10502" b="8390">ex-</wd>

</ln>

<ln l="6144" t="8506" r="10502" b="8707" baseLine="8654" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8506" r="7051" b="8707">periments,</wd>

<space/>

<wd l="7171" t="8558" r="7478" b="8664">one</wd>

<space/>

<wd l="7579" t="8506" r="8045" b="8707">using</wd>

<space/>

<wd l="8146" t="8506" r="8410" b="8664">the</wd>

<space/>

<wd l="8520" t="8506" r="9134" b="8664">surface</wd>

<space/>

<wd l="9230" t="8506" r="9792" b="8664">tokens</wd>

<space/>

<wd l="9898" t="8558" r="10070" b="8664">as</wd>

<space/>

<wd l="10171" t="8506" r="10502" b="8664">fea-</wd>

</ln>

<ln l="6144" t="8774" r="10502" b="8976" baseLine="8928" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8798" r="6614" b="8962">tures,</wd>

<space/>

<wd l="6691" t="8774" r="6998" b="8933">and</wd>

<space/>

<wd l="7056" t="8774" r="7325" b="8933">the</wd>

<space/>

<wd l="7387" t="8774" r="7834" b="8933">other</wd>

<space/>

<wd l="7891" t="8774" r="8362" b="8976">using</wd>

<space/>

<wd l="8429" t="8774" r="8808" b="8976">only</wd>

<space/>

<wd l="8870" t="8774" r="9134" b="8933">the</wd>

<space/>

<wd l="9192" t="8774" r="9864" b="8933">lemmas</wd>

<space/>

<wd l="9936" t="8827" r="10104" b="8933">as</wd>

<space/>

<wd l="10171" t="8774" r="10502" b="8933">fea-</wd>

</ln>

<ln l="6144" t="9048" r="10512" b="9245" baseLine="9197">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="9072" r="6562" b="9206">tures</wd>

<space/>

</run>

<wd l="6658" t="9053" r="7714" b="9245"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ArkForm,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="7896" t="9053" r="9062" b="9245"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ArkLemma</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9211" t="9053" r="9494" b="9206">We</wd>

<space/>

<wd l="9576" t="9048" r="9922" b="9206">also</wd>

<space/>

<wd l="10003" t="9048" r="10512" b="9206">tested</wd>

<space/>

</run>

</ln>

<ln l="6144" t="9317" r="10498" b="9504" baseLine="9470" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="9317" r="6859" b="9475">versions</wd>

<space/>

<wd l="6936" t="9317" r="7123" b="9475">of</wd>

<space/>

<wd l="7176" t="9370" r="7469" b="9475">our</wd>

<space/>

<wd l="7526" t="9317" r="7891" b="9475">data</wd>

<space/>

<wd l="7949" t="9317" r="8338" b="9475">with</wd>

<space/>

<wd l="8395" t="9317" r="9365" b="9475">normalised</wd>

<space/>

<wd l="9432" t="9317" r="10498" b="9504">at-mentions,</wd>

<space/>

</ln>

<ln l="6144" t="9590" r="8746" b="9792" baseLine="9739" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="9590" r="6888" b="9792">hashtags</wd>

<space/>

<wd l="6955" t="9590" r="7267" b="9749">and</wd>

<space/>

<wd l="7320" t="9595" r="7886" b="9778">URLs,</wd>

<space/>

<wd l="7958" t="9643" r="8126" b="9749">as</wd>

<space/>

<wd l="8194" t="9590" r="8746" b="9749">above.</wd>

</ln>

</para>

<para l="6144" t="9998" r="10512" b="12370" alignment="left" spaceBefore="180" lsp="exactly" lspExact="271" language="en">

<ln l="6149" t="9998" r="10512" b="10200" baseLine="10147">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><wd l="6149" t="9998" r="6965" b="10157">Stanford</wd>

<space/>

<wd l="7109" t="10013" r="7704" b="10200">tagger</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><wd l="7920" t="10003" r="8208" b="10157">We</wd>

<space/>

<wd l="8352" t="9998" r="9202" b="10157">re-trained</wd>

<space/>

<wd l="9346" t="9998" r="9614" b="10157">the</wd>

<space/>

<wd l="9763" t="9998" r="10512" b="10157">Stanford</wd>

<space/>

</run>

</ln>

<ln l="6144" t="10267" r="10498" b="10469" baseLine="10421" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="10291" r="6696" b="10469">tagger</wd>

<space/>

<wd l="6754" t="10272" r="7728" b="10464">(Toutanova</wd>

<space/>

<wd l="7776" t="10291" r="7934" b="10426">et</wd>

<space/>

<wd l="7987" t="10267" r="8237" b="10454">al.,</wd>

<space/>

<wd l="8304" t="10272" r="8798" b="10464">2003)</wd>

<space/>

<wd l="8861" t="10267" r="9250" b="10426">with</wd>

<space/>

<wd l="9302" t="10320" r="9595" b="10426">our</wd>

<space/>

<wd l="9643" t="10267" r="10042" b="10426">Irish</wd>

<space/>

<wd l="10099" t="10267" r="10498" b="10426">data.</wd>

<space/>

</ln>

<ln l="6144" t="10541" r="10512" b="10742" baseLine="10690" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="10546" r="6432" b="10699">We</wd>

<space/>

<wd l="6518" t="10541" r="7699" b="10742">experimented</wd>

<space/>

<wd l="7786" t="10541" r="8002" b="10742">by</wd>

<space/>

<wd l="8088" t="10541" r="8765" b="10742">training</wd>

<space/>

<wd l="8851" t="10541" r="9475" b="10699">models</wd>

<space/>

<wd l="9566" t="10541" r="10037" b="10742">using</wd>

<space/>

<wd l="10123" t="10541" r="10512" b="10699">both</wd>

<space/>

</ln>

<ln l="6144" t="10810" r="10512" b="11011" baseLine="10963">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><wd l="6144" t="10810" r="6413" b="10968">the</wd>

<space/>

<wd l="6547" t="10810" r="7166" b="10968">surface</wd>

<space/>

<wd l="7291" t="10810" r="7718" b="10968">form</wd>

<space/>

<wd l="7843" t="10810" r="8227" b="11011">only</wd>

<space/>

</run>

<wd l="8362" t="10814" r="10061" b="11006"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">(</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">BestStanForm</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><space/>

<wd l="10200" t="10810" r="10512" b="10968">and</wd>

<space/>

</run>

</ln>

<ln l="6144" t="11083" r="10512" b="11285" baseLine="11232">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><wd l="6144" t="11083" r="6413" b="11242">the</wd>

<space/>

<wd l="6499" t="11083" r="7099" b="11242">lemma</wd>

<space/>

<wd l="7190" t="11083" r="7570" b="11285">only</wd>

<space/>

</run>

<wd l="7670" t="11088" r="9552" b="11280"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">(</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">BestStanLemma</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">).</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><space/>

<wd l="9730" t="11083" r="10070" b="11242">The</wd>

<space/>

<wd l="10162" t="11083" r="10512" b="11242">best</wd>

<space/>

</run>

</ln>

<ln l="6144" t="11352" r="10512" b="11554" baseLine="11506" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6144" t="11352" r="7123" b="11554">performing</wd>

<space/>

<wd l="7224" t="11352" r="7766" b="11510">model</wd>

<space/>

<wd l="7862" t="11405" r="8194" b="11510">was</wd>

<space/>

<wd l="8299" t="11352" r="8794" b="11510">based</wd>

<space/>

<wd l="8894" t="11405" r="9110" b="11510">on</wd>

<space/>

<wd l="9206" t="11352" r="9470" b="11510">the</wd>

<space/>

<wd l="9566" t="11352" r="10171" b="11510">feature</wd>

<space/>

<wd l="10277" t="11376" r="10512" b="11510">set</wd>

<space/>

</ln>

<ln l="6163" t="11640" r="10411" b="11822" baseLine="11774" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">

<wd l="6163" t="11640" r="7531" b="11813">left3words,</wd>

<space/>

<wd l="7738" t="11640" r="8971" b="11813">suffix(4),</wd>

<space/>

<wd l="9163" t="11640" r="10411" b="11822">prefix(3),</wd>

<space/>

</ln>

<ln l="6149" t="11909" r="10248" b="12091" baseLine="12043">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><wd l="6149" t="11909" r="8318" b="12091">wordshapes(-3,3),</wd>

<space/>

</run>

<wd l="8506" t="11909" r="10248" b="12082"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">biwords(-1,1)</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><space/>

</run>

</ln>

<ln l="6144" t="12130" r="9134" b="12370" baseLine="12312">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><wd l="6144" t="12168" r="6614" b="12370">using</wd>

<space/>

<wd l="6672" t="12168" r="6941" b="12326">the</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><wd l="7008" t="12182" r="7752" b="12365">owlqn2</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><wd l="7843" t="12168" r="8390" b="12326">search</wd>

<space/>

</run>

<wd l="8453" t="12130" r="9134" b="12370"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">option.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2">6</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="2"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="12576" r="10517" b="14942" alignment="justified" spaceBefore="97" spaceAfter="83" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="12576" r="10512" b="12778" baseLine="12725">

<run bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="12576" r="6922" b="12734">Baseline</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7138" t="12576" r="7786" b="12778">Finally,</wd>

<space/>

<wd l="8074" t="12600" r="8242" b="12734">to</wd>

<space/>

<wd l="8477" t="12576" r="9240" b="12734">establish</wd>

<space/>

<wd l="9475" t="12629" r="9571" b="12734">a</wd>

<space/>

<wd l="9797" t="12576" r="10512" b="12734">baseline</wd>

<space/>

</run>

</ln>

<ln l="6154" t="12845" r="10512" b="13046" baseLine="12994">

<wd l="6154" t="12850" r="7382" b="13042"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Baseline</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">),</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7502" t="12845" r="7810" b="13003">and</wd>

<space/>

<wd l="7906" t="12898" r="8352" b="13003">more</wd>

<space/>

<wd l="8453" t="12845" r="9437" b="13046">specifically</wd>

<space/>

<wd l="9533" t="12869" r="9696" b="13003">to</wd>

<space/>

<wd l="9802" t="12845" r="10512" b="13003">evaluate</wd>

<space/>

</run>

</ln>

<ln l="6144" t="13118" r="10502" b="13320" baseLine="13267" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="13118" r="6413" b="13277">the</wd>

<space/>

<wd l="6576" t="13118" r="7555" b="13320">importance</wd>

<space/>

<wd l="7723" t="13118" r="7915" b="13277">of</wd>

<space/>

<wd l="8069" t="13118" r="9701" b="13320">domain-adaptation</wd>

<space/>

<wd l="9864" t="13118" r="10032" b="13272">in</wd>

<space/>

<wd l="10195" t="13118" r="10502" b="13277">this</wd>

<space/>

</ln>

<ln l="6149" t="13387" r="10512" b="13589" baseLine="13536" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13411" r="6826" b="13574">context,</wd>

<space/>

<wd l="6902" t="13440" r="7157" b="13546">we</wd>

<space/>

<wd l="7219" t="13387" r="8045" b="13546">evaluated</wd>

<space/>

<wd l="8107" t="13440" r="8203" b="13546">a</wd>

<space/>

<wd l="8270" t="13387" r="9811" b="13589">slightly-enhanced</wd>

<space/>

<wd l="9874" t="13387" r="10512" b="13546">version</wd>

<space/>

</ln>

<ln l="6149" t="13656" r="10517" b="13858" baseLine="13810" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13656" r="6341" b="13814">of</wd>

<space/>

<wd l="6466" t="13656" r="6730" b="13814">the</wd>

<space/>

<wd l="6869" t="13656" r="7776" b="13814">rule-based</wd>

<space/>

<wd l="7910" t="13656" r="8314" b="13814">Irish</wd>

<space/>

<wd l="8448" t="13680" r="8995" b="13858">tagger</wd>

<space/>

<wd l="9134" t="13709" r="9350" b="13814">on</wd>

<space/>

<wd l="9485" t="13656" r="9749" b="13814">the</wd>

<space/>

<wd l="9888" t="13656" r="10517" b="13814">Twitter</wd>

<space/>

</ln>

<ln l="6149" t="13930" r="10512" b="14131" baseLine="14078" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="13930" r="6797" b="14088">dataset.</wd>

<space/>

<wd l="7032" t="13930" r="7550" b="14088">When</wd>

<space/>

<wd l="7656" t="13930" r="7925" b="14088">the</wd>

<space/>

<wd l="8030" t="13930" r="8942" b="14088">rule-based</wd>

<space/>

<wd l="9048" t="13954" r="9595" b="14131">tagger</wd>

<space/>

<wd l="9701" t="13930" r="10512" b="14131">produced</wd>

<space/>

</ln>

<ln l="6144" t="14198" r="10498" b="14400" baseLine="14352" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14251" r="6595" b="14357">more</wd>

<space/>

<wd l="6706" t="14198" r="7075" b="14357">than</wd>

<space/>

<wd l="7195" t="14251" r="7502" b="14357">one</wd>

<space/>

<wd l="7613" t="14198" r="8328" b="14400">possible</wd>

<space/>

<wd l="8438" t="14222" r="8702" b="14400">tag</wd>

<space/>

<wd l="8818" t="14198" r="9077" b="14357">for</wd>

<space/>

<wd l="9187" t="14251" r="9283" b="14357">a</wd>

<space/>

<wd l="9394" t="14198" r="9864" b="14400">given</wd>

<space/>

<wd l="9974" t="14198" r="10498" b="14386">token,</wd>

<space/>

</ln>

<ln l="6144" t="14472" r="10512" b="14674" baseLine="14621" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14525" r="6398" b="14630">we</wd>

<space/>

<wd l="6518" t="14472" r="7157" b="14674">applied</wd>

<space/>

<wd l="7272" t="14525" r="7368" b="14630">a</wd>

<space/>

<wd l="7478" t="14472" r="8098" b="14674">bigram</wd>

<space/>

<wd l="8208" t="14496" r="8472" b="14674">tag</wd>

<space/>

<wd l="8587" t="14472" r="9130" b="14630">model</wd>

<space/>

<wd l="9245" t="14496" r="9408" b="14630">to</wd>

<space/>

<wd l="9533" t="14472" r="10133" b="14630">choose</wd>

<space/>

<wd l="10243" t="14472" r="10512" b="14630">the</wd>

<space/>

</ln>

<ln l="6144" t="14741" r="10512" b="14942" baseLine="14894" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="14765" r="6571" b="14899">most</wd>

<space/>

<wd l="6672" t="14741" r="7162" b="14942">likely</wd>

<space/>

<wd l="7267" t="14765" r="7579" b="14942">tag,</wd>

<space/>

<wd l="7709" t="14794" r="7877" b="14899">as</wd>

<space/>

<wd l="7987" t="14794" r="8242" b="14899">we</wd>

<space/>

<wd l="8352" t="14741" r="8626" b="14899">did</wd>

<space/>

<wd l="8726" t="14741" r="8899" b="14894">in</wd>

<space/>

<wd l="9005" t="14741" r="9696" b="14942">creating</wd>

<space/>

<wd l="9802" t="14741" r="10070" b="14899">the</wd>

<space/>

<wd l="10176" t="14741" r="10512" b="14899">first</wd>

</ln>

</para>

<rulerline l="6142" t="15048" r="7344" b="15048" type="single" width="10" color="000000"/>

<para l="6398" t="15096" r="9043" b="15302" alignment="left" li="216" spaceBefore="54" spaceAfter="12" lsp="exactly" lspExact="213" language="en">

<ln l="6398" t="15096" r="9043" b="15302" baseLine="15257">

<wd l="6398" t="15096" r="6691" b="15259"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">6</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">All</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6749" t="15134" r="7114" b="15264">other</wd>

<space/>

<wd l="7162" t="15134" r="7656" b="15264">default</wd>

<space/>

<wd l="7699" t="15134" r="8237" b="15302">settings</wd>

<space/>

<wd l="8290" t="15173" r="8635" b="15264">were</wd>

<space/>

<wd l="8683" t="15134" r="9043" b="15264">used.</wd>

</run>

</ln>

</para>

</column>

</section>

<dd l="1440" t="15736" r="10524" b="15977">

<para l="5862" t="15787" r="6085" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5928" t="15787" r="6019" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="0">

<wd l="5928" t="15787" r="6019" b="15946">5</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4301.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1433" marginTop="1260" marginRight="1378" marginBottom="1302" offsetX="-26" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1433" t="1260" r="10531" b="15316">

<column l="1433" t="1260" r="5820" b="15316">

<para l="1445" t="1320" r="5803" b="2064" alignment="justified" lsp="exactly" lspExact="271" language="en">

<ln l="1445" t="1320" r="5803" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="1320" r="1853" b="1478">draft</wd>

<space/>

<wd l="1920" t="1320" r="2107" b="1478">of</wd>

<space/>

<wd l="2160" t="1320" r="2424" b="1478">the</wd>

<space/>

<wd l="2491" t="1320" r="3686" b="1522">gold-standard</wd>

<space/>

<wd l="3754" t="1373" r="4373" b="1522">corpus.</wd>

<space/>

<wd l="4474" t="1325" r="4656" b="1474">In</wd>

<space/>

<wd l="4723" t="1320" r="5477" b="1507">addition,</wd>

<space/>

<wd l="5549" t="1373" r="5803" b="1478">we</wd>

<space/>

</ln>

<ln l="1445" t="1594" r="5803" b="1795" baseLine="1742">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1445" t="1594" r="2626" b="1795">automatically</wd>

<space/>

<wd l="2688" t="1594" r="3437" b="1795">assigned</wd>

<space/>

<wd l="3494" t="1594" r="3758" b="1752">the</wd>

<space/>

<wd l="3821" t="1618" r="4080" b="1795">tag</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4147" t="1622" r="4267" b="1752">U</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4330" t="1618" r="4498" b="1752">to</wd>

<space/>

<wd l="4565" t="1594" r="4776" b="1752">all</wd>

<space/>

<wd l="4834" t="1598" r="5400" b="1781">URLs,</wd>

<space/>

<wd l="5467" t="1598" r="5578" b="1747">#</wd>

<space/>

<wd l="5635" t="1618" r="5803" b="1752">to</wd>

<space/>

</run>

</ln>

<ln l="1445" t="1862" r="4771" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="1862" r="1656" b="2021">all</wd>

<space/>

<wd l="1714" t="1862" r="2506" b="2064">hashtags,</wd>

<space/>

<wd l="2578" t="1862" r="2890" b="2021">and</wd>

<space/>

<wd l="2966" t="1867" r="3120" b="2021">@</wd>

<space/>

<wd l="3197" t="1886" r="3365" b="2021">to</wd>

<space/>

<wd l="3427" t="1862" r="3638" b="2021">all</wd>

<space/>

<wd l="3701" t="1862" r="4771" b="2021">at-mentions.</wd>

</ln>

</para>

<para l="1445" t="2371" r="2606" b="2530" alignment="left" spaceBefore="260" spaceAfter="294" lsp="exactly" lspExact="253" language="en">

<ln l="1445" t="2371" r="2606" b="2530" baseLine="2525" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="12">

<wd l="1445" t="2371" r="1709" b="2530">5.3</wd>

<space/>

<wd l="1934" t="2376" r="2606" b="2530">Results</wd>

</ln>

</para>

<table l="1594" t="2899" r="5650" b="8208" alignment="left" li="161" ri="170" spaceBefore="5" spaceAfter="252">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<gridTable>

<gridCol>2578</gridCol>

<gridCol>739</gridCol>

<gridCol>739</gridCol>

<gridRow>283</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>278</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>279</gridRow>

<gridRow>283</gridRow>

<gridRow>278</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>278</gridRow>

<gridRow>279</gridRow>

<gridRow>278</gridRow>

<gridRow>279</gridRow>

<gridRow>283</gridRow>

<gridRow>278</gridRow>

<gridRow>279</gridRow>

<gridRow>283</gridRow>

</gridTable>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1728" t="2942" r="3034" b="3144" alignment="left" li="129" spaceAfter="16" lsp="exactly" lspExact="253" language="en">

<ln l="1728" t="2942" r="3034" b="3144" baseLine="3091" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1728" t="2942" r="2530" b="3144">Training</wd>

<space/>

<wd l="2587" t="2947" r="3034" b="3101">Data</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4291" t="2947" r="4656" b="3101" alignment="right" ri="220" spaceAfter="16" lsp="exactly" lspExact="253" language="en">

<ln l="4291" t="2947" r="4656" b="3101" baseLine="3091" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="4291" t="2947" r="4656" b="3101">Dev</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5035" t="2947" r="5414" b="3101" alignment="right" ri="220" spaceAfter="16" lsp="exactly" lspExact="253" language="en">

<ln l="5035" t="2947" r="5414" b="3101" baseLine="3091" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="5035" t="2947" r="5414" b="3101">Test</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="3235" t="3221" r="4008" b="3379" alignment="centered" spaceAfter="21" lsp="exactly" lspExact="253" language="en">

<ln l="3235" t="3221" r="4008" b="3379" baseLine="3374" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3235" t="3221" r="4008" b="3379">Baseline</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="3499" r="3398" b="3701" alignment="left" li="129" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="1723" t="3499" r="3398" b="3701" baseLine="3653" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1723" t="3499" r="2741" b="3658">Rule-Based</wd>

<space/>

<wd l="2794" t="3504" r="3398" b="3701">Tagger</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="3499" r="4776" b="3658" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="4301"/>

<ln l="4301" t="3499" r="4776" b="3658" baseLine="3653" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4301" t="3499" r="4776" b="3658">85.07</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5040" t="3499" r="5501" b="3658" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="5040"/>

<ln l="5040" t="3499" r="5501" b="3658" baseLine="3653" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-5">

<wd l="5040" t="3499" r="5501" b="3658">83.51</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="2" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="3211" t="3778" r="4032" b="3936" alignment="centered" spaceAfter="11" lsp="exactly" lspExact="253" language="en">

<ln l="3211" t="3778" r="4032" b="3936" baseLine="3931" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="3211" t="3778" r="4032" b="3936">Morfette</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="4061" r="2611" b="4219" alignment="left" li="129" spaceAfter="24" lsp="exactly" lspExact="250" language="en">

<ln l="1723" t="4061" r="2611" b="4219" baseLine="4210" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">

<wd l="1723" t="4061" r="2611" b="4219">BaseMorf</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="4061" r="4776" b="4219" alignment="left" spaceAfter="24" lsp="exactly" lspExact="250" language="en">

<tabs position="4301"/>

<ln l="4301" t="4061" r="4776" b="4219" baseLine="4210" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4301" t="4061" r="4776" b="4219">86.77</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="4" gridRowTill="4" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5040" t="4061" r="5515" b="4219" alignment="left" spaceAfter="24" lsp="exactly" lspExact="250" language="en">

<tabs position="5040"/>

<ln l="5040" t="4061" r="5515" b="4219" baseLine="4210" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5040" t="4061" r="5515" b="4219">88.67</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="5" gridRowTill="5" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="4339" r="2693" b="4498" alignment="left" li="129" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="1723" t="4339" r="2693" b="4498" baseLine="4488" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1723" t="4339" r="2693" b="4498">NormMorf</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="4339" r="4781" b="4498" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="4301"/>

<ln l="4301" t="4339" r="4781" b="4498" baseLine="4488" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4301" t="4344" r="4781" b="4498">87.94</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="5" gridRowTill="5" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5040" t="4339" r="5520" b="4498" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="5040"/>

<ln l="5040" t="4339" r="5520" b="4498" baseLine="4488" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5040" t="4344" r="5520" b="4498">88.74</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="6" gridRowTill="6" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="4618" r="3096" b="4776" alignment="left" li="129" spaceAfter="29" lsp="exactly" lspExact="249" language="en">

<ln l="1723" t="4618" r="3096" b="4776" baseLine="4766" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1723" t="4618" r="3096" b="4776">BaseMorf+Dict</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="6" gridRowTill="6" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="4618" r="4781" b="4776" alignment="left" spaceAfter="29" lsp="exactly" lspExact="249" language="en">

<tabs position="4301"/>

<ln l="4301" t="4618" r="4781" b="4776" baseLine="4766" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4301" t="4618" r="4781" b="4776">87.50</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="6" gridRowTill="6" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5040" t="4622" r="5515" b="4776" alignment="left" spaceAfter="29" lsp="exactly" lspExact="249" language="en">

<tabs position="5040"/>

<ln l="5040" t="4622" r="5515" b="4776" baseLine="4766" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5040" t="4622" r="5515" b="4776">89.27</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="7" gridRowTill="7" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="4896" r="3182" b="5054" alignment="left" li="129" spaceAfter="24" lsp="exactly" lspExact="249" language="en">

<ln l="1723" t="4896" r="3182" b="5054" baseLine="5045" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1723" t="4896" r="3182" b="5054">NormMorf+Dict</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="7" gridRowTill="7" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="4901" r="4776" b="5054" alignment="left" spaceAfter="24" lsp="exactly" lspExact="249" language="en">

<tabs position="4301"/>

<ln l="4301" t="4901" r="4776" b="5054" baseLine="5045" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4301" t="4901" r="4776" b="5054">88.47</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="7" gridRowTill="7" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5035" t="4896" r="5520" b="5054" alignment="left" spaceAfter="24" lsp="exactly" lspExact="249" language="en">

<tabs position="5035"/>

<ln l="5035" t="4896" r="5520" b="5054" baseLine="5045" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5035" t="4901" r="5520" b="5054">90.22</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="2" gridRowFrom="8" gridRowTill="8" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="3379" t="5174" r="3864" b="5328" alignment="centered" spaceAfter="16" lsp="exactly" lspExact="248" language="en">

<ln l="3379" t="5174" r="3864" b="5328" baseLine="5323" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3379" t="5174" r="3864" b="5328">ARK</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="9" gridRowTill="9" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="5453" r="2957" b="5611" alignment="left" li="129" spaceAfter="29" lsp="exactly" lspExact="245" language="en">

<ln l="1723" t="5453" r="2957" b="5611" baseLine="5602" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1723" t="5453" r="2957" b="5611">BaseArkForm</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="9" gridRowTill="9" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="5458" r="4776" b="5611" alignment="left" spaceAfter="29" lsp="exactly" lspExact="245" language="en">

<tabs position="4301"/>

<ln l="4301" t="5458" r="4776" b="5611" baseLine="5602" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="4301" t="5458" r="4776" b="5611">88.39</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="9" gridRowTill="9" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5040" t="5453" r="5520" b="5611" alignment="left" spaceAfter="29" lsp="exactly" lspExact="245" language="en">

<tabs position="5040"/>

<ln l="5040" t="5453" r="5520" b="5611" baseLine="5602" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5040" t="5458" r="5520" b="5611">89.92</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="10" gridRowTill="10" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="5731" r="2818" b="5890" alignment="left" li="129" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="1723" t="5731" r="2818" b="5890" baseLine="5885" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1723" t="5731" r="2818" b="5890">ArkForm#@</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="10" gridRowTill="10" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="5731" r="4781" b="5890" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="4301"/>

<ln l="4301" t="5731" r="4781" b="5890" baseLine="5885" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4301" t="5731" r="4781" b="5890">89.36</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="10" gridRowTill="10" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5035" t="5731" r="5520" b="5890" alignment="left" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<tabs position="5035"/>

<ln l="5035" t="5731" r="5520" b="5890" baseLine="5885" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="5035" t="5736" r="5520" b="5890">90.94</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="11" gridRowTill="11" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="6010" r="3254" b="6168" alignment="left" li="129" spaceAfter="15" lsp="exactly" lspExact="249" language="en">

<ln l="1723" t="6010" r="3254" b="6168" baseLine="6163" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1723" t="6010" r="3254" b="6168">ArkForm#URL@</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="11" gridRowTill="11" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="6010" r="4781" b="6168" alignment="left" spaceAfter="15" lsp="exactly" lspExact="249" language="en">

<tabs position="4301"/>

<ln l="4301" t="6010" r="4781" b="6168" baseLine="6163" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4301" t="6014" r="4781" b="6168">89.32</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="11" gridRowTill="11" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5035" t="6010" r="5520" b="6168" alignment="left" spaceAfter="15" lsp="exactly" lspExact="249" language="en">

<tabs position="5035"/>

<ln l="5035" t="6010" r="5520" b="6168" baseLine="6163" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5035" t="6014" r="5520" b="6168">91.02</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="12" gridRowTill="12" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="6288" r="3701" b="6446" alignment="left" li="129" spaceAfter="24" lsp="exactly" lspExact="250" language="en">

<ln l="1723" t="6288" r="3701" b="6446" baseLine="6442" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1723" t="6288" r="3701" b="6446">BaseArkLemma#URL</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="12" gridRowTill="12" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4296" t="6288" r="4781" b="6446" alignment="left" spaceAfter="24" lsp="exactly" lspExact="250" language="en">

<tabs position="4296"/>

<ln l="4296" t="6288" r="4781" b="6446" baseLine="6442" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="4296" t="6293" r="4781" b="6446">90.74</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="12" gridRowTill="12" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5035" t="6288" r="5520" b="6446" alignment="left" spaceAfter="24" lsp="exactly" lspExact="250" language="en">

<tabs position="5035"/>

<ln l="5035" t="6288" r="5520" b="6446" baseLine="6442" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5035" t="6288" r="5520" b="6446">91.62</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="13" gridRowTill="13" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="6571" r="3451" b="6730" alignment="left" li="129" spaceAfter="19" lsp="exactly" lspExact="249" language="en">

<ln l="1723" t="6571" r="3451" b="6730" baseLine="6720" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1723" t="6571" r="3451" b="6730">ArkLemma#URL@</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="13" gridRowTill="13" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4296" t="6571" r="4781" b="6730" alignment="left" spaceAfter="15" lsp="exactly" lspExact="253" language="en">

<tabs position="4296"/>

<ln l="4296" t="6571" r="4781" b="6730" baseLine="6720" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1" foreColor="0000ff">

<wd l="4296" t="6571" r="4781" b="6730">91.46</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="13" gridRowTill="13" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5035" t="6571" r="5520" b="6730" alignment="left" spaceAfter="15" lsp="exactly" lspExact="253" language="en">

<tabs position="5035"/>

<ln l="5035" t="6571" r="5520" b="6730" baseLine="6720" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1" foreColor="0000ff">

<wd l="5035" t="6571" r="5520" b="6730">91.89</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="2" gridRowFrom="14" gridRowTill="14" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="3216" t="6850" r="4032" b="7008" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="253" language="en">

<ln l="3216" t="6850" r="4032" b="7008" baseLine="6998" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="3216" t="6850" r="4032" b="7008">Stanford</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="15" gridRowTill="15" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="7128" r="2971" b="7286" alignment="left" li="129" spaceAfter="24" lsp="exactly" lspExact="249" language="en">

<ln l="1723" t="7128" r="2971" b="7286" baseLine="7277" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1723" t="7133" r="2971" b="7286">BestStanForm</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="15" gridRowTill="15" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="7128" r="4781" b="7286" alignment="left" spaceAfter="24" lsp="exactly" lspExact="249" language="en">

<tabs position="4301"/>

<ln l="4301" t="7128" r="4781" b="7286" baseLine="7277" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4301" t="7128" r="4781" b="7286">82.36</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="15" gridRowTill="15" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5040" t="7133" r="5515" b="7286" alignment="left" spaceAfter="24" lsp="exactly" lspExact="249" language="en">

<tabs position="5040"/>

<ln l="5040" t="7133" r="5515" b="7286" baseLine="7277" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="5040" t="7133" r="5515" b="7286">84.08</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="16" gridRowTill="16" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="7411" r="3168" b="7565" alignment="left" li="129" spaceAfter="20" lsp="exactly" lspExact="244" language="en">

<ln l="1723" t="7411" r="3168" b="7565" baseLine="7555" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1723" t="7411" r="3168" b="7565">BestStanLemma</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="16" gridRowTill="16" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4301" t="7406" r="4781" b="7565" alignment="left" spaceAfter="20" lsp="exactly" lspExact="244" language="en">

<tabs position="4301"/>

<ln l="4301" t="7406" r="4781" b="7565" baseLine="7555" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="4301" t="7411" r="4781" b="7565">87.34</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="16" gridRowTill="16" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5040" t="7406" r="5520" b="7565" alignment="left" spaceAfter="20" lsp="exactly" lspExact="244" language="en">

<tabs position="5040"/>

<ln l="5040" t="7406" r="5520" b="7565" baseLine="7555" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="5040" t="7406" r="5520" b="7565">88.36</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="2" gridRowFrom="17" gridRowTill="17" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="2405" t="7685" r="4838" b="7886" alignment="centered" spaceAfter="25" lsp="exactly" lspExact="249" language="en">

<ln l="2405" t="7685" r="4838" b="7886" baseLine="7834" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="2405" t="7685" r="3734" b="7886">Bootstrapping</wd>

<space/>

<wd l="3792" t="7690" r="4195" b="7843">Best</wd>

<space/>

<wd l="4248" t="7690" r="4838" b="7843">Model</wd>

</ln>

</para>

</cell>

<cell gridColFrom="0" gridColTill="0" gridRowFrom="18" gridRowTill="18" alignment="left" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="1723" t="7963" r="4046" b="8122" alignment="left" li="129" spaceAfter="34" lsp="exactly" lspExact="249" language="en">

<ln l="1723" t="7963" r="4046" b="8122" baseLine="8117" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1723" t="7963" r="4046" b="8122">ArkLemma#URL@+NCII</wd>

</ln>

</para>

</cell>

<cell gridColFrom="1" gridColTill="1" gridRowFrom="18" gridRowTill="18" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="4296" t="7963" r="4781" b="8122" alignment="left" spaceAfter="30" lsp="exactly" lspExact="253" language="en">

<tabs position="4296"/>

<ln l="4296" t="7963" r="4781" b="8122" baseLine="8117" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1" foreColor="0000ff">

<wd l="4296" t="7963" r="4781" b="8122">92.60</wd>

</ln>

</para>

</cell>

<cell gridColFrom="2" gridColTill="2" gridRowFrom="18" gridRowTill="18" alignment="decimal" verticalAlignment="middle">

<leftBorder type="single" width="5"/>

<topBorder type="single" width="5"/>

<rightBorder type="single" width="5"/>

<bottomBorder type="single" width="5"/>

<para l="5035" t="7963" r="5520" b="8122" alignment="left" spaceAfter="30" lsp="exactly" lspExact="253" language="en">

<tabs position="5035"/>

<ln l="5035" t="7963" r="5520" b="8122" baseLine="8117" bold="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1" foreColor="0000ff">

<wd l="5035" t="7963" r="5520" b="8122">93.02</wd>

</ln>

</para>

</cell>

</table>

<para l="1440" t="8520" r="5808" b="8995" alignment="justified" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="8520" r="5808" b="8722" baseLine="8674" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="8520" r="1920" b="8678">Table</wd>

<space/>

<wd l="1992" t="8525" r="2136" b="8678">2:</wd>

<space/>

<wd l="2246" t="8520" r="2880" b="8678">Results</wd>

<space/>

<wd l="2962" t="8520" r="3154" b="8678">of</wd>

<space/>

<wd l="3211" t="8520" r="4104" b="8678">evaluation</wd>

<space/>

<wd l="4176" t="8520" r="4363" b="8678">of</wd>

<space/>

<wd l="4416" t="8525" r="5510" b="8722">POS-taggers</wd>

<space/>

<wd l="5592" t="8573" r="5808" b="8678">on</wd>

<space/>

</ln>

<ln l="1440" t="8794" r="3562" b="8995" baseLine="8942" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="8846" r="1795" b="8952">new</wd>

<space/>

<wd l="1853" t="8794" r="2256" b="8952">Irish</wd>

<space/>

<wd l="2309" t="8794" r="2938" b="8952">Twitter</wd>

<space/>

<wd l="2990" t="8846" r="3562" b="8995">corpus</wd>

</ln>

</para>

<para l="1450" t="9379" r="5794" b="9854" alignment="justified" spaceBefore="318" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="9379" r="5794" b="9581" baseLine="9533" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="9379" r="1997" b="9538">The</wd>

<space/>

<wd l="2040" t="9379" r="2602" b="9538">results</wd>

<space/>

<wd l="2654" t="9379" r="2914" b="9538">for</wd>

<space/>

<wd l="2957" t="9379" r="3168" b="9538">all</wd>

<space/>

<wd l="3211" t="9403" r="3835" b="9581">taggers</wd>

<space/>

<wd l="3893" t="9379" r="4205" b="9538">and</wd>

<space/>

<wd l="4248" t="9379" r="5093" b="9538">variations</wd>

<space/>

<wd l="5150" t="9379" r="5338" b="9538">of</wd>

<space/>

<wd l="5376" t="9379" r="5794" b="9538">data-</wd>

</ln>

<ln l="1450" t="9653" r="4075" b="9854" baseLine="9802" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="9677" r="1896" b="9854">setup</wd>

<space/>

<wd l="1958" t="9706" r="2222" b="9811">are</wd>

<space/>

<wd l="2275" t="9653" r="3115" b="9854">presented</wd>

<space/>

<wd l="3168" t="9653" r="3336" b="9806">in</wd>

<space/>

<wd l="3389" t="9653" r="3869" b="9811">Table</wd>

<space/>

<wd l="3931" t="9658" r="4075" b="9811">2.</wd>

</ln>

</para>

<para l="1440" t="9941" r="5808" b="14165" alignment="justified" spaceBefore="17" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="9941" r="5803" b="10142" baseLine="10090" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="9941" r="2256" b="10142">Firstly,</wd>

<space/>

<wd l="2462" t="9994" r="2755" b="10099">our</wd>

<space/>

<wd l="2914" t="9941" r="3269" b="10099">best</wd>

<space/>

<wd l="3427" t="9941" r="4406" b="10142">performing</wd>

<space/>

<wd l="4584" t="9941" r="5098" b="10142">single</wd>

<space/>

<wd l="5261" t="9941" r="5803" b="10099">model</wd>

<space/>

</ln>

<ln l="1450" t="10210" r="5808" b="10406" baseLine="10363">

<wd l="1450" t="10214" r="3278" b="10406"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">(</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">ArkLemma#URL@</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="3398" t="10262" r="3614" b="10368">on</wd>

<space/>

<wd l="3720" t="10210" r="3989" b="10368">the</wd>

<space/>

<wd l="4094" t="10234" r="4402" b="10368">test</wd>

<space/>

<wd l="4517" t="10234" r="4752" b="10368">set</wd>

<space/>

<wd l="4862" t="10210" r="5592" b="10368">achieves</wd>

<space/>

<wd l="5712" t="10262" r="5808" b="10368">a</wd>

<space/>

</run>

</ln>

<ln l="1450" t="10483" r="5808" b="10685" baseLine="10632" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1450" t="10536" r="1901" b="10642">score</wd>

<space/>

<wd l="2011" t="10483" r="2203" b="10642">of</wd>

<space/>

<wd l="2299" t="10488" r="3014" b="10670">91.89%,</wd>

<space/>

<wd l="3144" t="10483" r="3677" b="10642">which</wd>

<space/>

<wd l="3782" t="10483" r="3922" b="10642">is</wd>

<space/>

<wd l="4046" t="10488" r="4138" b="10642">8</wd>

<space/>

<wd l="4253" t="10483" r="4776" b="10685">points</wd>

<space/>

<wd l="4896" t="10483" r="5405" b="10642">above</wd>

<space/>

<wd l="5520" t="10536" r="5808" b="10642">our</wd>

<space/>

</ln>

<ln l="1440" t="10752" r="5794" b="10910" baseLine="10906" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="10752" r="2352" b="10910">rule-based</wd>

<space/>

<wd l="2434" t="10752" r="3149" b="10910">baseline</wd>

<space/>

<wd l="3245" t="10805" r="3696" b="10910">score</wd>

<space/>

<wd l="3787" t="10752" r="3979" b="10910">of</wd>

<space/>

<wd l="4061" t="10752" r="4766" b="10910">83.51%.</wd>

<space/>

<wd l="4944" t="10752" r="5323" b="10910">This</wd>

<space/>

<wd l="5424" t="10805" r="5794" b="10910">con-</wd>

</ln>

<ln l="1445" t="11026" r="5794" b="11227" baseLine="11174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="11026" r="1882" b="11184">firms</wd>

<space/>

<wd l="1968" t="11026" r="2299" b="11184">that</wd>

<space/>

<wd l="2376" t="11026" r="3115" b="11227">tailoring</wd>

<space/>

<wd l="3197" t="11026" r="3874" b="11227">training</wd>

<space/>

<wd l="3965" t="11026" r="4325" b="11184">data</wd>

<space/>

<wd l="4402" t="11026" r="4661" b="11184">for</wd>

<space/>

<wd l="4747" t="11026" r="5794" b="11227">statistically-</wd>

</ln>

<ln l="1445" t="11294" r="5803" b="11496" baseLine="11448" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="11294" r="1992" b="11453">driven</wd>

<space/>

<wd l="2059" t="11294" r="2477" b="11453">tools</wd>

<space/>

<wd l="2558" t="11294" r="2693" b="11453">is</wd>

<space/>

<wd l="2779" t="11347" r="2875" b="11453">a</wd>

<space/>

<wd l="2942" t="11294" r="3250" b="11496">key</wd>

<space/>

<wd l="3326" t="11294" r="4018" b="11453">element</wd>

<space/>

<wd l="4085" t="11294" r="4258" b="11448">in</wd>

<space/>

<wd l="4330" t="11294" r="5256" b="11496">processing</wd>

<space/>

<wd l="5333" t="11294" r="5803" b="11496">noisy</wd>

<space/>

</ln>

<ln l="1440" t="11568" r="5794" b="11770" baseLine="11717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11568" r="2722" b="11770">user-generated</wd>

<space/>

<wd l="2784" t="11592" r="3461" b="11755">content,</wd>

<space/>

<wd l="3538" t="11621" r="3936" b="11726">even</wd>

<space/>

<wd l="3994" t="11568" r="4162" b="11722">in</wd>

<space/>

<wd l="4219" t="11568" r="4488" b="11726">the</wd>

<space/>

<wd l="4550" t="11621" r="4920" b="11726">case</wd>

<space/>

<wd l="4982" t="11568" r="5174" b="11726">of</wd>

<space/>

<wd l="5218" t="11568" r="5794" b="11726">minor-</wd>

</ln>

<ln l="1440" t="11837" r="5794" b="12038" baseLine="11986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="11837" r="1666" b="12038">ity</wd>

<space/>

<wd l="1766" t="11837" r="2678" b="12038">languages.</wd>

<space/>

<wd l="2880" t="11842" r="3014" b="11995">It</wd>

<space/>

<wd l="3106" t="11837" r="3245" b="11995">is</wd>

<space/>

<wd l="3346" t="11837" r="3854" b="11995">worth</wd>

<space/>

<wd l="3946" t="11837" r="4502" b="12038">noting</wd>

<space/>

<wd l="4598" t="11837" r="4930" b="11995">that</wd>

<space/>

<wd l="5021" t="11837" r="5285" b="11995">the</wd>

<space/>

<wd l="5381" t="11837" r="5794" b="11995">best-</wd>

</ln>

<ln l="1440" t="12110" r="5794" b="12312" baseLine="12259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="12110" r="2419" b="12312">performing</wd>

<space/>

<wd l="2510" t="12110" r="3053" b="12269">model</wd>

<space/>

<wd l="3149" t="12110" r="3662" b="12269">learns</wd>

<space/>

<wd l="3758" t="12110" r="4186" b="12269">from</wd>

<space/>

<wd l="4272" t="12110" r="4536" b="12269">the</wd>

<space/>

<wd l="4627" t="12110" r="5227" b="12269">lemma</wd>

<space/>

<wd l="5314" t="12110" r="5794" b="12269">infor-</wd>

</ln>

<ln l="1440" t="12379" r="5803" b="12581" baseLine="12528" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="12379" r="2050" b="12538">mation</wd>

<space/>

<wd l="2126" t="12379" r="2746" b="12538">instead</wd>

<space/>

<wd l="2827" t="12379" r="3014" b="12538">of</wd>

<space/>

<wd l="3082" t="12379" r="3346" b="12538">the</wd>

<space/>

<wd l="3432" t="12379" r="4051" b="12538">surface</wd>

<space/>

<wd l="4128" t="12379" r="4598" b="12538">form.</wd>

<space/>

<wd l="4747" t="12379" r="5126" b="12538">This</wd>

<space/>

<wd l="5218" t="12379" r="5803" b="12581">clearly</wd>

<space/>

</ln>

<ln l="1445" t="12648" r="5803" b="12806" baseLine="12802" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12648" r="2582" b="12806">demonstrates</wd>

<space/>

<wd l="2650" t="12648" r="2914" b="12806">the</wd>

<space/>

<wd l="2976" t="12648" r="3461" b="12806">effect</wd>

<space/>

<wd l="3518" t="12648" r="3845" b="12806">that</wd>

<space/>

<wd l="3902" t="12648" r="4166" b="12806">the</wd>

<space/>

<wd l="4224" t="12648" r="5203" b="12806">inflectional</wd>

<space/>

<wd l="5261" t="12672" r="5803" b="12806">nature</wd>

<space/>

</ln>

<ln l="1445" t="12922" r="5798" b="13123" baseLine="13070" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1445" t="12922" r="1637" b="13080">of</wd>

<space/>

<wd l="1690" t="12922" r="2088" b="13080">Irish</wd>

<space/>

<wd l="2150" t="12922" r="2434" b="13080">has</wd>

<space/>

<wd l="2515" t="12974" r="2726" b="13080">on</wd>

<space/>

<wd l="2798" t="12922" r="3158" b="13080">data</wd>

<space/>

<wd l="3230" t="12922" r="3931" b="13123">sparsity.</wd>

<space/>

<wd l="4042" t="12922" r="4378" b="13080">The</wd>

<space/>

<wd l="4445" t="12922" r="5798" b="13123">Twitter-specific</wd>

<space/>

</ln>

<ln l="1440" t="13190" r="5798" b="13392" baseLine="13344" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13190" r="2002" b="13349">tokens</wd>

<space/>

<wd l="2107" t="13190" r="2496" b="13349">such</wd>

<space/>

<wd l="2592" t="13243" r="2760" b="13349">as</wd>

<space/>

<wd l="2856" t="13195" r="3422" b="13378">URLs,</wd>

<space/>

<wd l="3533" t="13190" r="4272" b="13392">hashtags</wd>

<space/>

<wd l="4378" t="13190" r="4690" b="13349">and</wd>

<space/>

<wd l="4781" t="13190" r="5798" b="13349">at-mentions</wd>

<space/>

</ln>

<ln l="1440" t="13464" r="5794" b="13622" baseLine="13613" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13464" r="1843" b="13622">have</wd>

<space/>

<wd l="1901" t="13464" r="2314" b="13622">been</wd>

<space/>

<wd l="2366" t="13464" r="3336" b="13622">normalised</wd>

<space/>

<wd l="3389" t="13464" r="3922" b="13622">which</wd>

<space/>

<wd l="3979" t="13464" r="5122" b="13622">demonstrates</wd>

<space/>

<wd l="5179" t="13464" r="5448" b="13622">the</wd>

<space/>

<wd l="5501" t="13464" r="5794" b="13618">im-</wd>

</ln>

<ln l="1440" t="13733" r="5808" b="13934" baseLine="13886" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="13757" r="1805" b="13934">pact</wd>

<space/>

<wd l="1858" t="13733" r="2122" b="13891">the</wd>

<space/>

<wd l="2174" t="13733" r="2818" b="13891">relative</wd>

<space/>

<wd l="2870" t="13733" r="3830" b="13934">uniqueness</wd>

<space/>

<wd l="3898" t="13733" r="4090" b="13891">of</wd>

<space/>

<wd l="4123" t="13733" r="4574" b="13891">these</wd>

<space/>

<wd l="4627" t="13733" r="5184" b="13891">tokens</wd>

<space/>

<wd l="5246" t="13733" r="5530" b="13891">has</wd>

<space/>

<wd l="5592" t="13786" r="5808" b="13891">on</wd>

<space/>

</ln>

<ln l="1440" t="14006" r="2400" b="14165" baseLine="14155" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="14006" r="1704" b="14165">the</wd>

<space/>

<wd l="1762" t="14006" r="2400" b="14165">learner.</wd>

</ln>

</para>

<para l="1440" t="14294" r="5803" b="15307" alignment="justified" spaceBefore="20" fli="216" lsp="exactly" lspExact="268" language="en">

<ln l="1656" t="14294" r="5794" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1656" t="14294" r="1934" b="14448">All</wd>

<space/>

<wd l="2002" t="14294" r="2194" b="14453">of</wd>

<space/>

<wd l="2246" t="14347" r="2534" b="14453">our</wd>

<space/>

<wd l="2592" t="14294" r="3154" b="14453">results</wd>

<space/>

<wd l="3230" t="14347" r="3490" b="14453">are</wd>

<space/>

<wd l="3557" t="14294" r="4570" b="14496">comparable</wd>

<space/>

<wd l="4627" t="14294" r="5021" b="14453">with</wd>

<space/>

<wd l="5088" t="14294" r="5794" b="14453">state-of-</wd>

</ln>

<ln l="1440" t="14563" r="5794" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1440" t="14563" r="2011" b="14722">the-art</wd>

<space/>

<wd l="2093" t="14563" r="2654" b="14722">results</wd>

<space/>

<wd l="2746" t="14563" r="3562" b="14765">produced</wd>

<space/>

<wd l="3643" t="14563" r="3859" b="14765">by</wd>

<space/>

<wd l="3950" t="14563" r="4598" b="14765">Gimpel</wd>

<space/>

<wd l="4690" t="14587" r="4843" b="14722">et</wd>

<space/>

<wd l="4934" t="14563" r="5126" b="14722">al.</wd>

<space/>

<wd l="5232" t="14568" r="5794" b="14760">(2011)</wd>

<space/>

</ln>

<ln l="1445" t="14837" r="5794" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="14837" r="1757" b="14995">and</wd>

<space/>

<wd l="1858" t="14837" r="2611" b="15038">Owoputi</wd>

<space/>

<wd l="2717" t="14861" r="2870" b="14995">et</wd>

<space/>

<wd l="2971" t="14837" r="3163" b="14995">al.</wd>

<space/>

<wd l="3283" t="14842" r="3898" b="15034">(2013).</wd>

<space/>

<wd l="4104" t="14837" r="4483" b="14995">This</wd>

<space/>

<wd l="4589" t="14837" r="4723" b="14995">is</wd>

<space/>

<wd l="4829" t="14837" r="5794" b="15038">interesting,</wd>

<space/>

</ln>

<ln l="1445" t="15106" r="5803" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="1445" t="15106" r="1915" b="15307">given</wd>

<space/>

<wd l="2035" t="15106" r="2366" b="15264">that</wd>

<space/>

<wd l="2482" t="15106" r="2654" b="15259">in</wd>

<space/>

<wd l="2774" t="15130" r="3466" b="15264">contrast</wd>

<space/>

<wd l="3581" t="15130" r="3749" b="15264">to</wd>

<space/>

<wd l="3874" t="15106" r="4277" b="15264">their</wd>

<space/>

<wd l="4392" t="15106" r="4882" b="15293">work,</wd>

<space/>

<wd l="5026" t="15158" r="5280" b="15264">we</wd>

<space/>

<wd l="5400" t="15106" r="5803" b="15264">have</wd>

<space/>

</ln>

</para>

</column>

<column l="6144" t="1260" r="10531" b="15316">

<para l="6144" t="1320" r="10512" b="2563" alignment="justified" lsp="exactly" lspExact="271" language="en">

<ln l="6144" t="1320" r="10512" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="1344" r="6427" b="1478">not</wd>

<space/>

<wd l="6485" t="1320" r="7344" b="1522">optimised</wd>

<space/>

<wd l="7406" t="1373" r="7694" b="1478">our</wd>

<space/>

<wd l="7757" t="1344" r="8357" b="1522">system</wd>

<space/>

<wd l="8410" t="1320" r="8798" b="1478">with</wd>

<space/>

<wd l="8856" t="1320" r="10008" b="1522">unsupervised</wd>

<space/>

<wd l="10066" t="1320" r="10512" b="1478">word</wd>

<space/>

</ln>

<ln l="6149" t="1594" r="10512" b="1752" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="1594" r="6806" b="1752">clusters</wd>

<space/>

<wd l="6907" t="1594" r="7214" b="1752">due</wd>

<space/>

<wd l="7306" t="1618" r="7474" b="1752">to</wd>

<space/>

<wd l="7570" t="1594" r="7834" b="1752">the</wd>

<space/>

<wd l="7925" t="1594" r="8290" b="1752">lack</wd>

<space/>

<wd l="8386" t="1594" r="8573" b="1752">of</wd>

<space/>

<wd l="8659" t="1594" r="9461" b="1752">sufficient</wd>

<space/>

<wd l="9547" t="1594" r="9950" b="1752">Irish</wd>

<space/>

<wd l="10037" t="1618" r="10512" b="1752">tweet</wd>

<space/>

</ln>

<ln l="6149" t="1862" r="10502" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="1862" r="6552" b="2021">data.</wd>

<space/>

<wd l="6629" t="1867" r="6970" b="2021">Nor</wd>

<space/>

<wd l="7013" t="1862" r="7416" b="2021">have</wd>

<space/>

<wd l="7464" t="1915" r="7718" b="2021">we</wd>

<space/>

<wd l="7766" t="1862" r="8515" b="2021">included</wd>

<space/>

<wd l="8568" t="1915" r="8664" b="2021">a</wd>

<space/>

<wd l="8702" t="1886" r="8966" b="2064">tag</wd>

<space/>

<wd l="9024" t="1862" r="9931" b="2064">dictionary,</wd>

<space/>

<wd l="9994" t="1862" r="10502" b="2021">distri-</wd>

</ln>

<ln l="6144" t="2136" r="10507" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6144" t="2136" r="6701" b="2294">bution</wd>

<space/>

<wd l="6773" t="2136" r="7594" b="2338">similarity</wd>

<space/>

<wd l="7666" t="2189" r="7848" b="2294">or</wd>

<space/>

<wd l="7910" t="2136" r="8654" b="2338">phonetic</wd>

<space/>

<wd l="8722" t="2136" r="9926" b="2294">normalisation</wd>

<space/>

<wd l="9989" t="2232" r="10099" b="2246">–</wd>

<space/>

<wd l="10166" t="2136" r="10507" b="2294">also</wd>

<space/>

</ln>

<ln l="6149" t="2405" r="8414" b="2563" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="2405" r="6461" b="2563">due</wd>

<space/>

<wd l="6514" t="2429" r="6682" b="2563">to</wd>

<space/>

<wd l="6744" t="2458" r="6840" b="2563">a</wd>

<space/>

<wd l="6893" t="2405" r="7258" b="2563">lack</wd>

<space/>

<wd l="7315" t="2405" r="7502" b="2563">of</wd>

<space/>

<wd l="7546" t="2458" r="8414" b="2563">resources.</wd>

</ln>

</para>

<para l="6144" t="2698" r="10517" b="7234" alignment="justified" spaceBefore="16" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="2698" r="10512" b="2899" baseLine="2846" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6365" t="2702" r="6648" b="2856">We</wd>

<space/>

<wd l="6778" t="2698" r="7382" b="2856">carried</wd>

<space/>

<wd l="7512" t="2722" r="7786" b="2856">out</wd>

<space/>

<wd l="7915" t="2750" r="8011" b="2856">a</wd>

<space/>

<wd l="8136" t="2698" r="8654" b="2856">closer</wd>

<space/>

<wd l="8779" t="2698" r="9365" b="2856">textual</wd>

<space/>

<wd l="9499" t="2698" r="10512" b="2899">comparison</wd>

<space/>

</ln>

<ln l="6149" t="2966" r="10512" b="3168" baseLine="3120" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="2966" r="6341" b="3125">of</wd>

<space/>

<wd l="6413" t="2966" r="7166" b="3168">Owoputi</wd>

<space/>

<wd l="7258" t="2990" r="7416" b="3125">et</wd>

<space/>

<wd l="7498" t="2966" r="7694" b="3125">al.</wd>

<space/>

<wd l="7800" t="2971" r="8510" b="3163">(2013)’s</wd>

<space/>

<wd l="8602" t="2966" r="9269" b="3168">English</wd>

<space/>

<wd l="9350" t="2990" r="9826" b="3125">tweet</wd>

<space/>

<wd l="9912" t="2966" r="10512" b="3125">dataset</wd>

<space/>

</ln>

<ln l="6154" t="3240" r="10498" b="3437" baseLine="3389">

<wd l="6154" t="3245" r="7330" b="3437"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">(</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">daily547</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">)</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="7454" t="3240" r="7766" b="3398">and</wd>

<space/>

<wd l="7882" t="3293" r="8174" b="3398">our</wd>

<space/>

<wd l="8280" t="3293" r="8635" b="3398">new</wd>

<space/>

<wd l="8750" t="3240" r="9154" b="3398">Irish</wd>

<space/>

<wd l="9264" t="3264" r="9739" b="3398">tweet</wd>

<space/>

<wd l="9854" t="3240" r="10498" b="3398">dataset.</wd>

<space/>

</run>

</ln>

<ln l="6144" t="3509" r="10502" b="3710" baseLine="3662" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="3509" r="6610" b="3667">After</wd>

<space/>

<wd l="6706" t="3509" r="7378" b="3710">running</wd>

<space/>

<wd l="7483" t="3509" r="7882" b="3667">each</wd>

<space/>

<wd l="7982" t="3509" r="8582" b="3667">dataset</wd>

<space/>

<wd l="8678" t="3509" r="9360" b="3710">through</wd>

<space/>

<wd l="9461" t="3562" r="9557" b="3667">a</wd>

<space/>

<wd l="9653" t="3509" r="10502" b="3710">language-</wd>

</ln>

<ln l="6154" t="3782" r="10512" b="3984" baseLine="3931" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6154" t="3782" r="6806" b="3984">specific</wd>

<space/>

<wd l="6907" t="3782" r="8093" b="3984">spell-checker,</wd>

<space/>

<wd l="8198" t="3835" r="8453" b="3941">we</wd>

<space/>

<wd l="8544" t="3782" r="9029" b="3941">could</wd>

<space/>

<wd l="9120" t="3835" r="9389" b="3941">see</wd>

<space/>

<wd l="9475" t="3782" r="9806" b="3941">that</wd>

<space/>

<wd l="9893" t="3782" r="10157" b="3941">the</wd>

<space/>

<wd l="10243" t="3782" r="10512" b="3941">list</wd>

<space/>

</ln>

<ln l="6149" t="4051" r="10502" b="4253" baseLine="4200" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="4051" r="6341" b="4210">of</wd>

<space/>

<wd l="6389" t="4051" r="6946" b="4253">highly</wd>

<space/>

<wd l="7013" t="4051" r="7603" b="4210">ranked</wd>

<space/>

<wd l="7670" t="4056" r="8122" b="4210">OOV</wd>

<space/>

<wd l="8198" t="4056" r="8544" b="4248">(out</wd>

<space/>

<wd l="8606" t="4051" r="8798" b="4210">of</wd>

<space/>

<wd l="8846" t="4051" r="9869" b="4253">vocabulary)</wd>

<space/>

<wd l="9946" t="4051" r="10502" b="4210">tokens</wd>

<space/>

</ln>

<ln l="6144" t="4325" r="10512" b="4526" baseLine="4474">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6144" t="4325" r="6317" b="4478">in</wd>

<space/>

<wd l="6418" t="4325" r="7085" b="4526">English</wd>

<space/>

<wd l="7186" t="4378" r="7450" b="4483">are</wd>

<space/>

<wd l="7550" t="4325" r="8050" b="4483">forms</wd>

<space/>

<wd l="8165" t="4325" r="8352" b="4483">of</wd>

<space/>

<wd l="8438" t="4325" r="9374" b="4526">text-speak,</wd>

<space/>

<wd l="9509" t="4325" r="9902" b="4483">such</wd>

<space/>

<wd l="10003" t="4378" r="10171" b="4483">as</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="10286" t="4325" r="10512" b="4483">lol</wd>

<space/>

</run>

</ln>

<ln l="6168" t="4594" r="10517" b="4795" baseLine="4742">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="6168" t="4594" r="6706" b="4795">‘laugh</wd>

<space/>

<wd l="6778" t="4618" r="7051" b="4752">out</wd>

<space/>

<wd l="7123" t="4594" r="7627" b="4781">loud’,</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="7714" t="4594" r="8141" b="4752">lmao</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="8242" t="4594" r="8774" b="4795">‘laugh</wd>

<space/>

<wd l="8842" t="4646" r="9120" b="4795">my</wd>

<space/>

<wd l="9197" t="4646" r="9451" b="4752">ass</wd>

<space/>

<wd l="9533" t="4594" r="9840" b="4752">off’</wd>

<space/>

<wd l="9936" t="4594" r="10248" b="4752">and</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="10320" t="4646" r="10517" b="4752">ur</wd>

<space/>

</run>

</ln>

<ln l="6168" t="4862" r="10512" b="5064" baseLine="5016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6168" t="4867" r="6734" b="5064">‘your’,</wd>

<space/>

<wd l="6826" t="4862" r="7085" b="5021">for</wd>

<space/>

<wd l="7157" t="4862" r="7934" b="5064">example.</wd>

<space/>

<wd l="8069" t="4862" r="8827" b="5021">Whereas</wd>

<space/>

<wd l="8909" t="4862" r="9173" b="5021">the</wd>

<space/>

<wd l="9250" t="4886" r="9677" b="5021">most</wd>

<space/>

<wd l="9754" t="4915" r="10512" b="5021">common</wd>

<space/>

</ln>

<ln l="6149" t="5136" r="10498" b="5338" baseLine="5285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6149" t="5141" r="6686" b="5294">OOVs</wd>

<space/>

<wd l="6739" t="5136" r="6907" b="5290">in</wd>

<space/>

<wd l="6955" t="5136" r="7354" b="5294">Irish</wd>

<space/>

<wd l="7406" t="5189" r="7666" b="5294">are</wd>

<space/>

<wd l="7714" t="5136" r="8381" b="5338">English</wd>

<space/>

<wd l="8424" t="5136" r="8947" b="5294">words</wd>

<space/>

<wd l="9010" t="5136" r="9403" b="5294">such</wd>

<space/>

<wd l="9451" t="5189" r="9619" b="5294">as</wd>

<space/>

<wd l="9701" t="5141" r="10032" b="5323">‘to’,</wd>

<space/>

<wd l="10118" t="5141" r="10498" b="5323">‘on’,</wd>

<space/>

</ln>

<ln l="6168" t="5405" r="10502" b="5606" baseLine="5558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6168" t="5405" r="6590" b="5592">‘for’,</wd>

<space/>

<wd l="6686" t="5410" r="7118" b="5592">‘me’,</wd>

<space/>

<wd l="7195" t="5405" r="7507" b="5563">and</wd>

<space/>

<wd l="7565" t="5405" r="8088" b="5563">words</wd>

<space/>

<wd l="8160" t="5405" r="9096" b="5606">misspelled</wd>

<space/>

<wd l="9154" t="5405" r="9821" b="5563">without</wd>

<space/>

<wd l="9888" t="5405" r="10502" b="5563">diacrit-</wd>

</ln>

<ln l="6144" t="5678" r="10502" b="5837" baseLine="5827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5678" r="6432" b="5837">ics.</wd>

<space/>

<wd l="6614" t="5678" r="6994" b="5837">This</wd>

<space/>

<wd l="7094" t="5678" r="8107" b="5837">observation</wd>

<space/>

<wd l="8203" t="5678" r="8726" b="5837">shows</wd>

<space/>

<wd l="8822" t="5678" r="9091" b="5837">the</wd>

<space/>

<wd l="9182" t="5678" r="10133" b="5837">differences</wd>

<space/>

<wd l="10234" t="5678" r="10502" b="5837">be-</wd>

</ln>

<ln l="6144" t="5947" r="10507" b="6149" baseLine="6101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="5971" r="6667" b="6106">tween</wd>

<space/>

<wd l="6739" t="5947" r="7330" b="6106">textual</wd>

<space/>

<wd l="7411" t="5947" r="8318" b="6149">challenges</wd>

<space/>

<wd l="8405" t="5947" r="8597" b="6106">of</wd>

<space/>

<wd l="8654" t="5947" r="9586" b="6149">processing</wd>

<space/>

<wd l="9662" t="5947" r="10109" b="6106">these</wd>

<space/>

<wd l="10186" t="5971" r="10507" b="6106">two</wd>

<space/>

</ln>

<ln l="6144" t="6221" r="10517" b="6422" baseLine="6370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="6221" r="7061" b="6422">languages.</wd>

<space/>

<wd l="7200" t="6226" r="7334" b="6379">It</wd>

<space/>

<wd l="7406" t="6274" r="7781" b="6422">may</wd>

<space/>

<wd l="7862" t="6221" r="8203" b="6379">also</wd>

<space/>

<wd l="8290" t="6245" r="8938" b="6422">suggest</wd>

<space/>

<wd l="9010" t="6221" r="9341" b="6379">that</wd>

<space/>

<wd l="9413" t="6221" r="9811" b="6379">Irish</wd>

<space/>

<wd l="9888" t="6221" r="10517" b="6379">Twitter</wd>

<space/>

</ln>

<ln l="6144" t="6490" r="10507" b="6691" baseLine="6643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="6514" r="6470" b="6648">text</wd>

<space/>

<wd l="6523" t="6542" r="6898" b="6691">may</wd>

<space/>

<wd l="6950" t="6490" r="7512" b="6648">follow</wd>

<space/>

<wd l="7574" t="6542" r="7670" b="6648">a</wd>

<space/>

<wd l="7723" t="6542" r="8170" b="6648">more</wd>

<space/>

<wd l="8232" t="6490" r="8962" b="6648">standard</wd>

<space/>

<wd l="9019" t="6490" r="10080" b="6691">orthography</wd>

<space/>

<wd l="10138" t="6490" r="10507" b="6648">than</wd>

<space/>

</ln>

<ln l="6144" t="6763" r="10502" b="6965" baseLine="6912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="6763" r="6816" b="6965">English</wd>

<space/>

<wd l="6864" t="6763" r="7493" b="6922">Twitter</wd>

<space/>

<wd l="7536" t="6787" r="7901" b="6950">text,</wd>

<space/>

<wd l="7968" t="6763" r="8280" b="6922">and</wd>

<space/>

<wd l="8328" t="6763" r="8659" b="6922">will</wd>

<space/>

<wd l="8717" t="6763" r="9187" b="6922">make</wd>

<space/>

<wd l="9235" t="6763" r="9494" b="6922">for</wd>

<space/>

<wd l="9547" t="6816" r="9744" b="6922">an</wd>

<space/>

<wd l="9797" t="6763" r="10502" b="6922">interest-</wd>

</ln>

<ln l="6144" t="7032" r="10085" b="7234" baseLine="7181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="6144" t="7032" r="6422" b="7234">ing</wd>

<space/>

<wd l="6480" t="7032" r="6998" b="7190">future</wd>

<space/>

<wd l="7061" t="7032" r="8179" b="7234">cross-lingual</wd>

<space/>

<wd l="8246" t="7032" r="8707" b="7234">study</wd>

<space/>

<wd l="8770" t="7032" r="8957" b="7190">of</wd>

<space/>

<wd l="9000" t="7032" r="9629" b="7190">Twitter</wd>

<space/>

<wd l="9686" t="7032" r="10085" b="7190">data.</wd>

</ln>

</para>

<para l="6144" t="7325" r="10526" b="13214" alignment="justified" spaceBefore="23" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="6365" t="7325" r="10502" b="7526" baseLine="7474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6365" t="7325" r="7013" b="7526">Finally,</wd>

<space/>

<wd l="7138" t="7378" r="7387" b="7483">we</wd>

<space/>

<wd l="7498" t="7325" r="8251" b="7526">explored</wd>

<space/>

<wd l="8352" t="7325" r="8621" b="7483">the</wd>

<space/>

<wd l="8722" t="7325" r="9629" b="7526">possibility</wd>

<space/>

<wd l="9739" t="7325" r="9926" b="7483">of</wd>

<space/>

<wd l="10018" t="7325" r="10502" b="7483">lever-</wd>

</ln>

<ln l="6149" t="7594" r="10507" b="7795" baseLine="7742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="7594" r="6629" b="7795">aging</wd>

<space/>

<wd l="6720" t="7594" r="7147" b="7752">from</wd>

<space/>

<wd l="7238" t="7594" r="7920" b="7795">existing</wd>

<space/>

<wd l="8011" t="7594" r="9067" b="7795">POS-tagged</wd>

<space/>

<wd l="9158" t="7594" r="9523" b="7752">data</wd>

<space/>

<wd l="9610" t="7594" r="9826" b="7795">by</wd>

<space/>

<wd l="9922" t="7594" r="10507" b="7795">adding</wd>

<space/>

</ln>

<ln l="6149" t="7858" r="10507" b="8064" baseLine="8016">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6149" t="7886" r="6648" b="8021">NCTT</wd>

<space/>

<wd l="6768" t="7877" r="7253" b="8021">3198</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="7450" t="7886" r="7618" b="8021">to</wd>

<space/>

<wd l="7805" t="7915" r="8098" b="8021">our</wd>

<space/>

<wd l="8270" t="7862" r="8626" b="8021">best</wd>

<space/>

<wd l="8803" t="7862" r="9782" b="8064">performing</wd>

<space/>

<wd l="9965" t="7862" r="10507" b="8021">model</wd>

<space/>

</run>

</ln>

<ln l="6144" t="8136" r="10512" b="8338" baseLine="8285">

<wd l="6144" t="8146" r="7891" b="8304"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">ArkLemma#URL@</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="7987" t="8141" r="8270" b="8294">We</wd>

<space/>

<wd l="8338" t="8136" r="8678" b="8294">also</wd>

<space/>

<wd l="8746" t="8136" r="9653" b="8338">duplicated</wd>

<space/>

<wd l="9710" t="8136" r="9979" b="8294">the</wd>

<space/>

<wd l="10037" t="8160" r="10512" b="8294">tweet</wd>

<space/>

</run>

</ln>

<ln l="6144" t="8405" r="10502" b="8606" baseLine="8558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="8405" r="6821" b="8606">training</wd>

<space/>

<wd l="6926" t="8429" r="7162" b="8563">set</wd>

<space/>

<wd l="7253" t="8429" r="7416" b="8563">to</wd>

<space/>

<wd l="7517" t="8405" r="7973" b="8606">bring</wd>

<space/>

<wd l="8069" t="8405" r="8333" b="8563">the</wd>

<space/>

<wd l="8429" t="8405" r="9298" b="8606">weighting</wd>

<space/>

<wd l="9394" t="8405" r="9653" b="8563">for</wd>

<space/>

<wd l="9739" t="8405" r="10128" b="8563">both</wd>

<space/>

<wd l="10224" t="8405" r="10502" b="8563">do-</wd>

</ln>

<ln l="6144" t="8678" r="10512" b="8880" baseLine="8827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="8678" r="6658" b="8837">mains</wd>

<space/>

<wd l="6749" t="8678" r="7085" b="8837">into</wd>

<space/>

<wd l="7171" t="8678" r="7877" b="8837">balance.</wd>

<space/>

<wd l="8040" t="8678" r="8419" b="8837">This</wd>

<space/>

<wd l="8510" t="8678" r="9048" b="8880">brings</wd>

<space/>

<wd l="9139" t="8731" r="9432" b="8837">our</wd>

<space/>

<wd l="9509" t="8678" r="10186" b="8880">training</wd>

<space/>

<wd l="10277" t="8702" r="10512" b="8837">set</wd>

<space/>

</ln>

<ln l="6154" t="8947" r="10512" b="9144" baseLine="9101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="8947" r="6485" b="9106">size</wd>

<space/>

<wd l="6552" t="8971" r="6720" b="9106">to</wd>

<space/>

<wd l="6797" t="8947" r="7224" b="9106">5682</wd>

<space/>

<wd l="7306" t="8952" r="8064" b="9144">(117,273</wd>

<space/>

<wd l="8146" t="8947" r="8827" b="9144">tokens).</wd>

<space/>

<wd l="8947" t="8952" r="9768" b="9134">However,</wd>

<space/>

<wd l="9850" t="9000" r="10104" b="9106">we</wd>

<space/>

<wd l="10176" t="8947" r="10512" b="9106">find</wd>

<space/>

</ln>

<ln l="6144" t="9221" r="10512" b="9422" baseLine="9370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="9221" r="6475" b="9379">that</wd>

<space/>

<wd l="6557" t="9274" r="6653" b="9379">a</wd>

<space/>

<wd l="6734" t="9221" r="7637" b="9422">significant</wd>

<space/>

<wd l="7714" t="9221" r="8424" b="9379">increase</wd>

<space/>

<wd l="8506" t="9221" r="8674" b="9374">in</wd>

<space/>

<wd l="8750" t="9221" r="9019" b="9379">the</wd>

<space/>

<wd l="9096" t="9221" r="9773" b="9422">training</wd>

<space/>

<wd l="9859" t="9245" r="10094" b="9379">set</wd>

<space/>

<wd l="10181" t="9221" r="10512" b="9379">size</wd>

<space/>

</ln>

<ln l="6149" t="9490" r="10502" b="9691" baseLine="9643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="9490" r="6528" b="9691">only</wd>

<space/>

<wd l="6586" t="9490" r="7147" b="9648">results</wd>

<space/>

<wd l="7210" t="9490" r="7382" b="9643">in</wd>

<space/>

<wd l="7411" t="9490" r="7747" b="9691">just</wd>

<space/>

<wd l="7805" t="9542" r="8184" b="9648">over</wd>

<space/>

<wd l="8237" t="9542" r="8333" b="9648">a</wd>

<space/>

<wd l="8410" t="9494" r="8472" b="9643">1</wd>

<space/>

<wd l="8544" t="9490" r="8995" b="9691">point</wd>

<space/>

<wd l="9048" t="9490" r="9763" b="9648">increase</wd>

<space/>

<wd l="9816" t="9490" r="9989" b="9643">in</wd>

<space/>

<wd l="10037" t="9494" r="10502" b="9648">POS-</wd>

</ln>

<ln l="6144" t="9763" r="10512" b="9965" baseLine="9912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="9763" r="6797" b="9965">tagging</wd>

<space/>

<wd l="6878" t="9816" r="7675" b="9965">accuracy.</wd>

<space/>

<wd l="7819" t="9768" r="8040" b="9922">At</wd>

<space/>

<wd l="8117" t="9816" r="8213" b="9922">a</wd>

<space/>

<wd l="8290" t="9763" r="8894" b="9965">glance,</wd>

<space/>

<wd l="8990" t="9816" r="9240" b="9922">we</wd>

<space/>

<wd l="9322" t="9816" r="9619" b="9922">can</wd>

<space/>

<wd l="9706" t="9816" r="9974" b="9922">see</wd>

<space/>

<wd l="10061" t="9816" r="10512" b="9922">some</wd>

<space/>

</ln>

<ln l="6149" t="10032" r="10517" b="10190" baseLine="10186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="10032" r="6826" b="10190">obvious</wd>

<space/>

<wd l="6922" t="10085" r="7421" b="10190">errors</wd>

<space/>

<wd l="7512" t="10032" r="7781" b="10190">the</wd>

<space/>

<wd l="7867" t="10032" r="8726" b="10190">combined</wd>

<space/>

<wd l="8813" t="10032" r="9355" b="10190">model</wd>

<space/>

<wd l="9442" t="10032" r="10042" b="10190">makes.</wd>

<space/>

<wd l="10210" t="10037" r="10517" b="10190">For</wd>

<space/>

</ln>

<ln l="6149" t="10306" r="10512" b="10507" baseLine="10454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="10306" r="6926" b="10507">example,</wd>

<space/>

<wd l="6979" t="10306" r="7416" b="10464">there</wd>

<space/>

<wd l="7459" t="10306" r="7594" b="10464">is</wd>

<space/>

<wd l="7651" t="10306" r="8506" b="10464">confusion</wd>

<space/>

<wd l="8549" t="10306" r="9019" b="10464">when</wd>

<space/>

<wd l="9062" t="10306" r="9710" b="10507">tagging</wd>

<space/>

<wd l="9758" t="10306" r="10022" b="10464">the</wd>

<space/>

<wd l="10066" t="10306" r="10512" b="10464">word</wd>

<space/>

</ln>

<ln l="6144" t="10574" r="10512" b="10733" baseLine="10723">

<wd l="6144" t="10627" r="6408" b="10733"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">an</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="6509" t="10574" r="6888" b="10733">This</wd>

<space/>

<wd l="6955" t="10574" r="7406" b="10733">word</wd>

<space/>

<wd l="7464" t="10574" r="8270" b="10733">functions</wd>

<space/>

<wd l="8342" t="10627" r="8510" b="10733">as</wd>

<space/>

<wd l="8582" t="10574" r="8971" b="10733">both</wd>

<space/>

<wd l="9034" t="10627" r="9130" b="10733">a</wd>

<space/>

<wd l="9192" t="10574" r="10138" b="10733">determiner</wd>

<space/>

<wd l="10200" t="10574" r="10512" b="10733">and</wd>

<space/>

</run>

</ln>

<ln l="6149" t="10843" r="10512" b="11045" baseLine="10997" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="10896" r="6350" b="11002">an</wd>

<space/>

<wd l="6427" t="10843" r="7531" b="11045">interrogative</wd>

<space/>

<wd l="7608" t="10843" r="7987" b="11002">verb</wd>

<space/>

<wd l="8064" t="10843" r="8765" b="11045">particle.</wd>

<space/>

<wd l="8904" t="10843" r="9245" b="11002">The</wd>

<space/>

<wd l="9317" t="10843" r="9682" b="11002">lack</wd>

<space/>

<wd l="9763" t="10843" r="9955" b="11002">of</wd>

<space/>

<wd l="10018" t="10843" r="10512" b="11002">direct</wd>

<space/>

</ln>

<ln l="6149" t="11117" r="10502" b="11318" baseLine="11266" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="11117" r="6960" b="11318">questions</wd>

<space/>

<wd l="7042" t="11117" r="7214" b="11270">in</wd>

<space/>

<wd l="7282" t="11117" r="7550" b="11275">the</wd>

<space/>

<wd l="7622" t="11122" r="8069" b="11275">NCII</wd>

<space/>

<wd l="8146" t="11170" r="8717" b="11318">corpus</wd>

<space/>

<wd l="8794" t="11117" r="9355" b="11275">results</wd>

<space/>

<wd l="9437" t="11117" r="9605" b="11270">in</wd>

<space/>

<wd l="9682" t="11170" r="9778" b="11275">a</wd>

<space/>

<wd l="9845" t="11117" r="10190" b="11275">bias</wd>

<space/>

<wd l="10267" t="11141" r="10502" b="11275">to-</wd>

</ln>

<ln l="6144" t="11386" r="10507" b="11587" baseLine="11539">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="6144" t="11386" r="6658" b="11544">wards</wd>

<space/>

<wd l="6744" t="11386" r="7008" b="11544">the</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="7090" t="11414" r="7200" b="11539">D</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="7301" t="11386" r="8376" b="11582">(determiner)</wd>

<space/>

<wd l="8462" t="11410" r="8770" b="11587">tag.</wd>

<space/>

<wd l="8918" t="11390" r="9101" b="11539">In</wd>

<space/>

<wd l="9182" t="11386" r="9936" b="11573">addition,</wd>

<space/>

<wd l="10027" t="11438" r="10507" b="11587">many</wd>

<space/>

</run>

</ln>

<ln l="6144" t="11659" r="10517" b="11861" baseLine="11808" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="11659" r="6811" b="11818">internal</wd>

<space/>

<wd l="6874" t="11659" r="7805" b="11861">capitalised</wd>

<space/>

<wd l="7862" t="11659" r="8386" b="11818">words</wd>

<space/>

<wd l="8462" t="11664" r="8827" b="11861">(e.g.</wd>

<space/>

<wd l="8918" t="11659" r="9187" b="11818">the</wd>

<space/>

<wd l="9245" t="11659" r="10114" b="11861">beginning</wd>

<space/>

<wd l="10181" t="11659" r="10368" b="11818">of</wd>

<space/>

<wd l="10421" t="11712" r="10517" b="11818">a</wd>

<space/>

</ln>

<ln l="6154" t="11928" r="10517" b="12130" baseLine="12082" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="11928" r="6754" b="12086">second</wd>

<space/>

<wd l="6821" t="11957" r="7166" b="12130">part</wd>

<space/>

<wd l="7238" t="11928" r="7430" b="12086">of</wd>

<space/>

<wd l="7493" t="11981" r="7589" b="12086">a</wd>

<space/>

<wd l="7656" t="11933" r="8189" b="12125">tweet)</wd>

<space/>

<wd l="8275" t="11981" r="8539" b="12086">are</wd>

<space/>

<wd l="8611" t="11928" r="9619" b="12086">mislabelled</wd>

<space/>

<wd l="9691" t="11981" r="9864" b="12086">as</wd>

<space/>

<wd l="9941" t="11981" r="10517" b="12130">proper</wd>

<space/>

</ln>

<ln l="6144" t="12202" r="10526" b="12403" baseLine="12350" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="12254" r="6710" b="12360">nouns.</wd>

<space/>

<wd l="6792" t="12202" r="7176" b="12360">This</wd>

<space/>

<wd l="7238" t="12202" r="7378" b="12360">is</wd>

<space/>

<wd l="7445" t="12254" r="7541" b="12360">a</wd>

<space/>

<wd l="7594" t="12202" r="8078" b="12360">result</wd>

<space/>

<wd l="8141" t="12202" r="8328" b="12360">of</wd>

<space/>

<wd l="8371" t="12202" r="8640" b="12360">the</wd>

<space/>

<wd l="8702" t="12202" r="9451" b="12403">differing</wd>

<space/>

<wd l="9518" t="12226" r="10272" b="12360">structure</wd>

<space/>

<wd l="10334" t="12202" r="10526" b="12360">of</wd>

<space/>

</ln>

<ln l="6144" t="12470" r="10517" b="12672" baseLine="12624" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="12470" r="6413" b="12629">the</wd>

<space/>

<wd l="6470" t="12494" r="6792" b="12629">two</wd>

<space/>

<wd l="6859" t="12470" r="7224" b="12629">data</wd>

<space/>

<wd l="7286" t="12494" r="7598" b="12629">sets</wd>

<space/>

<wd l="7661" t="12566" r="7771" b="12581">–</wd>

<space/>

<wd l="7834" t="12470" r="8232" b="12629">each</wd>

<space/>

<wd l="8290" t="12494" r="8765" b="12629">tweet</wd>

<space/>

<wd l="8822" t="12523" r="9192" b="12672">may</wd>

<space/>

<wd l="9259" t="12470" r="9898" b="12629">contain</wd>

<space/>

<wd l="9960" t="12523" r="10272" b="12629">one</wd>

<space/>

<wd l="10334" t="12523" r="10517" b="12629">or</wd>

<space/>

</ln>

<ln l="6144" t="12744" r="10512" b="12946" baseLine="12893" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="12797" r="6595" b="12902">more</wd>

<space/>

<wd l="6653" t="12744" r="7301" b="12946">phrases</wd>

<space/>

<wd l="7368" t="12797" r="7550" b="12902">or</wd>

<space/>

<wd l="7618" t="12768" r="8486" b="12931">sentences,</wd>

<space/>

<wd l="8554" t="12744" r="9038" b="12902">while</wd>

<space/>

<wd l="9101" t="12744" r="9365" b="12902">the</wd>

<space/>

<wd l="9422" t="12749" r="9874" b="12902">NCII</wd>

<space/>

<wd l="9931" t="12744" r="10070" b="12902">is</wd>

<space/>

<wd l="10142" t="12744" r="10512" b="12946">split</wd>

<space/>

</ln>

<ln l="6144" t="13013" r="7997" b="13214" baseLine="13166" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="13013" r="6480" b="13171">into</wd>

<space/>

<wd l="6547" t="13013" r="7061" b="13214">single</wd>

<space/>

<wd l="7123" t="13037" r="7997" b="13171">sentences.</wd>

</ln>

</para>

<para l="6149" t="13541" r="7843" b="13714" alignment="left" spaceBefore="275" lsp="exactly" lspExact="273" language="en">

<ln l="6149" t="13541" r="7843" b="13714" baseLine="13709" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="10">

<wd l="6149" t="13541" r="6259" b="13714">6</wd>

<space/>

<wd l="6504" t="13546" r="7205" b="13714">Future</wd>

<space/>

<wd l="7262" t="13546" r="7843" b="13714">Work</wd>

</ln>

</para>

<para l="6144" t="14021" r="10517" b="15264" alignment="justified" spaceBefore="190" lsp="exactly" lspExact="269" language="en">

<ln l="6144" t="14021" r="10512" b="14222" baseLine="14174" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="14021" r="6840" b="14179">Limited</wd>

<space/>

<wd l="6898" t="14074" r="7714" b="14179">resources</wd>

<space/>

<wd l="7786" t="14021" r="8098" b="14179">and</wd>

<space/>

<wd l="8160" t="14021" r="8544" b="14179">time</wd>

<space/>

<wd l="8606" t="14021" r="9461" b="14222">prevented</wd>

<space/>

<wd l="9523" t="14021" r="10512" b="14222">exploration</wd>

<space/>

</ln>

<ln l="6149" t="14294" r="10507" b="14496" baseLine="14443" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6149" t="14294" r="6341" b="14453">of</wd>

<space/>

<wd l="6422" t="14347" r="6869" b="14453">some</wd>

<space/>

<wd l="6960" t="14294" r="7589" b="14496">options</wd>

<space/>

<wd l="7680" t="14294" r="7939" b="14453">for</wd>

<space/>

<wd l="8021" t="14294" r="8923" b="14496">improving</wd>

<space/>

<wd l="9014" t="14347" r="9302" b="14453">our</wd>

<space/>

<wd l="9384" t="14294" r="10507" b="14496">POS-tagging</wd>

<space/>

</ln>

<ln l="6144" t="14563" r="10512" b="14765" baseLine="14717" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6144" t="14563" r="6758" b="14722">results.</wd>

<space/>

<wd l="6840" t="14568" r="7195" b="14722">One</wd>

<space/>

<wd l="7243" t="14563" r="7435" b="14722">of</wd>

<space/>

<wd l="7459" t="14563" r="7910" b="14722">these</wd>

<space/>

<wd l="7958" t="14563" r="8587" b="14765">options</wd>

<space/>

<wd l="8635" t="14563" r="8774" b="14722">is</wd>

<space/>

<wd l="8822" t="14587" r="8990" b="14722">to</wd>

<space/>

<wd l="9034" t="14563" r="9662" b="14765">modify</wd>

<space/>

<wd l="9706" t="14563" r="9970" b="14722">the</wd>

<space/>

<wd l="10018" t="14568" r="10512" b="14722">CMU</wd>

<space/>

</ln>

<ln l="6154" t="14837" r="10502" b="15038" baseLine="14986" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="14837" r="6946" b="15038">(English)</wd>

<space/>

<wd l="7042" t="14837" r="7670" b="14995">Twitter</wd>

<space/>

<wd l="7747" t="14842" r="8770" b="15038">POS-tagger</wd>

<space/>

<wd l="8851" t="14861" r="9014" b="14995">to</wd>

<space/>

<wd l="9106" t="14837" r="9576" b="14995">allow</wd>

<space/>

<wd l="9662" t="14837" r="9922" b="14995">for</wd>

<space/>

<wd l="10003" t="14837" r="10502" b="14995">inclu-</wd>

</ln>

<ln l="6154" t="15106" r="10517" b="15264" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="6154" t="15106" r="6509" b="15264">sion</wd>

<space/>

<wd l="6586" t="15106" r="6778" b="15264">of</wd>

<space/>

<wd l="6835" t="15106" r="7430" b="15264">lemma</wd>

<space/>

<wd l="7498" t="15106" r="8530" b="15264">information</wd>

<space/>

<wd l="8602" t="15158" r="8774" b="15264">as</wd>

<space/>

<wd l="8856" t="15158" r="8952" b="15264">a</wd>

<space/>

<wd l="9019" t="15106" r="9667" b="15264">feature.</wd>

<space/>

<wd l="9797" t="15106" r="10517" b="15264">Another</wd>

</ln>

</para>

</column>

</section>

<dd l="1433" t="15736" r="10531" b="15977">

<para l="5862" t="15787" r="6095" b="15946" alignment="centered" spaceBefore="4" lsp="exactly" lspExact="229" language="en">

<ln l="5928" t="15787" r="6029" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="0">

<wd l="5928" t="15787" r="6029" b="15946">6</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4301.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1430" marginTop="1261" marginRight="1381" marginBottom="1312" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1430" t="1261" r="10528" b="15315">

<column l="1430" t="1261" r="5817" b="15315">

<para l="1440" t="1320" r="5803" b="2606" alignment="justified" lsp="exactly" lspExact="271" language="en">

<ln l="1445" t="1320" r="5794" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="1320" r="2040" b="1522">option,</wd>

<space/>

<wd l="2126" t="1320" r="2602" b="1478">when</wd>

<space/>

<wd l="2669" t="1320" r="3101" b="1478">there</wd>

<space/>

<wd l="3173" t="1320" r="3312" b="1478">is</wd>

<space/>

<wd l="3389" t="1373" r="3835" b="1478">more</wd>

<space/>

<wd l="3907" t="1320" r="4819" b="1478">unlabelled</wd>

<space/>

<wd l="4891" t="1320" r="5251" b="1478">data</wd>

<space/>

<wd l="5323" t="1320" r="5794" b="1478">avail-</wd>

</ln>

<ln l="1445" t="1594" r="5803" b="1790" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="1594" r="1805" b="1752">able</wd>

<space/>

<wd l="1886" t="1594" r="2208" b="1790">(i.e.</wd>

<space/>

<wd l="2347" t="1646" r="2798" b="1752">more</wd>

<space/>

<wd l="2875" t="1594" r="3274" b="1752">Irish</wd>

<space/>

<wd l="3350" t="1618" r="3898" b="1752">tweets</wd>

<space/>

<wd l="3989" t="1594" r="4642" b="1790">online),</wd>

<space/>

<wd l="4738" t="1594" r="5280" b="1752">would</wd>

<space/>

<wd l="5352" t="1594" r="5558" b="1752">be</wd>

<space/>

<wd l="5635" t="1618" r="5803" b="1752">to</wd>

<space/>

</ln>

<ln l="1440" t="1862" r="5803" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1862" r="2083" b="2021">include</wd>

<space/>

<wd l="2150" t="1862" r="2554" b="2021">Irish</wd>

<space/>

<wd l="2621" t="1862" r="3072" b="2021">word</wd>

<space/>

<wd l="3144" t="1862" r="3725" b="2021">cluster</wd>

<space/>

<wd l="3792" t="1862" r="4474" b="2021">features</wd>

<space/>

<wd l="4550" t="1862" r="4723" b="2016">in</wd>

<space/>

<wd l="4790" t="1862" r="5054" b="2021">the</wd>

<space/>

<wd l="5126" t="1862" r="5803" b="2064">training</wd>

<space/>

</ln>

<ln l="1440" t="2136" r="5794" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2136" r="2030" b="2294">model.</wd>

<space/>

<wd l="2131" t="2136" r="2510" b="2294">This</wd>

<space/>

<wd l="2582" t="2136" r="3379" b="2338">approach</wd>

<space/>

<wd l="3442" t="2136" r="3720" b="2294">has</wd>

<space/>

<wd l="3797" t="2136" r="4142" b="2294">also</wd>

<space/>

<wd l="4205" t="2136" r="4618" b="2294">been</wd>

<space/>

<wd l="4680" t="2136" r="5150" b="2294">taken</wd>

<space/>

<wd l="5213" t="2136" r="5424" b="2338">by</wd>

<space/>

<wd l="5491" t="2141" r="5794" b="2294">Re-</wd>

</ln>

<ln l="1440" t="2405" r="5448" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="2405" r="1925" b="2563">hbein</wd>

<space/>

<wd l="1987" t="2410" r="2549" b="2602">(2013)</wd>

<space/>

<wd l="2616" t="2405" r="2875" b="2563">for</wd>

<space/>

<wd l="2923" t="2410" r="3312" b="2563">POS</wd>

<space/>

<wd l="3379" t="2405" r="4032" b="2606">tagging</wd>

<space/>

<wd l="4094" t="2410" r="4790" b="2563">German</wd>

<space/>

<wd l="4848" t="2429" r="5448" b="2563">tweets.</wd>

</ln>

</para>

<para l="1440" t="2678" r="5808" b="5318" alignment="justified" spaceBefore="2" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="2678" r="5803" b="2880" baseLine="2832" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="2678" r="1997" b="2837">The</wd>

<space/>

<wd l="2098" t="2731" r="2914" b="2837">resources</wd>

<space/>

<wd l="3019" t="2731" r="3274" b="2837">we</wd>

<space/>

<wd l="3374" t="2678" r="4037" b="2880">provide</wd>

<space/>

<wd l="4138" t="2678" r="4819" b="2880">through</wd>

<space/>

<wd l="4915" t="2678" r="5222" b="2837">this</wd>

<space/>

<wd l="5342" t="2678" r="5803" b="2880">study</wd>

<space/>

</ln>

<ln l="1445" t="2952" r="5794" b="3110" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="3005" r="1704" b="3110">are</wd>

<space/>

<wd l="1776" t="3005" r="1872" b="3110">a</wd>

<space/>

<wd l="1930" t="2952" r="2664" b="3110">valuable</wd>

<space/>

<wd l="2731" t="2952" r="3792" b="3110">contribution</wd>

<space/>

<wd l="3854" t="2976" r="4022" b="3110">to</wd>

<space/>

<wd l="4090" t="2952" r="4354" b="3110">the</wd>

<space/>

<wd l="4416" t="2952" r="4819" b="3110">Irish</wd>

<space/>

<wd l="4882" t="2957" r="5294" b="3110">NLP</wd>

<space/>

<wd l="5362" t="3005" r="5794" b="3110">com-</wd>

</ln>

<ln l="1440" t="3221" r="5794" b="3422" baseLine="3370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="3221" r="2088" b="3422">munity.</wd>

<space/>

<wd l="2232" t="3221" r="2832" b="3422">Firstly,</wd>

<space/>

<wd l="2923" t="3274" r="3178" b="3379">we</wd>

<space/>

<wd l="3259" t="3245" r="3821" b="3422">expect</wd>

<space/>

<wd l="3893" t="3221" r="4224" b="3379">that</wd>

<space/>

<wd l="4301" t="3221" r="4608" b="3379">this</wd>

<space/>

<wd l="4690" t="3274" r="5045" b="3379">new</wd>

<space/>

<wd l="5126" t="3221" r="5491" b="3379">data</wd>

<space/>

<wd l="5563" t="3274" r="5794" b="3379">re-</wd>

</ln>

<ln l="1450" t="3490" r="5794" b="3691" baseLine="3643" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="3542" r="2006" b="3648">source</wd>

<space/>

<wd l="2088" t="3490" r="2419" b="3686">(the</wd>

<space/>

<wd l="2491" t="3490" r="3542" b="3691">POS-tagged</wd>

<space/>

<wd l="3614" t="3490" r="4243" b="3648">Twitter</wd>

<space/>

<wd l="4315" t="3494" r="4954" b="3691">corpus)</wd>

<space/>

<wd l="5030" t="3490" r="5371" b="3648">will</wd>

<space/>

<wd l="5443" t="3542" r="5794" b="3691">pro-</wd>

</ln>

<ln l="1440" t="3763" r="5798" b="3965" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="3763" r="1814" b="3922">vide</wd>

<space/>

<wd l="1877" t="3816" r="1973" b="3922">a</wd>

<space/>

<wd l="2030" t="3763" r="2448" b="3922">solid</wd>

<space/>

<wd l="2501" t="3763" r="2928" b="3922">basis</wd>

<space/>

<wd l="2990" t="3763" r="3250" b="3922">for</wd>

<space/>

<wd l="3298" t="3763" r="4104" b="3965">linguistic</wd>

<space/>

<wd l="4166" t="3763" r="4478" b="3922">and</wd>

<space/>

<wd l="4541" t="3763" r="5798" b="3965">sociolinguistic</wd>

<space/>

</ln>

<ln l="1450" t="4032" r="5798" b="4234" baseLine="4186" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="4032" r="1910" b="4234">study</wd>

<space/>

<wd l="2002" t="4032" r="2194" b="4190">of</wd>

<space/>

<wd l="2266" t="4032" r="2669" b="4190">Irish</wd>

<space/>

<wd l="2755" t="4085" r="2971" b="4190">on</wd>

<space/>

<wd l="3058" t="4085" r="3154" b="4190">a</wd>

<space/>

<wd l="3245" t="4032" r="3744" b="4190">social</wd>

<space/>

<wd l="3830" t="4032" r="4368" b="4190">media</wd>

<space/>

<wd l="4450" t="4032" r="5246" b="4234">platform.</wd>

<space/>

<wd l="5419" t="4032" r="5798" b="4190">This</wd>

<space/>

</ln>

<ln l="1440" t="4306" r="5808" b="4507" baseLine="4454" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="4358" r="1795" b="4464">new</wd>

<space/>

<wd l="1858" t="4306" r="2506" b="4464">domain</wd>

<space/>

<wd l="2563" t="4306" r="2755" b="4464">of</wd>

<space/>

<wd l="2794" t="4306" r="3192" b="4464">Irish</wd>

<space/>

<wd l="3245" t="4306" r="4032" b="4507">language</wd>

<space/>

<wd l="4085" t="4358" r="4373" b="4464">use</wd>

<space/>

<wd l="4435" t="4358" r="4728" b="4464">can</wd>

<space/>

<wd l="4786" t="4306" r="4987" b="4464">be</wd>

<space/>

<wd l="5045" t="4306" r="5808" b="4507">analysed</wd>

<space/>

</ln>

<ln l="1440" t="4574" r="5794" b="4776" baseLine="4728" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="4574" r="1613" b="4728">in</wd>

<space/>

<wd l="1670" t="4627" r="1867" b="4733">an</wd>

<space/>

<wd l="1930" t="4574" r="2746" b="4776">empirical</wd>

<space/>

<wd l="2808" t="4574" r="3120" b="4733">and</wd>

<space/>

<wd l="3182" t="4574" r="3955" b="4733">scientific</wd>

<space/>

<wd l="4018" t="4627" r="4675" b="4733">manner</wd>

<space/>

<wd l="4723" t="4574" r="5405" b="4776">through</wd>

<space/>

<wd l="5462" t="4627" r="5794" b="4733">cor-</wd>

</ln>

<ln l="1440" t="4848" r="5803" b="5050" baseLine="4997" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="4901" r="1733" b="5050">pus</wd>

<space/>

<wd l="1795" t="4848" r="2486" b="5050">analysis</wd>

<space/>

<wd l="2539" t="4848" r="2755" b="5050">by</wd>

<space/>

<wd l="2808" t="4901" r="3355" b="5006">means</wd>

<space/>

<wd l="3418" t="4848" r="3605" b="5006">of</wd>

<space/>

<wd l="3648" t="4901" r="3936" b="5006">our</wd>

<space/>

<wd l="3984" t="4848" r="4387" b="5006">data.</wd>

<space/>

<wd l="4464" t="4848" r="4800" b="5006">The</wd>

<space/>

<wd l="4853" t="4848" r="5482" b="5006">authors</wd>

<space/>

<wd l="5544" t="4901" r="5803" b="5006">are</wd>

<space/>

</ln>

<ln l="1445" t="5117" r="5582" b="5318" baseLine="5270" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="5117" r="2222" b="5318">currently</wd>

<space/>

<wd l="2280" t="5117" r="3005" b="5318">working</wd>

<space/>

<wd l="3062" t="5117" r="3739" b="5275">towards</wd>

<space/>

<wd l="3802" t="5117" r="4109" b="5275">this</wd>

<space/>

<wd l="4171" t="5117" r="5021" b="5318">follow-up</wd>

<space/>

<wd l="5088" t="5117" r="5582" b="5318">study.</wd>

</ln>

</para>

<para l="1440" t="5390" r="5808" b="7488" alignment="justified" spaceBefore="2" fli="216" lsp="exactly" lspExact="270" language="en">

<ln l="1656" t="5390" r="5794" b="5592" baseLine="5539" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1656" t="5395" r="2136" b="5549">From</wd>

<space/>

<wd l="2227" t="5443" r="2323" b="5549">a</wd>

<space/>

<wd l="2414" t="5390" r="3946" b="5592">tool-development</wd>

<space/>

<wd l="4042" t="5390" r="5069" b="5592">perspective,</wd>

<space/>

<wd l="5184" t="5443" r="5434" b="5549">we</wd>

<space/>

<wd l="5534" t="5443" r="5794" b="5549">ex-</wd>

</ln>

<ln l="1440" t="5664" r="5803" b="5866" baseLine="5813" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5688" r="1805" b="5866">pect</wd>

<space/>

<wd l="1930" t="5664" r="2237" b="5822">this</wd>

<space/>

<wd l="2376" t="5717" r="2942" b="5866">corpus</wd>

<space/>

<wd l="3082" t="5664" r="3394" b="5822">and</wd>

<space/>

<wd l="3514" t="5664" r="3782" b="5822">the</wd>

<space/>

<wd l="3912" t="5664" r="4555" b="5822">derived</wd>

<space/>

<wd l="4680" t="5664" r="5803" b="5866">POS-tagging</wd>

<space/>

</ln>

<ln l="1440" t="5933" r="5794" b="6134" baseLine="6082" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="5933" r="2064" b="6091">models</wd>

<space/>

<wd l="2141" t="5933" r="2621" b="6091">could</wd>

<space/>

<wd l="2688" t="5933" r="2894" b="6091">be</wd>

<space/>

<wd l="2962" t="5933" r="3360" b="6091">used</wd>

<space/>

<wd l="3427" t="5933" r="3595" b="6086">in</wd>

<space/>

<wd l="3667" t="5986" r="3763" b="6091">a</wd>

<space/>

<wd l="3830" t="5933" r="5462" b="6134">domain-adaptation</wd>

<space/>

<wd l="5530" t="5986" r="5794" b="6134">ap-</wd>

</ln>

<ln l="1440" t="6202" r="5808" b="6403" baseLine="6355" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="6202" r="2035" b="6403">proach</wd>

<space/>

<wd l="2093" t="6226" r="2256" b="6360">to</wd>

<space/>

<wd l="2318" t="6202" r="2957" b="6403">parsing</wd>

<space/>

<wd l="3019" t="6202" r="3418" b="6360">Irish</wd>

<space/>

<wd l="3475" t="6226" r="4075" b="6389">tweets,</wd>

<space/>

<wd l="4157" t="6202" r="4757" b="6360">similar</wd>

<space/>

<wd l="4810" t="6226" r="4973" b="6360">to</wd>

<space/>

<wd l="5035" t="6202" r="5299" b="6360">the</wd>

<space/>

<wd l="5362" t="6202" r="5808" b="6360">work</wd>

<space/>

</ln>

<ln l="1445" t="6475" r="5803" b="6677" baseLine="6624" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="6475" r="1637" b="6634">of</wd>

<space/>

<wd l="1670" t="6480" r="2141" b="6677">Kong</wd>

<space/>

<wd l="2194" t="6499" r="2347" b="6634">et</wd>

<space/>

<wd l="2395" t="6475" r="2592" b="6634">al.</wd>

<space/>

<wd l="2659" t="6480" r="3274" b="6672">(2014).</wd>

<space/>

<wd l="3350" t="6475" r="3730" b="6634">This</wd>

<space/>

<wd l="3782" t="6475" r="4325" b="6634">would</wd>

<space/>

<wd l="4373" t="6475" r="5006" b="6634">involve</wd>

<space/>

<wd l="5059" t="6475" r="5803" b="6677">adapting</wd>

<space/>

</ln>

<ln l="1440" t="6744" r="5803" b="6946" baseLine="6898" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="6749" r="1891" b="6946">Lynn</wd>

<space/>

<wd l="1987" t="6768" r="2141" b="6902">et</wd>

<space/>

<wd l="2237" t="6744" r="2434" b="6902">al.</wd>

<space/>

<wd l="2549" t="6749" r="3254" b="6941">(2012)’s</wd>

<space/>

<wd l="3355" t="6744" r="3758" b="6902">Irish</wd>

<space/>

<wd l="3859" t="6744" r="4670" b="6902">statistical</wd>

<space/>

<wd l="4771" t="6744" r="5803" b="6946">dependency</wd>

<space/>

</ln>

<ln l="1440" t="7018" r="5798" b="7219" baseLine="7166" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="7070" r="1978" b="7219">parser</wd>

<space/>

<wd l="2040" t="7018" r="2299" b="7176">for</wd>

<space/>

<wd l="2357" t="7070" r="2650" b="7176">use</wd>

<space/>

<wd l="2712" t="7018" r="3106" b="7176">with</wd>

<space/>

<wd l="3178" t="7018" r="3672" b="7176">social</wd>

<space/>

<wd l="3744" t="7018" r="4277" b="7176">media</wd>

<space/>

<wd l="4339" t="7042" r="4709" b="7176">text.</wd>

<space/>

<wd l="4824" t="7022" r="5165" b="7176">Our</wd>

<space/>

<wd l="5227" t="7070" r="5798" b="7219">corpus</wd>

<space/>

</ln>

<ln l="1445" t="7286" r="5794" b="7488" baseLine="7440" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1445" t="7286" r="1925" b="7445">could</wd>

<space/>

<wd l="1973" t="7286" r="2635" b="7488">provide</wd>

<space/>

<wd l="2678" t="7286" r="2947" b="7445">the</wd>

<space/>

<wd l="2995" t="7286" r="3422" b="7445">basis</wd>

<space/>

<wd l="3480" t="7286" r="3672" b="7445">of</wd>

<space/>

<wd l="3706" t="7339" r="3802" b="7445">a</wd>

<space/>

<wd l="3845" t="7286" r="4598" b="7445">treebank</wd>

<space/>

<wd l="4642" t="7286" r="4901" b="7445">for</wd>

<space/>

<wd l="4944" t="7286" r="5251" b="7445">this</wd>

<space/>

<wd l="5304" t="7286" r="5794" b="7445">work.</wd>

</ln>

</para>

<para l="1440" t="7560" r="5808" b="9931" alignment="justified" fli="216" lsp="exactly" lspExact="271" language="en">

<ln l="1656" t="7560" r="5794" b="7762" baseLine="7709" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1656" t="7560" r="2544" b="7762">Following</wd>

<space/>

<wd l="2602" t="7613" r="2890" b="7718">our</wd>

<space/>

<wd l="2938" t="7560" r="3773" b="7762">discovery</wd>

<space/>

<wd l="3830" t="7560" r="4018" b="7718">of</wd>

<space/>

<wd l="4051" t="7560" r="4320" b="7718">the</wd>

<space/>

<wd l="4373" t="7584" r="4901" b="7718">extent</wd>

<space/>

<wd l="4944" t="7560" r="5275" b="7718">that</wd>

<space/>

<wd l="5328" t="7560" r="5794" b="7718">code-</wd>

</ln>

<ln l="1450" t="7834" r="5803" b="8035" baseLine="7982" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1450" t="7834" r="2285" b="8035">switching</wd>

<space/>

<wd l="2342" t="7834" r="2482" b="7992">is</wd>

<space/>

<wd l="2539" t="7858" r="3173" b="8035">present</wd>

<space/>

<wd l="3230" t="7886" r="3518" b="7992">our</wd>

<space/>

<wd l="3566" t="7834" r="3970" b="7992">Irish</wd>

<space/>

<wd l="4022" t="7834" r="4651" b="7992">Twitter</wd>

<space/>

<wd l="4704" t="7834" r="5107" b="8021">data,</wd>

<space/>

<wd l="5170" t="7886" r="5424" b="7992">we</wd>

<space/>

<wd l="5477" t="7834" r="5803" b="7992">feel</wd>

<space/>

</ln>

<ln l="1440" t="8102" r="5794" b="8304" baseLine="8251" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8102" r="1958" b="8261">future</wd>

<space/>

<wd l="2021" t="8102" r="2611" b="8261">studies</wd>

<space/>

<wd l="2674" t="8155" r="2890" b="8261">on</wd>

<space/>

<wd l="2938" t="8102" r="3245" b="8261">this</wd>

<space/>

<wd l="3302" t="8102" r="4430" b="8304">phenomenon</wd>

<space/>

<wd l="4478" t="8102" r="5026" b="8261">would</wd>

<space/>

<wd l="5074" t="8102" r="5280" b="8261">be</wd>

<space/>

<wd l="5338" t="8102" r="5525" b="8261">of</wd>

<space/>

<wd l="5563" t="8102" r="5794" b="8256">in-</wd>

</ln>

<ln l="1440" t="8371" r="5803" b="8573" baseLine="8525" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="8395" r="1915" b="8530">terest</wd>

<space/>

<wd l="1987" t="8395" r="2155" b="8530">to</wd>

<space/>

<wd l="2232" t="8371" r="2861" b="8530">various</wd>

<space/>

<wd l="2942" t="8371" r="3672" b="8530">research</wd>

<space/>

<wd l="3749" t="8371" r="4670" b="8573">disciplines</wd>

<space/>

<wd l="4766" t="8376" r="5083" b="8573">(e.g</wd>

<space/>

<wd l="5170" t="8371" r="5803" b="8530">Solorio</wd>

<space/>

</ln>

<ln l="1445" t="8645" r="5794" b="8846" baseLine="8794" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="8669" r="1598" b="8803">et</wd>

<space/>

<wd l="1666" t="8645" r="1862" b="8803">al.</wd>

<space/>

<wd l="1949" t="8650" r="2635" b="8842">(2014)).</wd>

<space/>

<wd l="2741" t="8650" r="2928" b="8798">In</wd>

<space/>

<wd l="2995" t="8645" r="3451" b="8803">order</wd>

<space/>

<wd l="3514" t="8669" r="3682" b="8803">to</wd>

<space/>

<wd l="3754" t="8645" r="3960" b="8803">do</wd>

<space/>

<wd l="4027" t="8645" r="4402" b="8832">that,</wd>

<space/>

<wd l="4478" t="8698" r="4733" b="8803">we</wd>

<space/>

<wd l="4805" t="8669" r="5453" b="8846">suggest</wd>

<space/>

<wd l="5515" t="8698" r="5794" b="8846">up-</wd>

</ln>

<ln l="1445" t="8914" r="5808" b="9115" baseLine="9067" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="8914" r="1982" b="9115">dating</wd>

<space/>

<wd l="2059" t="8914" r="2323" b="9072">the</wd>

<space/>

<wd l="2405" t="8966" r="2971" b="9115">corpus</wd>

<space/>

<wd l="3053" t="8914" r="3442" b="9072">with</wd>

<space/>

<wd l="3518" t="8966" r="3614" b="9072">a</wd>

<space/>

<wd l="3691" t="8938" r="4397" b="9115">separate</wd>

<space/>

<wd l="4474" t="8938" r="4733" b="9115">tag</wd>

<space/>

<wd l="4810" t="8914" r="5069" b="9072">for</wd>

<space/>

<wd l="5141" t="8914" r="5808" b="9115">English</wd>

<space/>

</ln>

<ln l="1440" t="9187" r="5803" b="9389" baseLine="9336">

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1440" t="9187" r="2002" b="9346">tokens</wd>

<space/>

<wd l="2098" t="9187" r="2486" b="9384">(that</wd>

<space/>

<wd l="2563" t="9187" r="2755" b="9374">is,</wd>

<space/>

<wd l="2856" t="9240" r="2952" b="9346">a</wd>

<space/>

<wd l="3024" t="9211" r="3288" b="9389">tag</wd>

<space/>

<wd l="3374" t="9187" r="3826" b="9346">other</wd>

<space/>

<wd l="3898" t="9187" r="4272" b="9346">than</wd>

<space/>

</run>

<wd l="4363" t="9211" r="4526" b="9374"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="modern" fontPitch="fixed" spacing="-3">G</run>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="4618" t="9187" r="5150" b="9346">which</wd>

<space/>

<wd l="5227" t="9187" r="5366" b="9346">is</wd>

<space/>

<wd l="5458" t="9187" r="5803" b="9346">also</wd>

<space/>

</run>

</ln>

<ln l="1440" t="9456" r="5794" b="9653" baseLine="9610" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9456" r="1843" b="9614">used</wd>

<space/>

<wd l="1915" t="9456" r="2174" b="9614">for</wd>

<space/>

<wd l="2251" t="9456" r="3456" b="9643">abbreviations,</wd>

<space/>

<wd l="3547" t="9456" r="4013" b="9614">items</wd>

<space/>

<wd l="4104" t="9456" r="4416" b="9614">and</wd>

<space/>

<wd l="4488" t="9456" r="5443" b="9653">unknowns)</wd>

<space/>

<wd l="5525" t="9456" r="5794" b="9614">be-</wd>

</ln>

<ln l="1440" t="9730" r="5726" b="9931" baseLine="9878" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="9730" r="1790" b="9888">fore</wd>

<space/>

<wd l="1853" t="9730" r="2568" b="9931">carrying</wd>

<space/>

<wd l="2630" t="9754" r="2909" b="9888">out</wd>

<space/>

<wd l="2962" t="9730" r="3557" b="9888">further</wd>

<space/>

<wd l="3614" t="9730" r="4666" b="9931">experiments</wd>

<space/>

<wd l="4728" t="9730" r="4896" b="9883">in</wd>

<space/>

<wd l="4949" t="9730" r="5256" b="9888">this</wd>

<space/>

<wd l="5328" t="9782" r="5726" b="9888">area.</wd>

</ln>

</para>

<para l="1440" t="10195" r="2938" b="10368" alignment="left" spaceBefore="211" lsp="exactly" lspExact="279" language="en">

<ln l="1440" t="10195" r="2938" b="10368" baseLine="10358" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="13">

<wd l="1440" t="10200" r="1555" b="10363">7</wd>

<space/>

<wd l="1810" t="10195" r="2938" b="10368">Conclusion</wd>

</ln>

</para>

<para l="1440" t="10632" r="5803" b="13003" alignment="justified" spaceBefore="143" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="10632" r="5794" b="10834" baseLine="10781" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10637" r="1723" b="10790">We</wd>

<space/>

<wd l="1781" t="10656" r="2414" b="10834">present</wd>

<space/>

<wd l="2467" t="10632" r="2731" b="10790">the</wd>

<space/>

<wd l="2794" t="10632" r="3130" b="10790">first</wd>

<space/>

<wd l="3187" t="10632" r="3787" b="10790">dataset</wd>

<space/>

<wd l="3845" t="10632" r="4037" b="10790">of</wd>

<space/>

<wd l="4085" t="10632" r="5280" b="10834">gold-standard</wd>

<space/>

<wd l="5333" t="10637" r="5794" b="10790">POS-</wd>

</ln>

<ln l="1440" t="10906" r="5794" b="11107" baseLine="11054" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="10906" r="2021" b="11107">tagged</wd>

<space/>

<wd l="2122" t="10906" r="2525" b="11064">Irish</wd>

<space/>

<wd l="2621" t="10906" r="3408" b="11107">language</wd>

<space/>

<wd l="3509" t="10930" r="4061" b="11064">tweets</wd>

<space/>

<wd l="4171" t="10906" r="4483" b="11064">and</wd>

<space/>

<wd l="4584" t="10958" r="4838" b="11064">we</wd>

<space/>

<wd l="4939" t="10906" r="5342" b="11064">have</wd>

<space/>

<wd l="5443" t="10958" r="5794" b="11107">pro-</wd>

</ln>

<ln l="1445" t="11174" r="5794" b="11376" baseLine="11323" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="11174" r="1963" b="11333">duced</wd>

<space/>

<wd l="2069" t="11174" r="2746" b="11376">training</wd>

<space/>

<wd l="2856" t="11174" r="3475" b="11333">models</wd>

<space/>

<wd l="3595" t="11174" r="3850" b="11333">for</wd>

<space/>

<wd l="3960" t="11227" r="4056" b="11333">a</wd>

<space/>

<wd l="4171" t="11174" r="4939" b="11333">selection</wd>

<space/>

<wd l="5050" t="11174" r="5237" b="11333">of</wd>

<space/>

<wd l="5333" t="11179" r="5794" b="11333">POS-</wd>

</ln>

<ln l="1440" t="11414" r="5794" b="11645" baseLine="11593">

<wd l="1440" t="11414" r="2198" b="11645"><run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">taggers.</run>

<run underlined="none" subsuperscript="superscript" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">7</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><space/>

<wd l="2285" t="11448" r="2568" b="11602">We</wd>

<space/>

<wd l="2626" t="11443" r="3029" b="11602">have</wd>

<space/>

<wd l="3091" t="11443" r="3437" b="11602">also</wd>

<space/>

<wd l="3504" t="11443" r="4061" b="11602">shown</wd>

<space/>

<wd l="4114" t="11443" r="4478" b="11602">how</wd>

<space/>

<wd l="4541" t="11496" r="4795" b="11602">we</wd>

<space/>

<wd l="4848" t="11443" r="5251" b="11602">have</wd>

<space/>

<wd l="5309" t="11443" r="5794" b="11602">lever-</wd>

</run>

</ln>

<ln l="1445" t="11717" r="5798" b="11918" baseLine="11866" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="11717" r="1853" b="11918">aged</wd>

<space/>

<wd l="1925" t="11717" r="2352" b="11875">from</wd>

<space/>

<wd l="2429" t="11717" r="3106" b="11918">existing</wd>

<space/>

<wd l="3182" t="11717" r="3629" b="11875">work</wd>

<space/>

<wd l="3701" t="11741" r="3869" b="11875">to</wd>

<space/>

<wd l="3946" t="11717" r="4387" b="11875">build</wd>

<space/>

<wd l="4459" t="11717" r="4910" b="11875">these</wd>

<space/>

<wd l="4982" t="11770" r="5798" b="11875">resources</wd>

<space/>

</ln>

<ln l="1440" t="11986" r="5794" b="12187" baseLine="12139" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="11986" r="1699" b="12144">for</wd>

<space/>

<wd l="1762" t="12038" r="1858" b="12144">a</wd>

<space/>

<wd l="1915" t="11986" r="3158" b="12144">low-resourced</wd>

<space/>

<wd l="3221" t="11986" r="4051" b="12187">language,</wd>

<space/>

<wd l="4128" t="12010" r="4291" b="12144">to</wd>

<space/>

<wd l="4363" t="11986" r="5016" b="12144">achieve</wd>

<space/>

<wd l="5088" t="11986" r="5794" b="12144">state-of-</wd>

</ln>

<ln l="1440" t="12259" r="5794" b="12418" baseLine="12408" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12259" r="2011" b="12418">the-art</wd>

<space/>

<wd l="2059" t="12259" r="2674" b="12418">results.</wd>

<space/>

<wd l="2750" t="12264" r="3034" b="12418">We</wd>

<space/>

<wd l="3091" t="12259" r="3432" b="12418">also</wd>

<space/>

<wd l="3490" t="12259" r="4166" b="12418">confirm</wd>

<space/>

<wd l="4214" t="12259" r="4546" b="12418">that</wd>

<space/>

<wd l="4589" t="12259" r="4858" b="12418">the</wd>

<space/>

<wd l="4906" t="12264" r="5318" b="12418">NLP</wd>

<space/>

<wd l="5376" t="12259" r="5794" b="12418">chal-</wd>

</ln>

<ln l="1440" t="12528" r="5803" b="12730" baseLine="12682" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1440" t="12528" r="1987" b="12730">lenges</wd>

<space/>

<wd l="2069" t="12528" r="2654" b="12730">arising</wd>

<space/>

<wd l="2726" t="12528" r="3154" b="12686">from</wd>

<space/>

<wd l="3221" t="12528" r="3691" b="12730">noisy</wd>

<space/>

<wd l="3763" t="12528" r="5045" b="12730">user-generated</wd>

<space/>

<wd l="5112" t="12552" r="5434" b="12686">text</wd>

<space/>

<wd l="5506" t="12581" r="5803" b="12686">can</wd>

<space/>

</ln>

<ln l="1445" t="12802" r="4397" b="13003" baseLine="12950" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">

<wd l="1445" t="12802" r="1790" b="12960">also</wd>

<space/>

<wd l="1853" t="12802" r="2328" b="13003">apply</wd>

<space/>

<wd l="2386" t="12826" r="2554" b="12960">to</wd>

<space/>

<wd l="2616" t="12854" r="2712" b="12960">a</wd>

<space/>

<wd l="2760" t="12802" r="3509" b="13003">minority</wd>

<space/>

<wd l="3566" t="12802" r="4397" b="13003">language.</wd>

</ln>

</para>

<para l="1445" t="13267" r="3662" b="13488" alignment="left" spaceBefore="211" lsp="exactly" lspExact="279" language="en">

<ln l="1445" t="13267" r="3662" b="13488" baseLine="13430" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">

<wd l="1445" t="13267" r="1555" b="13440">8</wd>

<space/>

<wd l="1800" t="13267" r="3662" b="13488">Acknowledgments</wd>

</ln>

</para>

<para l="1440" t="13704" r="5808" b="14717" alignment="justified" spaceBefore="145" spaceAfter="105" lsp="exactly" lspExact="271" language="en">

<ln l="1440" t="13704" r="5794" b="13906" baseLine="13853" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13704" r="1781" b="13862">The</wd>

<space/>

<wd l="1853" t="13704" r="2482" b="13862">authors</wd>

<space/>

<wd l="2558" t="13704" r="3106" b="13862">would</wd>

<space/>

<wd l="3173" t="13704" r="3499" b="13862">like</wd>

<space/>

<wd l="3566" t="13728" r="3734" b="13862">to</wd>

<space/>

<wd l="3806" t="13704" r="4291" b="13862">thank</wd>

<space/>

<wd l="4363" t="13704" r="4627" b="13862">the</wd>

<space/>

<wd l="4699" t="13704" r="5131" b="13862">three</wd>

<space/>

<wd l="5208" t="13757" r="5794" b="13906">anony-</wd>

</ln>

<ln l="1440" t="13978" r="5803" b="14179" baseLine="14126" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="14030" r="1906" b="14136">mous</wd>

<space/>

<wd l="2006" t="13978" r="2837" b="14136">reviewers</wd>

<space/>

<wd l="2938" t="13978" r="3197" b="14136">for</wd>

<space/>

<wd l="3288" t="13978" r="3691" b="14136">their</wd>

<space/>

<wd l="3782" t="13978" r="4397" b="14179">helpful</wd>

<space/>

<wd l="4493" t="13978" r="5323" b="14136">feedback.</wd>

<space/>

<wd l="5520" t="13982" r="5803" b="14136">We</wd>

<space/>

</ln>

<ln l="1445" t="14246" r="5798" b="14448" baseLine="14395" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="14246" r="1790" b="14405">also</wd>

<space/>

<wd l="1891" t="14246" r="2438" b="14405">would</wd>

<space/>

<wd l="2534" t="14246" r="2861" b="14405">like</wd>

<space/>

<wd l="2962" t="14270" r="3130" b="14405">to</wd>

<space/>

<wd l="3230" t="14246" r="3720" b="14405">thank</wd>

<space/>

<wd l="3821" t="14246" r="4339" b="14405">Kevin</wd>

<space/>

<wd l="4445" t="14246" r="5093" b="14448">Gimpel</wd>

<space/>

<wd l="5194" t="14246" r="5453" b="14405">for</wd>

<space/>

<wd l="5549" t="14246" r="5798" b="14405">his</wd>

<space/>

</ln>

<ln l="1450" t="14515" r="5808" b="14717" baseLine="14669" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1450" t="14544" r="2098" b="14717">support</wd>

<space/>

<wd l="2227" t="14515" r="2616" b="14674">with</wd>

<space/>

<wd l="2746" t="14515" r="3216" b="14717">using</wd>

<space/>

<wd l="3355" t="14515" r="3619" b="14674">the</wd>

<space/>

<wd l="3758" t="14520" r="4248" b="14674">CMU</wd>

<space/>

<wd l="4382" t="14515" r="5050" b="14717">English</wd>

<space/>

<wd l="5179" t="14515" r="5808" b="14674">Twitter</wd>

</ln>

</para>

<rulerline l="1430" t="14846" r="2640" b="14846" type="single" width="5" color="000000"/>

<para l="1450" t="14904" r="5789" b="15293" alignment="justified" spaceBefore="45" spaceAfter="14" fli="216" lsp="exactly" lspExact="203" language="en">

<ln l="1694" t="14904" r="5789" b="15096" baseLine="15056">

<wd l="1694" t="14904" r="2045" b="15067"><run underlined="none" subsuperscript="superscript" fontSize="650" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">7</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0">Our</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2141" t="14938" r="2434" b="15067">data</wd>

<space/>

<wd l="2530" t="14938" r="2640" b="15067">is</wd>

<space/>

<wd l="2746" t="14938" r="3379" b="15067">available</wd>

<space/>

<wd l="3475" t="14957" r="3610" b="15067">to</wd>

<space/>

<wd l="3710" t="14938" r="4411" b="15067">download</wd>

<space/>

<wd l="4502" t="14938" r="4853" b="15067">from</wd>

<space/>

</run>

<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0"><wd l="4949" t="14942" r="5789" b="15096">https://</wd>

<space/>

</run>

</ln>

<ln l="1450" t="15139" r="5189" b="15293" baseLine="15259" underlined="none" subsuperscript="none" fontSize="900" fontFace="Courier New" fontFamily="modern" fontPitch="fixed" spacing="0">

<wd l="1450" t="15139" r="5189" b="15293">github.com/tlynn747/IrishTwitterPOS</wd>

</ln>

</para>

</column>

<column l="6141" t="1261" r="10528" b="15315">

<para l="6144" t="1320" r="10512" b="4234" alignment="justified" lsp="exactly" lspExact="270" language="en">

<ln l="6144" t="1320" r="10512" b="1522" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1325" r="6533" b="1478">POS</wd>

<space/>

<wd l="6629" t="1344" r="7210" b="1522">tagger,</wd>

<space/>

<wd l="7315" t="1320" r="7896" b="1522">Djamé</wd>

<space/>

<wd l="7982" t="1320" r="8621" b="1478">Seddah</wd>

<space/>

<wd l="8707" t="1320" r="8966" b="1478">for</wd>

<space/>

<wd l="9043" t="1320" r="9293" b="1478">his</wd>

<space/>

<wd l="9394" t="1349" r="10042" b="1522">support</wd>

<space/>

<wd l="10123" t="1320" r="10512" b="1478">with</wd>

<space/>

</ln>

<ln l="6144" t="1594" r="10502" b="1781" baseLine="1742" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="1594" r="6950" b="1781">Morfette,</wd>

<space/>

<wd l="7051" t="1594" r="7358" b="1752">and</wd>

<space/>

<wd l="7435" t="1594" r="7992" b="1752">Elaine</wd>

<space/>

<wd l="8069" t="1598" r="8290" b="1752">Uí</wd>

<space/>

<wd l="8362" t="1594" r="9576" b="1752">Dhonnchadha</wd>

<space/>

<wd l="9653" t="1594" r="9965" b="1752">and</wd>

<space/>

<wd l="10037" t="1598" r="10502" b="1752">Fran-</wd>

</ln>

<ln l="6149" t="1862" r="10502" b="2064" baseLine="2016" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="1862" r="6379" b="2021">cis</wd>

<space/>

<wd l="6494" t="1867" r="6970" b="2064">Tyers</wd>

<space/>

<wd l="7085" t="1862" r="7344" b="2021">for</wd>

<space/>

<wd l="7450" t="1862" r="7853" b="2021">their</wd>

<space/>

<wd l="7963" t="1891" r="8611" b="2064">support</wd>

<space/>

<wd l="8717" t="1862" r="9110" b="2021">with</wd>

<space/>

<wd l="9216" t="1862" r="9480" b="2021">the</wd>

<space/>

<wd l="9590" t="1862" r="9994" b="2021">Irish</wd>

<space/>

<wd l="10099" t="1862" r="10502" b="2021">rule-</wd>

</ln>

<ln l="6144" t="2136" r="10507" b="2338" baseLine="2285" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2136" r="6643" b="2294">based</wd>

<space/>

<wd l="6754" t="2141" r="7142" b="2294">POS</wd>

<space/>

<wd l="7262" t="2160" r="7838" b="2338">tagger.</wd>

<space/>

<wd l="8078" t="2136" r="8458" b="2294">This</wd>

<space/>

<wd l="8578" t="2136" r="9024" b="2294">work</wd>

<space/>

<wd l="9130" t="2189" r="9461" b="2294">was</wd>

<space/>

<wd l="9576" t="2136" r="10186" b="2294">funded</wd>

<space/>

<wd l="10291" t="2136" r="10507" b="2338">by</wd>

<space/>

</ln>

<ln l="6144" t="2405" r="10512" b="2606" baseLine="2558" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2405" r="6413" b="2563">the</wd>

<space/>

<wd l="6528" t="2405" r="7344" b="2606">Fulbright</wd>

<space/>

<wd l="7464" t="2405" r="8477" b="2563">Commission</wd>

<space/>

<wd l="8597" t="2405" r="8789" b="2563">of</wd>

<space/>

<wd l="8890" t="2405" r="9509" b="2563">Ireland</wd>

<space/>

<wd l="9634" t="2405" r="10512" b="2606">(Fulbright</wd>

<space/>

</ln>

<ln l="6144" t="2678" r="10502" b="2880" baseLine="2827" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2678" r="7733" b="2880">Enterprise-Ireland</wd>

<space/>

<wd l="7838" t="2678" r="8414" b="2837">Award</wd>

<space/>

<wd l="8525" t="2678" r="9581" b="2875">2014-2015),</wd>

<space/>

<wd l="9715" t="2678" r="10027" b="2837">and</wd>

<space/>

<wd l="10147" t="2731" r="10502" b="2880">sup-</wd>

</ln>

<ln l="6144" t="2947" r="10512" b="3149" baseLine="3101" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="2947" r="6706" b="3149">ported</wd>

<space/>

<wd l="6763" t="2947" r="6979" b="3149">by</wd>

<space/>

<wd l="7046" t="2947" r="7718" b="3106">Science</wd>

<space/>

<wd l="7776" t="2947" r="8770" b="3106">Foundation</wd>

<space/>

<wd l="8827" t="2947" r="9446" b="3106">Ireland</wd>

<space/>

<wd l="9504" t="2947" r="10186" b="3149">through</wd>

<space/>

<wd l="10243" t="2947" r="10512" b="3106">the</wd>

<space/>

</ln>

<ln l="6149" t="3221" r="10512" b="3422" baseLine="3370" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="3226" r="6739" b="3379">CNGL</wd>

<space/>

<wd l="6850" t="3226" r="7867" b="3422">Programme</wd>

<space/>

<wd l="7987" t="3226" r="8549" b="3418">(Grant</wd>

<space/>

<wd l="8678" t="3221" r="9845" b="3418">12/CE/I2267)</wd>

<space/>

<wd l="9965" t="3221" r="10138" b="3374">in</wd>

<space/>

<wd l="10243" t="3221" r="10512" b="3379">the</wd>

<space/>

</ln>

<ln l="6144" t="3490" r="10512" b="3691" baseLine="3638" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="3494" r="6859" b="3643">ADAPT</wd>

<space/>

<wd l="6974" t="3494" r="7550" b="3648">Centre</wd>

<space/>

<wd l="7670" t="3490" r="9523" b="3691">(www.adaptcentre.ie)</wd>

<space/>

<wd l="9648" t="3514" r="9802" b="3648">at</wd>

<space/>

<wd l="9907" t="3490" r="10512" b="3648">Dublin</wd>

<space/>

</ln>

<ln l="6149" t="3763" r="10507" b="3965" baseLine="3912" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6149" t="3763" r="6518" b="3965">City</wd>

<space/>

<wd l="6590" t="3763" r="7536" b="3965">University.</wd>

<space/>

<wd l="7661" t="3763" r="8002" b="3922">The</wd>

<space/>

<wd l="8083" t="3763" r="8678" b="3922">second</wd>

<space/>

<wd l="8750" t="3763" r="9307" b="3922">author</wd>

<space/>

<wd l="9374" t="3816" r="9706" b="3922">was</wd>

<space/>

<wd l="9782" t="3763" r="10507" b="3965">partially</wd>

<space/>

</ln>

<ln l="6154" t="4032" r="9432" b="4234" baseLine="4181" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6154" t="4032" r="7008" b="4234">supported</wd>

<space/>

<wd l="7061" t="4032" r="7277" b="4234">by</wd>

<space/>

<wd l="7334" t="4037" r="7603" b="4190">US</wd>

<space/>

<wd l="7666" t="4037" r="8064" b="4190">NSF</wd>

<space/>

<wd l="8126" t="4056" r="8573" b="4234">grant</wd>

<space/>

<wd l="8650" t="4032" r="9432" b="4190">1159174.</wd>

</ln>

</para>

<para l="6149" t="4786" r="7248" b="4958" alignment="left" spaceBefore="504" lsp="exactly" lspExact="279" language="en">

<ln l="6149" t="4786" r="7248" b="4958" baseLine="4954" bold="true" underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="4786" r="7248" b="4958">References</wd>

</ln>

</para>

<para l="6144" t="5198" r="10507" b="6245" alignment="justified" li="216" spaceBefore="146" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="5198" r="10507" b="5366" baseLine="5333" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="5198" r="6658" b="5342">Tetske</wd>

<space/>

<wd l="6725" t="5203" r="7507" b="5366">Avontuur,</wd>

<space/>

<wd l="7584" t="5198" r="7843" b="5342">Iris</wd>

<space/>

<wd l="7915" t="5198" r="8746" b="5366">Balemans,</wd>

<space/>

<wd l="8822" t="5203" r="9288" b="5342">Laura</wd>

<space/>

<wd l="9350" t="5198" r="9912" b="5366">Elshof,</wd>

<space/>

<wd l="9989" t="5203" r="10507" b="5342">Nanne</wd>

<space/>

</ln>

<ln l="6365" t="5419" r="10502" b="5587" baseLine="5554" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="5462" r="6648" b="5563">van</wd>

<space/>

<wd l="6730" t="5419" r="7282" b="5587">Noord,</wd>

<space/>

<wd l="7387" t="5419" r="7670" b="5563">and</wd>

<space/>

<wd l="7752" t="5424" r="8314" b="5563">Menno</wd>

<space/>

<wd l="8400" t="5462" r="8678" b="5563">van</wd>

<space/>

<wd l="8770" t="5424" r="9394" b="5563">Zaanen.</wd>

<space/>

<wd l="9590" t="5419" r="10022" b="5563">2012.</wd>

<space/>

<wd l="10214" t="5424" r="10502" b="5563">De-</wd>

</ln>

<ln l="6365" t="5635" r="10498" b="5822" baseLine="5774" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="5635" r="7056" b="5822">veloping</wd>

<space/>

<wd l="7142" t="5678" r="7229" b="5779">a</wd>

<space/>

<wd l="7306" t="5635" r="8458" b="5818">part-of-speech</wd>

<space/>

<wd l="8539" t="5654" r="9038" b="5822">tagger</wd>

<space/>

<wd l="9115" t="5635" r="9350" b="5779">for</wd>

<space/>

<wd l="9432" t="5635" r="9874" b="5779">Dutch</wd>

<space/>

<wd l="9950" t="5654" r="10498" b="5779">tweets.</wd>

<space/>

</ln>

<ln l="6374" t="5856" r="10502" b="6038" baseLine="5990" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="5856" r="7560" b="6038">Computational</wd>

<space/>

<wd l="7613" t="5861" r="8491" b="6038">Linguistics</wd>

<space/>

<wd l="8558" t="5861" r="8698" b="6000">in</wd>

<space/>

<wd l="8765" t="5856" r="9000" b="6000">the</wd>

<space/>

<wd l="9053" t="5856" r="10032" b="6000">Netherlands</wd>

<space/>

<wd l="10085" t="5861" r="10502" b="6000">Jour-</wd>

</ln>

<ln l="6365" t="6077" r="8160" b="6245" baseLine="6211">

<wd l="6365" t="6077" r="6662" b="6245"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">nal</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="6725" t="6077" r="7416" b="6245">2:34–51,</wd>

<space/>

<wd l="7488" t="6077" r="8160" b="6221">12/2012.</wd>

</run>

</ln>

</para>

<para l="6149" t="6523" r="10517" b="7584" alignment="justified" li="216" spaceBefore="230" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6149" t="6523" r="10507" b="6710" baseLine="6662" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="6523" r="6883" b="6710">Grzegorz</wd>

<space/>

<wd l="6984" t="6523" r="7752" b="6706">Chrupala,</wd>

<space/>

<wd l="7872" t="6523" r="8693" b="6710">Georgiana</wd>

<space/>

<wd l="8789" t="6523" r="9230" b="6691">Dinu,</wd>

<space/>

<wd l="9346" t="6523" r="9629" b="6667">and</wd>

<space/>

<wd l="9725" t="6523" r="10142" b="6667">Josef</wd>

<space/>

<wd l="10229" t="6566" r="10507" b="6667">van</wd>

<space/>

</ln>

<ln l="6370" t="6744" r="10502" b="6931" baseLine="6878" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="6744" r="7133" b="6888">Genabith.</wd>

<space/>

<wd l="7286" t="6744" r="7718" b="6888">2008.</wd>

<space/>

<wd l="7867" t="6744" r="8582" b="6931">Learning</wd>

<space/>

<wd l="8659" t="6744" r="9629" b="6931">morphology</wd>

<space/>

<wd l="9701" t="6744" r="10056" b="6888">with</wd>

<space/>

<wd l="10128" t="6787" r="10502" b="6888">mor-</wd>

</ln>

<ln l="6365" t="6960" r="10502" b="7142" baseLine="7099">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="6960" r="6758" b="7104">fette.</wd>

<space/>

<wd l="6917" t="6965" r="7085" b="7099">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="7162" t="6960" r="8146" b="7142">Proceedings</wd>

<space/>

<wd l="8227" t="6960" r="8405" b="7142">of</wd>

<space/>

<wd l="8458" t="6960" r="8693" b="7104">the</wd>

<space/>

<wd l="8765" t="6960" r="9821" b="7104">International</wd>

<space/>

<wd l="9902" t="6960" r="10502" b="7142">Confer-</wd>

</run>

</ln>

<ln l="6370" t="7181" r="10517" b="7363" baseLine="7315" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="7229" r="6725" b="7325">ence</wd>

<space/>

<wd l="6778" t="7229" r="6970" b="7325">on</wd>

<space/>

<wd l="7013" t="7186" r="7810" b="7363">Language</wd>

<space/>

<wd l="7848" t="7186" r="8664" b="7325">Resources</wd>

<space/>

<wd l="8712" t="7181" r="9014" b="7325">and</wd>

<space/>

<wd l="9048" t="7181" r="9955" b="7349">Evaluation,</wd>

<space/>

<wd l="10018" t="7186" r="10517" b="7325">LREC</wd>

<space/>

</ln>

<ln l="6365" t="7402" r="10426" b="7584" baseLine="7536">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="7402" r="6792" b="7570">2008,</wd>

<space/>

<wd l="6864" t="7402" r="7066" b="7546">26</wd>

<space/>

<wd l="7104" t="7406" r="7464" b="7584">May</wd>

<space/>

<wd l="7526" t="7488" r="7574" b="7502">-</wd>

<space/>

<wd l="7642" t="7402" r="7714" b="7541">1</wd>

<space/>

<wd l="7776" t="7406" r="8146" b="7546">June</wd>

<space/>

<wd l="8198" t="7402" r="8626" b="7570">2008,</wd>

<space/>

<wd l="8693" t="7402" r="9605" b="7570">Marrakech,</wd>

<space/>

</run>

<wd l="9672" t="7406" r="10426" b="7546"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">Morocco</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="7848" r="10502" b="8462" alignment="justified" li="216" spaceBefore="231" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="7848" r="10502" b="8035" baseLine="7987" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="7853" r="6259" b="7992">J.</wd>

<space/>

<wd l="6326" t="7848" r="6883" b="7992">Cohen.</wd>

<space/>

<wd l="6984" t="7848" r="7402" b="7992">1960.</wd>

<space/>

<wd l="7488" t="7853" r="7632" b="7987">A</wd>

<space/>

<wd l="7685" t="7848" r="8563" b="7992">Coefficient</wd>

<space/>

<wd l="8616" t="7848" r="8789" b="7992">of</wd>

<space/>

<wd l="8827" t="7853" r="9715" b="8035">Agreement</wd>

<space/>

<wd l="9763" t="7848" r="9998" b="7992">for</wd>

<space/>

<wd l="10046" t="7853" r="10502" b="7992">Nom-</wd>

</ln>

<ln l="6365" t="8069" r="10502" b="8251" baseLine="8203">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="8069" r="6662" b="8213">inal</wd>

<space/>

<wd l="6744" t="8069" r="7286" b="8213">Scales.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7454" t="8069" r="8438" b="8213">Educational</wd>

<space/>

<wd l="8510" t="8069" r="8818" b="8213">and</wd>

<space/>

<wd l="8890" t="8069" r="10013" b="8251">Psychological</wd>

<space/>

<wd l="10085" t="8074" r="10502" b="8213">Mea-</wd>

</run>

</ln>

<ln l="6365" t="8285" r="7910" b="8462" baseLine="8424">

<wd l="6365" t="8314" r="7128" b="8453"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">surement</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7190" t="8285" r="7910" b="8462">20(1):37.</wd>

</run>

</ln>

</para>

<para l="6144" t="8736" r="10512" b="10018" alignment="justified" li="216" spaceBefore="228" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="8736" r="10512" b="8923" baseLine="8870" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="8741" r="6557" b="8880">Leon</wd>

<space/>

<wd l="6619" t="8736" r="7570" b="8923">Derczynski,</wd>

<space/>

<wd l="7642" t="8736" r="8026" b="8880">Alan</wd>

<space/>

<wd l="8093" t="8736" r="8582" b="8904">Ritter,</wd>

<space/>

<wd l="8659" t="8736" r="9010" b="8880">Sam</wd>

<space/>

<wd l="9077" t="8736" r="9557" b="8904">Clark,</wd>

<space/>

<wd l="9634" t="8736" r="9917" b="8880">and</wd>

<space/>

<wd l="9984" t="8736" r="10512" b="8880">Kalina</wd>

<space/>

</ln>

<ln l="6365" t="8952" r="10507" b="9139" baseLine="9091" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="8952" r="7243" b="9096">Bontcheva.</wd>

<space/>

<wd l="7426" t="8952" r="7858" b="9096">2013.</wd>

<space/>

<wd l="8035" t="8952" r="8606" b="9096">Twitter</wd>

<space/>

<wd l="8683" t="8952" r="9835" b="9134">part-of-speech</wd>

<space/>

<wd l="9912" t="8952" r="10507" b="9139">tagging</wd>

<space/>

</ln>

<ln l="6365" t="9173" r="10512" b="9360" baseLine="9312" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="9173" r="6595" b="9317">for</wd>

<space/>

<wd l="6653" t="9173" r="6888" b="9317">all:</wd>

<space/>

<wd l="6979" t="9173" r="7963" b="9360">Overcoming</wd>

<space/>

<wd l="8030" t="9216" r="8515" b="9355">sparse</wd>

<space/>

<wd l="8573" t="9173" r="8861" b="9317">and</wd>

<space/>

<wd l="8909" t="9173" r="9341" b="9360">noisy</wd>

<space/>

<wd l="9398" t="9173" r="9768" b="9317">data.</wd>

<space/>

<wd l="9859" t="9178" r="10027" b="9312">In</wd>

<space/>

<wd l="10085" t="9173" r="10512" b="9317">Galia</wd>

<space/>

</ln>

<ln l="6365" t="9394" r="10502" b="9581" baseLine="9528" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="9394" r="7176" b="9581">Angelova,</wd>

<space/>

<wd l="7282" t="9394" r="7810" b="9538">Kalina</wd>

<space/>

<wd l="7891" t="9394" r="8779" b="9562">Bontcheva,</wd>

<space/>

<wd l="8885" t="9394" r="9168" b="9538">and</wd>

<space/>

<wd l="9254" t="9394" r="9802" b="9538">Ruslan</wd>

<space/>

<wd l="9893" t="9394" r="10502" b="9562">Mitkov,</wd>

<space/>

</ln>

<ln l="6370" t="9610" r="10502" b="9797" baseLine="9749">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="9610" r="6950" b="9778">editors,</wd>

<space/>

</run>

<wd l="7018" t="9614" r="7670" b="9778"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">RANLP</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="7742" t="9653" r="8189" b="9797">pages</wd>

<space/>

<wd l="8275" t="9610" r="8990" b="9754">198–206.</wd>

<space/>

<wd l="9062" t="9614" r="9715" b="9754">RANLP</wd>

<space/>

<wd l="9782" t="9610" r="10157" b="9754">2011</wd>

<space/>

<wd l="10243" t="9610" r="10502" b="9754">Or-</wd>

</run>

</ln>

<ln l="6370" t="9830" r="8558" b="10018" baseLine="9970" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="9830" r="7032" b="10018">ganising</wd>

<space/>

<wd l="7094" t="9830" r="7973" b="9974">Committee</wd>

<space/>

<wd l="8021" t="9830" r="8083" b="9974">/</wd>

<space/>

<wd l="8126" t="9830" r="8558" b="9974">ACL.</wd>

</ln>

</para>

<para l="6144" t="10282" r="10507" b="11563" alignment="justified" li="216" spaceBefore="231" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="10282" r="10502" b="10426" baseLine="10416" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6144" t="10282" r="6595" b="10426">Jacob</wd>

<space/>

<wd l="6677" t="10282" r="7531" b="10426">Eisenstein.</wd>

<space/>

<wd l="7704" t="10282" r="8136" b="10426">2013.</wd>

<space/>

<wd l="8304" t="10282" r="8736" b="10426">What</wd>

<space/>

<wd l="8813" t="10301" r="8962" b="10426">to</wd>

<space/>

<wd l="9048" t="10282" r="9240" b="10426">do</wd>

<space/>

<wd l="9322" t="10282" r="9763" b="10426">about</wd>

<space/>

<wd l="9835" t="10282" r="10128" b="10426">bad</wd>

<space/>

<wd l="10200" t="10282" r="10502" b="10426">lan-</wd>

</ln>

<ln l="6370" t="10498" r="10507" b="10685" baseLine="10637">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6370" t="10541" r="6835" b="10685">guage</wd>

<space/>

<wd l="6912" t="10541" r="7109" b="10642">on</wd>

<space/>

<wd l="7176" t="10498" r="7421" b="10642">the</wd>

<space/>

<wd l="7493" t="10498" r="8136" b="10642">internet.</wd>

<space/>

<wd l="8285" t="10502" r="8453" b="10637">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8520" t="10498" r="9504" b="10680">Proceedings</wd>

<space/>

<wd l="9581" t="10498" r="9763" b="10680">of</wd>

<space/>

<wd l="9806" t="10498" r="10042" b="10642">the</wd>

<space/>

<wd l="10114" t="10498" r="10507" b="10642">2013</wd>

<space/>

</run>

</ln>

<ln l="6374" t="10718" r="10507" b="10901" baseLine="10853" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6374" t="10718" r="7272" b="10901">Conference</wd>

<space/>

<wd l="7358" t="10718" r="7541" b="10901">of</wd>

<space/>

<wd l="7589" t="10718" r="7829" b="10862">the</wd>

<space/>

<wd l="7901" t="10718" r="8371" b="10862">North</wd>

<space/>

<wd l="8438" t="10723" r="9221" b="10862">American</wd>

<space/>

<wd l="9312" t="10718" r="9965" b="10901">Chapter</wd>

<space/>

<wd l="10037" t="10718" r="10219" b="10901">of</wd>

<space/>

<wd l="10272" t="10718" r="10507" b="10862">the</wd>

<space/>

</ln>

<ln l="6350" t="10934" r="10507" b="11117" baseLine="11074" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6350" t="10939" r="7291" b="11078">Association</wd>

<space/>

<wd l="7320" t="10934" r="7594" b="11117">for</wd>

<space/>

<wd l="7656" t="10934" r="8842" b="11117">Computational</wd>

<space/>

<wd l="8894" t="10939" r="9835" b="11117">Linguistics:</wd>

<space/>

<wd l="9922" t="10939" r="10507" b="11078">Human</wd>

<space/>

</ln>

<ln l="6360" t="11155" r="10502" b="11342" baseLine="11294">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6360" t="11160" r="7157" b="11338">Language</wd>

<space/>

</run>

<wd l="7258" t="11155" r="8328" b="11338"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Technologies</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8434" t="11198" r="8885" b="11342">pages</wd>

<space/>

<wd l="8981" t="11155" r="9715" b="11299">359–369.</wd>

<space/>

<wd l="9816" t="11155" r="10502" b="11299">Associa-</wd>

</run>

</ln>

<ln l="6365" t="11376" r="9163" b="11563" baseLine="11510" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="11376" r="6677" b="11520">tion</wd>

<space/>

<wd l="6725" t="11376" r="6955" b="11520">for</wd>

<space/>

<wd l="7013" t="11376" r="8189" b="11558">Computational</wd>

<space/>

<wd l="8242" t="11376" r="9163" b="11563">Linguistics.</wd>

</ln>

</para>

<para l="6144" t="11794" r="10507" b="12888" alignment="justified" li="216" spaceBefore="230" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6144" t="11794" r="10502" b="12010" baseLine="11961">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="11827" r="6259" b="11966">J.</wd>

<space/>

<wd l="6398" t="11827" r="6931" b="11990">Foster,</wd>

<space/>

</run>

<wd l="7085" t="11794" r="7262" b="11966"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Ö.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

<wd l="7406" t="11822" r="8232" b="12010"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Çetinoglu,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="8386" t="11827" r="8501" b="11966">J.</wd>

<space/>

<wd l="8635" t="11827" r="9288" b="12010">Wagner,</wd>

<space/>

<wd l="9437" t="11827" r="9557" b="11966">J.</wd>

<space/>

<wd l="9691" t="11827" r="9902" b="11966">Le</wd>

<space/>

<wd l="10027" t="11827" r="10502" b="11990">Roux,</wd>

<space/>

</run>

</ln>

<ln l="6370" t="12043" r="10498" b="12230" baseLine="12178" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="12043" r="6514" b="12187">S.</wd>

<space/>

<wd l="6571" t="12048" r="7142" b="12230">Hogan,</wd>

<space/>

<wd l="7195" t="12048" r="7310" b="12187">J.</wd>

<space/>

<wd l="7368" t="12043" r="7858" b="12211">Nivre,</wd>

<space/>

<wd l="7910" t="12048" r="8093" b="12187">D.</wd>

<space/>

<wd l="8150" t="12048" r="8722" b="12230">Hogan,</wd>

<space/>

<wd l="8774" t="12048" r="8890" b="12187">J.</wd>

<space/>

<wd l="8947" t="12048" r="9259" b="12187">Van</wd>

<space/>

<wd l="9307" t="12043" r="10075" b="12211">Genabith,</wd>

<space/>

<wd l="10133" t="12062" r="10277" b="12187">et</wd>

<space/>

<wd l="10320" t="12043" r="10498" b="12187">al.</wd>

<space/>

</ln>

<ln l="6370" t="12259" r="10507" b="12446" baseLine="12398" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6370" t="12259" r="6802" b="12403">2011.</wd>

<space/>

<wd l="6955" t="12264" r="7056" b="12398">#</wd>

<space/>

<wd l="7128" t="12259" r="8093" b="12442">hardtoparse:</wd>

<space/>

<wd l="8218" t="12264" r="8501" b="12403">Pos</wd>

<space/>

<wd l="8578" t="12259" r="9173" b="12446">tagging</wd>

<space/>

<wd l="9254" t="12259" r="9538" b="12403">and</wd>

<space/>

<wd l="9610" t="12259" r="10190" b="12446">parsing</wd>

<space/>

<wd l="10267" t="12259" r="10507" b="12403">the</wd>

<space/>

</ln>

<ln l="6365" t="12480" r="10507" b="12662" baseLine="12619">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6365" t="12480" r="7339" b="12624">twitterverse.</wd>

<space/>

<wd l="7522" t="12485" r="7690" b="12619">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7771" t="12480" r="8755" b="12662">Proceedings</wd>

<space/>

<wd l="8842" t="12480" r="9024" b="12662">of</wd>

<space/>

<wd l="9077" t="12480" r="9312" b="12624">the</wd>

<space/>

<wd l="9408" t="12480" r="10181" b="12662">Workshop</wd>

<space/>

<wd l="10277" t="12485" r="10507" b="12624">On</wd>

<space/>

</run>

</ln>

<ln l="6350" t="12701" r="10176" b="12888" baseLine="12835">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6350" t="12701" r="7157" b="12883">Analyzing</wd>

<space/>

<wd l="7205" t="12706" r="7978" b="12845">Microtext</wd>

<space/>

<wd l="8026" t="12706" r="8530" b="12878">(AAAI</wd>

<space/>

</run>

<wd l="8568" t="12701" r="9077" b="12878"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2011)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9134" t="12744" r="9581" b="12888">pages</wd>

<space/>

<wd l="9643" t="12701" r="10176" b="12845">20–25.</wd>

</run>

</ln>

</para>

<para l="6149" t="13147" r="10507" b="15307" alignment="justified" li="216" spaceBefore="229" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="6149" t="13147" r="10502" b="13330" baseLine="13286" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6149" t="13147" r="6624" b="13291">Kevin</wd>

<space/>

<wd l="6686" t="13147" r="7325" b="13330">Gimpel,</wd>

<space/>

<wd l="7392" t="13147" r="7963" b="13291">Nathan</wd>

<space/>

<wd l="8030" t="13147" r="8856" b="13315">Schneider,</wd>

<space/>

<wd l="8928" t="13147" r="9600" b="13291">Brendan</wd>

<space/>

<wd l="9667" t="13147" r="10502" b="13315">O’Connor,</wd>

<space/>

</ln>

<ln l="6365" t="13368" r="10502" b="13555" baseLine="13502" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="13368" r="7090" b="13555">Dipanjan</wd>

<space/>

<wd l="7234" t="13373" r="7584" b="13536">Das,</wd>

<space/>

<wd l="7752" t="13368" r="8280" b="13512">Daniel</wd>

<space/>

<wd l="8419" t="13368" r="8885" b="13536">Mills,</wd>

<space/>

<wd l="9053" t="13368" r="9499" b="13512">Jacob</wd>

<space/>

<wd l="9643" t="13368" r="10502" b="13536">Eisenstein,</wd>

<space/>

</ln>

<ln l="6365" t="13589" r="10502" b="13776" baseLine="13723" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="13589" r="7013" b="13733">Michael</wd>

<space/>

<wd l="7061" t="13589" r="7790" b="13757">Heilman,</wd>

<space/>

<wd l="7848" t="13589" r="8232" b="13733">Dani</wd>

<space/>

<wd l="8280" t="13594" r="9120" b="13776">Yogatama,</wd>

<space/>

<wd l="9173" t="13589" r="9715" b="13776">Jeffrey</wd>

<space/>

<wd l="9763" t="13589" r="10502" b="13776">Flanigan,</wd>

<space/>

</ln>

<ln l="6370" t="13805" r="10507" b="13992" baseLine="13944" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6370" t="13805" r="6653" b="13949">and</wd>

<space/>

<wd l="6715" t="13805" r="7147" b="13949">Noah</wd>

<space/>

<wd l="7214" t="13810" r="7397" b="13949">A.</wd>

<space/>

<wd l="7478" t="13805" r="7987" b="13949">Smith.</wd>

<space/>

<wd l="8126" t="13805" r="8558" b="13949">2011.</wd>

<space/>

<wd l="8688" t="13805" r="9850" b="13987">Part-of-speech</wd>

<space/>

<wd l="9912" t="13805" r="10507" b="13992">tagging</wd>

<space/>

</ln>

<ln l="6365" t="14026" r="10498" b="14208" baseLine="14160" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="14026" r="6595" b="14170">for</wd>

<space/>

<wd l="6662" t="14026" r="7267" b="14170">Twitter:</wd>

<space/>

<wd l="7378" t="14026" r="8318" b="14194">Annotation,</wd>

<space/>

<wd l="8390" t="14026" r="9062" b="14194">features,</wd>

<space/>

<wd l="9144" t="14026" r="9427" b="14170">and</wd>

<space/>

<wd l="9494" t="14026" r="10498" b="14208">experiments.</wd>

<space/>

</ln>

<ln l="6365" t="14242" r="10507" b="14424" baseLine="14381">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6365" t="14246" r="6533" b="14381">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6605" t="14242" r="7594" b="14424">Proceedings</wd>

<space/>

<wd l="7675" t="14242" r="7858" b="14424">of</wd>

<space/>

<wd l="7906" t="14242" r="8146" b="14386">the</wd>

<space/>

<wd l="8222" t="14242" r="8573" b="14386">49th</wd>

<space/>

<wd l="8640" t="14242" r="9230" b="14386">Annual</wd>

<space/>

<wd l="9302" t="14246" r="9955" b="14424">Meeting</wd>

<space/>

<wd l="10042" t="14242" r="10224" b="14424">of</wd>

<space/>

<wd l="10272" t="14242" r="10507" b="14386">the</wd>

<space/>

</run>

</ln>

<ln l="6350" t="14462" r="10507" b="14645" baseLine="14602" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6350" t="14467" r="7291" b="14606">Association</wd>

<space/>

<wd l="7320" t="14462" r="7594" b="14645">for</wd>

<space/>

<wd l="7656" t="14462" r="8842" b="14645">Computational</wd>

<space/>

<wd l="8894" t="14467" r="9835" b="14645">Linguistics:</wd>

<space/>

<wd l="9922" t="14467" r="10507" b="14606">Human</wd>

<space/>

</ln>

<ln l="6360" t="14683" r="10502" b="14866" baseLine="14818">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="6360" t="14688" r="7157" b="14866">Language</wd>

<space/>

<wd l="7238" t="14683" r="8328" b="14866">Technologies:</wd>

<space/>

<wd l="8443" t="14683" r="8880" b="14827">Short</wd>

<space/>

<wd l="8947" t="14688" r="9490" b="14866">Papers</wd>

<space/>

<wd l="9576" t="14770" r="9624" b="14784">-</wd>

<space/>

<wd l="9715" t="14683" r="10286" b="14827">Volume</wd>

<space/>

</run>

<wd l="10363" t="14683" r="10502" b="14851"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">2</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

</run>

</ln>

<ln l="6365" t="14894" r="10502" b="15086" baseLine="15038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6365" t="14904" r="6730" b="15038">HLT</wd>

<space/>

<wd l="6806" t="14899" r="7099" b="15067">’11,</wd>

<space/>

<wd l="7171" t="14942" r="7618" b="15086">pages</wd>

<space/>

<wd l="7680" t="14899" r="8222" b="15067">42–47,</wd>

<space/>

<wd l="8294" t="14899" r="9302" b="15086">Stroudsburg,</wd>

<space/>

<wd l="9370" t="14904" r="9648" b="15067">PA,</wd>

<space/>

<wd l="9715" t="14899" r="10152" b="15043">USA.</wd>

<space/>

<wd l="10224" t="14904" r="10502" b="15043">As-</wd>

</ln>

<ln l="6374" t="15120" r="9576" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="6374" t="15120" r="7085" b="15264">sociation</wd>

<space/>

<wd l="7133" t="15120" r="7368" b="15264">for</wd>

<space/>

<wd l="7421" t="15120" r="8597" b="15302">Computational</wd>

<space/>

<wd l="8650" t="15120" r="9576" b="15307">Linguistics.</wd>

</ln>

</para>

</column>

</section>

<dd l="1430" t="15726" r="10528" b="15979">

<para l="5857" t="15792" r="6090" b="15946" alignment="centered" spaceBefore="12" lsp="exactly" lspExact="231" language="en">

<ln l="5923" t="15792" r="6024" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="0">

<wd l="5923" t="15792" r="6024" b="15946">7</wd>

</ln>

</para>

</dd>

</body>

</page>

<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">

<description>

<source file="C://Users//wing.nus//Documents//pdf\W15-4301.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>

<theoreticalPage size="A4" marginLeft="1440" marginTop="1291" marginRight="1385" marginBottom="1292" offsetX="-22" offsetY="16" width="11918" height="16854"/>

<language>en</language>

</description>

<body>

<section l="1440" t="1291" r="10524" b="15315">

<column l="1440" t="1291" r="5822" b="15315">

<para l="1440" t="1291" r="5808" b="1766" alignment="justified" li="216" fli="-216" lsp="exactly" lspExact="237" language="en">

<ln l="1440" t="1291" r="5808" b="1522" baseLine="1473" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="1291" r="1790" b="1478">ITÉ.</wd>

<space/>

<wd l="2011" t="1334" r="2443" b="1478">2002.</wd>

<space/>

<wd l="2664" t="1334" r="3413" b="1478">PAROLE</wd>

<space/>

<wd l="3504" t="1334" r="4853" b="1522">Morphosyntactic</wd>

<space/>

<wd l="4949" t="1339" r="5482" b="1522">Tagset</wd>

<space/>

<wd l="5573" t="1334" r="5808" b="1478">for</wd>

<space/>

</ln>

<ln l="1656" t="1536" r="4925" b="1766" baseLine="1713" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="1579" r="2064" b="1723">Irish.</wd>

<space/>

<wd l="2146" t="1579" r="2866" b="1723">Institiúid</wd>

<space/>

<wd l="2914" t="1579" r="4219" b="1766">Teangeolaíochta</wd>

<space/>

<wd l="4267" t="1536" r="4925" b="1723">Éireann.</wd>

</ln>

</para>

<para l="1440" t="1987" r="5808" b="3490" alignment="justified" li="216" spaceBefore="184" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="1987" r="5808" b="2174" baseLine="2126" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1440" t="1987" r="2198" b="2174">Lingpeng</wd>

<space/>

<wd l="2453" t="1992" r="2928" b="2174">Kong,</wd>

<space/>

<wd l="3226" t="1987" r="3797" b="2131">Nathan</wd>

<space/>

<wd l="4051" t="1987" r="4877" b="2155">Schneider,</wd>

<space/>

<wd l="5179" t="1987" r="5808" b="2131">Swabha</wd>

<space/>

</ln>

<ln l="1661" t="2208" r="5808" b="2395" baseLine="2342" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1661" t="2208" r="2784" b="2395">Swayamdipta,</wd>

<space/>

<wd l="2938" t="2208" r="3528" b="2352">Archna</wd>

<space/>

<wd l="3653" t="2208" r="4214" b="2376">Bhatia,</wd>

<space/>

<wd l="4373" t="2208" r="4795" b="2352">Chris</wd>

<space/>

<wd l="4930" t="2213" r="5362" b="2395">Dyer,</wd>

<space/>

<wd l="5525" t="2208" r="5808" b="2352">and</wd>

<space/>

</ln>

<ln l="1656" t="2424" r="5808" b="2611" baseLine="2563" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="2424" r="2093" b="2568">Noah</wd>

<space/>

<wd l="2170" t="2429" r="2352" b="2568">A.</wd>

<space/>

<wd l="2448" t="2424" r="2957" b="2568">Smith.</wd>

<space/>

<wd l="3144" t="2424" r="3576" b="2568">2014.</wd>

<space/>

<wd l="3754" t="2429" r="3898" b="2563">A</wd>

<space/>

<wd l="3984" t="2424" r="4925" b="2611">dependency</wd>

<space/>

<wd l="5006" t="2467" r="5496" b="2606">parser</wd>

<space/>

<wd l="5573" t="2424" r="5808" b="2568">for</wd>

<space/>

</ln>

<ln l="1656" t="2645" r="5803" b="2827" baseLine="2779">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="1656" t="2664" r="2208" b="2789">tweets.</wd>

<space/>

<wd l="2342" t="2650" r="2510" b="2784">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><wd l="2578" t="2645" r="3562" b="2827">Proceedings</wd>

<space/>

<wd l="3634" t="2645" r="3816" b="2827">of</wd>

<space/>

<wd l="3859" t="2645" r="4094" b="2789">the</wd>

<space/>

<wd l="4162" t="2645" r="4555" b="2789">2014</wd>

<space/>

<wd l="4637" t="2645" r="5539" b="2827">Conference</wd>

<space/>

<wd l="5611" t="2693" r="5803" b="2789">on</wd>

<space/>

</run>

</ln>

<ln l="1651" t="2866" r="5803" b="3048" baseLine="3000" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1651" t="2866" r="2458" b="3048">Empirical</wd>

<space/>

<wd l="2496" t="2866" r="3187" b="3010">Methods</wd>

<space/>

<wd l="3240" t="2870" r="3384" b="3010">in</wd>

<space/>

<wd l="3427" t="2866" r="4051" b="3010">Natural</wd>

<space/>

<wd l="4085" t="2870" r="4882" b="3048">Language</wd>

<space/>

<wd l="4930" t="2870" r="5803" b="3048">Processing</wd>

<space/>

</ln>

<ln l="1661" t="3082" r="5794" b="3269" baseLine="3221">

<wd l="1661" t="3086" r="2486" b="3259"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">(EMNLP)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2"><space/>

<wd l="2549" t="3125" r="2995" b="3269">pages</wd>

<space/>

<wd l="3072" t="3082" r="3994" b="3250">1001–1012,</wd>

<space/>

<wd l="4051" t="3082" r="4526" b="3250">Doha,</wd>

<space/>

<wd l="4594" t="3082" r="5064" b="3259">Qatar,</wd>

<space/>

<wd l="5131" t="3082" r="5794" b="3226">October.</wd>

<space/>

</run>

</ln>

<ln l="1656" t="3302" r="5088" b="3490" baseLine="3437" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-2">

<wd l="1656" t="3302" r="2602" b="3446">Association</wd>

<space/>

<wd l="2650" t="3302" r="2880" b="3446">for</wd>

<space/>

<wd l="2938" t="3302" r="4114" b="3485">Computational</wd>

<space/>

<wd l="4166" t="3302" r="5088" b="3490">Linguistics.</wd>

</ln>

</para>

<para l="1440" t="3710" r="5813" b="4555" alignment="justified" li="216" spaceBefore="190" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="3710" r="5813" b="3898" baseLine="3849" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1440" t="3715" r="1958" b="3854">Teresa</wd>

<space/>

<wd l="2002" t="3715" r="2453" b="3898">Lynn,</wd>

<space/>

<wd l="2506" t="3710" r="3149" b="3854">Jennifer</wd>

<space/>

<wd l="3192" t="3715" r="3720" b="3878">Foster,</wd>

<space/>

<wd l="3773" t="3710" r="4205" b="3854">Mark</wd>

<space/>

<wd l="4248" t="3715" r="4670" b="3878">Dras,</wd>

<space/>

<wd l="4728" t="3710" r="5011" b="3854">and</wd>

<space/>

<wd l="5054" t="3710" r="5558" b="3854">Elaine</wd>

<space/>

<wd l="5606" t="3710" r="5813" b="3854">Uí</wd>

<space/>

</ln>

<ln l="1656" t="3931" r="5808" b="4118" baseLine="4066" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">

<wd l="1656" t="3931" r="2803" b="4075">Dhonnchadha.</wd>

<space/>

<wd l="2928" t="3931" r="3360" b="4075">2012.</wd>

<space/>

<wd l="3485" t="3931" r="4008" b="4075">Active</wd>

<space/>

<wd l="4070" t="3931" r="4718" b="4118">learning</wd>

<space/>

<wd l="4790" t="3931" r="5074" b="4075">and</wd>

<space/>

<wd l="5136" t="3931" r="5376" b="4075">the</wd>

<space/>

<wd l="5438" t="3931" r="5808" b="4075">Irish</wd>

<space/>

</ln>

<ln l="1656" t="4152" r="5798" b="4334" baseLine="4286">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1656" t="4152" r="2381" b="4296">treebank.</wd>

<space/>

<wd l="2525" t="4157" r="2693" b="4291">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="2760" t="4152" r="3744" b="4334">Proceedings</wd>

<space/>

<wd l="3821" t="4152" r="3998" b="4334">of</wd>

<space/>

<wd l="4042" t="4152" r="4277" b="4296">the</wd>

<space/>

<wd l="4334" t="4152" r="5357" b="4296">Australasian</wd>

<space/>

<wd l="5424" t="4157" r="5798" b="4296">Lan-</wd>

</run>

</ln>

<ln l="1656" t="4368" r="5712" b="4555" baseLine="4507">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><wd l="1656" t="4416" r="2141" b="4550">guage</wd>

<space/>

<wd l="2198" t="4368" r="3096" b="4550">Technology</wd>

<space/>

<wd l="3158" t="4368" r="3931" b="4550">Workshop</wd>

<space/>

</run>

<wd l="3994" t="4373" r="4613" b="4546"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">(ALTA)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-4"><space/>

<wd l="4670" t="4411" r="5117" b="4555">pages</wd>

<space/>

<wd l="5179" t="4368" r="5712" b="4512">23–32.</wd>

</run>

</ln>

</para>

<para l="1445" t="4776" r="5808" b="6720" alignment="justified" li="216" spaceBefore="180" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1445" t="4776" r="5798" b="4963" baseLine="4915" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="4776" r="2045" b="4920">Olutobi</wd>

<space/>

<wd l="2170" t="4776" r="2904" b="4958">Owoputi,</wd>

<space/>

<wd l="3043" t="4776" r="3715" b="4920">Brendan</wd>

<space/>

<wd l="3840" t="4776" r="4680" b="4944">O’Connor,</wd>

<space/>

<wd l="4824" t="4776" r="5242" b="4920">Chris</wd>

<space/>

<wd l="5366" t="4781" r="5798" b="4963">Dyer,</wd>

<space/>

</ln>

<ln l="1661" t="4997" r="5794" b="5179" baseLine="5131" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="4997" r="2136" b="5141">Kevin</wd>

<space/>

<wd l="2251" t="4997" r="2885" b="5179">Gimpel,</wd>

<space/>

<wd l="3019" t="4997" r="3590" b="5141">Nathan</wd>

<space/>

<wd l="3710" t="4997" r="4536" b="5165">Schneider,</wd>

<space/>

<wd l="4675" t="4997" r="4958" b="5141">and</wd>

<space/>

<wd l="5069" t="4997" r="5501" b="5141">Noah</wd>

<space/>

<wd l="5611" t="5002" r="5794" b="5141">A.</wd>

<space/>

</ln>

<ln l="1661" t="5218" r="5808" b="5405" baseLine="5352" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="5218" r="2174" b="5362">Smith.</wd>

<space/>

<wd l="2304" t="5218" r="2736" b="5362">2013.</wd>

<space/>

<wd l="2866" t="5218" r="3634" b="5400">Improved</wd>

<space/>

<wd l="3696" t="5218" r="4848" b="5400">part-of-speech</wd>

<space/>

<wd l="4910" t="5218" r="5506" b="5405">tagging</wd>

<space/>

<wd l="5573" t="5218" r="5808" b="5362">for</wd>

<space/>

</ln>

<ln l="1661" t="5434" r="5808" b="5578" baseLine="5573" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="5434" r="2155" b="5578">online</wd>

<space/>

<wd l="2246" t="5434" r="3389" b="5578">conversational</wd>

<space/>

<wd l="3480" t="5453" r="3778" b="5578">text</wd>

<space/>

<wd l="3859" t="5434" r="4214" b="5578">with</wd>

<space/>

<wd l="4301" t="5434" r="4709" b="5578">word</wd>

<space/>

<wd l="4800" t="5434" r="5443" b="5578">clusters.</wd>

<space/>

<wd l="5640" t="5438" r="5808" b="5573">In</wd>

<space/>

</ln>

<ln l="1656" t="5654" r="5803" b="5837" baseLine="5789" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="5654" r="2645" b="5837">Proceedings</wd>

<space/>

<wd l="2736" t="5654" r="2914" b="5837">of</wd>

<space/>

<wd l="2971" t="5654" r="3211" b="5798">the</wd>

<space/>

<wd l="3298" t="5654" r="3691" b="5798">2013</wd>

<space/>

<wd l="3787" t="5654" r="4690" b="5837">Conference</wd>

<space/>

<wd l="4781" t="5654" r="4958" b="5837">of</wd>

<space/>

<wd l="5016" t="5654" r="5256" b="5798">the</wd>

<space/>

<wd l="5338" t="5654" r="5803" b="5798">North</wd>

<space/>

</ln>

<ln l="1642" t="5875" r="5798" b="6058" baseLine="6010" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="5880" r="2429" b="6019">American</wd>

<space/>

<wd l="2501" t="5875" r="3154" b="6058">Chapter</wd>

<space/>

<wd l="3211" t="5875" r="3394" b="6058">of</wd>

<space/>

<wd l="3427" t="5875" r="3662" b="6019">the</wd>

<space/>

<wd l="3710" t="5880" r="4651" b="6019">Association</wd>

<space/>

<wd l="4680" t="5875" r="4958" b="6058">for</wd>

<space/>

<wd l="5016" t="5880" r="5798" b="6058">Computa-</wd>

</ln>

<ln l="1661" t="6091" r="5798" b="6274" baseLine="6230">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="6091" r="2126" b="6235">tional</wd>

<space/>

<wd l="2179" t="6096" r="3115" b="6274">Linguistics:</wd>

<space/>

<wd l="3206" t="6096" r="3797" b="6235">Human</wd>

<space/>

<wd l="3854" t="6096" r="4651" b="6274">Language</wd>

<space/>

</run>

<wd l="4728" t="6091" r="5798" b="6274"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Technologies</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

</run>

</ln>

<ln l="1656" t="6312" r="5808" b="6499" baseLine="6446" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="6355" r="2107" b="6499">pages</wd>

<space/>

<wd l="2170" t="6312" r="2904" b="6480">380–390,</wd>

<space/>

<wd l="2966" t="6312" r="3595" b="6480">Atlanta,</wd>

<space/>

<wd l="3662" t="6312" r="4334" b="6499">Georgia,</wd>

<space/>

<wd l="4397" t="6317" r="4800" b="6456">June.</wd>

<space/>

<wd l="4862" t="6312" r="5808" b="6456">Association</wd>

<space/>

</ln>

<ln l="1656" t="6533" r="4099" b="6720" baseLine="6667" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="6533" r="1891" b="6677">for</wd>

<space/>

<wd l="1944" t="6533" r="3120" b="6715">Computational</wd>

<space/>

<wd l="3173" t="6533" r="4099" b="6720">Linguistics.</wd>

</ln>

</para>

<para l="1445" t="6941" r="5818" b="7781" alignment="justified" li="216" spaceBefore="186" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1445" t="6941" r="5818" b="7128" baseLine="7075" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="6941" r="1786" b="7085">Slav</wd>

<space/>

<wd l="1848" t="6946" r="2362" b="7085">Petrov</wd>

<space/>

<wd l="2429" t="6941" r="2712" b="7085">and</wd>

<space/>

<wd l="2770" t="6946" r="3187" b="7128">Ryan</wd>

<space/>

<wd l="3250" t="6941" r="4142" b="7085">McDonald.</wd>

<space/>

<wd l="4258" t="6941" r="4690" b="7085">2012.</wd>

<space/>

<wd l="4810" t="6941" r="5578" b="7085">Overview</wd>

<space/>

<wd l="5645" t="6941" r="5818" b="7085">of</wd>

<space/>

</ln>

<ln l="1656" t="7162" r="5813" b="7349" baseLine="7296">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="7162" r="1901" b="7306">the</wd>

<space/>

<wd l="1968" t="7162" r="2357" b="7306">2012</wd>

<space/>

<wd l="2424" t="7162" r="2976" b="7306">Shared</wd>

<space/>

<wd l="3034" t="7162" r="3408" b="7306">Task</wd>

<space/>

<wd l="3470" t="7205" r="3667" b="7306">on</wd>

<space/>

<wd l="3725" t="7162" r="4320" b="7349">Parsing</wd>

<space/>

<wd l="4382" t="7162" r="4622" b="7306">the</wd>

<space/>

<wd l="4685" t="7162" r="5083" b="7306">Web.</wd>

<space/>

<wd l="5203" t="7166" r="5371" b="7301">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5429" t="7166" r="5813" b="7306">First</wd>

<space/>

</run>

</ln>

<ln l="1666" t="7378" r="5808" b="7560" baseLine="7517" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1666" t="7378" r="2443" b="7560">Workshop</wd>

<space/>

<wd l="2525" t="7426" r="2717" b="7522">on</wd>

<space/>

<wd l="2794" t="7382" r="3523" b="7560">Syntactic</wd>

<space/>

<wd l="3586" t="7378" r="4272" b="7560">Analysis</wd>

<space/>

<wd l="4354" t="7378" r="4536" b="7560">of</wd>

<space/>

<wd l="4570" t="7378" r="5808" b="7522">Non-Canonical</wd>

<space/>

</ln>

<ln l="1651" t="7603" r="3269" b="7781" baseLine="7733">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="7603" r="2448" b="7781">Language</wd>

<space/>

</run>

<wd l="2506" t="7603" r="3269" b="7776"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(SANCL)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>

</run>

</ln>

</para>

<para l="1440" t="8006" r="5818" b="9072" alignment="justified" li="216" spaceBefore="186" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="8006" r="5798" b="8194" baseLine="8141" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="8011" r="1766" b="8150">Ines</wd>

<space/>

<wd l="1829" t="8006" r="2534" b="8150">Rehbein.</wd>

<space/>

<wd l="2650" t="8006" r="3082" b="8150">2013.</wd>

<space/>

<wd l="3197" t="8006" r="4214" b="8194">Fine-grained</wd>

<space/>

<wd l="4272" t="8050" r="4541" b="8189">pos</wd>

<space/>

<wd l="4608" t="8006" r="5203" b="8194">tagging</wd>

<space/>

<wd l="5270" t="8006" r="5438" b="8150">of</wd>

<space/>

<wd l="5491" t="8050" r="5798" b="8194">ger-</wd>

</ln>

<ln l="1656" t="8227" r="5798" b="8414" baseLine="8362" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="8270" r="1997" b="8371">man</wd>

<space/>

<wd l="2088" t="8246" r="2635" b="8371">tweets.</wd>

<space/>

<wd l="2832" t="8232" r="3000" b="8366">In</wd>

<space/>

<wd l="3086" t="8232" r="3509" b="8414">Iryna</wd>

<space/>

<wd l="3595" t="8227" r="4416" b="8414">Gurevych,</wd>

<space/>

<wd l="4522" t="8227" r="4944" b="8371">Chris</wd>

<space/>

<wd l="5035" t="8227" r="5798" b="8395">Biemann,</wd>

<space/>

</ln>

<ln l="1661" t="8443" r="5818" b="8611" baseLine="8582">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="8443" r="1949" b="8587">and</wd>

<space/>

<wd l="2011" t="8448" r="2602" b="8587">Torsten</wd>

<space/>

<wd l="2664" t="8443" r="3187" b="8611">Zesch,</wd>

<space/>

<wd l="3264" t="8443" r="3845" b="8611">editors,</wd>

<space/>

</run>

<wd l="3926" t="8448" r="4450" b="8611"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">GSCL</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4522" t="8443" r="5112" b="8587">volume</wd>

<space/>

<wd l="5189" t="8443" r="5568" b="8587">8105</wd>

<space/>

<wd l="5645" t="8443" r="5818" b="8587">of</wd>

<space/>

</run>

</ln>

<ln l="1651" t="8664" r="5794" b="8851" baseLine="8798">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1651" t="8669" r="2256" b="8808">Lecture</wd>

<space/>

<wd l="2299" t="8669" r="2760" b="8808">Notes</wd>

<space/>

<wd l="2818" t="8669" r="2957" b="8808">in</wd>

<space/>

<wd l="3019" t="8669" r="3816" b="8846">Computer</wd>

<space/>

</run>

<wd l="3854" t="8669" r="4502" b="8832"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Science</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="4560" t="8707" r="5006" b="8851">pages</wd>

<space/>

<wd l="5078" t="8664" r="5794" b="8808">162–175.</wd>

<space/>

</run>

</ln>

<ln l="1661" t="8885" r="2371" b="9072" baseLine="9019" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="8885" r="2371" b="9072">Springer.</wd>

</ln>

</para>

<para l="1440" t="9293" r="5803" b="10795" alignment="justified" li="216" spaceBefore="183" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="9293" r="5794" b="9461" baseLine="9427" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="9293" r="1824" b="9437">Alan</wd>

<space/>

<wd l="1910" t="9293" r="2395" b="9461">Ritter,</wd>

<space/>

<wd l="2496" t="9293" r="2851" b="9437">Sam</wd>

<space/>

<wd l="2933" t="9293" r="3413" b="9461">Clark,</wd>

<space/>

<wd l="3509" t="9298" r="4238" b="9461">Mausam,</wd>

<space/>

<wd l="4339" t="9293" r="4622" b="9437">and</wd>

<space/>

<wd l="4704" t="9293" r="5102" b="9437">Oren</wd>

<space/>

<wd l="5179" t="9293" r="5794" b="9437">Etzioni.</wd>

<space/>

</ln>

<ln l="1661" t="9509" r="5798" b="9696" baseLine="9648" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="9509" r="2093" b="9653">2011.</wd>

<space/>

<wd l="2232" t="9509" r="2808" b="9653">Named</wd>

<space/>

<wd l="2875" t="9509" r="3322" b="9696">entity</wd>

<space/>

<wd l="3394" t="9509" r="4301" b="9696">recognition</wd>

<space/>

<wd l="4363" t="9509" r="4522" b="9648">in</wd>

<space/>

<wd l="4584" t="9528" r="5131" b="9653">tweets:</wd>

<space/>

<wd l="5246" t="9514" r="5491" b="9648">An</wd>

<space/>

<wd l="5558" t="9552" r="5798" b="9653">ex-</wd>

</ln>

<ln l="1656" t="9730" r="5803" b="9917" baseLine="9864">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="9730" r="2506" b="9912">perimental</wd>

<space/>

<wd l="2573" t="9730" r="3024" b="9917">study.</wd>

<space/>

<wd l="3125" t="9734" r="3288" b="9869">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3346" t="9730" r="4330" b="9912">Proceedings</wd>

<space/>

<wd l="4392" t="9730" r="4570" b="9912">of</wd>

<space/>

<wd l="4598" t="9730" r="4838" b="9874">the</wd>

<space/>

<wd l="4906" t="9730" r="5803" b="9912">Conference</wd>

<space/>

</run>

</ln>

<ln l="1661" t="9950" r="5798" b="10133" baseLine="10085" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="9998" r="1853" b="10094">on</wd>

<space/>

<wd l="1944" t="9950" r="2746" b="10133">Empirical</wd>

<space/>

<wd l="2832" t="9950" r="3523" b="10094">Methods</wd>

<space/>

<wd l="3624" t="9955" r="3763" b="10094">in</wd>

<space/>

<wd l="3854" t="9950" r="4478" b="10094">Natural</wd>

<space/>

<wd l="4560" t="9955" r="5357" b="10133">Language</wd>

<space/>

<wd l="5448" t="9955" r="5798" b="10094">Pro-</wd>

</ln>

<ln l="1661" t="10166" r="5798" b="10354" baseLine="10306">

<wd l="1661" t="10171" r="2290" b="10349"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">cessing</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2386" t="10171" r="3062" b="10310">EMNLP</wd>

<space/>

<wd l="3158" t="10166" r="3456" b="10334">’11,</wd>

<space/>

<wd l="3552" t="10210" r="4003" b="10354">pages</wd>

<space/>

<wd l="4109" t="10166" r="5030" b="10334">1524–1534,</wd>

<space/>

<wd l="5136" t="10166" r="5798" b="10310">Strouds-</wd>

</run>

</ln>

<ln l="1656" t="10387" r="5798" b="10574" baseLine="10522" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="10387" r="2059" b="10574">burg,</wd>

<space/>

<wd l="2117" t="10392" r="2395" b="10555">PA,</wd>

<space/>

<wd l="2453" t="10387" r="2890" b="10531">USA.</wd>

<space/>

<wd l="2952" t="10387" r="3893" b="10531">Association</wd>

<space/>

<wd l="3946" t="10387" r="4176" b="10531">for</wd>

<space/>

<wd l="4234" t="10387" r="5410" b="10570">Computational</wd>

<space/>

<wd l="5462" t="10387" r="5798" b="10526">Lin-</wd>

</ln>

<ln l="1661" t="10608" r="2304" b="10795" baseLine="10742" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="10608" r="2304" b="10795">guistics.</wd>

</ln>

</para>

<para l="1445" t="11016" r="5808" b="11818" alignment="justified" li="216" spaceBefore="184" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1445" t="11016" r="5798" b="11203" baseLine="11150" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1445" t="11016" r="1920" b="11160">Kevin</wd>

<space/>

<wd l="1968" t="11021" r="2098" b="11160">P.</wd>

<space/>

<wd l="2165" t="11016" r="2885" b="11160">Scannell.</wd>

<space/>

<wd l="2986" t="11016" r="3418" b="11160">2003.</wd>

<space/>

<wd l="3509" t="11016" r="4349" b="11160">Automatic</wd>

<space/>

<wd l="4402" t="11016" r="5150" b="11160">thesaurus</wd>

<space/>

<wd l="5213" t="11059" r="5798" b="11203">genera-</wd>

</ln>

<ln l="1656" t="11237" r="5803" b="11424" baseLine="11371">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="11237" r="1968" b="11381">tion</wd>

<space/>

<wd l="2016" t="11237" r="2246" b="11381">for</wd>

<space/>

<wd l="2290" t="11237" r="2976" b="11424">minority</wd>

<space/>

<wd l="3024" t="11237" r="3859" b="11424">languages:</wd>

<space/>

<wd l="3941" t="11280" r="4118" b="11381">an</wd>

<space/>

<wd l="4166" t="11237" r="4536" b="11381">Irish</wd>

<space/>

<wd l="4584" t="11237" r="5290" b="11419">example.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5362" t="11242" r="5803" b="11381">Actes</wd>

<space/>

</run>

</ln>

<ln l="1656" t="11453" r="5808" b="11635" baseLine="11592">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="11453" r="1843" b="11597">de</wd>

<space/>

<wd l="1920" t="11453" r="2064" b="11597">la</wd>

<space/>

<wd l="2146" t="11453" r="2424" b="11597">10e</wd>

<space/>

<wd l="2496" t="11453" r="3355" b="11635">conférence</wd>

<space/>

<wd l="3437" t="11458" r="3989" b="11597">TALNa</wd>

<space/>

</run>

<wd l="4056" t="11458" r="5174" b="11621"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Batz-sur-Mer</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5256" t="11453" r="5808" b="11597">2:203–</wd>

<space/>

</run>

</ln>

<ln l="1661" t="11674" r="1997" b="11818" baseLine="11808" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="11674" r="1997" b="11818">212.</wd>

</ln>

</para>

<para l="1440" t="12082" r="5808" b="13147" alignment="justified" li="216" spaceBefore="188" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="1440" t="12082" r="5803" b="12269" baseLine="12216" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="12082" r="1968" b="12269">Djamé</wd>

<space/>

<wd l="2035" t="12082" r="2659" b="12250">Seddah,</wd>

<space/>

<wd l="2726" t="12082" r="3259" b="12226">Benoit</wd>

<space/>

<wd l="3322" t="12082" r="3816" b="12269">Sagot,</wd>

<space/>

<wd l="3883" t="12082" r="4354" b="12226">Marie</wd>

<space/>

<wd l="4421" t="12082" r="5088" b="12250">Candito,</wd>

<space/>

<wd l="5155" t="12082" r="5803" b="12269">Virginie</wd>

<space/>

</ln>

<ln l="1656" t="12302" r="5803" b="12470" baseLine="12437" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="12302" r="2597" b="12470">Mouilleron,</wd>

<space/>

<wd l="2731" t="12302" r="3014" b="12446">and</wd>

<space/>

<wd l="3120" t="12307" r="3763" b="12446">Vanessa</wd>

<space/>

<wd l="3869" t="12302" r="4536" b="12446">Combet.</wd>

<space/>

<wd l="4800" t="12302" r="5232" b="12446">2012.</wd>

<space/>

<wd l="5496" t="12302" r="5803" b="12446">The</wd>

<space/>

</ln>

<ln l="1656" t="12518" r="5803" b="12706" baseLine="12658" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="12518" r="2213" b="12662">French</wd>

<space/>

<wd l="2314" t="12518" r="2803" b="12662">Social</wd>

<space/>

<wd l="2904" t="12518" r="3418" b="12662">Media</wd>

<space/>

<wd l="3509" t="12518" r="3970" b="12662">Bank:</wd>

<space/>

<wd l="4147" t="12562" r="4234" b="12662">a</wd>

<space/>

<wd l="4330" t="12518" r="5016" b="12662">treebank</wd>

<space/>

<wd l="5117" t="12518" r="5285" b="12662">of</wd>

<space/>

<wd l="5376" t="12518" r="5803" b="12706">noisy</wd>

<space/>

</ln>

<ln l="1656" t="12739" r="5808" b="12926" baseLine="12874">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1656" t="12782" r="1992" b="12883">user</wd>

<space/>

<wd l="2050" t="12739" r="2822" b="12926">generated</wd>

<space/>

<wd l="2880" t="12758" r="3499" b="12883">content.</wd>

<space/>

<wd l="3600" t="12744" r="3768" b="12878">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3821" t="12739" r="4810" b="12922">Proceedings</wd>

<space/>

<wd l="4867" t="12739" r="5050" b="12922">of</wd>

<space/>

<wd l="5083" t="12744" r="5808" b="12883">COLING</wd>

<space/>

</run>

</ln>

<ln l="1656" t="12960" r="3595" b="13147" baseLine="13094">

<wd l="1656" t="12960" r="2098" b="13128"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">2012</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="2155" t="13003" r="2606" b="13147">pages</wd>

<space/>

<wd l="2664" t="12960" r="3595" b="13104">2441–2458.</wd>

</run>

</ln>

</para>

<para l="1440" t="13368" r="5808" b="15307" alignment="justified" li="216" spaceBefore="183" fli="-216" lsp="exactly" lspExact="219" language="en">

<ln l="1440" t="13368" r="5798" b="13555" baseLine="13502" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1440" t="13368" r="2059" b="13512">Thamar</wd>

<space/>

<wd l="2237" t="13368" r="2861" b="13536">Solorio,</wd>

<space/>

<wd l="3067" t="13368" r="3821" b="13512">Elizabeth</wd>

<space/>

<wd l="3989" t="13368" r="4426" b="13536">Blair,</wd>

<space/>

<wd l="4637" t="13368" r="5040" b="13555">Suraj</wd>

<space/>

<wd l="5222" t="13368" r="5798" b="13512">Mahar-</wd>

</ln>

<ln l="1642" t="13589" r="5808" b="13776" baseLine="13723" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1642" t="13589" r="1944" b="13776">jan,</wd>

<space/>

<wd l="2150" t="13589" r="2683" b="13733">Steven</wd>

<space/>

<wd l="2846" t="13589" r="3523" b="13757">Bethard,</wd>

<space/>

<wd l="3725" t="13594" r="4190" b="13733">Mona</wd>

<space/>

<wd l="4354" t="13589" r="4786" b="13757">Diab,</wd>

<space/>

<wd l="4987" t="13589" r="5808" b="13733">Mahmoud</wd>

<space/>

</ln>

<ln l="1661" t="13805" r="5798" b="13973" baseLine="13944" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="13805" r="2443" b="13973">Ghoneim,</wd>

<space/>

<wd l="2506" t="13805" r="3187" b="13949">Abdelati</wd>

<space/>

<wd l="3245" t="13805" r="4013" b="13973">Hawwari,</wd>

<space/>

<wd l="4075" t="13805" r="4560" b="13949">Fahad</wd>

<space/>

<wd l="4613" t="13805" r="5501" b="13973">AlGhamdi,</wd>

<space/>

<wd l="5563" t="13810" r="5798" b="13949">Ju-</wd>

</ln>

<ln l="1656" t="14026" r="5798" b="14213" baseLine="14160" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="14026" r="1862" b="14170">lia</wd>

<space/>

<wd l="1949" t="14026" r="2875" b="14213">Hirschberg,</wd>

<space/>

<wd l="2986" t="14026" r="3518" b="14170">Alison</wd>

<space/>

<wd l="3610" t="14026" r="4171" b="14213">Chang,</wd>

<space/>

<wd l="4286" t="14026" r="4570" b="14170">and</wd>

<space/>

<wd l="4661" t="14026" r="5251" b="14170">Pascale</wd>

<space/>

<wd l="5347" t="14030" r="5798" b="14213">Fung,</wd>

<space/>

</ln>

<ln l="1661" t="14242" r="5798" b="14424" baseLine="14381">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1661" t="14242" r="2093" b="14386">2014.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2227" t="14242" r="3211" b="14424">Proceedings</wd>

<space/>

<wd l="3283" t="14242" r="3461" b="14424">of</wd>

<space/>

<wd l="3499" t="14242" r="3739" b="14386">the</wd>

<space/>

<wd l="3802" t="14246" r="4186" b="14386">First</wd>

<space/>

<wd l="4253" t="14242" r="5030" b="14424">Workshop</wd>

<space/>

<wd l="5102" t="14290" r="5294" b="14386">on</wd>

<space/>

<wd l="5371" t="14246" r="5798" b="14386">Com-</wd>

</run>

</ln>

<ln l="1637" t="14462" r="5808" b="14645" baseLine="14602">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1637" t="14462" r="2482" b="14645">putational</wd>

<space/>

<wd l="2539" t="14462" r="3494" b="14645">Approaches</wd>

<space/>

<wd l="3576" t="14491" r="3725" b="14606">to</wd>

<space/>

<wd l="3816" t="14462" r="4224" b="14606">Code</wd>

<space/>

</run>

<wd l="4301" t="14462" r="5126" b="14645"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Switching</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="5222" t="14462" r="5808" b="14645">chapter</wd>

<space/>

</run>

</ln>

<ln l="1661" t="14683" r="5803" b="14870" baseLine="14818" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1661" t="14683" r="2434" b="14827">Overview</wd>

<space/>

<wd l="2525" t="14683" r="2755" b="14827">for</wd>

<space/>

<wd l="2846" t="14683" r="3086" b="14827">the</wd>

<space/>

<wd l="3178" t="14683" r="3542" b="14827">First</wd>

<space/>

<wd l="3634" t="14683" r="4186" b="14827">Shared</wd>

<space/>

<wd l="4272" t="14683" r="4646" b="14827">Task</wd>

<space/>

<wd l="4738" t="14726" r="4934" b="14827">on</wd>

<space/>

<wd l="5021" t="14688" r="5803" b="14870">Language</wd>

<space/>

</ln>

<ln l="1656" t="14899" r="5794" b="15086" baseLine="15038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="14899" r="2722" b="15043">Identification</wd>

<space/>

<wd l="2774" t="14899" r="2933" b="15038">in</wd>

<space/>

<wd l="2990" t="14899" r="4214" b="15043">Code-Switched</wd>

<space/>

<wd l="4267" t="14904" r="4685" b="15067">Data,</wd>

<space/>

<wd l="4747" t="14942" r="5198" b="15086">pages</wd>

<space/>

<wd l="5261" t="14899" r="5794" b="15043">62–72.</wd>

<space/>

</ln>

<ln l="1656" t="15120" r="5088" b="15307" baseLine="15259" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="1656" t="15120" r="2602" b="15264">Association</wd>

<space/>

<wd l="2650" t="15120" r="2880" b="15264">for</wd>

<space/>

<wd l="2938" t="15120" r="4114" b="15302">Computational</wd>

<space/>

<wd l="4166" t="15120" r="5088" b="15307">Linguistics.</wd>

</ln>

</para>

</column>

<column l="6142" t="1291" r="10524" b="5835">

<para l="6149" t="1334" r="10507" b="3278" alignment="justified" li="216" spaceBefore="7" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6149" t="1334" r="10502" b="1517" baseLine="1474" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6149" t="1334" r="6792" b="1478">Kristina</wd>

<space/>

<wd l="6859" t="1339" r="7733" b="1502">Toutanova,</wd>

<space/>

<wd l="7819" t="1339" r="8146" b="1478">Dan</wd>

<space/>

<wd l="8232" t="1334" r="8712" b="1502">Klein,</wd>

<space/>

<wd l="8803" t="1334" r="9739" b="1517">Christopher</wd>

<space/>

<wd l="9811" t="1339" r="9994" b="1478">D.</wd>

<space/>

<wd l="10080" t="1339" r="10502" b="1478">Man-</wd>

</ln>

<ln l="6365" t="1555" r="10502" b="1742" baseLine="1694" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6365" t="1555" r="6763" b="1742">ning,</wd>

<space/>

<wd l="6821" t="1555" r="7104" b="1699">and</wd>

<space/>

<wd l="7152" t="1560" r="7685" b="1699">Yoram</wd>

<space/>

<wd l="7733" t="1555" r="8275" b="1742">Singer.</wd>

<space/>

<wd l="8366" t="1555" r="8798" b="1699">2003.</wd>

<space/>

<wd l="8880" t="1555" r="9854" b="1699">Feature-rich</wd>

<space/>

<wd l="9902" t="1555" r="10502" b="1738">part-of-</wd>

</ln>

<ln l="6374" t="1776" r="10498" b="1963" baseLine="1910" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6374" t="1776" r="6907" b="1958">speech</wd>

<space/>

<wd l="6979" t="1776" r="7574" b="1963">tagging</wd>

<space/>

<wd l="7651" t="1776" r="8006" b="1920">with</wd>

<space/>

<wd l="8083" t="1819" r="8170" b="1920">a</wd>

<space/>

<wd l="8246" t="1776" r="8712" b="1963">cyclic</wd>

<space/>

<wd l="8794" t="1776" r="9734" b="1963">dependency</wd>

<space/>

<wd l="9811" t="1776" r="10498" b="1920">network.</wd>

<space/>

</ln>

<ln l="6365" t="1992" r="10507" b="2174" baseLine="2131">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6365" t="1997" r="6533" b="2131">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6581" t="1992" r="7570" b="2174">Proceedings</wd>

<space/>

<wd l="7627" t="1992" r="7810" b="2174">of</wd>

<space/>

<wd l="7834" t="1992" r="8074" b="2136">the</wd>

<space/>

<wd l="8126" t="1992" r="8520" b="2136">2003</wd>

<space/>

<wd l="8587" t="1992" r="9485" b="2174">Conference</wd>

<space/>

<wd l="9547" t="1992" r="9730" b="2174">of</wd>

<space/>

<wd l="9754" t="1992" r="9989" b="2136">the</wd>

<space/>

<wd l="10042" t="1992" r="10507" b="2136">North</wd>

<space/>

</run>

</ln>

<ln l="6350" t="2213" r="10502" b="2395" baseLine="2352" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6350" t="2218" r="7133" b="2357">American</wd>

<space/>

<wd l="7210" t="2213" r="7862" b="2395">Chapter</wd>

<space/>

<wd l="7915" t="2213" r="8098" b="2395">of</wd>

<space/>

<wd l="8131" t="2213" r="8366" b="2357">the</wd>

<space/>

<wd l="8414" t="2218" r="9355" b="2357">Association</wd>

<space/>

<wd l="9389" t="2213" r="9662" b="2395">for</wd>

<space/>

<wd l="9725" t="2218" r="10502" b="2395">Computa-</wd>

</ln>

<ln l="6370" t="2434" r="10507" b="2616" baseLine="2568" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6370" t="2434" r="6830" b="2578">tional</wd>

<space/>

<wd l="6888" t="2438" r="7766" b="2616">Linguistics</wd>

<space/>

<wd l="7838" t="2482" r="8030" b="2578">on</wd>

<space/>

<wd l="8093" t="2438" r="8678" b="2578">Human</wd>

<space/>

<wd l="8741" t="2438" r="9538" b="2616">Language</wd>

<space/>

<wd l="9614" t="2434" r="10507" b="2616">Technology</wd>

<space/>

</ln>

<ln l="6374" t="2650" r="10502" b="2837" baseLine="2789">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6374" t="2736" r="6422" b="2750">-</wd>

<space/>

<wd l="6514" t="2650" r="7080" b="2794">Volume</wd>

<space/>

</run>

<wd l="7162" t="2650" r="7291" b="2818"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">1</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">,</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><space/>

<wd l="7373" t="2650" r="8040" b="2794">NAACL</wd>

<space/>

<wd l="8126" t="2650" r="8419" b="2818">’03,</wd>

<space/>

<wd l="8496" t="2693" r="8942" b="2837">pages</wd>

<space/>

<wd l="9038" t="2650" r="9758" b="2818">173–180,</wd>

<space/>

<wd l="9840" t="2650" r="10502" b="2794">Strouds-</wd>

</run>

</ln>

<ln l="6365" t="2870" r="10502" b="3058" baseLine="3005" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6365" t="2870" r="6763" b="3058">burg,</wd>

<space/>

<wd l="6821" t="2875" r="7104" b="3038">PA,</wd>

<space/>

<wd l="7157" t="2870" r="7594" b="3014">USA.</wd>

<space/>

<wd l="7656" t="2870" r="8602" b="3014">Association</wd>

<space/>

<wd l="8650" t="2870" r="8885" b="3014">for</wd>

<space/>

<wd l="8938" t="2870" r="10114" b="3053">Computational</wd>

<space/>

<wd l="10166" t="2870" r="10502" b="3010">Lin-</wd>

</ln>

<ln l="6370" t="3091" r="7013" b="3278" baseLine="3226" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6370" t="3091" r="7013" b="3278">guistics.</wd>

</ln>

</para>

<para l="6144" t="3490" r="10517" b="4762" alignment="justified" li="216" spaceBefore="173" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="3490" r="10498" b="3634" baseLine="3624" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6144" t="3490" r="6653" b="3634">Elaine</wd>

<space/>

<wd l="6701" t="3490" r="6907" b="3634">Uí</wd>

<space/>

<wd l="6946" t="3490" r="8054" b="3634">Dhonnchadha</wd>

<space/>

<wd l="8102" t="3490" r="8386" b="3634">and</wd>

<space/>

<wd l="8429" t="3490" r="8846" b="3634">Josef</wd>

<space/>

<wd l="8880" t="3533" r="9163" b="3634">van</wd>

<space/>

<wd l="9216" t="3490" r="9979" b="3634">Genabith.</wd>

<space/>

<wd l="10066" t="3490" r="10498" b="3634">2006.</wd>

<space/>

</ln>

<ln l="6365" t="3706" r="10507" b="3893" baseLine="3845" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6365" t="3710" r="6509" b="3845">A</wd>

<space/>

<wd l="6590" t="3706" r="7742" b="3888">part-of-speech</wd>

<space/>

<wd l="7819" t="3725" r="8318" b="3893">tagger</wd>

<space/>

<wd l="8400" t="3706" r="8630" b="3850">for</wd>

<space/>

<wd l="8712" t="3706" r="9077" b="3850">Irish</wd>

<space/>

<wd l="9158" t="3706" r="9586" b="3893">using</wd>

<space/>

<wd l="9677" t="3706" r="10507" b="3850">finite-state</wd>

<space/>

</ln>

<ln l="6365" t="3926" r="10502" b="4114" baseLine="4066" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6365" t="3926" r="7334" b="4114">morphology</wd>

<space/>

<wd l="7440" t="3926" r="7723" b="4070">and</wd>

<space/>

<wd l="7829" t="3926" r="8611" b="4070">constraint</wd>

<space/>

<wd l="8712" t="3970" r="9427" b="4114">grammar</wd>

<space/>

<wd l="9533" t="3926" r="10502" b="4114">disambigua-</wd>

</ln>

<ln l="6365" t="4147" r="10502" b="4330" baseLine="4282">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="6365" t="4147" r="6710" b="4291">tion.</wd>

<space/>

<wd l="6797" t="4152" r="6965" b="4286">In</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><wd l="7003" t="4147" r="7987" b="4330">Proceedings</wd>

<space/>

<wd l="8035" t="4147" r="8218" b="4330">of</wd>

<space/>

<wd l="8232" t="4147" r="8467" b="4291">the</wd>

<space/>

<wd l="8510" t="4147" r="8760" b="4291">5th</wd>

<space/>

<wd l="8798" t="4147" r="9859" b="4291">International</wd>

<space/>

<wd l="9902" t="4147" r="10502" b="4330">Confer-</wd>

</run>

</ln>

<ln l="6370" t="4363" r="10517" b="4546" baseLine="4502" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">

<wd l="6370" t="4411" r="6725" b="4507">ence</wd>

<space/>

<wd l="6778" t="4411" r="6965" b="4507">on</wd>

<space/>

<wd l="7008" t="4368" r="7805" b="4546">Language</wd>

<space/>

<wd l="7843" t="4368" r="8659" b="4507">Resources</wd>

<space/>

<wd l="8702" t="4363" r="9005" b="4507">and</wd>

<space/>

<wd l="9038" t="4363" r="9912" b="4507">Evaluation</wd>

<space/>

<wd l="9960" t="4368" r="10517" b="4541">(LREC</wd>

<space/>

</ln>

<ln l="6365" t="4584" r="6869" b="4762" baseLine="4718">

<wd l="6365" t="4584" r="6869" b="4762"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">2006)</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-1"><nl orig="true"/>

</run>

</ln>

</para>

<para l="6144" t="4982" r="10507" b="5827" alignment="justified" li="216" spaceBefore="176" spaceAfter="5" fli="-216" lsp="exactly" lspExact="220" language="en">

<ln l="6144" t="4982" r="10502" b="5165" baseLine="5121">

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6144" t="4982" r="6653" b="5126">Elaine</wd>

<space/>

<wd l="6730" t="4982" r="6931" b="5126">Uí</wd>

<space/>

<wd l="6998" t="4982" r="8146" b="5126">Dhonnchadha.</wd>

<space/>

<wd l="8304" t="4982" r="8736" b="5126">2009.</wd>

<space/>

</run>

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="8894" t="4982" r="10080" b="5165">Part-of-Speech</wd>

<space/>

<wd l="10166" t="4987" r="10502" b="5165">Tag-</wd>

</run>

</ln>

<ln l="6365" t="5203" r="10507" b="5386" baseLine="5338" italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="5208" r="6715" b="5386">ging</wd>

<space/>

<wd l="6768" t="5203" r="7075" b="5347">and</wd>

<space/>

<wd l="7118" t="5203" r="7670" b="5347">Partial</wd>

<space/>

<wd l="7718" t="5208" r="8328" b="5386">Parsing</wd>

<space/>

<wd l="8352" t="5203" r="8626" b="5386">for</wd>

<space/>

<wd l="8664" t="5203" r="9043" b="5347">Irish</wd>

<space/>

<wd l="9101" t="5208" r="9523" b="5386">using</wd>

<space/>

<wd l="9581" t="5208" r="10507" b="5347">Finite-State</wd>

<space/>

</ln>

<ln l="6374" t="5419" r="10502" b="5587" baseLine="5558">

<run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6374" t="5419" r="7344" b="5563">Transducers</wd>

<space/>

<wd l="7382" t="5419" r="7690" b="5563">and</wd>

<space/>

<wd l="7728" t="5424" r="8578" b="5563">Constraint</wd>

<space/>

</run>

<wd l="8616" t="5424" r="9432" b="5563"><run italic="true" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Grammar</run>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>

</wd>

<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>

<wd l="9514" t="5419" r="9955" b="5563">Ph.D.</wd>

<space/>

<wd l="10008" t="5419" r="10502" b="5587">thesis,</wd>

<space/>

</run>

</ln>

<ln l="6365" t="5640" r="8218" b="5827" baseLine="5774" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">

<wd l="6365" t="5640" r="6917" b="5784">Dublin</wd>

<space/>

<wd l="6970" t="5640" r="7306" b="5827">City</wd>

<space/>

<wd l="7358" t="5640" r="8218" b="5827">University.</wd>

</ln>

</para>

</column>

</section>

<dd l="1440" t="15746" r="10524" b="15975">

<para l="5867" t="15792" r="6090" b="15946" alignment="centered" lsp="exactly" lspExact="223" language="en">

<ln l="5933" t="15792" r="6024" b="15946" baseLine="15936" underlined="none" subsuperscript="none" fontSize="950" fontFace="Tahoma" fontFamily="swiss" fontPitch="variable" spacing="0">

<wd l="5933" t="15792" r="6024" b="15946">8</wd>

</ln>

</para>

</dd>

</body>

</page>

</document>

