<?xml version="1.0" encoding="UTF-16"?>
<!--XML document generated using OCR technology from Nuance Communications, Inc.-->
<document xmlns="http://www.scansoft.com/omnipage/xml/ssdoc-schema3.xsd" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance">
<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">
<description>
<source file="pdf\L08-1001.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>
<theoreticalPage size="A4" marginLeft="1042" marginTop="1440" marginRight="1105" marginBottom="1008" offsetX="38" width="11918" height="16854"/>
<language>en</language>
</description>
<body>
<section l="1042" t="1720" r="10804" b="2302">
<column l="1042" t="1720" r="10804" b="2302">
<para l="1925" t="1800" r="9917" b="2059" alignment="centered" spaceBefore="19" spaceAfter="217" lsp="exactly" lspExact="333" language="en">
<ln l="1925" t="1800" r="9917" b="2059" baseLine="1997" underlined="none" subsuperscript="none" fontSize="1550" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="18">
<wd l="1925" t="1800" r="3821" b="2059">Unsupervised</wd>
<space/>
<wd l="3946" t="1800" r="5117" b="2006">Relation</wd>
<space/>
<wd l="5242" t="1800" r="6720" b="2006">Extraction</wd>
<space/>
<wd l="6845" t="1800" r="7493" b="2006">from</wd>
<space/>
<wd l="7608" t="1800" r="8227" b="2006">Web</wd>
<space/>
<wd l="8352" t="1805" r="9917" b="2006">Documents</wd>
</ln>
</para>
</column>
</section>
<section l="1042" t="2302" r="10802" b="5270">
<column l="1042" t="2302" r="10802" b="5270">
<para l="2635" t="2371" r="9202" b="2587" alignment="centered" spaceBefore="17" lsp="exactly" lspExact="279" language="en">
<ln l="2635" t="2371" r="9202" b="2587" baseLine="2534" underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="14">
<wd l="2635" t="2371" r="3552" b="2544">Kathrin</wd>
<space/>
<wd l="3653" t="2371" r="4526" b="2587">Eichler,</wd>
<space/>
<wd l="4637" t="2371" r="5506" b="2544">Holmer</wd>
<space/>
<wd l="5602" t="2371" r="6528" b="2544">Hemsen</wd>
<space/>
<wd l="6629" t="2371" r="7046" b="2544">and</wd>
<space/>
<wd l="7157" t="2371" r="7978" b="2544">Günter</wd>
<space/>
<wd l="8074" t="2371" r="9202" b="2544">Neumann</wd>
</ln>
</para>
<para l="2242" t="2861" r="9600" b="3307" alignment="centered" spaceBefore="237" lsp="exactly" lspExact="240" language="en">
<ln l="2242" t="2861" r="9600" b="3067" baseLine="3014" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0" forcedEOF="true">
<wd l="2242" t="2875" r="2741" b="3014">DFKI</wd>
<space/>
<wd l="2822" t="2870" r="3432" b="3053">GmbH,</wd>
<space/>
<wd l="3514" t="2875" r="4205" b="3053">LT-Lab,</wd>
<space/>
<wd l="4296" t="2870" r="6019" b="3058">Stuhlsatzenhausweg</wd>
<space/>
<wd l="6091" t="2880" r="6178" b="3019">3</wd>
<space/>
<wd l="6269" t="2861" r="7066" b="3067">(Building</wd>
<space/>
<wd l="7138" t="2875" r="7378" b="3019">D3</wd>
<space/>
<wd l="7459" t="2861" r="7670" b="3067">2),</wd>
<space/>
<wd l="7752" t="2875" r="8458" b="3019">D-66123</wd>
<space/>
<wd l="8539" t="2870" r="9600" b="3019">Saarbrücken</wd>
</ln>
<ln l="4416" t="3101" r="7430" b="3307" baseLine="3250" forcedEOF="true">
<wd l="4416" t="3101" r="7430" b="3307"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">{</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">FirstName.SecondName</run>
<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0">}</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">@dfki.de</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>
</run>
</ln>
</para>
<para l="5486" t="3422" r="6346" b="3566" alignment="centered" spaceBefore="62" lsp="exactly" lspExact="241" language="en">
<ln l="5486" t="3422" r="6346" b="3566" baseLine="3562" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">
<wd l="5486" t="3422" r="6346" b="3566">Abstract</wd>
</ln>
</para>
<para l="1042" t="3662" r="10795" b="4930" alignment="justified" spaceBefore="4" spaceAfter="320" lsp="exactly" lspExact="219" language="en">
<ln l="1046" t="3662" r="10795" b="3845" baseLine="3792" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="3672" r="1354" b="3802">The</wd>
<space/>
<wd l="1440" t="3672" r="1901" b="3797">IDEX</wd>
<space/>
<wd l="1982" t="3686" r="2530" b="3835">system</wd>
<space/>
<wd l="2606" t="3677" r="2722" b="3802">is</wd>
<space/>
<wd l="2808" t="3715" r="2894" b="3802">a</wd>
<space/>
<wd l="2971" t="3686" r="3744" b="3835">prototype</wd>
<space/>
<wd l="3830" t="3667" r="3984" b="3802">of</wd>
<space/>
<wd l="4051" t="3715" r="4238" b="3802">an</wd>
<space/>
<wd l="4320" t="3677" r="5155" b="3802">interactive</wd>
<space/>
<wd l="5242" t="3672" r="5909" b="3835">dynamic</wd>
<space/>
<wd l="5995" t="3667" r="6941" b="3802">Information</wd>
<space/>
<wd l="7018" t="3672" r="7872" b="3802">Extraction</wd>
<space/>
<wd l="7958" t="3662" r="8266" b="3845">(IE)</wd>
<space/>
<wd l="8362" t="3686" r="8942" b="3835">system.</wd>
<space/>
<wd l="9082" t="3667" r="9211" b="3797">A</wd>
<space/>
<wd l="9293" t="3715" r="9614" b="3802">user</wd>
<space/>
<wd l="9696" t="3667" r="9850" b="3802">of</wd>
<space/>
<wd l="9917" t="3672" r="10166" b="3802">the</wd>
<space/>
<wd l="10248" t="3686" r="10795" b="3835">system</wd>
<space/>
</ln>
<ln l="1046" t="3883" r="10790" b="4051" baseLine="4013" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="3931" r="1771" b="4051">expresses</wd>
<space/>
<wd l="1843" t="3931" r="2030" b="4018">an</wd>
<space/>
<wd l="2098" t="3883" r="3029" b="4018">information</wd>
<space/>
<wd l="3096" t="3902" r="3662" b="4051">request</wd>
<space/>
<wd l="3739" t="3893" r="3883" b="4013">in</wd>
<space/>
<wd l="3946" t="3888" r="4195" b="4018">the</wd>
<space/>
<wd l="4267" t="3883" r="4637" b="4018">form</wd>
<space/>
<wd l="4704" t="3883" r="4858" b="4018">of</wd>
<space/>
<wd l="4910" t="3931" r="4997" b="4018">a</wd>
<space/>
<wd l="5059" t="3893" r="5453" b="4051">topic</wd>
<space/>
<wd l="5525" t="3888" r="6437" b="4051">description,</wd>
<space/>
<wd l="6514" t="3888" r="6974" b="4018">which</wd>
<space/>
<wd l="7042" t="3893" r="7157" b="4018">is</wd>
<space/>
<wd l="7229" t="3888" r="7579" b="4018">used</wd>
<space/>
<wd l="7646" t="3883" r="7858" b="4018">for</wd>
<space/>
<wd l="7930" t="3931" r="8117" b="4018">an</wd>
<space/>
<wd l="8184" t="3888" r="8645" b="4018">initial</wd>
<space/>
<wd l="8717" t="3888" r="9206" b="4018">search</wd>
<space/>
<wd l="9274" t="3893" r="9422" b="4013">in</wd>
<space/>
<wd l="9490" t="3888" r="9898" b="4018">order</wd>
<space/>
<wd l="9965" t="3902" r="10128" b="4018">to</wd>
<space/>
<wd l="10195" t="3893" r="10790" b="4018">retrieve</wd>
<space/>
</ln>
<ln l="1046" t="4104" r="10795" b="4272" baseLine="4229" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="4152" r="1133" b="4238">a</wd>
<space/>
<wd l="1200" t="4109" r="1819" b="4238">relevant</wd>
<space/>
<wd l="1891" t="4123" r="2102" b="4238">set</wd>
<space/>
<wd l="2174" t="4104" r="2328" b="4238">of</wd>
<space/>
<wd l="2381" t="4109" r="3274" b="4238">documents.</wd>
<space/>
<wd l="3379" t="4104" r="3614" b="4238">On</wd>
<space/>
<wd l="3677" t="4109" r="4056" b="4238">basis</wd>
<space/>
<wd l="4128" t="4104" r="4282" b="4238">of</wd>
<space/>
<wd l="4325" t="4109" r="4618" b="4238">this</wd>
<space/>
<wd l="4690" t="4123" r="4901" b="4238">set</wd>
<space/>
<wd l="4973" t="4104" r="5126" b="4238">of</wd>
<space/>
<wd l="5179" t="4109" r="6072" b="4272">documents,</wd>
<space/>
<wd l="6149" t="4109" r="7186" b="4272">unsupervised</wd>
<space/>
<wd l="7253" t="4109" r="7858" b="4238">relation</wd>
<space/>
<wd l="7925" t="4114" r="8731" b="4238">extraction</wd>
<space/>
<wd l="8794" t="4109" r="9086" b="4238">and</wd>
<space/>
<wd l="9149" t="4109" r="9922" b="4272">clustering</wd>
<space/>
<wd l="9989" t="4114" r="10099" b="4238">is</wd>
<space/>
<wd l="10166" t="4109" r="10536" b="4238">done</wd>
<space/>
<wd l="10603" t="4109" r="10795" b="4272">by</wd>
<space/>
</ln>
<ln l="1042" t="4325" r="10790" b="4493" baseLine="4450" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1042" t="4330" r="1296" b="4459">the</wd>
<space/>
<wd l="1363" t="4344" r="1944" b="4493">system.</wd>
<space/>
<wd l="2045" t="4330" r="2352" b="4459">The</wd>
<space/>
<wd l="2419" t="4330" r="2933" b="4459">results</wd>
<space/>
<wd l="3005" t="4325" r="3158" b="4459">of</wd>
<space/>
<wd l="3206" t="4330" r="3610" b="4459">these</wd>
<space/>
<wd l="3682" t="4334" r="4502" b="4493">operations</wd>
<space/>
<wd l="4574" t="4373" r="4843" b="4459">can</wd>
<space/>
<wd l="4906" t="4330" r="5261" b="4459">then</wd>
<space/>
<wd l="5328" t="4330" r="5506" b="4459">be</wd>
<space/>
<wd l="5573" t="4330" r="6562" b="4493">interactively</wd>
<space/>
<wd l="6624" t="4330" r="7373" b="4493">inspected</wd>
<space/>
<wd l="7435" t="4330" r="7627" b="4493">by</wd>
<space/>
<wd l="7685" t="4330" r="7934" b="4459">the</wd>
<space/>
<wd l="8006" t="4373" r="8366" b="4459">user.</wd>
<space/>
<wd l="8467" t="4330" r="8630" b="4454">In</wd>
<space/>
<wd l="8688" t="4330" r="8981" b="4459">this</wd>
<space/>
<wd l="9048" t="4373" r="9494" b="4493">paper</wd>
<space/>
<wd l="9562" t="4373" r="9763" b="4459">we</wd>
<space/>
<wd l="9835" t="4330" r="10474" b="4459">describe</wd>
<space/>
<wd l="10541" t="4330" r="10790" b="4459">the</wd>
<space/>
</ln>
<ln l="1046" t="4541" r="10790" b="4709" baseLine="4670" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="4546" r="1656" b="4675">relation</wd>
<space/>
<wd l="1714" t="4550" r="2520" b="4675">extraction</wd>
<space/>
<wd l="2573" t="4546" r="2866" b="4675">and</wd>
<space/>
<wd l="2918" t="4546" r="3691" b="4709">clustering</wd>
<space/>
<wd l="3749" t="4560" r="4690" b="4709">components</wd>
<space/>
<wd l="4747" t="4541" r="4906" b="4675">of</wd>
<space/>
<wd l="4944" t="4546" r="5194" b="4675">the</wd>
<space/>
<wd l="5251" t="4546" r="5712" b="4670">IDEX</wd>
<space/>
<wd l="5770" t="4560" r="6355" b="4709">system.</wd>
<space/>
<wd l="6451" t="4546" r="7392" b="4709">Preliminary</wd>
<space/>
<wd l="7450" t="4546" r="8266" b="4675">evaluation</wd>
<space/>
<wd l="8323" t="4546" r="8837" b="4675">results</wd>
<space/>
<wd l="8894" t="4541" r="9048" b="4675">of</wd>
<space/>
<wd l="9086" t="4546" r="9494" b="4675">these</wd>
<space/>
<wd l="9552" t="4560" r="10493" b="4709">components</wd>
<space/>
<wd l="10555" t="4589" r="10790" b="4675">are</wd>
<space/>
</ln>
<ln l="1046" t="4762" r="10704" b="4930" baseLine="4886" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="4766" r="1805" b="4930">presented</wd>
<space/>
<wd l="1858" t="4766" r="2146" b="4896">and</wd>
<space/>
<wd l="2198" t="4810" r="2386" b="4896">an</wd>
<space/>
<wd l="2438" t="4771" r="3125" b="4896">overview</wd>
<space/>
<wd l="3178" t="4771" r="3293" b="4896">is</wd>
<space/>
<wd l="3346" t="4771" r="3758" b="4930">given</wd>
<space/>
<wd l="3811" t="4762" r="3965" b="4896">of</wd>
<space/>
<wd l="4003" t="4766" r="4622" b="4930">possible</wd>
<space/>
<wd l="4680" t="4766" r="5789" b="4896">enhancements</wd>
<space/>
<wd l="5842" t="4781" r="6005" b="4896">to</wd>
<space/>
<wd l="6053" t="4771" r="6682" b="4930">improve</wd>
<space/>
<wd l="6734" t="4766" r="6984" b="4896">the</wd>
<space/>
<wd l="7037" t="4766" r="7646" b="4896">relation</wd>
<space/>
<wd l="7699" t="4771" r="8506" b="4896">extraction</wd>
<space/>
<wd l="8554" t="4766" r="8846" b="4896">and</wd>
<space/>
<wd l="8894" t="4766" r="9667" b="4930">clustering</wd>
<space/>
<wd l="9720" t="4781" r="10704" b="4930">components.</wd>
</ln>
</para>
</column>
</section>
<section l="1042" t="5270" r="10804" b="15830">
<column l="1042" t="5270" r="5755" b="15830">
<para l="2434" t="5270" r="4363" b="5443" alignment="centered" lsp="exactly" lspExact="228" language="en">
<ln l="2434" t="5270" r="4363" b="5443" baseLine="5434" underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="23">
<wd l="2434" t="5280" r="2606" b="5438">1.</wd>
<space/>
<wd l="2894" t="5270" r="4363" b="5443">Introduction</wd>
</ln>
</para>
<para l="1042" t="5597" r="5750" b="9619" alignment="justified" spaceBefore="51" lsp="exactly" lspExact="239" language="en">
<ln l="1046" t="5597" r="5731" b="5803" baseLine="5750" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="5606" r="2074" b="5755">Information</wd>
<space/>
<wd l="2136" t="5616" r="3010" b="5755">extraction</wd>
<space/>
<wd l="3086" t="5597" r="3408" b="5803">(IE)</wd>
<space/>
<wd l="3490" t="5611" r="4162" b="5755">involves</wd>
<space/>
<wd l="4224" t="5611" r="4502" b="5755">the</wd>
<space/>
<wd l="4565" t="5659" r="5179" b="5794">process</wd>
<space/>
<wd l="5251" t="5606" r="5419" b="5755">of</wd>
<space/>
<wd l="5467" t="5659" r="5731" b="5755">au-</wd>
</ln>
<ln l="1042" t="5846" r="5750" b="6034" baseLine="5986" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="5851" r="2021" b="6034">tomatically</wd>
<space/>
<wd l="2083" t="5846" r="3005" b="6034">identifying</wd>
<space/>
<wd l="3067" t="5856" r="3840" b="5995">instances</wd>
<space/>
<wd l="3912" t="5846" r="4075" b="5995">of</wd>
<space/>
<wd l="4128" t="5856" r="4723" b="5995">certain</wd>
<space/>
<wd l="4786" t="5851" r="5515" b="5995">relations</wd>
<space/>
<wd l="5582" t="5846" r="5750" b="5995">of</wd>
<space/>
</ln>
<ln l="1046" t="6077" r="5731" b="6283" baseLine="6226">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5"><wd l="1046" t="6096" r="1733" b="6269">interest,</wd>
<space/>
<wd l="1829" t="6139" r="2165" b="6274">e.g.,</wd>
<space/>
</run>
<wd l="2261" t="6077" r="4152" b="6283"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">produce(</run>
<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="5">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">company</run>
<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="5">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">,</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5"><space/>
</run>
<wd l="4258" t="6091" r="5275" b="6274"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="5">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">product</run>
<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="5">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">,</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5"><space/>
</run>
<wd l="5381" t="6091" r="5731" b="6240"><run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="5">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">lo-</run>
</wd>
</ln>
<ln l="1046" t="6317" r="5731" b="6523" baseLine="6466">
<wd l="1046" t="6317" r="1848" b="6523"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">cation</run>
<run underlined="none" subsuperscript="none" fontSize="1200" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="5">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">),</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5"><space/>
<wd l="1963" t="6336" r="2126" b="6470">in</wd>
<space/>
<wd l="2222" t="6379" r="2650" b="6475">some</wd>
<space/>
<wd l="2746" t="6331" r="3581" b="6475">document</wd>
<space/>
<wd l="3691" t="6331" r="4502" b="6475">collection</wd>
<space/>
<wd l="4598" t="6331" r="4910" b="6475">and</wd>
<space/>
<wd l="5006" t="6331" r="5280" b="6475">the</wd>
<space/>
<wd l="5381" t="6379" r="5731" b="6475">con-</wd>
</run>
</ln>
<ln l="1046" t="6562" r="5741" b="6710" baseLine="6706" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="6571" r="1819" b="6710">struction</wd>
<space/>
<wd l="1910" t="6562" r="2078" b="6710">of</wd>
<space/>
<wd l="2160" t="6614" r="2256" b="6710">a</wd>
<space/>
<wd l="2347" t="6566" r="3106" b="6710">database</wd>
<space/>
<wd l="3192" t="6566" r="3581" b="6710">with</wd>
<space/>
<wd l="3672" t="6562" r="4680" b="6710">information</wd>
<space/>
<wd l="4771" t="6566" r="5261" b="6710">about</wd>
<space/>
<wd l="5362" t="6566" r="5741" b="6710">each</wd>
<space/>
</ln>
<ln l="1046" t="6792" r="5731" b="6998" baseLine="6946" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="6806" r="1910" b="6950">individual</wd>
<space/>
<wd l="2006" t="6811" r="2707" b="6950">instance</wd>
<space/>
<wd l="2818" t="6792" r="3216" b="6998">(e.g.,</wd>
<space/>
<wd l="3326" t="6806" r="3600" b="6950">the</wd>
<space/>
<wd l="3696" t="6811" r="4718" b="6989">participants</wd>
<space/>
<wd l="4819" t="6802" r="4987" b="6950">of</wd>
<space/>
<wd l="5069" t="6854" r="5165" b="6950">a</wd>
<space/>
<wd l="5256" t="6821" r="5731" b="6950">meet-</wd>
</ln>
<ln l="1046" t="7032" r="5741" b="7238" baseLine="7181" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="7051" r="1354" b="7229">ing,</wd>
<space/>
<wd l="1435" t="7046" r="1709" b="7190">the</wd>
<space/>
<wd l="1790" t="7046" r="2155" b="7190">date</wd>
<space/>
<wd l="2237" t="7046" r="2544" b="7190">and</wd>
<space/>
<wd l="2621" t="7051" r="3010" b="7190">time</wd>
<space/>
<wd l="3086" t="7042" r="3254" b="7190">of</wd>
<space/>
<wd l="3312" t="7046" r="3586" b="7190">the</wd>
<space/>
<wd l="3662" t="7032" r="4459" b="7238">meeting).</wd>
<space/>
<wd l="4589" t="7042" r="5448" b="7229">Currently,</wd>
<space/>
<wd l="5539" t="7046" r="5741" b="7186">IE</wd>
<space/>
</ln>
<ln l="1046" t="7286" r="5741" b="7469" baseLine="7421" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="7301" r="1709" b="7469">systems</wd>
<space/>
<wd l="1810" t="7334" r="2069" b="7430">are</wd>
<space/>
<wd l="2170" t="7286" r="2779" b="7469">usually</wd>
<space/>
<wd l="2875" t="7286" r="4464" b="7469">domain-dependent</wd>
<space/>
<wd l="4570" t="7286" r="4882" b="7430">and</wd>
<space/>
<wd l="4982" t="7286" r="5741" b="7469">adapting</wd>
<space/>
</ln>
<ln l="1042" t="7526" r="5731" b="7709" baseLine="7661" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="7526" r="1315" b="7670">the</wd>
<space/>
<wd l="1406" t="7541" r="1992" b="7709">system</wd>
<space/>
<wd l="2078" t="7541" r="2251" b="7670">to</wd>
<space/>
<wd l="2347" t="7574" r="2443" b="7670">a</wd>
<space/>
<wd l="2530" t="7574" r="2866" b="7670">new</wd>
<space/>
<wd l="2952" t="7526" r="3590" b="7670">domain</wd>
<space/>
<wd l="3677" t="7531" r="4349" b="7709">requires</wd>
<space/>
<wd l="4445" t="7574" r="4541" b="7670">a</wd>
<space/>
<wd l="4627" t="7526" r="4997" b="7709">high</wd>
<space/>
<wd l="5088" t="7541" r="5731" b="7670">amount</wd>
<space/>
</ln>
<ln l="1046" t="7757" r="5731" b="7944" baseLine="7901" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="7757" r="1214" b="7906">of</wd>
<space/>
<wd l="1291" t="7762" r="1920" b="7906">manual</wd>
<space/>
<wd l="2006" t="7762" r="2602" b="7939">labour,</wd>
<space/>
<wd l="2702" t="7762" r="3082" b="7906">such</wd>
<space/>
<wd l="3168" t="7810" r="3336" b="7906">as</wd>
<space/>
<wd l="3427" t="7757" r="4282" b="7944">specifying</wd>
<space/>
<wd l="4363" t="7762" r="4675" b="7906">and</wd>
<space/>
<wd l="4766" t="7762" r="5731" b="7944">implement-</wd>
</ln>
<ln l="1046" t="7987" r="5722" b="8194" baseLine="8141" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="8006" r="1310" b="8184">ing</wd>
<space/>
<wd l="1387" t="7997" r="2770" b="8184">relation–specific</wd>
<space/>
<wd l="2846" t="8006" r="3725" b="8146">extraction</wd>
<space/>
<wd l="3802" t="8016" r="4512" b="8184">patterns</wd>
<space/>
<wd l="4594" t="8002" r="5386" b="8184">manually</wd>
<space/>
<wd l="5477" t="7987" r="5722" b="8194">(cf.</wd>
<space/>
</ln>
<ln l="1046" t="8227" r="5731" b="8434" baseLine="8376" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="8242" r="1368" b="8424">Fig.</wd>
<space/>
<wd l="1488" t="8227" r="1632" b="8434">1)</wd>
<space/>
<wd l="1747" t="8290" r="1920" b="8386">or</wd>
<space/>
<wd l="2016" t="8246" r="2952" b="8424">annotating</wd>
<space/>
<wd l="3043" t="8242" r="3461" b="8424">large</wd>
<space/>
<wd l="3557" t="8256" r="4282" b="8386">amounts</wd>
<space/>
<wd l="4382" t="8237" r="4550" b="8386">of</wd>
<space/>
<wd l="4632" t="8246" r="5318" b="8424">training</wd>
<space/>
<wd l="5414" t="8290" r="5731" b="8386">cor-</wd>
</ln>
<ln l="1046" t="8467" r="5736" b="8674" baseLine="8616" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="8530" r="1435" b="8664">pora</wd>
<space/>
<wd l="1526" t="8467" r="1771" b="8674">(cf.</wd>
<space/>
<wd l="1867" t="8482" r="2184" b="8664">Fig.</wd>
<space/>
<wd l="2285" t="8467" r="2491" b="8674">2).</wd>
<space/>
<wd l="2616" t="8482" r="3120" b="8626">These</wd>
<space/>
<wd l="3197" t="8482" r="4205" b="8664">adaptations</wd>
<space/>
<wd l="4291" t="8482" r="4675" b="8626">have</wd>
<space/>
<wd l="4752" t="8496" r="4925" b="8626">to</wd>
<space/>
<wd l="5002" t="8482" r="5203" b="8626">be</wd>
<space/>
<wd l="5280" t="8482" r="5736" b="8626">made</wd>
<space/>
</ln>
<ln l="1046" t="8717" r="5741" b="8904" baseLine="8856" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="8717" r="1608" b="8899">offline,</wd>
<space/>
<wd l="1723" t="8726" r="2016" b="8899">i.e.,</wd>
<space/>
<wd l="2131" t="8717" r="2654" b="8866">before</wd>
<space/>
<wd l="2750" t="8722" r="3024" b="8866">the</wd>
<space/>
<wd l="3125" t="8717" r="3744" b="8904">specific</wd>
<space/>
<wd l="3840" t="8722" r="4042" b="8861">IE</wd>
<space/>
<wd l="4142" t="8736" r="4728" b="8904">system</wd>
<space/>
<wd l="4829" t="8726" r="4949" b="8866">is</wd>
<space/>
<wd l="5054" t="8722" r="5741" b="8904">actually</wd>
<space/>
</ln>
<ln l="1046" t="8957" r="5741" b="9144" baseLine="9096" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="8962" r="1546" b="9106">made.</wd>
<space/>
<wd l="1704" t="8957" r="2890" b="9144">Consequently,</wd>
<space/>
<wd l="2990" t="8976" r="3600" b="9106">current</wd>
<space/>
<wd l="3696" t="8962" r="3898" b="9101">IE</wd>
<space/>
<wd l="3979" t="8962" r="4910" b="9144">technology</wd>
<space/>
<wd l="4997" t="8966" r="5117" b="9106">is</wd>
<space/>
<wd l="5208" t="8962" r="5741" b="9144">highly</wd>
<space/>
</ln>
<ln l="1046" t="9192" r="5731" b="9379" baseLine="9336" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="9197" r="1670" b="9341">statical</wd>
<space/>
<wd l="1738" t="9197" r="2050" b="9341">and</wd>
<space/>
<wd l="2117" t="9192" r="2890" b="9341">inflexible</wd>
<space/>
<wd l="2952" t="9197" r="3341" b="9341">with</wd>
<space/>
<wd l="3403" t="9211" r="4003" b="9379">respect</wd>
<space/>
<wd l="4075" t="9211" r="4248" b="9341">to</wd>
<space/>
<wd l="4315" t="9245" r="4411" b="9341">a</wd>
<space/>
<wd l="4469" t="9197" r="5016" b="9379">timely</wd>
<space/>
<wd l="5083" t="9197" r="5731" b="9379">adapta-</wd>
</ln>
<ln l="1042" t="9432" r="5520" b="9619" baseLine="9576" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="9442" r="1387" b="9581">tion</wd>
<space/>
<wd l="1454" t="9451" r="1627" b="9581">to</wd>
<space/>
<wd l="1699" t="9485" r="2040" b="9581">new</wd>
<space/>
<wd l="2112" t="9442" r="3216" b="9619">requirements</wd>
<space/>
<wd l="3293" t="9442" r="3456" b="9576">in</wd>
<space/>
<wd l="3523" t="9437" r="3797" b="9581">the</wd>
<space/>
<wd l="3869" t="9432" r="4267" b="9581">form</wd>
<space/>
<wd l="4339" t="9432" r="4507" b="9581">of</wd>
<space/>
<wd l="4565" t="9485" r="4906" b="9581">new</wd>
<space/>
<wd l="4973" t="9442" r="5520" b="9619">topics.</wd>
</ln>
</para>
<picture l="3336" t="9998" r="4363" b="10138" alignment="left" li="2294" ri="1392" spaceBefore="369">
</picture>
<picture l="1502" t="10238" r="1834" b="10570" alignment="left" li="460" ri="3921" spaceBefore="100">
</picture>
<rulerline l="3898" t="10627" r="4354" b="10627" type="double" width="10" color="000000"/>
<picture l="3149" t="11054" r="4704" b="12235" alignment="left" ri="1051" spaceBefore="484" spaceAfter="354">
</picture>
<rulerline l="3898" t="12600" r="4488" b="12600" type="double" width="19" color="000000"/>
<picture l="3600" t="12941" r="5323" b="13253" alignment="left" li="2558" ri="432" spaceBefore="74" spaceAfter="493">
</picture>
<para l="1046" t="13795" r="5741" b="14630" alignment="justified" spaceBefore="15" lsp="exactly" lspExact="219" language="en">
<ln l="1046" t="13795" r="5731" b="13982" baseLine="13930">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7"><wd l="1046" t="13795" r="1603" b="13978">Figure</wd>
<space/>
<wd l="1694" t="13800" r="1814" b="13934">1:</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7"><wd l="1944" t="13805" r="2074" b="13934">A</wd>
<space/>
<wd l="2150" t="13810" r="3067" b="13939">hand-coded</wd>
<space/>
<wd l="3139" t="13810" r="3984" b="13939">rule–based</wd>
<space/>
<wd l="4061" t="13810" r="4886" b="13973">IE–system</wd>
<space/>
<wd l="4973" t="13800" r="5731" b="13982">(schemat-</wd>
</run>
</ln>
<ln l="1046" t="14021" r="5736" b="14203" baseLine="14150" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1046" t="14021" r="1579" b="14203">ically):</wd>
<space/>
<wd l="1694" t="14026" r="1824" b="14155">A</wd>
<space/>
<wd l="1896" t="14035" r="2290" b="14194">topic</wd>
<space/>
<wd l="2366" t="14045" r="2866" b="14194">expert</wd>
<space/>
<wd l="2947" t="14030" r="3854" b="14194">implements</wd>
<space/>
<wd l="3936" t="14030" r="4666" b="14194">manually</wd>
<space/>
<wd l="4738" t="14026" r="5736" b="14194">task–specific</wd>
<space/>
</ln>
<ln l="1046" t="14242" r="5741" b="14410" baseLine="14371" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1046" t="14251" r="1853" b="14376">extraction</wd>
<space/>
<wd l="1939" t="14246" r="2309" b="14376">rules</wd>
<space/>
<wd l="2400" t="14290" r="2587" b="14376">on</wd>
<space/>
<wd l="2669" t="14246" r="2923" b="14376">the</wd>
<space/>
<wd l="3010" t="14246" r="3394" b="14376">basis</wd>
<space/>
<wd l="3480" t="14242" r="3634" b="14376">of</wd>
<space/>
<wd l="3710" t="14246" r="3955" b="14376">her</wd>
<space/>
<wd l="4046" t="14246" r="4627" b="14376">manual</wd>
<space/>
<wd l="4714" t="14246" r="5333" b="14410">analysis</wd>
<space/>
<wd l="5424" t="14242" r="5578" b="14376">of</wd>
<space/>
<wd l="5654" t="14290" r="5741" b="14376">a</wd>
<space/>
</ln>
<ln l="1046" t="14472" r="2789" b="14630" baseLine="14587" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1046" t="14472" r="2160" b="14630">representative</wd>
<space/>
<wd l="2232" t="14510" r="2789" b="14630">corpus.</wd>
</ln>
</para>
<para l="1056" t="15110" r="2501" b="15293" alignment="left" spaceBefore="423" lsp="exactly" lspExact="241" language="en">
<ln l="1056" t="15110" r="2501" b="15293" baseLine="15245" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="16">
<wd l="1056" t="15115" r="1382" b="15250">1.1.</wd>
<space/>
<wd l="1637" t="15110" r="2016" b="15254">Our</wd>
<space/>
<wd l="2102" t="15110" r="2501" b="15293">goal</wd>
</ln>
</para>
<para l="1046" t="15398" r="5741" b="15826" alignment="justified" spaceBefore="49" lsp="exactly" lspExact="237" language="en">
<ln l="1046" t="15398" r="5731" b="15586" baseLine="15542" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="15403" r="1382" b="15547">The</wd>
<space/>
<wd l="1459" t="15403" r="1805" b="15586">goal</wd>
<space/>
<wd l="1882" t="15398" r="2050" b="15547">of</wd>
<space/>
<wd l="2112" t="15451" r="2395" b="15547">our</wd>
<space/>
<wd l="2472" t="15403" r="2674" b="15542">IE</wd>
<space/>
<wd l="2746" t="15403" r="3446" b="15547">research</wd>
<space/>
<wd l="3518" t="15408" r="3643" b="15547">is</wd>
<space/>
<wd l="3720" t="15403" r="3994" b="15547">the</wd>
<space/>
<wd l="4070" t="15408" r="4992" b="15586">conception</wd>
<space/>
<wd l="5069" t="15403" r="5381" b="15547">and</wd>
<space/>
<wd l="5458" t="15408" r="5731" b="15542">im-</wd>
</ln>
<ln l="1046" t="15638" r="5741" b="15826" baseLine="15782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="15643" r="2174" b="15826">plementation</wd>
<space/>
<wd l="2256" t="15638" r="2424" b="15787">of</wd>
<space/>
<wd l="2491" t="15691" r="2842" b="15787">core</wd>
<space/>
<wd l="2923" t="15643" r="3125" b="15782">IE</wd>
<space/>
<wd l="3202" t="15643" r="4128" b="15826">technology</wd>
<space/>
<wd l="4205" t="15658" r="4378" b="15787">to</wd>
<space/>
<wd l="4459" t="15643" r="5146" b="15826">produce</wd>
<space/>
<wd l="5227" t="15691" r="5323" b="15787">a</wd>
<space/>
<wd l="5400" t="15691" r="5741" b="15787">new</wd>
</ln>
</para>
</column>
<column l="6091" t="5270" r="10804" b="15830">
<picture l="6600" t="5563" r="8366" b="6989" alignment="left" li="509" spaceBefore="293" spaceAfter="1305">
</picture>
<picture l="8832" t="8294" r="10416" b="8606" alignment="left" li="2741" ri="388" spaceAfter="519">
</picture>
<para l="6096" t="9173" r="10795" b="10450" alignment="justified" lsp="exactly" lspExact="221" language="en">
<ln l="6101" t="9173" r="10790" b="9360" baseLine="9312">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7"><wd l="6101" t="9173" r="6658" b="9355">Figure</wd>
<space/>
<wd l="6725" t="9178" r="6850" b="9312">2:</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7"><wd l="6955" t="9182" r="7085" b="9312">A</wd>
<space/>
<wd l="7142" t="9187" r="8237" b="9317">data–oriented</wd>
<space/>
<wd l="8294" t="9187" r="8477" b="9312">IE</wd>
<space/>
<wd l="8534" t="9202" r="9082" b="9350">system</wd>
<space/>
<wd l="9144" t="9178" r="10387" b="9360">(schematically):</wd>
<space/>
<wd l="10483" t="9187" r="10790" b="9317">The</wd>
<space/>
</run>
</ln>
<ln l="6096" t="9403" r="10795" b="9571" baseLine="9528" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="6096" t="9403" r="7094" b="9571">task–specific</wd>
<space/>
<wd l="7152" t="9413" r="7958" b="9538">extraction</wd>
<space/>
<wd l="8011" t="9408" r="8381" b="9538">rules</wd>
<space/>
<wd l="8438" t="9451" r="8674" b="9538">are</wd>
<space/>
<wd l="8731" t="9408" r="9826" b="9571">automatically</wd>
<space/>
<wd l="9878" t="9408" r="10550" b="9571">acquired</wd>
<space/>
<wd l="10603" t="9408" r="10795" b="9571">by</wd>
<space/>
</ln>
<ln l="6101" t="9624" r="10795" b="9792" baseLine="9749" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="6101" t="9672" r="6595" b="9758">means</wd>
<space/>
<wd l="6691" t="9624" r="6850" b="9758">of</wd>
<space/>
<wd l="6931" t="9629" r="7594" b="9758">Machine</wd>
<space/>
<wd l="7694" t="9629" r="8400" b="9792">Learning</wd>
<space/>
<wd l="8491" t="9629" r="9374" b="9792">algorithms,</wd>
<space/>
<wd l="9485" t="9629" r="9950" b="9758">which</wd>
<space/>
<wd l="10042" t="9672" r="10282" b="9758">are</wd>
<space/>
<wd l="10378" t="9634" r="10795" b="9792">using</wd>
<space/>
</ln>
<ln l="6101" t="9840" r="10786" b="10008" baseLine="9970" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="6101" t="9888" r="6187" b="9974">a</wd>
<space/>
<wd l="6274" t="9840" r="7128" b="10008">sufficiently</wd>
<space/>
<wd l="7210" t="9845" r="7589" b="10008">large</wd>
<space/>
<wd l="7675" t="9845" r="8242" b="10008">enough</wd>
<space/>
<wd l="8328" t="9888" r="8837" b="10008">corpus</wd>
<space/>
<wd l="8928" t="9840" r="9082" b="9974">of</wd>
<space/>
<wd l="9149" t="9845" r="10262" b="10008">topic–relevant</wd>
<space/>
<wd l="10354" t="9845" r="10786" b="9974">docu-</wd>
</ln>
<ln l="6101" t="10066" r="10795" b="10229" baseLine="10186" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="6101" t="10080" r="6614" b="10195">ments.</wd>
<space/>
<wd l="6758" t="10066" r="7219" b="10195">These</wd>
<space/>
<wd l="7306" t="10066" r="8155" b="10195">documents</wd>
<space/>
<wd l="8242" t="10066" r="8597" b="10195">have</wd>
<space/>
<wd l="8678" t="10080" r="8842" b="10195">to</wd>
<space/>
<wd l="8923" t="10066" r="9101" b="10195">be</wd>
<space/>
<wd l="9187" t="10066" r="9878" b="10195">collected</wd>
<space/>
<wd l="9960" t="10066" r="10248" b="10195">and</wd>
<space/>
<wd l="10334" t="10066" r="10795" b="10229">costly</wd>
<space/>
</ln>
<ln l="6101" t="10286" r="8414" b="10450" baseLine="10406" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="6101" t="10286" r="6902" b="10416">annotated</wd>
<space/>
<wd l="6970" t="10286" r="7162" b="10450">by</wd>
<space/>
<wd l="7229" t="10330" r="7315" b="10416">a</wd>
<space/>
<wd l="7378" t="10286" r="8414" b="10450">topic–expert.</wd>
</ln>
</para>
<para l="6096" t="10882" r="10795" b="14894" alignment="justified" spaceBefore="363" lsp="exactly" lspExact="240" language="en">
<ln l="6101" t="10882" r="10790" b="11069" baseLine="11021" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="10886" r="6302" b="11026">IE</wd>
<space/>
<wd l="6389" t="10901" r="6974" b="11069">system</wd>
<space/>
<wd l="7066" t="10886" r="8246" b="11069">automatically</wd>
<space/>
<wd l="8333" t="10882" r="8563" b="11030">for</wd>
<space/>
<wd l="8650" t="10934" r="8746" b="11030">a</wd>
<space/>
<wd l="8832" t="10891" r="9278" b="11069">given</wd>
<space/>
<wd l="9360" t="10891" r="9830" b="11069">topic.</wd>
<space/>
<wd l="9979" t="10886" r="10421" b="11064">Here,</wd>
<space/>
<wd l="10517" t="10886" r="10790" b="11030">the</wd>
<space/>
</ln>
<ln l="6101" t="11122" r="10795" b="11309" baseLine="11261" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="11126" r="7368" b="11309">pre–knowledge</wd>
<space/>
<wd l="7445" t="11126" r="7934" b="11270">about</wd>
<space/>
<wd l="8011" t="11126" r="8285" b="11270">the</wd>
<space/>
<wd l="8362" t="11122" r="9370" b="11270">information</wd>
<space/>
<wd l="9446" t="11141" r="10056" b="11309">request</wd>
<space/>
<wd l="10142" t="11131" r="10262" b="11270">is</wd>
<space/>
<wd l="10344" t="11131" r="10795" b="11309">given</wd>
<space/>
</ln>
<ln l="6101" t="11352" r="10776" b="11558" baseLine="11501" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="11366" r="6307" b="11549">by</wd>
<space/>
<wd l="6389" t="11414" r="6485" b="11510">a</wd>
<space/>
<wd l="6562" t="11414" r="6912" b="11510">user</wd>
<space/>
<wd l="6989" t="11366" r="7502" b="11510">online</wd>
<space/>
<wd l="7579" t="11381" r="7752" b="11510">to</wd>
<space/>
<wd l="7829" t="11366" r="8102" b="11510">the</wd>
<space/>
<wd l="8184" t="11366" r="8386" b="11506">IE</wd>
<space/>
<wd l="8467" t="11414" r="8813" b="11510">core</wd>
<space/>
<wd l="8894" t="11381" r="9480" b="11549">system</wd>
<space/>
<wd l="9576" t="11352" r="10128" b="11558">(called</wd>
<space/>
<wd l="10214" t="11352" r="10776" b="11558">IDEX)</wd>
<space/>
</ln>
<ln l="6101" t="11587" r="10786" b="11794" baseLine="11741" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="11606" r="6264" b="11741">in</wd>
<space/>
<wd l="6350" t="11602" r="6629" b="11746">the</wd>
<space/>
<wd l="6725" t="11597" r="7118" b="11746">form</wd>
<space/>
<wd l="7219" t="11597" r="7382" b="11746">of</wd>
<space/>
<wd l="7469" t="11650" r="7565" b="11746">a</wd>
<space/>
<wd l="7651" t="11606" r="8083" b="11784">topic</wd>
<space/>
<wd l="8179" t="11602" r="9125" b="11784">description</wd>
<space/>
<wd l="9235" t="11587" r="9480" b="11794">(cf.</wd>
<space/>
<wd l="9590" t="11602" r="9907" b="11784">Fig.</wd>
<space/>
<wd l="10022" t="11587" r="10229" b="11794">3).</wd>
<space/>
<wd l="10411" t="11602" r="10786" b="11746">This</wd>
<space/>
</ln>
<ln l="6101" t="11837" r="10786" b="11986" baseLine="11981" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="11842" r="6605" b="11986">initial</wd>
<space/>
<wd l="6696" t="11837" r="7704" b="11986">information</wd>
<space/>
<wd l="7790" t="11890" r="8328" b="11986">source</wd>
<space/>
<wd l="8419" t="11846" r="8544" b="11986">is</wd>
<space/>
<wd l="8640" t="11842" r="9019" b="11986">used</wd>
<space/>
<wd l="9106" t="11856" r="9283" b="11986">to</wd>
<space/>
<wd l="9374" t="11846" r="10022" b="11986">retrieve</wd>
<space/>
<wd l="10114" t="11842" r="10786" b="11986">relevant</wd>
<space/>
</ln>
<ln l="6101" t="12082" r="10786" b="12226" baseLine="12216" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="12082" r="7022" b="12226">documents</wd>
<space/>
<wd l="7099" t="12082" r="7411" b="12226">and</wd>
<space/>
<wd l="7483" t="12096" r="8083" b="12226">extract</wd>
<space/>
<wd l="8165" t="12082" r="8477" b="12226">and</wd>
<space/>
<wd l="8554" t="12082" r="9125" b="12226">cluster</wd>
<space/>
<wd l="9197" t="12082" r="9926" b="12226">relations</wd>
<space/>
<wd l="10003" t="12086" r="10166" b="12221">in</wd>
<space/>
<wd l="10234" t="12130" r="10440" b="12226">an</wd>
<space/>
<wd l="10512" t="12130" r="10786" b="12226">un-</wd>
</ln>
<ln l="6101" t="12322" r="10786" b="12504" baseLine="12456" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="12322" r="7003" b="12504">supervised</wd>
<space/>
<wd l="7094" t="12370" r="7454" b="12504">way.</wd>
<space/>
<wd l="7627" t="12322" r="7805" b="12461">In</wd>
<space/>
<wd l="7891" t="12322" r="8208" b="12466">this</wd>
<space/>
<wd l="8304" t="12370" r="8669" b="12504">way,</wd>
<space/>
<wd l="8779" t="12322" r="9278" b="12461">IDEX</wd>
<space/>
<wd l="9374" t="12326" r="9494" b="12466">is</wd>
<space/>
<wd l="9595" t="12322" r="9941" b="12466">able</wd>
<space/>
<wd l="10032" t="12336" r="10205" b="12466">to</wd>
<space/>
<wd l="10301" t="12322" r="10786" b="12504">adapt</wd>
<space/>
</ln>
<ln l="6101" t="12557" r="10786" b="12744" baseLine="12696" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="12562" r="6562" b="12706">much</wd>
<space/>
<wd l="6624" t="12562" r="7142" b="12706">better</wd>
<space/>
<wd l="7205" t="12576" r="7378" b="12706">to</wd>
<space/>
<wd l="7440" t="12562" r="7714" b="12706">the</wd>
<space/>
<wd l="7776" t="12562" r="8506" b="12744">dynamic</wd>
<space/>
<wd l="8568" t="12557" r="9576" b="12706">information</wd>
<space/>
<wd l="9638" t="12610" r="10142" b="12744">space,</wd>
<space/>
<wd l="10219" t="12566" r="10382" b="12701">in</wd>
<space/>
<wd l="10445" t="12610" r="10786" b="12744">par-</wd>
</ln>
<ln l="6096" t="12792" r="10786" b="12979" baseLine="12936" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="12797" r="6662" b="12941">ticular</wd>
<space/>
<wd l="6744" t="12797" r="7411" b="12941">because</wd>
<space/>
<wd l="7498" t="12845" r="7699" b="12941">no</wd>
<space/>
<wd l="7786" t="12792" r="8674" b="12979">predefined</wd>
<space/>
<wd l="8760" t="12811" r="9470" b="12979">patterns</wd>
<space/>
<wd l="9562" t="12792" r="9730" b="12941">of</wd>
<space/>
<wd l="9802" t="12797" r="10474" b="12941">relevant</wd>
<space/>
<wd l="10565" t="12845" r="10786" b="12941">re-</wd>
</ln>
<ln l="6101" t="13032" r="10790" b="13219" baseLine="13176" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13037" r="6667" b="13181">lations</wd>
<space/>
<wd l="6749" t="13037" r="7138" b="13181">have</wd>
<space/>
<wd l="7210" t="13051" r="7387" b="13181">to</wd>
<space/>
<wd l="7469" t="13037" r="7666" b="13181">be</wd>
<space/>
<wd l="7742" t="13032" r="8520" b="13219">specified,</wd>
<space/>
<wd l="8611" t="13037" r="8894" b="13181">but</wd>
<space/>
<wd l="8981" t="13037" r="9653" b="13181">relevant</wd>
<space/>
<wd l="9739" t="13051" r="10450" b="13219">patterns</wd>
<space/>
<wd l="10531" t="13085" r="10790" b="13181">are</wd>
<space/>
</ln>
<ln l="6101" t="13272" r="10781" b="13459" baseLine="13411" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13277" r="7066" b="13421">determined</wd>
<space/>
<wd l="7133" t="13277" r="7685" b="13421">online.</wd>
<space/>
<wd l="7800" t="13272" r="8131" b="13421">Our</wd>
<space/>
<wd l="8194" t="13291" r="8779" b="13459">system</wd>
<space/>
<wd l="8846" t="13282" r="9504" b="13421">consists</wd>
<space/>
<wd l="9571" t="13272" r="9739" b="13421">of</wd>
<space/>
<wd l="9792" t="13325" r="9888" b="13421">a</wd>
<space/>
<wd l="9946" t="13272" r="10781" b="13454">front-end,</wd>
<space/>
</ln>
<ln l="6096" t="13512" r="10786" b="13699" baseLine="13651" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="13517" r="6600" b="13661">which</wd>
<space/>
<wd l="6653" t="13517" r="7363" b="13699">provides</wd>
<space/>
<wd l="7416" t="13517" r="7690" b="13661">the</wd>
<space/>
<wd l="7747" t="13565" r="8098" b="13661">user</wd>
<space/>
<wd l="8146" t="13517" r="8534" b="13661">with</wd>
<space/>
<wd l="8587" t="13565" r="8683" b="13661">a</wd>
<space/>
<wd l="8736" t="13512" r="9101" b="13661">GUI</wd>
<space/>
<wd l="9158" t="13512" r="9394" b="13661">for</wd>
<space/>
<wd l="9446" t="13517" r="10517" b="13699">interactively</wd>
<space/>
<wd l="10565" t="13522" r="10786" b="13656">in-</wd>
</ln>
<ln l="6101" t="13752" r="10790" b="13939" baseLine="13891" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13762" r="6811" b="13939">specting</wd>
<space/>
<wd l="6878" t="13752" r="7886" b="13901">information</wd>
<space/>
<wd l="7958" t="13757" r="8760" b="13901">extracted</wd>
<space/>
<wd l="8832" t="13752" r="9230" b="13901">from</wd>
<space/>
<wd l="9298" t="13757" r="10387" b="13939">topic-related</wd>
<space/>
<wd l="10454" t="13757" r="10790" b="13901">web</wd>
<space/>
</ln>
<ln l="6101" t="13992" r="10786" b="14170" baseLine="14131" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13992" r="7070" b="14170">documents,</wd>
<space/>
<wd l="7171" t="13992" r="7483" b="14136">and</wd>
<space/>
<wd l="7574" t="14040" r="7670" b="14136">a</wd>
<space/>
<wd l="7757" t="13992" r="8568" b="14170">back-end,</wd>
<space/>
<wd l="8669" t="13992" r="9173" b="14136">which</wd>
<space/>
<wd l="9259" t="13997" r="9960" b="14136">contains</wd>
<space/>
<wd l="10046" t="13992" r="10325" b="14136">the</wd>
<space/>
<wd l="10411" t="13992" r="10786" b="14136">rela-</wd>
</ln>
<ln l="6096" t="14232" r="10786" b="14414" baseLine="14371" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="14237" r="6442" b="14376">tion</wd>
<space/>
<wd l="6514" t="14237" r="7392" b="14376">extraction</wd>
<space/>
<wd l="7464" t="14232" r="7776" b="14376">and</wd>
<space/>
<wd l="7858" t="14232" r="8698" b="14414">clustering</wd>
<space/>
<wd l="8770" t="14246" r="9754" b="14414">component.</wd>
<space/>
<wd l="9878" t="14232" r="10056" b="14371">In</wd>
<space/>
<wd l="10123" t="14232" r="10440" b="14376">this</wd>
<space/>
<wd l="10522" t="14280" r="10786" b="14414">pa-</wd>
</ln>
<ln l="6101" t="14472" r="10786" b="14654" baseLine="14606" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="14520" r="6422" b="14654">per,</wd>
<space/>
<wd l="6504" t="14520" r="6730" b="14616">we</wd>
<space/>
<wd l="6806" t="14472" r="7502" b="14616">describe</wd>
<space/>
<wd l="7570" t="14472" r="7843" b="14616">the</wd>
<space/>
<wd l="7920" t="14472" r="8683" b="14616">back-end</wd>
<space/>
<wd l="8765" t="14486" r="9701" b="14654">component</wd>
<space/>
<wd l="9782" t="14472" r="10094" b="14616">and</wd>
<space/>
<wd l="10171" t="14486" r="10786" b="14654">present</wd>
<space/>
</ln>
<ln l="6101" t="14712" r="8726" b="14894" baseLine="14846" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="14712" r="7099" b="14894">preliminary</wd>
<space/>
<wd l="7171" t="14712" r="8054" b="14856">evaluation</wd>
<space/>
<wd l="8126" t="14712" r="8726" b="14856">results.</wd>
</ln>
</para>
<para l="6110" t="15115" r="8808" b="15298" alignment="left" spaceBefore="170" lsp="exactly" lspExact="241" language="en">
<ln l="6110" t="15115" r="8808" b="15298" baseLine="15254" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="13">
<wd l="6110" t="15120" r="6437" b="15254">1.2.</wd>
<space/>
<wd l="6686" t="15115" r="7843" b="15298">Application</wd>
<space/>
<wd l="7925" t="15115" r="8808" b="15298">potential</wd>
</ln>
</para>
<para l="6096" t="15398" r="10790" b="15826" alignment="justified" spaceBefore="40" lsp="exactly" lspExact="237" language="en">
<ln l="6101" t="15398" r="10790" b="15586" baseLine="15542" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="6101" t="15403" r="6878" b="15581">However,</wd>
<space/>
<wd l="6994" t="15398" r="7517" b="15547">before</wd>
<space/>
<wd l="7618" t="15403" r="8088" b="15586">doing</wd>
<space/>
<wd l="8184" t="15451" r="8352" b="15547">so</wd>
<space/>
<wd l="8448" t="15451" r="8674" b="15547">we</wd>
<space/>
<wd l="8770" t="15403" r="9278" b="15547">would</wd>
<space/>
<wd l="9379" t="15403" r="9672" b="15547">like</wd>
<space/>
<wd l="9768" t="15418" r="9941" b="15547">to</wd>
<space/>
<wd l="10042" t="15408" r="10790" b="15547">motivate</wd>
<space/>
</ln>
<ln l="6096" t="15638" r="10786" b="15826" baseLine="15782">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6096" t="15643" r="6370" b="15787">the</wd>
<space/>
<wd l="6446" t="15643" r="7402" b="15826">application</wd>
<space/>
<wd l="7478" t="15643" r="8242" b="15826">potential</wd>
<space/>
<wd l="8318" t="15643" r="8630" b="15787">and</wd>
<space/>
<wd l="8707" t="15648" r="9288" b="15826">impact</wd>
<space/>
<wd l="9374" t="15638" r="9538" b="15787">of</wd>
<space/>
<wd l="9595" t="15643" r="9869" b="15787">the</wd>
<space/>
<wd l="9946" t="15643" r="10450" b="15782">IDEX</wd>
<space/>
<wd l="10522" t="15691" r="10786" b="15826">ap-</wd>
</run>
<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>
</run>
</ln>
</para>
</column>
</section>
<rulerline l="4349" t="10138" r="4349" b="10622" type="double" width="14" color="7f7f7f"/>
<rulerline l="4358" t="10138" r="4358" b="10632" type="single" width="5" color="bfbfbf"/>
<rulerline l="2635" t="10037" r="3336" b="10037" type="double" width="10" color="000000"/>
<rulerline l="1886" t="10354" r="2630" b="10354" type="double" width="14" color="000000"/>
<rulerline l="1666" t="10570" r="1666" b="11770" type="single" width="19" color="000000"/>
<rulerline l="1666" t="10570" r="1666" b="11155" type="double" width="19" color="bfbfbf"/>
<rulerline l="1670" t="11146" r="1670" b="11770" type="double" width="19" color="9f9f9f"/>
<dd l="1042" t="11827" r="1728" b="11914" topDistance="1257" rightDistance="1421" bottomDistance="953">
<picture l="1138" t="11827" r="1728" b="11914" alignment="left" li="96">
</picture>
</dd>
<dd l="8582" t="5539" r="10138" b="7944" leftDistance="216" topDistance="529" rightDistance="666" bottomDistance="278">
<picture l="8582" t="5539" r="10138" b="7944" alignment="left">
</picture>
</dd>
<rulerline l="3893" t="10622" r="3893" b="11054" type="double" width="14" color="bfbfbf"/>
</body>
</page>
<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">
<description>
<source file="pdf\L08-1001.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>
<theoreticalPage size="A4" marginLeft="1041" marginTop="1347" marginRight="1099" marginBottom="1003" offsetX="32" offsetY="16" width="11918" height="16854"/>
<language>en</language>
</description>
<body>
<section l="1041" t="1347" r="10810" b="15835">
<column l="1041" t="1347" r="5755" b="15835">
<picture l="1550" t="1848" r="4858" b="4536" alignment="left" li="509" ri="897" spaceBefore="501" spaceAfter="735">
</picture>
<para l="1042" t="5318" r="5741" b="8347" alignment="justified" spaceBefore="3" lsp="exactly" lspExact="220" language="en">
<ln l="1046" t="5318" r="5726" b="5506" baseLine="5458">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5"><wd l="1046" t="5318" r="1603" b="5501">Figure</wd>
<space/>
<wd l="1680" t="5323" r="1814" b="5462">3:</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5"><wd l="1934" t="5333" r="2242" b="5462">The</wd>
<space/>
<wd l="2318" t="5333" r="2990" b="5496">dynamic</wd>
<space/>
<wd l="3067" t="5333" r="3245" b="5458">IE</wd>
<space/>
<wd l="3322" t="5347" r="3869" b="5496">system</wd>
<space/>
<wd l="3941" t="5333" r="4402" b="5458">IDEX</wd>
<space/>
<wd l="4483" t="5323" r="5726" b="5506">(schematically):</wd>
<space/>
</run>
</ln>
<ln l="1046" t="5549" r="5741" b="5717" baseLine="5674" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="5597" r="1133" b="5683">a</wd>
<space/>
<wd l="1219" t="5597" r="1541" b="5683">user</wd>
<space/>
<wd l="1632" t="5549" r="1786" b="5683">of</wd>
<space/>
<wd l="1858" t="5554" r="2107" b="5683">the</wd>
<space/>
<wd l="2198" t="5554" r="2659" b="5678">IDEX</wd>
<space/>
<wd l="2750" t="5554" r="2933" b="5678">IE</wd>
<space/>
<wd l="3024" t="5568" r="3566" b="5717">system</wd>
<space/>
<wd l="3653" t="5597" r="4378" b="5717">expresses</wd>
<space/>
<wd l="4469" t="5554" r="4718" b="5683">her</wd>
<space/>
<wd l="4810" t="5549" r="5741" b="5683">information</wd>
<space/>
</ln>
<ln l="1046" t="5770" r="5736" b="5938" baseLine="5894" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="5789" r="1613" b="5938">request</wd>
<space/>
<wd l="1685" t="5779" r="1834" b="5899">in</wd>
<space/>
<wd l="1891" t="5774" r="2146" b="5904">the</wd>
<space/>
<wd l="2213" t="5770" r="2582" b="5904">form</wd>
<space/>
<wd l="2645" t="5770" r="2798" b="5904">of</wd>
<space/>
<wd l="2851" t="5818" r="2938" b="5904">a</wd>
<space/>
<wd l="3000" t="5779" r="3394" b="5938">topic</wd>
<space/>
<wd l="3461" t="5774" r="4334" b="5938">description</wd>
<space/>
<wd l="4397" t="5774" r="4858" b="5904">which</wd>
<space/>
<wd l="4925" t="5779" r="5040" b="5904">is</wd>
<space/>
<wd l="5107" t="5774" r="5458" b="5904">used</wd>
<space/>
<wd l="5525" t="5770" r="5736" b="5904">for</wd>
<space/>
</ln>
<ln l="1046" t="5986" r="5731" b="6120" baseLine="6115" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="6034" r="1234" b="6120">an</wd>
<space/>
<wd l="1310" t="5990" r="1771" b="6120">initial</wd>
<space/>
<wd l="1848" t="5990" r="2342" b="6120">search</wd>
<space/>
<wd l="2414" t="5995" r="2563" b="6115">in</wd>
<space/>
<wd l="2635" t="5990" r="3048" b="6120">order</wd>
<space/>
<wd l="3120" t="6005" r="3283" b="6120">to</wd>
<space/>
<wd l="3355" t="5995" r="3950" b="6120">retrieve</wd>
<space/>
<wd l="4027" t="6034" r="4114" b="6120">a</wd>
<space/>
<wd l="4190" t="5990" r="4810" b="6120">relevant</wd>
<space/>
<wd l="4891" t="6005" r="5102" b="6120">set</wd>
<space/>
<wd l="5184" t="5986" r="5342" b="6120">of</wd>
<space/>
<wd l="5405" t="5990" r="5731" b="6120">doc-</wd>
</ln>
<ln l="1046" t="6206" r="5736" b="6374" baseLine="6331" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="6226" r="1661" b="6341">uments.</wd>
<space/>
<wd l="1790" t="6211" r="2208" b="6341">From</wd>
<space/>
<wd l="2280" t="6211" r="2573" b="6341">this</wd>
<space/>
<wd l="2654" t="6226" r="2866" b="6341">set</wd>
<space/>
<wd l="2952" t="6206" r="3106" b="6341">of</wd>
<space/>
<wd l="3173" t="6211" r="4066" b="6374">documents,</wd>
<space/>
<wd l="4152" t="6211" r="4402" b="6341">the</wd>
<space/>
<wd l="4483" t="6226" r="5026" b="6374">system</wd>
<space/>
<wd l="5102" t="6226" r="5736" b="6341">extracts</wd>
<space/>
</ln>
<ln l="1046" t="6422" r="5731" b="6605" baseLine="6552" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="6432" r="1339" b="6562">and</wd>
<space/>
<wd l="1402" t="6432" r="1978" b="6562">collects</wd>
<space/>
<wd l="2054" t="6422" r="2534" b="6605">(using</wd>
<space/>
<wd l="2592" t="6432" r="2842" b="6562">the</wd>
<space/>
<wd l="2914" t="6432" r="3091" b="6557">IE</wd>
<space/>
<wd l="3163" t="6475" r="3480" b="6562">core</wd>
<space/>
<wd l="3547" t="6446" r="4493" b="6595">components</wd>
<space/>
<wd l="4560" t="6427" r="4714" b="6562">of</wd>
<space/>
<wd l="4766" t="6422" r="5290" b="6605">IDEX)</wd>
<space/>
<wd l="5366" t="6475" r="5453" b="6562">a</wd>
<space/>
<wd l="5520" t="6446" r="5731" b="6562">set</wd>
<space/>
</ln>
<ln l="1046" t="6643" r="5736" b="6811" baseLine="6773" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="6643" r="1200" b="6778">of</wd>
<space/>
<wd l="1258" t="6648" r="1723" b="6778">tables</wd>
<space/>
<wd l="1800" t="6643" r="1954" b="6778">of</wd>
<space/>
<wd l="2016" t="6653" r="2731" b="6778">instances</wd>
<space/>
<wd l="2808" t="6643" r="2966" b="6778">of</wd>
<space/>
<wd l="3024" t="6648" r="3662" b="6811">possibly</wd>
<space/>
<wd l="3739" t="6648" r="4358" b="6778">relevant</wd>
<space/>
<wd l="4440" t="6648" r="5160" b="6778">relations.</wd>
<space/>
<wd l="5275" t="6648" r="5736" b="6778">These</wd>
<space/>
</ln>
<ln l="1042" t="6859" r="5736" b="7042" baseLine="6989" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="6869" r="1507" b="6998">tables</wd>
<space/>
<wd l="1579" t="6912" r="1814" b="6998">are</wd>
<space/>
<wd l="1886" t="6869" r="2645" b="7032">presented</wd>
<space/>
<wd l="2702" t="6883" r="2866" b="6998">to</wd>
<space/>
<wd l="2928" t="6869" r="3178" b="6998">the</wd>
<space/>
<wd l="3250" t="6912" r="3566" b="6998">user</wd>
<space/>
<wd l="3648" t="6859" r="4032" b="7042">(who</wd>
<space/>
<wd l="4094" t="6874" r="4210" b="6998">is</wd>
<space/>
<wd l="4282" t="6869" r="4949" b="6998">assumed</wd>
<space/>
<wd l="5011" t="6883" r="5174" b="6998">to</wd>
<space/>
<wd l="5242" t="6869" r="5419" b="6998">be</wd>
<space/>
<wd l="5486" t="6869" r="5736" b="6998">the</wd>
<space/>
</ln>
<ln l="1042" t="7075" r="5731" b="7262" baseLine="7210" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="7075" r="2155" b="7262">topic–expert),</wd>
<space/>
<wd l="2227" t="7090" r="2554" b="7219">who</wd>
<space/>
<wd l="2611" t="7090" r="2894" b="7219">will</wd>
<space/>
<wd l="2957" t="7090" r="3538" b="7253">analyse</wd>
<space/>
<wd l="3595" t="7090" r="3845" b="7219">the</wd>
<space/>
<wd l="3912" t="7090" r="4267" b="7219">data</wd>
<space/>
<wd l="4325" t="7085" r="4877" b="7219">further</wd>
<space/>
<wd l="4939" t="7085" r="5150" b="7219">for</wd>
<space/>
<wd l="5218" t="7090" r="5462" b="7219">her</wd>
<space/>
<wd l="5530" t="7094" r="5731" b="7214">in-</wd>
</ln>
<ln l="1046" t="7301" r="5736" b="7469" baseLine="7430" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="7301" r="1824" b="7435">formation</wd>
<space/>
<wd l="1877" t="7306" r="2563" b="7435">research.</wd>
<space/>
<wd l="2659" t="7306" r="2966" b="7435">The</wd>
<space/>
<wd l="3019" t="7306" r="3475" b="7435">whole</wd>
<space/>
<wd l="3533" t="7306" r="3715" b="7430">IE</wd>
<space/>
<wd l="3773" t="7349" r="4344" b="7469">process</wd>
<space/>
<wd l="4402" t="7310" r="4517" b="7435">is</wd>
<space/>
<wd l="4574" t="7306" r="5285" b="7469">dynamic,</wd>
<space/>
<wd l="5357" t="7310" r="5736" b="7435">since</wd>
<space/>
</ln>
<ln l="1046" t="7522" r="5726" b="7690" baseLine="7646" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="7570" r="1238" b="7656">no</wd>
<space/>
<wd l="1291" t="7522" r="1762" b="7656">offline</wd>
<space/>
<wd l="1819" t="7526" r="2170" b="7656">data</wd>
<space/>
<wd l="2227" t="7531" r="2338" b="7656">is</wd>
<space/>
<wd l="2395" t="7526" r="3091" b="7690">required,</wd>
<space/>
<wd l="3158" t="7526" r="3451" b="7656">and</wd>
<space/>
<wd l="3499" t="7526" r="3749" b="7656">the</wd>
<space/>
<wd l="3811" t="7526" r="3989" b="7651">IE</wd>
<space/>
<wd l="4051" t="7570" r="4618" b="7690">process</wd>
<space/>
<wd l="4675" t="7531" r="4790" b="7656">is</wd>
<space/>
<wd l="4848" t="7531" r="5726" b="7690">interactive,</wd>
<space/>
</ln>
<ln l="1046" t="7742" r="5731" b="7910" baseLine="7867" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="7752" r="1426" b="7877">since</wd>
<space/>
<wd l="1498" t="7747" r="1747" b="7877">the</wd>
<space/>
<wd l="1814" t="7752" r="2208" b="7910">topic</wd>
<space/>
<wd l="2285" t="7762" r="2779" b="7910">expert</wd>
<space/>
<wd l="2861" t="7752" r="2971" b="7877">is</wd>
<space/>
<wd l="3048" t="7747" r="3365" b="7877">able</wd>
<space/>
<wd l="3432" t="7762" r="3595" b="7877">to</wd>
<space/>
<wd l="3662" t="7742" r="4205" b="7910">specify</wd>
<space/>
<wd l="4277" t="7790" r="4584" b="7877">new</wd>
<space/>
<wd l="4651" t="7752" r="5045" b="7910">topic</wd>
<space/>
<wd l="5122" t="7747" r="5731" b="7910">descrip-</wd>
</ln>
<ln l="1042" t="7963" r="5736" b="8126" baseLine="8088" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="7968" r="1469" b="8126">tions,</wd>
<space/>
<wd l="1541" t="7963" r="2002" b="8093">which</wd>
<space/>
<wd l="2064" t="8006" r="2635" b="8126">express</wd>
<space/>
<wd l="2698" t="7963" r="2947" b="8093">her</wd>
<space/>
<wd l="3010" t="8006" r="3317" b="8093">new</wd>
<space/>
<wd l="3379" t="7968" r="4104" b="8093">attention</wd>
<space/>
<wd l="4162" t="7963" r="4877" b="8126">triggered</wd>
<space/>
<wd l="4934" t="7963" r="5126" b="8126">by</wd>
<space/>
<wd l="5184" t="8006" r="5270" b="8093">a</wd>
<space/>
<wd l="5333" t="7963" r="5736" b="8093">novel</wd>
<space/>
</ln>
<ln l="1046" t="8179" r="4704" b="8347" baseLine="8304" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="8184" r="1978" b="8347">relationship</wd>
<space/>
<wd l="2050" t="8184" r="2299" b="8314">she</wd>
<space/>
<wd l="2366" t="8227" r="2650" b="8314">was</wd>
<space/>
<wd l="2722" t="8198" r="2976" b="8314">not</wd>
<space/>
<wd l="3053" t="8227" r="3504" b="8314">aware</wd>
<space/>
<wd l="3571" t="8179" r="3730" b="8314">of</wd>
<space/>
<wd l="3782" t="8179" r="4704" b="8314">beforehand.</wd>
</ln>
</para>
<para l="1042" t="8904" r="5750" b="15787" alignment="justified" spaceBefore="483" spaceAfter="28" lsp="exactly" lspExact="240" language="en">
<ln l="1046" t="8904" r="5736" b="9091" baseLine="9048" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="8909" r="1622" b="9091">proach</wd>
<space/>
<wd l="1699" t="8909" r="1906" b="9091">by</wd>
<space/>
<wd l="1978" t="8957" r="2184" b="9053">an</wd>
<space/>
<wd l="2256" t="8909" r="2966" b="9091">example</wd>
<space/>
<wd l="3038" t="8909" r="4037" b="9091">application.</wd>
<space/>
<wd l="4162" t="8904" r="4958" b="9086">Consider,</wd>
<space/>
<wd l="5045" t="8957" r="5381" b="9091">e.g.,</wd>
<space/>
<wd l="5462" t="8909" r="5736" b="9053">the</wd>
<space/>
</ln>
<ln l="1046" t="9144" r="5736" b="9331" baseLine="9288" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="9197" r="1397" b="9293">case</wd>
<space/>
<wd l="1454" t="9144" r="1622" b="9293">of</wd>
<space/>
<wd l="1661" t="9149" r="1939" b="9293">the</wd>
<space/>
<wd l="1997" t="9149" r="2971" b="9331">exploration</wd>
<space/>
<wd l="3029" t="9149" r="3341" b="9293">and</wd>
<space/>
<wd l="3398" t="9149" r="3672" b="9293">the</wd>
<space/>
<wd l="3730" t="9197" r="4488" b="9331">exposure</wd>
<space/>
<wd l="4546" t="9144" r="4714" b="9293">of</wd>
<space/>
<wd l="4757" t="9154" r="5736" b="9331">corruptions</wd>
<space/>
</ln>
<ln l="1046" t="9384" r="5741" b="9571" baseLine="9523" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="9437" r="1219" b="9533">or</wd>
<space/>
<wd l="1282" t="9389" r="1555" b="9533">the</wd>
<space/>
<wd l="1622" t="9389" r="1934" b="9533">risk</wd>
<space/>
<wd l="1997" t="9389" r="2669" b="9571">analysis</wd>
<space/>
<wd l="2741" t="9384" r="2904" b="9533">of</wd>
<space/>
<wd l="2962" t="9437" r="3408" b="9571">mega</wd>
<space/>
<wd l="3470" t="9394" r="4541" b="9533">construction</wd>
<space/>
<wd l="4608" t="9394" r="5333" b="9571">projects.</wd>
<space/>
<wd l="5434" t="9389" r="5741" b="9533">Via</wd>
<space/>
</ln>
<ln l="1042" t="9624" r="5750" b="9811" baseLine="9763" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="9629" r="1315" b="9773">the</wd>
<space/>
<wd l="1406" t="9629" r="2141" b="9806">Internet,</wd>
<space/>
<wd l="2242" t="9677" r="2338" b="9773">a</wd>
<space/>
<wd l="2424" t="9629" r="2837" b="9811">large</wd>
<space/>
<wd l="2923" t="9629" r="3293" b="9811">pool</wd>
<space/>
<wd l="3379" t="9624" r="3547" b="9773">of</wd>
<space/>
<wd l="3624" t="9624" r="4627" b="9773">information</wd>
<space/>
<wd l="4714" t="9677" r="5491" b="9773">resources</wd>
<space/>
<wd l="5582" t="9624" r="5750" b="9773">of</wd>
<space/>
</ln>
<ln l="1046" t="9869" r="5736" b="10051" baseLine="10003" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="9869" r="1426" b="10013">such</wd>
<space/>
<wd l="1526" t="9917" r="1973" b="10051">mega</wd>
<space/>
<wd l="2074" t="9874" r="3144" b="10013">construction</wd>
<space/>
<wd l="3240" t="9874" r="3922" b="10051">projects</wd>
<space/>
<wd l="4027" t="9874" r="4152" b="10013">is</wd>
<space/>
<wd l="4258" t="9869" r="5040" b="10013">available.</wd>
<space/>
<wd l="5237" t="9869" r="5736" b="10013">These</wd>
<space/>
</ln>
<ln l="1046" t="10104" r="5736" b="10291" baseLine="10243" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="10104" r="2054" b="10253">information</wd>
<space/>
<wd l="2165" t="10157" r="2942" b="10253">resources</wd>
<space/>
<wd l="3058" t="10157" r="3317" b="10253">are</wd>
<space/>
<wd l="3427" t="10109" r="3749" b="10253">rich</wd>
<space/>
<wd l="3859" t="10114" r="4018" b="10248">in</wd>
<space/>
<wd l="4128" t="10114" r="4882" b="10291">quantity,</wd>
<space/>
<wd l="5011" t="10109" r="5294" b="10253">but</wd>
<space/>
<wd l="5410" t="10109" r="5736" b="10253">also</wd>
<space/>
</ln>
<ln l="1046" t="10339" r="5726" b="10526" baseLine="10483" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="10349" r="1210" b="10483">in</wd>
<space/>
<wd l="1325" t="10344" r="1949" b="10526">quality,</wd>
<space/>
<wd l="2088" t="10392" r="2424" b="10526">e.g.,</wd>
<space/>
<wd l="2568" t="10344" r="3264" b="10488">business</wd>
<space/>
<wd l="3389" t="10358" r="4042" b="10526">reports,</wd>
<space/>
<wd l="4181" t="10392" r="4954" b="10526">company</wd>
<space/>
<wd l="5069" t="10339" r="5726" b="10526">profiles,</wd>
<space/>
</ln>
<ln l="1046" t="10584" r="5731" b="10766" baseLine="10723" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="10584" r="1531" b="10766">blogs,</wd>
<space/>
<wd l="1618" t="10598" r="2222" b="10766">reports</wd>
<space/>
<wd l="2304" t="10584" r="2510" b="10766">by</wd>
<space/>
<wd l="2582" t="10589" r="3278" b="10762">tourists,</wd>
<space/>
<wd l="3365" t="10584" r="3715" b="10728">who</wd>
<space/>
<wd l="3787" t="10584" r="4354" b="10728">visited</wd>
<space/>
<wd l="4430" t="10584" r="4872" b="10728">these</wd>
<space/>
<wd l="4949" t="10598" r="5731" b="10728">construc-</wd>
</ln>
<ln l="1042" t="10824" r="5741" b="11006" baseLine="10958" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="10829" r="1387" b="10968">tion</wd>
<space/>
<wd l="1498" t="10829" r="2232" b="11006">projects,</wd>
<space/>
<wd l="2366" t="10824" r="2650" b="10968">but</wd>
<space/>
<wd l="2774" t="10824" r="3096" b="10968">also</wd>
<space/>
<wd l="3206" t="10824" r="3542" b="10968">web</wd>
<space/>
<wd l="3658" t="10824" r="4627" b="11002">documents,</wd>
<space/>
<wd l="4757" t="10824" r="5261" b="10968">which</wd>
<space/>
<wd l="5376" t="10824" r="5741" b="11006">only</wd>
<space/>
</ln>
<ln l="1046" t="11059" r="5750" b="11246" baseLine="11198" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="11069" r="1747" b="11208">mention</wd>
<space/>
<wd l="1834" t="11064" r="2107" b="11208">the</wd>
<space/>
<wd l="2203" t="11069" r="2803" b="11246">project</wd>
<space/>
<wd l="2909" t="11112" r="3365" b="11208">name</wd>
<space/>
<wd l="3461" t="11064" r="3773" b="11208">and</wd>
<space/>
<wd l="3869" t="11064" r="4531" b="11246">nothing</wd>
<space/>
<wd l="4622" t="11064" r="4963" b="11208">else.</wd>
<space/>
<wd l="5146" t="11059" r="5491" b="11208">One</wd>
<space/>
<wd l="5582" t="11059" r="5750" b="11208">of</wd>
<space/>
</ln>
<ln l="1042" t="11299" r="5731" b="11486" baseLine="11438" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="11304" r="1315" b="11448">the</wd>
<space/>
<wd l="1402" t="11304" r="2261" b="11486">challenges</wd>
<space/>
<wd l="2352" t="11299" r="2582" b="11448">for</wd>
<space/>
<wd l="2664" t="11304" r="2938" b="11448">the</wd>
<space/>
<wd l="3019" t="11304" r="3336" b="11448">risk</wd>
<space/>
<wd l="3418" t="11304" r="4085" b="11486">analysis</wd>
<space/>
<wd l="4176" t="11299" r="4344" b="11448">of</wd>
<space/>
<wd l="4416" t="11352" r="4867" b="11486">mega</wd>
<space/>
<wd l="4949" t="11318" r="5731" b="11448">construc-</wd>
</ln>
<ln l="1042" t="11534" r="5741" b="11722" baseLine="11678" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="11544" r="1387" b="11683">tion</wd>
<space/>
<wd l="1450" t="11544" r="2131" b="11722">projects</wd>
<space/>
<wd l="2198" t="11544" r="2323" b="11683">is</wd>
<space/>
<wd l="2386" t="11539" r="2664" b="11683">the</wd>
<space/>
<wd l="2726" t="11534" r="3379" b="11683">efficient</wd>
<space/>
<wd l="3456" t="11539" r="4430" b="11722">exploration</wd>
<space/>
<wd l="4493" t="11534" r="4661" b="11683">of</wd>
<space/>
<wd l="4709" t="11539" r="4982" b="11683">the</wd>
<space/>
<wd l="5045" t="11539" r="5741" b="11722">possibly</wd>
<space/>
</ln>
<ln l="1046" t="11779" r="5731" b="11962" baseLine="11918" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="11779" r="1718" b="11923">relevant</wd>
<space/>
<wd l="1795" t="11779" r="2328" b="11923">search</wd>
<space/>
<wd l="2395" t="11827" r="2894" b="11962">space.</wd>
<space/>
<wd l="3000" t="11779" r="3955" b="11962">Developing</wd>
<space/>
<wd l="4022" t="11779" r="4814" b="11962">manually</wd>
<space/>
<wd l="4877" t="11827" r="5083" b="11923">an</wd>
<space/>
<wd l="5150" t="11779" r="5352" b="11918">IE</wd>
<space/>
<wd l="5414" t="11827" r="5731" b="11962">sys-</wd>
</ln>
<ln l="1042" t="12014" r="5736" b="12202" baseLine="12154" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="12034" r="1373" b="12163">tem</wd>
<space/>
<wd l="1464" t="12024" r="1589" b="12163">is</wd>
<space/>
<wd l="1685" t="12014" r="2117" b="12163">often</wd>
<space/>
<wd l="2208" t="12034" r="2482" b="12163">not</wd>
<space/>
<wd l="2582" t="12019" r="3254" b="12202">possible</wd>
<space/>
<wd l="3350" t="12019" r="4013" b="12163">because</wd>
<space/>
<wd l="4104" t="12014" r="4272" b="12163">of</wd>
<space/>
<wd l="4349" t="12019" r="4622" b="12163">the</wd>
<space/>
<wd l="4709" t="12019" r="5256" b="12202">timely</wd>
<space/>
<wd l="5347" t="12019" r="5736" b="12163">need</wd>
<space/>
</ln>
<ln l="1046" t="12254" r="5731" b="12442" baseLine="12394" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="12254" r="1214" b="12403">of</wd>
<space/>
<wd l="1291" t="12259" r="1565" b="12403">the</wd>
<space/>
<wd l="1656" t="12254" r="2707" b="12437">information,</wd>
<space/>
<wd l="2813" t="12259" r="3173" b="12437">and,</wd>
<space/>
<wd l="3278" t="12307" r="3706" b="12403">more</wd>
<space/>
<wd l="3797" t="12259" r="4853" b="12442">importantly,</wd>
<space/>
<wd l="4963" t="12264" r="5083" b="12403">is</wd>
<space/>
<wd l="5179" t="12259" r="5731" b="12442">proba-</wd>
</ln>
<ln l="1046" t="12485" r="5731" b="12691" baseLine="12634" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="12499" r="1315" b="12682">bly</wd>
<space/>
<wd l="1397" t="12514" r="1670" b="12643">not</wd>
<space/>
<wd l="1766" t="12494" r="2309" b="12677">useful,</wd>
<space/>
<wd l="2405" t="12499" r="3072" b="12643">because</wd>
<space/>
<wd l="3154" t="12499" r="3427" b="12643">the</wd>
<space/>
<wd l="3514" t="12499" r="4099" b="12643">needed</wd>
<space/>
<wd l="4205" t="12485" r="4906" b="12691">(hidden)</wd>
<space/>
<wd l="5011" t="12494" r="5731" b="12643">informa-</wd>
</ln>
<ln l="1042" t="12739" r="5731" b="12922" baseLine="12874" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="12744" r="1387" b="12883">tion</wd>
<space/>
<wd l="1474" t="12744" r="1594" b="12883">is</wd>
<space/>
<wd l="1690" t="12739" r="2376" b="12922">actually</wd>
<space/>
<wd l="2462" t="12754" r="2731" b="12883">not</wd>
<space/>
<wd l="2832" t="12739" r="3427" b="12883">known.</wd>
<space/>
<wd l="3586" t="12739" r="3763" b="12878">In</wd>
<space/>
<wd l="3850" t="12754" r="4594" b="12917">contrast,</wd>
<space/>
<wd l="4694" t="12787" r="4901" b="12883">an</wd>
<space/>
<wd l="4987" t="12787" r="5731" b="12922">unsuper-</wd>
</ln>
<ln l="1042" t="12974" r="5736" b="13157" baseLine="13114" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="12974" r="1474" b="13118">vised</wd>
<space/>
<wd l="1565" t="12974" r="1877" b="13118">and</wd>
<space/>
<wd l="1963" t="12974" r="2693" b="13157">dynamic</wd>
<space/>
<wd l="2774" t="12974" r="2976" b="13114">IE</wd>
<space/>
<wd l="3062" t="12989" r="3648" b="13157">system</wd>
<space/>
<wd l="3734" t="12974" r="4027" b="13118">like</wd>
<space/>
<wd l="4109" t="12974" r="4613" b="13114">IDEX</wd>
<space/>
<wd l="4699" t="13022" r="4992" b="13118">can</wd>
<space/>
<wd l="5074" t="12974" r="5270" b="13118">be</wd>
<space/>
<wd l="5357" t="12974" r="5736" b="13118">used</wd>
<space/>
</ln>
<ln l="1042" t="13210" r="5741" b="13397" baseLine="13354" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="13229" r="1214" b="13358">to</wd>
<space/>
<wd l="1296" t="13229" r="1949" b="13397">support</wd>
<space/>
<wd l="2030" t="13214" r="2304" b="13358">the</wd>
<space/>
<wd l="2381" t="13229" r="2918" b="13397">expert</wd>
<space/>
<wd l="3000" t="13219" r="3163" b="13354">in</wd>
<space/>
<wd l="3230" t="13214" r="3509" b="13358">the</wd>
<space/>
<wd l="3581" t="13214" r="4555" b="13397">exploration</wd>
<space/>
<wd l="4632" t="13210" r="4800" b="13358">of</wd>
<space/>
<wd l="4858" t="13214" r="5131" b="13358">the</wd>
<space/>
<wd l="5208" t="13214" r="5741" b="13358">search</wd>
<space/>
</ln>
<ln l="1046" t="13450" r="5741" b="13637" baseLine="13589" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="13502" r="1507" b="13637">space</wd>
<space/>
<wd l="1579" t="13454" r="2266" b="13637">through</wd>
<space/>
<wd l="2342" t="13459" r="3230" b="13637">pro–active</wd>
<space/>
<wd l="3307" t="13450" r="4435" b="13598">identification</wd>
<space/>
<wd l="4512" t="13454" r="4824" b="13598">and</wd>
<space/>
<wd l="4901" t="13454" r="5741" b="13637">clustering</wd>
<space/>
</ln>
<ln l="1046" t="13690" r="5736" b="13877" baseLine="13829" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="13690" r="1214" b="13838">of</wd>
<space/>
<wd l="1272" t="13694" r="2160" b="13838">structured</wd>
<space/>
<wd l="2232" t="13699" r="2894" b="13838">entities.</wd>
<space/>
<wd l="3000" t="13694" r="3605" b="13838">Named</wd>
<space/>
<wd l="3677" t="13699" r="4291" b="13838">entities</wd>
<space/>
<wd l="4368" t="13694" r="4661" b="13838">like</wd>
<space/>
<wd l="4728" t="13690" r="4963" b="13838">for</wd>
<space/>
<wd l="5030" t="13694" r="5736" b="13877">example</wd>
<space/>
</ln>
<ln l="1046" t="13930" r="5736" b="14117" baseLine="14069" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="13982" r="1613" b="14117">person</wd>
<space/>
<wd l="1670" t="13982" r="2203" b="14078">names</wd>
<space/>
<wd l="2270" t="13934" r="2582" b="14078">and</wd>
<space/>
<wd l="2645" t="13934" r="3451" b="14112">locations,</wd>
<space/>
<wd l="3523" t="13982" r="3782" b="14078">are</wd>
<space/>
<wd l="3845" t="13930" r="4277" b="14078">often</wd>
<space/>
<wd l="4334" t="13930" r="4834" b="14078">useful</wd>
<space/>
<wd l="4891" t="13934" r="5736" b="14078">indicators</wd>
<space/>
</ln>
<ln l="1046" t="14165" r="5736" b="14352" baseLine="14309" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="14165" r="1214" b="14314">of</wd>
<space/>
<wd l="1258" t="14170" r="1930" b="14314">relevant</wd>
<space/>
<wd l="1987" t="14184" r="2323" b="14314">text</wd>
<space/>
<wd l="2386" t="14218" r="3158" b="14352">passages,</wd>
<space/>
<wd l="3226" t="14174" r="3389" b="14309">in</wd>
<space/>
<wd l="3442" t="14170" r="4330" b="14352">particular,</wd>
<space/>
<wd l="4402" t="14165" r="4522" b="14309">if</wd>
<space/>
<wd l="4560" t="14170" r="4834" b="14314">the</wd>
<space/>
<wd l="4886" t="14218" r="5419" b="14314">names</wd>
<space/>
<wd l="5477" t="14218" r="5736" b="14314">are</wd>
<space/>
</ln>
<ln l="1046" t="14405" r="5736" b="14592" baseLine="14549" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="14414" r="1210" b="14549">in</wd>
<space/>
<wd l="1282" t="14458" r="1709" b="14554">some</wd>
<space/>
<wd l="1786" t="14410" r="2837" b="14592">relationship.</wd>
<space/>
<wd l="2957" t="14410" r="4080" b="14587">Furthermore,</wd>
<space/>
<wd l="4166" t="14410" r="4834" b="14554">because</wd>
<space/>
<wd l="4901" t="14410" r="5179" b="14554">the</wd>
<space/>
<wd l="5251" t="14405" r="5736" b="14554">found</wd>
<space/>
</ln>
<ln l="1046" t="14650" r="5731" b="14832" baseLine="14784" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="14650" r="2136" b="14832">relationships</wd>
<space/>
<wd l="2222" t="14698" r="2482" b="14794">are</wd>
<space/>
<wd l="2558" t="14650" r="3398" b="14794">visualized</wd>
<space/>
<wd l="3485" t="14654" r="3936" b="14832">using</wd>
<space/>
<wd l="4018" t="14698" r="4219" b="14794">an</wd>
<space/>
<wd l="4301" t="14650" r="5093" b="14794">advanced</wd>
<space/>
<wd l="5179" t="14650" r="5731" b="14832">graph-</wd>
</ln>
<ln l="1046" t="14885" r="5736" b="15072" baseLine="15024" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="14890" r="1339" b="15034">ical</wd>
<space/>
<wd l="1430" t="14938" r="1781" b="15034">user</wd>
<space/>
<wd l="1867" t="14885" r="2650" b="15067">interface,</wd>
<space/>
<wd l="2746" t="14890" r="3024" b="15034">the</wd>
<space/>
<wd l="3110" t="14938" r="3461" b="15034">user</wd>
<space/>
<wd l="3552" t="14938" r="3845" b="15034">can</wd>
<space/>
<wd l="3931" t="14890" r="4397" b="15034">select</wd>
<space/>
<wd l="4493" t="14885" r="5112" b="15072">specific</wd>
<space/>
<wd l="5203" t="14938" r="5736" b="15034">names</wd>
<space/>
</ln>
<ln l="1046" t="15125" r="5736" b="15312" baseLine="15264" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="15130" r="1358" b="15274">and</wd>
<space/>
<wd l="1450" t="15125" r="1771" b="15274">find</wd>
<space/>
<wd l="1858" t="15130" r="2731" b="15274">associated</wd>
<space/>
<wd l="2822" t="15130" r="3907" b="15312">relationships</wd>
<space/>
<wd l="3994" t="15144" r="4166" b="15274">to</wd>
<space/>
<wd l="4253" t="15130" r="4704" b="15274">other</wd>
<space/>
<wd l="4786" t="15178" r="5371" b="15307">names,</wd>
<space/>
<wd l="5462" t="15130" r="5736" b="15274">the</wd>
<space/>
</ln>
<ln l="1046" t="15360" r="5731" b="15547" baseLine="15504" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="15365" r="1968" b="15509">documents</wd>
<space/>
<wd l="2059" t="15365" r="2438" b="15547">they</wd>
<space/>
<wd l="2530" t="15413" r="2995" b="15509">occur</wd>
<space/>
<wd l="3086" t="15370" r="3245" b="15504">in</wd>
<space/>
<wd l="3336" t="15413" r="3509" b="15509">or</wd>
<space/>
<wd l="3600" t="15365" r="3869" b="15509">she</wd>
<space/>
<wd l="3960" t="15413" r="4253" b="15509">can</wd>
<space/>
<wd l="4344" t="15365" r="4877" b="15509">search</wd>
<space/>
<wd l="4968" t="15360" r="5198" b="15509">for</wd>
<space/>
<wd l="5290" t="15413" r="5731" b="15547">para-</wd>
</ln>
<ln l="1046" t="15600" r="2822" b="15787" baseLine="15744" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="15605" r="1680" b="15787">phrases</wd>
<space/>
<wd l="1757" t="15600" r="1925" b="15749">of</wd>
<space/>
<wd l="1987" t="15619" r="2822" b="15749">sentences.</wd>
</ln>
</para>
</column>
<column l="6096" t="1347" r="10810" b="15835">
<para l="7042" t="1416" r="9850" b="1632" alignment="centered" spaceBefore="17" lsp="exactly" lspExact="279" language="en">
<ln l="7042" t="1416" r="9850" b="1632" baseLine="1579" underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="21">
<wd l="7042" t="1426" r="7224" b="1584">2.</wd>
<space/>
<wd l="7526" t="1416" r="8357" b="1632">System</wd>
<space/>
<wd l="8453" t="1416" r="9850" b="1589">architecture</wd>
</ln>
</para>
<para l="6101" t="1762" r="10795" b="2659" alignment="justified" spaceBefore="66" lsp="exactly" lspExact="240" language="en">
<ln l="6101" t="1762" r="10786" b="1944" baseLine="1896" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="1762" r="6437" b="1906">The</wd>
<space/>
<wd l="6514" t="1762" r="7277" b="1906">back-end</wd>
<space/>
<wd l="7358" t="1776" r="8347" b="1944">component,</wd>
<space/>
<wd l="8429" t="1762" r="9269" b="1906">visualized</wd>
<space/>
<wd l="9346" t="1766" r="9509" b="1901">in</wd>
<space/>
<wd l="9581" t="1762" r="10138" b="1944">Figure</wd>
<space/>
<wd l="10210" t="1762" r="10349" b="1939">4,</wd>
<space/>
<wd l="10435" t="1810" r="10786" b="1906">con-</wd>
</ln>
<ln l="6101" t="1997" r="10786" b="2184" baseLine="2136" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="2006" r="6461" b="2146">sists</wd>
<space/>
<wd l="6518" t="1997" r="6686" b="2146">of</wd>
<space/>
<wd l="6725" t="2002" r="7166" b="2146">three</wd>
<space/>
<wd l="7224" t="2016" r="7704" b="2184">parts,</wd>
<space/>
<wd l="7771" t="2002" r="8275" b="2146">which</wd>
<space/>
<wd l="8328" t="2050" r="8587" b="2146">are</wd>
<space/>
<wd l="8645" t="2002" r="9451" b="2146">described</wd>
<space/>
<wd l="9509" t="2006" r="9672" b="2141">in</wd>
<space/>
<wd l="9725" t="2002" r="10205" b="2146">detail</wd>
<space/>
<wd l="10262" t="2006" r="10421" b="2141">in</wd>
<space/>
<wd l="10474" t="2002" r="10786" b="2146">this</wd>
<space/>
</ln>
<ln l="6101" t="2237" r="10795" b="2419" baseLine="2376" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="2242" r="6734" b="2381">section:</wd>
<space/>
<wd l="6835" t="2242" r="8045" b="2419">preprocessing,</wd>
<space/>
<wd l="8117" t="2237" r="8774" b="2381">relation</wd>
<space/>
<wd l="8832" t="2242" r="9706" b="2381">extraction</wd>
<space/>
<wd l="9763" t="2237" r="10075" b="2381">and</wd>
<space/>
<wd l="10133" t="2237" r="10795" b="2381">relation</wd>
<space/>
</ln>
<ln l="6101" t="2477" r="6979" b="2659" baseLine="2616" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="2477" r="6979" b="2659">clustering.</wd>
</ln>
</para>
<para l="6106" t="2899" r="8074" b="3082" alignment="left" spaceBefore="184" lsp="exactly" lspExact="238" language="en">
<ln l="6106" t="2899" r="8074" b="3082" baseLine="3038" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="14">
<wd l="6106" t="2904" r="6437" b="3038">2.1.</wd>
<space/>
<wd l="6686" t="2899" r="8074" b="3082">Preprocessing</wd>
</ln>
</para>
<para l="6096" t="3192" r="10805" b="8890" alignment="justified" spaceBefore="39" lsp="exactly" lspExact="240" language="en">
<ln l="6101" t="3192" r="10805" b="3379" baseLine="3336" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="3197" r="6278" b="3336">In</wd>
<space/>
<wd l="6360" t="3197" r="6634" b="3341">the</wd>
<space/>
<wd l="6720" t="3192" r="7046" b="3341">first</wd>
<space/>
<wd l="7142" t="3211" r="7536" b="3379">step,</wd>
<space/>
<wd l="7637" t="3192" r="7867" b="3341">for</wd>
<space/>
<wd l="7954" t="3245" r="8050" b="3341">a</wd>
<space/>
<wd l="8131" t="3192" r="8750" b="3379">specific</wd>
<space/>
<wd l="8837" t="3197" r="9370" b="3341">search</wd>
<space/>
<wd l="9446" t="3197" r="9850" b="3374">task,</wd>
<space/>
<wd l="9950" t="3245" r="10046" b="3341">a</wd>
<space/>
<wd l="10123" t="3202" r="10555" b="3379">topic</wd>
<space/>
<wd l="10637" t="3192" r="10805" b="3341">of</wd>
<space/>
</ln>
<ln l="6101" t="3432" r="10795" b="3619" baseLine="3571" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="3442" r="6734" b="3581">interest</wd>
<space/>
<wd l="6826" t="3437" r="7099" b="3581">has</wd>
<space/>
<wd l="7181" t="3451" r="7354" b="3581">to</wd>
<space/>
<wd l="7435" t="3437" r="7632" b="3581">be</wd>
<space/>
<wd l="7714" t="3432" r="8323" b="3581">defined</wd>
<space/>
<wd l="8405" t="3442" r="8563" b="3576">in</wd>
<space/>
<wd l="8640" t="3437" r="8914" b="3581">the</wd>
<space/>
<wd l="8990" t="3432" r="9389" b="3581">form</wd>
<space/>
<wd l="9470" t="3432" r="9634" b="3581">of</wd>
<space/>
<wd l="9701" t="3485" r="9797" b="3581">a</wd>
<space/>
<wd l="9874" t="3485" r="10378" b="3619">query.</wd>
<space/>
<wd l="10507" t="3437" r="10795" b="3581">For</wd>
<space/>
</ln>
<ln l="6096" t="3672" r="10790" b="3859" baseLine="3811" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="3677" r="6413" b="3821">this</wd>
<space/>
<wd l="6475" t="3682" r="6950" b="3859">topic,</wd>
<space/>
<wd l="7022" t="3677" r="7944" b="3821">documents</wd>
<space/>
<wd l="8011" t="3725" r="8270" b="3821">are</wd>
<space/>
<wd l="8333" t="3677" r="9514" b="3859">automatically</wd>
<space/>
<wd l="9576" t="3677" r="10330" b="3821">retrieved</wd>
<space/>
<wd l="10397" t="3672" r="10790" b="3821">from</wd>
<space/>
</ln>
<ln l="6096" t="3912" r="10790" b="4099" baseLine="4051" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="3917" r="6370" b="4061">the</wd>
<space/>
<wd l="6451" t="3917" r="6787" b="4061">web</wd>
<space/>
<wd l="6874" t="3922" r="7325" b="4099">using</wd>
<space/>
<wd l="7402" t="3917" r="7675" b="4061">the</wd>
<space/>
<wd l="7766" t="3912" r="8362" b="4099">Google</wd>
<space/>
<wd l="8448" t="3917" r="8981" b="4061">search</wd>
<space/>
<wd l="9062" t="3922" r="9653" b="4099">engine.</wd>
<space/>
<wd l="9797" t="3917" r="10392" b="4056">HTML</wd>
<space/>
<wd l="10478" t="3917" r="10790" b="4061">and</wd>
<space/>
</ln>
<ln l="6101" t="4147" r="10786" b="4334" baseLine="4291" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="4152" r="6509" b="4291">PDF</wd>
<space/>
<wd l="6581" t="4152" r="7498" b="4296">documents</wd>
<space/>
<wd l="7574" t="4200" r="7834" b="4296">are</wd>
<space/>
<wd l="7901" t="4152" r="8726" b="4296">converted</wd>
<space/>
<wd l="8798" t="4157" r="9125" b="4296">into</wd>
<space/>
<wd l="9197" t="4152" r="9619" b="4334">plain</wd>
<space/>
<wd l="9682" t="4166" r="10022" b="4296">text</wd>
<space/>
<wd l="10094" t="4147" r="10464" b="4296">files.</wd>
<space/>
<wd l="10570" t="4147" r="10786" b="4296">As</wd>
<space/>
</ln>
<ln l="6096" t="4378" r="10786" b="4584" baseLine="4531" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="4392" r="6370" b="4536">the</wd>
<space/>
<wd l="6466" t="4392" r="6874" b="4536">tools</wd>
<space/>
<wd l="6979" t="4392" r="7358" b="4536">used</wd>
<space/>
<wd l="7459" t="4387" r="7694" b="4536">for</wd>
<space/>
<wd l="7795" t="4392" r="8573" b="4574">linguistic</wd>
<space/>
<wd l="8674" t="4397" r="9562" b="4574">processing</wd>
<space/>
<wd l="9672" t="4378" r="10013" b="4584">(NE</wd>
<space/>
<wd l="10114" t="4397" r="10786" b="4574">recogni-</wd>
</ln>
<ln l="6096" t="4618" r="10790" b="4824" baseLine="4766" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="4637" r="6485" b="4810">tion,</wd>
<space/>
<wd l="6590" t="4637" r="7258" b="4814">parsing,</wd>
<space/>
<wd l="7368" t="4618" r="7728" b="4824">etc.)</wd>
<space/>
<wd l="7896" t="4680" r="8155" b="4776">are</wd>
<space/>
<wd l="8246" t="4627" r="9744" b="4814">language-specific,</wd>
<space/>
<wd l="9845" t="4680" r="10070" b="4776">we</wd>
<space/>
<wd l="10162" t="4680" r="10430" b="4776">use</wd>
<space/>
<wd l="10517" t="4632" r="10790" b="4776">the</wd>
<space/>
</ln>
<ln l="6106" t="4867" r="10790" b="5054" baseLine="5006" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6106" t="4867" r="6701" b="5054">Google</wd>
<space/>
<wd l="6797" t="4872" r="7555" b="5054">language</wd>
<space/>
<wd l="7651" t="4867" r="8054" b="5016">filter</wd>
<space/>
<wd l="8155" t="4877" r="8702" b="5054">option</wd>
<space/>
<wd l="8794" t="4872" r="9245" b="5016">when</wd>
<space/>
<wd l="9341" t="4872" r="10426" b="5054">downloading</wd>
<space/>
<wd l="10517" t="4872" r="10790" b="5016">the</wd>
<space/>
</ln>
<ln l="6101" t="5112" r="10786" b="5294" baseLine="5246" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="5112" r="7066" b="5256">documents.</wd>
<space/>
<wd l="7176" t="5112" r="7949" b="5290">However,</wd>
<space/>
<wd l="8026" t="5112" r="8342" b="5256">this</wd>
<space/>
<wd l="8419" t="5112" r="8789" b="5256">does</wd>
<space/>
<wd l="8866" t="5126" r="9139" b="5256">not</wd>
<space/>
<wd l="9221" t="5126" r="9850" b="5294">prevent</wd>
<space/>
<wd l="9931" t="5160" r="10358" b="5256">some</wd>
<space/>
<wd l="10430" t="5112" r="10786" b="5256">doc-</wd>
</ln>
<ln l="6101" t="5352" r="10786" b="5534" baseLine="5486" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="5366" r="6715" b="5496">uments</wd>
<space/>
<wd l="6816" t="5357" r="7450" b="5496">written</wd>
<space/>
<wd l="7546" t="5357" r="7709" b="5491">in</wd>
<space/>
<wd l="7805" t="5400" r="7901" b="5496">a</wd>
<space/>
<wd l="8002" t="5352" r="8755" b="5534">language</wd>
<space/>
<wd l="8856" t="5352" r="9307" b="5496">other</wd>
<space/>
<wd l="9398" t="5352" r="9797" b="5496">than</wd>
<space/>
<wd l="9898" t="5400" r="10181" b="5496">our</wd>
<space/>
<wd l="10272" t="5366" r="10786" b="5534">target</wd>
<space/>
</ln>
<ln l="6101" t="5573" r="10786" b="5779" baseLine="5726" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="5587" r="6859" b="5770">language</wd>
<space/>
<wd l="6965" t="5573" r="7728" b="5779">(English)</wd>
<space/>
<wd l="7838" t="5582" r="8232" b="5731">from</wd>
<space/>
<wd l="8328" t="5592" r="9024" b="5770">entering</wd>
<space/>
<wd l="9115" t="5635" r="9398" b="5731">our</wd>
<space/>
<wd l="9490" t="5635" r="10085" b="5770">corpus.</wd>
<space/>
<wd l="10253" t="5587" r="10430" b="5726">In</wd>
<space/>
<wd l="10522" t="5587" r="10786" b="5731">ad-</wd>
</ln>
<ln l="6101" t="5827" r="10790" b="6005" baseLine="5966" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="5827" r="6648" b="6005">dition,</wd>
<space/>
<wd l="6744" t="5875" r="7171" b="5971">some</wd>
<space/>
<wd l="7248" t="5827" r="7584" b="5971">web</wd>
<space/>
<wd l="7670" t="5832" r="8035" b="5971">sites</wd>
<space/>
<wd l="8122" t="5832" r="8755" b="5971">contain</wd>
<space/>
<wd l="8832" t="5842" r="9168" b="5971">text</wd>
<space/>
<wd l="9254" t="5832" r="9888" b="5971">written</wd>
<space/>
<wd l="9970" t="5832" r="10128" b="5966">in</wd>
<space/>
<wd l="10210" t="5827" r="10790" b="5971">several</wd>
<space/>
</ln>
<ln l="6101" t="6067" r="10786" b="6250" baseLine="6202" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="6067" r="6979" b="6250">languages.</wd>
<space/>
<wd l="7123" t="6067" r="7301" b="6206">In</wd>
<space/>
<wd l="7387" t="6067" r="7834" b="6211">order</wd>
<space/>
<wd l="7915" t="6082" r="8088" b="6211">to</wd>
<space/>
<wd l="8174" t="6072" r="8779" b="6211">restrict</wd>
<space/>
<wd l="8870" t="6067" r="9144" b="6211">the</wd>
<space/>
<wd l="9230" t="6072" r="10118" b="6250">processing</wd>
<space/>
<wd l="10195" t="6082" r="10368" b="6211">to</wd>
<space/>
<wd l="10454" t="6115" r="10786" b="6211">sen-</wd>
</ln>
<ln l="6096" t="6307" r="10795" b="6490" baseLine="6442" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="6322" r="6624" b="6451">tences</wd>
<space/>
<wd l="6686" t="6312" r="7320" b="6451">written</wd>
<space/>
<wd l="7382" t="6312" r="7546" b="6446">in</wd>
<space/>
<wd l="7608" t="6307" r="8290" b="6490">English,</wd>
<space/>
<wd l="8366" t="6355" r="8587" b="6451">we</wd>
<space/>
<wd l="8654" t="6307" r="9134" b="6490">apply</wd>
<space/>
<wd l="9197" t="6355" r="9293" b="6451">a</wd>
<space/>
<wd l="9355" t="6307" r="10109" b="6490">language</wd>
<space/>
<wd l="10176" t="6355" r="10795" b="6490">guesser</wd>
<space/>
</ln>
<ln l="6096" t="6533" r="10786" b="6739" baseLine="6682" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="6547" r="6480" b="6725">tool,</wd>
<space/>
<wd l="6571" t="6547" r="6854" b="6730">lc4j</wd>
<space/>
<wd l="6965" t="6533" r="7440" b="6739">(Lc4j,</wd>
<space/>
<wd l="7541" t="6533" r="7982" b="6739">2007)</wd>
<space/>
<wd l="8083" t="6547" r="8395" b="6691">and</wd>
<space/>
<wd l="8482" t="6595" r="9086" b="6691">remove</wd>
<space/>
<wd l="9168" t="6562" r="9960" b="6691">sentences</wd>
<space/>
<wd l="10046" t="6562" r="10320" b="6691">not</wd>
<space/>
<wd l="10411" t="6547" r="10786" b="6691">clas-</wd>
</ln>
<ln l="6101" t="6778" r="10795" b="6965" baseLine="6922" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="6778" r="6538" b="6926">sified</wd>
<space/>
<wd l="6638" t="6830" r="6806" b="6926">as</wd>
<space/>
<wd l="6907" t="6787" r="7541" b="6926">written</wd>
<space/>
<wd l="7637" t="6787" r="7800" b="6922">in</wd>
<space/>
<wd l="7901" t="6782" r="8578" b="6965">English.</wd>
<space/>
<wd l="8774" t="6782" r="9149" b="6926">This</wd>
<space/>
<wd l="9254" t="6782" r="9888" b="6926">reduces</wd>
<space/>
<wd l="9994" t="6830" r="10483" b="6926">errors</wd>
<space/>
<wd l="10589" t="6830" r="10795" b="6926">on</wd>
<space/>
</ln>
<ln l="6096" t="7018" r="10786" b="7205" baseLine="7162" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="7022" r="6370" b="7166">the</wd>
<space/>
<wd l="6437" t="7018" r="7210" b="7205">following</wd>
<space/>
<wd l="7272" t="7022" r="7728" b="7166">levels</wd>
<space/>
<wd l="7795" t="7018" r="7963" b="7166">of</wd>
<space/>
<wd l="8016" t="7027" r="8942" b="7205">processing.</wd>
<space/>
<wd l="9048" t="7022" r="9322" b="7166">We</wd>
<space/>
<wd l="9389" t="7022" r="9710" b="7166">also</wd>
<space/>
<wd l="9782" t="7070" r="10387" b="7166">remove</wd>
<space/>
<wd l="10454" t="7070" r="10786" b="7166">sen-</wd>
</ln>
<ln l="6096" t="7262" r="10776" b="7445" baseLine="7397" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="7277" r="6624" b="7406">tences</wd>
<space/>
<wd l="6691" t="7262" r="7046" b="7406">that</wd>
<space/>
<wd l="7118" t="7262" r="7488" b="7445">only</wd>
<space/>
<wd l="7550" t="7267" r="8184" b="7406">contain</wd>
<space/>
<wd l="8246" t="7262" r="9797" b="7445">non-alphanumeric</wd>
<space/>
<wd l="9864" t="7262" r="10776" b="7406">characters.</wd>
<space/>
</ln>
<ln l="6101" t="7488" r="10786" b="7694" baseLine="7637" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="7502" r="6322" b="7646">To</wd>
<space/>
<wd l="6403" t="7502" r="6605" b="7646">all</wd>
<space/>
<wd l="6686" t="7507" r="7546" b="7685">remaining</wd>
<space/>
<wd l="7622" t="7517" r="8462" b="7680">sentences,</wd>
<space/>
<wd l="8549" t="7550" r="8774" b="7646">we</wd>
<space/>
<wd l="8856" t="7502" r="9331" b="7685">apply</wd>
<space/>
<wd l="9408" t="7502" r="10186" b="7685">LingPipe</wd>
<space/>
<wd l="10282" t="7488" r="10786" b="7694">(Ling-</wd>
</ln>
<ln l="6101" t="7728" r="10790" b="7934" baseLine="7877" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="7742" r="6538" b="7925">Pipe,</wd>
<space/>
<wd l="6653" t="7728" r="7099" b="7934">2007)</wd>
<space/>
<wd l="7214" t="7738" r="7445" b="7886">for</wd>
<space/>
<wd l="7541" t="7757" r="8261" b="7886">sentence</wd>
<space/>
<wd l="8357" t="7742" r="9182" b="7925">boundary</wd>
<space/>
<wd l="9278" t="7742" r="10114" b="7920">detection,</wd>
<space/>
<wd l="10224" t="7742" r="10790" b="7886">named</wd>
<space/>
</ln>
<ln l="6101" t="7963" r="10776" b="8170" baseLine="8117" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="7982" r="6600" b="8160">entity</wd>
<space/>
<wd l="6696" t="7982" r="7656" b="8160">recognition</wd>
<space/>
<wd l="7766" t="7963" r="8314" b="8170">(NER)</wd>
<space/>
<wd l="8429" t="7978" r="8741" b="8122">and</wd>
<space/>
<wd l="8842" t="7973" r="9792" b="8122">coreference</wd>
<space/>
<wd l="9893" t="7978" r="10776" b="8122">resolution.</wd>
<space/>
</ln>
<ln l="6101" t="8213" r="10781" b="8400" baseLine="8357" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="8213" r="6317" b="8362">As</wd>
<space/>
<wd l="6422" t="8266" r="6518" b="8362">a</wd>
<space/>
<wd l="6610" t="8218" r="7085" b="8362">result</wd>
<space/>
<wd l="7190" t="8213" r="7358" b="8362">of</wd>
<space/>
<wd l="7435" t="8218" r="7752" b="8362">this</wd>
<space/>
<wd l="7853" t="8232" r="8198" b="8400">step</wd>
<space/>
<wd l="8299" t="8218" r="9058" b="8362">database</wd>
<space/>
<wd l="9149" t="8218" r="9653" b="8362">tables</wd>
<space/>
<wd l="9758" t="8266" r="10018" b="8362">are</wd>
<space/>
<wd l="10114" t="8218" r="10781" b="8395">created,</wd>
<space/>
</ln>
<ln l="6101" t="8453" r="10786" b="8640" baseLine="8592" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="8462" r="6998" b="8640">containing</wd>
<space/>
<wd l="7099" t="8453" r="7939" b="8602">references</wd>
<space/>
<wd l="8040" t="8472" r="8213" b="8602">to</wd>
<space/>
<wd l="8314" t="8458" r="8587" b="8602">the</wd>
<space/>
<wd l="8693" t="8458" r="9341" b="8640">original</wd>
<space/>
<wd l="9442" t="8458" r="10334" b="8635">document,</wd>
<space/>
<wd l="10454" t="8506" r="10786" b="8602">sen-</wd>
</ln>
<ln l="6096" t="8683" r="9768" b="8890" baseLine="8832" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="8712" r="6624" b="8842">tences</wd>
<space/>
<wd l="6701" t="8698" r="7013" b="8842">and</wd>
<space/>
<wd l="7090" t="8698" r="7810" b="8842">detected</wd>
<space/>
<wd l="7882" t="8698" r="8448" b="8842">named</wd>
<space/>
<wd l="8525" t="8702" r="9139" b="8842">entities</wd>
<space/>
<wd l="9230" t="8683" r="9768" b="8890">(NEs).</wd>
</ln>
</para>
<para l="6106" t="9120" r="8616" b="9264" alignment="left" spaceBefore="179" lsp="exactly" lspExact="238" language="en">
<ln l="6106" t="9120" r="8616" b="9264" baseLine="9254" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="14">
<wd l="6106" t="9125" r="6437" b="9259">2.2.</wd>
<space/>
<wd l="6686" t="9120" r="7526" b="9264">Relation</wd>
<space/>
<wd l="7608" t="9120" r="8616" b="9264">extraction</wd>
</ln>
</para>
<para l="6096" t="9413" r="10795" b="14866" alignment="justified" spaceBefore="48" lsp="exactly" lspExact="240" language="en">
<ln l="6101" t="9413" r="10786" b="9600" baseLine="9552" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="9418" r="6830" b="9562">Relation</wd>
<space/>
<wd l="6898" t="9422" r="7771" b="9562">extraction</wd>
<space/>
<wd l="7838" t="9422" r="7963" b="9562">is</wd>
<space/>
<wd l="8035" t="9418" r="8438" b="9562">done</wd>
<space/>
<wd l="8506" t="9466" r="8712" b="9562">on</wd>
<space/>
<wd l="8774" t="9418" r="9048" b="9562">the</wd>
<space/>
<wd l="9115" t="9418" r="9528" b="9562">basis</wd>
<space/>
<wd l="9600" t="9413" r="9768" b="9562">of</wd>
<space/>
<wd l="9821" t="9422" r="10450" b="9600">parsing</wd>
<space/>
<wd l="10517" t="9466" r="10786" b="9600">po-</wd>
</ln>
<ln l="6096" t="9653" r="10790" b="9840" baseLine="9792" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="9658" r="6816" b="9840">tentially</wd>
<space/>
<wd l="6874" t="9658" r="7541" b="9802">relevant</wd>
<space/>
<wd l="7608" t="9672" r="8448" b="9802">sentences.</wd>
<space/>
<wd l="8549" t="9658" r="8822" b="9802">We</wd>
<space/>
<wd l="8880" t="9653" r="9379" b="9802">define</wd>
<space/>
<wd l="9442" t="9706" r="9538" b="9802">a</wd>
<space/>
<wd l="9590" t="9672" r="10310" b="9802">sentence</wd>
<space/>
<wd l="10363" t="9672" r="10536" b="9802">to</wd>
<space/>
<wd l="10594" t="9658" r="10790" b="9802">be</wd>
<space/>
</ln>
<ln l="6101" t="9893" r="10670" b="10080" baseLine="10032" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="9893" r="6269" b="10042">of</wd>
<space/>
<wd l="6331" t="9898" r="7094" b="10080">potential</wd>
<space/>
<wd l="7171" t="9898" r="7954" b="10042">relevance</wd>
<space/>
<wd l="8026" t="9893" r="8150" b="10037">if</wd>
<space/>
<wd l="8208" t="9902" r="8328" b="10042">it</wd>
<space/>
<wd l="8410" t="9912" r="8568" b="10042">at</wd>
<space/>
<wd l="8650" t="9898" r="9034" b="10042">least</wd>
<space/>
<wd l="9115" t="9902" r="9821" b="10042">contains</wd>
<space/>
<wd l="9893" t="9912" r="10200" b="10042">two</wd>
<space/>
<wd l="10272" t="9898" r="10670" b="10042">NEs.</wd>
<space/>
</ln>
<ln l="6101" t="10123" r="10786" b="10330" baseLine="10277" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="10138" r="6278" b="10277">In</wd>
<space/>
<wd l="6346" t="10138" r="6624" b="10282">the</wd>
<space/>
<wd l="6696" t="10133" r="7027" b="10282">first</wd>
<space/>
<wd l="7109" t="10152" r="7502" b="10320">step,</wd>
<space/>
<wd l="7589" t="10138" r="8318" b="10282">so-called</wd>
<space/>
<wd l="8400" t="10138" r="9163" b="10282">skeletons</wd>
<space/>
<wd l="9259" t="10123" r="10142" b="10330">(simplified</wd>
<space/>
<wd l="10219" t="10138" r="10786" b="10320">depen-</wd>
</ln>
<ln l="6101" t="10363" r="10790" b="10570" baseLine="10512" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="10378" r="6600" b="10560">dency</wd>
<space/>
<wd l="6662" t="10363" r="7128" b="10570">trees)</wd>
<space/>
<wd l="7214" t="10426" r="7474" b="10522">are</wd>
<space/>
<wd l="7546" t="10378" r="8390" b="10522">extracted.</wd>
<space/>
<wd l="8501" t="10378" r="8717" b="10522">To</wd>
<space/>
<wd l="8789" t="10378" r="9221" b="10522">build</wd>
<space/>
<wd l="9288" t="10378" r="9562" b="10522">the</wd>
<space/>
<wd l="9629" t="10378" r="10445" b="10555">skeletons,</wd>
<space/>
<wd l="10517" t="10378" r="10790" b="10522">the</wd>
<space/>
</ln>
<ln l="6106" t="10603" r="10786" b="10810" baseLine="10752" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6106" t="10613" r="6840" b="10762">Stanford</wd>
<space/>
<wd l="6902" t="10666" r="7430" b="10800">parser</wd>
<space/>
<wd l="7507" t="10603" r="8309" b="10810">(Stanford</wd>
<space/>
<wd l="8371" t="10618" r="8962" b="10795">Parser,</wd>
<space/>
<wd l="9043" t="10603" r="9490" b="10810">2007)</wd>
<space/>
<wd l="9571" t="10622" r="9691" b="10762">is</wd>
<space/>
<wd l="9758" t="10618" r="10138" b="10762">used</wd>
<space/>
<wd l="10195" t="10632" r="10368" b="10762">to</wd>
<space/>
<wd l="10435" t="10666" r="10786" b="10800">gen-</wd>
</ln>
<ln l="6101" t="10853" r="10786" b="11040" baseLine="10992" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="10872" r="6528" b="11002">erate</wd>
<space/>
<wd l="6586" t="10858" r="7598" b="11040">dependency</wd>
<space/>
<wd l="7646" t="10872" r="8054" b="11002">trees</wd>
<space/>
<wd l="8117" t="10853" r="8347" b="11002">for</wd>
<space/>
<wd l="8400" t="10858" r="8674" b="11002">the</wd>
<space/>
<wd l="8731" t="10858" r="9662" b="11040">potentially</wd>
<space/>
<wd l="9720" t="10858" r="10387" b="11002">relevant</wd>
<space/>
<wd l="10454" t="10906" r="10786" b="11002">sen-</wd>
</ln>
<ln l="6096" t="11093" r="10795" b="11275" baseLine="11232" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="11107" r="6667" b="11237">tences.</wd>
<space/>
<wd l="6816" t="11093" r="7099" b="11237">For</wd>
<space/>
<wd l="7186" t="11093" r="7560" b="11237">each</wd>
<space/>
<wd l="7642" t="11093" r="7925" b="11232">NE</wd>
<space/>
<wd l="8006" t="11098" r="8347" b="11275">pair</wd>
<space/>
<wd l="8429" t="11098" r="8592" b="11232">in</wd>
<space/>
<wd l="8674" t="11141" r="8770" b="11237">a</wd>
<space/>
<wd l="8851" t="11107" r="9614" b="11270">sentence,</wd>
<space/>
<wd l="9710" t="11093" r="9984" b="11237">the</wd>
<space/>
<wd l="10070" t="11141" r="10795" b="11237">common</wd>
<space/>
</ln>
<ln l="6101" t="11328" r="10790" b="11515" baseLine="11472" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="11347" r="6446" b="11477">root</wd>
<space/>
<wd l="6514" t="11333" r="7171" b="11477">element</wd>
<space/>
<wd l="7238" t="11338" r="7397" b="11472">in</wd>
<space/>
<wd l="7450" t="11333" r="7723" b="11477">the</wd>
<space/>
<wd l="7786" t="11333" r="8995" b="11515">corresponding</wd>
<space/>
<wd l="9048" t="11347" r="9379" b="11477">tree</wd>
<space/>
<wd l="9437" t="11338" r="9562" b="11477">is</wd>
<space/>
<wd l="9624" t="11328" r="10416" b="11477">identified</wd>
<space/>
<wd l="10478" t="11333" r="10790" b="11477">and</wd>
<space/>
</ln>
<ln l="6096" t="11568" r="10786" b="11717" baseLine="11707" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="11573" r="6370" b="11717">the</wd>
<space/>
<wd l="6442" t="11573" r="7176" b="11717">elements</wd>
<space/>
<wd l="7253" t="11568" r="7651" b="11717">from</wd>
<space/>
<wd l="7718" t="11573" r="8098" b="11717">each</wd>
<space/>
<wd l="8165" t="11568" r="8333" b="11717">of</wd>
<space/>
<wd l="8386" t="11573" r="8659" b="11717">the</wd>
<space/>
<wd l="8731" t="11573" r="9082" b="11717">NEs</wd>
<space/>
<wd l="9154" t="11587" r="9326" b="11717">to</wd>
<space/>
<wd l="9394" t="11573" r="9667" b="11717">the</wd>
<space/>
<wd l="9739" t="11587" r="10080" b="11717">root</wd>
<space/>
<wd l="10162" t="11621" r="10421" b="11717">are</wd>
<space/>
<wd l="10488" t="11573" r="10786" b="11717">col-</wd>
</ln>
<ln l="6101" t="11808" r="10776" b="11995" baseLine="11947" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="11813" r="6643" b="11957">lected.</wd>
<space/>
<wd l="6754" t="11808" r="7008" b="11952">An</wd>
<space/>
<wd l="7075" t="11813" r="7781" b="11995">example</wd>
<space/>
<wd l="7853" t="11808" r="8016" b="11957">of</wd>
<space/>
<wd l="8074" t="11861" r="8170" b="11957">a</wd>
<space/>
<wd l="8237" t="11813" r="8928" b="11957">skeleton</wd>
<space/>
<wd l="8995" t="11818" r="9120" b="11957">is</wd>
<space/>
<wd l="9192" t="11813" r="9725" b="11957">shown</wd>
<space/>
<wd l="9792" t="11818" r="9955" b="11952">in</wd>
<space/>
<wd l="10022" t="11813" r="10574" b="11995">Figure</wd>
<space/>
<wd l="10651" t="11818" r="10776" b="11957">5.</wd>
<space/>
</ln>
<ln l="6101" t="12053" r="10795" b="12240" baseLine="12192" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="12058" r="6278" b="12197">In</wd>
<space/>
<wd l="6355" t="12058" r="6629" b="12202">the</wd>
<space/>
<wd l="6710" t="12058" r="7277" b="12202">second</wd>
<space/>
<wd l="7363" t="12072" r="7752" b="12240">step,</wd>
<space/>
<wd l="7848" t="12053" r="8856" b="12202">information</wd>
<space/>
<wd l="8933" t="12058" r="9413" b="12202">based</wd>
<space/>
<wd l="9499" t="12106" r="9701" b="12202">on</wd>
<space/>
<wd l="9782" t="12058" r="10795" b="12240">dependency</wd>
<space/>
</ln>
<ln l="6096" t="12288" r="10786" b="12475" baseLine="12432" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="12307" r="6552" b="12475">types</wd>
<space/>
<wd l="6677" t="12298" r="6802" b="12437">is</wd>
<space/>
<wd l="6926" t="12293" r="7733" b="12437">extracted</wd>
<space/>
<wd l="7858" t="12288" r="8088" b="12437">for</wd>
<space/>
<wd l="8208" t="12293" r="8482" b="12437">the</wd>
<space/>
<wd l="8602" t="12293" r="9533" b="12475">potentially</wd>
<space/>
<wd l="9653" t="12293" r="10325" b="12437">relevant</wd>
<space/>
<wd l="10454" t="12341" r="10786" b="12437">sen-</wd>
</ln>
<ln l="6096" t="12518" r="10786" b="12725" baseLine="12672" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="12547" r="6667" b="12677">tences.</wd>
<space/>
<wd l="6869" t="12533" r="7627" b="12715">Focusing</wd>
<space/>
<wd l="7728" t="12581" r="7934" b="12677">on</wd>
<space/>
<wd l="8030" t="12533" r="8400" b="12677">verb</wd>
<space/>
<wd l="8506" t="12533" r="9240" b="12677">relations</wd>
<space/>
<wd l="9360" t="12518" r="9734" b="12725">(this</wd>
<space/>
<wd l="9845" t="12581" r="10138" b="12677">can</wd>
<space/>
<wd l="10238" t="12533" r="10435" b="12677">be</wd>
<space/>
<wd l="10541" t="12581" r="10786" b="12677">ex-</wd>
</ln>
<ln l="6096" t="12758" r="10795" b="12965" baseLine="12907" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="12773" r="6677" b="12917">tended</wd>
<space/>
<wd l="6749" t="12787" r="6922" b="12917">to</wd>
<space/>
<wd l="6994" t="12773" r="7445" b="12917">other</wd>
<space/>
<wd l="7507" t="12787" r="7963" b="12955">types</wd>
<space/>
<wd l="8040" t="12768" r="8203" b="12917">of</wd>
<space/>
<wd l="8266" t="12758" r="9120" b="12965">relations),</wd>
<space/>
<wd l="9202" t="12821" r="9422" b="12917">we</wd>
<space/>
<wd l="9494" t="12773" r="10032" b="12917">collect</wd>
<space/>
<wd l="10114" t="12768" r="10349" b="12917">for</wd>
<space/>
<wd l="10416" t="12773" r="10795" b="12917">each</wd>
<space/>
</ln>
<ln l="6096" t="12998" r="10786" b="13205" baseLine="13147" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="13013" r="6470" b="13157">verb</wd>
<space/>
<wd l="6566" t="13018" r="6768" b="13157">its</wd>
<space/>
<wd l="6864" t="12998" r="7762" b="13205">subject(s),</wd>
<space/>
<wd l="7872" t="12998" r="8678" b="13205">object(s),</wd>
<space/>
<wd l="8789" t="12998" r="9970" b="13205">preposition(s)</wd>
<space/>
<wd l="10075" t="13013" r="10464" b="13157">with</wd>
<space/>
<wd l="10555" t="13061" r="10786" b="13157">ar-</wd>
</ln>
<ln l="6101" t="13238" r="10786" b="13445" baseLine="13387" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13267" r="6816" b="13435">guments</wd>
<space/>
<wd l="6917" t="13253" r="7229" b="13397">and</wd>
<space/>
<wd l="7325" t="13253" r="8083" b="13435">auxiliary</wd>
<space/>
<wd l="8174" t="13238" r="8822" b="13445">verb(s).</wd>
<space/>
<wd l="8990" t="13253" r="9264" b="13397">We</wd>
<space/>
<wd l="9360" t="13301" r="9653" b="13397">can</wd>
<space/>
<wd l="9749" t="13301" r="10094" b="13397">now</wd>
<space/>
<wd l="10186" t="13267" r="10786" b="13397">extract</wd>
<space/>
</ln>
<ln l="6096" t="13483" r="10795" b="13670" baseLine="13627" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="13488" r="6470" b="13632">verb</wd>
<space/>
<wd l="6562" t="13488" r="7291" b="13632">relations</wd>
<space/>
<wd l="7382" t="13493" r="7834" b="13670">using</wd>
<space/>
<wd l="7920" t="13536" r="8016" b="13632">a</wd>
<space/>
<wd l="8102" t="13488" r="8650" b="13670">simple</wd>
<space/>
<wd l="8736" t="13488" r="9610" b="13670">algorithm:</wd>
<space/>
<wd l="9749" t="13488" r="10022" b="13632">We</wd>
<space/>
<wd l="10109" t="13483" r="10613" b="13632">define</wd>
<space/>
<wd l="10699" t="13536" r="10795" b="13632">a</wd>
<space/>
</ln>
<ln l="6096" t="13728" r="10786" b="13910" baseLine="13867" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="13728" r="6470" b="13872">verb</wd>
<space/>
<wd l="6542" t="13728" r="7200" b="13872">relation</wd>
<space/>
<wd l="7267" t="13742" r="7440" b="13872">to</wd>
<space/>
<wd l="7512" t="13728" r="7709" b="13872">be</wd>
<space/>
<wd l="7781" t="13776" r="7877" b="13872">a</wd>
<space/>
<wd l="7939" t="13728" r="8314" b="13872">verb</wd>
<space/>
<wd l="8381" t="13728" r="9101" b="13910">together</wd>
<space/>
<wd l="9163" t="13728" r="9552" b="13872">with</wd>
<space/>
<wd l="9619" t="13733" r="9821" b="13872">its</wd>
<space/>
<wd l="9898" t="13742" r="10786" b="13910">arguments</wd>
<space/>
</ln>
<ln l="6115" t="13954" r="10790" b="14160" baseLine="14102" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6115" t="13954" r="7075" b="14160">(subject(s),</wd>
<space/>
<wd l="7186" t="13954" r="7934" b="14160">object(s)</wd>
<space/>
<wd l="8045" t="13968" r="8357" b="14112">and</wd>
<space/>
<wd l="8458" t="13968" r="9571" b="14150">prepositional</wd>
<space/>
<wd l="9667" t="13954" r="10363" b="14160">phrases)</wd>
<space/>
<wd l="10478" t="13968" r="10790" b="14112">and</wd>
<space/>
</ln>
<ln l="6101" t="14203" r="10786" b="14390" baseLine="14342" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="14208" r="6806" b="14352">consider</wd>
<space/>
<wd l="6874" t="14208" r="7238" b="14390">only</wd>
<space/>
<wd l="7296" t="14208" r="7752" b="14352">those</wd>
<space/>
<wd l="7819" t="14208" r="8549" b="14352">relations</wd>
<space/>
<wd l="8616" t="14222" r="8789" b="14352">to</wd>
<space/>
<wd l="8856" t="14208" r="9058" b="14352">be</wd>
<space/>
<wd l="9125" t="14203" r="9288" b="14352">of</wd>
<space/>
<wd l="9346" t="14213" r="9979" b="14352">interest</wd>
<space/>
<wd l="10046" t="14208" r="10555" b="14352">where</wd>
<space/>
<wd l="10622" t="14222" r="10786" b="14352">at</wd>
<space/>
</ln>
<ln l="6101" t="14443" r="10786" b="14630" baseLine="14582" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="14448" r="6485" b="14592">least</wd>
<space/>
<wd l="6566" t="14448" r="6840" b="14592">the</wd>
<space/>
<wd l="6912" t="14448" r="7526" b="14630">subject</wd>
<space/>
<wd l="7608" t="14496" r="7781" b="14592">or</wd>
<space/>
<wd l="7848" t="14448" r="8122" b="14592">the</wd>
<space/>
<wd l="8198" t="14448" r="8717" b="14630">object</wd>
<space/>
<wd l="8803" t="14453" r="8923" b="14592">is</wd>
<space/>
<wd l="9005" t="14496" r="9206" b="14592">an</wd>
<space/>
<wd l="9283" t="14448" r="9600" b="14587">NE.</wd>
<space/>
<wd l="9686" t="14448" r="9960" b="14592">We</wd>
<space/>
<wd l="10032" t="14443" r="10440" b="14592">filter</wd>
<space/>
<wd l="10512" t="14462" r="10786" b="14592">out</wd>
<space/>
</ln>
<ln l="6101" t="14683" r="9024" b="14866" baseLine="14822" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="14683" r="6835" b="14827">relations</wd>
<space/>
<wd l="6907" t="14683" r="7291" b="14827">with</wd>
<space/>
<wd l="7363" t="14683" r="7733" b="14866">only</wd>
<space/>
<wd l="7800" t="14731" r="8093" b="14827">one</wd>
<space/>
<wd l="8165" t="14698" r="9024" b="14866">argument.</wd>
</ln>
</para>
<para l="6106" t="15106" r="8582" b="15288" alignment="left" spaceBefore="185" lsp="exactly" lspExact="238" language="en">
<ln l="6106" t="15106" r="8582" b="15288" baseLine="15245" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="13">
<wd l="6106" t="15110" r="6437" b="15250">2.3.</wd>
<space/>
<wd l="6686" t="15106" r="7526" b="15250">Relation</wd>
<space/>
<wd l="7608" t="15106" r="8582" b="15288">clustering</wd>
</ln>
</para>
<para l="6101" t="15403" r="10795" b="15826" alignment="justified" spaceBefore="57" lsp="exactly" lspExact="235" language="en">
<ln l="6101" t="15403" r="10795" b="15586" baseLine="15542" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="6101" t="15403" r="6830" b="15547">Relation</wd>
<space/>
<wd l="6931" t="15403" r="7574" b="15547">clusters</wd>
<space/>
<wd l="7680" t="15451" r="7939" b="15547">are</wd>
<space/>
<wd l="8040" t="15403" r="8870" b="15586">generated</wd>
<space/>
<wd l="8971" t="15403" r="9178" b="15586">by</wd>
<space/>
<wd l="9278" t="15408" r="10037" b="15586">grouping</wd>
<space/>
<wd l="10133" t="15403" r="10795" b="15547">relation</wd>
<space/>
</ln>
<ln l="6101" t="15643" r="9101" b="15826" baseLine="15782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="6101" t="15648" r="6878" b="15787">instances</wd>
<space/>
<wd l="6955" t="15643" r="7435" b="15787">based</wd>
<space/>
<wd l="7512" t="15691" r="7714" b="15787">on</wd>
<space/>
<wd l="7781" t="15643" r="8189" b="15787">their</wd>
<space/>
<wd l="8261" t="15643" r="9101" b="15826">similarity.</wd>
</ln>
</para>
</column>
</section>
</body>
</page>
<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">
<description>
<source file="pdf\L08-1001.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>
<theoreticalPage size="A4" marginLeft="1038" marginTop="1380" marginRight="1095" marginBottom="954" offsetX="32" offsetY="16" width="11918" height="16854"/>
<language>en</language>
</description>
<body>
<section l="1038" t="6896" r="10814" b="10648">
<column l="1038" t="6896" r="10814" b="10648">
<para l="4622" t="6941" r="7214" b="7128" alignment="centered" spaceAfter="598" lsp="exactly" lspExact="238" language="en">
<ln l="4622" t="6941" r="7214" b="7128" baseLine="7080" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="4622" t="6946" r="5179" b="7128">Figure</wd>
<space/>
<wd l="5251" t="6946" r="5386" b="7085">4:</wd>
<space/>
<wd l="5501" t="6941" r="6115" b="7128">System</wd>
<space/>
<wd l="6187" t="6946" r="7214" b="7090">architecture</wd>
</ln>
</para>
<picture l="3518" t="7742" r="8520" b="9475" alignment="left" li="2480" ri="2294" spaceAfter="296">
</picture>
<para l="1042" t="9816" r="10805" b="10243" alignment="justified" spaceAfter="392" lsp="exactly" lspExact="240" language="en">
<ln l="1046" t="9816" r="10805" b="10003" baseLine="9955" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="9821" r="1603" b="10003">Figure</wd>
<space/>
<wd l="1685" t="9826" r="1814" b="9965">5:</wd>
<space/>
<wd l="1944" t="9816" r="2664" b="9965">Skeleton</wd>
<space/>
<wd l="2741" t="9816" r="2971" b="9965">for</wd>
<space/>
<wd l="3043" t="9821" r="3322" b="9965">the</wd>
<space/>
<wd l="3398" t="9821" r="3677" b="9960">NE</wd>
<space/>
<wd l="3754" t="9826" r="4094" b="10003">pair</wd>
<space/>
<wd l="4171" t="9821" r="5448" b="9965">“Hohenzollern”</wd>
<space/>
<wd l="5525" t="9821" r="5837" b="9965">and</wd>
<space/>
<wd l="5918" t="9821" r="7195" b="10003">“Brandenburg”</wd>
<space/>
<wd l="7272" t="9826" r="7435" b="9960">in</wd>
<space/>
<wd l="7507" t="9821" r="7781" b="9965">the</wd>
<space/>
<wd l="7862" t="9835" r="8578" b="9965">sentence</wd>
<space/>
<wd l="8659" t="9816" r="9706" b="10003">“Subsequent</wd>
<space/>
<wd l="9792" t="9821" r="10555" b="9965">members</wd>
<space/>
<wd l="10637" t="9816" r="10805" b="9965">of</wd>
<space/>
</ln>
<ln l="1042" t="10056" r="8381" b="10243" baseLine="10195" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1042" t="10061" r="1315" b="10205">the</wd>
<space/>
<wd l="1392" t="10061" r="2520" b="10205">Hohenzollern</wd>
<space/>
<wd l="2592" t="10056" r="3130" b="10243">family</wd>
<space/>
<wd l="3197" t="10061" r="3634" b="10205">ruled</wd>
<space/>
<wd l="3710" t="10061" r="4104" b="10205">until</wd>
<space/>
<wd l="4186" t="10066" r="4570" b="10205">1918</wd>
<space/>
<wd l="4642" t="10066" r="4805" b="10200">in</wd>
<space/>
<wd l="4877" t="10061" r="5443" b="10238">Berlin,</wd>
<space/>
<wd l="5525" t="10056" r="5856" b="10205">first</wd>
<space/>
<wd l="5938" t="10109" r="6101" b="10205">as</wd>
<space/>
<wd l="6182" t="10061" r="6821" b="10205">electors</wd>
<space/>
<wd l="6902" t="10056" r="7066" b="10205">of</wd>
<space/>
<wd l="7128" t="10061" r="8381" b="10243">Brandenburg.“</wd>
</ln>
</para>
</column>
</section>
<dd l="1038" t="1380" r="10814" b="6896">
<dd l="2237" t="1387" r="9600" b="6634">
<picture l="2237" t="1387" r="9600" b="6634" alignment="left">
</picture>
</dd>
<dd l="8093" t="3942" r="9192" b="4246">
<para l="8093" t="3974" r="9187" b="4219" alignment="left" li="288" fli="-288" lsp="exactly" lspExact="145" language="en">
<ln l="8093" t="3974" r="9187" b="4061" baseLine="4051" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-5">
<wd l="8093" t="3974" r="9187" b="4061">sentence/documents+</wd>
<space/>
</ln>
<ln l="8366" t="4128" r="8842" b="4219" baseLine="4210" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-5">
<wd l="8366" t="4133" r="8515" b="4214">NE</wd>
<space/>
<wd l="8549" t="4133" r="8842" b="4219">tables</wd>
</ln>
</para>
</dd>
<dd l="2565" t="3904" r="3325" b="4049">
<para l="2598" t="3931" r="3292" b="4018" alignment="left" spaceBefore="6" lsp="exactly" lspExact="136" language="en">
<ln l="2664" t="3931" r="3226" b="4018" baseLine="4013" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="3">
<wd l="2664" t="3931" r="3130" b="4018">skeletons</wd>
<space/>
<wd l="3168" t="3960" r="3226" b="4018">+</wd>
</ln>
</para>
</dd>
<dd l="2512" t="4049" r="3368" b="4164">
<para l="2545" t="4051" r="3335" b="4138" alignment="left" lsp="exactly" lspExact="112" language="en">
<ln l="2611" t="4051" r="3269" b="4138" baseLine="4128" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="2">
<wd l="2611" t="4051" r="3269" b="4138">sov−relations</wd>
</ln>
</para>
</dd>
<dd l="6175" t="4336" r="6857" b="4579">
<para l="6208" t="4363" r="6824" b="4560" alignment="left" li="72" spaceBefore="33" lsp="exactly" lspExact="97" language="en">
<ln l="6274" t="4363" r="6758" b="4478" baseLine="4445" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="6274" t="4368" r="6629" b="4478">filtering</wd>
<space/>
<wd l="6667" t="4368" r="6758" b="4454">of</wd>
<space/>
</ln>
<ln l="6331" t="4469" r="6720" b="4560" baseLine="4550" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="6331" t="4474" r="6720" b="4560">relevant</wd>
</ln>
</para>
</dd>
<dd l="6175" t="4579" r="6877" b="4692">
<para l="6208" t="4579" r="6844" b="4666" alignment="left" lsp="exactly" lspExact="101" language="en">
<ln l="6274" t="4579" r="6778" b="4666" baseLine="4656" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="4">
<wd l="6274" t="4584" r="6778" b="4666">sentences</wd>
</ln>
</para>
</dd>
<dd l="4272" t="4259" r="5189" b="4747">
<para l="4272" t="4286" r="5184" b="4742" alignment="centered" spaceBefore="34" lsp="exactly" lspExact="111" language="en">
<ln l="4507" t="4286" r="4944" b="4402" baseLine="4368" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-5" forcedEOF="true">
<wd l="4507" t="4291" r="4944" b="4402">syntactic</wd>
</ln>
<ln l="4723" t="4392" r="4781" b="4478" baseLine="4474" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-5" forcedEOF="true">
<wd l="4723" t="4416" r="4781" b="4478">+</wd>
</ln>
<ln l="4272" t="4493" r="5184" b="4608" baseLine="4579" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-5" forcedEOF="true">
<wd l="4272" t="4498" r="4541" b="4608">typed</wd>
<space/>
<wd l="4574" t="4498" r="5184" b="4608">dependency</wd>
</ln>
<ln l="4541" t="4622" r="4896" b="4742" baseLine="4709" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-5" forcedEOF="true">
<wd l="4541" t="4632" r="4896" b="4742">parsing</wd>
</ln>
</para>
</dd>
<dd l="2386" t="4977" r="3758" b="5177">
<para l="2386" t="5011" r="3754" b="5141" alignment="left" spaceBefore="3" lsp="exactly" lspExact="189" language="en">
<ln l="2386" t="5011" r="3754" b="5141" baseLine="5131" underlined="none" subsuperscript="none" fontSize="850" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-8">
<wd l="2386" t="5011" r="2981" b="5141">Relation</wd>
<space/>
<wd l="3038" t="5011" r="3754" b="5141">extraction</wd>
</ln>
</para>
</dd>
<dd l="8040" t="5550" r="9346" b="5695">
<para l="8040" t="5578" r="9341" b="5669" alignment="left" spaceBefore="6" lsp="exactly" lspExact="132" language="en">
<ln l="8040" t="5578" r="9341" b="5669" baseLine="5659" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-7">
<wd l="8040" t="5582" r="8280" b="5669">table</wd>
<space/>
<wd l="8314" t="5582" r="8410" b="5669">of</wd>
<space/>
<wd l="8438" t="5582" r="8885" b="5669">clustered</wd>
<space/>
<wd l="8928" t="5582" r="9341" b="5669">relations</wd>
</ln>
</para>
</dd>
<dd l="2723" t="5838" r="3281" b="6120">
<para l="2756" t="5870" r="3248" b="6115" alignment="left" spaceBefore="10" spaceAfter="2" lsp="exactly" lspExact="135" language="en">
<ln l="2827" t="5870" r="3182" b="5957" baseLine="5947" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="12">
<wd l="2827" t="5870" r="3182" b="5957">relation</wd>
<space/>
</ln>
<ln l="2822" t="6005" r="3178" b="6115" baseLine="6082" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="12">
<wd l="2822" t="6005" r="3178" b="6115">filtering</wd>
</ln>
</para>
</dd>
<dd l="5488" t="5920" r="6161" b="6067">
<para l="5521" t="5947" r="6128" b="6062" alignment="left" spaceBefore="6" lsp="exactly" lspExact="136" language="en">
<ln l="5587" t="5947" r="6062" b="6062" baseLine="6029" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="4">
<wd l="5587" t="5952" r="6062" b="6062">clustering</wd>
</ln>
</para>
</dd>
<dd l="2414" t="6350" r="3773" b="6550">
<para l="2414" t="6379" r="3768" b="6542" alignment="left" spaceBefore="3" lsp="exactly" lspExact="184" language="en">
<ln l="2414" t="6379" r="3768" b="6542" baseLine="6504" underlined="none" subsuperscript="none" fontSize="850" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-8">
<wd l="2414" t="6379" r="3005" b="6509">Relation</wd>
<space/>
<wd l="3062" t="6379" r="3768" b="6542">clustering</wd>
</ln>
</para>
</dd>
<dd l="2386" t="3264" r="3442" b="3467">
<para l="2386" t="3293" r="3437" b="3461" alignment="left" spaceBefore="3" lsp="exactly" lspExact="189" language="en">
<ln l="2386" t="3293" r="3437" b="3461" baseLine="3418" underlined="none" subsuperscript="none" fontSize="850" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-10">
<wd l="2386" t="3298" r="3437" b="3461">Preprocessing</wd>
</ln>
</para>
</dd>
<dd l="2424" t="2046" r="3206" b="2191">
<para l="2424" t="2074" r="3202" b="2160" alignment="left" spaceBefore="6" lsp="exactly" lspExact="136" language="en">
<ln l="2424" t="2074" r="3202" b="2160" baseLine="2155" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-12">
<wd l="2424" t="2074" r="2630" b="2160">web</wd>
<space/>
<wd l="2659" t="2074" r="3202" b="2160">documents</wd>
</ln>
</para>
</dd>
<dd l="3827" t="2200" r="4515" b="2479">
<para l="3860" t="2232" r="4482" b="2453" alignment="left" li="72" spaceBefore="11" lsp="exactly" lspExact="132" language="en">
<ln l="3926" t="2232" r="4416" b="2318" baseLine="2309" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="3926" t="2232" r="4416" b="2318">document</wd>
<space/>
</ln>
<ln l="3984" t="2362" r="4373" b="2453" baseLine="2443" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="3984" t="2366" r="4373" b="2453">retrieval</wd>
</ln>
</para>
</dd>
<dd l="4778" t="2017" r="5614" b="2297">
<para l="4811" t="2050" r="5581" b="2266" alignment="left" spaceBefore="10" lsp="exactly" lspExact="131" language="en">
<ln l="4877" t="2050" r="5515" b="2160" baseLine="2126" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="4877" t="2050" r="5112" b="2160">topic</wd>
<space/>
<wd l="5146" t="2050" r="5515" b="2160">specific</wd>
<space/>
</ln>
<ln l="4906" t="2179" r="5448" b="2266" baseLine="2261" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="4906" t="2179" r="5448" b="2266">documents</wd>
</ln>
</para>
</dd>
<dd l="5939" t="2253" r="6670" b="2398">
<para l="5972" t="2280" r="6637" b="2371" alignment="left" spaceBefore="6" lsp="exactly" lspExact="131" language="en">
<ln l="6038" t="2280" r="6571" b="2371" baseLine="2362" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="3">
<wd l="6038" t="2285" r="6571" b="2371">conversion</wd>
</ln>
</para>
</dd>
<dd l="6938" t="2017" r="7678" b="2297">
<para l="6971" t="2045" r="7645" b="2266" alignment="left" spaceBefore="10" fli="72" lsp="exactly" lspExact="131" language="en">
<ln l="7094" t="2045" r="7536" b="2160" baseLine="2126" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="7094" t="2050" r="7325" b="2160">plain</wd>
<space/>
<wd l="7358" t="2054" r="7536" b="2136">text</wd>
<space/>
</ln>
<ln l="7037" t="2179" r="7579" b="2266" baseLine="2261" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="7037" t="2179" r="7579" b="2266">documents</wd>
</ln>
</para>
</dd>
<dd l="8122" t="2017" r="9173" b="2165">
<para l="8122" t="2050" r="9168" b="2160" alignment="left" spaceBefore="6" lsp="exactly" lspExact="137" language="en">
<ln l="8122" t="2050" r="9168" b="2160" baseLine="2126" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-4">
<wd l="8122" t="2054" r="8568" b="2136">sentence</wd>
<space/>
<wd l="8702" t="2050" r="9168" b="2160">boundary</wd>
</ln>
</para>
</dd>
<dd l="8338" t="2165" r="9091" b="2453">
<para l="8434" t="2174" r="8914" b="2280" alignment="left" li="72" lsp="exactly" lspExact="132" language="en">
<ln l="8434" t="2174" r="8914" b="2280" baseLine="2261" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-3">
<wd l="8434" t="2179" r="8914" b="2280">detection,</wd>
</ln>
</para>
<para l="8338" t="2333" r="9086" b="2448" alignment="left" spaceBefore="14" lsp="exactly" lspExact="137" language="en">
<ln l="8338" t="2333" r="9086" b="2448" baseLine="2414" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="-11">
<wd l="8338" t="2338" r="8482" b="2419">NE</wd>
<space/>
<wd l="8520" t="2338" r="9086" b="2448">recognition,</wd>
</ln>
</para>
</dd>
<dd l="8258" t="2464" r="9041" b="2609">
<para l="8291" t="2491" r="9008" b="2582" alignment="left" spaceBefore="6" lsp="exactly" lspExact="136" language="en">
<ln l="8357" t="2491" r="8942" b="2582" baseLine="2573" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="3">
<wd l="8357" t="2491" r="8942" b="2582">coreference</wd>
</ln>
</para>
</dd>
<dd l="8315" t="3126" r="8965" b="3377">
<para l="8348" t="3154" r="8932" b="3370" alignment="left" li="72" spaceBefore="39" lsp="exactly" lspExact="102" language="en">
<ln l="8414" t="3154" r="8866" b="3264" baseLine="3235" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="8414" t="3154" r="8866" b="3264">language</wd>
<space/>
</ln>
<ln l="8462" t="3254" r="8818" b="3370" baseLine="3341" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="0">
<wd l="8462" t="3259" r="8818" b="3370">filtering</wd>
</ln>
</para>
</dd>
<dd l="8339" t="2609" r="9013" b="2743">
<para l="8372" t="2621" r="8980" b="2712" alignment="left" lsp="exactly" lspExact="127" language="en">
<ln l="8438" t="2621" r="8914" b="2712" baseLine="2707" underlined="none" subsuperscript="none" fontSize="600" fontFace="Arial" fontFamily="swiss" fontPitch="variable" spacing="3">
<wd l="8438" t="2626" r="8914" b="2712">resolution</wd>
</ln>
</para>
</dd>
</dd>
<section l="1042" t="10648" r="10811" b="15884">
<column l="1042" t="10648" r="5756" b="15884">
<para l="1042" t="10690" r="5741" b="13747" alignment="justified" lsp="exactly" lspExact="238" language="en">
<ln l="1046" t="10690" r="5736" b="10877" baseLine="10834" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="10694" r="1382" b="10838">The</wd>
<space/>
<wd l="1478" t="10694" r="2486" b="10877">comparably</wd>
<space/>
<wd l="2582" t="10694" r="2995" b="10877">large</wd>
<space/>
<wd l="3091" t="10709" r="3734" b="10838">amount</wd>
<space/>
<wd l="3835" t="10690" r="4003" b="10838">of</wd>
<space/>
<wd l="4085" t="10694" r="4469" b="10838">data</wd>
<space/>
<wd l="4560" t="10699" r="4723" b="10834">in</wd>
<space/>
<wd l="4810" t="10694" r="5083" b="10838">the</wd>
<space/>
<wd l="5179" t="10742" r="5736" b="10877">corpus</wd>
<space/>
</ln>
<ln l="1046" t="10930" r="5722" b="11117" baseLine="11069" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="10939" r="1718" b="11117">requires</wd>
<space/>
<wd l="1824" t="10934" r="2098" b="11078">the</wd>
<space/>
<wd l="2203" t="10982" r="2472" b="11078">use</wd>
<space/>
<wd l="2578" t="10930" r="2746" b="11078">of</wd>
<space/>
<wd l="2837" t="10982" r="3038" b="11078">an</wd>
<space/>
<wd l="3144" t="10930" r="3797" b="11078">efficient</wd>
<space/>
<wd l="3907" t="10934" r="4747" b="11117">clustering</wd>
<space/>
<wd l="4848" t="10934" r="5722" b="11117">algorithm.</wd>
<space/>
</ln>
<ln l="1051" t="11170" r="5736" b="11357" baseLine="11309" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1051" t="11170" r="1834" b="11318">Standard</wd>
<space/>
<wd l="1939" t="11174" r="2237" b="11314">ML</wd>
<space/>
<wd l="2338" t="11174" r="3178" b="11357">clustering</wd>
<space/>
<wd l="3274" t="11174" r="4181" b="11357">algorithms</wd>
<space/>
<wd l="4286" t="11174" r="4661" b="11318">such</wd>
<space/>
<wd l="4762" t="11222" r="4925" b="11318">as</wd>
<space/>
<wd l="5030" t="11174" r="5736" b="11318">k-means</wd>
<space/>
</ln>
<ln l="1046" t="11400" r="5741" b="11606" baseLine="11549" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="11414" r="1358" b="11558">and</wd>
<space/>
<wd l="1464" t="11414" r="1771" b="11554">EM</wd>
<space/>
<wd l="1886" t="11400" r="2117" b="11606">(as</wd>
<space/>
<wd l="2222" t="11414" r="2966" b="11597">provided</wd>
<space/>
<wd l="3072" t="11414" r="3274" b="11597">by</wd>
<space/>
<wd l="3370" t="11414" r="3643" b="11558">the</wd>
<space/>
<wd l="3739" t="11414" r="4210" b="11558">Weka</wd>
<space/>
<wd l="4306" t="11414" r="4958" b="11558">toolbox</wd>
<space/>
<wd l="5069" t="11400" r="5741" b="11606">(Witten</wd>
<space/>
</ln>
<ln l="1046" t="11640" r="5736" b="11846" baseLine="11789" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="11654" r="1358" b="11798">and</wd>
<space/>
<wd l="1440" t="11654" r="1987" b="11832">Frank,</wd>
<space/>
<wd l="2083" t="11640" r="2606" b="11846">2005))</wd>
<space/>
<wd l="2707" t="11654" r="3091" b="11798">have</wd>
<space/>
<wd l="3173" t="11654" r="3571" b="11798">been</wd>
<space/>
<wd l="3643" t="11654" r="4157" b="11798">tested</wd>
<space/>
<wd l="4243" t="11650" r="4474" b="11798">for</wd>
<space/>
<wd l="4555" t="11654" r="5390" b="11837">clustering</wd>
<space/>
<wd l="5462" t="11654" r="5736" b="11798">the</wd>
<space/>
</ln>
<ln l="1046" t="11890" r="5736" b="12034" baseLine="12029" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="11890" r="1781" b="12034">relations</wd>
<space/>
<wd l="1872" t="11904" r="2035" b="12034">at</wd>
<space/>
<wd l="2131" t="11890" r="2554" b="12034">hand</wd>
<space/>
<wd l="2645" t="11890" r="2928" b="12034">but</wd>
<space/>
<wd l="3019" t="11938" r="3413" b="12034">were</wd>
<space/>
<wd l="3499" t="11904" r="3773" b="12034">not</wd>
<space/>
<wd l="3869" t="11890" r="4214" b="12034">able</wd>
<space/>
<wd l="4301" t="11904" r="4474" b="12034">to</wd>
<space/>
<wd l="4565" t="11890" r="4910" b="12034">deal</wd>
<space/>
<wd l="4997" t="11890" r="5381" b="12034">with</wd>
<space/>
<wd l="5462" t="11890" r="5736" b="12034">the</wd>
<space/>
</ln>
<ln l="1046" t="12125" r="5741" b="12312" baseLine="12269" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="12130" r="1464" b="12312">large</wd>
<space/>
<wd l="1531" t="12130" r="2184" b="12274">number</wd>
<space/>
<wd l="2256" t="12125" r="2419" b="12274">of</wd>
<space/>
<wd l="2477" t="12125" r="3149" b="12274">features</wd>
<space/>
<wd l="3221" t="12130" r="3533" b="12274">and</wd>
<space/>
<wd l="3605" t="12134" r="4382" b="12274">instances</wd>
<space/>
<wd l="4454" t="12130" r="5160" b="12312">required</wd>
<space/>
<wd l="5232" t="12125" r="5467" b="12274">for</wd>
<space/>
<wd l="5534" t="12178" r="5741" b="12274">an</wd>
<space/>
</ln>
<ln l="1046" t="12365" r="5731" b="12552" baseLine="12504" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="12370" r="1819" b="12552">adequate</wd>
<space/>
<wd l="1910" t="12374" r="3139" b="12552">representation</wd>
<space/>
<wd l="3230" t="12365" r="3394" b="12514">of</wd>
<space/>
<wd l="3470" t="12418" r="3754" b="12514">our</wd>
<space/>
<wd l="3840" t="12370" r="4507" b="12514">dataset.</wd>
<space/>
<wd l="4661" t="12370" r="4934" b="12514">We</wd>
<space/>
<wd l="5021" t="12370" r="5386" b="12514">thus</wd>
<space/>
<wd l="5482" t="12370" r="5731" b="12514">de-</wd>
</ln>
<ln l="1046" t="12610" r="5731" b="12792" baseLine="12744" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="12610" r="1493" b="12754">cided</wd>
<space/>
<wd l="1579" t="12624" r="1752" b="12754">to</wd>
<space/>
<wd l="1843" t="12658" r="2112" b="12754">use</wd>
<space/>
<wd l="2198" t="12658" r="2294" b="12754">a</wd>
<space/>
<wd l="2381" t="12614" r="2986" b="12792">scoring</wd>
<space/>
<wd l="3072" t="12610" r="3907" b="12792">algorithm</wd>
<space/>
<wd l="3989" t="12610" r="4344" b="12754">that</wd>
<space/>
<wd l="4440" t="12658" r="5237" b="12792">compares</wd>
<space/>
<wd l="5333" t="12658" r="5429" b="12754">a</wd>
<space/>
<wd l="5510" t="12658" r="5731" b="12754">re-</wd>
</ln>
<ln l="1046" t="12850" r="5736" b="13032" baseLine="12984" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="12850" r="1541" b="12994">lation</wd>
<space/>
<wd l="1613" t="12864" r="1786" b="12994">to</wd>
<space/>
<wd l="1867" t="12850" r="2318" b="12994">other</wd>
<space/>
<wd l="2395" t="12850" r="3125" b="12994">relations</wd>
<space/>
<wd l="3211" t="12850" r="3686" b="12994">based</wd>
<space/>
<wd l="3773" t="12898" r="3974" b="12994">on</wd>
<space/>
<wd l="4056" t="12854" r="4646" b="12994">certain</wd>
<space/>
<wd l="4723" t="12864" r="5342" b="13032">aspects</wd>
<space/>
<wd l="5424" t="12850" r="5736" b="12994">and</wd>
<space/>
</ln>
<ln l="1046" t="13080" r="5731" b="13267" baseLine="13224" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="13085" r="1877" b="13229">calculates</wd>
<space/>
<wd l="1944" t="13133" r="2040" b="13229">a</wd>
<space/>
<wd l="2102" t="13085" r="2918" b="13267">similarity</wd>
<space/>
<wd l="2976" t="13133" r="3446" b="13229">score.</wd>
<space/>
<wd l="3552" t="13080" r="3691" b="13224">If</wd>
<space/>
<wd l="3734" t="13085" r="4051" b="13229">this</wd>
<space/>
<wd l="4118" t="13085" r="4934" b="13267">similarity</wd>
<space/>
<wd l="4997" t="13133" r="5424" b="13229">score</wd>
<space/>
<wd l="5486" t="13133" r="5731" b="13229">ex-</wd>
</ln>
<ln l="1046" t="13320" r="5736" b="13507" baseLine="13464" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="13325" r="1493" b="13469">ceeds</wd>
<space/>
<wd l="1555" t="13373" r="1651" b="13469">a</wd>
<space/>
<wd l="1704" t="13320" r="2592" b="13507">predefined</wd>
<space/>
<wd l="2650" t="13325" r="3499" b="13502">threshold,</wd>
<space/>
<wd l="3566" t="13339" r="3874" b="13469">two</wd>
<space/>
<wd l="3931" t="13325" r="4661" b="13469">relations</wd>
<space/>
<wd l="4723" t="13373" r="4982" b="13469">are</wd>
<space/>
<wd l="5040" t="13325" r="5736" b="13507">grouped</wd>
<space/>
</ln>
<ln l="1042" t="13565" r="1800" b="13747" baseLine="13699" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1042" t="13565" r="1800" b="13747">together.</wd>
</ln>
</para>
<para l="1042" t="13805" r="5736" b="14482" alignment="justified" spaceBefore="9" lsp="exactly" lspExact="240" language="en">
<ln l="1051" t="13805" r="5736" b="13992" baseLine="13944" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1051" t="13805" r="1896" b="13992">Similarity</wd>
<space/>
<wd l="1982" t="13814" r="2102" b="13954">is</wd>
<space/>
<wd l="2198" t="13810" r="3005" b="13954">measured</wd>
<space/>
<wd l="3096" t="13810" r="3576" b="13954">based</wd>
<space/>
<wd l="3667" t="13858" r="3874" b="13954">on</wd>
<space/>
<wd l="3955" t="13810" r="4229" b="13954">the</wd>
<space/>
<wd l="4315" t="13824" r="4886" b="13992">output</wd>
<space/>
<wd l="4982" t="13805" r="5381" b="13954">from</wd>
<space/>
<wd l="5462" t="13810" r="5736" b="13954">the</wd>
<space/>
</ln>
<ln l="1046" t="14045" r="5731" b="14232" baseLine="14184" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="14045" r="1752" b="14194">different</wd>
<space/>
<wd l="1824" t="14054" r="2990" b="14232">preprocessing</wd>
<space/>
<wd l="3053" t="14064" r="3475" b="14232">steps</wd>
<space/>
<wd l="3542" t="14098" r="3706" b="14194">as</wd>
<space/>
<wd l="3773" t="14050" r="4104" b="14194">well</wd>
<space/>
<wd l="4171" t="14098" r="4334" b="14194">as</wd>
<space/>
<wd l="4406" t="14050" r="4944" b="14194">lexical</wd>
<space/>
<wd l="5011" t="14045" r="5731" b="14194">informa-</wd>
</ln>
<ln l="1042" t="14275" r="4286" b="14482" baseLine="14424" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1042" t="14294" r="1387" b="14434">tion</wd>
<space/>
<wd l="1459" t="14285" r="1853" b="14434">from</wd>
<space/>
<wd l="1925" t="14290" r="2702" b="14434">WordNet</wd>
<space/>
<wd l="2798" t="14275" r="3691" b="14482">(WordNet,</wd>
<space/>
<wd l="3782" t="14275" r="4286" b="14482">2007):</wd>
</ln>
</para>
<para l="1253" t="14741" r="5741" b="15408" alignment="justified" li="360" spaceBefore="212" fli="-216" lsp="exactly" lspExact="240" language="en">
<bullet type="bulleted" value="smallCircle" numChars="2">
</bullet>
<ln l="1253" t="14741" r="5731" b="14890" baseLine="14885" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1253" t="14746" r="1440" b="14885">•</wd>
<tab position="1331"/>
<wd l="1440" t="14746" r="2270" b="14890">WordNet:</wd>
<space/>
<wd l="2381" t="14746" r="3163" b="14890">WordNet</wd>
<space/>
<wd l="3250" t="14741" r="4258" b="14890">information</wd>
<space/>
<wd l="4330" t="14750" r="4450" b="14890">is</wd>
<space/>
<wd l="4531" t="14746" r="4910" b="14890">used</wd>
<space/>
<wd l="4987" t="14760" r="5160" b="14890">to</wd>
<space/>
<wd l="5237" t="14746" r="5731" b="14890">deter-</wd>
</ln>
<ln l="1445" t="14981" r="5741" b="15168" baseLine="15120" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1445" t="14990" r="1858" b="15130">mine</wd>
<space/>
<wd l="1925" t="14981" r="2050" b="15125">if</wd>
<space/>
<wd l="2098" t="15000" r="2405" b="15130">two</wd>
<space/>
<wd l="2467" t="14986" r="2837" b="15130">verb</wd>
<space/>
<wd l="2904" t="14981" r="3734" b="15130">infinitives</wd>
<space/>
<wd l="3806" t="14986" r="4339" b="15130">match</wd>
<space/>
<wd l="4402" t="15034" r="4574" b="15130">or</wd>
<space/>
<wd l="4637" t="14981" r="4762" b="15125">if</wd>
<space/>
<wd l="4810" t="14986" r="5189" b="15168">they</wd>
<space/>
<wd l="5256" t="15034" r="5515" b="15130">are</wd>
<space/>
<wd l="5578" t="14990" r="5741" b="15125">in</wd>
<space/>
</ln>
<ln l="1440" t="15226" r="3403" b="15408" baseLine="15360" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1440" t="15226" r="1714" b="15370">the</wd>
<space/>
<wd l="1790" t="15274" r="2213" b="15370">same</wd>
<space/>
<wd l="2290" t="15274" r="3053" b="15408">synonym</wd>
<space/>
<wd l="3125" t="15240" r="3403" b="15370">set.</wd>
</ln>
</para>
<para l="1253" t="15638" r="5731" b="15826" alignment="justified" li="360" spaceBefore="182" spaceAfter="47" fli="-216" lsp="exactly" lspExact="240" language="en">
<bullet type="bulleted" value="smallCircle" numChars="2">
</bullet>
<ln l="1253" t="15638" r="5731" b="15826" baseLine="15782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1253" t="15643" r="1445" b="15782">•</wd>
<tab position="1331"/>
<wd l="1445" t="15643" r="2131" b="15826">Parsing:</wd>
<space/>
<wd l="2232" t="15643" r="2568" b="15787">The</wd>
<space/>
<wd l="2626" t="15643" r="3427" b="15787">extracted</wd>
<space/>
<wd l="3485" t="15643" r="4498" b="15826">dependency</wd>
<space/>
<wd l="4550" t="15638" r="5558" b="15787">information</wd>
<space/>
<wd l="5611" t="15648" r="5731" b="15787">is</wd>
<space/>
</ln>
</para>
</column>
<column l="6097" t="10648" r="10811" b="15884">
<para l="6485" t="10690" r="10805" b="12072" alignment="justified" li="360" lsp="exactly" lspExact="239" language="en">
<ln l="6499" t="10690" r="10786" b="10877" baseLine="10834" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="6499" t="10694" r="6878" b="10838">used</wd>
<space/>
<wd l="6941" t="10709" r="7118" b="10838">to</wd>
<space/>
<wd l="7186" t="10742" r="7886" b="10838">measure</wd>
<space/>
<wd l="7949" t="10694" r="8222" b="10838">the</wd>
<space/>
<wd l="8285" t="10694" r="8760" b="10838">token</wd>
<space/>
<wd l="8822" t="10694" r="9442" b="10877">overlap</wd>
<space/>
<wd l="9509" t="10690" r="9677" b="10838">of</wd>
<space/>
<wd l="9725" t="10694" r="9998" b="10838">the</wd>
<space/>
<wd l="10061" t="10709" r="10363" b="10838">two</wd>
<space/>
<wd l="10435" t="10694" r="10786" b="10838">sub-</wd>
</ln>
<ln l="6485" t="10934" r="10790" b="11117" baseLine="11069" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="6485" t="10939" r="6883" b="11117">jects</wd>
<space/>
<wd l="6974" t="10934" r="7282" b="11078">and</wd>
<space/>
<wd l="7373" t="10934" r="8026" b="11117">objects,</wd>
<space/>
<wd l="8122" t="10934" r="9158" b="11117">respectively.</wd>
<space/>
<wd l="9298" t="10934" r="9571" b="11078">We</wd>
<space/>
<wd l="9658" t="10934" r="9984" b="11078">also</wd>
<space/>
<wd l="10070" t="10982" r="10790" b="11117">compare</wd>
<space/>
</ln>
<ln l="6494" t="11170" r="10805" b="11357" baseLine="11309" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="6494" t="11174" r="6768" b="11318">the</wd>
<space/>
<wd l="6845" t="11174" r="7454" b="11357">subject</wd>
<space/>
<wd l="7536" t="11170" r="7699" b="11318">of</wd>
<space/>
<wd l="7757" t="11174" r="8030" b="11318">the</wd>
<space/>
<wd l="8102" t="11170" r="8434" b="11318">first</wd>
<space/>
<wd l="8510" t="11174" r="9173" b="11318">relation</wd>
<space/>
<wd l="9235" t="11174" r="9624" b="11318">with</wd>
<space/>
<wd l="9691" t="11174" r="9965" b="11318">the</wd>
<space/>
<wd l="10037" t="11174" r="10560" b="11357">object</wd>
<space/>
<wd l="10637" t="11170" r="10805" b="11318">of</wd>
<space/>
</ln>
<ln l="6494" t="11414" r="10781" b="11592" baseLine="11549" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="6494" t="11414" r="6768" b="11558">the</wd>
<space/>
<wd l="6864" t="11414" r="7430" b="11558">second</wd>
<space/>
<wd l="7526" t="11414" r="8184" b="11558">relation</wd>
<space/>
<wd l="8275" t="11414" r="8587" b="11558">and</wd>
<space/>
<wd l="8678" t="11419" r="9014" b="11558">vice</wd>
<space/>
<wd l="9101" t="11462" r="9586" b="11558">versa.</wd>
<space/>
<wd l="9758" t="11414" r="9936" b="11554">In</wd>
<space/>
<wd l="10027" t="11414" r="10781" b="11592">addition,</wd>
<space/>
</ln>
<ln l="6494" t="11654" r="10790" b="11837" baseLine="11789" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="6494" t="11702" r="6720" b="11798">we</wd>
<space/>
<wd l="6797" t="11702" r="7522" b="11837">compare</wd>
<space/>
<wd l="7594" t="11654" r="7867" b="11798">the</wd>
<space/>
<wd l="7944" t="11654" r="8702" b="11837">auxiliary</wd>
<space/>
<wd l="8774" t="11654" r="9274" b="11832">verbs,</wd>
<space/>
<wd l="9360" t="11659" r="10397" b="11837">prepositions</wd>
<space/>
<wd l="10478" t="11654" r="10790" b="11798">and</wd>
<space/>
</ln>
<ln l="6499" t="11885" r="10334" b="12072" baseLine="12029" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="6499" t="11894" r="7464" b="12072">preposition</wd>
<space/>
<wd l="7536" t="11904" r="8429" b="12072">arguments</wd>
<space/>
<wd l="8506" t="11885" r="8986" b="12034">found</wd>
<space/>
<wd l="9062" t="11894" r="9226" b="12029">in</wd>
<space/>
<wd l="9293" t="11890" r="9566" b="12034">the</wd>
<space/>
<wd l="9638" t="11890" r="10334" b="12034">relation.</wd>
</ln>
</para>
<para l="6307" t="12326" r="10795" b="13670" alignment="justified" li="360" spaceBefore="197" fli="-216" lsp="exactly" lspExact="240" language="en">
<bullet type="bulleted" value="smallCircle" numChars="2">
</bullet>
<ln l="6307" t="12326" r="10790" b="12514" baseLine="12470" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6307" t="12331" r="6499" b="12470">•</wd>
<tab position="6385"/>
<wd l="6499" t="12331" r="6778" b="12470">NE</wd>
<space/>
<wd l="6874" t="12336" r="7867" b="12514">recognition:</wd>
<space/>
<wd l="8016" t="12331" r="8352" b="12475">The</wd>
<space/>
<wd l="8448" t="12326" r="9456" b="12475">information</wd>
<space/>
<wd l="9547" t="12326" r="9941" b="12475">from</wd>
<space/>
<wd l="10032" t="12331" r="10349" b="12475">this</wd>
<space/>
<wd l="10445" t="12346" r="10790" b="12514">step</wd>
<space/>
</ln>
<ln l="6499" t="12566" r="10795" b="12754" baseLine="12706" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6499" t="12576" r="6624" b="12715">is</wd>
<space/>
<wd l="6710" t="12571" r="7090" b="12715">used</wd>
<space/>
<wd l="7166" t="12586" r="7344" b="12715">to</wd>
<space/>
<wd l="7426" t="12586" r="7891" b="12715">count</wd>
<space/>
<wd l="7982" t="12571" r="8328" b="12715">how</wd>
<space/>
<wd l="8405" t="12619" r="8880" b="12754">many</wd>
<space/>
<wd l="8957" t="12566" r="9125" b="12715">of</wd>
<space/>
<wd l="9192" t="12571" r="9466" b="12715">the</wd>
<space/>
<wd l="9547" t="12571" r="9898" b="12715">NEs</wd>
<space/>
<wd l="9984" t="12576" r="10795" b="12754">occurring</wd>
<space/>
</ln>
<ln l="6499" t="12811" r="10790" b="12989" baseLine="12946" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6499" t="12816" r="6662" b="12950">in</wd>
<space/>
<wd l="6754" t="12811" r="7027" b="12955">the</wd>
<space/>
<wd l="7128" t="12826" r="7886" b="12989">contexts,</wd>
<space/>
<wd l="8002" t="12816" r="8290" b="12989">i.e.,</wd>
<space/>
<wd l="8400" t="12811" r="8678" b="12955">the</wd>
<space/>
<wd l="8774" t="12826" r="9566" b="12955">sentences</wd>
<space/>
<wd l="9672" t="12816" r="9830" b="12950">in</wd>
<space/>
<wd l="9922" t="12811" r="10426" b="12955">which</wd>
<space/>
<wd l="10517" t="12811" r="10790" b="12955">the</wd>
<space/>
</ln>
<ln l="6494" t="13046" r="10790" b="13229" baseLine="13186" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6494" t="13066" r="6802" b="13195">two</wd>
<space/>
<wd l="6898" t="13051" r="7627" b="13195">relations</wd>
<space/>
<wd l="7723" t="13099" r="7982" b="13195">are</wd>
<space/>
<wd l="8074" t="13046" r="8606" b="13229">found,</wd>
<space/>
<wd l="8712" t="13051" r="9245" b="13195">match</wd>
<space/>
<wd l="9336" t="13051" r="9643" b="13195">and</wd>
<space/>
<wd l="9734" t="13051" r="10430" b="13195">whether</wd>
<space/>
<wd l="10517" t="13051" r="10790" b="13195">the</wd>
<space/>
</ln>
<ln l="6499" t="13282" r="10781" b="13469" baseLine="13426" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6499" t="13286" r="6778" b="13426">NE</wd>
<space/>
<wd l="6830" t="13301" r="7286" b="13469">types</wd>
<space/>
<wd l="7349" t="13282" r="7517" b="13430">of</wd>
<space/>
<wd l="7555" t="13286" r="7829" b="13430">the</wd>
<space/>
<wd l="7891" t="13286" r="8582" b="13469">subjects</wd>
<space/>
<wd l="8645" t="13286" r="8957" b="13430">and</wd>
<space/>
<wd l="9019" t="13286" r="9672" b="13469">objects,</wd>
<space/>
<wd l="9744" t="13286" r="10781" b="13469">respectively,</wd>
<space/>
</ln>
<ln l="6499" t="13526" r="7070" b="13670" baseLine="13666" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6499" t="13526" r="7070" b="13670">match.</wd>
</ln>
</para>
<para l="6307" t="13963" r="10805" b="15067" alignment="justified" li="360" spaceBefore="196" fli="-216" lsp="exactly" lspExact="240" language="en">
<bullet type="bulleted" value="smallCircle" numChars="2">
</bullet>
<ln l="6307" t="13963" r="10795" b="14150" baseLine="14102" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6307" t="13963" r="6504" b="14102">•</wd>
<tab position="6385"/>
<wd l="6504" t="13963" r="7507" b="14112">Coreference</wd>
<space/>
<wd l="7594" t="13968" r="8482" b="14112">resolution:</wd>
<space/>
<wd l="8616" t="13968" r="8995" b="14112">This</wd>
<space/>
<wd l="9082" t="13982" r="9461" b="14150">type</wd>
<space/>
<wd l="9547" t="13963" r="9715" b="14112">of</wd>
<space/>
<wd l="9787" t="13963" r="10795" b="14112">information</wd>
<space/>
</ln>
<ln l="6499" t="14194" r="10805" b="14400" baseLine="14342" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6499" t="14213" r="6624" b="14352">is</wd>
<space/>
<wd l="6706" t="14208" r="7085" b="14352">used</wd>
<space/>
<wd l="7162" t="14222" r="7334" b="14352">to</wd>
<space/>
<wd l="7416" t="14256" r="8141" b="14390">compare</wd>
<space/>
<wd l="8218" t="14208" r="8491" b="14352">the</wd>
<space/>
<wd l="8568" t="14208" r="8846" b="14347">NE</wd>
<space/>
<wd l="8928" t="14208" r="9538" b="14390">subject</wd>
<space/>
<wd l="9638" t="14194" r="9874" b="14400">(or</wd>
<space/>
<wd l="9950" t="14194" r="10541" b="14400">object)</wd>
<space/>
<wd l="10637" t="14203" r="10805" b="14352">of</wd>
<space/>
</ln>
<ln l="6499" t="14448" r="10790" b="14630" baseLine="14582" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6499" t="14496" r="6792" b="14592">one</wd>
<space/>
<wd l="6893" t="14448" r="7550" b="14592">relation</wd>
<space/>
<wd l="7646" t="14462" r="7819" b="14592">to</wd>
<space/>
<wd l="7920" t="14453" r="8486" b="14630">strings</wd>
<space/>
<wd l="8587" t="14448" r="8942" b="14592">that</wd>
<space/>
<wd l="9053" t="14496" r="9638" b="14630">appear</wd>
<space/>
<wd l="9739" t="14453" r="9898" b="14587">in</wd>
<space/>
<wd l="9994" t="14448" r="10267" b="14592">the</wd>
<space/>
<wd l="10368" t="14496" r="10790" b="14592">same</wd>
<space/>
</ln>
<ln l="6499" t="14674" r="10790" b="14880" baseLine="14822" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6499" t="14683" r="7450" b="14832">coreference</wd>
<space/>
<wd l="7546" t="14702" r="7776" b="14832">set</wd>
<space/>
<wd l="7882" t="14736" r="8045" b="14832">as</wd>
<space/>
<wd l="8141" t="14688" r="8419" b="14832">the</wd>
<space/>
<wd l="8510" t="14688" r="9125" b="14870">subject</wd>
<space/>
<wd l="9240" t="14674" r="9475" b="14880">(or</wd>
<space/>
<wd l="9571" t="14674" r="10162" b="14880">object)</wd>
<space/>
<wd l="10272" t="14683" r="10440" b="14832">of</wd>
<space/>
<wd l="10517" t="14688" r="10790" b="14832">the</wd>
<space/>
</ln>
<ln l="6499" t="14923" r="7838" b="15067" baseLine="15062" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6499" t="14923" r="7066" b="15067">second</wd>
<space/>
<wd l="7142" t="14923" r="7838" b="15067">relation.</wd>
</ln>
</para>
<para l="6101" t="15398" r="10795" b="15826" alignment="justified" spaceBefore="240" spaceAfter="47" lsp="exactly" lspExact="240" language="en">
<ln l="6101" t="15398" r="10786" b="15586" baseLine="15542" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="15403" r="6912" b="15586">Manually</wd>
<space/>
<wd l="7037" t="15403" r="7858" b="15586">analyzing</wd>
<space/>
<wd l="7982" t="15451" r="8078" b="15547">a</wd>
<space/>
<wd l="8203" t="15418" r="8429" b="15547">set</wd>
<space/>
<wd l="8568" t="15398" r="8731" b="15547">of</wd>
<space/>
<wd l="8846" t="15403" r="9653" b="15547">extracted</wd>
<space/>
<wd l="9782" t="15403" r="10440" b="15547">relation</wd>
<space/>
<wd l="10565" t="15408" r="10786" b="15542">in-</wd>
</ln>
<ln l="6101" t="15638" r="10795" b="15826" baseLine="15782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="15658" r="6763" b="15821">stances,</wd>
<space/>
<wd l="6845" t="15691" r="7066" b="15787">we</wd>
<space/>
<wd l="7142" t="15638" r="7752" b="15787">defined</wd>
<space/>
<wd l="7824" t="15643" r="8462" b="15826">weights</wd>
<space/>
<wd l="8539" t="15638" r="8774" b="15787">for</wd>
<space/>
<wd l="8842" t="15643" r="9115" b="15787">the</wd>
<space/>
<wd l="9192" t="15638" r="9898" b="15787">different</wd>
<space/>
<wd l="9979" t="15643" r="10795" b="15826">similarity</wd>
</ln>
</para>
</column>
</section>
</body>
</page>
<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">
<description>
<source file="pdf\L08-1001.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>
<theoreticalPage size="A4" marginLeft="1032" marginTop="1395" marginRight="1099" marginBottom="1003" offsetX="32" offsetY="16" width="11918" height="16854"/>
<language>en</language>
</description>
<body>
<section l="1032" t="1395" r="10810" b="15835">
<column l="1032" t="1395" r="5756" b="15835">
<para l="1042" t="1440" r="5736" b="2544" alignment="justified" lsp="exactly" lspExact="238" language="en">
<ln l="1046" t="1440" r="5731" b="1627" baseLine="1579" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">
<wd l="1046" t="1493" r="1824" b="1589">measures</wd>
<space/>
<wd l="1901" t="1445" r="2213" b="1589">and</wd>
<space/>
<wd l="2285" t="1445" r="3149" b="1589">calculated</wd>
<space/>
<wd l="3221" t="1493" r="3317" b="1589">a</wd>
<space/>
<wd l="3384" t="1445" r="4200" b="1627">similarity</wd>
<space/>
<wd l="4267" t="1493" r="4694" b="1589">score</wd>
<space/>
<wd l="4766" t="1440" r="4997" b="1589">for</wd>
<space/>
<wd l="5069" t="1445" r="5443" b="1589">each</wd>
<space/>
<wd l="5510" t="1493" r="5731" b="1589">re-</wd>
</ln>
<ln l="1046" t="1680" r="5731" b="1867" baseLine="1819" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">
<wd l="1046" t="1685" r="1541" b="1829">lation</wd>
<space/>
<wd l="1594" t="1690" r="1968" b="1867">pair.</wd>
<space/>
<wd l="2069" t="1685" r="2342" b="1829">We</wd>
<space/>
<wd l="2390" t="1685" r="2779" b="1829">then</wd>
<space/>
<wd l="2832" t="1680" r="3442" b="1829">defined</wd>
<space/>
<wd l="3494" t="1733" r="3590" b="1829">a</wd>
<space/>
<wd l="3643" t="1733" r="4070" b="1829">score</wd>
<space/>
<wd l="4118" t="1685" r="4920" b="1829">threshold</wd>
<space/>
<wd l="4978" t="1685" r="5290" b="1829">and</wd>
<space/>
<wd l="5347" t="1685" r="5731" b="1829">clus-</wd>
</ln>
<ln l="1042" t="1920" r="5736" b="2102" baseLine="2059" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">
<wd l="1042" t="1920" r="1483" b="2064">tered</wd>
<space/>
<wd l="1560" t="1920" r="2290" b="2064">relations</wd>
<space/>
<wd l="2371" t="1920" r="2578" b="2102">by</wd>
<space/>
<wd l="2654" t="1925" r="3293" b="2102">putting</wd>
<space/>
<wd l="3360" t="1934" r="3667" b="2064">two</wd>
<space/>
<wd l="3744" t="1920" r="4478" b="2064">relations</wd>
<space/>
<wd l="4560" t="1925" r="4886" b="2064">into</wd>
<space/>
<wd l="4963" t="1920" r="5237" b="2064">the</wd>
<space/>
<wd l="5314" t="1968" r="5736" b="2064">same</wd>
<space/>
</ln>
<ln l="1046" t="2155" r="5736" b="2342" baseLine="2299" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">
<wd l="1046" t="2160" r="1618" b="2304">cluster</wd>
<space/>
<wd l="1690" t="2155" r="1810" b="2299">if</wd>
<space/>
<wd l="1862" t="2160" r="2270" b="2304">their</wd>
<space/>
<wd l="2338" t="2160" r="3154" b="2342">similarity</wd>
<space/>
<wd l="3221" t="2208" r="3648" b="2304">score</wd>
<space/>
<wd l="3720" t="2160" r="4478" b="2304">exceeded</wd>
<space/>
<wd l="4546" t="2160" r="4862" b="2304">this</wd>
<space/>
<wd l="4930" t="2160" r="5736" b="2304">threshold</wd>
<space/>
</ln>
<ln l="1042" t="2400" r="1531" b="2544" baseLine="2534" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="1">
<wd l="1042" t="2400" r="1531" b="2544">value.</wd>
</ln>
</para>
<para l="1733" t="2822" r="5059" b="3038" alignment="centered" spaceBefore="188" lsp="exactly" lspExact="274" language="en">
<ln l="1733" t="2822" r="5059" b="3038" baseLine="2990" underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="20">
<wd l="1733" t="2832" r="1915" b="2995">3.</wd>
<space/>
<wd l="2203" t="2822" r="3677" b="3038">Experiments</wd>
<space/>
<wd l="3773" t="2822" r="4195" b="2995">and</wd>
<space/>
<wd l="4296" t="2822" r="5059" b="2995">results</wd>
</ln>
</para>
<para l="1042" t="3149" r="5741" b="5453" alignment="justified" spaceBefore="47" lsp="exactly" lspExact="240" language="en">
<ln l="1046" t="3149" r="5731" b="3336" baseLine="3293" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="3154" r="1334" b="3298">For</wd>
<space/>
<wd l="1435" t="3202" r="1718" b="3298">our</wd>
<space/>
<wd l="1819" t="3158" r="2904" b="3336">experiments,</wd>
<space/>
<wd l="3014" t="3202" r="3240" b="3298">we</wd>
<space/>
<wd l="3341" t="3154" r="3739" b="3298">built</wd>
<space/>
<wd l="3845" t="3202" r="3941" b="3298">a</wd>
<space/>
<wd l="4037" t="3168" r="4349" b="3298">test</wd>
<space/>
<wd l="4459" t="3202" r="5011" b="3336">corpus</wd>
<space/>
<wd l="5117" t="3149" r="5285" b="3298">of</wd>
<space/>
<wd l="5376" t="3154" r="5731" b="3298">doc-</wd>
</ln>
<ln l="1046" t="3389" r="5736" b="3576" baseLine="3533" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="3408" r="1661" b="3538">uments</wd>
<space/>
<wd l="1781" t="3394" r="2371" b="3538">related</wd>
<space/>
<wd l="2482" t="3408" r="2654" b="3538">to</wd>
<space/>
<wd l="2765" t="3394" r="3043" b="3538">the</wd>
<space/>
<wd l="3149" t="3398" r="3581" b="3576">topic</wd>
<space/>
<wd l="3691" t="3394" r="4291" b="3538">“Berlin</wd>
<space/>
<wd l="4406" t="3389" r="5736" b="3576">Hauptbahnhof”</wd>
<space/>
</ln>
<ln l="1046" t="3619" r="5741" b="3826" baseLine="3768" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="3634" r="1253" b="3816">by</wd>
<space/>
<wd l="1344" t="3634" r="1997" b="3816">sending</wd>
<space/>
<wd l="2083" t="3638" r="2678" b="3816">queries</wd>
<space/>
<wd l="2774" t="3634" r="3648" b="3816">describing</wd>
<space/>
<wd l="3734" t="3634" r="4008" b="3778">the</wd>
<space/>
<wd l="4094" t="3638" r="4526" b="3816">topic</wd>
<space/>
<wd l="4632" t="3619" r="5035" b="3826">(e.g.,</wd>
<space/>
<wd l="5141" t="3634" r="5741" b="3778">“Berlin</wd>
<space/>
</ln>
<ln l="1046" t="3859" r="5736" b="4066" baseLine="4008" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="3869" r="2424" b="4056">Hauptbahnhof”,</wd>
<space/>
<wd l="2568" t="3874" r="3168" b="4018">“Berlin</wd>
<space/>
<wd l="3283" t="3874" r="3869" b="4018">central</wd>
<space/>
<wd l="3989" t="3859" r="4714" b="4066">station”)</wd>
<space/>
<wd l="4848" t="3888" r="5021" b="4018">to</wd>
<space/>
<wd l="5146" t="3869" r="5736" b="4056">Google</wd>
<space/>
</ln>
<ln l="1046" t="4109" r="5741" b="4296" baseLine="4248" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="4114" r="1358" b="4258">and</wd>
<space/>
<wd l="1459" t="4114" r="2549" b="4296">downloading</wd>
<space/>
<wd l="2635" t="4114" r="2914" b="4258">the</wd>
<space/>
<wd l="3010" t="4114" r="3763" b="4258">retrieved</wd>
<space/>
<wd l="3864" t="4114" r="4786" b="4258">documents</wd>
<space/>
<wd l="4886" t="4109" r="5741" b="4296">specifying</wd>
<space/>
</ln>
<ln l="1046" t="4344" r="5741" b="4531" baseLine="4488" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="4349" r="1690" b="4531">English</wd>
<space/>
<wd l="1786" t="4397" r="1954" b="4493">as</wd>
<space/>
<wd l="2054" t="4349" r="2328" b="4493">the</wd>
<space/>
<wd l="2424" t="4363" r="2933" b="4531">target</wd>
<space/>
<wd l="3038" t="4349" r="3835" b="4531">language.</wd>
<space/>
<wd l="4027" t="4344" r="4478" b="4493">After</wd>
<space/>
<wd l="4574" t="4354" r="5741" b="4531">preprocessing</wd>
<space/>
</ln>
<ln l="1042" t="4589" r="5731" b="4771" baseLine="4728" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1042" t="4589" r="1483" b="4733">these</wd>
<space/>
<wd l="1565" t="4589" r="2482" b="4733">documents</wd>
<space/>
<wd l="2568" t="4637" r="2731" b="4733">as</wd>
<space/>
<wd l="2818" t="4589" r="3619" b="4733">described</wd>
<space/>
<wd l="3706" t="4594" r="3864" b="4728">in</wd>
<space/>
<wd l="3946" t="4594" r="4291" b="4766">2.1.,</wd>
<space/>
<wd l="4382" t="4637" r="4666" b="4733">our</wd>
<space/>
<wd l="4742" t="4637" r="5294" b="4771">corpus</wd>
<space/>
<wd l="5381" t="4637" r="5731" b="4733">con-</wd>
</ln>
<ln l="1046" t="4824" r="5736" b="5011" baseLine="4963" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="4829" r="1526" b="4973">sisted</wd>
<space/>
<wd l="1608" t="4824" r="1771" b="4973">of</wd>
<space/>
<wd l="1843" t="4834" r="2376" b="5006">55,255</wd>
<space/>
<wd l="2458" t="4843" r="3254" b="4973">sentences</wd>
<space/>
<wd l="3331" t="4824" r="3730" b="4973">from</wd>
<space/>
<wd l="3816" t="4834" r="4253" b="5006">1,068</wd>
<space/>
<wd l="4325" t="4829" r="4661" b="4973">web</wd>
<space/>
<wd l="4738" t="4877" r="5251" b="5011">pages,</wd>
<space/>
<wd l="5342" t="4824" r="5736" b="4973">from</wd>
<space/>
</ln>
<ln l="1042" t="5069" r="5736" b="5251" baseLine="5203" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1042" t="5069" r="1546" b="5213">which</wd>
<space/>
<wd l="1670" t="5069" r="2146" b="5213">10773</wd>
<space/>
<wd l="2270" t="5069" r="3005" b="5213">relations</wd>
<space/>
<wd l="3120" t="5117" r="3514" b="5213">were</wd>
<space/>
<wd l="3634" t="5069" r="4814" b="5251">automatically</wd>
<space/>
<wd l="4930" t="5069" r="5736" b="5213">extracted</wd>
<space/>
</ln>
<ln l="1046" t="5309" r="2246" b="5453" baseLine="5443" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="5309" r="1358" b="5453">and</wd>
<space/>
<wd l="1435" t="5309" r="2246" b="5453">clustered.</wd>
</ln>
</para>
<para l="1051" t="5712" r="2669" b="5894" alignment="left" spaceBefore="165" lsp="exactly" lspExact="243" language="en">
<ln l="1051" t="5712" r="2669" b="5894" baseLine="5846" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="16">
<wd l="1051" t="5717" r="1382" b="5856">3.1.</wd>
<space/>
<wd l="1637" t="5712" r="2669" b="5894">Clustering</wd>
</ln>
</para>
<para l="1042" t="6000" r="5741" b="8534" alignment="justified" spaceBefore="34" lsp="exactly" lspExact="240" language="en">
<ln l="1046" t="6000" r="5731" b="6182" baseLine="6134" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="6000" r="1498" b="6144">From</wd>
<space/>
<wd l="1546" t="6000" r="1819" b="6144">the</wd>
<space/>
<wd l="1872" t="6000" r="2678" b="6144">extracted</wd>
<space/>
<wd l="2736" t="6000" r="3514" b="6178">relations,</wd>
<space/>
<wd l="3576" t="6000" r="3850" b="6144">the</wd>
<space/>
<wd l="3902" t="6014" r="4493" b="6182">system</wd>
<space/>
<wd l="4546" t="6000" r="4939" b="6144">built</wd>
<space/>
<wd l="5002" t="6005" r="5285" b="6144">306</wd>
<space/>
<wd l="5347" t="6000" r="5731" b="6144">clus-</wd>
</ln>
<ln l="1042" t="6235" r="5741" b="6422" baseLine="6374" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="6254" r="1358" b="6384">ters</wd>
<space/>
<wd l="1464" t="6235" r="1632" b="6384">of</wd>
<space/>
<wd l="1714" t="6254" r="2021" b="6384">two</wd>
<space/>
<wd l="2122" t="6288" r="2294" b="6384">or</wd>
<space/>
<wd l="2395" t="6288" r="2818" b="6384">more</wd>
<space/>
<wd l="2918" t="6245" r="3744" b="6418">instances,</wd>
<space/>
<wd l="3859" t="6240" r="4363" b="6384">which</wd>
<space/>
<wd l="4454" t="6288" r="4848" b="6384">were</wd>
<space/>
<wd l="4949" t="6240" r="5741" b="6422">manually</wd>
<space/>
</ln>
<ln l="1046" t="6470" r="5731" b="6658" baseLine="6614" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="6475" r="1862" b="6619">evaluated</wd>
<space/>
<wd l="1930" t="6475" r="2136" b="6658">by</wd>
<space/>
<wd l="2198" t="6490" r="2501" b="6619">two</wd>
<space/>
<wd l="2573" t="6475" r="3211" b="6619">authors</wd>
<space/>
<wd l="3283" t="6470" r="3451" b="6619">of</wd>
<space/>
<wd l="3499" t="6475" r="3816" b="6619">this</wd>
<space/>
<wd l="3883" t="6523" r="4411" b="6658">paper.</wd>
<space/>
<wd l="4522" t="6480" r="4699" b="6619">81</wd>
<space/>
<wd l="4776" t="6470" r="4944" b="6619">of</wd>
<space/>
<wd l="4997" t="6523" r="5280" b="6619">our</wd>
<space/>
<wd l="5347" t="6475" r="5731" b="6619">clus-</wd>
</ln>
<ln l="1042" t="6710" r="5736" b="6898" baseLine="6854" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="6730" r="1358" b="6859">ters</wd>
<space/>
<wd l="1430" t="6720" r="2059" b="6859">contain</wd>
<space/>
<wd l="2122" t="6730" r="2429" b="6859">two</wd>
<space/>
<wd l="2496" t="6763" r="2669" b="6859">or</wd>
<space/>
<wd l="2736" t="6763" r="3158" b="6859">more</wd>
<space/>
<wd l="3226" t="6720" r="4003" b="6859">instances</wd>
<space/>
<wd l="4075" t="6710" r="4243" b="6859">of</wd>
<space/>
<wd l="4296" t="6715" r="4910" b="6898">exactly</wd>
<space/>
<wd l="4973" t="6715" r="5246" b="6859">the</wd>
<space/>
<wd l="5314" t="6763" r="5736" b="6859">same</wd>
<space/>
</ln>
<ln l="1046" t="6955" r="5741" b="7138" baseLine="7090" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="6955" r="1752" b="7133">relation,</wd>
<space/>
<wd l="1824" t="6955" r="2405" b="7138">mostly</wd>
<space/>
<wd l="2462" t="6955" r="2765" b="7099">due</wd>
<space/>
<wd l="2822" t="6970" r="2995" b="7099">to</wd>
<space/>
<wd l="3058" t="6955" r="3331" b="7099">the</wd>
<space/>
<wd l="3394" t="7003" r="3821" b="7099">same</wd>
<space/>
<wd l="3883" t="6970" r="4603" b="7099">sentence</wd>
<space/>
<wd l="4666" t="6960" r="5520" b="7138">appearing</wd>
<space/>
<wd l="5578" t="6960" r="5741" b="7094">in</wd>
<space/>
</ln>
<ln l="1046" t="7190" r="5731" b="7378" baseLine="7330" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="7195" r="1627" b="7339">several</wd>
<space/>
<wd l="1690" t="7195" r="2611" b="7339">documents</wd>
<space/>
<wd l="2674" t="7190" r="2842" b="7339">of</wd>
<space/>
<wd l="2885" t="7195" r="3158" b="7339">the</wd>
<space/>
<wd l="3221" t="7243" r="3821" b="7378">corpus.</wd>
<space/>
<wd l="3931" t="7190" r="4147" b="7339">Of</wd>
<space/>
<wd l="4190" t="7195" r="4469" b="7339">the</wd>
<space/>
<wd l="4526" t="7200" r="5386" b="7378">remaining</wd>
<space/>
<wd l="5453" t="7200" r="5731" b="7339">225</wd>
<space/>
</ln>
<ln l="1046" t="7435" r="5741" b="7618" baseLine="7570" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="7435" r="1742" b="7613">clusters,</wd>
<space/>
<wd l="1853" t="7440" r="2122" b="7574">121</wd>
<space/>
<wd l="2218" t="7483" r="2611" b="7579">were</wd>
<space/>
<wd l="2698" t="7435" r="3331" b="7579">marked</wd>
<space/>
<wd l="3422" t="7483" r="3586" b="7579">as</wd>
<space/>
<wd l="3682" t="7440" r="4579" b="7613">consistent,</wd>
<space/>
<wd l="4680" t="7440" r="4867" b="7579">35</wd>
<space/>
<wd l="4958" t="7483" r="5126" b="7579">as</wd>
<space/>
<wd l="5218" t="7435" r="5741" b="7618">partly</wd>
<space/>
</ln>
<ln l="1046" t="7670" r="5731" b="7853" baseLine="7810" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="7680" r="1944" b="7853">consistent,</wd>
<space/>
<wd l="2059" t="7680" r="2246" b="7819">69</wd>
<space/>
<wd l="2352" t="7723" r="2520" b="7819">as</wd>
<space/>
<wd l="2626" t="7690" r="2899" b="7819">not</wd>
<space/>
<wd l="3005" t="7680" r="3898" b="7819">consistent.</wd>
<space/>
<wd l="4080" t="7675" r="4358" b="7819">We</wd>
<space/>
<wd l="4454" t="7670" r="5064" b="7819">defined</wd>
<space/>
<wd l="5170" t="7680" r="5731" b="7819">consis-</wd>
</ln>
<ln l="1042" t="7906" r="5736" b="8093" baseLine="8050" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="7925" r="1512" b="8093">tency</wd>
<space/>
<wd l="1584" t="7910" r="2064" b="8054">based</wd>
<space/>
<wd l="2141" t="7958" r="2347" b="8054">on</wd>
<space/>
<wd l="2414" t="7910" r="2688" b="8054">the</wd>
<space/>
<wd l="2760" t="7910" r="3528" b="8093">potential</wd>
<space/>
<wd l="3600" t="7906" r="4450" b="8054">usefulness</wd>
<space/>
<wd l="4531" t="7906" r="4694" b="8054">of</wd>
<space/>
<wd l="4757" t="7958" r="4853" b="8054">a</wd>
<space/>
<wd l="4925" t="7910" r="5496" b="8054">cluster</wd>
<space/>
<wd l="5563" t="7925" r="5736" b="8054">to</wd>
<space/>
</ln>
<ln l="1042" t="8146" r="5741" b="8333" baseLine="8290" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="8150" r="1315" b="8294">the</wd>
<space/>
<wd l="1378" t="8198" r="1728" b="8294">user</wd>
<space/>
<wd l="1786" t="8150" r="2098" b="8294">and</wd>
<space/>
<wd l="2160" t="8146" r="2952" b="8294">identified</wd>
<space/>
<wd l="3014" t="8150" r="3451" b="8294">three</wd>
<space/>
<wd l="3514" t="8155" r="4022" b="8333">major</wd>
<space/>
<wd l="4080" t="8165" r="4531" b="8333">types</wd>
<space/>
<wd l="4598" t="8146" r="4762" b="8294">of</wd>
<space/>
<wd l="4810" t="8150" r="5741" b="8333">potentially</wd>
<space/>
</ln>
<ln l="1046" t="8386" r="2309" b="8534" baseLine="8525" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="8386" r="1546" b="8534">useful</wd>
<space/>
<wd l="1618" t="8390" r="2309" b="8534">clusters:</wd>
</ln>
</para>
<para l="1253" t="8798" r="3734" b="8986" alignment="left" li="216" spaceBefore="173" spaceAfter="239" lsp="exactly" lspExact="240" language="en">
<bullet type="bulleted" value="smallCircle" numChars="2">
</bullet>
<ln l="1253" t="8803" r="3734" b="8986" baseLine="8938" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1253" t="8803" r="1445" b="8938">•</wd>
<tab position="1329"/>
<wd l="1445" t="8803" r="2174" b="8947">Relation</wd>
<space/>
<wd l="2246" t="8803" r="3317" b="8986">paraphrases,</wd>
<space/>
<wd l="3398" t="8851" r="3734" b="8986">e.g.,</wd>
</ln>
</para>
<frame l="1450" t="9238" r="5088" b="9945">
<leftBorder type="single" width="10" color="000000"/>
<topBorder type="single" width="10" color="000000"/>
<rightBorder type="single" width="10" color="000000"/>
<bottomBorder type="single" width="10" color="000000"/>
<para l="1579" t="9278" r="4968" b="9922" alignment="left" li="144" ri="144" spaceAfter="14" lsp="exactly" lspExact="228" language="en">
<ln l="1589" t="9278" r="4603" b="9461" baseLine="9413">
<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="1589" t="9288" r="2179" b="9418">accused</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2261" t="9278" r="2554" b="9461">(Mr</wd>
<space/>
<wd l="2626" t="9288" r="3168" b="9451">Moore,</wd>
<space/>
<wd l="3250" t="9288" r="3811" b="9451">Disney,</wd>
<space/>
<wd l="3893" t="9288" r="4056" b="9413">In</wd>
<space/>
<wd l="4123" t="9278" r="4603" b="9461">letter)</wd>
<space/>
</run>
</ln>
<ln l="1589" t="9518" r="4968" b="9701" baseLine="9653">
<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="1589" t="9528" r="2179" b="9658">accused</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2342" t="9518" r="3019" b="9701">(Michael</wd>
<space/>
<wd l="3173" t="9528" r="3715" b="9691">Moore,</wd>
<space/>
<wd l="3893" t="9528" r="4272" b="9658">Walt</wd>
<space/>
<wd l="4430" t="9528" r="4968" b="9691">Disney</wd>
<space/>
</run>
</ln>
<ln l="1579" t="9739" r="2395" b="9922" baseLine="9869" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1579" t="9739" r="2395" b="9922">Company)</wd>
</ln>
</para>
</frame>
<para l="1253" t="10109" r="5294" b="10301" alignment="left" li="216" spaceBefore="116" spaceAfter="229" lsp="exactly" lspExact="240" language="en">
<bullet type="bulleted" value="smallCircle" numChars="2">
</bullet>
<ln l="1253" t="10114" r="5294" b="10301" baseLine="10258" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1253" t="10118" r="1445" b="10258">•</wd>
<tab position="1331"/>
<wd l="1445" t="10114" r="2194" b="10262">Different</wd>
<space/>
<wd l="2275" t="10123" r="3048" b="10262">instances</wd>
<space/>
<wd l="3130" t="10114" r="3293" b="10262">of</wd>
<space/>
<wd l="3350" t="10118" r="3624" b="10262">the</wd>
<space/>
<wd l="3696" t="10166" r="4123" b="10262">same</wd>
<space/>
<wd l="4195" t="10133" r="4877" b="10301">pattern,</wd>
<space/>
<wd l="4958" t="10166" r="5294" b="10301">e.g.,</wd>
</ln>
</para>
<frame l="1450" t="10541" r="5088" b="11040">
<leftBorder type="single" width="10" color="000000"/>
<topBorder type="single" width="10" color="000000"/>
<rightBorder type="single" width="10" color="000000"/>
<bottomBorder type="single" width="10" color="000000"/>
<para l="1589" t="10598" r="4805" b="11021" alignment="left" li="144" ri="288" spaceAfter="9" lsp="exactly" lspExact="240" language="en">
<ln l="1589" t="10598" r="4805" b="10781" baseLine="10728">
<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="1589" t="10618" r="2218" b="10771">operates</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2304" t="10598" r="2837" b="10781">(Delta,</wd>
<space/>
<wd l="2918" t="10603" r="3437" b="10771">flights,</wd>
<space/>
<wd l="3518" t="10603" r="3888" b="10738">from</wd>
<space/>
<wd l="3950" t="10608" r="4296" b="10738">New</wd>
<space/>
<wd l="4363" t="10598" r="4805" b="10781">York)</wd>
<space/>
</run>
</ln>
<ln l="1589" t="10838" r="4445" b="11021" baseLine="10968">
<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="1589" t="10843" r="2016" b="11011">offers</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2102" t="10838" r="3005" b="11021">(Lufthansa,</wd>
<space/>
<wd l="3086" t="10843" r="3605" b="11011">flights,</wd>
<space/>
<wd l="3682" t="10843" r="4051" b="10978">from</wd>
<space/>
<wd l="4118" t="10838" r="4445" b="11021">DC)</wd>
</run>
</ln>
</para>
</frame>
<para l="1253" t="11213" r="5131" b="11419" alignment="left" li="216" spaceBefore="129" spaceAfter="245" lsp="exactly" lspExact="240" language="en">
<bullet type="bulleted" value="smallCircle" numChars="2">
</bullet>
<ln l="1253" t="11213" r="5131" b="11419" baseLine="11366" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1253" t="11227" r="1445" b="11366">•</wd>
<tab position="1331"/>
<wd l="1445" t="11227" r="2246" b="11371">Relations</wd>
<space/>
<wd l="2323" t="11227" r="2813" b="11371">about</wd>
<space/>
<wd l="2890" t="11227" r="3163" b="11371">the</wd>
<space/>
<wd l="3235" t="11275" r="3662" b="11371">same</wd>
<space/>
<wd l="3730" t="11232" r="4162" b="11410">topic</wd>
<space/>
<wd l="4248" t="11213" r="4709" b="11419">(NE),</wd>
<space/>
<wd l="4795" t="11275" r="5131" b="11410">e.g.,</wd>
</ln>
</para>
<frame l="1440" t="11674" r="5098" b="13090">
<leftBorder type="single" width="10" color="000000"/>
<topBorder type="single" width="10" color="000000"/>
<rightBorder type="single" width="10" color="000000"/>
<bottomBorder type="single" width="10" color="000000"/>
<para l="1574" t="11717" r="4968" b="12120" alignment="justified" spaceBefore="12" lsp="exactly" lspExact="217" language="en">
<ln l="1584" t="11717" r="4968" b="11899" baseLine="11851">
<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="7"><wd l="1584" t="11726" r="2179" b="11890">rejected</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7"><wd l="2270" t="11717" r="2563" b="11899">(Mr</wd>
<space/>
<wd l="2645" t="11726" r="3077" b="11890">Blair,</wd>
<space/>
<wd l="3168" t="11770" r="3859" b="11890">pressure,</wd>
<space/>
<wd l="3950" t="11722" r="4320" b="11856">from</wd>
<space/>
<wd l="4397" t="11726" r="4968" b="11856">Labour</wd>
<space/>
</run>
</ln>
<ln l="1574" t="11938" r="1992" b="12120" baseLine="12067" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1574" t="11938" r="1992" b="12120">MPs)</wd>
</ln>
</para>
<para l="1574" t="12178" r="4968" b="12576" alignment="justified" spaceBefore="27" lsp="exactly" lspExact="217" language="en">
<ln l="1584" t="12178" r="4968" b="12360" baseLine="12307">
<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="0"><wd l="1584" t="12187" r="2328" b="12317">reiterated</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="2429" t="12178" r="2722" b="12360">(Mr</wd>
<space/>
<wd l="2813" t="12187" r="3245" b="12350">Blair,</wd>
<space/>
<wd l="3350" t="12187" r="3782" b="12350">ideas,</wd>
<space/>
<wd l="3888" t="12192" r="4032" b="12312">in</wd>
<space/>
<wd l="4123" t="12187" r="4675" b="12350">speech,</wd>
<space/>
<wd l="4781" t="12230" r="4968" b="12317">on</wd>
<space/>
</run>
</ln>
<ln l="1574" t="12394" r="2141" b="12576" baseLine="12528" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1574" t="12394" r="2141" b="12576">March)</wd>
</ln>
</para>
<para l="1589" t="12634" r="3802" b="12816" alignment="left" spaceBefore="18" lsp="exactly" lspExact="217" language="en">
<ln l="1589" t="12634" r="3802" b="12816" baseLine="12763">
<run italic="true" underlined="none" subsuperscript="none" fontSize="850" fontFace="Times New Roman" fontFamily="swiss" fontPitch="variable" spacing="6"><wd l="1589" t="12643" r="2131" b="12773">created</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6"><wd l="2218" t="12634" r="2510" b="12816">(Mr</wd>
<space/>
<wd l="2578" t="12643" r="3010" b="12806">Blair,</wd>
<space/>
<wd l="3091" t="12634" r="3802" b="12816">doctrine)</wd>
</run>
</ln>
</para>
<para l="1542" t="12979" r="1784" b="13008" alignment="left" spaceAfter="33" lsp="exactly" lspExact="240" language="en">
<ln l="1584" t="12979" r="1718" b="13008" baseLine="13003" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="22">
<wd l="1584" t="12984" r="1718" b="13008">...</wd>
</ln>
</para>
</frame>
<para l="1046" t="13272" r="5736" b="14659" alignment="justified" spaceBefore="134" lsp="exactly" lspExact="240" language="en">
<ln l="1051" t="13272" r="5731" b="13454" baseLine="13416" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="1051" t="13272" r="1272" b="13421">Of</wd>
<space/>
<wd l="1320" t="13325" r="1603" b="13421">our</wd>
<space/>
<wd l="1675" t="13282" r="1949" b="13416">121</wd>
<space/>
<wd l="2021" t="13282" r="2866" b="13421">consistent</wd>
<space/>
<wd l="2938" t="13277" r="3634" b="13454">clusters,</wd>
<space/>
<wd l="3715" t="13277" r="3893" b="13421">76</wd>
<space/>
<wd l="3960" t="13325" r="4354" b="13421">were</wd>
<space/>
<wd l="4416" t="13272" r="5170" b="13421">classified</wd>
<space/>
<wd l="5237" t="13325" r="5405" b="13421">as</wd>
<space/>
<wd l="5472" t="13277" r="5731" b="13421">be-</wd>
</ln>
<ln l="1046" t="13512" r="5736" b="13699" baseLine="13656" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="1046" t="13522" r="1310" b="13699">ing</wd>
<space/>
<wd l="1378" t="13512" r="1546" b="13661">of</wd>
<space/>
<wd l="1598" t="13517" r="1872" b="13661">the</wd>
<space/>
<wd l="1939" t="13531" r="2318" b="13699">type</wd>
<space/>
<wd l="2400" t="13517" r="2870" b="13661">’same</wd>
<space/>
<wd l="2942" t="13517" r="3677" b="13699">pattern’,</wd>
<space/>
<wd l="3763" t="13517" r="3955" b="13661">27</wd>
<space/>
<wd l="4022" t="13565" r="4190" b="13661">as</wd>
<space/>
<wd l="4262" t="13517" r="4728" b="13699">being</wd>
<space/>
<wd l="4800" t="13512" r="4963" b="13661">of</wd>
<space/>
<wd l="5016" t="13517" r="5294" b="13661">the</wd>
<space/>
<wd l="5357" t="13531" r="5736" b="13699">type</wd>
<space/>
</ln>
<ln l="1056" t="13752" r="5731" b="13939" baseLine="13891" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="1056" t="13757" r="1531" b="13901">’same</wd>
<space/>
<wd l="1589" t="13757" r="2064" b="13939">topic’</wd>
<space/>
<wd l="2136" t="13757" r="2448" b="13901">and</wd>
<space/>
<wd l="2520" t="13762" r="2702" b="13901">18</wd>
<space/>
<wd l="2770" t="13805" r="2933" b="13901">as</wd>
<space/>
<wd l="3000" t="13757" r="3470" b="13939">being</wd>
<space/>
<wd l="3528" t="13752" r="3696" b="13901">of</wd>
<space/>
<wd l="3739" t="13757" r="4013" b="13901">the</wd>
<space/>
<wd l="4075" t="13771" r="4454" b="13939">type</wd>
<space/>
<wd l="4526" t="13757" r="5232" b="13901">’relation</wd>
<space/>
<wd l="5290" t="13805" r="5731" b="13939">para-</wd>
</ln>
<ln l="1046" t="13992" r="5736" b="14179" baseLine="14131" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="1046" t="13997" r="1781" b="14179">phrases’.</wd>
<space/>
<wd l="1886" t="13992" r="2102" b="14141">As</wd>
<space/>
<wd l="2160" t="14045" r="2630" b="14179">many</wd>
<space/>
<wd l="2678" t="13992" r="2846" b="14141">of</wd>
<space/>
<wd l="2885" t="14045" r="3168" b="14141">our</wd>
<space/>
<wd l="3221" t="13997" r="3864" b="14141">clusters</wd>
<space/>
<wd l="3922" t="14002" r="4550" b="14141">contain</wd>
<space/>
<wd l="4598" t="14011" r="4906" b="14141">two</wd>
<space/>
<wd l="4958" t="14002" r="5736" b="14141">instances</wd>
<space/>
</ln>
<ln l="1046" t="14237" r="5736" b="14419" baseLine="14371" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="1046" t="14237" r="1440" b="14419">only,</wd>
<space/>
<wd l="1507" t="14285" r="1733" b="14381">we</wd>
<space/>
<wd l="1795" t="14285" r="2054" b="14381">are</wd>
<space/>
<wd l="2112" t="14237" r="2861" b="14419">planning</wd>
<space/>
<wd l="2914" t="14251" r="3091" b="14381">to</wd>
<space/>
<wd l="3154" t="14237" r="3792" b="14419">analyze</wd>
<space/>
<wd l="3850" t="14237" r="4546" b="14381">whether</wd>
<space/>
<wd l="4603" t="14285" r="5030" b="14381">some</wd>
<space/>
<wd l="5088" t="14237" r="5736" b="14381">clusters</wd>
<space/>
</ln>
<ln l="1046" t="14477" r="5410" b="14659" baseLine="14611" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="1046" t="14477" r="1603" b="14621">should</wd>
<space/>
<wd l="1680" t="14477" r="1877" b="14621">be</wd>
<space/>
<wd l="1949" t="14477" r="2573" b="14659">merged</wd>
<space/>
<wd l="2650" t="14477" r="2957" b="14621">and</wd>
<space/>
<wd l="3034" t="14477" r="3379" b="14621">how</wd>
<space/>
<wd l="3446" t="14477" r="3758" b="14621">this</wd>
<space/>
<wd l="3840" t="14477" r="4291" b="14621">could</wd>
<space/>
<wd l="4368" t="14477" r="4565" b="14621">be</wd>
<space/>
<wd l="4642" t="14477" r="5410" b="14621">achieved.</wd>
</ln>
</para>
<para l="1051" t="14880" r="3566" b="15024" alignment="left" spaceBefore="165" lsp="exactly" lspExact="243" language="en">
<ln l="1051" t="14880" r="3566" b="15024" baseLine="15014" underlined="none" subsuperscript="none" fontSize="1150" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="14">
<wd l="1051" t="14885" r="1382" b="15024">3.2.</wd>
<space/>
<wd l="1632" t="14880" r="2472" b="15024">Relation</wd>
<space/>
<wd l="2554" t="14880" r="3566" b="15024">extraction</wd>
</ln>
</para>
<para l="1042" t="15163" r="5736" b="15826" alignment="justified" spaceBefore="43" lsp="exactly" lspExact="236" language="en">
<ln l="1046" t="15163" r="5731" b="15350" baseLine="15302" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="15168" r="1224" b="15307">In</wd>
<space/>
<wd l="1282" t="15168" r="1728" b="15312">order</wd>
<space/>
<wd l="1781" t="15182" r="1954" b="15312">to</wd>
<space/>
<wd l="2016" t="15168" r="2722" b="15312">evaluate</wd>
<space/>
<wd l="2774" t="15168" r="3048" b="15312">the</wd>
<space/>
<wd l="3106" t="15163" r="4171" b="15350">performance</wd>
<space/>
<wd l="4234" t="15163" r="4397" b="15312">of</wd>
<space/>
<wd l="4440" t="15168" r="4714" b="15312">the</wd>
<space/>
<wd l="4771" t="15168" r="5429" b="15312">relation</wd>
<space/>
<wd l="5486" t="15216" r="5731" b="15312">ex-</wd>
</ln>
<ln l="1042" t="15408" r="5731" b="15590" baseLine="15542" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="15413" r="1728" b="15552">traction</wd>
<space/>
<wd l="1810" t="15422" r="2798" b="15590">component,</wd>
<space/>
<wd l="2894" t="15456" r="3115" b="15552">we</wd>
<space/>
<wd l="3202" t="15408" r="3994" b="15590">manually</wd>
<space/>
<wd l="4075" t="15408" r="4939" b="15552">annotated</wd>
<space/>
<wd l="5030" t="15413" r="5314" b="15552">550</wd>
<space/>
<wd l="5400" t="15456" r="5731" b="15552">sen-</wd>
</ln>
<ln l="1042" t="15638" r="5736" b="15826" baseLine="15782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="15658" r="1570" b="15787">tences</wd>
<space/>
<wd l="1642" t="15638" r="1810" b="15787">of</wd>
<space/>
<wd l="1862" t="15643" r="2136" b="15787">the</wd>
<space/>
<wd l="2203" t="15658" r="2515" b="15787">test</wd>
<space/>
<wd l="2592" t="15691" r="3149" b="15826">corpus</wd>
<space/>
<wd l="3226" t="15643" r="3432" b="15826">by</wd>
<space/>
<wd l="3494" t="15648" r="4138" b="15826">tagging</wd>
<space/>
<wd l="4205" t="15643" r="4406" b="15787">all</wd>
<space/>
<wd l="4478" t="15643" r="4829" b="15787">NEs</wd>
<space/>
<wd l="4906" t="15643" r="5218" b="15787">and</wd>
<space/>
<wd l="5285" t="15643" r="5736" b="15787">verbs</wd>
</ln>
</para>
</column>
<column l="6086" t="1395" r="10810" b="15835">
<para l="6086" t="1445" r="10795" b="4018" alignment="justified" lsp="exactly" lspExact="238" language="en">
<ln l="6101" t="1445" r="10790" b="1627" baseLine="1579" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="1445" r="6413" b="1589">and</wd>
<space/>
<wd l="6518" t="1445" r="7310" b="1627">manually</wd>
<space/>
<wd l="7411" t="1450" r="8285" b="1627">extracting</wd>
<space/>
<wd l="8386" t="1445" r="9312" b="1627">potentially</wd>
<space/>
<wd l="9413" t="1450" r="10325" b="1627">interesting</wd>
<space/>
<wd l="10416" t="1445" r="10790" b="1589">verb</wd>
<space/>
</ln>
<ln l="6101" t="1680" r="10786" b="1867" baseLine="1819" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="1685" r="6878" b="1829">relations.</wd>
<space/>
<wd l="6994" t="1685" r="7267" b="1829">We</wd>
<space/>
<wd l="7344" t="1680" r="7848" b="1829">define</wd>
<space/>
<wd l="7934" t="1685" r="8909" b="1867">’potentially</wd>
<space/>
<wd l="8981" t="1690" r="9893" b="1867">interesting</wd>
<space/>
<wd l="9960" t="1685" r="10334" b="1829">verb</wd>
<space/>
<wd l="10411" t="1685" r="10786" b="1829">rela-</wd>
</ln>
<ln l="6096" t="1906" r="10786" b="2112" baseLine="2059" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6096" t="1920" r="6485" b="2064">tion’</wd>
<space/>
<wd l="6576" t="1968" r="6739" b="2064">as</wd>
<space/>
<wd l="6826" t="1968" r="6922" b="2064">a</wd>
<space/>
<wd l="6998" t="1920" r="7368" b="2064">verb</wd>
<space/>
<wd l="7450" t="1920" r="8165" b="2102">together</wd>
<space/>
<wd l="8242" t="1920" r="8626" b="2064">with</wd>
<space/>
<wd l="8707" t="1925" r="8909" b="2064">its</wd>
<space/>
<wd l="8990" t="1934" r="9883" b="2102">arguments</wd>
<space/>
<wd l="9984" t="1906" r="10339" b="2112">(i.e.,</wd>
<space/>
<wd l="10435" t="1920" r="10786" b="2064">sub-</wd>
</ln>
<ln l="6086" t="2146" r="10790" b="2352" baseLine="2299" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6086" t="2165" r="6456" b="2342">ject,</wd>
<space/>
<wd l="6562" t="2160" r="7166" b="2342">objects</wd>
<space/>
<wd l="7262" t="2160" r="7574" b="2304">and</wd>
<space/>
<wd l="7666" t="2160" r="7925" b="2299">PP</wd>
<space/>
<wd l="8026" t="2146" r="9043" b="2352">arguments),</wd>
<space/>
<wd l="9144" t="2160" r="9653" b="2304">where</wd>
<space/>
<wd l="9744" t="2174" r="9907" b="2304">at</wd>
<space/>
<wd l="10003" t="2160" r="10387" b="2304">least</wd>
<space/>
<wd l="10483" t="2174" r="10790" b="2304">two</wd>
<space/>
</ln>
<ln l="6101" t="2395" r="10790" b="2582" baseLine="2534" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="2395" r="6269" b="2544">of</wd>
<space/>
<wd l="6350" t="2400" r="6624" b="2544">the</wd>
<space/>
<wd l="6725" t="2414" r="7618" b="2582">arguments</wd>
<space/>
<wd l="7723" t="2448" r="7982" b="2544">are</wd>
<space/>
<wd l="8078" t="2400" r="8434" b="2544">NEs</wd>
<space/>
<wd l="8534" t="2400" r="8846" b="2544">and</wd>
<space/>
<wd l="8952" t="2414" r="9110" b="2544">at</wd>
<space/>
<wd l="9221" t="2400" r="9605" b="2544">least</wd>
<space/>
<wd l="9710" t="2448" r="10003" b="2544">one</wd>
<space/>
<wd l="10104" t="2395" r="10272" b="2544">of</wd>
<space/>
<wd l="10354" t="2400" r="10790" b="2544">them</wd>
<space/>
</ln>
<ln l="6101" t="2635" r="10786" b="2822" baseLine="2774" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="2645" r="6226" b="2784">is</wd>
<space/>
<wd l="6298" t="2640" r="6576" b="2784">the</wd>
<space/>
<wd l="6648" t="2640" r="7262" b="2822">subject</wd>
<space/>
<wd l="7344" t="2688" r="7517" b="2784">or</wd>
<space/>
<wd l="7589" t="2688" r="7795" b="2784">an</wd>
<space/>
<wd l="7867" t="2640" r="8438" b="2822">object.</wd>
<space/>
<wd l="8558" t="2635" r="8818" b="2784">On</wd>
<space/>
<wd l="8885" t="2640" r="9158" b="2784">the</wd>
<space/>
<wd l="9235" t="2640" r="9648" b="2784">basis</wd>
<space/>
<wd l="9725" t="2635" r="9893" b="2784">of</wd>
<space/>
<wd l="9950" t="2640" r="10267" b="2784">this</wd>
<space/>
<wd l="10344" t="2645" r="10786" b="2784">crite-</wd>
</ln>
<ln l="6101" t="2875" r="10776" b="3062" baseLine="3014" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="2885" r="6485" b="3058">rion,</wd>
<space/>
<wd l="6552" t="2928" r="6773" b="3024">we</wd>
<space/>
<wd l="6830" t="2875" r="7315" b="3024">found</wd>
<space/>
<wd l="7382" t="2885" r="7560" b="3024">15</wd>
<space/>
<wd l="7627" t="2880" r="8554" b="3062">potentially</wd>
<space/>
<wd l="8611" t="2885" r="9518" b="3062">interesting</wd>
<space/>
<wd l="9571" t="2880" r="9941" b="3024">verb</wd>
<space/>
<wd l="10003" t="2880" r="10776" b="3024">relations.</wd>
<space/>
</ln>
<ln l="6101" t="3120" r="10795" b="3302" baseLine="3254" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="3120" r="6389" b="3264">For</wd>
<space/>
<wd l="6442" t="3120" r="6720" b="3264">the</wd>
<space/>
<wd l="6782" t="3168" r="7205" b="3264">same</wd>
<space/>
<wd l="7267" t="3134" r="8112" b="3298">sentences,</wd>
<space/>
<wd l="8179" t="3120" r="8453" b="3264">the</wd>
<space/>
<wd l="8515" t="3120" r="9019" b="3259">IDEX</wd>
<space/>
<wd l="9082" t="3134" r="9667" b="3302">system</wd>
<space/>
<wd l="9730" t="3120" r="10536" b="3264">extracted</wd>
<space/>
<wd l="10603" t="3120" r="10795" b="3264">27</wd>
<space/>
</ln>
<ln l="6101" t="3350" r="10795" b="3538" baseLine="3494" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="3355" r="6883" b="3533">relations,</wd>
<space/>
<wd l="7003" t="3360" r="7176" b="3494">11</wd>
<space/>
<wd l="7286" t="3350" r="7450" b="3499">of</wd>
<space/>
<wd l="7531" t="3355" r="7968" b="3499">them</wd>
<space/>
<wd l="8069" t="3355" r="9278" b="3538">corresponding</wd>
<space/>
<wd l="9365" t="3370" r="9538" b="3499">to</wd>
<space/>
<wd l="9634" t="3355" r="9907" b="3499">the</wd>
<space/>
<wd l="10003" t="3355" r="10795" b="3538">manually</wd>
<space/>
</ln>
<ln l="6101" t="3581" r="10790" b="3778" baseLine="3734" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="3595" r="6907" b="3739">extracted</wd>
<space/>
<wd l="6989" t="3643" r="7402" b="3739">ones.</wd>
<space/>
<wd l="7536" t="3595" r="7915" b="3739">This</wd>
<space/>
<wd l="7992" t="3595" r="8482" b="3778">yields</wd>
<space/>
<wd l="8568" t="3643" r="8664" b="3739">a</wd>
<space/>
<wd l="8741" t="3595" r="9197" b="3739">recall</wd>
<space/>
<wd l="9274" t="3595" r="9720" b="3739">value</wd>
<space/>
<wd l="9802" t="3590" r="9970" b="3739">of</wd>
<space/>
<wd l="10042" t="3581" r="10392" b="3749">73%</wd>
<space/>
<wd l="10478" t="3595" r="10790" b="3739">and</wd>
<space/>
</ln>
<ln l="6101" t="3821" r="8237" b="4018" baseLine="3970" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="3883" r="6197" b="3979">a</wd>
<space/>
<wd l="6269" t="3840" r="7027" b="4018">precision</wd>
<space/>
<wd l="7094" t="3835" r="7541" b="3979">value</wd>
<space/>
<wd l="7613" t="3830" r="7781" b="3979">of</wd>
<space/>
<wd l="7838" t="3821" r="8237" b="3989">41%.</wd>
</ln>
</para>
<para l="6096" t="4070" r="10805" b="5702" alignment="justified" lsp="exactly" lspExact="239" language="en">
<ln l="6101" t="4070" r="10795" b="4258" baseLine="4214" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="4075" r="6605" b="4219">There</wd>
<space/>
<wd l="6682" t="4123" r="7070" b="4219">were</wd>
<space/>
<wd l="7147" t="4090" r="7454" b="4219">two</wd>
<space/>
<wd l="7536" t="4090" r="7987" b="4258">types</wd>
<space/>
<wd l="8074" t="4070" r="8242" b="4219">of</wd>
<space/>
<wd l="8309" t="4075" r="8765" b="4219">recall</wd>
<space/>
<wd l="8846" t="4123" r="9379" b="4219">errors:</wd>
<space/>
<wd l="9509" t="4075" r="9965" b="4253">First,</wd>
<space/>
<wd l="10061" t="4123" r="10546" b="4219">errors</wd>
<space/>
<wd l="10632" t="4080" r="10795" b="4214">in</wd>
<space/>
</ln>
<ln l="6101" t="4315" r="10786" b="4498" baseLine="4450" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="4330" r="6821" b="4459">sentence</wd>
<space/>
<wd l="6902" t="4315" r="7728" b="4498">boundary</wd>
<space/>
<wd l="7810" t="4315" r="8645" b="4493">detection,</wd>
<space/>
<wd l="8736" t="4315" r="9326" b="4498">mainly</wd>
<space/>
<wd l="9403" t="4315" r="9706" b="4459">due</wd>
<space/>
<wd l="9787" t="4330" r="9960" b="4459">to</wd>
<space/>
<wd l="10042" t="4320" r="10488" b="4498">noisy</wd>
<space/>
<wd l="10565" t="4320" r="10786" b="4454">in-</wd>
</ln>
<ln l="6101" t="4541" r="10795" b="4747" baseLine="4690" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="4570" r="6384" b="4738">put</wd>
<space/>
<wd l="6466" t="4555" r="6850" b="4699">data</wd>
<space/>
<wd l="6926" t="4541" r="7330" b="4747">(e.g.,</wd>
<space/>
<wd l="7411" t="4560" r="8050" b="4738">missing</wd>
<space/>
<wd l="8117" t="4541" r="8861" b="4747">periods),</wd>
<space/>
<wd l="8938" t="4555" r="9442" b="4699">which</wd>
<space/>
<wd l="9509" t="4555" r="9854" b="4699">lead</wd>
<space/>
<wd l="9922" t="4570" r="10094" b="4699">to</wd>
<space/>
<wd l="10166" t="4560" r="10795" b="4738">parsing</wd>
<space/>
</ln>
<ln l="6101" t="4795" r="10790" b="4973" baseLine="4930" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="4843" r="6643" b="4973">errors,</wd>
<space/>
<wd l="6758" t="4795" r="7070" b="4939">and</wd>
<space/>
<wd l="7171" t="4795" r="7786" b="4973">second,</wd>
<space/>
<wd l="7901" t="4795" r="8333" b="4939">NER</wd>
<space/>
<wd l="8429" t="4843" r="8966" b="4973">errors,</wd>
<space/>
<wd l="9082" t="4800" r="9374" b="4973">i.e.,</wd>
<space/>
<wd l="9490" t="4795" r="9845" b="4939">NEs</wd>
<space/>
<wd l="9941" t="4795" r="10296" b="4939">that</wd>
<space/>
<wd l="10402" t="4843" r="10790" b="4939">were</wd>
<space/>
</ln>
<ln l="6101" t="5030" r="10795" b="5213" baseLine="5170" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="5045" r="6374" b="5174">not</wd>
<space/>
<wd l="6466" t="5030" r="7354" b="5213">recognised</wd>
<space/>
<wd l="7435" t="5078" r="7603" b="5174">as</wd>
<space/>
<wd l="7690" t="5030" r="8107" b="5174">such.</wd>
<space/>
<wd l="8242" t="5030" r="9024" b="5174">Precision</wd>
<space/>
<wd l="9106" t="5078" r="9595" b="5174">errors</wd>
<space/>
<wd l="9677" t="5030" r="10133" b="5174">could</wd>
<space/>
<wd l="10219" t="5030" r="10795" b="5213">mostly</wd>
<space/>
</ln>
<ln l="6101" t="5256" r="10805" b="5462" baseLine="5410" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6101" t="5270" r="6298" b="5414">be</wd>
<space/>
<wd l="6384" t="5270" r="6922" b="5414">traced</wd>
<space/>
<wd l="7008" t="5270" r="7402" b="5414">back</wd>
<space/>
<wd l="7483" t="5285" r="7656" b="5414">to</wd>
<space/>
<wd l="7738" t="5270" r="8016" b="5414">the</wd>
<space/>
<wd l="8102" t="5270" r="8530" b="5414">NER</wd>
<space/>
<wd l="8611" t="5285" r="9547" b="5453">component</wd>
<space/>
<wd l="9658" t="5256" r="10546" b="5462">(sequences</wd>
<space/>
<wd l="10637" t="5266" r="10805" b="5414">of</wd>
<space/>
</ln>
<ln l="6096" t="5496" r="9480" b="5702" baseLine="5645" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="6096" t="5510" r="6595" b="5654">words</wd>
<space/>
<wd l="6667" t="5558" r="7061" b="5654">were</wd>
<space/>
<wd l="7128" t="5510" r="7819" b="5693">wrongly</wd>
<space/>
<wd l="7891" t="5506" r="8683" b="5654">identified</wd>
<space/>
<wd l="8760" t="5558" r="8928" b="5654">as</wd>
<space/>
<wd l="9005" t="5496" r="9480" b="5702">NEs).</wd>
</ln>
</para>
<para l="6096" t="5750" r="10790" b="8328" alignment="justified" lsp="exactly" lspExact="239" language="en">
<ln l="6101" t="5750" r="10786" b="5933" baseLine="5890" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="5750" r="6278" b="5890">In</wd>
<space/>
<wd l="6370" t="5750" r="6648" b="5894">the</wd>
<space/>
<wd l="6749" t="5755" r="7037" b="5894">550</wd>
<space/>
<wd l="7133" t="5750" r="7925" b="5933">manually</wd>
<space/>
<wd l="8021" t="5750" r="8885" b="5894">annotated</wd>
<space/>
<wd l="8990" t="5765" r="9830" b="5928">sentences,</wd>
<space/>
<wd l="9955" t="5755" r="10334" b="5894">1300</wd>
<space/>
<wd l="10435" t="5750" r="10786" b="5894">NEs</wd>
<space/>
</ln>
<ln l="6096" t="5986" r="10786" b="6173" baseLine="6130" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6096" t="6038" r="6490" b="6134">were</wd>
<space/>
<wd l="6581" t="5986" r="7373" b="6134">identified</wd>
<space/>
<wd l="7469" t="6038" r="7632" b="6134">as</wd>
<space/>
<wd l="7728" t="5990" r="8083" b="6134">NEs</wd>
<space/>
<wd l="8179" t="5990" r="8386" b="6173">by</wd>
<space/>
<wd l="8467" t="5990" r="8741" b="6134">the</wd>
<space/>
<wd l="8832" t="5990" r="9264" b="6134">NER</wd>
<space/>
<wd l="9350" t="6005" r="10334" b="6173">component.</wd>
<space/>
<wd l="10502" t="5990" r="10786" b="6134">402</wd>
<space/>
</ln>
<ln l="6101" t="6230" r="10790" b="6413" baseLine="6365" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="6230" r="6456" b="6374">NEs</wd>
<space/>
<wd l="6605" t="6278" r="6998" b="6374">were</wd>
<space/>
<wd l="7147" t="6230" r="8035" b="6413">recognised</wd>
<space/>
<wd l="8189" t="6230" r="8942" b="6413">correctly</wd>
<space/>
<wd l="9091" t="6230" r="9298" b="6413">by</wd>
<space/>
<wd l="9442" t="6230" r="9715" b="6374">the</wd>
<space/>
<wd l="9869" t="6230" r="10339" b="6408">NER,</wd>
<space/>
<wd l="10507" t="6235" r="10790" b="6374">588</wd>
<space/>
</ln>
<ln l="6096" t="6466" r="10790" b="6653" baseLine="6605" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6096" t="6470" r="6792" b="6653">wrongly</wd>
<space/>
<wd l="6888" t="6470" r="7195" b="6614">and</wd>
<space/>
<wd l="7301" t="6475" r="7459" b="6610">in</wd>
<space/>
<wd l="7555" t="6475" r="7848" b="6614">310</wd>
<space/>
<wd l="7949" t="6518" r="8371" b="6614">cases</wd>
<space/>
<wd l="8477" t="6470" r="8842" b="6653">only</wd>
<space/>
<wd l="8938" t="6485" r="9370" b="6653">parts</wd>
<space/>
<wd l="9475" t="6466" r="9638" b="6614">of</wd>
<space/>
<wd l="9725" t="6518" r="9931" b="6614">an</wd>
<space/>
<wd l="10027" t="6470" r="10306" b="6610">NE</wd>
<space/>
<wd l="10402" t="6518" r="10790" b="6614">were</wd>
<space/>
</ln>
<ln l="6101" t="6710" r="10790" b="6893" baseLine="6845" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="6710" r="7032" b="6893">recognised.</wd>
<space/>
<wd l="7152" t="6710" r="7656" b="6854">These</wd>
<space/>
<wd l="7733" t="6715" r="8021" b="6854">310</wd>
<space/>
<wd l="8098" t="6758" r="8520" b="6854">cases</wd>
<space/>
<wd l="8602" t="6758" r="8894" b="6854">can</wd>
<space/>
<wd l="8971" t="6710" r="9168" b="6854">be</wd>
<space/>
<wd l="9245" t="6710" r="9869" b="6854">divided</wd>
<space/>
<wd l="9950" t="6715" r="10277" b="6854">into</wd>
<space/>
<wd l="10354" t="6710" r="10790" b="6854">three</wd>
<space/>
</ln>
<ln l="6101" t="6941" r="10786" b="7128" baseLine="7085" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="6994" r="6667" b="7128">groups</wd>
<space/>
<wd l="6754" t="6941" r="6922" b="7090">of</wd>
<space/>
<wd l="6989" t="6994" r="7526" b="7090">errors.</wd>
<space/>
<wd l="7661" t="6946" r="8117" b="7123">First,</wd>
<space/>
<wd l="8213" t="6946" r="8568" b="7090">NEs</wd>
<space/>
<wd l="8654" t="6946" r="9542" b="7128">recognised</wd>
<space/>
<wd l="9624" t="6946" r="10406" b="7128">correctly,</wd>
<space/>
<wd l="10502" t="6946" r="10786" b="7090">but</wd>
<space/>
</ln>
<ln l="6101" t="7181" r="10786" b="7368" baseLine="7325" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="7186" r="6706" b="7330">labeled</wd>
<space/>
<wd l="6792" t="7186" r="7176" b="7330">with</wd>
<space/>
<wd l="7258" t="7186" r="7531" b="7330">the</wd>
<space/>
<wd l="7613" t="7234" r="8146" b="7368">wrong</wd>
<space/>
<wd l="8227" t="7186" r="8510" b="7325">NE</wd>
<space/>
<wd l="8587" t="7200" r="9010" b="7368">type.</wd>
<space/>
<wd l="9163" t="7181" r="9806" b="7363">Second,</wd>
<space/>
<wd l="9907" t="7186" r="10272" b="7368">only</wd>
<space/>
<wd l="10354" t="7200" r="10786" b="7368">parts</wd>
<space/>
</ln>
<ln l="6101" t="7421" r="10786" b="7608" baseLine="7560" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="7421" r="6269" b="7570">of</wd>
<space/>
<wd l="6374" t="7426" r="6648" b="7570">the</wd>
<space/>
<wd l="6773" t="7426" r="7051" b="7565">NE</wd>
<space/>
<wd l="7171" t="7474" r="7560" b="7570">were</wd>
<space/>
<wd l="7685" t="7426" r="8573" b="7608">recognised</wd>
<space/>
<wd l="8698" t="7426" r="9480" b="7608">correctly,</wd>
<space/>
<wd l="9624" t="7474" r="9965" b="7608">e.g.,</wd>
<space/>
<wd l="10109" t="7426" r="10786" b="7570">“Touris-</wd>
</ln>
<ln l="6101" t="7661" r="10786" b="7848" baseLine="7800" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="7714" r="6442" b="7810">mus</wd>
<space/>
<wd l="6538" t="7666" r="7426" b="7848">Marketing</wd>
<space/>
<wd l="7522" t="7661" r="8160" b="7810">GmbH”</wd>
<space/>
<wd l="8256" t="7666" r="8866" b="7810">instead</wd>
<space/>
<wd l="8962" t="7661" r="9130" b="7810">of</wd>
<space/>
<wd l="9211" t="7666" r="9806" b="7810">“Berlin</wd>
<space/>
<wd l="9902" t="7666" r="10786" b="7810">Tourismus</wd>
<space/>
</ln>
<ln l="6101" t="7901" r="10790" b="8088" baseLine="8040" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="7906" r="6989" b="8088">Marketing</wd>
<space/>
<wd l="7080" t="7901" r="7757" b="8050">GmbH”.</wd>
<space/>
<wd l="7862" t="7906" r="8400" b="8083">Third,</wd>
<space/>
<wd l="8501" t="7906" r="8851" b="8050">NEs</wd>
<space/>
<wd l="8942" t="7910" r="9840" b="8088">containing</wd>
<space/>
<wd l="9926" t="7906" r="10790" b="8050">additional</wd>
<space/>
</ln>
<ln l="6096" t="8141" r="10291" b="8328" baseLine="8280" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6096" t="8146" r="6648" b="8323">words,</wd>
<space/>
<wd l="6730" t="8146" r="7109" b="8290">such</wd>
<space/>
<wd l="7176" t="8194" r="7344" b="8290">as</wd>
<space/>
<wd l="7421" t="8146" r="7838" b="8290">“the”</wd>
<space/>
<wd l="7915" t="8150" r="8074" b="8285">in</wd>
<space/>
<wd l="8146" t="8146" r="8491" b="8290">“the</wd>
<space/>
<wd l="8563" t="8146" r="9691" b="8328">Brandenburg</wd>
<space/>
<wd l="9768" t="8141" r="10291" b="8290">Gate”.</wd>
</ln>
</para>
<para l="6096" t="8381" r="10795" b="10488" alignment="justified" lsp="exactly" lspExact="239" language="en">
<ln l="6101" t="8381" r="10790" b="8568" baseLine="8520" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="8386" r="6322" b="8530">To</wd>
<space/>
<wd l="6389" t="8386" r="6864" b="8568">judge</wd>
<space/>
<wd l="6941" t="8386" r="7214" b="8530">the</wd>
<space/>
<wd l="7296" t="8381" r="8146" b="8530">usefulness</wd>
<space/>
<wd l="8227" t="8381" r="8395" b="8530">of</wd>
<space/>
<wd l="8458" t="8386" r="8731" b="8530">the</wd>
<space/>
<wd l="8813" t="8386" r="9614" b="8530">extracted</wd>
<space/>
<wd l="9701" t="8386" r="10478" b="8563">relations,</wd>
<space/>
<wd l="10570" t="8434" r="10790" b="8530">we</wd>
<space/>
</ln>
<ln l="6101" t="8621" r="10786" b="8808" baseLine="8760" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="8626" r="6725" b="8808">applied</wd>
<space/>
<wd l="6802" t="8626" r="7075" b="8770">the</wd>
<space/>
<wd l="7152" t="8621" r="7925" b="8808">following</wd>
<space/>
<wd l="7997" t="8621" r="8299" b="8770">soft</wd>
<space/>
<wd l="8386" t="8630" r="9149" b="8770">criterion:</wd>
<space/>
<wd l="9274" t="8621" r="9413" b="8765">A</wd>
<space/>
<wd l="9494" t="8626" r="10152" b="8770">relation</wd>
<space/>
<wd l="10229" t="8630" r="10349" b="8770">is</wd>
<space/>
<wd l="10435" t="8674" r="10786" b="8770">con-</wd>
</ln>
<ln l="6101" t="8856" r="10795" b="9043" baseLine="9000" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="8861" r="6701" b="9005">sidered</wd>
<space/>
<wd l="6758" t="8856" r="7253" b="9005">useful</wd>
<space/>
<wd l="7306" t="8856" r="7430" b="9000">if</wd>
<space/>
<wd l="7469" t="8866" r="7589" b="9005">it</wd>
<space/>
<wd l="7646" t="8909" r="8429" b="9043">expresses</wd>
<space/>
<wd l="8482" t="8861" r="8755" b="9005">the</wd>
<space/>
<wd l="8808" t="8866" r="9235" b="9005">main</wd>
<space/>
<wd l="9288" t="8856" r="10296" b="9005">information</wd>
<space/>
<wd l="10344" t="8866" r="10795" b="9043">given</wd>
<space/>
</ln>
<ln l="6101" t="9101" r="10786" b="9283" baseLine="9240" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="9101" r="6307" b="9283">by</wd>
<space/>
<wd l="6398" t="9101" r="6672" b="9245">the</wd>
<space/>
<wd l="6768" t="9115" r="7483" b="9245">sentence</wd>
<space/>
<wd l="7579" t="9149" r="7752" b="9245">or</wd>
<space/>
<wd l="7848" t="9101" r="8405" b="9278">clause,</wd>
<space/>
<wd l="8520" t="9106" r="8678" b="9240">in</wd>
<space/>
<wd l="8770" t="9101" r="9269" b="9245">which</wd>
<space/>
<wd l="9360" t="9101" r="9634" b="9245">the</wd>
<space/>
<wd l="9730" t="9101" r="10387" b="9245">relation</wd>
<space/>
<wd l="10478" t="9149" r="10786" b="9245">was</wd>
<space/>
</ln>
<ln l="6101" t="9336" r="10795" b="9523" baseLine="9475" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="9336" r="6629" b="9485">found.</wd>
<space/>
<wd l="6806" t="9336" r="7680" b="9523">According</wd>
<space/>
<wd l="7766" t="9355" r="7939" b="9485">to</wd>
<space/>
<wd l="8035" t="9341" r="8347" b="9485">this</wd>
<space/>
<wd l="8448" t="9346" r="9216" b="9518">criterion,</wd>
<space/>
<wd l="9326" t="9346" r="9562" b="9485">six</wd>
<space/>
<wd l="9653" t="9336" r="9821" b="9485">of</wd>
<space/>
<wd l="9898" t="9341" r="10171" b="9485">the</wd>
<space/>
<wd l="10267" t="9341" r="10795" b="9485">eleven</wd>
<space/>
</ln>
<ln l="6101" t="9576" r="10795" b="9763" baseLine="9715" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="9581" r="6835" b="9725">relations</wd>
<space/>
<wd l="6936" t="9581" r="7387" b="9725">could</wd>
<space/>
<wd l="7488" t="9581" r="7685" b="9725">be</wd>
<space/>
<wd l="7786" t="9581" r="8683" b="9725">considered</wd>
<space/>
<wd l="8784" t="9576" r="9322" b="9725">useful.</wd>
<space/>
<wd l="9504" t="9581" r="9840" b="9725">The</wd>
<space/>
<wd l="9936" t="9586" r="10795" b="9763">remaining</wd>
<space/>
</ln>
<ln l="6101" t="9816" r="10786" b="10003" baseLine="9955" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="9816" r="6394" b="9965">five</wd>
<space/>
<wd l="6509" t="9821" r="7238" b="9965">relations</wd>
<space/>
<wd l="7358" t="9821" r="7882" b="9965">lacked</wd>
<space/>
<wd l="8002" t="9869" r="8424" b="9965">some</wd>
<space/>
<wd l="8539" t="9821" r="9211" b="9965">relevant</wd>
<space/>
<wd l="9331" t="9835" r="9682" b="10003">part</wd>
<space/>
<wd l="9806" t="9816" r="9970" b="9965">of</wd>
<space/>
<wd l="10066" t="9821" r="10339" b="9965">the</wd>
<space/>
<wd l="10454" t="9869" r="10786" b="9965">sen-</wd>
</ln>
<ln l="6096" t="10042" r="10790" b="10248" baseLine="10195" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="10042" r="7171" b="10248">tence/clause</wd>
<space/>
<wd l="7286" t="10042" r="7685" b="10248">(e.g.,</wd>
<space/>
<wd l="7805" t="10104" r="7901" b="10200">a</wd>
<space/>
<wd l="8002" t="10056" r="8568" b="10200">crucial</wd>
<space/>
<wd l="8669" t="10070" r="9019" b="10238">part</wd>
<space/>
<wd l="9130" t="10051" r="9298" b="10200">of</wd>
<space/>
<wd l="9389" t="10104" r="9595" b="10200">an</wd>
<space/>
<wd l="9691" t="10056" r="10018" b="10234">NE,</wd>
<space/>
<wd l="10128" t="10056" r="10421" b="10200">like</wd>
<space/>
<wd l="10517" t="10056" r="10790" b="10200">the</wd>
<space/>
</ln>
<ln l="6110" t="10282" r="8045" b="10488" baseLine="10435" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6110" t="10291" r="6557" b="10440">’ICC’</wd>
<space/>
<wd l="6638" t="10301" r="6802" b="10435">in</wd>
<space/>
<wd l="6878" t="10291" r="7272" b="10440">’ICC</wd>
<space/>
<wd l="7354" t="10282" r="8045" b="10488">Berlin’).</wd>
</ln>
</para>
<para l="6874" t="10757" r="10018" b="10930" alignment="centered" spaceBefore="222" lsp="exactly" lspExact="274" language="en">
<ln l="6874" t="10757" r="10018" b="10930" baseLine="10925" underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="19">
<wd l="6874" t="10766" r="7061" b="10925">4.</wd>
<space/>
<wd l="7354" t="10757" r="8285" b="10930">Possible</wd>
<space/>
<wd l="8386" t="10757" r="10018" b="10930">enhancements</wd>
</ln>
</para>
<para l="6096" t="11093" r="10795" b="14352" alignment="justified" spaceBefore="51" lsp="exactly" lspExact="240" language="en">
<ln l="6096" t="11093" r="10790" b="11280" baseLine="11237" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="11098" r="6547" b="11242">With</wd>
<space/>
<wd l="6624" t="11098" r="6989" b="11280">only</wd>
<space/>
<wd l="7075" t="11102" r="7253" b="11242">15</wd>
<space/>
<wd l="7339" t="11098" r="8131" b="11280">manually</wd>
<space/>
<wd l="8208" t="11098" r="9010" b="11242">extracted</wd>
<space/>
<wd l="9091" t="11098" r="9821" b="11242">relations</wd>
<space/>
<wd l="9907" t="11112" r="10181" b="11242">out</wd>
<space/>
<wd l="10267" t="11093" r="10435" b="11242">of</wd>
<space/>
<wd l="10507" t="11102" r="10790" b="11242">550</wd>
<space/>
</ln>
<ln l="6101" t="11333" r="10795" b="11520" baseLine="11477" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="11352" r="6946" b="11515">sentences,</wd>
<space/>
<wd l="7013" t="11386" r="7238" b="11482">we</wd>
<space/>
<wd l="7296" t="11386" r="7910" b="11482">assume</wd>
<space/>
<wd l="7963" t="11338" r="8318" b="11482">that</wd>
<space/>
<wd l="8386" t="11386" r="8669" b="11482">our</wd>
<space/>
<wd l="8726" t="11333" r="9538" b="11482">definition</wd>
<space/>
<wd l="9595" t="11333" r="9763" b="11482">of</wd>
<space/>
<wd l="9821" t="11338" r="10795" b="11520">’potentially</wd>
<space/>
</ln>
<ln l="6101" t="11578" r="10786" b="11760" baseLine="11712" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="11582" r="7013" b="11760">interesting</wd>
<space/>
<wd l="7085" t="11578" r="7786" b="11722">relation’</wd>
<space/>
<wd l="7872" t="11582" r="7997" b="11722">is</wd>
<space/>
<wd l="8069" t="11592" r="8347" b="11722">too</wd>
<space/>
<wd l="8424" t="11582" r="8918" b="11755">strict,</wd>
<space/>
<wd l="9005" t="11578" r="9317" b="11722">and</wd>
<space/>
<wd l="9389" t="11578" r="9744" b="11722">that</wd>
<space/>
<wd l="9830" t="11626" r="10253" b="11722">more</wd>
<space/>
<wd l="10330" t="11582" r="10786" b="11722">inter-</wd>
</ln>
<ln l="6101" t="11818" r="10786" b="12000" baseLine="11952" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="11822" r="6610" b="12000">esting</wd>
<space/>
<wd l="6662" t="11818" r="7397" b="11962">relations</wd>
<space/>
<wd l="7459" t="11818" r="7910" b="11962">could</wd>
<space/>
<wd l="7973" t="11818" r="8170" b="11962">be</wd>
<space/>
<wd l="8232" t="11818" r="9034" b="11962">extracted</wd>
<space/>
<wd l="9096" t="11818" r="9302" b="12000">by</wd>
<space/>
<wd l="9355" t="11818" r="10157" b="12000">loosening</wd>
<space/>
<wd l="10205" t="11818" r="10478" b="11962">the</wd>
<space/>
<wd l="10541" t="11866" r="10786" b="11962">ex-</wd>
</ln>
<ln l="6096" t="12058" r="10795" b="12240" baseLine="12192" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="12062" r="6782" b="12202">traction</wd>
<space/>
<wd l="6859" t="12062" r="7622" b="12202">criterion.</wd>
<space/>
<wd l="7738" t="12058" r="7958" b="12202">To</wd>
<space/>
<wd l="8035" t="12062" r="8952" b="12240">investigate</wd>
<space/>
<wd l="9029" t="12106" r="9230" b="12202">on</wd>
<space/>
<wd l="9307" t="12058" r="9648" b="12202">how</wd>
<space/>
<wd l="9720" t="12058" r="9994" b="12202">the</wd>
<space/>
<wd l="10070" t="12062" r="10795" b="12202">criterion</wd>
<space/>
</ln>
<ln l="6101" t="12293" r="10795" b="12475" baseLine="12432" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="12293" r="6557" b="12437">could</wd>
<space/>
<wd l="6643" t="12293" r="6840" b="12437">be</wd>
<space/>
<wd l="6926" t="12293" r="7704" b="12470">loosened,</wd>
<space/>
<wd l="7795" t="12341" r="8021" b="12437">we</wd>
<space/>
<wd l="8107" t="12293" r="8842" b="12475">analysed</wd>
<space/>
<wd l="8933" t="12293" r="9134" b="12437">all</wd>
<space/>
<wd l="9216" t="12293" r="9667" b="12437">those</wd>
<space/>
<wd l="9754" t="12307" r="10546" b="12437">sentences</wd>
<space/>
<wd l="10632" t="12298" r="10795" b="12432">in</wd>
<space/>
</ln>
<ln l="6096" t="12533" r="10795" b="12715" baseLine="12672" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="12533" r="6370" b="12677">the</wd>
<space/>
<wd l="6422" t="12547" r="6730" b="12677">test</wd>
<space/>
<wd l="6792" t="12581" r="7349" b="12715">corpus</wd>
<space/>
<wd l="7402" t="12533" r="7757" b="12677">that</wd>
<space/>
<wd l="7814" t="12533" r="8640" b="12677">contained</wd>
<space/>
<wd l="8698" t="12547" r="8861" b="12677">at</wd>
<space/>
<wd l="8923" t="12533" r="9307" b="12677">least</wd>
<space/>
<wd l="9360" t="12547" r="9667" b="12677">two</wd>
<space/>
<wd l="9725" t="12533" r="10075" b="12677">NEs</wd>
<space/>
<wd l="10133" t="12538" r="10291" b="12672">in</wd>
<space/>
<wd l="10344" t="12533" r="10795" b="12677">order</wd>
<space/>
</ln>
<ln l="6096" t="12768" r="10786" b="12955" baseLine="12907" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="12787" r="6269" b="12917">to</wd>
<space/>
<wd l="6331" t="12768" r="6653" b="12917">find</wd>
<space/>
<wd l="6715" t="12787" r="6984" b="12917">out</wd>
<space/>
<wd l="7046" t="12773" r="7742" b="12917">whether</wd>
<space/>
<wd l="7800" t="12821" r="8227" b="12917">some</wd>
<space/>
<wd l="8285" t="12778" r="9197" b="12955">interesting</wd>
<space/>
<wd l="9250" t="12773" r="9979" b="12917">relations</wd>
<space/>
<wd l="10037" t="12821" r="10430" b="12917">were</wd>
<space/>
<wd l="10488" t="12773" r="10786" b="12917">lost</wd>
<space/>
</ln>
<ln l="6101" t="13008" r="10790" b="13195" baseLine="13147" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13013" r="6307" b="13195">by</wd>
<space/>
<wd l="6370" t="13013" r="6643" b="13157">the</wd>
<space/>
<wd l="6710" t="13008" r="7522" b="13157">definition</wd>
<space/>
<wd l="7589" t="13013" r="7901" b="13157">and</wd>
<space/>
<wd l="7968" t="13013" r="8314" b="13157">how</wd>
<space/>
<wd l="8376" t="13013" r="8650" b="13157">the</wd>
<space/>
<wd l="8717" t="13008" r="9528" b="13157">definition</wd>
<space/>
<wd l="9590" t="13013" r="10099" b="13157">would</wd>
<space/>
<wd l="10171" t="13013" r="10555" b="13157">have</wd>
<space/>
<wd l="10618" t="13027" r="10790" b="13157">to</wd>
<space/>
</ln>
<ln l="6101" t="13253" r="10786" b="13435" baseLine="13387" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13253" r="6298" b="13397">be</wd>
<space/>
<wd l="6374" t="13253" r="7066" b="13435">changed</wd>
<space/>
<wd l="7142" t="13258" r="7306" b="13392">in</wd>
<space/>
<wd l="7378" t="13253" r="7829" b="13397">order</wd>
<space/>
<wd l="7896" t="13267" r="8069" b="13397">to</wd>
<space/>
<wd l="8146" t="13253" r="8659" b="13397">detect</wd>
<space/>
<wd l="8741" t="13253" r="9182" b="13397">these</wd>
<space/>
<wd l="9254" t="13253" r="10032" b="13397">relations.</wd>
<space/>
<wd l="10147" t="13253" r="10483" b="13397">The</wd>
<space/>
<wd l="10550" t="13267" r="10786" b="13397">ta-</wd>
</ln>
<ln l="6101" t="13488" r="10790" b="13675" baseLine="13627" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13493" r="6350" b="13637">ble</wd>
<space/>
<wd l="6413" t="13498" r="6576" b="13632">in</wd>
<space/>
<wd l="6634" t="13493" r="7190" b="13675">Figure</wd>
<space/>
<wd l="7253" t="13498" r="7339" b="13637">6</wd>
<space/>
<wd l="7411" t="13493" r="7742" b="13637">lists</wd>
<space/>
<wd l="7810" t="13541" r="8237" b="13637">some</wd>
<space/>
<wd l="8299" t="13498" r="9264" b="13675">suggestions</wd>
<space/>
<wd l="9336" t="13488" r="9499" b="13637">of</wd>
<space/>
<wd l="9552" t="13493" r="9893" b="13637">how</wd>
<space/>
<wd l="9950" t="13493" r="10267" b="13637">this</wd>
<space/>
<wd l="10334" t="13493" r="10790" b="13637">could</wd>
<space/>
</ln>
<ln l="6101" t="13728" r="10790" b="13910" baseLine="13867" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13728" r="6298" b="13872">be</wd>
<space/>
<wd l="6384" t="13728" r="7157" b="13906">achieved,</wd>
<space/>
<wd l="7248" t="13728" r="7968" b="13910">together</wd>
<space/>
<wd l="8045" t="13728" r="8434" b="13872">with</wd>
<space/>
<wd l="8515" t="13728" r="9221" b="13910">example</wd>
<space/>
<wd l="9307" t="13728" r="10037" b="13872">relations</wd>
<space/>
<wd l="10123" t="13728" r="10435" b="13872">and</wd>
<space/>
<wd l="10517" t="13728" r="10790" b="13872">the</wd>
<space/>
</ln>
<ln l="6101" t="13963" r="10790" b="14112" baseLine="14107" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13968" r="6754" b="14112">number</wd>
<space/>
<wd l="6821" t="13963" r="6989" b="14112">of</wd>
<space/>
<wd l="7042" t="13968" r="7906" b="14112">additional</wd>
<space/>
<wd l="7973" t="13968" r="8702" b="14112">relations</wd>
<space/>
<wd l="8770" t="13968" r="9125" b="14112">that</wd>
<space/>
<wd l="9197" t="13968" r="9653" b="14112">could</wd>
<space/>
<wd l="9720" t="13968" r="9922" b="14112">be</wd>
<space/>
<wd l="9984" t="13968" r="10790" b="14112">extracted</wd>
<space/>
</ln>
<ln l="6101" t="14203" r="8506" b="14352" baseLine="14342" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="14203" r="6499" b="14352">from</wd>
<space/>
<wd l="6566" t="14208" r="6840" b="14352">the</wd>
<space/>
<wd l="6922" t="14213" r="7205" b="14352">550</wd>
<space/>
<wd l="7277" t="14222" r="7589" b="14352">test</wd>
<space/>
<wd l="7670" t="14222" r="8506" b="14352">sentences.</wd>
</ln>
</para>
<para l="6096" t="14448" r="10795" b="15826" alignment="justified" lsp="exactly" lspExact="238" language="en">
<ln l="6101" t="14448" r="10790" b="14630" baseLine="14587" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">
<wd l="6101" t="14448" r="6278" b="14587">In</wd>
<space/>
<wd l="6446" t="14448" r="7200" b="14626">addition,</wd>
<space/>
<wd l="7402" t="14496" r="7829" b="14592">more</wd>
<space/>
<wd l="7992" t="14453" r="8904" b="14630">interesting</wd>
<space/>
<wd l="9067" t="14448" r="9797" b="14592">relations</wd>
<space/>
<wd l="9970" t="14448" r="10426" b="14592">could</wd>
<space/>
<wd l="10594" t="14448" r="10790" b="14592">be</wd>
<space/>
</ln>
<ln l="6101" t="14683" r="10790" b="14870" baseLine="14822" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">
<wd l="6101" t="14683" r="6586" b="14832">found</wd>
<space/>
<wd l="6706" t="14688" r="7090" b="14832">with</wd>
<space/>
<wd l="7210" t="14736" r="7416" b="14832">an</wd>
<space/>
<wd l="7536" t="14688" r="7963" b="14832">NER</wd>
<space/>
<wd l="8083" t="14702" r="9019" b="14870">component</wd>
<space/>
<wd l="9149" t="14688" r="9917" b="14832">extended</wd>
<space/>
<wd l="10042" t="14688" r="10248" b="14870">by</wd>
<space/>
<wd l="10368" t="14736" r="10790" b="14832">more</wd>
<space/>
</ln>
<ln l="6096" t="14923" r="10795" b="15110" baseLine="15062" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">
<wd l="6096" t="14942" r="6600" b="15110">types,</wd>
<space/>
<wd l="6710" t="14976" r="7051" b="15110">e.g.,</wd>
<space/>
<wd l="7162" t="14923" r="7714" b="15067">DATE</wd>
<space/>
<wd l="7810" t="14928" r="8122" b="15072">and</wd>
<space/>
<wd l="8218" t="14928" r="8966" b="15072">EVENT.</wd>
<space/>
<wd l="9082" t="14923" r="9542" b="15110">Open</wd>
<space/>
<wd l="9638" t="14928" r="10272" b="15072">domain</wd>
<space/>
<wd l="10368" t="14928" r="10795" b="15072">NER</wd>
<space/>
</ln>
<ln l="6101" t="15163" r="10790" b="15350" baseLine="15302" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">
<wd l="6101" t="15216" r="6461" b="15350">may</wd>
<space/>
<wd l="6557" t="15168" r="6754" b="15312">be</wd>
<space/>
<wd l="6854" t="15163" r="7349" b="15312">useful</wd>
<space/>
<wd l="7450" t="15173" r="7608" b="15307">in</wd>
<space/>
<wd l="7704" t="15168" r="8150" b="15312">order</wd>
<space/>
<wd l="8242" t="15182" r="8419" b="15312">to</wd>
<space/>
<wd l="8515" t="15182" r="9115" b="15312">extract</wd>
<space/>
<wd l="9221" t="15168" r="9571" b="15312">NEs</wd>
<space/>
<wd l="9677" t="15163" r="9840" b="15312">of</wd>
<space/>
<wd l="9926" t="15168" r="10790" b="15312">additional</wd>
<space/>
</ln>
<ln l="6096" t="15403" r="10786" b="15590" baseLine="15542" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">
<wd l="6096" t="15422" r="6595" b="15590">types.</wd>
<space/>
<wd l="6773" t="15403" r="7195" b="15586">Also,</wd>
<space/>
<wd l="7306" t="15408" r="7757" b="15552">other</wd>
<space/>
<wd l="7848" t="15422" r="8299" b="15590">types</wd>
<space/>
<wd l="8400" t="15403" r="8568" b="15552">of</wd>
<space/>
<wd l="8650" t="15408" r="9379" b="15552">relations</wd>
<space/>
<wd l="9480" t="15408" r="9936" b="15552">could</wd>
<space/>
<wd l="10037" t="15408" r="10234" b="15552">be</wd>
<space/>
<wd l="10330" t="15413" r="10786" b="15552">inter-</wd>
</ln>
<ln l="6101" t="15643" r="10781" b="15826" baseLine="15782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">
<wd l="6101" t="15648" r="6648" b="15826">esting,</wd>
<space/>
<wd l="6792" t="15643" r="7166" b="15787">such</wd>
<space/>
<wd l="7286" t="15691" r="7454" b="15787">as</wd>
<space/>
<wd l="7574" t="15643" r="8309" b="15787">relations</wd>
<space/>
<wd l="8429" t="15643" r="9130" b="15787">between</wd>
<space/>
<wd l="9245" t="15643" r="10258" b="15787">coordinated</wd>
<space/>
<wd l="10382" t="15643" r="10781" b="15821">NEs,</wd>
</ln>
</para>
</column>
</section>
</body>
</page>
<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">
<description>
<source file="pdf\L08-1001.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>
<theoreticalPage size="A4" marginLeft="1035" marginTop="1360" marginRight="1092" marginBottom="995" offsetX="32" offsetY="16" width="11918" height="16854"/>
<language>en</language>
</description>
<body>
<section l="1035" t="1360" r="10811" b="6447">
<column l="1035" t="1360" r="10811" b="6447">
<table l="1459" t="1382" r="10378" b="5179" alignment="left" li="424" ri="433" spaceBefore="22" spaceAfter="169">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<gridTable>
<gridCol>2520</gridCol>
<gridCol>4214</gridCol>
<gridCol>2185</gridCol>
<gridRow>254</gridRow>
<gridRow>1124</gridRow>
<gridRow>724</gridRow>
<gridRow>965</gridRow>
<gridRow>730</gridRow>
</gridTable>
<cell gridColFrom="0" gridColTill="0" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="2410" t="1421" r="3038" b="1603" alignment="centered" spaceAfter="15" lsp="exactly" lspExact="230" language="en">
<ln l="2410" t="1421" r="3038" b="1603" baseLine="1555" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">
<wd l="2410" t="1421" r="3038" b="1603">option</wd>
</ln>
</para>
</cell>
<cell gridColFrom="1" gridColTill="1" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="5683" t="1421" r="6499" b="1603" alignment="centered" spaceAfter="15" lsp="exactly" lspExact="230" language="en">
<ln l="5683" t="1421" r="6499" b="1603" baseLine="1555" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">
<wd l="5683" t="1421" r="6499" b="1603">example</wd>
</ln>
</para>
</cell>
<cell gridColFrom="2" gridColTill="2" gridRowFrom="0" gridRowTill="0" alignment="left" verticalAlignment="middle">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="8323" t="1421" r="10248" b="1565" alignment="centered" spaceAfter="15" lsp="exactly" lspExact="230" language="en">
<ln l="8323" t="1421" r="10248" b="1565" baseLine="1555" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="11">
<wd l="8323" t="1421" r="9317" b="1565">additional</wd>
<space/>
<wd l="9398" t="1421" r="10248" b="1565">relations</wd>
</ln>
</para>
</cell>
<cell gridColFrom="0" gridColTill="0" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="top">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="1594" t="1670" r="3840" b="1843" alignment="left" li="72" lsp="exactly" lspExact="217" language="en">
<tabs position="1594"/>
<tabs alignment="right" position="1843" leaderChar=" "/>
<ln l="1594" t="1670" r="3840" b="1843" baseLine="1805" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1594" t="1685" r="2400" b="1810">extraction</wd>
<tab position="2400"/>
<wd l="2688" t="1675" r="2842" b="1810">of</wd>
<tab position="2842"/>
<wd l="3120" t="1680" r="3840" b="1843">relations,</wd>
</ln>
</para>
<para l="1589" t="1891" r="3850" b="2688" alignment="justified" li="72" ri="108" spaceBefore="5" spaceAfter="23" lsp="exactly" lspExact="217" language="en">
<ln l="1589" t="1891" r="3850" b="2030" baseLine="2021" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">
<wd l="1589" t="1901" r="2054" b="2030">where</wd>
<space/>
<wd l="2184" t="1901" r="2434" b="2030">the</wd>
<space/>
<wd l="2573" t="1901" r="2827" b="2026">NE</wd>
<space/>
<wd l="2962" t="1906" r="3077" b="2030">is</wd>
<space/>
<wd l="3211" t="1915" r="3466" b="2030">not</wd>
<space/>
<wd l="3600" t="1901" r="3850" b="2030">the</wd>
<space/>
</ln>
<ln l="1594" t="2112" r="3850" b="2285" baseLine="2242" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">
<wd l="1594" t="2122" r="2299" b="2285">complete</wd>
<space/>
<wd l="2395" t="2122" r="3005" b="2285">subject,</wd>
<space/>
<wd l="3115" t="2122" r="3595" b="2285">object</wd>
<space/>
<wd l="3696" t="2165" r="3850" b="2251">or</wd>
<space/>
</ln>
<ln l="1594" t="2328" r="3845" b="2501" baseLine="2462" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">
<wd l="1594" t="2338" r="1834" b="2462">PP</wd>
<space/>
<wd l="1906" t="2352" r="2702" b="2501">argument,</wd>
<space/>
<wd l="2779" t="2338" r="3043" b="2467">but</wd>
<space/>
<wd l="3115" t="2338" r="3456" b="2501">only</wd>
<space/>
<wd l="3523" t="2352" r="3845" b="2501">part</wd>
<space/>
</ln>
<ln l="1594" t="2554" r="1910" b="2688" baseLine="2678" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">
<wd l="1594" t="2554" r="1747" b="2688">of</wd>
<space/>
<wd l="1800" t="2563" r="1910" b="2688">it</wd>
</ln>
</para>
</cell>
<cell gridColFrom="1" gridColTill="1" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="top">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="4133" t="1862" r="8059" b="2050" alignment="centered" spaceBefore="188" lsp="exactly" lspExact="239" language="en">
<tabs position="4133"/>
<tabs alignment="right" position="2050" leaderChar=" "/>
<ln l="4133" t="1862" r="8059" b="2050" baseLine="2002" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="4133" t="1862" r="5227" b="2050">Co-operation</wd>
<tab position="5227"/>
<wd l="5770" t="1867" r="6125" b="2011">with</wd>
<tab position="6125"/>
<wd l="6672" t="1862" r="8059" b="2016">&lt;ORG&gt;M.A.X.</wd>
</ln>
</para>
<para l="4109" t="2093" r="8083" b="2534" alignment="left" li="144" spaceAfter="207" lsp="exactly" lspExact="240" language="en">
<tabs position="4109"/>
<tabs alignment="left" position="2534" leaderChar=" "/>
<tabs alignment="right" position="4104" leaderChar=" "/>
<ln l="4118" t="2093" r="8083" b="2299" baseLine="2242" forcedEOF="true">
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4118" t="2093" r="5352" b="2299">2001&lt;\ORG&gt;</wd>
<tab position="5352"/>
</run>
<wd l="5654" t="2093" r="6778" b="2299"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">V</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">is</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;\</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">V</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
</wd>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><tab position="6778"/>
</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7070" t="2107" r="7637" b="2290">clearly</wd>
<tab position="7637"/>
<wd l="7915" t="2102" r="8083" b="2251">of</wd>
</run>
</ln>
<ln l="4109" t="2328" r="7133" b="2534" baseLine="2482" forcedEOF="true">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4109" t="2338" r="4685" b="2486">benefit</wd>
<space/>
<wd l="4762" t="2357" r="4934" b="2486">to</wd>
<space/>
</run>
<wd l="5016" t="2328" r="7133" b="2534"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ORG</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">BTM</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;\</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ORG</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>
</run>
</ln>
</para>
</cell>
<cell gridColFrom="2" gridColTill="2" gridRowFrom="1" gridRowTill="1" alignment="left" verticalAlignment="middle">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="9192" t="2112" r="9374" b="2251" alignment="centered" spaceBefore="420" spaceAfter="454" lsp="exactly" lspExact="240" language="en">
<ln l="9192" t="2112" r="9374" b="2251" baseLine="2242" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-6">
<wd l="9192" t="2112" r="9374" b="2251">25</wd>
</ln>
</para>
</cell>
<cell gridColFrom="0" gridColTill="0" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="top">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="1594" t="2923" r="3854" b="3317" alignment="left" li="108" ri="108" spaceBefore="129" spaceAfter="147" lsp="exactly" lspExact="217" language="en">
<ln l="1594" t="2923" r="3854" b="3062" baseLine="3058" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1594" t="2938" r="2400" b="3062">extraction</wd>
<space/>
<wd l="2491" t="2928" r="2645" b="3062">of</wd>
<space/>
<wd l="2726" t="2933" r="3403" b="3062">relations</wd>
<space/>
<wd l="3494" t="2933" r="3854" b="3062">with</wd>
<space/>
</ln>
<ln l="1594" t="3154" r="2722" b="3317" baseLine="3274" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1594" t="3197" r="1680" b="3283">a</wd>
<space/>
<wd l="1747" t="3154" r="2400" b="3317">complex</wd>
<space/>
<wd l="2462" t="3154" r="2722" b="3283">VP</wd>
</ln>
</para>
</cell>
<cell gridColFrom="1" gridColTill="1" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="top">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="4109" t="2774" r="8088" b="3461" alignment="left" li="108" spaceAfter="6" lsp="exactly" lspExact="234" language="en">
<ln l="4118" t="2774" r="8088" b="2981" baseLine="2928">
<wd l="4118" t="2774" r="6178" b="2981"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ORG</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">BTM</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;\</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ORG</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
</wd>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>
<wd l="6322" t="2789" r="7354" b="2938">&lt;V&gt;invited</wd>
<space/>
<wd l="7474" t="2789" r="7781" b="2933">and</wd>
<space/>
<wd l="7906" t="2837" r="8088" b="2933">or</wd>
<space/>
</run>
</ln>
<ln l="4118" t="3014" r="8059" b="3221" baseLine="3168">
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4118" t="3014" r="5458" b="3221">supported&lt;\V&gt;</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5568" t="3077" r="5995" b="3173">more</wd>
<space/>
<wd l="6086" t="3029" r="6485" b="3173">than</wd>
<space/>
<wd l="6590" t="3034" r="7022" b="3206">1,000</wd>
<space/>
<wd l="7123" t="3029" r="7637" b="3173">media</wd>
<space/>
<wd l="7733" t="3077" r="8059" b="3211">rep-</wd>
<space/>
</run>
</ln>
<ln l="4109" t="3254" r="7546" b="3461" baseLine="3403">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4109" t="3274" r="5112" b="3413">resentatives</wd>
<space/>
<wd l="5189" t="3274" r="5347" b="3408">in</wd>
<space/>
</run>
<wd l="5429" t="3254" r="7546" b="3461"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">LOC</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Berlin</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;\</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">LOC</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>
</run>
</ln>
</para>
</cell>
<cell gridColFrom="2" gridColTill="2" gridRowFrom="2" gridRowTill="2" alignment="left" verticalAlignment="middle">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="9245" t="3034" r="9336" b="3178" alignment="centered" spaceBefore="222" spaceAfter="248" lsp="exactly" lspExact="240" language="en">
<ln l="9245" t="3034" r="9336" b="3178" baseLine="3168" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="9245" t="3034" r="9336" b="3178">7</wd>
</ln>
</para>
</cell>
<cell gridColFrom="0" gridColTill="0" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="1594" t="3763" r="3845" b="3941" alignment="left" li="72" spaceBefore="250" lsp="exactly" lspExact="216" language="en">
<tabs position="1594"/>
<ln l="1594" t="3763" r="3845" b="3941" baseLine="3902" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1594" t="3778" r="2376" b="3907">resolution</wd>
<space/>
<wd l="2515" t="3773" r="2674" b="3907">of</wd>
<space/>
<wd l="2803" t="3778" r="3384" b="3907">relative</wd>
<tab position="3384"/>
<wd l="3533" t="3821" r="3845" b="3941">pro-</wd>
</ln>
</para>
<para l="1594" t="3989" r="2054" b="4128" alignment="left" li="72" spaceAfter="268" lsp="exactly" lspExact="217" language="en">
<ln l="1594" t="3989" r="2054" b="4128" baseLine="4118" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1594" t="4042" r="2054" b="4128">nouns</wd>
</ln>
</para>
</cell>
<cell gridColFrom="1" gridColTill="1" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="top">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="4109" t="3514" r="8069" b="3667" alignment="centered" lsp="exactly" lspExact="227" language="en">
<ln l="4109" t="3514" r="8069" b="3667" baseLine="3653">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="17"><wd l="4109" t="3518" r="4445" b="3662">The</wd>
<space/>
</run>
<wd l="4618" t="3514" r="5966" b="3667"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="17">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="17">ORG</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="17">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="17">Oxford</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="17"><space/>
<wd l="6139" t="3514" r="6710" b="3662">Centre</wd>
<space/>
<wd l="6878" t="3514" r="7109" b="3662">for</wd>
<space/>
<wd l="7272" t="3518" r="8069" b="3662">Maritime</wd>
</run>
</ln>
</para>
<para l="4109" t="3739" r="8069" b="4426" alignment="left" li="72" spaceAfter="6" lsp="exactly" lspExact="239" language="en">
<tabs position="4109"/>
<tabs alignment="left" position="4426" leaderChar=" "/>
<tabs alignment="right" position="4104" leaderChar=" "/>
<ln l="4109" t="3739" r="8069" b="3946" baseLine="3893" forcedEOF="true">
<wd l="4109" t="3739" r="6014" b="3946"><run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Archaeology</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;\</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">ORG</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
</wd>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><tab position="6014"/>
</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6264" t="3739" r="6499" b="3946">[...]</wd>
<tab position="6499"/>
</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="7061" t="3754" r="7541" b="3898">which</wd>
<tab position="7541"/>
</run>
<wd l="7762" t="3754" r="8069" b="3898" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">will</wd>
</ln>
<ln l="4118" t="3979" r="8069" b="4186" baseLine="4133" forcedEOF="true">
<wd l="4118" t="3979" r="5789" b="4186"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">V</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">conduct</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;\</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">V</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
</wd>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5880" t="4042" r="5976" b="4138">a</wd>
<space/>
<wd l="6048" t="3989" r="6787" b="4138">scientific</wd>
<space/>
<wd l="6864" t="3998" r="7834" b="4176">symposium</wd>
<space/>
<wd l="7910" t="3998" r="8069" b="4133">in</wd>
<space/>
</run>
</ln>
<ln l="4118" t="4219" r="6235" b="4426" baseLine="4368" forcedEOF="true">
<wd l="4118" t="4219" r="6235" b="4426"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">LOC</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Berlin</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;\</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">LOC</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>
</run>
</ln>
</para>
</cell>
<cell gridColFrom="2" gridColTill="2" gridRowFrom="3" gridRowTill="3" alignment="left" verticalAlignment="middle">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="9245" t="3754" r="9326" b="4018" alignment="centered" spaceBefore="343" spaceAfter="368" lsp="exactly" lspExact="240" language="en">
<ln l="9245" t="3754" r="9326" b="4018" baseLine="4013" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="9245" t="3883" r="9326" b="4018">2</wd>
</ln>
</para>
</cell>
<cell gridColFrom="0" gridColTill="0" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="top">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="1594" t="4483" r="3850" b="5006" alignment="left" li="108" spaceBefore="129" spaceAfter="157" lsp="exactly" lspExact="217" language="en">
<ln l="1594" t="4483" r="3850" b="4752" baseLine="4747" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1594" t="4622" r="2573" b="4752">combination</wd>
<space/>
<wd l="2626" t="4618" r="2779" b="4752">of</wd>
<space/>
<wd l="2818" t="4622" r="3355" b="4752">several</wd>
<space/>
<wd l="3408" t="4618" r="3562" b="4752">of</wd>
<space/>
<wd l="3600" t="4622" r="3850" b="4752">the</wd>
<space/>
</ln>
<ln l="1594" t="4728" r="3581" b="5006" baseLine="4963" underlined="none" subsuperscript="none" fontSize="900" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1594" t="4843" r="2165" b="5006">options</wd>
<space/>
<wd l="2237" t="4843" r="3062" b="4973">mentioned</wd>
<space/>
<wd l="3130" t="4843" r="3581" b="4973">above</wd>
</ln>
</para>
</cell>
<cell gridColFrom="1" gridColTill="1" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="top">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="4118" t="4464" r="8102" b="5150" alignment="justified" li="144" ri="108" spaceAfter="15" lsp="exactly" lspExact="235" language="en">
<ln l="4118" t="4464" r="8074" b="4670" baseLine="4618">
<wd l="4118" t="4464" r="6178" b="4670"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">LOC</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Berlin</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;\</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">LOC</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&gt;</run>
</wd>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6250" t="4478" r="6528" b="4622">has</wd>
<space/>
</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="6600" t="4478" r="7858" b="4661">&lt;V&gt;developed</wd>
<space/>
<wd l="7915" t="4493" r="8074" b="4622">to</wd>
<space/>
</run>
</ln>
<ln l="4123" t="4704" r="8102" b="4910" baseLine="4858">
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="4123" t="4704" r="5242" b="4910">become&lt;\V&gt;</wd>
<space/>
</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5405" t="4718" r="5683" b="4862">the</wd>
<space/>
</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5851" t="4723" r="7061" b="4862">entertainment</wd>
<space/>
<wd l="7214" t="4718" r="7771" b="4901">capital</wd>
<space/>
<wd l="7925" t="4714" r="8102" b="4901">of</wd>
<space/>
</run>
</ln>
<ln l="4118" t="4944" r="6504" b="5150" baseLine="5093">
<wd l="4118" t="4944" r="6504" b="5150"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">&lt;LOC&gt;Germany&lt;\LOC&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>
</run>
</ln>
</para>
</cell>
<cell gridColFrom="2" gridColTill="2" gridRowFrom="4" gridRowTill="4" alignment="left" verticalAlignment="middle">
<leftBorder type="single" width="10"/>
<topBorder type="single" width="10"/>
<rightBorder type="single" width="10"/>
<bottomBorder type="single" width="10"/>
<para l="9245" t="4714" r="9336" b="4867" alignment="centered" spaceBefore="223" spaceAfter="257" lsp="exactly" lspExact="240" language="en">
<ln l="9245" t="4714" r="9336" b="4867" baseLine="4858" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="9245" t="4723" r="9336" b="4867">7</wd>
</ln>
</para>
</cell>
</table>
<para l="1046" t="5390" r="10795" b="6058" alignment="justified" spaceAfter="372" lsp="exactly" lspExact="238" language="en">
<ln l="1046" t="5390" r="10790" b="5578" baseLine="5534" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="5395" r="1603" b="5578">Figure</wd>
<space/>
<wd l="1666" t="5400" r="1800" b="5539">6:</wd>
<space/>
<wd l="1906" t="5395" r="2381" b="5539">Table</wd>
<space/>
<wd l="2443" t="5395" r="3394" b="5578">illustrating</wd>
<space/>
<wd l="3451" t="5390" r="4157" b="5539">different</wd>
<space/>
<wd l="4229" t="5400" r="4848" b="5578">options</wd>
<space/>
<wd l="4915" t="5395" r="5746" b="5578">according</wd>
<space/>
<wd l="5798" t="5410" r="5971" b="5539">to</wd>
<space/>
<wd l="6034" t="5395" r="6538" b="5539">which</wd>
<space/>
<wd l="6595" t="5395" r="6869" b="5539">the</wd>
<space/>
<wd l="6931" t="5390" r="7742" b="5539">definition</wd>
<space/>
<wd l="7805" t="5390" r="7973" b="5539">of</wd>
<space/>
<wd l="8026" t="5395" r="9029" b="5578">”potentially</wd>
<space/>
<wd l="9091" t="5400" r="9998" b="5578">interesting</wd>
<space/>
<wd l="10061" t="5395" r="10790" b="5539">relation”</wd>
<space/>
</ln>
<ln l="1046" t="5630" r="10795" b="5818" baseLine="5770" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="5635" r="1502" b="5779">could</wd>
<space/>
<wd l="1574" t="5635" r="1771" b="5779">be</wd>
<space/>
<wd l="1838" t="5635" r="2606" b="5779">loosened.</wd>
<space/>
<wd l="2717" t="5635" r="3000" b="5779">For</wd>
<space/>
<wd l="3067" t="5635" r="3442" b="5779">each</wd>
<space/>
<wd l="3509" t="5640" r="4099" b="5818">option,</wd>
<space/>
<wd l="4176" t="5683" r="4382" b="5779">an</wd>
<space/>
<wd l="4445" t="5635" r="5155" b="5818">example</wd>
<space/>
<wd l="5222" t="5650" r="5938" b="5779">sentence</wd>
<space/>
<wd l="6005" t="5630" r="6403" b="5779">from</wd>
<space/>
<wd l="6466" t="5635" r="6739" b="5779">the</wd>
<space/>
<wd l="6802" t="5650" r="7114" b="5779">test</wd>
<space/>
<wd l="7190" t="5683" r="7742" b="5818">corpus</wd>
<space/>
<wd l="7814" t="5640" r="7934" b="5779">is</wd>
<space/>
<wd l="8006" t="5640" r="8501" b="5818">given,</wd>
<space/>
<wd l="8573" t="5635" r="9293" b="5818">together</wd>
<space/>
<wd l="9350" t="5635" r="9739" b="5779">with</wd>
<space/>
<wd l="9802" t="5635" r="10075" b="5779">the</wd>
<space/>
<wd l="10142" t="5635" r="10795" b="5779">number</wd>
<space/>
</ln>
<ln l="1046" t="5870" r="7094" b="6058" baseLine="6010" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="5870" r="1214" b="6019">of</wd>
<space/>
<wd l="1277" t="5875" r="2006" b="6019">relations</wd>
<space/>
<wd l="2078" t="5875" r="2434" b="6019">that</wd>
<space/>
<wd l="2515" t="5875" r="2971" b="6019">could</wd>
<space/>
<wd l="3043" t="5875" r="3245" b="6019">be</wd>
<space/>
<wd l="3317" t="5875" r="4118" b="6019">extracted</wd>
<space/>
<wd l="4195" t="5875" r="5227" b="6058">additionally</wd>
<space/>
<wd l="5294" t="5870" r="5693" b="6019">from</wd>
<space/>
<wd l="5760" t="5875" r="6034" b="6019">the</wd>
<space/>
<wd l="6106" t="5890" r="6418" b="6019">test</wd>
<space/>
<wd l="6499" t="5923" r="7094" b="6058">corpus.</wd>
</ln>
</para>
</column>
</section>
<section l="1039" t="6447" r="10817" b="15843">
<column l="1039" t="6447" r="5763" b="15843">
<para l="1046" t="6494" r="5755" b="8136" alignment="justified" spaceBefore="24" lsp="exactly" lspExact="239" language="en">
<ln l="1046" t="6494" r="5746" b="6701" baseLine="6648">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1046" t="6557" r="1387" b="6691">e.g.,</wd>
<space/>
<wd l="1531" t="6514" r="1694" b="6648">in</wd>
<space/>
<wd l="1814" t="6557" r="1910" b="6653">a</wd>
<space/>
<wd l="2035" t="6523" r="2750" b="6653">sentence</wd>
<space/>
<wd l="2875" t="6509" r="3168" b="6653">like</wd>
<space/>
</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3322" t="6509" r="3629" b="6653">The</wd>
<space/>
<wd l="3763" t="6509" r="4594" b="6653">exhibition</wd>
<space/>
<wd l="4718" t="6494" r="5016" b="6701">[...]</wd>
<space/>
<wd l="5256" t="6509" r="5746" b="6653">shows</wd>
<space/>
</run>
</ln>
<ln l="1056" t="6734" r="5746" b="6941" baseLine="6888" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1056" t="6744" r="2506" b="6898">&lt;PER&gt;Clemens</wd>
<space/>
<wd l="2640" t="6734" r="4301" b="6941">Brentano&lt;\PER&gt;,</wd>
<space/>
<wd l="4474" t="6744" r="5746" b="6898">&lt;PER&gt;Achim</wd>
<space/>
</ln>
<ln l="1056" t="6974" r="5750" b="7181" baseLine="7123" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1056" t="7037" r="1358" b="7133">von</wd>
<space/>
<wd l="1584" t="6974" r="2947" b="7181">Arnim&lt;\PER&gt;</wd>
<space/>
<wd l="3211" t="6989" r="3518" b="7133">and</wd>
<space/>
<wd l="3749" t="6989" r="5218" b="7138">&lt;PER&gt;Heinrich</wd>
<space/>
<wd l="5448" t="7037" r="5750" b="7133">von</wd>
<space/>
</ln>
<ln l="1051" t="7214" r="5736" b="7421" baseLine="7363">
<wd l="1051" t="7214" r="2414" b="7421"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Kleist&lt;\PER&gt;</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>
<wd l="2554" t="7229" r="2866" b="7373">and</wd>
<space/>
<wd l="2986" t="7229" r="3682" b="7373">between</wd>
<space/>
<wd l="3797" t="7229" r="4147" b="7373">NEs</wd>
<space/>
<wd l="4267" t="7234" r="5078" b="7411">occurring</wd>
<space/>
<wd l="5194" t="7234" r="5352" b="7368">in</wd>
<space/>
<wd l="5462" t="7229" r="5736" b="7373">the</wd>
<space/>
</run>
</ln>
<ln l="1046" t="7454" r="5755" b="7661" baseLine="7603">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1046" t="7517" r="1474" b="7613">same</wd>
<space/>
<wd l="1574" t="7454" r="2405" b="7661">(complex)</wd>
<space/>
<wd l="2510" t="7483" r="3374" b="7651">argument,</wd>
<space/>
<wd l="3475" t="7517" r="3811" b="7651">e.g.,</wd>
<space/>
</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3922" t="7469" r="5194" b="7618">&lt;PER&gt;Hanns</wd>
<space/>
<wd l="5280" t="7469" r="5755" b="7613">Peter</wd>
<space/>
</run>
</ln>
<ln l="1051" t="7690" r="5746" b="7896" baseLine="7843" italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1051" t="7690" r="2496" b="7896">Nerger&lt;\PER&gt;,</wd>
<space/>
<wd l="2650" t="7699" r="3058" b="7848">CEO</wd>
<space/>
<wd l="3178" t="7699" r="3350" b="7886">of</wd>
<space/>
<wd l="3442" t="7699" r="4728" b="7853">&lt;ORG&gt;Berlin</wd>
<space/>
<wd l="4862" t="7704" r="5746" b="7848">Tourismus</wd>
<space/>
</ln>
<ln l="1051" t="7930" r="5626" b="8136" baseLine="8083">
<run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1051" t="7944" r="1930" b="8126">Marketing</wd>
<space/>
<wd l="2021" t="7939" r="2573" b="8088">GmbH</wd>
<space/>
<wd l="2650" t="7930" r="3240" b="8136">(BTM)</wd>
<space/>
<wd l="3326" t="7930" r="4219" b="8136">&lt;\ORG&gt;,</wd>
<space/>
<wd l="4315" t="7992" r="4738" b="8088">sums</wd>
<space/>
<wd l="4819" t="7949" r="4944" b="8088">it</wd>
<space/>
<wd l="5021" t="7992" r="5218" b="8126">up</wd>
<space/>
</run>
<wd l="5299" t="7930" r="5626" b="8136"><run italic="true" underlined="none" subsuperscript="none" fontSize="1100" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">[...]</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>
</run>
</ln>
</para>
<para l="2381" t="8376" r="4411" b="8549" alignment="centered" spaceBefore="185" lsp="exactly" lspExact="282" language="en">
<ln l="2381" t="8376" r="4411" b="8549" baseLine="8544" underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="23">
<wd l="2381" t="8386" r="2563" b="8549">5.</wd>
<space/>
<wd l="2851" t="8376" r="3749" b="8549">Related</wd>
<space/>
<wd l="3845" t="8376" r="4411" b="8549">work</wd>
</ln>
</para>
<para l="1042" t="8707" r="5736" b="9619" alignment="justified" spaceBefore="49" lsp="exactly" lspExact="237" language="en">
<ln l="1051" t="8707" r="5731" b="8894" baseLine="8846" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1051" t="8707" r="1387" b="8856">Our</wd>
<space/>
<wd l="1507" t="8712" r="1930" b="8856">work</wd>
<space/>
<wd l="2054" t="8717" r="2174" b="8856">is</wd>
<space/>
<wd l="2304" t="8712" r="2894" b="8856">related</wd>
<space/>
<wd l="3019" t="8726" r="3192" b="8856">to</wd>
<space/>
<wd l="3322" t="8717" r="4037" b="8894">previous</wd>
<space/>
<wd l="4162" t="8712" r="4584" b="8856">work</wd>
<space/>
<wd l="4709" t="8760" r="4910" b="8856">on</wd>
<space/>
<wd l="5035" t="8712" r="5731" b="8856">domain-</wd>
</ln>
<ln l="1046" t="8952" r="5731" b="9134" baseLine="9086" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="8952" r="2093" b="9134">independent</wd>
<space/>
<wd l="2184" t="8952" r="3307" b="9134">unsupervised</wd>
<space/>
<wd l="3394" t="8952" r="4051" b="9096">relation</wd>
<space/>
<wd l="4133" t="8957" r="5050" b="9130">extraction,</wd>
<space/>
<wd l="5146" t="8957" r="5309" b="9091">in</wd>
<space/>
<wd l="5390" t="9000" r="5731" b="9134">par-</wd>
</ln>
<ln l="1042" t="9173" r="5736" b="9379" baseLine="9326" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1042" t="9187" r="1608" b="9331">ticular</wd>
<space/>
<wd l="1670" t="9182" r="2218" b="9331">Sekine</wd>
<space/>
<wd l="2290" t="9173" r="2866" b="9379">(2006),</wd>
<space/>
<wd l="2942" t="9182" r="3782" b="9370">Shinyama</wd>
<space/>
<wd l="3835" t="9187" r="4147" b="9331">and</wd>
<space/>
<wd l="4214" t="9182" r="4762" b="9331">Sekine</wd>
<space/>
<wd l="4834" t="9173" r="5347" b="9379">(2006)</wd>
<space/>
<wd l="5424" t="9187" r="5736" b="9331">and</wd>
<space/>
</ln>
<ln l="1046" t="9413" r="2760" b="9619" baseLine="9566" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="9427" r="1589" b="9571">Banko</wd>
<space/>
<wd l="1666" t="9442" r="1814" b="9571">et</wd>
<space/>
<wd l="1896" t="9427" r="2083" b="9571">al.</wd>
<space/>
<wd l="2189" t="9413" r="2760" b="9619">(2007).</wd>
</ln>
</para>
<para l="1042" t="9653" r="5741" b="14352" alignment="justified" lsp="exactly" lspExact="239" language="en">
<ln l="1051" t="9653" r="5731" b="9859" baseLine="9802" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1051" t="9662" r="1598" b="9811">Sekine</wd>
<space/>
<wd l="1699" t="9653" r="2213" b="9859">(2006)</wd>
<space/>
<wd l="2318" t="9667" r="3206" b="9811">introduces</wd>
<space/>
<wd l="3302" t="9662" r="4306" b="9811">On-demand</wd>
<space/>
<wd l="4392" t="9662" r="5400" b="9811">information</wd>
<space/>
<wd l="5486" t="9715" r="5731" b="9811">ex-</wd>
</ln>
<ln l="1042" t="9902" r="5741" b="10090" baseLine="10042" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="9912" r="1771" b="10085">traction,</wd>
<space/>
<wd l="1954" t="9907" r="2458" b="10051">which</wd>
<space/>
<wd l="2611" t="9912" r="3000" b="10051">aims</wd>
<space/>
<wd l="3158" t="9922" r="3322" b="10051">at</wd>
<space/>
<wd l="3485" t="9907" r="4670" b="10090">automatically</wd>
<space/>
<wd l="4824" t="9902" r="5741" b="10090">identifying</wd>
<space/>
</ln>
<ln l="1046" t="10147" r="5736" b="10330" baseLine="10282" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="10147" r="1594" b="10291">salient</wd>
<space/>
<wd l="1656" t="10162" r="2366" b="10330">patterns</wd>
<space/>
<wd l="2424" t="10147" r="2736" b="10291">and</wd>
<space/>
<wd l="2794" t="10152" r="3667" b="10330">extracting</wd>
<space/>
<wd l="3720" t="10147" r="4450" b="10291">relations</wd>
<space/>
<wd l="4507" t="10147" r="4987" b="10291">based</wd>
<space/>
<wd l="5045" t="10195" r="5251" b="10291">on</wd>
<space/>
<wd l="5294" t="10147" r="5736" b="10291">these</wd>
<space/>
</ln>
<ln l="1046" t="10378" r="5741" b="10565" baseLine="10522" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="10397" r="1800" b="10565">patterns.</wd>
<space/>
<wd l="2064" t="10382" r="2299" b="10526">He</wd>
<space/>
<wd l="2424" t="10387" r="3144" b="10526">retrieves</wd>
<space/>
<wd l="3274" t="10382" r="3941" b="10526">relevant</wd>
<space/>
<wd l="4075" t="10382" r="4992" b="10526">documents</wd>
<space/>
<wd l="5122" t="10378" r="5520" b="10526">from</wd>
<space/>
<wd l="5645" t="10430" r="5741" b="10526">a</wd>
<space/>
</ln>
<ln l="1046" t="10618" r="5731" b="10805" baseLine="10762" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="10670" r="1958" b="10805">newspaper</wd>
<space/>
<wd l="2021" t="10670" r="2573" b="10805">corpus</wd>
<space/>
<wd l="2640" t="10622" r="3120" b="10766">based</wd>
<space/>
<wd l="3187" t="10670" r="3394" b="10766">on</wd>
<space/>
<wd l="3456" t="10670" r="3552" b="10766">a</wd>
<space/>
<wd l="3610" t="10670" r="4094" b="10805">query</wd>
<space/>
<wd l="4157" t="10622" r="4464" b="10766">and</wd>
<space/>
<wd l="4531" t="10622" r="5117" b="10805">applies</wd>
<space/>
<wd l="5189" t="10670" r="5285" b="10766">a</wd>
<space/>
<wd l="5342" t="10618" r="5731" b="10766">POS</wd>
<space/>
</ln>
<ln l="1042" t="10862" r="5741" b="11045" baseLine="10997" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="10877" r="1627" b="11045">tagger,</wd>
<space/>
<wd l="1747" t="10910" r="1843" b="11006">a</wd>
<space/>
<wd l="1939" t="10862" r="2952" b="11045">dependency</wd>
<space/>
<wd l="3048" t="10862" r="3768" b="11045">analyzer</wd>
<space/>
<wd l="3869" t="10862" r="4181" b="11006">and</wd>
<space/>
<wd l="4282" t="10910" r="4488" b="11006">an</wd>
<space/>
<wd l="4589" t="10862" r="5357" b="11006">extended</wd>
<space/>
<wd l="5458" t="10862" r="5741" b="11002">NE</wd>
<space/>
</ln>
<ln l="1042" t="11098" r="5731" b="11285" baseLine="11237" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="11117" r="1622" b="11285">tagger.</wd>
<space/>
<wd l="1733" t="11102" r="2222" b="11285">Using</wd>
<space/>
<wd l="2280" t="11102" r="2554" b="11246">the</wd>
<space/>
<wd l="2621" t="11098" r="3629" b="11246">information</wd>
<space/>
<wd l="3691" t="11098" r="4090" b="11246">from</wd>
<space/>
<wd l="4152" t="11102" r="4426" b="11246">the</wd>
<space/>
<wd l="4483" t="11117" r="5150" b="11285">taggers,</wd>
<space/>
<wd l="5227" t="11102" r="5419" b="11246">he</wd>
<space/>
<wd l="5486" t="11150" r="5731" b="11246">ex-</wd>
</ln>
<ln l="1042" t="11342" r="5736" b="11525" baseLine="11477" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="11357" r="1536" b="11486">tracts</wd>
<space/>
<wd l="1622" t="11357" r="2333" b="11525">patterns</wd>
<space/>
<wd l="2424" t="11342" r="2736" b="11486">and</wd>
<space/>
<wd l="2822" t="11342" r="3408" b="11525">applies</wd>
<space/>
<wd l="3499" t="11342" r="4445" b="11525">paraphrase</wd>
<space/>
<wd l="4526" t="11347" r="5486" b="11525">recognition</wd>
<space/>
<wd l="5563" t="11357" r="5736" b="11486">to</wd>
<space/>
</ln>
<ln l="1046" t="11573" r="5741" b="11760" baseLine="11717" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="11592" r="1560" b="11722">create</wd>
<space/>
<wd l="1632" t="11592" r="1944" b="11722">sets</wd>
<space/>
<wd l="2021" t="11573" r="2189" b="11722">of</wd>
<space/>
<wd l="2246" t="11578" r="3317" b="11760">semantically</wd>
<space/>
<wd l="3384" t="11578" r="3965" b="11722">similar</wd>
<space/>
<wd l="4037" t="11592" r="4790" b="11760">patterns.</wd>
<space/>
<wd l="4906" t="11573" r="5741" b="11760">Shinyama</wd>
<space/>
</ln>
<ln l="1046" t="11803" r="5741" b="12010" baseLine="11957" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="11818" r="1358" b="11962">and</wd>
<space/>
<wd l="1454" t="11813" r="2002" b="11962">Sekine</wd>
<space/>
<wd l="2102" t="11803" r="2616" b="12010">(2006)</wd>
<space/>
<wd l="2722" t="11818" r="3202" b="12000">apply</wd>
<space/>
<wd l="3283" t="11818" r="3754" b="11995">NER,</wd>
<space/>
<wd l="3854" t="11813" r="4805" b="11962">coreference</wd>
<space/>
<wd l="4891" t="11818" r="5741" b="11962">resolution</wd>
<space/>
</ln>
<ln l="1046" t="12053" r="5731" b="12240" baseLine="12192" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="12058" r="1358" b="12202">and</wd>
<space/>
<wd l="1454" t="12062" r="2083" b="12240">parsing</wd>
<space/>
<wd l="2165" t="12072" r="2342" b="12202">to</wd>
<space/>
<wd l="2434" t="12106" r="2530" b="12202">a</wd>
<space/>
<wd l="2621" t="12106" r="3173" b="12240">corpus</wd>
<space/>
<wd l="3269" t="12053" r="3437" b="12202">of</wd>
<space/>
<wd l="3518" t="12106" r="4426" b="12240">newspaper</wd>
<space/>
<wd l="4517" t="12058" r="5126" b="12202">articles</wd>
<space/>
<wd l="5218" t="12072" r="5390" b="12202">to</wd>
<space/>
<wd l="5486" t="12106" r="5731" b="12202">ex-</wd>
</ln>
<ln l="1042" t="12298" r="5736" b="12480" baseLine="12432" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="12312" r="1454" b="12442">tract</wd>
<space/>
<wd l="1531" t="12298" r="2347" b="12480">two-place</wd>
<space/>
<wd l="2424" t="12298" r="3154" b="12442">relations</wd>
<space/>
<wd l="3235" t="12298" r="3931" b="12442">between</wd>
<space/>
<wd l="4008" t="12298" r="4402" b="12442">NEs.</wd>
<space/>
<wd l="4522" t="12298" r="4858" b="12442">The</wd>
<space/>
<wd l="4930" t="12298" r="5736" b="12442">extracted</wd>
<space/>
</ln>
<ln l="1046" t="12533" r="5736" b="12720" baseLine="12672" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="12538" r="1781" b="12682">relations</wd>
<space/>
<wd l="1867" t="12586" r="2126" b="12682">are</wd>
<space/>
<wd l="2213" t="12538" r="2909" b="12720">grouped</wd>
<space/>
<wd l="2995" t="12542" r="3326" b="12682">into</wd>
<space/>
<wd l="3413" t="12552" r="4046" b="12720">pattern</wd>
<space/>
<wd l="4128" t="12538" r="4632" b="12682">tables</wd>
<space/>
<wd l="4718" t="12533" r="4886" b="12682">of</wd>
<space/>
<wd l="4958" t="12538" r="5237" b="12677">NE</wd>
<space/>
<wd l="5323" t="12542" r="5736" b="12720">pairs</wd>
<space/>
</ln>
<ln l="1046" t="12778" r="5741" b="12960" baseLine="12912" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="12782" r="1939" b="12960">expressing</wd>
<space/>
<wd l="1992" t="12778" r="2266" b="12922">the</wd>
<space/>
<wd l="2328" t="12826" r="2755" b="12922">same</wd>
<space/>
<wd l="2818" t="12778" r="3523" b="12955">relation,</wd>
<space/>
<wd l="3595" t="12826" r="3936" b="12960">e.g.,</wd>
<space/>
<wd l="4008" t="12778" r="4891" b="12922">hurricanes</wd>
<space/>
<wd l="4958" t="12778" r="5270" b="12922">and</wd>
<space/>
<wd l="5333" t="12778" r="5741" b="12922">their</wd>
<space/>
</ln>
<ln l="1046" t="13008" r="5741" b="13195" baseLine="13152" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="13013" r="1853" b="13157">locations.</wd>
<space/>
<wd l="1997" t="13008" r="2885" b="13195">Clustering</wd>
<space/>
<wd l="2966" t="13018" r="3086" b="13157">is</wd>
<space/>
<wd l="3178" t="13008" r="4051" b="13195">performed</wd>
<space/>
<wd l="4138" t="13018" r="4296" b="13152">in</wd>
<space/>
<wd l="4373" t="13027" r="4680" b="13157">two</wd>
<space/>
<wd l="4766" t="13027" r="5232" b="13195">steps:</wd>
<space/>
<wd l="5357" t="13013" r="5741" b="13195">they</wd>
<space/>
</ln>
<ln l="1046" t="13248" r="5736" b="13397" baseLine="13392" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="13248" r="1378" b="13397">first</wd>
<space/>
<wd l="1459" t="13253" r="2030" b="13397">cluster</wd>
<space/>
<wd l="2102" t="13253" r="2304" b="13397">all</wd>
<space/>
<wd l="2376" t="13253" r="3293" b="13397">documents</wd>
<space/>
<wd l="3374" t="13253" r="3682" b="13397">and</wd>
<space/>
<wd l="3758" t="13301" r="4027" b="13397">use</wd>
<space/>
<wd l="4099" t="13253" r="4411" b="13397">this</wd>
<space/>
<wd l="4488" t="13248" r="5496" b="13397">information</wd>
<space/>
<wd l="5563" t="13267" r="5736" b="13397">to</wd>
<space/>
</ln>
<ln l="1046" t="13493" r="5741" b="13675" baseLine="13627" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="13493" r="1618" b="13637">cluster</wd>
<space/>
<wd l="1704" t="13493" r="1978" b="13637">the</wd>
<space/>
<wd l="2069" t="13493" r="2846" b="13637">relations.</wd>
<space/>
<wd l="3010" t="13493" r="3782" b="13670">However,</wd>
<space/>
<wd l="3888" t="13493" r="4253" b="13675">only</wd>
<space/>
<wd l="4344" t="13493" r="5074" b="13637">relations</wd>
<space/>
<wd l="5170" t="13541" r="5741" b="13675">among</wd>
<space/>
</ln>
<ln l="1042" t="13728" r="5736" b="13915" baseLine="13867" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1042" t="13733" r="1315" b="13877">the</wd>
<space/>
<wd l="1402" t="13728" r="1690" b="13877">five</wd>
<space/>
<wd l="1771" t="13747" r="2179" b="13877">most</wd>
<space/>
<wd l="2270" t="13733" r="3624" b="13915">highly-weighted</wd>
<space/>
<wd l="3710" t="13738" r="4325" b="13877">entities</wd>
<space/>
<wd l="4411" t="13738" r="4574" b="13872">in</wd>
<space/>
<wd l="4651" t="13781" r="4747" b="13877">a</wd>
<space/>
<wd l="4829" t="13733" r="5400" b="13877">cluster</wd>
<space/>
<wd l="5477" t="13781" r="5736" b="13877">are</wd>
<space/>
</ln>
<ln l="1046" t="13968" r="5731" b="14155" baseLine="14107" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="13973" r="1853" b="14117">extracted</wd>
<space/>
<wd l="1925" t="13973" r="2237" b="14117">and</wd>
<space/>
<wd l="2309" t="13973" r="2674" b="14155">only</wd>
<space/>
<wd l="2741" t="13973" r="3014" b="14117">the</wd>
<space/>
<wd l="3082" t="13968" r="3413" b="14117">first</wd>
<space/>
<wd l="3485" t="13987" r="3763" b="14117">ten</wd>
<space/>
<wd l="3830" t="13987" r="4622" b="14117">sentences</wd>
<space/>
<wd l="4699" t="13968" r="4867" b="14117">of</wd>
<space/>
<wd l="4925" t="13973" r="5299" b="14117">each</wd>
<space/>
<wd l="5366" t="13978" r="5731" b="14117">arti-</wd>
</ln>
<ln l="1046" t="14208" r="3326" b="14352" baseLine="14347" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="5">
<wd l="1046" t="14208" r="1272" b="14352">cle</wd>
<space/>
<wd l="1349" t="14256" r="1603" b="14352">are</wd>
<space/>
<wd l="1675" t="14208" r="2150" b="14352">taken</wd>
<space/>
<wd l="2222" t="14213" r="2549" b="14352">into</wd>
<space/>
<wd l="2626" t="14222" r="3326" b="14352">account.</wd>
</ln>
</para>
<para l="1042" t="14434" r="5741" b="15835" alignment="justified" spaceAfter="4" lsp="exactly" lspExact="239" language="en">
<ln l="1046" t="14434" r="5741" b="14640" baseLine="14587" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1046" t="14448" r="1589" b="14592">Banko</wd>
<space/>
<wd l="1670" t="14462" r="1819" b="14592">et</wd>
<space/>
<wd l="1906" t="14448" r="2093" b="14592">al.</wd>
<space/>
<wd l="2198" t="14434" r="2712" b="14640">(2007)</wd>
<space/>
<wd l="2808" t="14496" r="3077" b="14592">use</wd>
<space/>
<wd l="3154" t="14496" r="3250" b="14592">a</wd>
<space/>
<wd l="3326" t="14448" r="3782" b="14592">much</wd>
<space/>
<wd l="3859" t="14448" r="4354" b="14630">larger</wd>
<space/>
<wd l="4430" t="14496" r="5030" b="14630">corpus,</wd>
<space/>
<wd l="5122" t="14448" r="5741" b="14630">namely</wd>
<space/>
</ln>
<ln l="1046" t="14688" r="5741" b="14870" baseLine="14822" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1046" t="14693" r="1133" b="14832">9</wd>
<space/>
<wd l="1234" t="14688" r="1824" b="14832">million</wd>
<space/>
<wd l="1910" t="14688" r="2242" b="14832">web</wd>
<space/>
<wd l="2338" t="14736" r="2851" b="14870">pages,</wd>
<space/>
<wd l="2952" t="14702" r="3130" b="14832">to</wd>
<space/>
<wd l="3221" t="14702" r="3821" b="14832">extract</wd>
<space/>
<wd l="3922" t="14688" r="4123" b="14832">all</wd>
<space/>
<wd l="4214" t="14688" r="4944" b="14832">relations</wd>
<space/>
<wd l="5045" t="14688" r="5741" b="14832">between</wd>
<space/>
</ln>
<ln l="1046" t="14923" r="5741" b="15110" baseLine="15062" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1046" t="14976" r="1474" b="15072">noun</wd>
<space/>
<wd l="1550" t="14928" r="2232" b="15110">phrases.</wd>
<space/>
<wd l="2362" t="14928" r="2707" b="15072">Due</wd>
<space/>
<wd l="2779" t="14942" r="2957" b="15072">to</wd>
<space/>
<wd l="3034" t="14928" r="3307" b="15072">the</wd>
<space/>
<wd l="3384" t="14928" r="3802" b="15110">large</wd>
<space/>
<wd l="3878" t="14942" r="4522" b="15072">amount</wd>
<space/>
<wd l="4613" t="14923" r="4781" b="15072">of</wd>
<space/>
<wd l="4848" t="14928" r="5270" b="15106">data,</wd>
<space/>
<wd l="5357" t="14928" r="5741" b="15110">they</wd>
<space/>
</ln>
<ln l="1046" t="15163" r="5731" b="15350" baseLine="15302" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1046" t="15168" r="1526" b="15350">apply</wd>
<space/>
<wd l="1594" t="15163" r="1978" b="15312">POS</wd>
<space/>
<wd l="2054" t="15173" r="2693" b="15350">tagging</wd>
<space/>
<wd l="2760" t="15168" r="3149" b="15350">only.</wd>
<space/>
<wd l="3259" t="15168" r="3730" b="15312">Their</wd>
<space/>
<wd l="3797" t="15182" r="4368" b="15350">output</wd>
<space/>
<wd l="4450" t="15173" r="5102" b="15312">consists</wd>
<space/>
<wd l="5179" t="15163" r="5347" b="15312">of</wd>
<space/>
<wd l="5400" t="15168" r="5731" b="15307">mil-</wd>
</ln>
<ln l="1046" t="15398" r="5731" b="15586" baseLine="15542" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1046" t="15403" r="1435" b="15547">lions</wd>
<space/>
<wd l="1526" t="15398" r="1694" b="15547">of</wd>
<space/>
<wd l="1766" t="15403" r="2549" b="15581">relations,</wd>
<space/>
<wd l="2650" t="15418" r="3058" b="15547">most</wd>
<space/>
<wd l="3154" t="15398" r="3317" b="15547">of</wd>
<space/>
<wd l="3389" t="15403" r="3826" b="15547">them</wd>
<space/>
<wd l="3917" t="15403" r="4382" b="15586">being</wd>
<space/>
<wd l="4464" t="15403" r="5160" b="15547">abstract</wd>
<space/>
<wd l="5256" t="15451" r="5731" b="15547">asser-</wd>
</ln>
<ln l="1042" t="15629" r="5741" b="15835" baseLine="15782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1042" t="15648" r="1459" b="15787">tions</wd>
<space/>
<wd l="1570" t="15643" r="1944" b="15787">such</wd>
<space/>
<wd l="2050" t="15691" r="2218" b="15787">as</wd>
<space/>
<wd l="2342" t="15629" r="3245" b="15835">(executive,</wd>
<space/>
<wd l="3365" t="15643" r="3797" b="15787">hired</wd>
<space/>
<wd l="3907" t="15643" r="4138" b="15826">by,</wd>
<space/>
<wd l="4262" t="15629" r="5088" b="15835">company)</wd>
<space/>
<wd l="5213" t="15643" r="5741" b="15787">rather</wd>
</ln>
</para>
</column>
<column l="6093" t="6447" r="10817" b="15843">
<para l="6096" t="6504" r="7790" b="6653" alignment="justified" spaceBefore="15" lsp="exactly" lspExact="233" language="en">
<ln l="6096" t="6504" r="7790" b="6653" baseLine="6648" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="6096" t="6509" r="6494" b="6653">than</wd>
<space/>
<wd l="6566" t="6523" r="7277" b="6653">concrete</wd>
<space/>
<wd l="7354" t="6504" r="7790" b="6653">facts.</wd>
</ln>
</para>
<para l="6096" t="6744" r="10805" b="10042" alignment="justified" lsp="exactly" lspExact="239" language="en">
<ln l="6106" t="6744" r="10805" b="6931" baseLine="6888" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6106" t="6744" r="6442" b="6893">Our</wd>
<space/>
<wd l="6547" t="6749" r="7334" b="6931">approach</wd>
<space/>
<wd l="7435" t="6797" r="7733" b="6893">can</wd>
<space/>
<wd l="7834" t="6749" r="8035" b="6893">be</wd>
<space/>
<wd l="8141" t="6749" r="8885" b="6931">regarded</wd>
<space/>
<wd l="8995" t="6797" r="9158" b="6893">as</wd>
<space/>
<wd l="9274" t="6797" r="9370" b="6893">a</wd>
<space/>
<wd l="9470" t="6749" r="10536" b="6893">combination</wd>
<space/>
<wd l="10637" t="6744" r="10805" b="6893">of</wd>
<space/>
</ln>
<ln l="6096" t="6974" r="10786" b="7181" baseLine="7123" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6096" t="6989" r="6538" b="7133">these</wd>
<space/>
<wd l="6605" t="6989" r="7598" b="7171">approaches:</wd>
<space/>
<wd l="7704" t="6989" r="8064" b="7133">Like</wd>
<space/>
<wd l="8126" t="6989" r="8669" b="7133">Banko</wd>
<space/>
<wd l="8736" t="7003" r="8890" b="7133">et</wd>
<space/>
<wd l="8962" t="6989" r="9149" b="7133">al.</wd>
<space/>
<wd l="9245" t="6974" r="9821" b="7181">(2007),</wd>
<space/>
<wd l="9893" t="7037" r="10118" b="7133">we</wd>
<space/>
<wd l="10186" t="7003" r="10786" b="7133">extract</wd>
<space/>
</ln>
<ln l="6101" t="7224" r="10786" b="7411" baseLine="7363" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6101" t="7229" r="6835" b="7373">relations</wd>
<space/>
<wd l="6912" t="7224" r="7310" b="7373">from</wd>
<space/>
<wd l="7387" t="7234" r="7834" b="7411">noisy</wd>
<space/>
<wd l="7901" t="7229" r="8232" b="7373">web</wd>
<space/>
<wd l="8314" t="7229" r="9230" b="7373">documents</wd>
<space/>
<wd l="9312" t="7229" r="9835" b="7373">rather</wd>
<space/>
<wd l="9907" t="7229" r="10306" b="7373">than</wd>
<space/>
<wd l="10378" t="7277" r="10786" b="7373">com-</wd>
</ln>
<ln l="6101" t="7469" r="10795" b="7651" baseLine="7603" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6101" t="7469" r="6758" b="7651">parably</wd>
<space/>
<wd l="6840" t="7469" r="7982" b="7651">homogeneous</wd>
<space/>
<wd l="8074" t="7517" r="8486" b="7613">news</wd>
<space/>
<wd l="8578" t="7469" r="9235" b="7613">articles.</wd>
<space/>
<wd l="9389" t="7469" r="10166" b="7646">However,</wd>
<space/>
<wd l="10267" t="7469" r="10795" b="7613">rather</wd>
<space/>
</ln>
<ln l="6096" t="7699" r="10786" b="7886" baseLine="7843" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6096" t="7704" r="6494" b="7848">than</wd>
<space/>
<wd l="6562" t="7709" r="7440" b="7886">extracting</wd>
<space/>
<wd l="7507" t="7704" r="8237" b="7848">relations</wd>
<space/>
<wd l="8309" t="7699" r="8707" b="7848">from</wd>
<space/>
<wd l="8774" t="7704" r="9442" b="7848">millions</wd>
<space/>
<wd l="9514" t="7699" r="9682" b="7848">of</wd>
<space/>
<wd l="9739" t="7752" r="10205" b="7886">pages</wd>
<space/>
<wd l="10272" t="7752" r="10498" b="7848">we</wd>
<space/>
<wd l="10565" t="7752" r="10786" b="7848">re-</wd>
</ln>
<ln l="6101" t="7939" r="10795" b="8126" baseLine="8083" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6101" t="7944" r="6494" b="8088">duce</wd>
<space/>
<wd l="6547" t="7944" r="6821" b="8088">the</wd>
<space/>
<wd l="6883" t="7949" r="7186" b="8088">size</wd>
<space/>
<wd l="7248" t="7939" r="7411" b="8088">of</wd>
<space/>
<wd l="7459" t="7992" r="7742" b="8088">our</wd>
<space/>
<wd l="7800" t="7992" r="8352" b="8126">corpus</wd>
<space/>
<wd l="8419" t="7939" r="9370" b="8088">beforehand</wd>
<space/>
<wd l="9432" t="7949" r="9883" b="8126">using</wd>
<space/>
<wd l="9941" t="7992" r="10037" b="8088">a</wd>
<space/>
<wd l="10094" t="7992" r="10574" b="8126">query</wd>
<space/>
<wd l="10632" t="7949" r="10795" b="8083">in</wd>
<space/>
</ln>
<ln l="6101" t="8184" r="10776" b="8366" baseLine="8318" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6101" t="8184" r="6552" b="8328">order</wd>
<space/>
<wd l="6605" t="8198" r="6778" b="8328">to</wd>
<space/>
<wd l="6835" t="8184" r="7032" b="8328">be</wd>
<space/>
<wd l="7090" t="8184" r="7435" b="8328">able</wd>
<space/>
<wd l="7488" t="8198" r="7666" b="8328">to</wd>
<space/>
<wd l="7723" t="8184" r="8198" b="8366">apply</wd>
<space/>
<wd l="8256" t="8232" r="8678" b="8328">more</wd>
<space/>
<wd l="8736" t="8184" r="9518" b="8366">linguistic</wd>
<space/>
<wd l="9576" t="8189" r="10776" b="8366">preprocessing.</wd>
<space/>
</ln>
<ln l="6101" t="8410" r="10781" b="8616" baseLine="8558" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6101" t="8424" r="6461" b="8568">Like</wd>
<space/>
<wd l="6557" t="8419" r="7104" b="8568">Sekine</wd>
<space/>
<wd l="7205" t="8410" r="7718" b="8616">(2006)</wd>
<space/>
<wd l="7824" t="8424" r="8136" b="8568">and</wd>
<space/>
<wd l="8227" t="8419" r="9067" b="8606">Shinyama</wd>
<space/>
<wd l="9149" t="8424" r="9461" b="8568">and</wd>
<space/>
<wd l="9557" t="8419" r="10104" b="8568">Sekine</wd>
<space/>
<wd l="10205" t="8410" r="10781" b="8616">(2006),</wd>
<space/>
</ln>
<ln l="6096" t="8664" r="10786" b="8846" baseLine="8798" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6096" t="8712" r="6322" b="8808">we</wd>
<space/>
<wd l="6374" t="8678" r="7368" b="8808">concentrate</wd>
<space/>
<wd l="7421" t="8712" r="7627" b="8808">on</wd>
<space/>
<wd l="7680" t="8664" r="8410" b="8808">relations</wd>
<space/>
<wd l="8467" t="8664" r="9250" b="8846">involving</wd>
<space/>
<wd l="9298" t="8664" r="9701" b="8842">NEs,</wd>
<space/>
<wd l="9763" t="8664" r="10037" b="8808">the</wd>
<space/>
<wd l="10090" t="8712" r="10786" b="8846">assump-</wd>
</ln>
<ln l="6096" t="8899" r="10786" b="9082" baseLine="9038" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6096" t="8904" r="6442" b="9043">tion</wd>
<space/>
<wd l="6523" t="8899" r="6989" b="9082">being</wd>
<space/>
<wd l="7066" t="8899" r="7421" b="9043">that</wd>
<space/>
<wd l="7507" t="8899" r="7949" b="9043">these</wd>
<space/>
<wd l="8035" t="8899" r="8765" b="9043">relations</wd>
<space/>
<wd l="8856" t="8947" r="9115" b="9043">are</wd>
<space/>
<wd l="9197" t="8899" r="9470" b="9043">the</wd>
<space/>
<wd l="9557" t="8899" r="10483" b="9082">potentially</wd>
<space/>
<wd l="10565" t="8904" r="10786" b="9038">in-</wd>
</ln>
<ln l="6096" t="9139" r="10786" b="9322" baseLine="9278" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6096" t="9144" r="6850" b="9322">teresting</wd>
<space/>
<wd l="6936" t="9187" r="7344" b="9283">ones.</wd>
<space/>
<wd l="7488" t="9139" r="7824" b="9283">The</wd>
<space/>
<wd l="7910" t="9139" r="8568" b="9283">relation</wd>
<space/>
<wd l="8654" t="9139" r="9490" b="9322">clustering</wd>
<space/>
<wd l="9571" t="9154" r="9917" b="9322">step</wd>
<space/>
<wd l="10003" t="9139" r="10522" b="9283">allows</wd>
<space/>
<wd l="10608" t="9187" r="10786" b="9283">us</wd>
<space/>
</ln>
<ln l="6096" t="9374" r="10790" b="9562" baseLine="9514" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6096" t="9394" r="6269" b="9523">to</wd>
<space/>
<wd l="6350" t="9427" r="6840" b="9562">group</wd>
<space/>
<wd l="6917" t="9379" r="7502" b="9523">similar</wd>
<space/>
<wd l="7579" t="9379" r="8357" b="9557">relations,</wd>
<space/>
<wd l="8443" t="9379" r="8942" b="9523">which</wd>
<space/>
<wd l="9019" t="9427" r="9355" b="9557">can,</wd>
<space/>
<wd l="9446" t="9374" r="9677" b="9523">for</wd>
<space/>
<wd l="9754" t="9379" r="10507" b="9562">example,</wd>
<space/>
<wd l="10594" t="9379" r="10790" b="9523">be</wd>
<space/>
</ln>
<ln l="6101" t="9614" r="10786" b="9802" baseLine="9754" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6101" t="9614" r="6600" b="9763">useful</wd>
<space/>
<wd l="6672" t="9614" r="6902" b="9763">for</wd>
<space/>
<wd l="6965" t="9619" r="7243" b="9763">the</wd>
<space/>
<wd l="7310" t="9624" r="8213" b="9802">generation</wd>
<space/>
<wd l="8280" t="9614" r="8448" b="9763">of</wd>
<space/>
<wd l="8506" t="9667" r="9168" b="9763">answers</wd>
<space/>
<wd l="9240" t="9624" r="9403" b="9758">in</wd>
<space/>
<wd l="9470" t="9667" r="9566" b="9763">a</wd>
<space/>
<wd l="9638" t="9614" r="10406" b="9802">Question</wd>
<space/>
<wd l="10474" t="9614" r="10786" b="9758">An-</wd>
</ln>
<ln l="6101" t="9864" r="7445" b="10042" baseLine="9994" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="3">
<wd l="6101" t="9864" r="6749" b="10042">swering</wd>
<space/>
<wd l="6816" t="9874" r="7445" b="10042">system.</wd>
</ln>
</para>
<para l="7493" t="10291" r="9403" b="10464" alignment="centered" spaceBefore="191" lsp="exactly" lspExact="282" language="en">
<ln l="7493" t="10291" r="9403" b="10464" baseLine="10454" underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="24">
<wd l="7493" t="10301" r="7675" b="10464">6.</wd>
<space/>
<wd l="7968" t="10296" r="8736" b="10464">Future</wd>
<space/>
<wd l="8842" t="10291" r="9403" b="10464">work</wd>
</ln>
</para>
<para l="6096" t="10618" r="10805" b="12000" alignment="justified" spaceBefore="50" lsp="exactly" lspExact="238" language="en">
<ln l="6106" t="10618" r="10786" b="10805" baseLine="10762" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6106" t="10618" r="6547" b="10766">Since</wd>
<space/>
<wd l="6624" t="10670" r="7094" b="10805">many</wd>
<space/>
<wd l="7166" t="10670" r="7656" b="10766">errors</wd>
<space/>
<wd l="7728" t="10670" r="8122" b="10766">were</wd>
<space/>
<wd l="8194" t="10622" r="8496" b="10766">due</wd>
<space/>
<wd l="8568" t="10637" r="8741" b="10766">to</wd>
<space/>
<wd l="8813" t="10622" r="9086" b="10766">the</wd>
<space/>
<wd l="9158" t="10627" r="9902" b="10766">noisiness</wd>
<space/>
<wd l="9984" t="10618" r="10152" b="10766">of</wd>
<space/>
<wd l="10205" t="10622" r="10478" b="10766">the</wd>
<space/>
<wd l="10555" t="10670" r="10786" b="10766">ar-</wd>
</ln>
<ln l="6101" t="10862" r="10786" b="11045" baseLine="10997" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="10862" r="6811" b="11045">bitrarily</wd>
<space/>
<wd l="6878" t="10862" r="7891" b="11006">downloaded</wd>
<space/>
<wd l="7958" t="10862" r="8290" b="11006">web</wd>
<space/>
<wd l="8362" t="10862" r="9331" b="11040">documents,</wd>
<space/>
<wd l="9413" t="10910" r="9509" b="11006">a</wd>
<space/>
<wd l="9571" t="10910" r="9998" b="11006">more</wd>
<space/>
<wd l="10066" t="10862" r="10786" b="11045">sophisti-</wd>
</ln>
<ln l="6101" t="11098" r="10786" b="11285" baseLine="11237" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="11102" r="6557" b="11246">cated</wd>
<space/>
<wd l="6610" t="11098" r="7282" b="11285">filtering</wd>
<space/>
<wd l="7330" t="11117" r="7675" b="11285">step</wd>
<space/>
<wd l="7733" t="11098" r="7963" b="11246">for</wd>
<space/>
<wd l="8016" t="11107" r="8890" b="11285">extracting</wd>
<space/>
<wd l="8938" t="11102" r="9610" b="11246">relevant</wd>
<space/>
<wd l="9667" t="11102" r="10277" b="11246">textual</wd>
<space/>
<wd l="10330" t="11098" r="10786" b="11246">infor-</wd>
</ln>
<ln l="6101" t="11338" r="10781" b="11525" baseLine="11477" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="11347" r="6706" b="11486">mation</wd>
<space/>
<wd l="6768" t="11338" r="7162" b="11486">from</wd>
<space/>
<wd l="7219" t="11342" r="7555" b="11486">web</wd>
<space/>
<wd l="7618" t="11347" r="7987" b="11486">sites</wd>
<space/>
<wd l="8054" t="11338" r="8578" b="11486">before</wd>
<space/>
<wd l="8640" t="11342" r="9384" b="11525">applying</wd>
<space/>
<wd l="9442" t="11342" r="9720" b="11482">NE</wd>
<space/>
<wd l="9782" t="11347" r="10781" b="11525">recognition,</wd>
<space/>
</ln>
<ln l="6101" t="11573" r="10805" b="11760" baseLine="11717" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6101" t="11582" r="6773" b="11760">parsing,</wd>
<space/>
<wd l="6888" t="11592" r="7171" b="11722">etc.</wd>
<space/>
<wd l="7286" t="11582" r="7406" b="11722">is</wd>
<space/>
<wd l="7507" t="11578" r="7963" b="11760">likely</wd>
<space/>
<wd l="8054" t="11592" r="8227" b="11722">to</wd>
<space/>
<wd l="8328" t="11582" r="9010" b="11760">improve</wd>
<space/>
<wd l="9101" t="11578" r="9379" b="11722">the</wd>
<space/>
<wd l="9475" t="11573" r="10541" b="11760">performance</wd>
<space/>
<wd l="10637" t="11573" r="10805" b="11722">of</wd>
<space/>
</ln>
<ln l="6096" t="11818" r="7070" b="12000" baseLine="11957" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="6096" t="11818" r="6370" b="11962">the</wd>
<space/>
<wd l="6446" t="11832" r="7070" b="12000">system.</wd>
</ln>
</para>
<para l="6096" t="12053" r="10805" b="15826" alignment="justified" spaceAfter="4" lsp="exactly" lspExact="239" language="en">
<ln l="6101" t="12053" r="10786" b="12240" baseLine="12192" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="12058" r="6437" b="12202">The</wd>
<space/>
<wd l="6509" t="12058" r="6936" b="12202">NER</wd>
<space/>
<wd l="7003" t="12072" r="7944" b="12240">component</wd>
<space/>
<wd l="8021" t="12058" r="8453" b="12240">plays</wd>
<space/>
<wd l="8530" t="12106" r="8626" b="12202">a</wd>
<space/>
<wd l="8693" t="12058" r="9259" b="12202">crucial</wd>
<space/>
<wd l="9331" t="12058" r="9648" b="12202">role</wd>
<space/>
<wd l="9720" t="12053" r="9950" b="12202">for</wd>
<space/>
<wd l="10018" t="12058" r="10291" b="12202">the</wd>
<space/>
<wd l="10363" t="12058" r="10786" b="12240">qual-</wd>
</ln>
<ln l="6101" t="12293" r="10795" b="12480" baseLine="12432" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="12302" r="6331" b="12480">ity</wd>
<space/>
<wd l="6384" t="12293" r="6547" b="12442">of</wd>
<space/>
<wd l="6586" t="12298" r="6859" b="12442">the</wd>
<space/>
<wd l="6912" t="12298" r="7406" b="12442">whole</wd>
<space/>
<wd l="7464" t="12312" r="8093" b="12480">system,</wd>
<space/>
<wd l="8165" t="12298" r="8827" b="12442">because</wd>
<space/>
<wd l="8875" t="12298" r="9154" b="12442">the</wd>
<space/>
<wd l="9206" t="12298" r="9864" b="12442">relation</wd>
<space/>
<wd l="9922" t="12302" r="10795" b="12442">extraction</wd>
<space/>
</ln>
<ln l="6101" t="12538" r="10790" b="12720" baseLine="12672" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="12552" r="7037" b="12720">component</wd>
<space/>
<wd l="7133" t="12538" r="7824" b="12720">depends</wd>
<space/>
<wd l="7910" t="12538" r="8520" b="12720">heavily</wd>
<space/>
<wd l="8606" t="12586" r="8808" b="12682">on</wd>
<space/>
<wd l="8890" t="12538" r="9163" b="12682">the</wd>
<space/>
<wd l="9245" t="12538" r="9677" b="12682">NER</wd>
<space/>
<wd l="9758" t="12538" r="10382" b="12720">quality,</wd>
<space/>
<wd l="10478" t="12538" r="10790" b="12682">and</wd>
<space/>
</ln>
<ln l="6096" t="12773" r="10805" b="12960" baseLine="12912" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="12778" r="6749" b="12960">thereby</wd>
<space/>
<wd l="6821" t="12778" r="7094" b="12922">the</wd>
<space/>
<wd l="7171" t="12778" r="7598" b="12922">NER</wd>
<space/>
<wd l="7670" t="12778" r="8270" b="12960">quality</wd>
<space/>
<wd l="8342" t="12773" r="9173" b="12922">influences</wd>
<space/>
<wd l="9254" t="12778" r="9581" b="12922">also</wd>
<space/>
<wd l="9653" t="12778" r="9926" b="12922">the</wd>
<space/>
<wd l="10003" t="12778" r="10560" b="12922">results</wd>
<space/>
<wd l="10637" t="12773" r="10805" b="12922">of</wd>
<space/>
</ln>
<ln l="6096" t="13008" r="10790" b="13195" baseLine="13152" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="13013" r="6370" b="13157">the</wd>
<space/>
<wd l="6446" t="13013" r="7286" b="13195">clustering</wd>
<space/>
<wd l="7358" t="13061" r="8021" b="13195">process.</wd>
<space/>
<wd l="8136" t="13008" r="8275" b="13152">A</wd>
<space/>
<wd l="8357" t="13013" r="9029" b="13195">possible</wd>
<space/>
<wd l="9106" t="13013" r="9787" b="13157">solution</wd>
<space/>
<wd l="9854" t="13027" r="10032" b="13157">to</wd>
<space/>
<wd l="10109" t="13018" r="10790" b="13195">improve</wd>
<space/>
</ln>
<ln l="6101" t="13248" r="10795" b="13435" baseLine="13392" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13253" r="6533" b="13397">NER</wd>
<space/>
<wd l="6605" t="13258" r="6763" b="13392">in</wd>
<space/>
<wd l="6835" t="13253" r="7109" b="13397">the</wd>
<space/>
<wd l="7186" t="13253" r="7690" b="13392">IDEX</wd>
<space/>
<wd l="7771" t="13248" r="8381" b="13435">System</wd>
<space/>
<wd l="8462" t="13258" r="8582" b="13397">is</wd>
<space/>
<wd l="8659" t="13267" r="8832" b="13397">to</wd>
<space/>
<wd l="8909" t="13258" r="9672" b="13435">integrate</wd>
<space/>
<wd l="9749" t="13301" r="9845" b="13397">a</wd>
<space/>
<wd l="9922" t="13253" r="10795" b="13397">MetaNER</wd>
<space/>
</ln>
<ln l="6101" t="13488" r="10786" b="13675" baseLine="13627" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13507" r="7090" b="13675">component,</wd>
<space/>
<wd l="7162" t="13493" r="8050" b="13675">combining</wd>
<space/>
<wd l="8098" t="13493" r="8371" b="13637">the</wd>
<space/>
<wd l="8429" t="13493" r="8986" b="13637">results</wd>
<space/>
<wd l="9048" t="13488" r="9216" b="13637">of</wd>
<space/>
<wd l="9259" t="13493" r="9840" b="13637">several</wd>
<space/>
<wd l="9898" t="13493" r="10325" b="13637">NER</wd>
<space/>
<wd l="10378" t="13541" r="10786" b="13637">com-</wd>
</ln>
<ln l="6101" t="13728" r="10786" b="13915" baseLine="13867" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="13747" r="6811" b="13915">ponents.</wd>
<space/>
<wd l="6955" t="13733" r="7570" b="13877">Within</wd>
<space/>
<wd l="7646" t="13733" r="7925" b="13877">the</wd>
<space/>
<wd l="8006" t="13728" r="8918" b="13877">framework</wd>
<space/>
<wd l="9000" t="13728" r="9168" b="13877">of</wd>
<space/>
<wd l="9235" t="13733" r="9509" b="13877">the</wd>
<space/>
<wd l="9595" t="13733" r="10099" b="13872">IDEX</wd>
<space/>
<wd l="10186" t="13738" r="10786" b="13915">project</wd>
<space/>
</ln>
<ln l="6101" t="13973" r="10790" b="14155" baseLine="14107" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="14021" r="6197" b="14117">a</wd>
<space/>
<wd l="6298" t="13973" r="7176" b="14117">MetaNER</wd>
<space/>
<wd l="7277" t="13987" r="8213" b="14155">component</wd>
<space/>
<wd l="8323" t="13973" r="8957" b="14155">already</wd>
<space/>
<wd l="9058" t="13973" r="9336" b="14117">has</wd>
<space/>
<wd l="9442" t="13973" r="9840" b="14117">been</wd>
<space/>
<wd l="9941" t="13973" r="10790" b="14155">developed</wd>
<space/>
</ln>
<ln l="6115" t="14194" r="10790" b="14400" baseLine="14347" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6115" t="14194" r="6614" b="14400">(Heyl,</wd>
<space/>
<wd l="6686" t="14222" r="6859" b="14352">to</wd>
<space/>
<wd l="6926" t="14256" r="7512" b="14390">appear</wd>
<space/>
<wd l="7579" t="14194" r="8093" b="14400">2008),</wd>
<space/>
<wd l="8165" t="14208" r="8448" b="14352">but</wd>
<space/>
<wd l="8525" t="14222" r="8794" b="14352">not</wd>
<space/>
<wd l="8861" t="14222" r="9120" b="14390">yet</wd>
<space/>
<wd l="9192" t="14208" r="10061" b="14390">integrated</wd>
<space/>
<wd l="10128" t="14213" r="10459" b="14352">into</wd>
<space/>
<wd l="10517" t="14208" r="10790" b="14352">the</wd>
<space/>
</ln>
<ln l="6101" t="14448" r="10786" b="14630" baseLine="14587" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="14462" r="6984" b="14630">prototype.</wd>
<space/>
<wd l="7114" t="14448" r="7450" b="14592">The</wd>
<space/>
<wd l="7531" t="14448" r="8410" b="14592">MetaNER</wd>
<space/>
<wd l="8486" t="14462" r="9422" b="14630">component</wd>
<space/>
<wd l="9514" t="14448" r="10358" b="14630">developed</wd>
<space/>
<wd l="10445" t="14496" r="10786" b="14592">uses</wd>
<space/>
</ln>
<ln l="6096" t="14683" r="10786" b="14870" baseLine="14822" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="14688" r="6370" b="14832">the</wd>
<space/>
<wd l="6427" t="14688" r="6984" b="14832">results</wd>
<space/>
<wd l="7046" t="14683" r="7440" b="14832">from</wd>
<space/>
<wd l="7493" t="14688" r="7934" b="14832">three</wd>
<space/>
<wd l="7992" t="14683" r="8698" b="14832">different</wd>
<space/>
<wd l="8760" t="14688" r="9187" b="14832">NER</wd>
<space/>
<wd l="9240" t="14702" r="9946" b="14870">systems.</wd>
<space/>
<wd l="10051" t="14688" r="10387" b="14832">The</wd>
<space/>
<wd l="10445" t="14702" r="10786" b="14832">out-</wd>
</ln>
<ln l="6101" t="14923" r="10795" b="15110" baseLine="15062" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="14942" r="6384" b="15110">put</wd>
<space/>
<wd l="6461" t="14923" r="6629" b="15072">of</wd>
<space/>
<wd l="6682" t="14928" r="7056" b="15072">each</wd>
<space/>
<wd l="7123" t="14928" r="7550" b="15072">NER</wd>
<space/>
<wd l="7613" t="14942" r="8549" b="15110">component</wd>
<space/>
<wd l="8621" t="14933" r="8746" b="15072">is</wd>
<space/>
<wd l="8813" t="14928" r="9571" b="15110">weighted</wd>
<space/>
<wd l="9638" t="14928" r="10526" b="15110">depending</wd>
<space/>
<wd l="10589" t="14976" r="10795" b="15072">on</wd>
<space/>
</ln>
<ln l="6096" t="15163" r="10786" b="15350" baseLine="15302" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6096" t="15168" r="6370" b="15312">the</wd>
<space/>
<wd l="6432" t="15182" r="7368" b="15350">component</wd>
<space/>
<wd l="7435" t="15168" r="7742" b="15312">and</wd>
<space/>
<wd l="7805" t="15163" r="7930" b="15307">if</wd>
<space/>
<wd l="7968" t="15168" r="8246" b="15312">the</wd>
<space/>
<wd l="8304" t="15216" r="8650" b="15312">sum</wd>
<space/>
<wd l="8712" t="15163" r="8875" b="15312">of</wd>
<space/>
<wd l="8918" t="15168" r="9360" b="15312">these</wd>
<space/>
<wd l="9413" t="15168" r="9931" b="15312">values</wd>
<space/>
<wd l="9998" t="15163" r="10229" b="15312">for</wd>
<space/>
<wd l="10286" t="15216" r="10382" b="15312">a</wd>
<space/>
<wd l="10440" t="15216" r="10786" b="15350">pos-</wd>
</ln>
<ln l="6101" t="15403" r="10786" b="15586" baseLine="15542" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="15403" r="6485" b="15547">sible</wd>
<space/>
<wd l="6566" t="15403" r="6845" b="15542">NE</wd>
<space/>
<wd l="6926" t="15403" r="7560" b="15547">exceeds</wd>
<space/>
<wd l="7646" t="15451" r="7742" b="15547">a</wd>
<space/>
<wd l="7824" t="15408" r="8414" b="15547">certain</wd>
<space/>
<wd l="8491" t="15403" r="9293" b="15547">threshold</wd>
<space/>
<wd l="9379" t="15408" r="9494" b="15547">it</wd>
<space/>
<wd l="9586" t="15408" r="9706" b="15547">is</wd>
<space/>
<wd l="9792" t="15403" r="10536" b="15586">accepted</wd>
<space/>
<wd l="10622" t="15451" r="10786" b="15547">as</wd>
<space/>
</ln>
<ln l="6101" t="15643" r="8453" b="15826" baseLine="15782" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="6101" t="15643" r="6379" b="15782">NE</wd>
<space/>
<wd l="6451" t="15643" r="7267" b="15787">otherwise</wd>
<space/>
<wd l="7339" t="15648" r="7459" b="15787">it</wd>
<space/>
<wd l="7541" t="15648" r="7661" b="15787">is</wd>
<space/>
<wd l="7738" t="15643" r="8453" b="15826">rejected.</wd>
</ln>
</para>
</column>
</section>
</body>
</page>
<page ocr-vers="OmniPageCSDK18" app-vers="OmniPageCSDK18">
<description>
<source file="pdf\L08-1001.pdf.pdf" dpix="300" dpiy="300" sizex="2481" sizey="3508"/>
<theoreticalPage size="A4" marginLeft="1042" marginTop="1380" marginRight="6147" marginBottom="1440" offsetX="10" offsetY="16" width="11918" height="16854"/>
<language>en</language>
</description>
<body>
<section l="1042" t="1380" r="5762" b="12060">
<column l="1042" t="1380" r="5762" b="12060">
<para l="1042" t="1445" r="5741" b="3538" alignment="justified" spaceBefore="8" lsp="exactly" lspExact="240" language="en">
<ln l="1046" t="1445" r="5741" b="1627" baseLine="1579" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="1445" r="1382" b="1589">The</wd>
<space/>
<wd l="1474" t="1445" r="2314" b="1627">clustering</wd>
<space/>
<wd l="2400" t="1459" r="2746" b="1627">step</wd>
<space/>
<wd l="2842" t="1459" r="3451" b="1589">returns</wd>
<space/>
<wd l="3547" t="1493" r="4018" b="1627">many</wd>
<space/>
<wd l="4104" t="1445" r="4747" b="1589">clusters</wd>
<space/>
<wd l="4843" t="1450" r="5741" b="1627">containing</wd>
<space/>
</ln>
<ln l="1042" t="1680" r="5731" b="1867" baseLine="1819" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="1699" r="1349" b="1829">two</wd>
<space/>
<wd l="1445" t="1690" r="2222" b="1829">instances</wd>
<space/>
<wd l="2323" t="1685" r="2712" b="1867">only.</wd>
<space/>
<wd l="2885" t="1680" r="3024" b="1824">A</wd>
<space/>
<wd l="3120" t="1685" r="3480" b="1829">task</wd>
<space/>
<wd l="3576" t="1680" r="3806" b="1829">for</wd>
<space/>
<wd l="3902" t="1680" r="4421" b="1829">future</wd>
<space/>
<wd l="4512" t="1685" r="4934" b="1829">work</wd>
<space/>
<wd l="5026" t="1690" r="5146" b="1829">is</wd>
<space/>
<wd l="5242" t="1699" r="5414" b="1829">to</wd>
<space/>
<wd l="5510" t="1690" r="5731" b="1824">in-</wd>
</ln>
<ln l="1042" t="1920" r="5731" b="2102" baseLine="2059" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="1925" r="1853" b="2102">vestigate,</wd>
<space/>
<wd l="1958" t="1920" r="2654" b="2064">whether</wd>
<space/>
<wd l="2746" t="1925" r="2866" b="2064">it</wd>
<space/>
<wd l="2966" t="1925" r="3091" b="2064">is</wd>
<space/>
<wd l="3192" t="1920" r="3864" b="2102">possible</wd>
<space/>
<wd l="3955" t="1934" r="4133" b="2064">to</wd>
<space/>
<wd l="4229" t="1920" r="4661" b="2064">build</wd>
<space/>
<wd l="4757" t="1920" r="5251" b="2102">larger</wd>
<space/>
<wd l="5347" t="1920" r="5731" b="2064">clus-</wd>
</ln>
<ln l="1042" t="2155" r="5741" b="2342" baseLine="2299" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="2174" r="1406" b="2338">ters,</wd>
<space/>
<wd l="1488" t="2160" r="1992" b="2304">which</wd>
<space/>
<wd l="2064" t="2208" r="2323" b="2304">are</wd>
<space/>
<wd l="2400" t="2160" r="2712" b="2304">still</wd>
<space/>
<wd l="2789" t="2155" r="3778" b="2342">meaningful.</wd>
<space/>
<wd l="3898" t="2155" r="4238" b="2304">One</wd>
<space/>
<wd l="4310" t="2208" r="4646" b="2342">way</wd>
<space/>
<wd l="4718" t="2155" r="4886" b="2304">of</wd>
<space/>
<wd l="4949" t="2160" r="5741" b="2342">enlarging</wd>
<space/>
</ln>
<ln l="1046" t="2400" r="5736" b="2544" baseLine="2534" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="2400" r="1618" b="2544">cluster</wd>
<space/>
<wd l="1714" t="2405" r="2021" b="2544">size</wd>
<space/>
<wd l="2117" t="2405" r="2242" b="2544">is</wd>
<space/>
<wd l="2338" t="2414" r="2510" b="2544">to</wd>
<space/>
<wd l="2611" t="2414" r="3211" b="2544">extract</wd>
<space/>
<wd l="3317" t="2448" r="3744" b="2544">more</wd>
<space/>
<wd l="3840" t="2400" r="4618" b="2544">relations.</wd>
<space/>
<wd l="4800" t="2400" r="5179" b="2544">This</wd>
<space/>
<wd l="5280" t="2400" r="5736" b="2544">could</wd>
<space/>
</ln>
<ln l="1046" t="2640" r="5731" b="2822" baseLine="2774" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="2640" r="1243" b="2784">be</wd>
<space/>
<wd l="1320" t="2640" r="2045" b="2784">achieved</wd>
<space/>
<wd l="2117" t="2640" r="2323" b="2822">by</wd>
<space/>
<wd l="2395" t="2640" r="3192" b="2822">loosening</wd>
<space/>
<wd l="3259" t="2640" r="3533" b="2784">the</wd>
<space/>
<wd l="3605" t="2645" r="4478" b="2784">extraction</wd>
<space/>
<wd l="4550" t="2645" r="5165" b="2784">criteria</wd>
<space/>
<wd l="5237" t="2688" r="5405" b="2784">as</wd>
<space/>
<wd l="5482" t="2640" r="5731" b="2784">de-</wd>
</ln>
<ln l="1046" t="2875" r="5736" b="3062" baseLine="3014" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="2880" r="1651" b="3024">scribed</wd>
<space/>
<wd l="1714" t="2885" r="1877" b="3019">in</wd>
<space/>
<wd l="1934" t="2885" r="2525" b="3024">section</wd>
<space/>
<wd l="2582" t="2880" r="2717" b="3019">4.</wd>
<space/>
<wd l="2794" t="2875" r="3211" b="3058">Also,</wd>
<space/>
<wd l="3283" t="2885" r="3403" b="3024">it</wd>
<space/>
<wd l="3466" t="2880" r="3974" b="3024">would</wd>
<space/>
<wd l="4037" t="2880" r="4234" b="3024">be</wd>
<space/>
<wd l="4296" t="2885" r="5203" b="3062">interesting</wd>
<space/>
<wd l="5256" t="2894" r="5429" b="3024">to</wd>
<space/>
<wd l="5491" t="2928" r="5736" b="3024">see</wd>
<space/>
</ln>
<ln l="1042" t="3120" r="5736" b="3302" baseLine="3254" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1042" t="3120" r="1738" b="3264">whether</wd>
<space/>
<wd l="1810" t="3120" r="2453" b="3264">clusters</wd>
<space/>
<wd l="2530" t="3120" r="2986" b="3264">could</wd>
<space/>
<wd l="3062" t="3120" r="3259" b="3264">be</wd>
<space/>
<wd l="3331" t="3120" r="3998" b="3302">merged.</wd>
<space/>
<wd l="4109" t="3120" r="4483" b="3264">This</wd>
<space/>
<wd l="4555" t="3120" r="5064" b="3264">would</wd>
<space/>
<wd l="5141" t="3125" r="5736" b="3302">require</wd>
<space/>
</ln>
<ln l="1046" t="3350" r="4622" b="3538" baseLine="3494" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="4">
<wd l="1046" t="3403" r="1142" b="3499">a</wd>
<space/>
<wd l="1214" t="3355" r="1843" b="3499">manual</wd>
<space/>
<wd l="1915" t="3355" r="2587" b="3538">analysis</wd>
<space/>
<wd l="2664" t="3350" r="2832" b="3499">of</wd>
<space/>
<wd l="2885" t="3355" r="3163" b="3499">the</wd>
<space/>
<wd l="3235" t="3355" r="3854" b="3499">created</wd>
<space/>
<wd l="3931" t="3355" r="4622" b="3499">clusters.</wd>
</ln>
</para>
<para l="1046" t="3768" r="2842" b="3950" alignment="left" spaceBefore="173" lsp="exactly" lspExact="238" language="en">
<ln l="1046" t="3768" r="2842" b="3950" baseLine="3902" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="13">
<wd l="1046" t="3768" r="2842" b="3950">Acknowledgement</wd>
</ln>
</para>
<para l="1046" t="4056" r="5741" b="5208" alignment="justified" spaceBefore="49" lsp="exactly" lspExact="240" language="en">
<ln l="1046" t="4056" r="5741" b="4238" baseLine="4195" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="4056" r="1382" b="4200">The</wd>
<space/>
<wd l="1450" t="4056" r="1872" b="4200">work</wd>
<space/>
<wd l="1939" t="4056" r="2755" b="4238">presented</wd>
<space/>
<wd l="2827" t="4056" r="3187" b="4200">here</wd>
<space/>
<wd l="3254" t="4104" r="3562" b="4200">was</wd>
<space/>
<wd l="3638" t="4056" r="4368" b="4238">partially</wd>
<space/>
<wd l="4440" t="4056" r="5299" b="4238">supported</wd>
<space/>
<wd l="5371" t="4056" r="5578" b="4238">by</wd>
<space/>
<wd l="5645" t="4104" r="5741" b="4200">a</wd>
<space/>
</ln>
<ln l="1046" t="4291" r="5741" b="4478" baseLine="4435" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="4296" r="1747" b="4440">research</wd>
<space/>
<wd l="1805" t="4310" r="2251" b="4478">grant</wd>
<space/>
<wd l="2318" t="4291" r="2712" b="4440">from</wd>
<space/>
<wd l="2770" t="4296" r="3043" b="4440">the</wd>
<space/>
<wd l="3101" t="4296" r="4090" b="4478">“Programm</wd>
<space/>
<wd l="4147" t="4344" r="4421" b="4440">zur</wd>
<space/>
<wd l="4478" t="4296" r="5381" b="4478">Förderung</wd>
<space/>
<wd l="5429" t="4344" r="5741" b="4440">von</wd>
<space/>
</ln>
<ln l="1046" t="4522" r="5736" b="4728" baseLine="4670" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="4536" r="1963" b="4718">Forschung,</wd>
<space/>
<wd l="2054" t="4536" r="3173" b="4680">Innovationen</wd>
<space/>
<wd l="3250" t="4536" r="3571" b="4680">und</wd>
<space/>
<wd l="3658" t="4536" r="4781" b="4718">Technologien</wd>
<space/>
<wd l="4872" t="4522" r="5736" b="4728">(ProFIT)”</wd>
<space/>
</ln>
<ln l="1061" t="4762" r="5731" b="4968" baseLine="4910" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1061" t="4762" r="1565" b="4968">(FKZ:</wd>
<space/>
<wd l="1651" t="4762" r="2491" b="4968">10135984)</wd>
<space/>
<wd l="2573" t="4776" r="2885" b="4920">and</wd>
<space/>
<wd l="2942" t="4776" r="3216" b="4920">the</wd>
<space/>
<wd l="3278" t="4776" r="4114" b="4958">European</wd>
<space/>
<wd l="4176" t="4776" r="4920" b="4958">Regional</wd>
<space/>
<wd l="4982" t="4776" r="5731" b="4958">Develop-</wd>
</ln>
<ln l="1046" t="5002" r="2813" b="5208" baseLine="5150" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="5030" r="1469" b="5160">ment</wd>
<space/>
<wd l="1550" t="5016" r="1987" b="5160">Fund</wd>
<space/>
<wd l="2078" t="5002" r="2813" b="5208">(ERDF).</wd>
</ln>
</para>
<para l="2539" t="5462" r="4253" b="5635" alignment="centered" spaceBefore="207" lsp="exactly" lspExact="282" language="en">
<ln l="2539" t="5462" r="4253" b="5635" baseLine="5630" underlined="none" subsuperscript="none" fontSize="1300" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="21">
<wd l="2539" t="5467" r="2717" b="5635">7.</wd>
<space/>
<wd l="3005" t="5462" r="4253" b="5635">References</wd>
</ln>
</para>
<para l="1046" t="5794" r="5750" b="6950" alignment="justified" li="216" spaceBefore="53" fli="-216" lsp="exactly" lspExact="240" language="en">
<ln l="1046" t="5794" r="5731" b="5981" baseLine="5938" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="5798" r="1704" b="5942">Michele</wd>
<space/>
<wd l="1795" t="5798" r="2381" b="5976">Banko,</wd>
<space/>
<wd l="2486" t="5798" r="3154" b="5942">Michael</wd>
<space/>
<wd l="3245" t="5798" r="3379" b="5942">J.</wd>
<space/>
<wd l="3490" t="5794" r="4301" b="5976">Cafarella,</wd>
<space/>
<wd l="4411" t="5794" r="5098" b="5981">Stephen</wd>
<space/>
<wd l="5189" t="5794" r="5731" b="5942">Soder-</wd>
</ln>
<ln l="1248" t="6034" r="5722" b="6216" baseLine="6178" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1248" t="6038" r="1661" b="6216">land,</wd>
<space/>
<wd l="1742" t="6038" r="2515" b="6182">Matthew</wd>
<space/>
<wd l="2587" t="6038" r="3562" b="6216">Broadhead,</wd>
<space/>
<wd l="3643" t="6038" r="3955" b="6182">and</wd>
<space/>
<wd l="4037" t="6034" r="4459" b="6182">Oren</wd>
<space/>
<wd l="4526" t="6038" r="5184" b="6182">Etzioni.</wd>
<space/>
<wd l="5294" t="6038" r="5722" b="6182">2007.</wd>
<space/>
</ln>
<ln l="1253" t="6274" r="5726" b="6461" baseLine="6413">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1253" t="6274" r="1714" b="6461">Open</wd>
<space/>
<wd l="1771" t="6274" r="2779" b="6422">information</wd>
<space/>
<wd l="2842" t="6283" r="3715" b="6422">extraction</wd>
<space/>
<wd l="3778" t="6274" r="4176" b="6422">from</wd>
<space/>
<wd l="4238" t="6278" r="4512" b="6422">the</wd>
<space/>
<wd l="4570" t="6278" r="4944" b="6422">web.</wd>
<space/>
<wd l="5054" t="6278" r="5232" b="6418">In</wd>
<space/>
</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="5299" t="6278" r="5726" b="6422">Proc.</wd>
<space/>
</run>
</ln>
<ln l="1262" t="6514" r="5750" b="6701" baseLine="6653" italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1262" t="6514" r="1435" b="6701">of</wd>
<space/>
<wd l="1512" t="6518" r="1762" b="6662">the</wd>
<space/>
<wd l="1858" t="6518" r="2995" b="6662">International</wd>
<space/>
<wd l="3091" t="6518" r="3533" b="6662">Joint</wd>
<space/>
<wd l="3643" t="6514" r="4574" b="6701">Conference</wd>
<space/>
<wd l="4685" t="6566" r="4886" b="6662">on</wd>
<space/>
<wd l="4978" t="6514" r="5750" b="6701">Artificial</wd>
<space/>
</ln>
<ln l="1253" t="6744" r="3048" b="6950" baseLine="6893">
<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1253" t="6758" r="2232" b="6941">Intelligence</wd>
<space/>
</run>
<wd l="2328" t="6744" r="3048" b="6950"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">(IJCAI)</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">.</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><nl orig="true"/>
</run>
</ln>
</para>
<para l="1046" t="6998" r="5741" b="7186" alignment="justified" spaceBefore="6" lsp="exactly" lspExact="237" language="en">
<ln l="1046" t="6998" r="5741" b="7186" baseLine="7142" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="7">
<wd l="1046" t="6998" r="1680" b="7147">Andrea</wd>
<space/>
<wd l="1766" t="7003" r="2198" b="7186">Heyl.</wd>
<space/>
<wd l="2328" t="7018" r="2501" b="7147">to</wd>
<space/>
<wd l="2592" t="7051" r="3178" b="7186">appear</wd>
<space/>
<wd l="3269" t="7008" r="3696" b="7147">2008.</wd>
<space/>
<wd l="3830" t="7003" r="4992" b="7186">Unsupervised</wd>
<space/>
<wd l="5083" t="7003" r="5741" b="7147">relation</wd>
</ln>
</para>
<para l="1046" t="7238" r="5722" b="7675" alignment="justified" fli="216" lsp="exactly" lspExact="244" language="en">
<ln l="1248" t="7238" r="5424" b="7426" baseLine="7382" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1248" t="7248" r="2160" b="7387">extraction.</wd>
<space/>
<wd l="2270" t="7243" r="2995" b="7387">Master’s</wd>
<space/>
<wd l="3067" t="7243" r="3600" b="7421">thesis,</wd>
<space/>
<wd l="3686" t="7238" r="4440" b="7387">Saarland</wd>
<space/>
<wd l="4512" t="7243" r="5424" b="7426">University.</wd>
<space/>
</ln>
<ln l="1046" t="7488" r="5722" b="7675" baseLine="7627" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1046" t="7493" r="1454" b="7675">Lc4j.</wd>
<space/>
<wd l="1598" t="7493" r="2026" b="7637">2007.</wd>
<space/>
<wd l="2165" t="7493" r="2990" b="7675">Language</wd>
<space/>
<wd l="3062" t="7498" r="4277" b="7675">categorization</wd>
<space/>
<wd l="4349" t="7493" r="4925" b="7675">library</wd>
<space/>
<wd l="4997" t="7488" r="5227" b="7637">for</wd>
<space/>
<wd l="5299" t="7493" r="5722" b="7637">Java.</wd>
</ln>
</para>
<para l="1248" t="7718" r="4450" b="7925" alignment="justified" li="216" spaceBefore="4" lsp="exactly" lspExact="238" language="en">
<ln l="1248" t="7718" r="4450" b="7925" baseLine="7867" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="9">
<wd l="1248" t="7718" r="4450" b="7925">http://www.olivo.net/software/lc4j/.</wd>
</ln>
</para>
<para l="1046" t="7968" r="5731" b="8371" alignment="justified" lsp="exactly" lspExact="248" language="en">
<ln l="1046" t="7968" r="5472" b="8174" baseLine="8117" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6">
<wd l="1046" t="7982" r="1867" b="8165">LingPipe.</wd>
<space/>
<wd l="1982" t="7982" r="2410" b="8126">2007.</wd>
<space/>
<wd l="2520" t="7968" r="5472" b="8174">http://www.alias-i.com/lingpipe/.</wd>
<space/>
</ln>
<ln l="1051" t="8222" r="5731" b="8371" baseLine="8366">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="6"><wd l="1051" t="8222" r="1670" b="8371">Satoshi</wd>
<space/>
<wd l="1747" t="8222" r="2333" b="8371">Sekine.</wd>
<space/>
<wd l="2448" t="8232" r="2875" b="8371">2006.</wd>
<space/>
<wd l="2990" t="8222" r="3994" b="8371">On-demand</wd>
<space/>
<wd l="4066" t="8222" r="5074" b="8371">information</wd>
<space/>
<wd l="5141" t="8242" r="5731" b="8371">extrac-</wd>
</run>
<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>
</run>
</ln>
</para>
<para l="1243" t="8462" r="5731" b="8650" alignment="justified" li="216" spaceBefore="2" lsp="exactly" lspExact="237" language="en">
<ln l="1243" t="8462" r="5731" b="8650" baseLine="8606">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8"><wd l="1243" t="8472" r="1622" b="8611">tion.</wd>
<space/>
<wd l="1766" t="8467" r="1944" b="8606">In</wd>
<space/>
</run>
<wd l="2040" t="8462" r="2482" b="8611"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">ACL</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8">.</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="8"><space/>
<wd l="2587" t="8467" r="2923" b="8611">The</wd>
<space/>
<wd l="3019" t="8462" r="4013" b="8611">Association</wd>
<space/>
<wd l="4104" t="8462" r="4334" b="8611">for</wd>
<space/>
<wd l="4430" t="8462" r="5294" b="8650">Computer</wd>
<space/>
<wd l="5390" t="8467" r="5731" b="8606">Lin-</wd>
</run>
<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>
</run>
</ln>
</para>
<para l="1248" t="8712" r="1925" b="8890" alignment="justified" li="216" lsp="exactly" lspExact="237" language="en">
<ln l="1248" t="8712" r="1925" b="8890" baseLine="8842" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1248" t="8712" r="1925" b="8890">guistics.</wd>
</ln>
</para>
<para l="1042" t="8952" r="5746" b="10574" alignment="justified" li="216" spaceBefore="4" fli="-216" lsp="exactly" lspExact="240" language="en">
<ln l="1042" t="8952" r="5731" b="9139" baseLine="9091" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1042" t="8957" r="1661" b="9101">Yusuke</wd>
<space/>
<wd l="1742" t="8952" r="2582" b="9139">Shinyama</wd>
<space/>
<wd l="2659" t="8957" r="2966" b="9101">and</wd>
<space/>
<wd l="3053" t="8952" r="3672" b="9101">Satoshi</wd>
<space/>
<wd l="3758" t="8952" r="4344" b="9101">Sekine.</wd>
<space/>
<wd l="4469" t="8962" r="4896" b="9101">2006.</wd>
<space/>
<wd l="5011" t="8957" r="5731" b="9139">Preemp-</wd>
</ln>
<ln l="1243" t="9192" r="5731" b="9379" baseLine="9331" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1243" t="9202" r="1560" b="9341">tive</wd>
<space/>
<wd l="1680" t="9192" r="2688" b="9341">information</wd>
<space/>
<wd l="2803" t="9202" r="3677" b="9341">extraction</wd>
<space/>
<wd l="3792" t="9202" r="4243" b="9379">using</wd>
<space/>
<wd l="4358" t="9197" r="5390" b="9341">unrestricted</wd>
<space/>
<wd l="5510" t="9245" r="5731" b="9341">re-</wd>
</ln>
<ln l="1248" t="9427" r="5746" b="9614" baseLine="9571">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1248" t="9432" r="1738" b="9576">lation</wd>
<space/>
<wd l="1848" t="9432" r="2664" b="9614">discovery.</wd>
<space/>
<wd l="2832" t="9432" r="3010" b="9571">In</wd>
<space/>
</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="3120" t="9432" r="3552" b="9576">Proc.</wd>
<space/>
<wd l="3686" t="9427" r="3864" b="9614">of</wd>
<space/>
<wd l="3950" t="9432" r="4200" b="9576">the</wd>
<space/>
<wd l="4315" t="9437" r="4747" b="9576">main</wd>
<space/>
<wd l="4862" t="9427" r="5746" b="9614">conference</wd>
<space/>
</run>
</ln>
<ln l="1262" t="9667" r="5746" b="9854" baseLine="9811" italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1262" t="9720" r="1464" b="9816">on</wd>
<space/>
<wd l="1550" t="9672" r="2179" b="9816">Human</wd>
<space/>
<wd l="2270" t="9672" r="3077" b="9854">Language</wd>
<space/>
<wd l="3187" t="9672" r="4109" b="9854">Technology</wd>
<space/>
<wd l="4214" t="9667" r="5150" b="9854">Conference</wd>
<space/>
<wd l="5251" t="9667" r="5424" b="9854">of</wd>
<space/>
<wd l="5496" t="9672" r="5746" b="9816">the</wd>
<space/>
</ln>
<ln l="1253" t="9907" r="5741" b="10094" baseLine="10046" italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1253" t="9912" r="1752" b="10056">North</wd>
<space/>
<wd l="1810" t="9907" r="2645" b="10056">American</wd>
<space/>
<wd l="2726" t="9907" r="3403" b="10094">Chapter</wd>
<space/>
<wd l="3466" t="9907" r="3638" b="10094">of</wd>
<space/>
<wd l="3682" t="9912" r="3931" b="10056">the</wd>
<space/>
<wd l="3994" t="9907" r="4992" b="10056">Association</wd>
<space/>
<wd l="5059" t="9907" r="5232" b="10094">of</wd>
<space/>
<wd l="5290" t="9907" r="5741" b="10056">Com-</wd>
</ln>
<ln l="1243" t="10147" r="5741" b="10334" baseLine="10286">
<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><wd l="1243" t="10152" r="2122" b="10334">putational</wd>
<space/>
</run>
<wd l="2222" t="10152" r="3197" b="10334"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">Linguistics</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">,</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0"><space/>
<wd l="3317" t="10200" r="3782" b="10334">pages</wd>
<space/>
<wd l="3898" t="10152" r="4627" b="10296">304–311.</wd>
<space/>
<wd l="4747" t="10147" r="5741" b="10296">Association</wd>
<space/>
</run>
</ln>
<ln l="1248" t="10387" r="3888" b="10574" baseLine="10526" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1248" t="10387" r="1478" b="10536">for</wd>
<space/>
<wd l="1555" t="10387" r="2851" b="10574">Computational</wd>
<space/>
<wd l="2923" t="10392" r="3888" b="10574">Linguistics.</wd>
</ln>
</para>
<para l="1051" t="10622" r="5731" b="11069" alignment="justified" li="216" spaceBefore="10" fli="-216" lsp="exactly" lspExact="240" language="en">
<ln l="1051" t="10622" r="5731" b="10829" baseLine="10776" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1051" t="10632" r="1786" b="10781">Stanford</wd>
<space/>
<wd l="1978" t="10637" r="2563" b="10781">Parser.</wd>
<space/>
<wd l="2875" t="10637" r="3302" b="10781">2007.</wd>
<space/>
<wd l="3610" t="10622" r="5731" b="10829">http://nlp.stanford.edu/</wd>
<space/>
</ln>
<ln l="1248" t="10862" r="3667" b="11069" baseLine="11016" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1248" t="10862" r="3667" b="11069">downloads/lex-parser.shtml.</wd>
</ln>
</para>
<para l="1046" t="11126" r="5741" b="11270" alignment="justified" spaceBefore="7" lsp="exactly" lspExact="240" language="en">
<ln l="1046" t="11126" r="5741" b="11270" baseLine="11261">
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="15"><wd l="1046" t="11126" r="1325" b="11270">Ian</wd>
<space/>
<wd l="1445" t="11126" r="1627" b="11266">H.</wd>
<space/>
<wd l="1757" t="11126" r="2371" b="11270">Witten</wd>
<space/>
<wd l="2491" t="11126" r="2803" b="11270">and</wd>
<space/>
<wd l="2928" t="11126" r="3317" b="11270">Eibe</wd>
<space/>
<wd l="3437" t="11126" r="3974" b="11270">Frank.</wd>
<space/>
<wd l="4171" t="11131" r="4598" b="11270">2005.</wd>
<space/>
</run>
<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="15"><wd l="4790" t="11126" r="5213" b="11270">Data</wd>
<space/>
<wd l="5328" t="11126" r="5741" b="11270">Min-</wd>
</run>
<run fontFace="Times New Roman" fontFamily="roman" fontPitch="variable"><nl orig="true"/>
</run>
</ln>
</para>
<para l="1258" t="11366" r="5722" b="11549" alignment="justified" li="216" lsp="exactly" lspExact="234" language="en">
<ln l="1258" t="11366" r="5722" b="11549" baseLine="11501">
<run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><wd l="1258" t="11371" r="1570" b="11549">ing:</wd>
<space/>
<wd l="1661" t="11366" r="2424" b="11510">Practical</wd>
<space/>
<wd l="2482" t="11366" r="3192" b="11510">machine</wd>
<space/>
<wd l="3254" t="11366" r="3946" b="11549">learning</wd>
<space/>
<wd l="4003" t="11366" r="4382" b="11510">tools</wd>
<space/>
<wd l="4450" t="11366" r="4762" b="11510">and</wd>
<space/>
</run>
<wd l="4814" t="11366" r="5722" b="11549"><run italic="true" underlined="none" subsuperscript="none" fontSize="1050" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">techniques</run>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3">.</run>
</wd>
<run underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="-3"><nl orig="true"/>
</run>
</ln>
</para>
<para l="1042" t="11602" r="5357" b="12043" alignment="justified" ri="360" spaceAfter="8" fli="216" lsp="exactly" lspExact="246" language="en">
<ln l="1248" t="11602" r="5357" b="11789" baseLine="11741" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1248" t="11606" r="1910" b="11789">Morgan</wd>
<space/>
<wd l="1982" t="11602" r="2933" b="11784">Kaufmann,</wd>
<space/>
<wd l="3024" t="11602" r="3331" b="11750">San</wd>
<space/>
<wd l="3403" t="11606" r="4253" b="11784">Francisco,</wd>
<space/>
<wd l="4344" t="11606" r="4646" b="11750">2nd</wd>
<space/>
<wd l="4723" t="11606" r="5357" b="11750">edition.</wd>
<space/>
</ln>
<ln l="1042" t="11837" r="5222" b="12043" baseLine="11990" underlined="none" subsuperscript="none" fontSize="1000" fontFace="Times New Roman" fontFamily="roman" fontPitch="variable" spacing="0">
<wd l="1042" t="11851" r="1872" b="11995">WordNet.</wd>
<space/>
<wd l="1987" t="11851" r="2414" b="11995">2007.</wd>
<space/>
<wd l="2525" t="11837" r="5222" b="12043">http://wordnet.princeton.edu/.</wd>
</ln>
</para>
</column>
</section>
</body>
</page>
</document>
