%!PS-Adobe-2.0 %%Creator: dvips(k) 5.86e Copyright 2001 Radical Eye Software %%Title: paper.dvi %%Pages: 8 %%PageOrder: Ascend %%BoundingBox: 0 0 596 842 %%DocumentFonts: Times-Bold Times-Roman Courier Times-Italic %%EndComments %DVIPSWebPage: (www.radicaleye.com) %DVIPSCommandLine: dvips paper.dvi %DVIPSParameters: dpi=600, compressed %DVIPSSource: TeX output 2003.05.19:1656 %%BeginProcSet: texc.pro %! /TeXDict 300 dict def TeXDict begin/N{def}def/B{bind def}N/S{exch}N/X{S N}B/A{dup}B/TR{translate}N/isls false N/vsize 11 72 mul N/hsize 8.5 72 mul N/landplus90{false}def/@rigin{isls{[0 landplus90{1 -1}{-1 1}ifelse 0 0 0]concat}if 72 Resolution div 72 VResolution div neg scale isls{ landplus90{VResolution 72 div vsize mul 0 exch}{Resolution -72 div hsize mul 0}ifelse TR}if Resolution VResolution vsize -72 div 1 add mul TR[ matrix currentmatrix{A A round sub abs 0.00001 lt{round}if}forall round exch round exch]setmatrix}N/@landscape{/isls true N}B/@manualfeed{ statusdict/manualfeed true put}B/@copies{/#copies X}B/FMat[1 0 0 -1 0 0] N/FBB[0 0 0 0]N/nn 0 N/IEn 0 N/ctr 0 N/df-tail{/nn 8 dict N nn begin /FontType 3 N/FontMatrix fntrx N/FontBBox FBB N string/base X array /BitMaps X/BuildChar{CharBuilder}N/Encoding IEn N end A{/foo setfont}2 array copy cvx N load 0 nn put/ctr 0 N[}B/sf 0 N/df{/sf 1 N/fntrx FMat N df-tail}B/dfs{div/sf X/fntrx[sf 0 0 sf neg 0 0]N df-tail}B/E{pop nn A definefont setfont}B/Cw{Cd A length 5 sub get}B/Ch{Cd A length 4 sub get }B/Cx{128 Cd A length 3 sub get sub}B/Cy{Cd A length 2 sub get 127 sub} B/Cdx{Cd A length 1 sub get}B/Ci{Cd A type/stringtype ne{ctr get/ctr ctr 1 add N}if}B/id 0 N/rw 0 N/rc 0 N/gp 0 N/cp 0 N/G 0 N/CharBuilder{save 3 1 roll S A/base get 2 index get S/BitMaps get S get/Cd X pop/ctr 0 N Cdx 0 Cx Cy Ch sub Cx Cw add Cy setcachedevice Cw Ch true[1 0 0 -1 -.1 Cx sub Cy .1 sub]/id Ci N/rw Cw 7 add 8 idiv string N/rc 0 N/gp 0 N/cp 0 N{ rc 0 ne{rc 1 sub/rc X rw}{G}ifelse}imagemask restore}B/G{{id gp get/gp gp 1 add N A 18 mod S 18 idiv pl S get exec}loop}B/adv{cp add/cp X}B /chg{rw cp id gp 4 index getinterval putinterval A gp add/gp X adv}B/nd{ /cp 0 N rw exit}B/lsh{rw cp 2 copy get A 0 eq{pop 1}{A 255 eq{pop 254}{ A A add 255 and S 1 and or}ifelse}ifelse put 1 adv}B/rsh{rw cp 2 copy get A 0 eq{pop 128}{A 255 eq{pop 127}{A 2 idiv S 128 and or}ifelse} ifelse put 1 adv}B/clr{rw cp 2 index string putinterval adv}B/set{rw cp fillstr 0 4 index getinterval putinterval adv}B/fillstr 18 string 0 1 17 {2 copy 255 put pop}for N/pl[{adv 1 chg}{adv 1 chg nd}{1 add chg}{1 add chg nd}{adv lsh}{adv lsh nd}{adv rsh}{adv rsh nd}{1 add adv}{/rc X nd}{ 1 add set}{1 add clr}{adv 2 chg}{adv 2 chg nd}{pop nd}]A{bind pop} forall N/D{/cc X A type/stringtype ne{]}if nn/base get cc ctr put nn /BitMaps get S ctr S sf 1 ne{A A length 1 sub A 2 index S get sf div put }if put/ctr ctr 1 add N}B/I{cc 1 add D}B/bop{userdict/bop-hook known{ bop-hook}if/SI save N @rigin 0 0 moveto/V matrix currentmatrix A 1 get A mul exch 0 get A mul add .99 lt{/QV}{/RV}ifelse load def pop pop}N/eop{ SI restore userdict/eop-hook known{eop-hook}if showpage}N/@start{ userdict/start-hook known{start-hook}if pop/VResolution X/Resolution X 1000 div/DVImag X/IEn 256 array N 2 string 0 1 255{IEn S A 360 add 36 4 index cvrs cvn put}for pop 65781.76 div/vsize X 65781.76 div/hsize X}N /p{show}N/RMat[1 0 0 -1 0 0]N/BDot 260 string N/Rx 0 N/Ry 0 N/V{}B/RV/v{ /Ry X/Rx X V}B statusdict begin/product where{pop false[(Display)(NeXT) (LaserWriter 16/600)]{A length product length le{A length product exch 0 exch getinterval eq{pop true exit}if}{pop}ifelse}forall}{false}ifelse end{{gsave TR -.1 .1 TR 1 1 scale Rx Ry false RMat{BDot}imagemask grestore}}{{gsave TR -.1 .1 TR Rx Ry scale 1 1 false RMat{BDot} imagemask grestore}}ifelse B/QV{gsave newpath transform round exch round exch itransform moveto Rx 0 rlineto 0 Ry neg rlineto Rx neg 0 rlineto fill grestore}B/a{moveto}B/delta 0 N/tail{A/delta X 0 rmoveto}B/M{S p delta add tail}B/b{S p tail}B/c{-4 M}B/d{-3 M}B/e{-2 M}B/f{-1 M}B/g{0 M} B/h{1 M}B/i{2 M}B/j{3 M}B/k{4 M}B/w{0 rmoveto}B/l{p -4 w}B/m{p -3 w}B/n{ p -2 w}B/o{p -1 w}B/q{p 1 w}B/r{p 2 w}B/s{p 3 w}B/t{p 4 w}B/x{0 S rmoveto}B/y{3 2 roll p a}B/bos{/SS save N}B/eos{SS restore}B end %%EndProcSet %%BeginProcSet: 8r.enc % @@psencodingfile@{ % author = "S. Rahtz, P. MacKay, Alan Jeffrey, B. Horn, K. Berry", % version = "0.6", % date = "1 July 1998", % filename = "8r.enc", % email = "tex-fonts@@tug.org", % docstring = "Encoding for TrueType or Type 1 fonts % to be used with TeX." % @} % % Idea is to have all the characters normally included in Type 1 fonts % available for typesetting. This is effectively the characters in Adobe % Standard Encoding + ISO Latin 1 + extra characters from Lucida. % % Character code assignments were made as follows: % % (1) the Windows ANSI characters are almost all in their Windows ANSI % positions, because some Windows users cannot easily reencode the % fonts, and it makes no difference on other systems. The only Windows % ANSI characters not available are those that make no sense for % typesetting -- rubout (127 decimal), nobreakspace (160), softhyphen % (173). quotesingle and grave are moved just because it's such an % irritation not having them in TeX positions. % % (2) Remaining characters are assigned arbitrarily to the lower part % of the range, avoiding 0, 10 and 13 in case we meet dumb software. % % (3) Y&Y Lucida Bright includes some extra text characters; in the % hopes that other PostScript fonts, perhaps created for public % consumption, will include them, they are included starting at 0x12. % % (4) Remaining positions left undefined are for use in (hopefully) % upward-compatible revisions, if someday more characters are generally % available. % % (5) hyphen appears twice for compatibility with both % ASCII and Windows. % /TeXBase1Encoding [ % 0x00 (encoded characters from Adobe Standard not in Windows 3.1) /.notdef /dotaccent /fi /fl /fraction /hungarumlaut /Lslash /lslash /ogonek /ring /.notdef /breve /minus /.notdef % These are the only two remaining unencoded characters, so may as % well include them. /Zcaron /zcaron % 0x10 /caron /dotlessi % (unusual TeX characters available in, e.g., Lucida Bright) /dotlessj /ff /ffi /ffl /.notdef /.notdef /.notdef /.notdef /.notdef /.notdef /.notdef /.notdef % very contentious; it's so painful not having quoteleft and quoteright % at 96 and 145 that we move the things normally found there to here. /grave /quotesingle % 0x20 (ASCII begins) /space /exclam /quotedbl /numbersign /dollar /percent /ampersand /quoteright /parenleft /parenright /asterisk /plus /comma /hyphen /period /slash % 0x30 /zero /one /two /three /four /five /six /seven /eight /nine /colon /semicolon /less /equal /greater /question % 0x40 /at /A /B /C /D /E /F /G /H /I /J /K /L /M /N /O % 0x50 /P /Q /R /S /T /U /V /W /X /Y /Z /bracketleft /backslash /bracketright /asciicircum /underscore % 0x60 /quoteleft /a /b /c /d /e /f /g /h /i /j /k /l /m /n /o % 0x70 /p /q /r /s /t /u /v /w /x /y /z /braceleft /bar /braceright /asciitilde /.notdef % rubout; ASCII ends % 0x80 /.notdef /.notdef /quotesinglbase /florin /quotedblbase /ellipsis /dagger /daggerdbl /circumflex /perthousand /Scaron /guilsinglleft /OE /.notdef /.notdef /.notdef % 0x90 /.notdef /.notdef /.notdef /quotedblleft /quotedblright /bullet /endash /emdash /tilde /trademark /scaron /guilsinglright /oe /.notdef /.notdef /Ydieresis % 0xA0 /.notdef % nobreakspace /exclamdown /cent /sterling /currency /yen /brokenbar /section /dieresis /copyright /ordfeminine /guillemotleft /logicalnot /hyphen % Y&Y (also at 45); Windows' softhyphen /registered /macron % 0xD0 /degree /plusminus /twosuperior /threesuperior /acute /mu /paragraph /periodcentered /cedilla /onesuperior /ordmasculine /guillemotright /onequarter /onehalf /threequarters /questiondown % 0xC0 /Agrave /Aacute /Acircumflex /Atilde /Adieresis /Aring /AE /Ccedilla /Egrave /Eacute /Ecircumflex /Edieresis /Igrave /Iacute /Icircumflex /Idieresis % 0xD0 /Eth /Ntilde /Ograve /Oacute /Ocircumflex /Otilde /Odieresis /multiply /Oslash /Ugrave /Uacute /Ucircumflex /Udieresis /Yacute /Thorn /germandbls % 0xE0 /agrave /aacute /acircumflex /atilde /adieresis /aring /ae /ccedilla /egrave /eacute /ecircumflex /edieresis /igrave /iacute /icircumflex /idieresis % 0xF0 /eth /ntilde /ograve /oacute /ocircumflex /otilde /odieresis /divide /oslash /ugrave /uacute /ucircumflex /udieresis /yacute /thorn /ydieresis ] def %%EndProcSet %%BeginProcSet: texps.pro %! TeXDict begin/rf{findfont dup length 1 add dict begin{1 index/FID ne 2 index/UniqueID ne and{def}{pop pop}ifelse}forall[1 index 0 6 -1 roll exec 0 exch 5 -1 roll VResolution Resolution div mul neg 0 0]/Metrics exch def dict begin Encoding{exch dup type/integertype ne{pop pop 1 sub dup 0 le{pop}{[}ifelse}{FontMatrix 0 get div Metrics 0 get div def} ifelse}forall Metrics/Metrics currentdict end def[2 index currentdict end definefont 3 -1 roll makefont/setfont cvx]cvx def}def/ObliqueSlant{ dup sin S cos div neg}B/SlantFont{4 index mul add}def/ExtendFont{3 -1 roll mul exch}def/ReEncodeFont{CharStrings rcheck{/Encoding false def dup[exch{dup CharStrings exch known not{pop/.notdef/Encoding true def} if}forall Encoding{]exch pop}{cleartomark}ifelse}if/Encoding exch def} def end %%EndProcSet TeXDict begin 39158280 55380996 1000 600 600 (paper.dvi) @start /Fa 172[40 5[65 3[24 6[49 53 65[{TeXBase1Encoding ReEncodeFont}5 72.7272 /Times-Roman rf /Fb 203[25 25 25 25 49[{ TeXBase1Encoding ReEncodeFont}4 49.8132 /Times-Roman rf /Fc 203[33 33 33 33 49[{TeXBase1Encoding ReEncodeFont}4 66.4176 /Times-Roman rf %DVIPSBitmapFont: Fd cmr9 9 1 /Fd 1 7 df6 D E %EndDVIPSBitmapFont /Fe 134[37 37 54 37 42 25 29 33 1[42 37 42 62 21 42 1[21 1[37 25 33 42 33 42 37 12[50 42 2[46 1[54 4[29 2[46 2[54 9[37 37 37 37 37 37 37 37 37 37 2[25 19 7[37 33[42 2[{ TeXBase1Encoding ReEncodeFont}43 74.7198 /Times-Bold rf /Ff 135[45 66 1[51 30 35 40 1[51 45 51 76 25 51 1[25 1[45 1[40 51 40 1[45 13[51 66 10[71 1[61 66 66 1[66 11[45 1[45 45 45 2[23 46[{TeXBase1Encoding ReEncodeFont}30 90.9091 /Times-Bold rf /Fg 136[50 33 37 21 29 29 37 37 37 37 54 21 33 21 21 37 37 21 33 37 33 37 37 9[62 46 54 42 37 46 1[46 54 50 62 42 1[33 25 1[54 1[46 54 50 1[46 6[25 2[37 37 37 37 37 37 1[37 1[19 25 19 2[25 25 37[37 2[{TeXBase1Encoding ReEncodeFont}55 74.7198 /Times-Italic rf %DVIPSBitmapFont: Fh cmmi6 6 3 /Fh 3 108 df<1338137CA2137813701300A7EA0780EA1FC0EA38E01230EA60F0EAC1E0 A3EA03C0A3EA0780A2EA0F0013041306EA1E0CA21318121CEA1E70EA0FE0EA07800F237D A116>105 D<1418143C147CA214381400A7EB0780EB1FE01338EB60F013C0A2EA0180A2 380001E0A4EB03C0A4EB0780A4EB0F00A4131EA21238EA783CEAF8381378EA70F0EA7FC0 001FC7FC162D81A119>I<13F8EA0FF0A21200A2485AA4485AA43807801E147FEB81C3EB 8387380F060F495A1318EB700E4848C7FCA213FCEA1E7EEA3C0F80EB0781158039780F03 00A21402EB070600F0138CEB03F8386000F019247CA221>I E %EndDVIPSBitmapFont /Fi 87[25 17[37 27[33 37 37 54 37 37 21 29 25 37 37 37 37 58 21 37 21 21 37 37 25 33 37 33 37 33 3[25 1[25 1[54 1[71 54 1[46 42 50 1[42 54 54 66 46 54 29 25 54 54 42 46 54 50 50 54 6[21 37 37 37 37 37 37 37 37 37 37 21 19 25 19 2[25 25 25 58 34[42 42 2[{TeXBase1Encoding ReEncodeFont}73 74.7198 /Times-Roman rf %DVIPSBitmapFont: Fj cmmi8 8 4 /Fj 4 120 df<1307EB0F80EB1FC0A2EB0F80EB070090C7FCA9EA01E0EA07F8EA0E3CEA 1C3E123812301270EA607EEAE07C12C013FC485A120012015B12035BA21207EBC04014C0 120F13801381381F01801303EB0700EA0F06131EEA07F8EA01F0122E7EAC18>105 D<15E0EC01F01403A3EC01C091C7FCA9147CEB03FE9038078F80EB0E07131C013813C013 30EB700F0160138013E013C0EB801F13001500A25CA2143EA2147EA2147CA214FCA25CA2 1301A25CA21303A25CA2130700385BEAFC0F5C49C7FCEAF83EEAF0F8EA7FF0EA1F801C3B 81AC1D>I<131FEA03FFA2EA003FA2133EA2137EA2137CA213FCA25BA2120115F89038F0 03FCEC0F0E0003EB1C1EEC387EEBE07014E03807E1C09038E3803849C7FC13CEEA0FDC13 F8A2EBFF80381F9FE0EB83F0EB01F81300481404150C123EA2007E141C1518007CEBF038 ECF83000FC1470EC78E048EB3FC00070EB0F801F2F7DAD25>I119 D E %EndDVIPSBitmapFont /Fk 107[51 51 25[40 1[61 40 45 25 35 35 1[45 45 45 66 25 40 1[25 45 45 25 40 45 40 45 45 7[51 2[56 66 51 45 56 1[56 1[61 4[30 4[66 61 1[56 18[23 30 5[30 35[45 45 2[{TeXBase1Encoding ReEncodeFont}41 90.9091 /Times-Italic rf /Fl 87[30 17[45 1[40 40 24[40 45 45 66 45 45 25 35 30 45 45 45 45 71 25 45 25 25 45 45 30 40 45 40 45 40 9[86 66 1[56 51 61 1[51 66 66 81 56 66 35 30 66 66 51 56 66 61 61 66 3[51 1[25 25 45 45 45 45 45 45 45 45 45 45 25 23 30 23 51 45 30 30 30 71 76 33[51 51 2[{ TeXBase1Encoding ReEncodeFont}77 90.9091 /Times-Roman rf /Fm 131[45 2[45 45 45 45 45 45 45 45 1[45 45 45 45 45 2[45 45 1[45 45 45 45 45 45 16[45 1[45 13[45 1[45 45 45 2[45 45 45 45 45 45 45 45 45 45 1[45 45 45 1[45 42[{TeXBase1Encoding ReEncodeFont}42 74.7198 /Courier rf %DVIPSBitmapFont: Fn cmsy9 9 2 /Fn 2 104 df102 D<12FCEAFFC0EA07F0EA01FC6C7E137F7F80131FB3A580 130F6D7E6D7EEB01FC9038007FC0EC1FE0EC7FC0903801FC00EB03F0495A495A131F5CB3 A5133F91C7FC5B13FE485AEA07F0EAFFC000FCC8FC1B4B7BB726>I E %EndDVIPSBitmapFont /Fo 32[50 101[50 1[72 1[50 28 39 33 1[50 50 50 78 28 2[28 50 50 33 44 50 44 50 44 9[94 72 2[55 5[89 61 3[72 72 1[61 2[66 8[50 50 1[50 2[50 1[50 3[33 25 44[{ TeXBase1Encoding ReEncodeFont}37 99.6264 /Times-Roman rf /Fp 87[33 47[50 1[50 55 33 39 44 1[55 50 55 83 28 55 1[28 55 1[33 44 55 44 55 50 9[100 3[55 72 1[61 1[72 94 3[39 2[61 66 72 72 1[72 9[50 50 50 50 50 50 50 2[25 33 45[{TeXBase1Encoding ReEncodeFont}42 99.6264 /Times-Bold rf /Fq 138[66 40 47 53 1[66 60 66 1[33 66 1[33 66 60 1[53 1[53 1[60 13[66 86 1[73 2[113 80 7[86 2[86 65[{ TeXBase1Encoding ReEncodeFont}22 119.552 /Times-Bold rf end %%EndProlog %%BeginSetup %%Feature: *Resolution 600dpi TeXDict begin %%PaperSize: A4 %%EndSetup %%Page: 1 1 1 0 bop 54 157 a Fq(A)30 b(Machine)h(Lear)n(ning)g(A)m(ppr)n(oach)g(to) e(Pr)n(onoun)i(Resolution)g(in)f(Spok)o(en)i(Dialogue)1125 507 y Fp(Michael)25 b(Strube)52 b Fo(and)e Fp(Christoph)25 b(M)2586 506 y(\250)2575 507 y(uller)1238 623 y Fo(European)f(Media)h (Laboratory)f(GmbH)1716 739 y(V)-6 b(illa)25 b(Bosch)1370 855 y(Schlo\337-W)-8 b(olfsbrunnenwe)o(g)23 b(33)1383 972 y(69118)h(Heidelber)n(g,)h(German)o(y)768 1088 y Fn(f)p Fm(michael.strube|christoph.mueller)p Fn(g)p Fm(@eml.villa-bos)o (ch.de)760 1627 y Fp(Abstract)182 1859 y Fl(W)-7 b(e)31 b(apply)i(a)e(decision)j(tree)e(based)h(approach)182 1972 y(to)26 b(pronoun)i(resolution)h(in)d(spok)o(en)h(dialogue.)182 2085 y(Our)c(system)i(deals)f(with)g(pronouns)i(with)e(NP-)182 2198 y(and)e(non-NP-antecedents.)33 b(W)-7 b(e)21 b(present)j(a)d(set) 182 2311 y(of)36 b(features)j(designed)f(for)f(pronoun)i(resolu-)182 2424 y(tion)24 b(in)g(spok)o(en)i(dialogue)g(and)e(determine)i(the)182 2537 y(most)h(promising)h(features.)41 b(W)-7 b(e)26 b(e)n(v)n(aluate)i(the)182 2649 y(system)33 b(on)g(twenty)g (Switchboard)i(dialogues)182 2762 y(and)23 b(sho)n(w)g(that)h(it)e (compares)j(well)d(to)h(Byron')-5 b(s)182 2875 y(\(2002\))25 b(manually)g(tuned)g(system.)0 3181 y Fp(1)99 b(Intr)n(oduction)0 3364 y Fl(Corpus-based)37 b(methods)d(and)g(machine)h(learning)g(tech-) 0 3477 y(niques)d(ha)n(v)o(e)f(been)g(applied)h(to)e(anaphora)j (resolution)g(in)0 3590 y(written)f(te)o(xt)e(with)h(considerable)k (success)d(\(Soon)f(et)g(al.,)0 3703 y(2001;)39 b(Ng)e(&)f(Cardie,)i (2002,)k(among)d(others\).)72 b(It)38 b(has)0 3816 y(been)31 b(demonstrated)i(that)d(systems)h(based)g(on)f(these)h(ap-)0 3929 y(proaches)h(achie)n(v)o(e)e(a)g(performance)i(that)e(is)f (comparable)0 4042 y(to)35 b(hand-crafted)k(systems.)64 b(Since)35 b(the)o(y)g(can)h(easily)g(be)0 4154 y(applied)43 b(to)e(ne)n(w)f(domains)j(it)d(seems)i(also)f(feasible)i(to)0 4267 y(port)32 b(a)e(gi)n(v)o(en)i(corpus-based)j(anaphora)f (resolution)g(sys-)0 4380 y(tem)29 b(from)g(written)h(te)o(xt)f(to)g (spok)o(en)i(dialogue.)48 b(This)29 b(pa-)0 4493 y(per)24 b(describes)j(the)d(e)o(xtensions)j(and)d(adaptations)k(needed)0 4606 y(for)21 b(applying)h(our)f(anaphora)i(resolution)g(system)e(\(M)8 b(\250)-38 b(uller)0 4719 y(et)29 b(al.,)f(2002;)i(Strube)g(et)f(al.,)f (2002\))i(to)f(pronoun)j(resolu-)0 4832 y(tion)24 b(in)g(spok)o(en)h (dialogue.)91 4948 y(There)33 b(are)g(important)i(dif)n(ferences)g (between)f(written)0 5061 y(te)o(xt)18 b(and)h(spok)o(en)h(dialogue)g (which)f(ha)n(v)o(e)f(to)g(be)g(accounted)0 5174 y(for)-5 b(.)84 b(The)42 b(most)f(ob)o(vious)j(dif)n(ference)g(is)e(that)h(in)e (spo-)0 5287 y(k)o(en)25 b(dialogue)h(there)f(is)f(an)g(ab)n(undance)j (of)d(\(personal)j(and)0 5400 y(demonstrati)n(v)o(e\))41 b(pronouns)f(with)e(non-NP-antecedents)2010 1627 y(or)25 b(no)g(antecedents)j(at)d(all.)33 b(Corpus)26 b(studies)g(ha)n(v)o(e)g (sho)n(wn)2010 1740 y(that)j(a)f(signi\002cant)i(amount)f(of)f (pronouns)j(in)d(spok)o(en)i(di-)2010 1853 y(alogue)41 b(ha)n(v)o(e)g(non-NP-antecedents:)66 b(Byron)40 b(&)f(Allen)2010 1965 y(\(1998\))27 b(report)f(that)g(about)g(50\045)f(of)g(the)g (pronouns)j(in)d(the)2010 2078 y(TRAINS93)i(corpus)k(ha)n(v)o(e)e (non-NP-antecedents.)49 b(Eck-)2010 2191 y(ert)39 b(&)f(Strube)i (\(2000\))h(note)e(that)h(only)g(about)g(45\045)f(of)2010 2304 y(the)23 b(pronouns)j(in)c(a)h(set)g(of)f(Switchboard)j(dialogues) h(ha)n(v)o(e)2010 2417 y(NP-antecedents.)90 b(The)43 b(remainder)i(consists)g(of)e(22\045)2010 2530 y(which)38 b(ha)n(v)o(e)h(non-NP-antecedents)k(and)38 b(33\045)g(without)2010 2643 y(antecedents.)55 b(These)31 b(studies)i(suggest)g(that)f(the)f (perfor)n(-)2010 2756 y(mance)24 b(of)f(a)f(pronoun)j(resolution)h (algorithm)f(can)f(be)f(im-)2010 2869 y(pro)o(v)o(ed)36 b(considerably)k(by)35 b(enabling)j(it)d(to)h(resolv)o(e)h(also)2010 2982 y(pronouns)26 b(with)d(non-NP-antecedents.)2101 3097 y(Because)38 b(of)e(the)i(dif)n(\002culties)g(a)e(pronoun)j (resolution)2010 3209 y(algorithm)d(encounters)h(in)d(spok)o(en)i (dialogue,)i(pre)n(vious)2010 3322 y(approaches)29 b(were)d(applied)i (only)f(to)f(tin)o(y)h(domains,)h(the)o(y)2010 3435 y(needed)39 b(deep)f(semantic)h(analysis)g(and)f(discourse)i(pro-)2010 3548 y(cessing)22 b(and)f(relied)h(on)e(hand-crafted)k(kno)n(wledge)e (bases.)2010 3661 y(In)31 b(contrast,)k(we)30 b(b)n(uild)j(on)e(our)g (e)o(xisting)i(anaphora)h(res-)2010 3774 y(olution)f(system)e(and)h (incrementally)i(add)d(ne)n(w)f(features)2010 3887 y(speci\002cally)h (de)n(vised)g(for)e(spok)o(en)i(dialogue.)47 b(That)28 b(w)o(ay)2010 4000 y(we)44 b(are)i(able)g(to)f(determine)i(relati)n(v)o (ely)g(po)n(werful)f(yet)2010 4113 y(computationally)34 b(cheap)e(features.)50 b(T)-7 b(o)29 b(our)h(kno)n(wledge)2010 4226 y(the)38 b(w)o(ork)g(presented)j(here)d(describes)j(the)d(\002rst) g(imple-)2010 4339 y(mented)19 b(system)g(for)g(corpus-based)j (anaphora)e(resolution)2010 4451 y(dealing)25 b(also)g(with)e (non-NP-antecedents.)2010 4656 y Fp(2)99 b(NP-)25 b(vs.)g (Non-NP-Antecedents)2010 4835 y Fl(Spok)o(en)i(dialogue)g(contains)h (more)e(pronouns)i(with)d(non-)2010 4948 y(NP-antecedents)43 b(than)e(written)f(te)o(xt)h(does.)79 b(Ho)n(we)n(v)o(er)l(,)2010 5061 y(pronouns)34 b(with)d(NP-antecedents)i(\(lik)o(e)f(3rd)g(pers.)f (mas-)2010 5174 y(culine/feminine)e(pronouns,)g(cf.)c Fk(he)h Fl(in)f(the)h(e)o(xample)h(be-)2010 5287 y(lo)n(w\))h(still)g (constitute)j(the)d(lar)n(gest)i(fraction)g(of)e(all)g(coref-)2010 5400 y(erential)d(pronouns)h(in)e(the)g(Switchboard)h(corpus.)p eop %%Page: 2 2 2 1 bop 91 91 a Fl(In)36 b(spok)o(en)h(dialogue)h(there)f(are)f (considerable)j(num-)0 204 y(bers)46 b(of)f(pronouns)j(that)f(pick)f (up)f(dif)n(ferent)j(kinds)e(of)0 317 y(abstract)e(objects)g(from)f (the)f(pre)n(vious)i(discourse,)50 b(e.g.)0 430 y(e)n(v)o(ents,)27 b(states,)g(concepts,)i(propositions)g(or)d(f)o(acts)h(\(W)-7 b(eb-)0 543 y(ber)l(,)29 b(1991;)g(Asher)l(,)g(1993\).)44 b(These)28 b(anaphors)j(then)e(ha)n(v)o(e)0 656 y(VP-antecedents)35 b(\()p Fk(\223it)733 670 y Fj(j)770 656 y Fk(\224)c Fl(in)h(\(B6\))h (belo)n(w\))f(or)h(sentential)0 769 y(antecedents)27 b(\()p Fk(\223that)668 784 y Fj(k)712 769 y Fk(\224)22 b Fl(in)h(\(B5\)\).)28 928 y Fi(A1:)42 b(.)11 b(.)g(.)g([he])392 936 y Fh(i)418 928 y Fi(')l(s)19 b(nine)g(months)h(old.)j(.)11 b(.)g(.)28 1083 y(A2:)42 b([He])319 1091 y Fh(i)364 1083 y Fi(lik)o(es)19 b(to)g(dig)g(around)h(a)f(little)f(bit.)28 1239 y(A3:)42 b([His])336 1247 y Fh(i)383 1239 y Fi(mother)21 b(comes)h(in)f(and)h(says,)g(why)f(did)g(you)h(let)f([him])1864 1247 y Fh(i)182 1322 y Fi([play)e(in)g(the)g(dirt])670 1330 y Fh(j)702 1322 y Fi(,)28 1477 y(A:4)42 b(I)18 b(guess)i([[he])555 1485 y Fh(i)582 1477 y Fi(')l(s)e(enjo)o(ying)j(himself])1179 1486 y Fh(k)1217 1477 y Fi(.)32 1632 y(B5:)42 b([That])369 1641 y Fh(k)407 1632 y Fi(')l(s)18 b(right.)32 1787 y(B6:)42 b([It])278 1795 y Fh(j)310 1787 y Fi(')l(s)18 b(healthy)-5 b(,)19 b(.)11 b(.)g(.)91 1976 y Fl(A)31 b(major)h(problem)h(for)f (pronoun)j(resolution)g(in)c(spo-)0 2089 y(k)o(en)39 b(dialogue)i(is)d(the)h(lar)n(ge)h(number)g(of)e(personal)j(and)0 2202 y(demonstrati)n(v)o(e)34 b(pronouns)g(which)e(are)g(either)g(not)g (refer)n(-)0 2315 y(ential)27 b(at)f(all)h(\(e.g.)f(e)o(xpleti)n(v)o(e) h(pronouns\))i(or)e(for)f(which)h(a)0 2428 y(particular)22 b(antecedent)h(cannot)e(easily)g(be)e(determined)j(by)0 2541 y(humans)28 b(\(called)g Fk(va)o(gue)g Fl(anaphors)g(by)f(Eck)o (ert)g(&)f(Strube)0 2654 y(\(2000\)\).)91 2767 y(In)41 b(the)g(follo)n(wing)h(e)o(xample,)j(the)d Fk(\223that)1465 2781 y Fj(i)1494 2767 y Fk(\224)d Fl(in)i(utter)n(-)0 2880 y(ance)h(\(A3\))g(refers)g(back)h(to)e(utterance)j(\(A1\).)83 b(As)41 b(for)0 2993 y(the)31 b(\002rst)g(tw)o(o)g(pronouns)j(in)d (\(B4\),)i(follo)n(wing)g(Eck)o(ert)e(&)0 3106 y(Strube)26 b(\(2000\))h(and)f(Byron)h(\(2002\))g(we)d(assume)j(that)f(re-)0 3218 y(ferring)e(e)o(xpressions)h(in)e(dis\003uencies,)i(abandoned)g (utter)n(-)0 3331 y(ances)40 b(etc.)g(are)f(e)o(xcluded)i(from)e(the)h (resolution.)79 b(The)0 3444 y(third)29 b(pronoun)i(in)d(\(B4\))h(is)f (an)g(e)o(xpleti)n(v)o(e.)45 b(The)28 b(pronoun)0 3557 y(in)f(\(A5\))f(is)g(dif)n(ferent)j(in)d(that)h(it)g(is)f(indeed)i (referential:)38 b(it)0 3670 y(refers)25 b(back)f(to)p Fk(\223that)685 3684 y Fj(i)715 3670 y Fk(\224)e Fl(from)i(\(A3\).)28 3829 y Fi(A1:)42 b(.)11 b(.)g(.)g([There)16 b(is)g(a)h(lot)f(of)g (theft,)h(a)f(lot)h(of)f(assault)h(dealing)g(with,)g(uh,)182 3912 y(people)j(trying)f(to)g(get)g(mone)o(y)h(for)e(drugs.)1294 3920 y Fh(i)1321 3912 y Fi(])32 4068 y(B2:)42 b(Y)-7 b(eah.)28 4223 y(A3:)42 b(And,)19 b(uh,)g(I)f(think)i([that)813 4231 y Fh(i)839 4223 y Fi(]')l(s)e(a)h(national)h(problem,)f(though.)32 4378 y(B4:)42 b Fg(It,)18 b(it,)g(it)q Fi(')l(s)g(pretty)h(bad)h(here,) f(too.)28 4533 y(A5:)42 b([It)253 4541 y Fh(i)279 4533 y Fi(]')l(s)18 b(not)h(unique)h(.)11 b(.)g(.)91 4723 y Fl(Pronoun)39 b(resolution)h(in)d(spok)o(en)i(dialogue)h(also)e(has)0 4835 y(to)47 b(deal)h(with)f(the)h(whole)g(range)g(of)f(dif)n (\002culties)j(that)0 4948 y(come)40 b(with)f(processing)j(spok)o(en)f (language:)64 b(dis\003uen-)0 5061 y(cies,)55 b(hesitations,)j (abandoned)52 b(utterances,)58 b(interrup-)0 5174 y(tions,)29 b(backchannels,)j(etc.)40 b(These)28 b(phenomena)h(ha)n(v)o(e)f(to)0 5287 y(be)g(tak)o(en)h(into)g(account)h(when)f(formulating)h (constraints)0 5400 y(on)f(e.g.)g(the)g(search)h(space)h(in)d(which)i (an)f(anaphor)i(looks)2010 91 y(for)c(its)g(antecedent.)41 b(E.g.,)26 b(utterance)k(\(B2\))c(in)h(the)g(pre)n(vi-)2010 204 y(ous)i(e)o(xample)g(does)g(not)g(contain)h(an)o(y)e(referring)j(e) o(xpres-)2010 317 y(sions.)41 b(So)26 b(the)i(demonstrati)n(v)o(e)i (pronoun)f(in)f(\(A3\))f(has)g(to)2010 430 y(ha)n(v)o(e)d(access)h(not) f(only)g(to)g(\(B2\))f(b)n(ut)h(also)g(to)g(\(A1\).)2010 645 y Fp(3)99 b(Data)2010 831 y Ff(3.1)92 b(Cor)o(pus)2010 987 y Fl(Our)51 b(w)o(ork)h(is)f(based)i(on)f(twenty)g(randomly)i (chosen)2010 1100 y(Switchboard)46 b(dialogues.)94 b(T)-7 b(ak)o(en)45 b(together)l(,)52 b(the)45 b(dia-)2010 1213 y(logues)39 b(contain)g(30810)g(tok)o(ens)h(\(w)o(ords)e(and)g (punctua-)2010 1325 y(tion\))24 b(in)e(3275)i(sentences)h(/)d(1771)i (turns.)29 b(The)22 b(annotation)2010 1438 y(consists)f(of)d(16601)j (markables,)g(i.e.)d(sequences)j(of)e(w)o(ords)2010 1551 y(and)g(attrib)n(utes)i(associated)g(with)d(them.)27 b(On)17 b(the)i(top)f(le)n(v)o(el,)2010 1664 y(dif)n(ferent)30 b(types)e(of)g(markables)h(are)f(distinguished:)42 b Fk(NP)p Fl(-)2010 1777 y(markables)c(identify)g(referring)g(e)o (xpressions)h(lik)o(e)d(noun)2010 1890 y(phrases,)57 b(pronouns)51 b(and)e(proper)h(names.)105 b(Some)48 b(of)2010 2003 y(the)32 b(attrib)n(utes)j(for)e(these)g(markables)h(are)e(deri)n (v)o(ed)h(from)2010 2116 y(the)d(Penn)g(T)m(reebank)h(v)o(ersion)g(of)f (the)g(Switchboard)i(dia-)2010 2229 y(logues,)i(e.g.)c(grammatical)j (function,)h(NP)c(form,)i(gram-)2010 2342 y(matical)41 b(case)g(and)f(depth)i(of)e(embedding)i(in)e(the)g(syn-)2010 2455 y(tactical)e(structure.)67 b Fk(VP)p Fl(-markables)37 b(are)f(v)o(erb)h(phrases,)2010 2567 y Fk(S)q Fl(-markables)45 b(sentences.)89 b Fk(Dis\003uency)p Fl(-markables)48 b(are)2010 2680 y(noun)e(phrases)h(or)e(pronouns)i(which)f(occur)g(in)f (un\002n-)2010 2793 y(ished)27 b(or)f(abandoned)j(utterances.)38 b(Among)26 b(other)h(\(type-)2010 2906 y(dependent\))34 b(attrib)n(utes,)h(markables)e(contain)g(a)d Fk(member)2010 3019 y Fl(attrib)n(ute)38 b(with)d(the)h(ID)f(of)g(the)h(coreference)i (class)f(the)o(y)2010 3132 y(are)32 b(part)g(of)g(\(if)f(an)o(y\).)53 b(If)32 b(an)f(e)o(xpression)k(is)c(used)i(to)e(re-)2010 3245 y(fer)h(to)h(an)f(entity)h(that)g(is)f(not)h(referred)h(to)e(by)h (an)o(y)f(other)2010 3358 y(e)o(xpression,)26 b(it)d(is)h(considered)i (a)d(singleton.)2101 3476 y(T)-7 b(able)37 b(1)g(gi)n(v)o(es)h(the)f (distrib)n(ution)k(of)c(the)h Fk(npform)g Fl(at-)2010 3589 y(trib)n(ute)26 b(for)e Fk(NP)p Fl(-markables.)32 b(The)24 b(second)h(and)g(third)g(ro)n(w)2010 3701 y(gi)n(v)o(e)20 b(the)h(number)g(of)f(non-singletons)25 b(and)c(singletons)i(re-)2010 3814 y(specti)n(v)o(ely)34 b(that)e(add)g(up)f(to)h(the)f(total)i (number)f(gi)n(v)o(en)g(in)2010 3927 y(the)24 b(\002rst)f(ro)n(w)-6 b(.)2101 4045 y(T)f(able)34 b(2)g(sho)n(ws)g(the)h(distrib)n(ution)j (of)c(the)h Fk(a)o(gr)m(eement)2010 4158 y Fl(attrib)n(ute)k(\(i.e.)e (person,)k(gender)l(,)h(and)c(number\))g(for)f(the)2010 4271 y(pronominal)30 b(e)o(xpressions)h(in)c(our)i(corpus.)42 b(The)28 b(left)g(\002g-)2010 4384 y(ure)37 b(in)g(each)h(cell)f(gi)n (v)o(es)g(the)g(total)h(number)g(of)f(e)o(xpres-)2010 4497 y(sions,)52 b(the)46 b(right)h(\002gure)f(gi)n(v)o(es)h(the)f (number)h(of)e(non-)2010 4610 y(singletons.)50 b(Note)30 b(the)f(relati)n(v)o(ely)j(high)f(number)f(of)g(sin-)2010 4723 y(gletons)g(among)g(the)f(personal)h(and)f(demonstrati)n(v)o(e)j (pro-)2010 4835 y(nouns)23 b(\(223)g(for)f Fk(it)p Fl(,)g(60)g(for)g Fk(the)m(y)h Fl(and)g(82)f(for)g Fk(that)r Fl(\).)29 b(These)2010 4948 y(pronouns)40 b(are)d(either)i(e)o(xpleti)n(v)o(e)g (or)e(v)n(ague,)k(and)d(cause)2010 5061 y(the)23 b(most)g(trouble)i (for)e(a)g(pronoun)i(resolution)h(algorithm,)2010 5174 y(which)45 b(will)f(usually)i(attempt)f(to)f(\002nd)g(an)g(antecedent) 2010 5287 y(nonetheless.)79 b(Singleton)40 b Fk(the)m(y)g Fl(pronouns,)45 b(in)39 b(particu-)2010 5400 y(lar)l(,)33 b(are)f(typical)h(for)e(spok)o(en)j(language)f(\(as)f(opposed)h(to)p eop %%Page: 3 3 3 2 bop 1579 83 4 84 v 1630 58 a Fe(defNP)99 b(indefNP)f(NNP)116 b(pr)o(p)h(pr)o(p$)99 b(dtpr)o(o)p 609 86 2663 4 v 659 144 a(T)-7 b(otal)p 1579 169 4 84 v 858 w Fi(1080)213 b(1899)143 b(217)100 b(1075)180 b(70)165 b(392)p 609 173 2663 4 v 809 231 a Fe(In)18 b(cor)o(efer)o(ence)h(r)o(elation)p 1579 256 4 84 v 186 w Fi(219)251 b(163)179 b(94)138 b(786)179 b(56)165 b(309)809 314 y Fe(Singletons)p 1579 339 V 579 w Fi(861)213 b(1736)143 b(123)138 b(289)179 b(14)202 b(83)487 492 y Fl(T)-7 b(able)24 b(1:)29 b(Distrib)n(ution)d(of)e Fk(npform)g Fl(Feature)g(on)g(Markables)h(\(w/o)f(1st)f(and)h(2nd)h (Persons\))p 1305 735 V 1431 710 a Fe(3m)p 1654 735 V 1654 735 V 269 w(3f)p 2003 735 V 2003 735 V 316 w(3n)p 2426 735 V 2426 735 V 344 w(3p)p 1030 739 1821 4 v 1080 797 a(pr)o(p)p 1305 822 4 84 v 161 w Fi(67)100 b(63)p 1654 822 V 100 w(49)h(47)p 2003 822 V 100 w Fe(541)g(318)p 2426 822 V 101 w(418)f(358)1080 880 y(pr)o(p$)p 1305 905 V 124 w Fi(18)g(15)p 1654 905 V 100 w(14)h(11)p 2003 905 V 175 w Fe(3)175 b(3)p 2426 905 V 137 w(35)138 b(27)1080 963 y(dtpr)o(o)p 1305 988 V 136 w Fi(0)f(0)p 1654 988 V 138 w(0)g(0)p 2003 988 V 100 w Fe(380)101 b(298)p 2426 988 V 138 w(12)138 b(11)p 1030 991 1821 4 v 1080 1049 a Fd(\006)p 1305 1074 4 84 v 222 w Fi(85)100 b(78)p 1654 1074 V 100 w(63)h(58)p 2003 1074 V 100 w Fe(924)g(619)p 2426 1074 V 101 w(465)f(396)649 1227 y Fl(T)-7 b(able)23 b(2:)29 b(Distrib)n(ution)e(of)c(Agreement)i(Feature)f(on)g(Pronominal) h(Expressions)0 1546 y(written)37 b(te)o(xt\).)69 b(The)36 b(same)h(is)f(true)h(for)g(anaphors)i(with)0 1659 y (non-NP-antecedents.)73 b(Ho)n(we)n(v)o(er)l(,)40 b(while)d(the)o(y)g (are)g(f)o(ar)0 1772 y(more)h(frequent)i(in)e(spok)o(en)i(language)g (than)f(in)e(written)0 1885 y(te)o(xt,)25 b(the)o(y)h(still)g (constitute)h(only)f(a)f(fraction)i(of)e(all)g(coref-)0 1997 y(erential)33 b(e)o(xpressions)h(in)d(our)g(corpus.)53 b(This)31 b(de\002nes)h(an)0 2110 y(upper)26 b(limit)f(for)h(what)f (the)g(resolution)j(of)d(these)h(kinds)g(of)0 2223 y(anaphors)c(can)e (contrib)n(ute)i(at)e(all.)27 b(These)20 b(f)o(acts)h(ha)n(v)o(e)f(to)f (be)0 2336 y(k)o(ept)30 b(in)e(mind)h(when)g(comparing)i(our)e(results) i(to)e(results)0 2449 y(of)23 b(coreference)k(resolution)f(in)e (written)g(te)o(xt.)0 2645 y Ff(3.2)92 b(Data)23 b(Generation)0 2797 y Fl(T)m(raining)e(and)f(test)g(data)g(instances)i(were)d (generated)j(from)0 2910 y(our)36 b(corpus)g(as)f(follo)n(ws.)64 b(All)35 b(markables)i(were)e(sorted)0 3023 y(in)28 b(document)i(order) l(,)g(and)f(markables)h(for)e(\002rst)g(and)h(sec-)0 3135 y(ond)i(person)h(pronouns)i(were)c(remo)o(v)o(ed.)51 b(The)30 b(resulting)0 3248 y(list)j(w)o(as)f(then)h(processed)i(from)d (top)h(to)g(bottom.)56 b(If)32 b(the)0 3361 y(list)j(contained)j(an)d Fk(NP)p Fl(-markable)h(at)e(the)i(current)g(posi-)0 3474 y(tion)26 b(and)h(if)e(this)h(markable)i(w)o(as)d(not)h(an)g (inde\002nite)h(noun)0 3587 y(phrase,)43 b(it)38 b(w)o(as)g(considered) j(a)d(potential)i(anaphor)-5 b(.)75 b(In)0 3700 y(that)19 b(case,)h(pairs)f(of)f(potentially)k(coreferring)f(e)o(xpressions)0 3813 y(were)27 b(generated)j(by)d(combining)i(the)f(potential)h (anaphor)0 3926 y(with)39 b(each)g Fk(compatible)805 3893 y Fc(1)883 3926 y Fk(NP)p Fl(-markable)h(preceding)1761 3893 y Fc(2)1839 3926 y Fl(it)0 4039 y(in)d(the)h(list.)71 b(The)37 b(resulting)i(pairs)g(were)e(labelled)i Fk(P)d Fl(if)0 4152 y(both)31 b(markables)h(had)f(the)f(same)g(\(non-empty\))j (v)n(alue)e(in)0 4265 y(their)i Fk(member)g Fl(attrib)n(ute,)j Fk(N)g Fl(otherwise.)55 b(F)o(or)31 b(anaphors)0 4377 y(with)44 b(non-NP-antecedents,)54 b Fk(additional)48 b Fl(training)f(and)0 4490 y(test)23 b(data)g(instances)j(had)d(to)f (be)h(generated.)31 b(This)22 b(process)0 4603 y(w)o(as)e(triggered)i (by)e(the)h(markable)g(at)f(the)g(current)i(position)0 4716 y(being)32 b Fk(it)h Fl(or)e Fk(that)p Fl(.)53 b(In)31 b(that)h(case,)i(a)d(small)g(set)h(of)f(poten-)0 4829 y(tial)c(non-NP-antecedents)k(w)o(as)26 b(generated)j(by)e(selecting)0 4942 y Fk(S)q Fl(-)36 b(and)h Fk(VP)p Fl(-markables)h(from)f(the)g (last)g(tw)o(o)f(v)n(alid)i(sen-)0 5055 y(tences)30 b(preceding)i(the)d (potential)j(anaphor)-5 b(.)47 b(The)29 b(choice)p 0 5139 499 4 v 105 5195 a Fb(1)134 5226 y Fi(Markables)g(are)e (considered)i(compatible)f(if)f(the)o(y)h(do)g(not)f(mis-)0 5309 y(match)19 b(in)g(terms)g(of)g(agreement.)105 5368 y Fb(2)134 5400 y Fi(W)-6 b(e)19 b(disre)o(gard)g(the)g(phenomenon)j (of)d Fg(cataphor)j Fi(here.)2010 1546 y Fl(of)39 b(the)h(last)g Fk(two)e Fl(sentences)k(w)o(as)d(moti)n(v)n(ated)i(pragmat-)2010 1659 y(ically)i(by)e(considerations)46 b(to)c(k)o(eep)g(the)g(search)h (space)2010 1772 y(\(and)d(the)f(number)g(of)g(instances\))j(small.)74 b(A)38 b(sentence)2010 1885 y(w)o(as)43 b(considered)k(v)n(alid)d(if)f (it)g(w)o(as)g(neither)i(un\002nished)2010 1997 y(nor)d(a)e (backchannel)45 b(utterance)f(\(lik)o(e)e(e.g.)e Fk(\224Uh-huh\224)p Fl(,)2010 2110 y Fk(\224Y)-8 b(eah\224)p Fl(,)35 b(etc.\).)61 b(From)33 b(the)i(selected)h(markables,)i(inac-)2010 2223 y(cessible)26 b(non-NP-e)o(xpressions)j(were)24 b(automatically)j(re-)2010 2336 y(mo)o(v)o(ed.)62 b(W)-7 b(e)34 b(considered)k(an)c(e)o(xpression)k(inaccessible)2010 2449 y(if)27 b(it)h Fk(ended)h(befor)m(e)f Fl(the)g(sentence)i(in)e (which)g(it)f(w)o(as)g(con-)2010 2562 y(tained.)68 b(This)36 b(w)o(as)f(intended)k(to)d(be)g(a)g(rough)h(approxi-)2010 2675 y(mation)27 b(of)g(the)g(concept)i(of)d(the)h(right)h(frontier)g (\(W)-7 b(ebber)l(,)2010 2788 y(1991\).)53 b(The)30 b(remaining)j(e)o (xpressions)h(were)d(then)h(com-)2010 2901 y(bined)25 b(with)f(the)g(potential)j(anaphor)-5 b(.)32 b(Finally)-6 b(,)24 b(the)h(result-)2010 3014 y(ing)k(pairs)g(were)f(labelled)j Fk(P)c Fl(or)i Fk(N)j Fl(and)d(added)h(to)e(the)h(in-)2010 3127 y(stances)c(generated)h(with)e Fk(NP)p Fl(-antecedents.)2010 3372 y Fp(4)99 b(F)n(eatur)n(es)2010 3580 y Fl(W)-7 b(e)42 b(distinguish)k(tw)o(o)c(classes)i(of)f(features:)69 b(NP-le)n(v)o(el)2010 3693 y(features)36 b(specify)f(e.g.)f(the)g (grammatical)h(function,)k(NP)2010 3806 y(form,)57 b(morpho-syntax,)k (grammatical)53 b(case)f(and)f(the)2010 3919 y(depth)g(of)g(embedding)h (in)e(the)h(syntactical)i(structure.)2010 4031 y(F)o(or)60 b(these)i(features,)71 b(each)62 b(instance)h(contains)g(one)2010 4144 y(v)n(alue)39 b(for)f(the)h(antecedent)i(and)e(one)g(for)f(the)g (anaphor)-5 b(.)2010 4257 y(Coreference-le)n(v)o(el)41 b(features,)i(on)38 b(the)g(other)g(hand,)k(de-)2010 4370 y(scribe)30 b(the)f(relation)i(between)f(antecedent)i(and)d (anaphor)2010 4483 y(in)k(terms)h(of)f(e.g.)g(distance)i(\(in)f(w)o (ords,)i(markables)f(and)2010 4596 y(sentences\),)28 b(compatibility)g(in)d(terms)g(of)g(agreement)i(and)2010 4709 y(identity)41 b(of)e(syntactic)i(function.)77 b(F)o(or)39 b(these)h(features,)2010 4822 y(each)24 b(instance)i(contains)g(only)e (one)g(v)n(alue.)2101 4948 y(In)29 b(addition,)j(we)c(introduce)k(a)c (set)h(of)g(features)i(which)2010 5061 y(is)38 b(partly)h(tailored)g (to)f(the)g(processing)i(of)e(spok)o(en)i(dia-)2010 5174 y(logue.)76 b(The)39 b(feature)h(ante)p 2934 5174 28 4 v 35 w(e)o(xp)p 3098 5174 V 33 w(type)g(\(17\))g(is)e(a)h(rather)2010 5287 y(ob)o(vious)c(yet)e(useful)h(feature)h(to)d(distinguish)37 b(NP-)31 b(from)2010 5400 y(non-NP-antecedents.)42 b(The)26 b(features)j(ana)p 3418 5400 V 34 w(np)p 3542 5400 V 33 w(,)d(vp)p 3714 5400 V 60 w(and)p eop %%Page: 4 4 4 3 bop 470 3 2942 4 v 713 61 a Fe(NP-le)o(v)o(el)18 b(featur)o(es)557 144 y Fi(1.)100 b(ante)p 841 144 23 4 v 27 w(gram)p 1021 144 V 27 w(func)h(grammatical)19 b(function)h(of)f(antecedent)557 227 y(2.)100 b(ante)p 841 227 V 27 w(npform)194 b(form)19 b(of)g(antecedent)557 311 y(3.)100 b(ante)p 841 311 V 27 w(agree)252 b(person,)19 b(gender)m(,)h(number)557 394 y(4.)100 b(ante)p 841 394 V 27 w(case)285 b(grammatical)19 b(case)g(of)g(antecedent)557 477 y(5.)100 b(ante)p 841 477 V 27 w(s)p 897 477 V 27 w(depth)192 b(the)19 b(le)n(v)o(el)g(of)g(embedding)h(in)f(a)g (sentence)557 560 y(6.)100 b(ana)p 820 560 V 27 w(gram)p 1000 560 V 28 w(func)121 b(grammatical)19 b(function)h(of)f(anaphor)557 643 y(7.)100 b(ana)p 820 643 V 27 w(npform)215 b(form)19 b(of)g(anaphor)557 726 y(8.)100 b(ana)p 820 726 V 27 w(agree)273 b(person,)19 b(gender)m(,)h(number)557 809 y(9.)100 b(ana)p 820 809 V 27 w(case)306 b(grammatical)19 b(case)g(of)g(anaphor)520 892 y(10.)100 b(ana)p 820 892 V 27 w(s)p 876 892 V 27 w(depth)213 b(the)19 b(le)n(v)o(el)g(of)g (embedding)h(in)f(a)g(sentence)p 470 920 2942 4 v 713 978 a Fe(Cor)o(efer)o(ence-le)o(v)o(el)g(featur)o(es)520 1061 y Fi(11.)100 b(agree)p 878 1061 23 4 v 27 w(comp)211 b(compatibility)19 b(in)g(agreement)h(between)f(anaphor)i(and)e (antecedent)520 1144 y(12.)100 b(npform)p 936 1144 V 28 w(comp)152 b(compatibilty)19 b(in)g(NP)f(form)h(between)h(anaphor)g (and)g(antecedent)520 1227 y(13.)100 b(wdist)402 b(distance)19 b(between)h(anaphor)g(and)g(antecedent)g(in)f(w)o(ords)520 1310 y(14.)100 b(mdist)398 b(distance)19 b(between)h(anaphor)g(and)g (antecedent)g(in)f(markables)520 1393 y(15.)100 b(sdist)427 b(distance)19 b(between)h(anaphor)g(and)g(antecedent)g(in)f(sentences) 520 1476 y(16.)100 b(syn)p 820 1476 V 27 w(par)339 b(anaphor)20 b(and)g(antecedent)g(ha)o(v)o(e)f(the)g(same)g(grammatical)h(function)f (\(yes,)g(no\))p 470 1504 2942 4 v 713 1562 a Fe(F)n(eatur)o(es)f(intr) o(oduced)f(f)n(or)i(spok)o(en)g(dialogue)520 1645 y Fi(17.)100 b(ante)p 841 1645 23 4 v 27 w(e)o(xp)p 974 1645 V 28 w(type)151 b(type)19 b(of)g(antecedent)h(\(NP)-8 b(,)18 b(S,)g(VP\))520 1729 y(18.)100 b(ana)p 820 1729 V 27 w(np)p 921 1729 V 28 w(pref)212 b(preference)20 b(for)f(NP)f(ar)o (guments)520 1812 y(19.)100 b(ana)p 820 1812 V 27 w(vp)p 921 1812 V 28 w(pref)212 b(preference)20 b(for)f(VP)f(ar)o(guments)520 1895 y(20.)100 b(ana)p 820 1895 V 27 w(s)p 876 1895 V 27 w(pref)258 b(preference)20 b(for)f(S)f(ar)o(guments)520 1978 y(21.)100 b(mdist)p 883 1978 V 27 w(3mf3p)177 b(\(see)19 b(te)o(xt\))520 2061 y(22.)100 b(mdist)p 883 2061 V 27 w(3n)297 b(\(see)19 b(te)o(xt\))520 2144 y(23.)100 b(ante)p 841 2144 V 27 w(t\002df)288 b(\(see)19 b(te)o(xt\))520 2227 y(24.)100 b(ante)p 841 2227 V 27 w(ic)359 b(\(see)19 b(te)o(xt\))520 2310 y(25.)100 b(wdist)p 879 2310 V 26 w(ic)322 b(\(see)19 b(te)o(xt\))p 470 2338 2942 4 v 1553 2491 a Fl(T)-7 b(able)24 b(3:)29 b(Our)23 b(Features)0 2791 y(s)p 40 2791 28 4 v 33 w(pref)31 b(\(18,)i(19,)f(20\))g(describe) g(a)f(v)o(erb')-5 b(s)32 b(preference)h(for)0 2904 y(ar)n(guments)49 b(of)d(a)g(particular)i(type.)98 b(Inspired)49 b(by)d(the)0 3017 y(w)o(ork)28 b(of)g(Eck)o(ert)h(&)e(Strube)h(\(2000\))i(and)e (Byron)h(\(2002\),)0 3130 y(these)35 b(features)h(capture)g (preferences)i(for)c(NP-)f(or)h(non-)0 3243 y(NP-antecedents)43 b(by)d(taking)i(a)e(pronoun')-5 b(s)43 b(predicati)n(v)o(e)0 3356 y(conte)o(xt)28 b(into)f(account.)40 b(The)27 b(underlying)i (assumption)g(is)0 3469 y(that)e(if)f(a)g(v)o(erb)g(preceding)j(a)d (personal)i(or)f(demonstrati)n(v)o(e)0 3582 y(pronoun)38 b(preferentially)h(subcate)o(gorizes)h(sentences)e(or)0 3695 y(VPs,)27 b(then)h(the)f(pronoun)j(will)d(be)g(lik)o(ely)h(to)g (ha)n(v)o(e)g(a)e(non-)0 3808 y(NP-antecedent.)31 b(The)22 b(features)j(are)e(based)h(on)f(a)g(v)o(erb)g(list)0 3920 y(compiled)g(from)f(553)g(Switchboard)h(dialogues.)1562 3887 y Fc(3)1630 3920 y Fl(F)o(or)e(e)n(v-)0 4033 y(ery)35 b(v)o(erb)g(occurring)i(in)d(the)h(corpus,)k(this)c(list)g(contains)0 4146 y(up)22 b(to)g(three)h(entries)g(gi)n(ving)h(the)e(absolute)i (count)f(of)f(cases)0 4259 y(where)f(the)h(v)o(erb)g(has)f(a)g(direct)h (ar)n(gument)h(of)f(type)g Fk(NP)p Fl(,)d Fk(VP)0 4372 y Fl(or)29 b Fk(S)p Fl(.)f(When)h(the)g(v)o(erb)h(list)f(w)o(as)f (produced,)33 b(pronominal)0 4485 y(ar)n(guments)28 b(were)e(ignored.) 37 b(The)25 b(features)j(mdist)p 1624 4485 V 34 w(3mf3p)0 4598 y(and)k(mdist)p 368 4598 V 33 w(3n)f(\(21,)j(22\))d(are)g (re\002nements)i(of)e(the)g(mdist)0 4711 y(feature.)f(The)o(y)22 b(measure)h(the)g(distance)h(in)f(markables)h(be-)0 4824 y(tween)k(antecedent)i(and)e(anaphor)l(,)i(b)n(ut)e(in)f(doing)i(so)e (the)o(y)0 4937 y(tak)o(e)42 b(the)f(agreement)i(v)n(alue)f(of)g(the)f (anaphor)i(into)f(ac-)0 5050 y(count.)29 b(F)o(or)20 b(anaphors)k(with)d(an)g(agreement)i(v)n(alue)f(of)f(3mf)0 5162 y(or)g(3p,)h(mdist)p 437 5162 V 34 w(3mf3p)g(is)f(measured)i(as)e (D)g(=)f(1)i(+)e(the)i(num-)p 0 5230 499 4 v 105 5285 a Fb(3)134 5317 y Fi(It)e(seemed)h(preferable)g(to)g(compile)f(our)h(o) n(wn)g(list)f(instead)g(of)h(us-)0 5400 y(ing)e(e)o(xisting)g(ones)h (lik)o(e)f(Briscoe)g(&)g(Carroll)f(\(1997\).)2010 2791 y Fl(ber)23 b(of)g Fk(NP)p Fl(-markables)h(between)g(anaphor)h(and)f (potential)2010 2904 y(antecedent.)64 b(Anaphors)36 b(with)e(an)h (agreement)h(v)n(alue)f(of)2010 3017 y(3n,)40 b(\(i.e.)c Fk(it)i Fl(or)f Fk(that)r Fl(\),)k(on)36 b(the)i(other)f(hand,)k (potentially)2010 3130 y(ha)n(v)o(e)30 b(non-NP-antecedents,)36 b(so)29 b(mdist)p 3313 3130 28 4 v 34 w(3n)h(is)g(measured)2010 3243 y(as)j(D)e(+)i(the)g(number)g(of)g(anaphorically)k(accessible)3751 3210 y Fc(4)3824 3243 y Fk(S)q Fl(-)2010 3356 y(and)k Fk(VP)p Fl(-markables)h(between)f(anaphor)i(and)e(potential)2010 3469 y(antecedent.)2101 3587 y(The)26 b(feature)i(ante)p 2701 3587 V 35 w(t\002fd)e(\(23\))h(is)g(supposed)i(to)d(capture)2010 3700 y(the)34 b(relati)n(v)o(e)h(importance)h(of)e(an)g(e)o(xpression)i (for)e(a)g(dia-)2010 3812 y(logue.)g(The)24 b(underlying)k(assumption)f (is)d(that)i(the)f(higher)2010 3925 y(the)32 b(importance)i(of)d(a)g (non-NP)h(e)o(xpression,)k(the)c(higher)2010 4038 y(the)39 b(probability)j(of)c(its)h(being)h(referred)h(back)e(to.)74 b(F)o(or)2010 4151 y(our)34 b(purposes,)j(we)c(calculated)i(TF)d(for)h (e)n(v)o(ery)h(w)o(ord)f(by)2010 4264 y(counting)23 b(its)e(frequenc)o (y)i(in)e(each)g(of)g(our)g(twenty)g(Switch-)2010 4377 y(board)30 b(dialogues)i(separately)-6 b(.)49 b(The)28 b(calculation)k(of)e(IDF)2010 4490 y(w)o(as)k(based)h(on)g(a)e(set)i (of)f(553)h(Switchboard)h(dialogues.)2010 4603 y(F)o(or)25 b(e)n(v)o(ery)i(w)o(ord,)g(we)e(calculated)k(IDF)c(as)h(log\(553/N)3788 4617 y Fj(w)3847 4603 y Fl(\),)2010 4716 y(with)18 b(N)2255 4730 y Fj(w)2311 4716 y Fl(=number)i(of)e(documents)i(containing)h(the) d(w)o(ord.)2010 4829 y(F)o(or)43 b(e)n(v)o(ery)h(non-NP-markable,)51 b(an)44 b Fk(aver)o(a)o(g)o(e)h Fl(TF*IDF)2010 4942 y(v)n(alue)20 b(w)o(as)e(calculated)k(as)c(the)i(TF*IDF)d(sum)h(of)h(all)g(w)o(ords) 2010 5054 y(comprising)29 b(the)e(markable,)i(di)n(vided)g(by)d(the)i (number)f(of)p 2010 5147 499 4 v 2115 5202 a Fb(4)2144 5234 y Fi(As)18 b(mentioned)h(earlier)m(,)f(the)g(de\002nition)g(of)g (accessibility)g(of)g(non-)2010 5317 y(NP-antecedents)25 b(is)e(inspired)i(by)f(the)g(concept)h(of)f(the)g(right)g(frontier)2010 5400 y(\(W)-6 b(ebber)m(,)19 b(1991\).)p eop %%Page: 5 5 5 4 bop 0 91 a Fl(w)o(ords)31 b(in)f(the)h(markable.)50 b(The)30 b(feature)i(ante)p 1509 91 28 4 v 34 w(ic)e(\(24\))h(as)0 204 y(an)e(alternati)n(v)o(e)j(to)d(ante)p 777 204 V 34 w(t\002df)g(is)g(based)h(on)f(the)h(same)f(as-)0 317 y(sumptions)23 b(as)e(the)g(former)-5 b(.)29 b(The)20 b Fk(information)k(content)g Fl(of)0 430 y(a)32 b(non-NP-markable)j(is) e(calculated)i(as)e(follo)n(ws,)i(based)0 543 y(on)j(a)g(set)h(of)f (553)h(Switchboard)h(dialogues:)62 b(F)o(or)37 b(each)0 656 y(w)o(ord)c(in)f(the)h(markable,)j(the)c(IC)g(v)n(alue)h(w)o(as)f (calculated)0 769 y(as)21 b(the)g(ne)o(gati)n(v)o(e)h(log)f(of)g(the)g (total)h(frequenc)o(y)h(of)e(the)g(w)o(ord)0 882 y(di)n(vided)27 b(by)e(the)g(total)h(number)g(of)f(w)o(ords)g(in)g(all)g(553)h(dia-)0 995 y(logues.)k(The)21 b Fk(aver)o(a)o(g)o(e)i Fl(IC)d(v)n(alue)j(w)o (as)e(then)h(calculated)i(as)0 1108 y(the)h(IC)g(sum)g(of)g(all)g(w)o (ords)h(in)f(the)g(markable,)i(di)n(vided)g(by)0 1220 y(the)32 b(number)i(of)e(w)o(ords)g(in)g(the)h(markable.)56 b(Finally)-6 b(,)35 b(the)0 1333 y(feature)e(wdist)p 484 1333 V 33 w(ic)e(\(25\))h(measures)h(the)e(w)o(ord-based)j(dis-)0 1446 y(tance)c(between)f(tw)o(o)g(e)o(xpressions.)47 b(It)28 b(does)i(so)e(in)h(terms)0 1559 y(of)c(the)f Fk(sum)h(of)f(the)h(individual)j(wor)m(ds')d(IC)p Fl(.)e(The)h (calcula-)0 1672 y(tion)k(of)f(the)g(IC)f(w)o(as)h(done)h(as)f (described)j(for)d(the)g(ante)p 1795 1672 V 34 w(ic)0 1785 y(feature.)0 2000 y Fp(5)99 b(Experiments)27 b(and)e(Results)0 2186 y Ff(5.1)92 b(Experimental)24 b(Setup)0 2342 y Fl(All)k(e)o (xperiments)i(were)e(performed)i(using)g(the)e(decision)0 2455 y(tree)34 b(learner)h Fk(RP)-8 b(ART)37 b Fl(\(Therneau)d(&)f (Atkinson,)h(1997\),)0 2567 y(which)j(is)g(a)g(CAR)-5 b(T)34 b(\(Breiman)k(et)e(al.,)h(1984\))h(reimple-)0 2680 y(mentation)e(for)e(the)h(S-Plus)f(and)g(R)f(statistical)k (comput-)0 2793 y(ing)j(en)l(vironments)j(\(we)c(use)g(R,)f(Ihaka)j(&)d (Gentleman)0 2906 y(\(1996\),)c(see)e(http://www)-6 b(.r)n(-project.or) n(g\).)57 b(W)-7 b(e)30 b(used)i(the)0 3019 y(standard)44 b(pruning)g(and)f(control)h(settings)g(for)e(RP)-8 b(AR)j(T)0 3132 y(\(cp=0.0001,)27 b(minsplit=20,)g(minb)n(uck)o(et=7\).)35 b(All)24 b(results)0 3245 y(reported)e(were)d(obtained)j(by)e (performing)h(20-fold)h(cross-)0 3358 y(v)n(alidation.)91 3476 y(In)e(the)f(prediction)k(phase,)e(the)f(trained)i(classi\002er)f (is)e(e)o(x-)0 3589 y(posed)k(to)e(unlabeled)j(instances)f(of)f(test)f (data.)29 b(The)21 b(classi-)0 3701 y(\002er')-5 b(s)18 b(task)h(is)f(to)g(label)h(each)g(instance.)29 b(When)19 b(an)f(instance)0 3814 y(is)24 b(labeled)i(as)e(coreferring,)j(the)e (IDs)f(of)g(the)g(anaphor)j(and)0 3927 y(antecedent)g(are)e(k)o(ept)g (in)f(a)g Fk(r)m(esponse)i(list)g Fl(for)e(the)h(e)n(v)n(alua-)0 4040 y(tion)f(according)i(to)e(V)-5 b(ilain)23 b(et)h(al.)k(\(1995\).) 91 4158 y(F)o(or)35 b(determining)j(the)e(rele)n(v)n(ant)h(feature)h (set)e(we)f(fol-)0 4271 y(lo)n(wed)40 b(an)h(iterati)n(v)o(e)g (procedure)i(similar)e(to)g(the)f Fk(wr)o(ap-)0 4384 y(per)31 b Fl(approach)g(for)e(feature)h(selection)h(\(K)m(oha)n(vi)e (&)f(John,)0 4497 y(1997\).)g(W)-7 b(e)18 b(start)h(with)f(a)g(model)h (based)h(on)f(a)f(set)g(of)h(prede-)0 4610 y(\002ned)26 b(baseline)j(features.)39 b(Then)27 b(we)f(train)h(models)g(com-)0 4723 y(bining)j(the)f(baseline)h(with)e(all)h(additional)i(features)g (sep-)0 4835 y(arately)-6 b(.)57 b(W)-7 b(e)32 b(choose)i(the)e(best)i (performing)g(feature)g(\(f-)0 4948 y(measure)f(according)h(to)e(V)-5 b(ilain)31 b(et)h(al.)52 b(\(1995\)\),)36 b(adding)0 5061 y(it)26 b(to)h(the)g(model.)38 b(W)-7 b(e)26 b(then)h(train)h (classi\002ers)g(combining)0 5174 y(the)c(enhanced)i(model)e(with)g (each)g(of)g(the)g(remaining)i(fea-)0 5287 y(tures)g(separately)-6 b(.)37 b(W)-7 b(e)24 b(again)i(choose)h(the)e(best)h(perform-)0 5400 y(ing)d(classi\002er)i(and)e(add)h(the)f(corresponding)k(ne)n(w)c (feature)2010 91 y(to)35 b(the)h(model.)66 b(This)35 b(process)i(is)f(repeated)h(as)f(long)g(as)2010 204 y(signi\002cant)26 b(impro)o(v)o(ement)e(can)g(be)g(observ)o(ed.)2010 394 y Ff(5.2)92 b(Results)2010 541 y Fl(In)23 b(our)h(e)o(xperiments)h(we)e (split)h(the)g(data)g(in)f(three)h(sets)g(ac-)2010 654 y(cording)30 b(to)f(the)f(agreement)i(of)f(the)f(anaphor:)41 b(third)29 b(per)n(-)2010 767 y(son)34 b(masculine)i(and)e(feminine)i (pronouns)g(\(3mf\),)g(third)2010 880 y(person)24 b(neuter)f(pronouns)i (\(3n\),)e(and)g(third)g(person)h(plural)2010 992 y(pronouns)36 b(\(3p\).)58 b(Since)34 b(only)g(3n-pronouns)j(ha)n(v)o(e)c(non-)2010 1105 y(NP-antecedents,)41 b(we)35 b(were)g(mainly)h(interested)i(in)e (im-)2010 1218 y(pro)o(v)o(ements)25 b(in)f(this)g(data)g(set.)2101 1332 y(W)-7 b(e)33 b(used)i(the)f(same)h(baseline)h(model)e(for)h(each) g(data)2010 1445 y(set.)56 b(The)32 b(baseline)j(model)e(corresponds)j (to)d(a)f(pronoun)2010 1558 y(resolution)41 b(algorithm)f(commonly)g (applied)g(to)e(written)2010 1671 y(te)o(xt,)j(i.e.,)f(it)d(uses)h (only)g(the)f(features)j(in)d(the)h(\002rst)f(tw)o(o)2010 1784 y(parts)30 b(of)f(T)-7 b(able)29 b(3.)46 b(F)o(or)28 b(the)h(baseline)j(model)d(we)g(gener)n(-)2010 1897 y(ated)e(training)h (and)f(test)f(data)h(which)g(included)h(only)g(NP-)2010 2009 y(antecedents.)2101 2123 y(Then)40 b(we)f(performed)j(e)o (xperiments)g(using)f(the)g(fea-)2010 2236 y(tures)32 b(introduced)i(for)d(spok)o(en)i(dialogue.)54 b(The)30 b(training)2010 2349 y(and)20 b(test)h(data)f(for)g(the)h(models)f (using)i(additional)g(features)2010 2462 y(included)44 b(NP-)d(and)h(non-NP-antecedents.)88 b(F)o(or)41 b(each)2010 2575 y(data)22 b(set)g(we)e(follo)n(wed)j(the)e(iterati)n(v)o(e)i (procedure)h(outlined)2010 2688 y(in)f(Section)i(5.1.)2101 2801 y(In)33 b(the)g(follo)n(wing)h(tables)g(we)e(present)j(the)e (results)h(of)2010 2914 y(our)25 b(e)o(xperiments.)32 b(The)24 b(\002rst)g(column)h(gi)n(v)o(es)g(the)f(number)2010 3027 y(of)c(coreference)j(links)e(correctly)h(found)f(by)f(the)h (classi\002er)l(,)2010 3140 y(the)29 b(second)i(column)e(gi)n(v)o(es)h (the)f(number)h(of)e(all)h(corefer)n(-)2010 3253 y(ence)j(links)g (found.)54 b(The)31 b(third)h(column)g(gi)n(v)o(es)g(the)f(total)2010 3366 y(number)37 b(of)f(coreference)j(links)e(\(1250\))h(in)e(the)g (corpus.)2010 3479 y(During)23 b(e)n(v)n(aluation,)h(the)e(list)g(of)g (all)g(correct)i(links)f(is)e(used)2010 3592 y(as)34 b(the)g Fk(k)o(e)m(y)h(list)h Fl(against)f(which)f(the)h Fk(r)m(esponse)h(list)g Fl(pro-)2010 3705 y(duced)26 b(by)e(the)h(classi\002er)h(\(cf.)e(abo)o(v)o(e\))h(is)g(compared.)33 b(The)2010 3818 y(remaining)28 b(three)f(columns)g(sho)n(w)f (precision,)j(recall)f(and)2010 3931 y(f-measure,)d(respecti)n(v)o(ely) -6 b(.)2101 4044 y(T)f(able)31 b(4)g(gi)n(v)o(es)g(the)g(results)i(for) e(3mf)g(pronouns.)54 b(The)2010 4157 y(baseline)34 b(model)d(performs)i (v)o(ery)f(well)f(on)h(this)g(data)g(set)2010 4270 y(\(the)c(lo)n(w)g (recall)h(\002gure)f(is)f(due)i(to)e(the)i(f)o(act)f(that)g(the)h(3mf) 2010 4383 y(data)35 b(set)g(contains)i(only)e(a)g(small)f(subset)j(of)d (the)h(coref-)2010 4496 y(erence)j(links)g(e)o(xpected)g(by)f(the)g(e)n (v)n(aluation\).)71 b(The)36 b(re-)2010 4609 y(sults)e(are)f (comparable)i(to)e(an)o(y)g(pronoun)i(resolution)h(al-)2010 4722 y(gorithm)c(dealing)i(with)d(written)h(te)o(xt.)52 b(This)31 b(sho)n(ws)h(that)2010 4835 y(our)20 b(pronoun)h(resolution)h (system)e(could)h(be)e(ported)i(to)e(the)2010 4948 y(spok)o(en)31 b(dialogue)g(domain)f(without)g(sacri\002cing)g(perfor)n(-)2010 5060 y(mance.)2101 5174 y(T)-7 b(able)33 b(5)f(sho)n(ws)h(the)h (results)g(for)f(3n)g(pronouns.)60 b(The)2010 5287 y(baseline)22 b(model)f(does)g(not)f(perform)h(v)o(ery)g(well.)27 b(As)19 b(men-)2010 5400 y(tioned)29 b(abo)o(v)o(e,)g(for)f(e)n(v)n(aluating)i (the)d(performance)j(of)e(the)p eop %%Page: 6 6 6 5 bop 1066 83 4 84 v 1117 58 a Fe(corr)o(ect)20 b(f)n(ound)98 b(total)19 b(f)n(ound)99 b(total)19 b(corr)o(ect)p 2535 83 V 100 w(pr)o(ecision)99 b(r)o(ecall)h(f-measur)o(e)p 262 86 3359 4 v 311 144 a(baseline,)18 b(featur)o(es)h(1-16)p 1066 169 4 84 v 259 w Fi(120)379 b(150)340 b(1250)p 2535 169 V 282 w(80.00)184 b(9.60)199 b(17.14)p 262 173 3359 4 v 311 231 a Fe(plus)18 b(mdist)p 646 231 23 4 v 26 w(3mf3p)p 1066 256 4 84 v 405 w Fi(121)379 b(153)340 b(1250)p 2535 256 V 282 w(79.08)184 b(9.68)199 b(17.25)585 409 y Fl(T)-7 b(able)23 b(4:)29 b(Results)c(for)e(Third)h(Person)g (Masculine)i(and)e(Feminine)g(Pronouns)h(\(3mf\))p 1066 608 V 1117 583 a Fe(corr)o(ect)20 b(f)n(ound)98 b(total)19 b(f)n(ound)99 b(total)19 b(corr)o(ect)p 2535 608 V 100 w(pr)o(ecision)99 b(r)o(ecall)h(f-measur)o(e)p 262 611 3359 4 v 311 669 a(baseline,)18 b(featur)o(es)h(1-16)p 1066 694 4 84 v 259 w Fi(109)379 b(235)340 b(1250)p 2535 694 V 282 w(46.38)184 b(8.72)199 b(14.68)p 262 697 3359 4 v 311 756 a Fe(plus)18 b(none)p 1066 781 4 84 v 678 w Fi(97)397 b(232)340 b(1250)p 2535 781 V 282 w(41.81)184 b(7.76)199 b(13.09)311 839 y Fe(plus)18 b(ante)p 604 839 23 4 v 27 w(exp)p 743 839 V 27 w(type)p 1066 864 4 84 v 373 w Fi(137)379 b(359)340 b(1250)p 2535 864 V 282 w(38.16)166 b(10.96)180 b(17.03)311 922 y Fe(plus)18 b(wdist)p 638 922 23 4 v 26 w(ic)p 1066 947 4 84 v 562 w Fi(154)379 b(389)340 b(1250)p 2535 947 V 282 w(39.59)166 b(12.32)180 b(18.79)311 1005 y Fe(plus)18 b(ante)p 604 1005 23 4 v 27 w(t\002df)p 1066 1030 4 84 v 515 w Fi(158)379 b(391)340 b(1250)p 2535 1030 V 282 w(40.41)166 b(12.64)180 b(19.26)938 1183 y Fl(T)-7 b(able)24 b(5:)29 b(Results)24 b(for)g(Third)g(Person)g(Neuter)g(Pronouns)h(\(3n\))0 1456 y(baseline)40 b(model)e(we)f(remo)o(v)o(ed)h(all)g(potential)i (non-NP-)0 1569 y(antecedents)h(from)d(the)g(data.)71 b(This)38 b(corresponds)j(to)d(a)0 1682 y(nai)n(v)o(e)32 b(application)j(of)c(a)h(model)g(de)n(v)o(eloped)i(for)d(written)0 1795 y(te)o(xt)24 b(to)f(spok)o(en)j(dialogue.)91 1934 y(First,)33 b(we)d(applied)j(the)f(same)f(model)h(to)f(the)h(data)g (set)0 2047 y(containing)47 b(all)d(kinds)h(of)e(antecedents.)93 b(The)43 b(perfor)n(-)0 2160 y(mance)32 b(drops)h(some)n(what)g(as)e (the)i(classi\002er)g(is)e(e)o(xposed)0 2273 y(to)26 b(non-NP-antecedents)31 b(without)c(being)g(able)g(to)f(dif)n(fer)n(-)0 2386 y(entiate)37 b(between)f(NP-)e(and)i(non-NP-antecedents.)68 b(By)0 2499 y(adding)26 b(the)f(feature)h(ante)p 837 2499 28 4 v 34 w(e)o(xp)p 1000 2499 V 33 w(type)f(the)g(classi\002er)h (is)e(en-)0 2612 y(abled)36 b(to)e(address)j(NP-)c(and)j (non-NP-antecedents)j(dif-)0 2725 y(ferently)-6 b(,)26 b(which)f(results)h(in)e(a)g(considerable)k(gain)d(in)f(per)n(-)0 2837 y(formance.)71 b(Substituting)40 b(the)e(wdist)f(feature)i(with)e (the)0 2950 y(wdist)p 201 2950 V 34 w(ic)22 b(feature)h(also)g(impro)o (v)o(es)g(the)g(performance)h(con-)0 3063 y(siderably)-6 b(.)86 b(The)41 b(ante)p 770 3063 V 34 w(t\002df)h(feature)h(only)g (contrib)n(utes)0 3176 y(mar)n(ginally)32 b(to)e(the)g(o)o(v)o(erall)h (performance.)50 b(\226)29 b(These)h(re-)0 3289 y(sults)h(sho)n(w)f (that)h(it)f(pays)h(of)n(f)g(to)f(consider)i(features)g(par)n(-)0 3402 y(ticularly)26 b(designed)g(for)d(spok)o(en)j(dialogue.)91 3541 y(T)-7 b(able)51 b(6)f(presents)j(the)e(results)h(for)f(3p)g (pronouns,)0 3654 y(which)37 b(do)g(not)f(ha)n(v)o(e)i (non-NP-antecedents.)72 b(Man)o(y)36 b(of)0 3767 y(these)20 b(pronouns)h(do)d(not)h(ha)n(v)o(e)h(an)e(antecedent)k(at)c(all.)27 b(Oth-)0 3880 y(ers)41 b(are)g Fk(va)o(gue)h Fl(in)f(that)h(human)f (annotators)j(felt)d(them)0 3993 y(to)i(be)f(referential,)50 b(b)n(ut)43 b(could)h(not)f(determine)h(an)f(an-)0 4106 y(tecedent.)83 b(Since)42 b(we)e(did)h(not)h(address)h(that)e(issue)h (in)0 4219 y(depth,)21 b(the)e(classi\002er)h(tries)g(to)e(\002nd)h (antecedents)j(for)d(these)0 4331 y(pronouns)43 b(indiscriminately)-6 b(,)48 b(which)41 b(results)h(in)e(rather)0 4444 y(lo)n(w)27 b(precision)k(\002gures,)e(as)f(compared)i(to)e(e.g.)f(those)i(for)0 4557 y(3mf.)34 b(Only)26 b(the)f(feature)i(wdist)p 1023 4557 V 34 w(ic)e(leads)i(to)e(an)g(impro)o(v)o(e-)0 4670 y(ment)f(o)o(v)o(er)f(the)h(baseline.)91 4809 y(T)-7 b(able)30 b(7)f(sho)n(ws)i(the)f(results)h(for)f(the)h(combined)g (clas-)0 4922 y(si\002ers.)39 b(The)26 b(impro)o(v)o(ement)i(in)e (f-measure)j(is)d(due)h(to)g(the)0 5035 y(increase)34 b(in)d(recall)i(while)f(the)f(precision)j(sho)n(ws)e(only)h(a)0 5148 y(slight)25 b(decrease.)91 5287 y(Though)54 b(some)f(of)g(the)g (features)i(of)e(the)g(baseline)0 5400 y(model)48 b(\(features)h (1-16\))f(still)g(occur)g(in)g(the)f(decision)2010 1456 y(tree)33 b(learned,)k(the)c(feature)i(ante)p 3086 1456 V 34 w(e)o(xp)p 3249 1456 V 34 w(type)e(di)n(vides)i(ma-)2010 1569 y(jor)27 b(parts)h(of)e(the)h(tree)h(quite)f(nicely)i(\(see)e (Figure)g(1\).)39 b(Be-)2010 1682 y(lo)n(w)24 b(that)i(node)g(the)f (feature)i(ana)p 3072 1682 V 34 w(npform)f(is)f(used)h(to)f(dis-)2010 1795 y(tinguish)34 b(between)e(ne)o(gati)n(v)o(e)g(\(personal)i (pronouns\))h(and)2010 1908 y(potential)44 b(positi)n(v)o(e)f(cases)f (\(demonstrati)n(v)o(e)j(pronouns\).)2010 2021 y(This)40 b(con\002rms)g(the)h(hypothesis)i(by)d(Eck)o(ert)h(&)e(Strube)2010 2134 y(\(2000\))j(and)f(Byron)g(\(2002\))h(to)f(gi)n(v)o(e)f(high)i (priority)g(to)2010 2247 y(these)26 b(features.)34 b(The)25 b(decision)i(tree)e(fragment)h(in)f(Figure)2010 2360 y(1)f(correctly)i(assigns)g(the)f Fk(P)e Fl(label)i(to)f(23-7=16)j (sentential)2010 2473 y(antecedents.)2010 2635 y Fm(split,)44 b(n,)g(loss,)g(yval)2100 2718 y(*)g(denotes)g(terminal)f(node)2010 2884 y(...)2100 2967 y(anteexptype=s,vp)f(1110)i(55)g(N)2189 3050 y(ananpform=prp)f(747,11)h(N)g(*)2189 3133 y(ananpform=dtpro)f (363)h(44)g(N)2279 3216 y(anteexptype=vp)e(177)j(3)f(N)h(*)2279 3299 y(anteexptype=s)e(186)h(41)g(N)2369 3382 y(udist>=1.5)f(95)h(14)h (N)f(*)2369 3465 y(udist<1.5)f(91)h(27)h(N)2458 3548 y(wdistic<43.32)e(33)h(4)h(N)g(*)2458 3631 y(wdistic>=43.32)e(58)h(23)h (N)2548 3714 y(anasdepth>=2.5)d(23)j(4)g(N)f(*)2548 3797 y(anasdepth<2.5)f(35)h(16)h(N)2638 3880 y(wdistic>=63.62)d(24)j(11)f(N) 2727 3963 y(wdistic<80.60)f(12)h(3)h(N)g(*)2727 4046 y(wdistic>=80.60)e(12)h(4)h(P)g(*)2638 4129 y(wdistic<63.62)d(11)j(3)f (P)h(*)2335 4367 y Fl(Figure)24 b(1:)29 b(Decision)c(T)m(ree)e (Fragment)2101 4610 y(Ho)n(we)n(v)o(er)l(,)g(the)g(most)g(important)i (problem)g(is)d(the)i(lar)n(ge)2010 4723 y(amount)56 b(of)e(pronouns)j(without)f(antecedents.)126 b(The)2010 4835 y(model)20 b(does)g(\002nd)f(\(wrong\))i(antecedents)i(for)c(a)g (lot)h(of)g(pro-)2010 4948 y(nouns)h(which)f(should)i(not)e(ha)n(v)o(e) g(one.)28 b(Only)20 b(a)f(small)h(frac-)2010 5061 y(tion)28 b(of)f(these)h(pronouns)i(are)e(true)f(e)o(xpleti)n(v)o(es)i(\(i.e.,)f (the)o(y)2010 5174 y(precede)23 b(a)d(\223weather\224)j(v)o(erb)e(or)g (are)g(in)g(constructions)k(lik)o(e)2010 5287 y Fk(\223It)f(seems)i (that)g(.)14 b(.)g(.)g(\224)p Fl(.)30 b(The)25 b(majority)h(of)g(these) g(cases)g(are)2010 5400 y(referential,)34 b(b)n(ut)c(ha)n(v)o(e)h(no)f (antecedent)j(in)c(the)h(data)h(\(i.e.,)p eop %%Page: 7 7 7 6 bop 1066 83 4 84 v 1117 58 a Fe(corr)o(ect)20 b(f)n(ound)98 b(total)19 b(f)n(ound)99 b(total)19 b(corr)o(ect)p 2535 83 V 100 w(pr)o(ecision)99 b(r)o(ecall)h(f-measur)o(e)p 262 86 3359 4 v 311 144 a(baseline,)18 b(featur)o(es)h(1-16)p 1066 169 4 84 v 259 w Fi(227)379 b(354)340 b(1250)p 2535 169 V 282 w(64.12)166 b(18.16)180 b(28.30)p 262 173 3359 4 v 311 231 a Fe(plus)18 b(wdist)p 638 231 23 4 v 26 w(ic)p 1066 256 4 84 v 562 w Fi(230)379 b(353)340 b(1250)p 2535 256 V 282 w(65.16)166 b(18.40)180 b(28.70)954 409 y Fl(T)-7 b(able)23 b(6:)29 b(Results)24 b(for)g(Third)g(Person)g (Plural)g(Pronouns)h(\(3p\))p 1066 611 V 1117 586 a Fe(corr)o(ect)20 b(f)n(ound)98 b(total)19 b(f)n(ound)99 b(total)19 b(corr)o(ect)p 2535 611 V 100 w(pr)o(ecision)99 b(r)o(ecall)h(f-measur)o(e)p 262 615 3359 4 v 311 673 a(baseline,)18 b(featur)o(es)h(1-16)p 1066 698 4 84 v 259 w Fi(456)379 b(739)340 b(1250)p 2535 698 V 282 w(61.71)166 b(36.48)180 b(45.85)p 262 701 3359 4 v 311 759 a Fe(combined)p 1066 784 4 84 v 653 w Fi(509)379 b(897)340 b(1250)p 2535 784 V 282 w(56.74)166 b(40.72)180 b(47.42)1138 937 y Fl(T)-7 b(able)23 b(7:)29 b(Combined)c(Results)f (for)g(All)f(Pronouns)0 1196 y(the)o(y)h(are)g Fk(va)o(gue)h Fl(pronouns\).)91 1309 y(The)34 b(o)o(v)o(erall)i(numbers)f(for)g (precision,)40 b(recall)35 b(and)g(f-)0 1422 y(measure)22 b(are)e(f)o(airly)i(lo)n(w)-6 b(.)27 b(One)21 b(reason)h(is)e(that)h (we)f(did)h(not)0 1535 y(attempt)g(to)f(resolv)o(e)h(anaphoric)i (de\002nite)e(NPs)d(and)j(proper)0 1648 y(names)27 b(though)h(these)f (coreference)j(links)d(are)g(contained)0 1761 y(in)e(the)h(e)n(v)n (aluation)i(k)o(e)o(y)d(list.)35 b(If)25 b(we)g(remo)o(v)o(ed)h(them)f (from)0 1873 y(there,)i(the)e(recall)i(of)e(our)h(e)o(xperiments)i(w)o (ould)e(approach)0 1986 y(the)d(51\045)f(Byron)h(\(2002\))h(mentioned)g (for)f(her)g(system)g(us-)0 2099 y(ing)h(only)g(domain-independent)29 b(semantic)c(restrictions.)0 2294 y Fp(6)99 b(Comparison)25 b(to)g(Related)g(W)-7 b(ork)0 2464 y Fl(Our)19 b(approach)j(for)d (determining)j(the)e(feature)h(set)e(for)h(pro-)0 2577 y(noun)h(resolution)i(resembles)f(the)f(so-called)i Fk(wr)o(apper)g Fl(ap-)0 2690 y(proach)j(for)f(feature)i(selection)g(\(K)m(oha)n(vi)f (&)e(John,)h(1997\).)0 2803 y(This)k(is)f(in)h(contrast)i(to)e(the)g (majority)h(of)e(other)i(w)o(ork)f(on)0 2916 y(feature)23 b(selection)i(for)d(anaphora)i(resolution,)g(which)f(w)o(as)0 3029 y(hardly)40 b(e)n(v)o(er)f(done)h(systematically)-6 b(.)79 b(E.g.)38 b(Soon)h(et)g(al.)0 3142 y(\(2001\))e(only)f(compared) h(baseline)h(systems)e(consisting)0 3255 y(of)28 b(one)h(feature)g (each,)h(only)f(three)g(of)f(which)g(yielded)i(an)0 3368 y(f-measure)37 b(greater)g(than)g(zero.)65 b(Then)36 b(the)o(y)f(combined)0 3481 y(these)22 b(features)h(and)f(achie)n(v)o (ed)g(results)h(which)e(were)g(close)0 3593 y(to)e(the)h(best)g(o)o(v)o (erall)g(results)h(the)o(y)e(report.)29 b(While)20 b(this)f(tells)0 3706 y(us)32 b(which)h(features)i(contrib)n(ute)g(a)d(lot,)j(it)d(does) h(not)g(gi)n(v)o(e)0 3819 y(an)o(y)38 b(information)i(about)e (potential)i(\(positi)n(v)o(e)f(or)f(ne)o(ga-)0 3932 y(ti)n(v)o(e\))20 b(in\003uence)h(of)f(the)g(rest.)28 b(Ng)19 b(&)g(Cardie)i(\(2002\))g(select)0 4045 y(the)34 b(set)g(of)g(features)h(by)f(hand,)j(gi)n(ving)e(a)f(preference)i(to)0 4158 y(high)22 b(precision)i(features.)30 b(The)o(y)21 b(admit)h(that)g(this)g(method)0 4271 y(is)h(quite)i(subjecti)n(v)o(e.) 91 4384 y(Corpus-based)39 b(w)o(ork)c(about)i(pronoun)h(resolution)g (in)0 4497 y(spok)o(en)f(dialogue)g(is)e(almost)h(non-e)o(xistent.)67 b(Ho)n(we)n(v)o(er)l(,)0 4610 y(there)26 b(are)e(a)h(fe)n(w)f(papers)i (dealing)g(with)f(neuter)h(pronouns)0 4723 y(with)21 b(NP-antecedents.)30 b(E.g.,)20 b(Dagan)h(&)f(Itai)h(\(1991\))i(pre-)0 4835 y(sented)28 b(a)f(corpus-based)k(approach)e(to)e(the)g(resolution) j(of)0 4948 y(the)22 b(pronoun)h Fk(it)p Fl(,)e(b)n(ut)h(the)o(y)g(use) f(a)g(written)h(te)o(xt)g(corpus)h(and)0 5061 y(do)c(not)h(mention)g (non-NP-antecedents)j(at)c(all.)27 b(P)o(aul)19 b(et)g(al.)0 5174 y(\(1999\))41 b(presented)h(a)d(corpus-based)44 b(anaphora)e(resolu-)0 5287 y(tion)25 b(algorithm)i(for)e(spok)o(en)i (dialogue.)34 b(F)o(or)24 b(their)i(e)o(xper)n(-)0 5400 y(iments,)i(ho)n(we)n(v)o(er)l(,)h(the)o(y)e(restricted)j(anaphoric)g (relations)2010 1196 y(to)23 b(those)i(with)e(NP-antecedents.)2101 1309 y(Byron)56 b(\(2002\))h(presented)h(a)e(symbolic)h(approach)2010 1422 y(which)48 b(resolv)o(es)h(pronouns)h(with)e(NP-)e(and)i(non-NP-) 2010 1535 y(antecedents)32 b(in)c(spok)o(en)j(dialogue)g(in)d(the)h (TRAINS)d(do-)2010 1648 y(main.)118 b(Byron)53 b(e)o(xtends)i(a)e (pronoun)i(resolution)h(al-)2010 1761 y(gorithm)e(\(T)-6 b(etrault,)53 b(2001\))i(with)d Fk(semantic)i(\002ltering)p Fl(,)2010 1873 y(thus)36 b(enabling)h(it)e(to)g(resolv)o(e)i(anaphors)g (with)e(non-NP-)2010 1986 y(antecedents)46 b(as)d(well.)87 b(Semantic)43 b(\002ltering)h(relies)g(on)2010 2099 y(kno)n(wledge)50 b(about)g(semantic)g(restrictions)h(associated)2010 2212 y(with)18 b(v)o(erbs,)i(lik)o(e)f(semantic)h(compatibility)i(between)d (sub-)2010 2325 y(ject)24 b(and)g(predicati)n(v)o(e)i(noun)f(or)e (predicati)n(v)o(e)j(adjecti)n(v)o(e.)2101 2438 y(An)k(e)n(v)n (aluation)k(on)d(ten)h(TRAINS93)d(dialogues)34 b(with)2010 2551 y(80)25 b(3rd)g(person)h(pronouns)h(and)e(100)g(demonstrati)n(v)o (e)j(pro-)2010 2664 y(nouns)50 b(sho)n(ws)e(that)h(semantic)g (\002ltering)h(and)e(the)h(im-)2010 2777 y(plementation)38 b(of)c(dif)n(ferent)j(search)f(strate)o(gies)h(for)e(per)n(-)2010 2890 y(sonal)53 b(and)g(demonstrati)n(v)o(e)i(pronouns)f(yields)g(a)e (suc-)2010 3003 y(cess)i(rate)f(of)h(72\045.)117 b(As)53 b(Byron)g(admits,)61 b(the)54 b(ma-)2010 3115 y(jor)46 b(limitation)h(of)f(her)g(algorithm)i(is)d(its)h(dependence)2010 3228 y(on)k(domain-dependent)55 b(resources)e(which)d(co)o(v)o(er)h (the)2010 3341 y(domain)45 b(entirely)-6 b(.)92 b(When)44 b(e)n(v)n(aluating)i(her)e(algorithm)2010 3454 y(with)52 b(only)g(domain-independent)57 b(semantics,)k(Byron)2010 3567 y(achie)n(v)o(ed)43 b(51\045)d(success)j(rate.)81 b(What)41 b(is)g(problematic)2010 3680 y(with)33 b(her)g(approach)i(is) e(that)h(she)f(assumes)h(the)f(input)h(to)2010 3793 y(her)28 b(algorithm)i(to)e(be)g(only)h(referential)i(pronouns.)45 b(This)2010 3906 y(simpli\002es)24 b(the)g(task)g(considerably)-6 b(.)2010 4100 y Fp(7)99 b(Conclusions)25 b(and)h(Futur)n(e)g(W)-7 b(ork)2010 4271 y Fl(W)g(e)31 b(presented)k(a)d(machine)i(learning)g (approach)h(to)e(pro-)2010 4384 y(noun)d(resolution)i(in)d(spok)o(en)i (dialogue.)49 b(W)-7 b(e)28 b(b)n(uilt)i(upon)2010 4497 y(a)35 b(system)g(we)g(used)h(for)f(anaphora)i(resolution)h(in)d(writ-) 2010 4610 y(ten)h(te)o(xt)h(and)f(e)o(xtended)i(it)e(with)g(a)g(set)g (of)g(features)i(de-)2010 4723 y(signed)43 b(for)f(spok)o(en)h (dialogue.)85 b(W)-7 b(e)40 b(re\002ned)i(distance)2010 4835 y(features)25 b(and)e(used)h(metrics)g(from)e(information)k (retrie)n(v)n(al)2010 4948 y(for)40 b(determining)j (non-NP-antecedents.)83 b(Inspired)42 b(by)2010 5061 y(the)35 b(more)f(linguistically)39 b(oriented)d(w)o(ork)f(by)f(Eck)o (ert)h(&)2010 5174 y(Strube)d(\(2000\))h(and)e(Byron)h(\(2002\))h(we)d (also)i(e)n(v)n(aluated)2010 5287 y(the)26 b(contrib)n(ution)k(of)25 b(features)j(which)e(used)h(the)f(predica-)2010 5400 y(ti)n(v)o(e)21 b(conte)o(xt)h(of)f(the)h(pronoun)h(to)e(be)g(resolv)o (ed.)30 b(Ho)n(we)n(v)o(er)l(,)p eop %%Page: 8 8 8 7 bop 0 91 a Fl(these)35 b(features)g(did)g(not)f(sho)n(w)f(up)h(in)g (the)g(\002nal)f(models)0 204 y(since)28 b(the)o(y)f(did)f(not)h(lead)h (to)e(an)h(impro)o(v)o(ement.)39 b(Instead,)0 317 y(rather)20 b(simple)f(distance)i(metrics)e(were)f(preferred.)30 b(While)0 430 y(we)e(were)h(\(almost\))i(satis\002ed)f(with)f(the)h (performance)h(of)0 543 y(these)e(features,)j(the)c(major)h(problem)h (for)e(a)g(spok)o(en)j(dia-)0 656 y(logue)20 b(pronoun)h(resolution)h (algorithm)f(is)e(the)g(ab)n(undance)0 769 y(of)25 b(pronouns)j (without)f(antecedents.)38 b(Pre)n(vious)26 b(research)0 882 y(could)f(a)n(v)n(oid)g(dealing)h(with)e(this)g(phenomenon)j(by)d (either)0 995 y(applying)38 b(the)d(algorithm)j(by)d(hand)h(\(Eck)o (ert)h(&)d(Strube,)0 1108 y(2000\))c(or)f(e)o(xcluding)j(these)e(cases) g(\(Byron,)f(2002\))h(from)0 1220 y(the)41 b(e)n(v)n(aluation.)84 b(Because)42 b(we)e(included)j(these)f(cases)0 1333 y(in)29 b(our)g(e)n(v)n(aluation)i(we)d(consider)j(our)e(approach)i(at)d(least) 0 1446 y(comparable)34 b(to)e(Byron')-5 b(s)33 b(system)g(when)f(she)h (uses)f(only)0 1559 y(domain-independent)e(semantics.)j(W)-7 b(e)24 b(belie)n(v)o(e)i(that)f(our)0 1672 y(system)f(is)f(more)h(rob)n (ust)h(than)f(hers)g(and)f(that)h(it)f(can)h(more)0 1785 y(easily)h(be)e(ported)i(to)f(ne)n(w)f(domains.)0 2003 y Ff(Ackno)o(wledgements.)91 b Fl(The)18 b(w)o(ork)h(presented)i(here)f (has)0 2116 y(been)42 b(partially)g(funded)h(by)e(the)g(German)f (Ministry)i(of)0 2229 y(Research)36 b(and)g(T)-6 b(echnology)37 b(as)d(part)i(of)e(the)k(E)t Fa(M)t(B)r(A)t(S)t(S)t(I)0 2342 y Fl(project)f(\(01)e(IL)g(904)g(D/2\))g(and)h(by)f(the)h(Klaus)f (Tschira)0 2455 y(F)o(oundation.)127 b(W)-7 b(e)54 b(w)o(ould)j(lik)o (e)f(to)f(thank)i(Susanne)0 2568 y(W)l(ilhelm)f(and)g(Lutz)f(W)l(ind)h (for)g(doing)h(the)e(annota-)0 2681 y(tions,)20 b(K)n(erstin)f(Sch)8 b(\250)-38 b(urmann,)21 b(T)-7 b(orben)19 b(P)o(astuch)g(and)g(Klaus)0 2794 y(Rothenh)5 b(\250)-35 b(ausler)47 b(for)e(helping)g(with)f(the)h (data)f(prepara-)0 2907 y(tion.)0 3149 y Fp(Refer)n(ences)0 3324 y Fi(Asher)m(,)23 b(Nicholas)f(\(1993\).)38 b Fg(Refer)m(ence)23 b(to)f(Abstr)o(act)g(Objects)g(in)g(Dis-)91 3407 y(cour)o(se)p Fi(.)28 b(Dordrecht,)19 b(The)g(Netherlands:)24 b(Kluwer)l(.)0 3490 y(Breiman,)k(Leo,)g(Jerome)f(H.)e(Friedman,)j(Charles)f(J.)e (Stone)i(&)f(R.A.)91 3574 y(Olshen)h(\(1984\).)54 b Fg (Classi\002cation)28 b(and)g(Re)m(gr)m(ession)g(T)l(r)m(ees)p Fi(.)53 b(Bel-)91 3657 y(mont,)19 b(Cal.:)j(W)-6 b(adsw)o(orth)20 b(and)f(Brooks/Cole.)0 3740 y(Briscoe,)39 b(T)-5 b(ed)34 b(&)h(John)h(Carroll)e(\(1997\).)79 b(Automatic)35 b(e)o(xtraction)91 3823 y(of)29 b(subcate)o(gorization)j(from)d(corpora.)62 b(In)30 b Fg(Pr)m(oceedings)g(of)g(the)91 3906 y(5th)g(Confer)m(ence)i (on)e(Applied)h(Natur)o(al)f(Langua)o(g)o(e)i(Pr)m(ocessing)o(,)91 3989 y Fi(W)-6 b(ashington,)19 b(D.C.,)f(31)h(March)h(\226)f(3)g(April) g(1997,)g(pp.)g(356\226363.)0 4072 y(Byron,)29 b(Donna)e(K.)f (\(2002\).)52 b(Resolving)28 b(pronominal)g(reference)f(to)91 4155 y(abstract)19 b(entities.)26 b(In)19 b Fg(Pr)m(oceedings)h(of)e (the)h(40th)h(Annual)f(Meeting)91 4238 y(of)25 b(the)f(Association)i (for)f(Computational)g(Linguistics,)h Fi(Philadel-)91 4321 y(phia,)19 b(Penn.,)f(7\22612)j(July)e(2002,)h(pp.)f(80\22687.)0 4404 y(Byron,)j(Donna)g(K.)f(&)g(James)g(F)-6 b(.)21 b(Allen)g(\(1998\).)35 b(Resolving)22 b(demon-)91 4487 y(strati)n(v)o(e)32 b(pronouns)h(in)f(the)g(TRAINS93)f(corpus.)70 b(In)32 b Fg(Ne)o(w)f(Ap-)91 4570 y(pr)m(oac)o(hes)d(to)f(Discour)o(se) g(Anaphor)o(a:)41 b(Pr)m(oceedings)28 b(of)f(the)f(Sec-)91 4653 y(ond)d(Colloquium)g(on)f(Discour)o(se)h(Anaphor)o(a)h(and)f (Anaphor)g(Res-)91 4736 y(olution)c(\(D)m(AARC2\))p Fi(,)f(pp.)h (68\22681.)0 4819 y(Dagan,)28 b(Ido)e(&)f(Alon)h(Itai)f(\(1991\).)50 b(A)25 b(statistical)g(\002lter)g(for)h(resolv-)91 4902 y(ing)f(pronoun)h(references.)46 b(In)24 b(Y)-10 b(.A.)24 b(Feldman)h(&)f(A.)g(Bruckstein)91 4985 y(\(Eds.\),)17 b Fg(Arti\002cial)g(Intellig)o(ence)i(and)g(Computer)f(V)-6 b(ision)p Fi(,)18 b(pp.)h(125\226)91 5068 y(135.)g(Amsterdam:)24 b(Else)n(vier)l(.)0 5151 y(Eck)o(ert,)g(Miriam)e(&)h(Michael)g(Strube)g (\(2000\).)40 b(Dialogue)24 b(acts,)f(syn-)91 5234 y(chronising)18 b(units)g(and)g(anaphora)h(resolution.)24 b Fg(J)n(ournal)19 b(of)e(Seman-)91 5317 y(tics)p Fi(,)h(17\(1\):51\22689.)0 5400 y(Ihaka,)30 b(Ross)d(&)g(Robert)g(Gentleman)h(\(1996\).)55 b(R:)26 b(A)h(language)i(for)2101 91 y(data)d(analysis)h(and)g (graphics.)50 b Fg(J)n(ournal)28 b(of)e(Computational)h(and)2101 174 y(Gr)o(aphical)20 b(Statistics)p Fi(,)e(5:299\226314.)2010 257 y(K)m(oha)o(vi,)36 b(Ron)c(&)h(Geor)o(ge)f(H.)g(John)h(\(1997\).)70 b(Wrappers)33 b(for)f(fea-)2101 340 y(ture)26 b(subset)h(selection.)51 b Fg(Arti\002cial)26 b(Intellig)o(ence)h(J)n(ournal)p Fi(,)i(97\(1-)2101 423 y(2\):273\226324.)2010 506 y(M)6 b(\250)-31 b(uller)m(,)21 b(Christoph,)h(Stef)o(an)e(Rapp)h(&)g (Michael)g(Strube)g(\(2002\).)34 b(Ap-)2101 589 y(plying)24 b(Co-Training)f(to)f(reference)i(resolution.)40 b(In)23 b Fg(Pr)m(oceedings)2101 672 y(of)c(the)h(40th)f(Annual)h(Meeting)g(of) g(the)f(Association)h(for)f(Computa-)2101 756 y(tional)k(Linguistics,)h Fi(Philadelphia,)g(Penn.,)f(7\22612)h(July)g(2002,)h(pp.)2101 839 y(352\226359.)2010 922 y(Ng,)18 b(V)l(incent)g(&)f(Claire)h(Cardie) f(\(2002\).)26 b(Impro)o(ving)19 b(machine)g(learn-)2101 1005 y(ing)i(approaches)h(to)e(coreference)i(resolution.)32 b(In)21 b Fg(Pr)m(oceedings)g(of)2101 1088 y(the)29 b(40th)h(Annual)f (Meeting)h(of)f(the)g(Association)g(for)g(Computa-)2101 1171 y(tional)23 b(Linguistics,)h Fi(Philadelphia,)g(Penn.,)f(7\22612)h (July)g(2002,)h(pp.)2101 1254 y(104\226111.)2010 1337 y(P)o(aul,)19 b(Michael,)h(Kazuhide)h(Y)-7 b(amamoto)20 b(&)g(Eiichiro)f(Sumita)g(\(1999\).)2101 1420 y(Corpus-based)25 b(anaphora)g(resolution)g(to)n(w)o(ards)f(antecedent)h(pref-)2101 1503 y(erence.)e(In)17 b Fg(Pr)m(oc.)f(of)h(the)f(37th)i(A)n(CL,)d(W)-7 b(orkshop)19 b(Cor)m(efer)m(ence)f(and)2101 1586 y(Its)g(Applications,) h Fi(Colle)o(ge)g(P)o(ark,)g(Md.,)f(1999,)i(pp.)f(47\22652.)2010 1669 y(Soon,)29 b(W)-6 b(ee)27 b(Meng,)k(Hwee)c(T)-6 b(ou)27 b(Ng)h(&)f(Daniel)g(Chung)i(Y)-8 b(ong)27 b(Lim)2101 1752 y(\(2001\).)i(A)18 b(machine)i(learning)g(approach)h(to)e (coreference)i(resolu-)2101 1835 y(tion)16 b(of)g(noun)i(phrases.)j Fg(Computational)d(Linguistics)p Fi(,)e(27\(4\):521\226)2101 1918 y(544.)2010 2001 y(Strube,)k(Michael,)i(Stef)o(an)e(Rapp)h(&)f (Christoph)h(M)6 b(\250)-31 b(uller)21 b(\(2002\).)33 b(The)2101 2084 y(in\003uence)22 b(of)f(minimum)g(edit)g(distance)g(on) h(reference)f(resolution.)2101 2167 y(In)h Fg(Pr)m(oceedings)h(of)f (the)g(2002)h(Confer)m(ence)g(on)g(Empirical)f(Meth-)2101 2250 y(ods)f(in)g(Natur)o(al)g(Langua)o(g)o(e)i(Pr)m(ocessing)o(,)f Fi(Philadelphia,)g(P)o(a.,)e(6\2267)2101 2333 y(July)f(2002,)h(pp.)f (312\226319.)2010 2416 y(T)-5 b(etrault,)33 b(Joel)f(R.)e(\(2001\).)67 b(A)31 b(corpus-based)j(e)n(v)n(aluation)e(of)f(cen-)2101 2499 y(tering)26 b(and)h(pronoun)i(resolution.)51 b Fg(Computational)27 b(Linguistics)p Fi(,)2101 2582 y(27\(4\):507\226520.)2010 2665 y(Therneau,)d(T)-5 b(erry)21 b(M.)h(&)g(Elizabeth)g(J.)g(Atkinson) h(\(1997\).)38 b Fg(An)22 b(intr)m(o-)2101 2748 y(duction)g(to)f(r)m (ecur)o(sive)i(partitioning)f(using)g(the)g(RPART)d(r)m(outines)p Fi(.)2101 2831 y(T)-5 b(echnical)27 b(Report:)38 b(Mayo)28 b(F)o(oundation.)52 b(Distrib)o(uted)26 b(with)g(the)2101 2914 y(RPART)17 b(package.)2010 2997 y(V)l(ilain,)h(Marc,)h(John)h(Bur) o(ger)m(,)f(John)h(Aberdeen,)g(Dennis)g(Connolly)g(&)2101 3080 y(L)l(ynette)26 b(Hirschman)h(\(1995\).)51 b(A)26 b(model-theoretic)h(coreference)2101 3163 y(scoring)22 b(scheme.)36 b(In)22 b Fg(Pr)m(oceedings)g(of)g(the)g(6th)f(Messa)o(g)o (e)j(Under)o(-)2101 3246 y(standing)d(Confer)m(ence)h(\(MUC-6\))p Fi(,)e(pp.)g(45\22652.)h(San)f(Mateo,)h(Cal.:)2101 3329 y(Mor)o(gan)e(Kaufmann.)2010 3412 y(W)-6 b(ebber)m(,)19 b(Bonnie)g(L.)e(\(1991\).)27 b(Structure)18 b(and)h(ostension)h(in)e (the)h(inter)o(-)2101 3495 y(pretation)i(of)g(discourse)i(deixis.)34 b Fg(Langua)o(g)o(e)23 b(and)f(Co)o(gnitive)f(Pr)m(o-)2101 3578 y(cesses)p Fi(,)e(6\(2\):107\226135.)p eop %%Trailer end userdict /end-hook known{end-hook}if %%EOF