## English wordsketches (Penn tagset) version 2
## Modified to TreeTagger tagset by Niels Ott
## Modified by Jan so that definitions don't use
## lempos (not always available)
#
# File layout: one item per line.
#   #...        comment (runs to end of line)
#   *DIRECTIVE  processing directive
#   =name       starts a grammatical relation; the following lines are its
#               CQL queries, one query per line
# In the queries, 1: labels the headword, 2: the collocate and (in *TRINARY
# relations) 3: the token whose value is substituted for %s in the name.
#
# NOTE(review): the tags VM, PNQ, CJT and PU. used below do not look like
# Penn/TreeTagger tags (they resemble BNC CLAWS tags). If the corpus tagset
# does not contain them, those alternatives simply never match -- confirm
# against the tagset actually used.

# Keep every match inside a single <s> structure.
*STRUCTLIMIT s
## *DEFAULTATTR tag
# A bare quoted string such as "NN.?.?" is matched against the `tag` attribute.
*DEFAULTATTR tag

# ---------------------------------------------------------------------------
# Coordination: noun/noun, verb/verb and adjective/adjective joined by
# "and", "or" or a comma. The verb and adjective queries additionally
# require both members to carry the same tag.
# NOTE(review): in the verb query the 2: alternative tag="JJ.?" can never
# satisfy 1.tag = 2.tag, because 1: is restricted to "V..?".
=and/or
*SYMMETRIC
1:"NN.?.?" [word=","]{0,1} [word="and"|word="or"|word=","] [tag="DT.?"|tag="PRP\$"]{0,1} "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 2:"NN.?.?" [tag!="NN.?.?"]
1:"V..?" [word=","]{0,1} [word="and"|word="or"|word=","] "RB.?"{0,2} 2:[tag="V..?"|tag="JJ.?"] & 1.tag = 2.tag
1:"JJ.?" [word=","]{0,1} [word="and"|word="or"|word=","]{0,1} "RB.?"{0,2} 2:"JJ.?" & 1.tag = 2.tag

# ---------------------------------------------------------------------------
# Verb (1:) and its object noun (2:).
#   query 1: verb, optional adverbs, then a noun phrase; 2: is the last noun
#            of the phrase (the trailing [tag!="NN.?.?"] enforces that).
#   query 2: noun directly followed (modulo adverbs) by a "V.N" form.
#   query 3: noun ... form of "be" ... "V.N" form (passive construction).
*DUAL
=object/object_of
1:"V..?" "RB.?"{0,2} [tag="DT.?"|tag="PRP\$"]{0,1} "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 2:"NN.?.?" [tag!="NN.?.?"]
2:"NN.?.?" "RB.?"{0,2} 1:"V.N"
2:"NN.?.?" [tag="WP"|tag="PNQ"|tag="CJT"]? [tag="RB.?"|tag="RB"|tag="VM"]{0,5} [lemma="be" & tag="V.*"] "RB.?"{0,2} 1:"V.N"

# ---------------------------------------------------------------------------
# Verb (1:) and its subject noun (2:).
#   query 1: noun, optional adverbs / form of "be", then a verb whose tag
#            matches "V.[^N]?" (i.e. not a "V.N" form).
#   query 2: as above but with a form of "have" before a "V.N" form.
#   query 3: "V.N" form followed by "by" and a noun phrase.
*DUAL
=subject/subject_of
2:"NN.?.?" [tag="WP"|tag="PNQ"|tag="CJT"]? [tag="RB.?"|tag="RB"|tag="VM"]{0,3} [lemma="be" & tag="V.*"]? "RB.?"{0,2} 1:"V.[^N]?"
2:"NN.?.?" [tag="WP"|tag="PNQ"|tag="CJT"]? [tag="RB.?"|tag="RB"|tag="VM"]{0,3} [lemma="be" & tag="V.*"]? "RB.?"{0,2} [lemma="have" & tag="V.*"] "RB.?"{0,2} 1:"V.N"
1:"V.N" "RB.?"{0,2} [word="by"] [tag="DT.?"|tag="PRP\$"]{0,1} "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 2:"NN.?.?" [tag!="NN.?.?"]

# ---------------------------------------------------------------------------
# Noun (1:) followed by an adjective (2:), optionally via a form of "be";
# the adjective must not be followed by a noun.
*DUAL
=adj_subject_of/adj_subject
1:"NN.?.?" [tag="WP"|tag="PNQ"|tag="CJT"]? [tag="RB.?"|tag="RB"|tag="VM"]{0,3} [lemma="be" & tag="V.*"]? "RB.?"{0,2} 2:"JJ.?" [tag!="NN.?.?"]

# ---------------------------------------------------------------------------
# Noun (1:), a mandatory form of "be", then a noun phrase whose last noun
# is 2:.
*DUAL
=predicate_of/predicate
1:"NN.?.?" [tag="WP"|tag="PNQ"|tag="CJT"]? [tag="RB.?"|tag="RB"|tag="VM"]{0,5} [lemma="be" & tag="V.*"] "RB.?"{0,2} [tag="DT.?"|tag="PRP\$"]{0,1} "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 2:"NN.?.?" [tag!="NN.?.?"]

# ---------------------------------------------------------------------------
# Constructions introduced by the word "it": only the headword (1:) is
# labelled, there is no collocate.
# NOTE(review): this relation (like =reflexive and =passive below) uses
# label 1: only; check whether the target Sketch Engine version expects an
# explicit *UNARY directive for such relations.
=it+
[word="it"] [tag="RB.?"|tag="RB"|tag="VM"]{0,3} [lemma="be" & tag="V.*"]? "RB.?"{0,2} 1:"JJ.?" "RB.?"{0,2} [tag="CJT"|tag="PRP"|tag="TO"]
[word="it"] [tag="RB.?"|tag="RB"|tag="VM"]{0,3} [lemma="be" & tag="V.*"]? "RB.?"{0,2} [tag="DT.?"|tag="PRP\$"]{0,1} "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 1:"NN.?.?" "TO"
[word="it"] [tag="RB.?"|tag="RB"|tag="VM"]{0,3} [lemma="be" & tag="V.*"]? "RB.?"{0,2} [tag="DT.?"|tag="PRP\$"]{0,1} "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 1:"NN.?.?" [word="for"] "PRP" "TO"

# ---------------------------------------------------------------------------
# Verb (1:) followed by a pronoun (2:) tagged PRP, excluding the word forms
# I / he / she / we / they.
# The commented-out line is a disabled query still written with macro
# names rather than expanded CQL.
=pro_object
1:"V..?" "RB.?"{0,2} 2:[tag="PRP" & word!="I" & word!="he" & word!="she" & word!="we" & word!="they"]
# 2:any_pro adv_aux_string_not_be copular adv_string 1:past_part

# ---------------------------------------------------------------------------
# Pronoun (2:) preceding a verb (1:).
#   query 1: verb tag matches "V.[^N]?".
#   query 2: mandatory form of "be" followed by a "V.N" form.
=pro_subject
2:"PRP" [tag="RB.?"|tag="RB"|tag="VM"]{0,3} [lemma="be" & tag="V.*"]? "RB.?"{0,2} 1:[tag="V.[^N]?"]
2:"PRP" [tag="RB.?"|tag="RB"|tag="VM"]{0,5} [lemma="be" & tag="V.*"] "RB.?"{0,2} 1:"V.N"

# ---------------------------------------------------------------------------
# Adjective (2:) in front of a noun (1:); 1: is the last noun of the run.
*DUAL
=a_modifier/modifies
2:"JJ.?" [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 1:"NN.?.?" [tag!="NN.?.?"]

# ---------------------------------------------------------------------------
# Token tagged exactly RB (2:) modifying an adjective or verb (1:).
#   query 1: RB immediately before the adjective/verb.
#   query 2: RB after the verb, not followed by an RB.? or JJ.? token.
=modifier
2:"RB" 1:[tag="JJ.?"|tag="V..?"]
1:"V..?" "RB.?"{0,2} 2:"RB" [tag!="RB.?" & tag!="JJ.?"]

# ---------------------------------------------------------------------------
# Noun (2:) preceding another noun (1:) with up to three nouns in between.
*DUAL
=n_modifier/modifies
2:"NN.?.?" "NN.?.?"{0,3} 1:"NN.?.?"

# ---------------------------------------------------------------------------
# Noun (1:) + POS token + noun phrase whose last noun is 2:.
*DUAL
=possessed/possessor
1:"NN.?.?" "POS" "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,1} 2:"NN.?.?" [tag!="NN.?.?"]

# ---------------------------------------------------------------------------
# PRP$ token (1:) + noun phrase whose last noun is 2:.
=pro_possessor
1:"PRP\$" "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,1} 2:"NN.?.?" [tag!="NN.?.?"]

# ---------------------------------------------------------------------------
# Verb (1:) followed by a token whose tag starts with W (2:).
=wh_comp
1:"V..?" "RB.?"{0,2} 2:[tag="W.?.?"]

# ---------------------------------------------------------------------------
# Verb or adjective (1:) + "TO" + verb matching "V.P?" (2:).
=infin_comp
1:"V..?" [tag="RB.?"]{0,2} "TO" [tag="RB.?"]{0,2} 2:"V.P?"
1:"JJ.?" "RB"{0,1} "TO" [tag="RB.?"]{0,2} 2:"V.P?"

# ---------------------------------------------------------------------------
# Verb (1:) followed by a "V.G" form (2:).
=ing_comp
1:"V..?" [tag="RB.?"]{0,3} 2:"V.G"

# ---------------------------------------------------------------------------
# Verb (1:) immediately followed by a PRP token whose word form contains
# "self" or "selv". Only 1: is labelled.
=reflexive
1:"V..?" [tag="PRP" & word = ".*sel[fv].*"]

# ---------------------------------------------------------------------------
# Prepositional phrases: headword (1:) + IN token (3:) + noun phrase whose
# last noun is 2:. The 3: token fills %s in the relation name.
#   query 1: noun or adjective headword.
#   query 2: verb headword.
*TRINARY
=pp_%s
1:[tag="NN.?.?"|tag="JJ.?"] 3:"IN" [tag="DT.?"|tag="PRP\$"]{0,1} "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 2:"NN.?.?" [tag!="NN.?.?"]
1:"V..?" "RB.?"{0,2} 3:"IN" [tag="DT.?"|tag="PRP\$"]{0,1} "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 2:"NN.?.?" [tag!="NN.?.?"]

# ---------------------------------------------------------------------------
# "V.N" form (1:) preceded by a noun (or a PU. token) and up to five
# adverb/VM tokens. Only 1: is labelled.
=passive
[tag="NN.?.?"|tag="PU."] [tag="RB.?"|tag="RB"|tag="VM"]{0,5} 1:"V.N"

# ---------------------------------------------------------------------------
# Verb (1:) + noun phrase or PRP token + adjective (2:) not followed by a
# noun.
*DUAL
=np_adj_comp/np_adj_comp_of
1:"V..?" "RB.?"{0,2} [tag="DT.?"|tag="PRP\$"]{0,1} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,1} "NN.?.?" "RB.?"{0,2} 2:"JJ.?" [tag!="NN.?.?"]
1:"V..?" "RB.?"{0,2} "PRP" "RB.?"{0,2} 2:"JJ.?" [tag!="NN.?.?"]

# ---------------------------------------------------------------------------
# Verb (1:) + adjective (2:) that is not followed by a noun, a CC token or
# another adjective.
*DUAL
=adj_comp/adj_comp_of
1:"V..?" "RB.?"{0,2} 2:"JJ.?" [tag!="NN.?.?" & tag!="CC" & tag!="JJ.?"]

# ---------------------------------------------------------------------------
# Verb (1:) + RP token (2:) NOT followed by a token that could open a noun
# phrase (DT, PRP$, CD, JJ.?, NN.?.?).
=part_intrans
1:"V..?" 2:"RP" [!(tag="DT"|tag="PRP\$"|tag="CD"|tag="JJ.?"|tag="NN.?.?")]

# ---------------------------------------------------------------------------
# Verb (1:) + RP token (2:) together with an object.
#   query 1: RP followed by a token that could open a noun phrase.
#   query 2: PRP token between verb and RP.
#   query 3: noun phrase between verb and RP.
=part_trans
1:"V..?" 2:"RP" [tag="DT"|tag="PRP\$"|tag="CD"|tag="JJ.?"|tag="NN.?.?"]
1:"V..?" "PRP" 2:"RP"
1:"V..?" [tag="DT.?"|tag="PRP\$"]{0,1} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,1} "NN.?.?" 2:"RP"

# ---------------------------------------------------------------------------
# Verb (1:) + RP token (3:, fills %s in the name) + noun phrase whose last
# noun is 2:.
*TRINARY
=part_%s_obj
1:"V..?" 3:"RP" [tag="DT.?"|tag="PRP\$"]{0,1} "CD"{0,2} [tag="JJ.?"|tag="RB.?"|word=","]{0,3} "NN.?.?"{0,2} 2:"NN.?.?" [tag!="NN.?.?"]