<!-- Attribute-based encoding of the verb features. Every declared default
     must be one of the tokens listed in its own value group. -->
<!-- NOTE(review): the ELEMENT declaration carries no content model in this
     excerpt; it is reproduced exactly as found. -->
<!ELEMENT verb>
<!ATTLIST verb
    n    (sg, pl, ind)                    ind             -- number: singular, plural, indefinite --
    p    (1, 2, 3, 0)                     0               -- person: 1, 2, 3, or unmarked --
    pt   (participle, nonparticipial)     nonparticipial  -- participles: yes or no --
    t    (pres, past, fut)                pres            -- tense: present, preterite, future --
    lex  (lex, be, do, have, aux, mod)    lex             -- lexical, auxiliary (and which), or modal --
>
<f.struct> <f.struct.name>BEZ <feature><f.name>category <f.struct>verb </feature> <feature><f.name>lexical type <f.struct>copula </feature> <feature><f.name>number <f.struct>singular </feature> <feature><f.name>person <f.struct>3rd </feature> <feature><f.name>tense <f.struct>present </feature> </f.struct>
while the feature structure for VBD might be somewhat simpler:
<f.struct> <f.struct.name>VBD <feature><f.name>category <f.struct>verb </feature> <feature><f.name>lexical type <f.struct>full verb</feature> <feature><f.name>tense <f.struct>preterite</feature> </f.struct>
<f.struct> <f.struct.name>VBD <feature><f.name>category <f.struct>verb </feature> <feature><f.name>lexical type <f.struct>full verb</feature> <feature><f.name>number <f.struct>unmarked </feature> <feature><f.name>person <f.struct>unmarked </feature> <feature><f.name>tense <f.struct>preterite</feature> </f.struct>
<f.struct> <f.struct.name>VBD <feature><f.name>category <f.struct>verb </feature> <feature><f.name>lexical type <f.struct>full verb</feature> <feature><f.name>number <f.s.OR><f.struct>singular</f.struct> <f.struct>plural </f.struct> </f.s.OR> </feature> <feature><f.name>person <f.s.OR><f.struct>1st</f.struct> <f.struct>2nd</f.struct> <f.struct>3rd</f.struct> </f.s.OR> </feature> <feature><f.name>tense <f.struct>preterite</feature> </f.struct>
Wash <f.struct>&nn; </f.struct> sinks <f.struct>&vbz; </f.struct> . <f.struct>&punct.stop;</f.struct>
<!-- BASE CATEGORIES -->
<!-- Each entity below expands to a single CATEGORY feature (AB and AP -->
<!-- additionally carry a POSITION feature).                           -->
<!ENTITY v
  "<feature><f.name> category </f.name> <f.struct> verb </f.struct> </feature>">
<!ENTITY adv
  "<feature><f.name> category </f.name> <f.struct> adverb </f.struct> </feature>">
<!ENTITY n
  "<feature><f.name> category </f.name> <f.struct> noun </f.struct> </feature>">
<!ENTITY pron
  "<feature><f.name> category </f.name> <f.struct> pronoun </f.struct> </feature>">
<!ENTITY conj
  "<feature><f.name> category </f.name> <f.struct> conjunction</f.struct> </feature>">
<!ENTITY num
  "<feature><f.name> category </f.name> <f.struct> numeral </f.struct> </feature>">

<!-- The determiner-pronoun class covers determiners, quantifiers, and -->
<!-- qualifiers that can act either as determiners or pronominally.   -->
<!-- AB subclass: pre-qualifiers and pre-quantifiers.                  -->
<!ENTITY AB
  "<feature><f.name> category </f.name> <f.struct> determiner-pronoun</f.struct> </feature> <feature><f.name> position </f.name> <f.struct> pre-posed</f.struct> </feature>">
<!-- AP subclass: post-determiner/pronoun.                             -->
<!ENTITY AP
  "<feature><f.name> category </f.name> <f.struct> determiner-pronoun</f.struct> </feature> <feature><f.name> position </f.name> <f.struct> post-posed</f.struct> </feature>">

<!ENTITY det
  "<feature><f.name> category </f.name> <f.struct> determiner </f.struct> </feature>">
<!ENTITY article
  "<feature><f.name> category </f.name> <f.struct> article </f.struct> </feature>">
<!ENTITY ex
  "<feature><f.name> category </f.name> <f.struct> existential THERE</f.struct> </feature>">
<!ENTITY prep
  "<feature><f.name> category </f.name> <f.struct> preposition </f.struct> </feature>">
<!ENTITY adj
  "<feature><f.name> category </f.name> <f.struct> adjective </f.struct> </feature>">
<!ENTITY qual
  "<feature><f.name> category </f.name> <f.struct> qualifier </f.struct> </feature>">
<!ENTITY to
  "<feature><f.name> category </f.name> <f.struct> infinitival TO </f.struct> </feature>">
<!ENTITY uh
  "<feature><f.name> category </f.name> <f.struct> interjection </f.struct> </feature>">
<!ENTITY wh
  "<feature><f.name> category </f.name> <f.struct> WH-determiner </f.struct> </feature>">
<!ENTITY not
  "<feature><f.name> category </f.name> <f.struct> NOT </f.struct> </feature>">
<!ENTITY letter
  "<feature><f.name> category </f.name> <f.struct> letter </f.struct> </feature>">
<!ENTITY punct
  "<feature><f.name> category </f.name> <f.struct> punctuation </f.struct> </feature>">
<!ENTITY formula
  "<feature><f.name> category </f.name> <f.struct> formula </f.struct> </feature>">
<!ENTITY foreign
  "<feature><f.name> category </f.name> <f.struct> foreign phrase </f.struct> </feature>">
<!-- VERBS -->
<!-- LOB separates lexical verbs, auxiliaries, and modals. Here the    -->
<!-- distinction is carried by two binary features (AUX, MOD) plus a   -->
<!-- lexical-item feature on the auxiliaries.                          -->
<!-- A single feature with the values LEXICAL, MODAL, BE, DO, HAVE     -->
<!-- would mirror the LOB tag construction more closely, but seems     -->
<!-- less general.                                                     -->

<!-- Lexical verbs: -AUX -MOD -->
<!ENTITY vb.lex
  "&v; <feature><f.name>AUX</f.name><minus></feature> <feature><f.name>MOD</f.name><minus></feature>">

<!-- Modal verbs: +AUX +MOD -->
<!ENTITY vb.mod
  "&v; <feature><f.name>AUX</f.name><plus></feature> <feature><f.name>MOD</f.name><plus></feature>">

<!-- Auxiliaries: +AUX -MOD, each with its own lexical item -->
<!ENTITY vb.be
  "&v; <feature><f.name>AUX</f.name><plus></feature> <feature><f.name>MOD</f.name><minus></feature> <feature><f.name> Lexical item</f.name> <f.struct> be </f.struct> </feature>">
<!ENTITY vb.do
  "&v; <feature><f.name>AUX</f.name><plus></feature> <feature><f.name>MOD</f.name><minus></feature> <feature><f.name> Lexical item</f.name> <f.struct> do </f.struct> </feature>">
<!ENTITY vb.have
  "&v; <feature><f.name>AUX</f.name><plus></feature> <feature><f.name>MOD</f.name><minus></feature> <feature><f.name> Lexical item</f.name> <f.struct> have </f.struct> </feature>">
<!-- NOUNS -->
<!-- LOB separates common from proper nouns.                           -->
<!-- A common noun may additionally be marked as capped: a common noun -->
<!-- habitually written with an uppercase initial that still behaves   -->
<!-- syntactically and morphologically as a common noun.               -->
<!-- Examples: Jew, Englishman, the English, Urdu, a Thatcherite,      -->
<!-- an Etonian, Gaullism.                                             -->
<!-- A proper noun may additionally be marked as locative or titular.  -->
<!-- Locatives are locative words written with an initial capital,     -->
<!-- e.g. Bay, Bight, Cape, Firth, Hill, \0Is, Island, Isle, Lake,     -->
<!-- Loch, \0Mt, Mount, Mountain, Peninsula, Plain, Point, \0Rd, Road, -->
<!-- \0St, Street, Square, Valley, Wood. Loch_NPL Ness_NP, the         -->
<!-- Firth_NPL of Forth_NP, the Houses_NPLS of Parliament_NP.          -->
<!-- A single feature with the values COMMON, PROP, PROPTIT, PROPLOC,  -->
<!-- CAP would also work; as for verbs, the more general construction  -->
<!-- is preferred.                                                     -->
<!-- LOB also marks some special cases: nouns of measure (UNIT), cited -->
<!-- words, and nouns used adverbially.                                -->

<!-- Common nouns: -PROPER, -CAP, otherwise unmarked. -->
<!ENTITY n.com
  "&n; <feature><f.name>proper </f.name><minus> </feature> <feature><f.name>capitalized </f.name><minus> </feature> <feature><f.name>unit noun </f.name><minus> </feature> <feature><f.name>cited word </f.name><minus> </feature> <feature><f.name>noun-as-adv </f.name><minus> </feature>">

<!-- Capitalized nouns: -PROPER, +CAP. -->
<!ENTITY n.cap
  "&n; <feature><f.name>proper </f.name><minus> </feature> <feature><f.name>capitalized </f.name><plus> </feature> <feature><f.name>unit noun </f.name><minus> </feature> <feature><f.name>cited word </f.name><minus> </feature> <feature><f.name>noun-as-adv </f.name><minus> </feature>">

<!-- Proper nouns: +PROPER, +CAP. LOB apparently does not recognize    -->
<!-- -CAP proper nouns. (Treatment of 'van' and 'de' should be checked -->
<!-- to make sure this is correct.)                                    -->
<!ENTITY n.proper
  "&n; <feature><f.name>proper </f.name><plus> </feature> <feature><f.name>capitalized </f.name><plus> </feature> <feature><f.name>unit noun </f.name><minus> </feature> <feature><f.name>cited word </f.name><minus> </feature> <feature><f.name>noun-as-adv </f.name><minus> </feature>">

<!-- Locative proper nouns: +LOC -TITLE -->
<!ENTITY np.loc
  "&n; <feature><f.name>proper </f.name><plus> </feature> <feature><f.name>capitalized </f.name><plus> </feature> <feature><f.name>locative </f.name><plus> </feature> <feature><f.name>title </f.name><minus> </feature> <feature><f.name>unit noun </f.name><minus> </feature> <feature><f.name>cited word </f.name><minus> </feature> <feature><f.name>noun-as-adv </f.name><minus> </feature>">

<!-- Titles: -LOC +TITLE -->
<!ENTITY np.title
  "&n; <feature><f.name>proper </f.name><plus> </feature> <feature><f.name>capitalized </f.name><plus> </feature> <feature><f.name>locative </f.name><minus> </feature> <feature><f.name>title </f.name><plus> </feature> <feature><f.name>unit noun </f.name><minus> </feature> <feature><f.name>cited word </f.name><minus> </feature> <feature><f.name>noun-as-adv </f.name><minus> </feature>">

<!-- Cited nouns: tagged by LOB as otherwise like common nouns. -->
<!ENTITY n.cited
  "&n; <feature><f.name>proper </f.name><minus> </feature> <feature><f.name>capitalized </f.name><minus> </feature> <feature><f.name>unit noun </f.name><minus> </feature> <feature><f.name>cited word </f.name><plus> </feature> <feature><f.name>noun-as-adv </f.name><minus> </feature>">

<!-- Unit nouns: otherwise like common nouns. -->
<!ENTITY n.unit
  "&n; <feature><f.name>proper </f.name><minus> </feature> <feature><f.name>capitalized </f.name><minus> </feature> <feature><f.name>unit noun </f.name><plus> </feature> <feature><f.name>cited word </f.name><minus> </feature> <feature><f.name>noun-as-adv </f.name><minus> </feature>">

<!-- Adverbial nouns: otherwise like common nouns. -->
<!ENTITY n.adverb
  "&n; <feature><f.name>proper </f.name><minus> </feature> <feature><f.name>capitalized </f.name><minus> </feature> <feature><f.name>unit noun </f.name><minus> </feature> <feature><f.name>cited word </f.name><minus> </feature> <feature><f.name>noun-as-adv </f.name><plus> </feature>">

<!-- Note that LOB does not define an orthogonal set of tags for the   -->
<!-- various imaginable interactions among these features.             -->
<!-- ADVERBS -->
<!-- LOB distinguishes denominative, prepositional, particle, and      -->
<!-- other (unmarked) adverbs.                                         -->
<!-- Every adverb subclass builds on the adverb base category (&adv;), -->
<!-- not on the pronoun category.                                      -->

<!-- adv.nom: nominal adverbs, e.g. here, now, ... -->
<!ENTITY adv.nom
  "&adv; <feature><f.name> adv.type </f.name> <f.struct> denominative </f.struct> </feature>">

<!-- adv.prep: adverb homographs of prepositions -->
<!ENTITY adv.prep
  "&adv; <feature><f.name> adv.type </f.name> <f.struct> prepositional </f.struct> </feature>">

<!-- adv.part: adverbial particles like 'back' ... -->
<!-- NOTE(review): the value string "participial" is kept unchanged    -->
<!-- for compatibility, although these words are particles rather      -->
<!-- than participles; confirm before renaming the value.              -->
<!ENTITY adv.part
  "&adv; <feature><f.name> adv.type </f.name> <f.struct> participial </f.struct> </feature>">

<!-- adv.com: adverbs with no special subtype -->
<!ENTITY adv.com
  "&adv; <feature><f.name> adv.type </f.name> <f.struct> unmarked </f.struct> </feature>">
<!-- PRONOUNS -->
<!-- LOB separates nominal pronouns (anybody, anyone, anything,        -->
<!-- everybody, ...), determiners, personal pronouns, and reflexive    -->
<!-- pronouns; the PRON.TYPE feature records which.                    -->
<!ENTITY pro.nom
  "&pron; <feature><f.name> pron.type </f.name> <f.struct> nominal </f.struct> </feature>">

<!-- Possessive pronominal determiners include "my" etc. -->
<!ENTITY pro.det
  "&pron; <feature><f.name> pron.type </f.name> <f.struct> determiner </f.struct> </feature>">
<!ENTITY pro.pers
  "&pron; <feature><f.name> pron.type </f.name> <f.struct> personal </f.struct> </feature>">
<!ENTITY pro.refl
  "&pron; <feature><f.name> pron.type </f.name> <f.struct> reflexive </f.struct> </feature>">
<!-- CONJUNCTIONS -->
<!-- Coordinating (CC) versus subordinating (CS) conjunctions, encoded -->
<!-- as a binary SUBORDINATING feature on the conjunction category.    -->
<!ENTITY CC
  "&conj; <feature><f.name>subordinating</f.name><minus> </feature>">
<!ENTITY CS
  "&conj; <feature><f.name>subordinating</f.name><plus> </feature>">
<!-- NUMERALS -->
<!-- LOB distinguishes cardinals and ordinals. Other distinctions are  -->
<!-- made, and may be found below.                                     -->
<!-- Both entities build on the numeral base category through an       -->
<!-- explicit reference to the "num" entity declared in this file; a   -->
<!-- bare number sign would insert literal character data rather than  -->
<!-- the CATEGORY feature.                                             -->
<!ENTITY num.card
  "&num; <feature><f.name>ordinal</f.name><minus> </feature>">
<!ENTITY num.ord
  "&num; <feature><f.name>ordinal</f.name><plus> </feature>">
<!-- PREPOSED PRONOUN-DETERMINER -->
<!-- Qualifiers versus quantifiers within the AB class, recorded in a  -->
<!-- DET.TYPE feature.                                                 -->
<!ENTITY AB.qual
  "&AB; <feature><f.name> det.type </f.name> <f.struct> qualifier </f.struct> </feature>">
<!ENTITY AB.quant
  "&AB; <feature><f.name> det.type </f.name> <f.struct> quantifier </f.struct> </feature>">
<!-- ADJECTIVES -->
<!-- Attributive-only adjectives versus adjectives usable both         -->
<!-- attributively and predicatively, as a binary ATTRIB-ONLY feature. -->
<!ENTITY jj.attr
  "<feature><f.name>attrib-only</f.name><plus> </feature>">
<!ENTITY jj.pred
  "<feature><f.name>attrib-only</f.name><minus> </feature>">
<!-- WH-pronouns -->
<!-- LOB distinguishes determiners, pronouns, and relatives. The first -->
<!-- two can be expressed with the CATEGORY feature already defined    -->
<!-- (assuming two values for the same feature are acceptable); the    -->
<!-- last needs the binary RELATIVE feature declared here.             -->
<!ENTITY rel.yes
  "<feature><f.name>relative</f.name><plus> </feature>">
<!ENTITY rel.no
  "<feature><f.name>relative</f.name><minus> </feature>">
<!-- PUNCTUATION -->
<!-- LOB distinguishes !, open and close bracket, open and close       -->
<!-- quote, dash, comma, stop, ellipsis, colon, semicolon, and         -->
<!-- question mark. Each entity records the mark in a CHARACTER        -->
<!-- feature.                                                          -->
<!-- Character entity references are written with an explicit ";"      -->
<!-- terminator, matching every other reference in this file, so they  -->
<!-- do not depend on a following space to end the reference.          -->
<!ENTITY p.bang
  "<feature><f.name>character</f.name> <f.struct> ! </f.struct> </feature>">
<!ENTITY p.openbr
  "<feature><f.name>character</f.name> <f.struct> ( </f.struct> </feature>">
<!ENTITY p.closbr
  "<feature><f.name>character</f.name> <f.struct> ) </f.struct> </feature>">
<!ENTITY p.openq
  "<feature><f.name>character</f.name> <f.struct> &ldquo; </f.struct> </feature>">
<!ENTITY p.closq
  "<feature><f.name>character</f.name> <f.struct> &rdquo; </f.struct> </feature>">
<!ENTITY p.dash
  "<feature><f.name>character</f.name> <f.struct> &dash; </f.struct> </feature>">
<!ENTITY p.comma
  "<feature><f.name>character</f.name> <f.struct> , </f.struct> </feature>">
<!ENTITY p.stop
  "<feature><f.name>character</f.name> <f.struct> . </f.struct> </feature>">
<!ENTITY p.ellips
  "<feature><f.name>character</f.name> <f.struct> &hellip; </f.struct> </feature>">
<!ENTITY p.colon
  "<feature><f.name>character</f.name> <f.struct> : </f.struct> </feature>">
<!ENTITY p.semi
  "<feature><f.name>character</f.name> <f.struct> ; </f.struct> </feature>">
<!ENTITY p.query
  "<feature><f.name>character</f.name> <f.struct> ? </f.struct> </feature>">
<!-- Number: English words marked for number are singular or plural.   -->
<!-- The feature applies to verbs, nouns, pronouns, and numerals.      -->
<!ENTITY sing
  "<feature><f.name> number </f.name> <f.struct> singular </f.struct> </feature>">
<!ENTITY plur
  "<feature><f.name> number </f.name> <f.struct> plural </f.struct> </feature>">

<!-- "unmarked" is a placeholder value: it states explicitly that a    -->
<!-- word is not marked for number, instead of omitting the feature or -->
<!-- listing every alternative exhaustively.                           -->
<!ENTITY num.no
  "<feature><f.name> number </f.name> <f.struct> unmarked </f.struct> </feature>">
<!-- Person: English words marked for person are 1st, 2nd, or 3rd.     -->
<!-- The feature applies to verbs and pronouns.                        -->
<!-- IMPERSONAL is a value for pronouns; UNMARKED is a value for verbs -->
<!-- that carry no person marking. Participles are not marked for      -->
<!-- person and have their own binary feature.                         -->
<!ENTITY p1
  "<feature><f.name> person </f.name> <f.struct> 1st </f.struct> </feature>">
<!ENTITY p2
  "<feature><f.name> person </f.name> <f.struct> 2nd </f.struct> </feature>">
<!ENTITY p3
  "<feature><f.name> person </f.name> <f.struct> 3rd </f.struct> </feature>">
<!ENTITY impers
  "<feature><f.name> person </f.name> <f.struct> none </f.struct> </feature>">

<!-- MINUS is not used here because PERSON is not a binary feature.    -->
<!ENTITY per.no
  "<feature><f.name> person </f.name> <f.struct> unmarked </f.struct> </feature>">

<!-- Binary PARTICIPLE feature. -->
<!ENTITY partic
  "<feature><f.name> participle </f.name> <plus> </feature>">
<!ENTITY par.no
  "<feature><f.name> participle </f.name> <minus> </feature>">
<!-- Tense: English tenses are present and preterite.                  -->
<!-- The feature applies to verbs.                                     -->
<!-- Compound tenses are left out of the word-level tags because they  -->
<!-- are analytic in English. To allow for them elsewhere, e.g. in     -->
<!-- phrase tagging, a future tense and a +/- PERFECTIVE feature are   -->
<!-- added and the Cartesian product is spelled out.                   -->
<!ENTITY present
  "<feature><f.name> tense </f.name> <f.struct> present </f.struct> </feature>">
<!ENTITY preterite
  "<feature><f.name> tense </f.name> <f.struct> preterite </f.struct> </feature>">

<!-- The features above are all that the LOB tags need. The entities   -->
<!-- below are added proleptically for other uses.                     -->
<!ENTITY future
  "<feature><f.name> tense </f.name> <f.struct> future </f.struct> </feature>">
<!ENTITY presperf
  "<feature><f.name> tense </f.name> <f.struct> present </f.struct> </feature> <feature><f.name> perfective </f.name><plus> </feature>">
<!ENTITY pluperf
  "<feature><f.name> tense </f.name> <f.struct> preterite</f.struct> </feature> <feature><f.name> perfective </f.name><plus> </feature>">
<!ENTITY futperf
  "<feature><f.name> tense </f.name> <f.struct> future </f.struct> </feature> <feature><f.name> perfective </f.name><plus> </feature>">
<!-- Degree: English modifiers are positive, comparative, or           -->
<!-- superlative. The feature applies to adverbs and adjectives.       -->
<!ENTITY pos
  "<feature><f.name> degree </f.name> <f.struct> positive </f.struct> </feature>">
<!ENTITY comp
  "<feature><f.name> degree </f.name> <f.struct> comparative </f.struct> </feature>">
<!ENTITY sup
  "<feature><f.name> degree </f.name> <f.struct> superlative </f.struct> </feature>">
<!-- Case: English words marked for case are nom, gen, or acc.         -->
<!-- The feature applies to adverbs (sometimes marked GEN), nouns (NOM -->
<!-- or GEN), pronouns, numerals (sometimes GEN), determiner-pronouns, -->
<!-- and determiners.                                                  -->

<!-- NOM is nominative or "subjective" case. NOM is used rather than   -->
<!-- SUB in the hope of generalizing to other IE languages later.      -->
<!ENTITY nom
  "<feature><f.name> case </f.name> <f.struct> nominative </f.struct> </feature>">
<!ENTITY gen
  "<feature><f.name> case </f.name> <f.struct> genitive </f.struct> </feature>">

<!-- ACC is accusative or "objective" case. ACC is used rather than    -->
<!-- OBJ or OBLIQUE to make other IE languages easier later.           -->
<!ENTITY acc
  "<feature><f.name> case </f.name> <f.struct> accusative </f.struct> </feature>">
<!ENTITY case.no
  "<feature><f.name> case </f.name> <f.struct> unmarked </f.struct> </feature>">
<!-- Gender: English words marked for gender are masculine, feminine,  -->
<!-- neuter, or common; "unmarked" is added just in case.              -->
<!-- The feature applies to personal pronouns (3rd person only).       -->
<!ENTITY masc
  "<feature><f.name> gender </f.name> <f.struct> masculine </f.struct> </feature>">
<!ENTITY fem
  "<feature><f.name> gender </f.name> <f.struct> feminine </f.struct> </feature>">
<!ENTITY neut
  "<feature><f.name> gender </f.name> <f.struct> neuter </f.struct> </feature>">

<!-- Common gender in English means masculine or feminine, so it is    -->
<!-- written as a disjunction. Other languages (Danish, for instance?) -->
<!-- might need it as a distinct value.                                -->
<!ENTITY common
  "<feature><f.name> gender </f.name> <f.s.OR> <f.struct> masculine </f.struct> <f.struct> feminine </f.struct> </f.s.OR> </feature>">
<!ENTITY gend.no
  "<feature><f.name> gender </f.name> <f.struct> unmarked </f.struct> </feature>">
<!-- LOB separates cardinals whose value is 1 from all others.         -->
<!-- Because LOB tokenizes on spaces, hyphenated pairs are also set    -->
<!-- apart; here that is done with a COUNT feature whose value is the  -->
<!-- number of numerals in the unit being tagged.                      -->
<!ENTITY num.one
  "<feature><f.name>unitary value</f.name><plus> </feature>">
<!ENTITY num.plur
  "<feature><f.name>unitary value</f.name><minus> </feature>">
<!ENTITY num.pair
  "<feature><f.name> count </f.name> <f.struct> 2 </f.struct> </feature>">
<!-- LOB sets the word BOTH apart from the other ABNs because it can   -->
<!-- serve as a double conjunction; no distinction is made among the   -->
<!-- uses of BOTH. Determiners likewise distinguish double from single -->
<!-- conjunctions.                                                     -->
<!ENTITY conj.dbl
  "<feature><f.name>double-conj </f.name><plus> </feature>">
<!ENTITY c.dbl.no
  "<feature><f.name>double-conj </f.name><minus> </feature>">
<!-- LOB distinguishes words that can be pre-posed, post-posed, or     -->
<!-- both; two independent binary features record this.                -->
<!ENTITY pre.yes
  "<feature><f.name>preposable </f.name><plus> </feature>">
<!ENTITY pre.no
  "<feature><f.name>preposable </f.name><minus> </feature>">
<!ENTITY post.yes
  "<feature><f.name>postposable </f.name><plus> </feature>">
<!ENTITY post.no
  "<feature><f.name>postposable </f.name><minus> </feature>">
<!-- Simple verbs: VB, VBD, VBG, VBN, VBZ -->
<!-- Each tag combines the lexical-verb class with number, person,     -->
<!-- participle, and tense features.                                   -->
<!-- The participles VBG and VBN carry an explicit unmarked PERSON     -->
<!-- value, like the BE participles BEG and BEN, so that every verb    -->
<!-- tag specifies the same set of features.                           -->
<!ENTITY VB   "&vb.lex; &num.no; &per.no; &par.no; &present;">
<!ENTITY VBD  "&vb.lex; &num.no; &per.no; &par.no; &preterite;">
<!ENTITY VBG  "&vb.lex; &num.no; &per.no; &partic; &present;">
<!ENTITY VBN  "&vb.lex; &num.no; &per.no; &partic; &preterite;">
<!ENTITY VBZ  "&vb.lex; &sing; &p3; &par.no; &present;">
<!-- Modal verbs: MD -->
<!ENTITY MD
  "&vb.mod; &num.no; &per.no; &par.no; &present;">

<!-- BE Auxiliaries: BE, BED, BEDZ, BEG, BEM, BEN, BER, BEZ -->
<!-- A +/- INFINITE feature could distinguish infinitives; except for  -->
<!-- BE, however, the English infinitive is always identical to the    -->
<!-- form unmarked for person and number, and BE marks all forms for   -->
<!-- per/num, so no INFIN feature is needed.                           -->
<!-- NOTE(review): BER uses plural number here, while the tag table in -->
<!-- this file lists BER with NUM=UNMKD; confirm which is intended.    -->
<!ENTITY BE
  "&vb.be; &num.no; &per.no; &par.no; &present;">
<!ENTITY BED
  "&vb.be; &num.no; &per.no; &par.no; &preterite;">
<!ENTITY BEDZ
  "&vb.be; &sing; &p3; &par.no; &preterite;">
<!ENTITY BEG
  "&vb.be; &num.no; &per.no; &partic; &present;">
<!ENTITY BEM
  "&vb.be; &sing; &p1; &par.no; &present;">
<!ENTITY BEN
  "&vb.be; &num.no; &per.no; &partic; &preterite;">
<!ENTITY BER
  "&vb.be; &plur; &per.no; &par.no; &present;">
<!ENTITY BEZ
  "&vb.be; &sing; &p3; &par.no; &present;">
<!-- DO Auxiliaries: DO, DOD, DOZ -->
<!-- Built from the DO auxiliary class plus number, person,            -->
<!-- participle, and tense features.                                   -->
<!ENTITY DO
  "&vb.do; &num.no; &per.no; &par.no; &present;">
<!ENTITY DOD
  "&vb.do; &num.no; &per.no; &par.no; &preterite;">
<!ENTITY DOZ
  "&vb.do; &sing; &p3; &par.no; &present;">
+/-AUX auxiliary /* verb */ +/-MOD modal /* verb */ +/-PROP proper /* noun */ +/-CAP capitalized /* noun, adjective */ +/-SUB subordinating /* conjunction */ +/-ORD ordinal /* number */ +/-PERF perfective /* tensed verbs */ +/-PART participle /* verbs */ +/-LOC locative term /* proper nouns */ +/-TITL title /* proper nouns */ +/-UNIT unit-term /* noun */ +/-CITE cited-word /* noun */ +/-ATTR attributive /* adjectives */ +/-PRED predicative /* adjectives -- redundant? */ +/-DBLC double-conj /* determiner/pronouns, and determiners */ +/-PRE preposable /* ? may precede its head */ +/-POST postposable /* ? may follow its head */ +/-PTCL particle /* ? adverb ?==? inverse of +/-takes-complement? */ +/-REL relative /* pronouns -- alternative to pron.type */ +/-PERS personal /* pronouns -- alternative to pron.type */ +/-REFL reflexive /* pronouns -- alternative to pron.type */ +/-WH WH-word /* pronouns, adverbs */ /* cross-category usages: */ +/-pseudo-adverb /* i.e. can appear in adverbial positions -- noun */ +/-pseudo-noun /* i.e. can appear in noun positions -- adverb */ +/-also-prep /* i.e. is also a preposition -- adverb */ +/-DET /* i.e. is a determiner -- pronoun */ +/-exnoun /* formed from a noun -- pronoun (anybody ...) */
/* Base categories */ CAT category = verb | adverb | noun | pronoun | conjunction | number | determiner | article | THERE | preposition | adjective | qualifier | TO | interjection | [WH] | NOT | letter | punctuation | formula | foreign /* Sub-categorization */ LEX lexitem = (string) /* verbs */ CHAR character = (string) /* punctuation */ CNT count = (integer) /* numbers -- for pairs, ranges */ [ATYP adv.type = nominal | preposition | particle | unmarked ] [prefer binary +/-pseudo-noun +/-also.prep +/-ptcl ] [PTYP pron.type = nominal | determiner | personal | reflexive ] [prefer binary +/-exnoun +/-det +/-pers +/-refl +/-wh +/-rel ] DTYP det.type = qualifier | quantifier /* Categories of Traditional Grammar */ NUM number = singular | plural | unmarked PER person = 1st | 2nd | 3rd | none | unmarked TEN tense = present | preterite | future DEG degree = positive | comparative | superlative CASE case = nominative | genitive | accusative | unmarked GEN gender = masculine | feminine | neuter | unmarked [ | common ]
1 A B L pre-qualifier (quite, rather, such) 7.12 CAT=(DET|PRON), DTYP=QUALIFIER, +PRE 2 A B N pre-quantifier (all, half) 7.12 CAT=(DET|PRON), DTYP=QUANTIFIER, +PRE 3 A B X pre-quantifier/pronoun/double conjunction (both) CAT=(DET|PRON), DTYP=QUANTIFIER, +PRE, +DBLC 4 A P post-determiner/pronoun. CAT=(DET|PRON), +POST 5 A P $ other's CAT=(DET|PRON), +POST, CASE=GEN 6 A P S others CAT=(DET|PRON), +POST, NUM=PLURAL 7 A P S $ others' CAT=(DET|PRON), +POST, CASE=GEN, NUM=PLURAL 8 A T article, singular (a, an, every) 7.12 CAT=ARTICLE, NUM=SINGULAR 9 A T I article, sing or plural (the, no) 7.12 CAT=ARTICLE, NUM=UNMARKED 10 BE be CAT=VERB +AUX -MOD -PART TEN=PRES LEX=BE 11 BE D were CAT=VERB +AUX -MOD -PART TEN=PRET LEX=BE 12 BE D Z was CAT=VERB +AUX -MOD -PART TEN=PRET NUM=SING PER=3 LEX=BE 13 BE G being CAT=VERB +AUX -MOD +PART TEN=PRES LEX=BE 14 BE M am, 'm CAT=VERB +AUX -MOD -PART TEN=PRES NUM=SING PER=1 LEX=BE 15 BE N been CAT=VERB +AUX -MOD +PART TEN=PRET LEX=BE 16 BE R are, 're CAT=VERB +AUX -MOD -PART TEN=PRES NUM=UNMKD PER=UNMKD LEX=BE 17 BE Z is, 's CAT=VERB +AUX -MOD -PART TEN=PRES NUM=SING PER=3 LEX=BE 18 CC coordinating conjunction (and, and/or, but, nor, only, or, yet) CAT=CONJ -SUB 19 CD 2, 3, two, three, hundred, thousand, dozen, zero - 7.17 20 CD $ cardinal + genitive 21 CD -CD hyphenated pair of cardinals 7.17 22 CD 1 one, 1 7.17 23 CD 1 $ one's 24 CD 1 S ones 25 CD S cardinal + plural (tens, millions, dozens, etc.) 26 CS subordinating conjunction (after, although, etc.) 
7.14-15 CAT=CONJ +SUB 27 DO do 7.5 CAT=VERB +AUX -MOD -PART TEN=PRES NUM=UNMKD PER=UNMKD LEX=DO 28 DO D did CAT=VERB +AUX -MOD -PART TEN=PRET NUM=UNMKD PER=UNMKD LEX=DO 29 DO Z does CAT=VERB +AUX -MOD -PART TEN=PRES NUM=SING PER=3 LEX=DO 30 DT singular determiner (another, each, that, this) 7.12 31 DT $ singular determiner + genitive (another's) 32 DT I singular or plural determiner (any, enough, some) 33 DT S plural determiner (those, these) 34 DT X determiner/double conjunction (either, neither) 7.12 35 EX existential 'there' 36 HV have 7.5 CAT=VERB +AUX -MOD -PART TEN=PRES NUM=UNMKD PER=UNMKD LEX=HAVE 37 HV D had, 'd CAT=VERB +AUX -MOD -PART TEN=PRET NUM=UNMKD PER=UNMKD LEX=HAVE 38 HV G having CAT=VERB +AUX -MOD +PART TEN=PRES LEX=HAVE 39 HV N had (past participle) CAT=VERB +AUX -MOD +PART TEN=PRET LEX=HAVE 40 HV Z has, 's CAT=VERB +AUX -MOD -PART TEN=PRES NUM=SING PER=3 LEX=HAVE 41 IN preposition (about, above, etc.) 7.13, 7.15 42 JJ adjective 7.3-4, 7.8-9, 7.11 43 JJ B attributive-only adjective (chief, main, entire, etc.) 44 JJ R comparative adjective 7.9, 7.11 45 JJ T superlative adjective 7.9, 7.11 46 J NP adj with word-initial capital (English, German, etc.) 
47 MD modal auxiliary CAT=VERB +AUX +MOD TEN=PRES NUM=UNMKD PER=UNMKD 48 N C cited word 7.23 NC CAT=NOUN N=SING CASE=NOM -PROP -CAP -UNIT +CITE 49 N N noun, sg, common 7.4, 7.6, 7.7 NN CAT=NOUN N=SING CASE=NOM -PROP -CAP -UNIT -CITE 50 N N $ noun, sg, common, + genitive 7.6 NN$ CAT=NOUN N=SING CASE=GEN -PROP -CAP -UNIT -CITE 51 N N P noun, sg, common, with word-initial capital 7.7 NNP CAT=NOUN N=SING CASE=NOM -PROP +CAP -UNIT -CITE 52 N N P $ noun, sg, common, with word-init cap and genitive NNP$ CAT=NOUN N=SING CASE=GEN -PROP +CAP -UNIT -CITE 53 N N P S noun, pl, common, with word-init cap NNPS CAT=NOUN N=PLUR CASE=NOM -PROP +CAP -UNIT -CITE 54 N N P S $ noun, pl, common, with word-init cap and genitive NNPS$ CAT=NOUN N=PLUR CASE=GEN -PROP +CAP -UNIT -CITE 55 N N S noun, pl, common 7.6, 7.7 NNS CAT=NOUN N=PLUR CASE=NOM -PROP -CAP -UNIT -CITE 56 N N S $ noun, pl, common, + genitive NNS$ CAT=NOUN N=PLUR CASE=GEN -PROP -CAP -UNIT -CITE 57 N N U noun, abbrev unit of measurement (hr., lb., etc.) NNU CAT=NOUN N=SING CASE=NOM -PROP -CAP +UNIT -CITE 58 N N U S noun, abbrev unit of measurement, pl (gns, yds, etc.) 
NNUS CAT=NOUN N=PLUR CASE=NOM -PROP -CAP +UNIT -CITE 59 N P noun, sg, proper 7.7 NP CAT=NOUN N=SING CASE=NOM +PROP +CAP -UNIT -CITE -LOC -TITL -PS.ADV 60 N P $ noun, sg, proper, + genitive NP$ CAT=NOUN N=SING CASE=GEN +PROP +CAP -UNIT -CITE -LOC -TITL -PS.ADV 61 N P L noun, sg, locative with word-initial cap (Abbey, NPL CAT=NOUN N=SING CASE=NOM +PROP +CAP -UNIT -CITE +LOC -TITL -PS.ADV 62 N P L $ ditto + genitive NPL$ CAT=NOUN N=SING CASE=GEN +PROP +CAP -UNIT -CITE +LOC -TITL -PS.ADV 63 N P L S noun, pl, locative with word-initial cap NPLS CAT=NOUN N=PLUR CASE=NOM +PROP +CAP -UNIT -CITE +LOC -TITL -PS.ADV 64 N P L S $ ditto + genitive NPLS$ CAT=NOUN N=PLUR CASE=GEN +PROP +CAP -UNIT -CITE +LOC -TITL -PS.ADV 65 N P S noun, pl, proper 7.7 NPS CAT=NOUN N=PLUR CASE=NOM +PROP +CAP -UNIT -CITE -LOC -TITL -PS.ADV 66 N P S $ noun, pl, proper, + genitive NPS$ CAT=NOUN N=PLUR CASE=GEN +PROP +CAP -UNIT -CITE -LOC -TITL -PS.ADV 67 N P T noun, sg, titular with word-initial cap NPT CAT=NOUN N=SING CASE=NOM +PROP +CAP -UNIT -CITE -LOC +TITL -PS.ADV 68 N P T $ noun, sg, titular, cap, + genitive NPT$ CAT=NOUN N=SING CASE=GEN +PROP +CAP -UNIT -CITE -LOC +TITL -PS.ADV 69 N P T S noun, pl, titular, cap NPTS CAT=NOUN N=PLUR CASE=NOM +PROP +CAP -UNIT -CITE -LOC +TITL -PS.ADV 70 N P T S $ noun, pl, titular, cap, + genitive NPTS$ CAT=NOUN N=PLUR CASE=GEN +PROP +CAP -UNIT -CITE -LOC +TITL -PS.ADV 71 N R noun, sg, adverbial (Jan, Feb, east, today, NR CAT=NOUN N=SING CASE=NOM -PROP -CAP -UNIT -CITE -LOC -TITL +PS.ADV 72 N R $ noun, sg, adverbial + genitive NR$ CAT=NOUN N=SING CASE=GEN -PROP -CAP -UNIT -CITE -LOC -TITL +PS.ADV 73 N R S noun, pl, adverbial NRS CAT=NOUN N=PLUR CASE=NOM -PROP -CAP -UNIT -CITE -LOC -TITL +PS.ADV 74 N R S $ noun, pl, adverbial + genitive NRS$ CAT=NOUN N=PLUR CASE=GEN -PROP -CAP -UNIT -CITE -LOC -TITL +PS.ADV 75 OD ordinal (1st, 2nd, first, ...) 
7.17 76 OD $ ordinal + genitive 77 P N nominal pron (anybody, anyone, anything; everybody, 78 P N $ nominal pron + genitive 79 P P $ poss determiner (my, your, etc.) 7.12 80 P P $$ poss pron (mine, yours, etc.) 81 P P 1 A pers pron, 1st pers sing nom (I) 82 P P 1 A S pers pron, 1st pers plur nom (we) 83 P P 1 O pers pron, 1st pers sing acc (me) 84 P P 1 O S pers pron, 1st pers plur acc (us) 85 P P 2 pers pron, 2nd pers (you, thou, thee, ye) 86 P P 3 pers pron, 3rd pers sing nom + acc (it) 87 P P 3 A pers pron, 3rd pers sing nom (he, she) 88 P P 3 A S pers pron, 3rd pers plur nom (they) 89 P P 3 O pers pron, 3rd pers sing acc (him, her) 90 P P 3 O S pers pron, 3rd pers plur acc (them, 'em) 91 P P L refl pron, sg 92 P P L S refl pron, pl; reciprocal pron 93 QL qualifier (as, awfully, less, more, so, too, very, ...) 94 QL P post-qualifier (enough, indeed) 95 R B adverb 7.10-7.11 CAT=ADV DEG=POS CASE=UNMKD -PSEUDO.NOUN -ALSO.PREP -WH 96 R B $ adverb + genitive (else's) CAT=ADV CASE=GEN -PSEUDO.NOUN -ALSO.PREP -WH 97 R B R comparative adverb CAT=ADV DEG=COMP CASE=UNMKD -PSEUDO.NOUN -ALSO.PREP -WH 98 R B T superlative adverb CAT=ADV DEG=SUP CASE=UNMKD -PSEUDO.NOUN -ALSO.PREP -WH 99 R I adverb (homograph of preposition: below, near, ...) CAT=ADV DEG=POS CASE=UNMKD -PSEUDO.NOUN +ALSO.PREP -PTCL -WH 100 R N nominal adverb (here, now, there, then) 7.10 CAT=ADV DEG=POS CASE=UNMKD +PSEUDO.NOUN -ALSO.PREP -WH 101 R P adverbial particle (back, down, off, ...) 
7.10, 7.13 CAT=ADV DEG=POS CASE=UNMKD -PSEUDO.NOUN +ALSO.PREP +PTCL -WH 102 TO infinitival 'to' CAT=TO 103 UH interjection CAT=INTERJECTION 104 VB base form of verb (uninflected present tense, imper) CAT=VERB -AUX -MOD -PART TEN=PRES NUM=UNMKD PER=UNMKD 105 VB D past tense of verb 7.3 CAT=VERB -AUX -MOD -PART TEN=PRET 106 VB G present participle, gerund 7.4 CAT=VERB -AUX -MOD +PART TEN=PRES 107 VB N past participle 7.3 CAT=VERB -AUX -MOD +PART TEN=PRET 108 VB Z 3rd person sg CAT=VERB -AUX -MOD -PART TEN=PRES NUM=SING PER=3 109 W DT WH-determiner (what, whatever, interrogative 110 W DT R WH-determiner, relative (which) 7.16 111 W P WH-pron, interrogative, nom+acc (who, whoever) 112 W P $ WH-pron, interrogative, gen (whose) 113 W P $ R WH-pron, relative, gen (whose) 114 W P A WH-pron, nom (whosoever) 115 W P O WH-pron, interrogative, acc (whom, whomsoever) 116 W P O R WH-pron, relative, acc (whom) 117 W P R WH-pron, relative, nom+acc (that, relative who) 7.14, 118 W RB WH-adverb (how, when, ...) 7.16 119 XNOT 'not' 120 ZZ letter 121 ! exclamation mark 122 &FO formula 7.22 123 &FW foreign word 7.21 124 ( left bracket (round or square) 125 ) right bracket (round or square) 126 *' begin quote (single or double) 2.6 127 **' end quote (single or double) 2.6 128 *- dash 7.24 129 , comma 7.24 130 . full stop 7.24 131 ... ellipsis 132 : colon 7.24 133 ; semicolon 7.24 134 ? question mark