| /* |
| * Licensed to the Apache Software Foundation (ASF) under one or more |
| * contributor license agreements. See the NOTICE file distributed with |
| * this work for additional information regarding copyright ownership. |
| * The ASF licenses this file to You under the Apache License, Version 2.0 |
| * (the "License"); you may not use this file except in compliance with |
| * the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package org.apache.stanbol.enhancer.nlp.pos; |
| |
| import java.util.Arrays; |
| import java.util.Collection; |
| import java.util.Collections; |
| import java.util.EnumMap; |
| import java.util.EnumSet; |
| import java.util.HashSet; |
| import java.util.Iterator; |
| import java.util.List; |
| import java.util.Map; |
| import java.util.Set; |
| |
| import org.apache.clerezza.rdf.core.UriRef; |
| import org.apache.stanbol.enhancer.nlp.morpho.Tense; |
| |
| import com.ibm.icu.impl.Punycode; |
| |
| |
| /** |
| * Enumeration over all POS (Part of Speach) categories as defined by the |
| * MorphosyntacticCategory class hierarchy og the |
| * <a heref="http://olia.nlp2rdf.org/">Olia</a> Ontology.<p> |
| * The top-level morphosyntactic categories are not defined by this enum, but link |
| * to the {@link LexicalCategory} enumeration. The multi-sub-class hierarchy of the |
| * morphosyntactic categories is also reflected by this enumeration and accessible |
| * via the <ul> |
| * <li> {@link #parents()}: the direct parent categories |
| * <li> {@link #hierarchy()}: the transitive closure |
| * <li> {@link #categories()}: the {@link LexicalCategory LexicalCategories} |
| * </ul> |
| * Enumeration elements that represent classes that are deprecated within the Olia |
| * Ontology are also deprecated within this Enumeration. |
| */ |
| public enum Pos { |
| /** |
| * |
| An attributive adjective is an adjective that qualifies or modifies a noun and that precedes the noun, |
| * e.g."a delicious apple", "a short letter".<br> |
| * (http://en.wikipedia.org/wiki/Adjective 18.09.06) |
| */ |
| AttributiveAdjective(LexicalCategory.Adjective), |
| /** |
| * It is an adjective, which expresses the character and feature of subject or an object, while modifying |
| * a noun. |
| * |
| * <pre> |
| * ང་འ ་ ང ་ འ ག། |
| * Shing-di rim du |
| * 'The tree is tall' |
| * </pre> |
| * |
| * <br> |
| * (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) |
| */ |
| CharacteristicAdjective(LexicalCategory.Adjective), |
| /** |
| * It is an adjective, which expresses the time or period of the circumstances, while modifying a noun. |
| * |
| * <pre> |
| * ན་ ང་ ང་ ་ ལ་ ་ འ ་ ། |
| * Nahing Nga chigyel-lu joyi |
| * 'I went abroad last year' |
| * </pre> |
| * |
| * <br> |
| * (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) |
| */ |
| PeriodicAdjective(LexicalCategory.Adjective), |
| /** |
| * A PossessiveAdjective is an denominal adjective, often derived from a ProperNoun, that serves to |
| * indicate possession in most Slavic languages. Unlike a genitival construction, a possessive adjective |
| * shows agreement with its head noun. (Chiarcos) |
| * <p> |
| * Adjective/Type="possessive" are denominal, not pronominal expressions of possession (Ivan A Derzhanski, |
| * email 2010/06/09). Therefore not to be confused with Pronoun/Type=adjectival(a) (Bulgarian only), for |
| * words like умно /cleverly, wisely, sensibly/, which are derived from adjectives. (Dimitrova et al. |
| * 2009) |
| * <p> |
| * e.g., Slovene dušikovima/dušikov, Marsovi/Marsov, |
| * <p> |
| * Slovak vojvodova/vojvodov, vojvodove/vojvodov, vojvodovej/vojvodov, vojvodovho/vojvodov, |
| * vojvodovi/vojvodov, vojvodovmu/vojvodov, vojvodovo/vojvodov, vojvodovom/vojvodov, vojvodovou/vojvodov, |
| * <p> |
| * Serbian evroazijske/evroazijska, evroazijskih/evroazijski, Goldštajnov, govornikov, Jehovine/Jehovin, |
| * malabarskom/malabarski, O'Brajenov, O'Brajenovog/O'Brajenov, oficirov, |
| * <p> |
| * Czech Riegrovými/Riegrův, Stradellovými/Stradellův, Tristanovou/Tristanův, Wagnerových/Wagnerův, |
| * Wagnerovým/Wagnerův, Weberovi/Weberův, Weberových/Weberův, Wertherovi/Wertherův, Winstonovi/Winstonův <br> |
| * (http://purl.org/olia/mte/multext-east.owl#PossessiveAdjective) |
| */ |
| PossessiveAdjective(LexicalCategory.Adjective), |
| /** |
| * |
| A predicative adjective is one which functions as part of the predicate of a sentence. This means that |
| * it is linked to the noun by a verb, often a copula (such as to be). <br> |
| * (http://en.wikipedia.org/wiki/Adjective 18.09.06) |
| */ |
| PredicativeAdjective(LexicalCategory.Adjective), |
| /** |
| * Relative adjectives express similarity or a comparison. (Schmidt 1999, p.218, |
| * http://purl.org/olia/emille.owl#RelativeAdjective) |
| */ |
| RelativeAdjective(LexicalCategory.Adjective), |
| /** |
| * |
| An adjective that modifies an implied, but not expressed, noun. When translating such an adjective into |
| * English, you must supply the missing noun. (www.southwestern.edu/~carlg/Latin_Web/glossary.html; |
| * http://www.isocat.org/datcat/DC-1394) |
| * <p> |
| * (Chiarcos: this seems to pertain to nominalization) |
| */ |
| SubstantiveAdjective(LexicalCategory.Adjective), |
| /** |
| * |
| Adjective expressing a numeric ranking.<br> |
| * (http://www.isocat.org/datcat/DC-1338) |
| * <p> |
| * Cf. "second", "next", "last" |
| * |
| * @deprecated The DCR definition and this term are incorrect. "Ordinal adjective" entered ISOcat from |
| * MULTEXT-East, where it was originally applied to relational adjectives (Slovene, Resian, |
| * Ukrainian, Czech). "Ordinal adjective" is a mistranslation from Slovene _vrstni pridevniki_ |
| * that should be properly rendered in English as "relational adjective" (Derzhanski and |
| * Kotsyba 2009). However, the Macedonian MULTEXT v.4 guidelines use this category for ordinal |
| * numerals. Due to its inherent ambiguity, this category is to be avoided. |
| */ |
| OrdinalAdjective(LexicalCategory.Adjective), |
| /** |
| * Adjective used to qualify.<br> |
| * (http://www.isocat.org/datcat/DC-1477) |
| */ |
| QualifierAdjective(LexicalCategory.Adjective, LexicalCategory.Quantifier), |
| /** |
| * The Slovene adjective expresses three main ideas: quality (qualitative adjectives, kakovostni |
| * pridevniki), relation (relational adjectives, vrstni pridevniki) and possession (possessive adjectives, |
| * svojilni pridevniki). Relational adjectives express type, class or numerical sequence of a noun. For |
| * instance: kemijska in fizikalna sprememba (chemical and physical change), fotografski aparat |
| * (photographic device (=camera)).<br> |
| * (http://en.wikipedia.org/wiki/Slovene_grammar) |
| */ |
| RelationalAdjective(LexicalCategory.Adjective), |
| /** |
| * A circumposition is an adposition with a part before the noun phrase and a part after. It is much less |
| * common than prepositions or postpositions.<br> |
| * (http://en.wikipedia.org/wiki/Circumposition 19.09.06) |
| */ |
| Circumposition(LexicalCategory.Adposition), |
| /** |
| * A postposition is an adposition that occurs after its complement. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPostposition.htm 19.09.06) |
| */ |
| Postposition(LexicalCategory.Adposition), |
| /** |
| * A preposition is an adposition that occurs before its complement. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPreposition.htm 19.09.06) |
| */ |
| Preposition(LexicalCategory.Adposition), |
| /** |
| * Preposition that is a aggregation of words<br> |
| * (http://www.isocat.org/datcat/DC-1934) |
| */ |
| CompoundPreposition(Preposition), |
| /** |
| * Preposition that is the result of a morphological merge from at least two words. <br> |
| * (http://www.isocat.org/datcat/DC-1901) |
| */ |
| FusedPreposition(Preposition), |
| /** |
| * Preposition that is a pure simple word in contrast with the notion of fused preposition. <br> |
| * (http://www.isocat.org/datcat/DC-1900) |
| */ |
| SimplePreposition(Preposition), |
| /** |
| * An adjectival adverb is an adverb that is formally identical to an adjective.<br/> |
| * MULTEXT-East Adverb/Type="adjectival" (Serbian, Macedonian, Bulgarian)<br/> |
| * Bulgarian AdjectivalAdverbs have the same form as adjectives in Gender = neuter, Person = 3, Number = |
| * singular. (MTE v4, http://purl.org/olia/mte/multext-east.owl#AdjectivalAdverb) |
| */ |
| AdjectivalAdverb(LexicalCategory.Adverb), |
| /** |
| * Adverb/Type="causal" is used in the Hungarian MTE v4, but no examples are provided. <br> |
| * (http://purl.org/olia/mte/multext-east.owl#CausalAdverb) |
| * |
| * @deprecated equivalent to Adverb and hasSemanticRole some CauseRole |
| */ |
| CausalAdverb(LexicalCategory.Adverb), |
| /** |
| * Any adverb which modifies an adjective, an adverb, a verbal particle, a preposition, a conjunction or a |
| * determiner is a degree adverb.<br> |
| * (http://xlex.uni-muenster.de/Portal/MTPE/tagsetDescriptionEN.doc, p. 113, 8.1 Degree Adverbs 23.09.06) |
| * <p> |
| * Also known as specifier adverb<br> |
| * (http://www.unlweb.net/unlarium/dictionary/export_tagset.php) |
| */ |
| DegreeAdverb(LexicalCategory.Adverb), |
| /** |
| * equivalent to Adverb and hasSemanticRole some LocationRole |
| */ |
| LocationAdverb(LexicalCategory.Adverb), |
| /** |
| * equivalent to Adverb and hasSemanticRole some MannerRole |
| */ |
| MannerAdverb(LexicalCategory.Adverb), |
| /** |
| * Adverb/Type="modifier" is used in the English, Romanian and Hungarian MTE v4 specs. For Romanian, |
| * Adverb/Type="modifier" applies to adverbs which can have predicative role, that is they can govern a |
| * subordinate sentence (ex. Fireşte că o ştiu -- Certainly I know it). Here (for uniformity within a |
| * multilingual environment), they are squeezed into the modifier class. (MTE v4) e.g., better (en) <br> |
| * (http://purl.org/olia/mte/multext-east.owl#ModifierAdverb) |
| */ |
| ModifierAdverb(LexicalCategory.Adverb), |
| /** |
| * Adverb/Type="negative" are used in the Serbian and Romanian MTE v4 specs, e.g., for Romanian nicăieri - |
| * nowhere, niciodată - never. (MTE v4)<br> |
| * (http://purl.org/olia/mte/multext-east.owl#NegativeAdverb) |
| */ |
| NegativeAdverb(LexicalCategory.Adverb), |
| /** |
| * Pronominal adverbs substitute for a preposition (which is incorporated into them) and an NP, cf. |
| * English therefore lit. "for this (reason, ...)", German deswegen lit. "because of this (reason, ...)". <br> |
| * (http://www.ilc.cnr.it/EAGLES96/elm_de/node235.html 21.09.06, examples Ch. Chiarcos) |
| */ |
| PronominalAdverb(LexicalCategory.Adverb), |
| /** |
| * Pronominal adverb derived from a demonstrative stem (Ch. Chiarcos) |
| */ |
| DemonstrativeAdverb(PronominalAdverb), |
| /** |
| * Adverb/Type="verbal" applies to adverbs derived from from verbs (verbal adverbs) in the Serbian, |
| * Macedonian and Hungarian MTE v4 specs. Macedonian verbal adverbs (gerunds) like odejkji are thus not |
| * considered as verbal forms, but as Adverb/Type="verbal". (MTE v4) <br> |
| * (http://purl.org/olia/mte/multext-east.owl#VerbalAdverb) |
| */ |
| VerbalAdverb(LexicalCategory.Adverb), |
| /** |
| * Adverb that serves to express interrogativity, exclamation or that serves to link a subordinate clause |
| * to the matrix clause. (Ch. Chiarcos) |
| */ |
| WHTypeAdverbs(LexicalCategory.Adverb), |
| /** |
| * An ExclamatoryAdverb seves to express exclamation, cf. how in "How well everyone played!" |
| * <p> |
| * Exclamative sentences or exclamatives An exclamatory sentence or exclamation is generally a more |
| * emphatic form of statement, in particular, they are used are used to express strong feelings (Latin |
| * exclamare : "to call out, to cry out"). <br> |
| * (http://english.unitecnology.ac.nz/resources/resources/exp_lang/sentence.html 07.05.07, |
| * http://en.wikipedia.org/wiki/Sentence_(linguistics) 07.05.07) |
| */ |
| ExclamatoryAdverb(WHTypeAdverbs), |
| /** |
| * Interrogative adverbs are used to introduce questions, e.g. "When are you coming?" (Angelika Adam) |
| */ |
| InterrogativeAdverb(WHTypeAdverbs), |
| /** |
| * The value relative is used for adverbs in clear relative cases as in: "The place 'where' I met you.", |
| * "The reason 'why' I did it."<br> |
| * (http://www.ilc.cnr.it/EAGLES96/pub/eagles/lexicons/elm_en.ps.gz, p.33, 07.05.07) |
| */ |
| RelativeAdverb(WHTypeAdverbs), |
| /** |
| * Multi-word conjunction |
| * <p> |
| * Besides the usual and, or, but, etc., certain prepositions and subordinating conjunctions can be used |
| * as coordinating conjunctions. Multi-word coordinating conjunctions are labeled CONJP (see section 7 |
| * [Coordination]). ... CONJP — Conjunction Phrase. Used to mark certain “multi-word” conjunctions, such |
| * as as well as, instead of. (Bies et al. 1995) |
| */ |
| ConjunctionPhrase(LexicalCategory.Conjuction), |
| /** |
| * Coordinating conjunctions, also called coordinators, are conjunctions that join two items of equal |
| * syntactic importance.<br> |
| * (http://en.wikipedia.org/wiki/Grammatical_conjunction 19.09.06) |
| */ |
| CoordinatingConjunction(LexicalCategory.Conjuction), |
| /** |
| * When the same word is also placed before the first conjunct, as in French "ou...ou...", the former |
| * occurrence is given the Correlative value and the latter the Simple value. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1av 17.11.06) |
| * <p> |
| * Conjunction/Coord_Type="correlat" (Romanian). In Romanian, there are three kinds of conjunctions |
| * depending on their usage: as such or together with other conjunctions or adverbs: (1) simple, between |
| * conjuncts: Ion ori Maria (John or Mary); (2) repetitive, before each conjunct: fie Ion fie Maria fie... |
| * (either John or Mary or...) (3) correlative, before a conjoined phrase, it requires specific |
| * coordinators between conjuncts: atât mama cât şi tata (both mother and father). (MTE v4, |
| * http://purl.org/olia/mte/multext-east.owl#CorrelativeCoordinatingConjunction) |
| */ |
| CorrelativeCoordinatingConjunction(CoordinatingConjunction), |
| /** |
| * When two distinct words occur, as in German "weder...noch...", then the first is given the Initial |
| * value.<br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1av 17.11.06) |
| */ |
| InitialCoordinatingConjunction(CoordinatingConjunction), |
| /** |
| * When two distinct words occur, as in German weder...noch..., then the second is given the Non-initial |
| * value.<br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1av 17.11.06) |
| */ |
| NonInitialCoordinatingConjunction(CoordinatingConjunction), |
| /** |
| * Conjunction/Coord_Type="repetit" (Romanian). In Romanian, there are three kinds of conjunctions |
| * depending on their usage: as such or together with other conjunctions or adverbs: (1) simple, between |
| * conjuncts: Ion ori Maria (John or Mary); (2) repetitive, before each conjunct: fie Ion fie Maria fie... |
| * (either John or Mary or...) (3) correlative, before a conjoined phrase, it requires specific |
| * coordinators between conjuncts: atât mama cât şi tata (both mother and father). (MTE v4, |
| * http://purl.org/olia/mte/multext-east.owl#RepetitiveCoordinatingConjunction) |
| */ |
| RepetitiveCoordinatingConjunction(CoordinatingConjunction), |
| /** |
| * Simple applies to the regular type of coordinator occurring between conjuncts: German und, for example. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1av 17.11.06) |
| * <p> |
| * In the Romanian MTE v4 specs, Conjunction/Coord_Type="simple" is defined in contrast to repetitive and |
| * correlative coordinating conjunctions. In Romanian, there are three kinds of conjunctions depending on |
| * their usage: as such or together with other conjunctions or adverbs: (1) simple, between conjuncts: Ion |
| * ori Maria (John or Mary); (2) repetitive, before each conjunct: fie Ion fie Maria fie... (either John |
| * or Mary or...) (3) correlative, before a conjoined phrase, it requires specific coordinators between |
| * conjuncts: atât mama cât şi tata (both mother and father). (MTE v4), e.g., aşa_că, va_să_zică (ro) <br> |
| * (http://purl.org/olia/mte/multext-east.owl#SimpleCoordinatingConjunction) |
| */ |
| SimpleCoordinatingConjunction(CoordinatingConjunction), |
| /** |
| * Subordinating conjunctions, also called subordinators, are conjunctions that introduce a dependent |
| * clause.<br> |
| * (http://en.wikipedia.org/wiki/Grammatical_conjunction 19.09.06) |
| */ |
| SubordinatingConjunction(LexicalCategory.Conjuction), |
| /** |
| * |
| For example, in German the subordinating conjunction "als" is followed by various kinds of comparative |
| * clause (including clauses without finite verbs). <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node19.html#oav2u 17.11.06) |
| */ |
| SubordinatingConjunctionWithComparative(SubordinatingConjunction), |
| /** |
| * For example, in German the subordinating conjunction "weil" introduces a clause with a finite verb. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node19.html#oav2u 17.11.06) |
| */ |
| SubordinatingConjunctionWithFiniteClause(SubordinatingConjunction), |
| /** |
| * For example, in German the subordinating conjunction "ohne" ("zu"...) is followed by an infinitive. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node19.html#oav2u 17.11.06) |
| */ |
| SubordinatingConjunctionWithInfinite(SubordinatingConjunction), |
| /** |
| * Conjunction/Sub_Type="negative" (Romanian, Serbian, Russian) In Romanian, each conjunction requires |
| * another mood, so that the diversity may be controlled by subcategorisation rules. The attribute |
| * Sub_Type distinguishes among the positive and negative conjunctions, providing means to control verbal |
| * double negation, (as in case of the negative pronouns, determiners and adverbs): nici NU am venit, |
| * nimeni NU vorbeşte, nici_un tren N-a trecut, nicăieri N-am văzut (MTE v4, |
| * http://purl.org/olia/mte/multext-east.owl#NegativeSubordinatingConjunction) |
| */ |
| SubordinatingConjunctionWithNegation(SubordinatingConjunction), |
| /** |
| * Conjunction/Sub_Type="negative" (Romanian, Serbian, Russian) In Romanian, each conjunction requires |
| * another mood, so that the diversity may be controlled by subcategorisation rules. The attribute |
| * Sub_Type distinguishes among the positive and negative conjunctions, providing means to control verbal |
| * double negation, (as in case of the negative pronouns, determiners and adverbs): nici NU am venit, |
| * nimeni NU vorbeşte, nici_un tren N-a trecut, nicăieri N-am văzut (MTE v4, |
| * http://purl.org/olia/mte/multext-east.owl#PositiveSubordinatingConjunction) |
| */ |
| SubordinatingConjunctionWithoutNegation(SubordinatingConjunction), |
| /** |
| * 0|Zero represents a zero complementizer (= subordinating conjunction); it may need to be deleted. The |
| * zero complementizer is generally the counterpart of the overt complementizer that. Example: Iâ ¹m |
| * sure 0 heâ ¹ll be here any minute. ... |
| * <p> |
| * 0 stands in for overt subordinating conjunctions like that in tensed subordinate clauses, including |
| * relative clauses. So the relative clause the man I saw should be bracketed as follows: (NP (NP the man) |
| * (SBAR 0 (S (NP I) (VP saw) (NP T))))) |
| * |
| * (Santorini 1991) |
| */ |
| ZeroComplementizer(SubordinatingConjunction), |
| /** |
| * |
| An interjection is a form, typically brief, such as one syllable or word, which is used most often as |
| * an exclamation or part of an exclamation. It typically expresses an emotional reaction, often with |
| * respect to an accompanying sentence and may include a combination of sounds not otherwise found in the |
| * language, e.g. in English: psst; ugh; well, well <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnInterjection.htm 19.09.06) |
| */ |
| Interjection(LexicalCategory.Conjuction), |
| /** |
| * A common noun is a noun that signifies a non-specific member of a group. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsACommonNoun.htm 19.09.06) |
| */ |
| CommonNoun(LexicalCategory.Noun), |
| /** |
| * Dzongkha uses honorific forms: ན་བཟའ་/nam za/ (cloths) is the honorific form of the noun གོ་ |
| * ལ་/gola/(cloths), གསངས་/sung/(tell) the honorific form of the verb སབ་/lab/(tell). We opted to mark |
| * them by adding the tag NNH (honorific common noun) and VBH (honorific verb) to enable future research |
| * on this specific usage of Dzongkha language. A number of tags were added to the set, of which we |
| * describe four in more detail: two of the additional tags are subclasses of verbs: VBH (honorific verb |
| * form), and VBN which describes past participle forms, like, e.g. བངམ་/jun/(created), the past particle |
| * form of བང་/jung/(create). (Chungku et al. 2010) |
| * <p> |
| * A noun, which indicates respect for the person being addressed, e.g., Miwang Gel-poi Yab “A king's |
| * father” [Though father=Apa, but colloquially we say YAB in Dzongkha] <br> |
| * (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) |
| */ |
| HonorificCommonNoun(CommonNoun), |
| /** |
| * A title designates the function or the social status of an individual. Often, it accompanies a proper |
| * noun, but it can also be used in place of a proper noun (if the bearer of the title is contextually |
| * unambiguous). E.g. "The/Det German/Adj Chancellor/Title Angela/Name Merkel/Name said ..." can be used |
| * besides "the German Chancellor said ...". Accordingly, some schemes (e.g., Chungku et al. 2010, for |
| * Dzongkha) group titles together with proper names <br> |
| * (http://purl.org/olia/dzongkha.owl#ParticularPersonNoun). |
| * <p> |
| * However, if multiple people hold the same title, they can be referred to as a group, e.g., |
| * "Since WWII, the politics of the German chancellors always followed ...", and in this usage, titles are |
| * more comparable to common nouns. Functionally, titles are thus an intermediate category between |
| * CommonNoun and ProperNoun (cf. also Mulkern 1996). |
| * <p> |
| * Titles do, however, share important characteristics with common nouns. In English, for example, titles |
| * generally require a definite determiner (unlike proper nouns), even if unambiguous ("the pope"). They |
| * are thus classified here as a subtype of CommonNoun. |
| * <p> |
| * (Ann E. Mulkern. The name of the game. In Jeanette Gundel and Thorstein Fretheim, editors. Reference |
| * and Referent Accessibility: Pragmatics and Beyond. John Benjamins, Amsterdam and Philadelphia, 1996, |
| * pages 235–250.) |
| */ |
| TitleNoun(CommonNoun), |
| /** |
| * Measuring units are frequently used with numerals. However, they have a different syntactic structure |
| * than numerals (Sajjad 2007). |
| * <p> |
| * In European languages, Units are generally expressed as nouns, e.g., English |
| * "ten/Numeral kilogram/Unit". "Kilogram" can also be used as a common noun: |
| * "The kilogram is losing weight"<br> |
| * (http://www.bbc.co.uk/news/science-environment-12276822) |
| * <p> |
| * Hassan Sajjad (2007), Urdu Part of Speech Tagset, version 1.0.0.0, 07-12-2007, Center for research in |
| * Urdu Language Processing. National University of Computer and Emerging Sciences, Lahore, Pakistan, |
| * http://www.crulp.org/Downloads/langproc/UrduPOStagger/UrduPOStagset.pdf |
| */ |
| UnitNoun(CommonNoun), |
| /** |
| * NLOC Noun Location This is an entirely new tag introduced to cover an important phenomenon of Indian |
| * Languages. Words like 'Age', 'upara', 'pahele', 'bAda', etc. are used in various ways in Hindi. |
| * <ol> |
| * <li>They act as a postposition along with 'ke' e.g. ghade ke upara thAlI rakhI HE. ("pot" "on" "plate" |
| * "kept" "is") Here 'ke upara' is a post position which is the direct equivalent of the English |
| * preposition 'on'. |
| * <li>They also act as adverbs. e.g. tuma upara jAo. ("You" "up" "go") Here 'upara' is an adverbial of |
| * place. |
| * <li>These words also take post positions themselves and so in some sense behave like nouns. e.g. vaHa |
| * upara se AyA. ("He" "above" "from" "came") |
| * <li>As pointed out in 3. above, these words take postpositions and act as arguments of the verb in the |
| * sentence. And they also take a post position to join with a another noun. So in that sense also they |
| * behave like nouns. e.g. upara kA HissA ("above" "of" "portion") |
| * </ol> |
| * To tag such words one option is to tag them according to the category to which they belong in the given |
| * sentence. For example in 1. above, the word is occurring as a postposition so can be marked as a |
| * postposition. In example 2. above, it is an adverb so can be marked as an adverb and so on. |
| * <p> |
| * But we feel that these words are more like nouns as is evident from 3. and 4. above, and also if we |
| * consider for examples, 'aage', 'upara', etc. as places which are in front, up, etc then we can tag them |
| * as nouns. |
| * <p> |
| * But these are not pure nouns. They are nouns which indicate a location or time. These also function as |
| * adverbs or prepositions in a context. So a new tag NLOC is introduced for such words. This tag will |
| * cater to a finite set of such words. set: (Age, piche, upara, nIce, bAda, pahele) ("front", "behind", |
| * "above", "below", "before") Such words if tagged according to their syntactic function, it will hamper |
| * machine learning. So a single tag, NLOC has been devised for such words which indicate location and |
| * time. |
| * <p> |
| * e.g., (upara, Age, pahele, bAda) (IIIT (2007), A Part of Speech Tagger for Indian Languages (POS |
| * tagger), Tagset developed at IIIT - Hyderabad after consultations with several institutions through two |
| * workshops. available under http://shiva.iiit.ac.in/SPSAL2007/iiit_tagset_guidelines.pdf) |
| */ |
| SpatiotemporalNoun(CommonNoun), |
| /** |
| * relation noun (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2226) |
| */ |
| RelationNoun(CommonNoun), |
| /** |
| * |
| A countable noun (also count noun) is a noun which can be modified by a numeral and occur in both |
| * singular and plural form, as well as co-occurring with quantificational determiners like every, each, |
| * several, most, etc..<br> |
| * (http://en.wikipedia.org/wiki/Countable_noun 19.09.06) |
| */ |
| CountableNoun(LexicalCategory.Noun), |
| /** |
| * A mass noun (also uncountable noun or non-count noun) can't be modified by a numeral, occur in |
| * singular/plural or co-occur with the relevant kind of determiner. <br> |
| * (http://en.wikipedia.org/wiki/Mass_noun 19.09.06) |
| */ |
| MassNoun(LexicalCategory.Noun), |
| /** |
| * Proper nouns (also called proper names) are the names of unique entities. <br> |
| * (http://en.wikipedia.org/wiki/Noun 19.09.06) |
| */ |
| ProperNoun(LexicalCategory.Noun), |
| /** |
| * diminutive noun (MIRACL LSCA; http://www.isocat.org/datcat/DC-2225) |
| */ |
| DiminutiveNoun(LexicalCategory.Noun), |
| /** |
| * A noun which quantifies one or more things, regardless of subject and an object. |
| * |
| * <pre> |
| * ང་གིས་ བམོ་ ལ་ དང་ ཕད་ཅི། |
| * NGAGI BUM 'NGA 'DA CHECI |
| * I girl five with met |
| * “I met with five girls.” |
| * </pre> |
| * |
| * (Jurmey Rabgay, email Sep 20, 2010) |
| */ |
| NominalQuantifier(LexicalCategory.Noun, LexicalCategory.Quantifier), |
| /** |
| * noun of a voice<br> |
| * (http://www.isocat.org/datcat/DC-2253) |
| */ |
| VoiceNoun(LexicalCategory.Noun), |
| /** |
| * A determiner is a noun modifier that expresses the reference of a noun or noun phrase in the context, |
| * including quantity, rather than attributes expressed by adjectives. This part of speech is defined in |
| * some languages, such as in English, as it is distinct from adjectives grammatically, though most |
| * English dictionaries still identify the determiners as adjectives. <br> |
| * (http://en.wikipedia.org/wiki/Determiner 19.09.06) |
| */ |
| Determiner(LexicalCategory.PronounOrDeterminer), |
| /** |
| * An article is a member of a small class of determiners that identify a noun's definite or indefinite |
| * reference, and the new or given status. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnArticle.htm 02.05.07) |
| */ |
| Article(Determiner), |
| /** |
| * A definite article is used before singular and plural nouns that refer to a particular member of a |
| * group.<br> |
| * (http://en.wikipedia.org/wiki/Article_%28grammar%29 18.09.06) |
| */ |
| DefiniteArticle(Article), |
| /** |
| * clitic definite determiner, e.g., in Macedonian, Bulgarian, and Romanian <br> |
| * (http://purl.org/olia/mte/multext-east.owl#CliticDeterminerType) |
| */ |
| CliticDefiniteArticle(DefiniteArticle), |
| /** |
| * For definiteness, when a specific form is the syntactic subject of the clause. (DFKI; |
| * http://www.isocat.org/datcat/DC-1928) |
| */ |
| FullDefiniteArticle(DefiniteArticle), |
| /** |
| * For definiteness, when a specific form is not the syntactic subject of the clause. <br> |
| * (http://www.isocat.org/datcat/DC-1927) |
| */ |
| ShortDefiniteArticle(DefiniteArticle), |
| /** |
| * The additional value Fused prep-art is for the benefit of those who do not find it practical to split |
| * fused words such as French au (= à + le) into two text words. This very common phenomenon of a fused |
| * preposition + article in West European languages should preferably, however, be handled by assigning |
| * two tags to the same orthographic word (one for the preposition and one for the article). <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1ap 19.09.06) |
| */ |
| FusedPrepArt(Preposition, Article), |
| /** |
| * An indefinite article is used before singular nouns that refer to any member of a group. <br> |
| * (http://en.wikipedia.org/wiki/Article_%28grammar%29 18.09.06) |
| */ |
| IndefiniteArticle(Article), |
| /** |
| * A partitive article indicates an indefinite quantity of a mass noun; there is no partitive article in |
| * English, though the words some or any often have that function. An example is French du / de la / des, |
| * as in Voulez-vous du café? ("Do you want some coffee?" or "Do you want coffee"). <br> |
| * (http://en.wikipedia.org/wiki/Article_(grammar) 19.09.06) |
| */ |
| PartitiveArticle(Article), |
| /** |
| * In Romanian, the possessive article (also called genitival article) is an element in the structure of |
| * the possessive pronoun, of the ordinal numeral (e.g. al meu (mine) and al treilea (the third)), and of |
| * the indefinite genitive forms of the nouns (e.g. capitol al cărţii (chapter of the book)), e.g., |
| * -al/al, a/al, ai/al, al, ale/al, alor/al<br> |
| * (http://purl.org/olia/mte/multext-east.owl#PossessiveArticle) |
| */ |
| PossessiveArticle(Article), |
| /** |
| * "By ʻspecificʼ and ʻnon-specificʼ I intend the difference between the two readings of English |
| * indefinites like (3): |
| * <p> |
| * (3) Iʼm looking for a deer. |
| * <p> |
| * In the specific reading there is a particular deer, say Bambi, that I am looking for. In the |
| * non-specific reading I will be happy to find any deer. Von Heusinger (2002) likes the test in English |
| * of inserting ʻcertainʼ after the ʻaʼ to fix the specific reading. In either reading of (3) a deer is |
| * being introduced as a new discourse referent. This is opposed to ʻdefiniteʼ which requires a previous |
| * pragmatic instantiation as in ʻIʼm looking for the deer.ʼ In English both the readings of (3) are |
| * indefinite. In Klallam, the specific demonstratives are neither definite nor indefinite." |
| * <p> |
| * (Montler, Timothy. 2007. Klallam demonstratives. Papers ICSNL XLVII. The 42nd International Conference |
| * on Salish and Neighbouring Language, pp. 409-425. University of British Columbia Working Papers in |
| * Linguistics, Volume 20; on specific vs. nonspecific determiners in Klallam, a Salish language, |
| * http://montler.net/papers/KlallamDemons.pdf) |
| */ |
| NonspecificDeterminer(Article), |
| /** |
| * "By ʻspecificʼ and ʻnon-specificʼ I intend the difference between the two readings of English |
| * indefinites like (3): |
| * <p> |
| * (3) Iʼm looking for a deer. |
| * <p> |
| * In the specific reading there is a particular deer, say Bambi, that I am looking for. In the |
| * non-specific reading I will be happy to find any deer. Von Heusinger (2002) likes the test in English |
| * of inserting ʻcertainʼ after the ʻaʼ to fix the specific reading. In either reading of (3) a deer is |
| * being introduced as a new discourse referent. This is opposed to ʻdefiniteʼ which requires a previous |
| * pragmatic instantiation as in ʻIʼm looking for the deer.ʼ In English both the readings of (3) are |
| * indefinite. In Klallam, the specific demonstratives are neither definite nor indefinite." |
| * <p> |
| * (Montler, Timothy. 2007. Klallam demonstratives. Papers ICSNL XLVII. The 42nd International Conference |
| * on Salish and Neighbouring Language, pp. 409-425. University of British Columbia Working Papers in |
| * Linguistics, Volume 20; on specific vs. nonspecific determiners in Klallam, a Salish language, |
| * http://montler.net/papers/KlallamDemons.pdf) |
| */ |
| SpecificArticle(Article), |
| /** |
| * Persian does have an article, but it marks specificity rather than definiteness. The Persian article is |
| * similar to the Balkan one (a clitic of pronominal origin that's written together with the word), except |
| * that it isn't exactly definite (you can even see it described as an indefinite article). (Ivan A. |
| * Derzhanski, p.c. 2010/06/18) |
| */ |
| CliticSpecificArticle(SpecificArticle), |
| /** |
| * Determiner/Type="emphatic" (Romanian)<br/> |
| * <p> |
| * In Romanian, there are specific forms for the so-called emphatic determiner, which may accompany both a |
| * noun and a personal pronoun: fata însăşi (the girl herself), also ea însăşi (she herself). e.g., |
| * însele/însumi, însemi/însumi, însene/însumi, însevă/însumi, înseşi/însumi, înseţi/însumi, însumi, |
| * însuşi/însumi, însuţi/însumi<br> |
| * (http://purl.org/olia/mte/multext-east.owl#EmphaticDeterminer) |
| */ |
| EmphaticDeterminer(Determiner), |
| /** |
| * An indefinite determiner is a determiner that expresses a referent's indefinite number or amount, i.e. |
| * "some", "any", "many".<br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAQuantifier.htm 22.09.06) |
| * <p> |
| * Note that here, a separate top-level class Quantifier has been introduced that covers expressions of |
| * number and amount as *semantic* concepts. Plural indefinite determiners are thus to be modeled as |
| * IndefiniteDeteriner and Quantifier. |
| */ |
| IndefiniteDeterminer(Determiner), |
| /** |
| * Determiner/Type="negative" (Romanian)<br/> |
| * In Romanian the negative determiner is expressed by the unit nici + indefinite article (e.g. nici un, |
| * nici o). (MTE v4) |
| * <p> |
| * e.g., nici-o/nici_un, nici_o/nici_un, nici_un, nici_unei/nici_un, nici_unii/nici_un, nici_unor/nici_un, |
| * nici_unui/nici_un<br> |
| * (http://purl.org/olia/mte/multext-east.owl#NegativeDeterminer) |
| */ |
| NegativeDeterminer(IndefiniteDeterminer), |
| /** |
| * A partitive determiner indicates an indefinite quantity of a mass noun; there is no partitive article |
| * in English, though the words some or any often have that function. (Wilson and Leech 1996) |
| */ |
| PartitiveDeterminer(Determiner), |
| /** |
| * Determiner/Type="exceptional" is applied to the Persian uniquitive determiner تنها i.e., "the only" |
| * (MTE v4; Hamidreza Kobdani, email 2010/06/15, |
| * http://purl.org/olia/mte/multext-east.owl#UniquitiveDeterminer) |
| */ |
| UniquitiveDeterminer(Determiner), |
| /** |
| * @deprecated to be replaced by InterrogativeDeterminer or RelativeDeterminer |
| */ |
| WHDeterminer(Determiner), |
| /** |
| * A exclamatory determiner is used in combination with a Nominal Phrase in order to create an exclamation |
| * (a more emphatic form of statement), e.g. "What a lovely colour!", "What a wonderful day this is!" <br> |
| * (http://www.ilc.cnr.it/EAGLES96/pub/eagles/lexicons/elm_en.ps.gz, p.27, 07.05.07; |
| * http://en.wikipedia.org/wiki/Sentence_(linguistics), 07.05.07) |
| */ |
| ExclamatoryDeterminer(WHDeterminer), |
| /** |
| * A interrogative is a function word used to introduce an interrogative clause. E.g. "which", "what", |
| * "whose" (interrogative possessive determiner) are interrogative determiner in English. <br> |
| * (http://en.wikipedia.org/wiki/Interrogative_word 02.05.07) |
| */ |
| InterrogativeDeterminer(WHDeterminer), |
| /** |
| * The relative determiner describes a attributive relative pronoun. In German "wessen" in |
| * "Ich weiss nicht, wessen Auto das ist." or the English "whose" in "The man whose daughter became ill.". |
| * <p> |
| * The relative determiner needs a noun to complete a NP (Nominal Phrase). <br> |
| * (http://www.ilc.cnr.it/EAGLES96/pub/eagles/lexicons/elm_en.ps.gz, p.28, 07.05.07) |
| */ |
| RelativeDeterminer(WHDeterminer), |
| /** |
| * Determiner that refers to the same entity.<br> |
| * (http://www.isocat.org/datcat/DC-1377) |
| */ |
| ReflexiveDeterminer(Determiner), |
| /** |
| * A pronoun is a pro-form which functions like a noun and substitutes for a noun or a noun-phrase. A |
| * language may have several classes of pronouns. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPronoun.htm 19.09.06) |
| * <p> |
| * A pronominal is a phrase that functions as a pronoun |
| * (www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPronominal.htm; |
| * http://www.isocat.org/datcat/DC-1369) |
| */ |
| Pronoun(LexicalCategory.PronounOrDeterminer), |
| /** |
| * An attributive pronoun is a pronoun that modifies an NP. |
| */ |
| AttributivePronoun(Determiner, Pronoun), |
| /** |
| * Demonstratives are deictic expressions (they depend on an external frame of reference) which indicate |
| * entities a speaker refers to, and distinguishes those entities from others. Demonstratives are usually |
| * employed for spatial deixis (using the context of the physical surroundings), but in many languages |
| * they double as discourse deictics, referring not to concrete objects but to words, phrases and |
| * propositions mentioned in speech.<br> |
| * (http://en.wikipedia.org/wiki/Demonstrative 19.09.06) |
| */ |
| DemonstrativeDeterminer(AttributivePronoun), |
| /** |
| * Demonstrative pronouns are deictic words (they depend on an external frame of reference). They indicate |
| * which entities a speaker refers to, and distinguishes those entities from others. <br> |
| * (http://en.wikipedia.org/wiki/Demonstrative_pronoun 19.09.06) |
| */ |
| DemonstrativePronoun(Pronoun), |
| /** |
| * A pronoun, which classifies or differentiates(pronoun) by a single basis, like everybody; each; |
| * individual etc. |
| * |
| * <pre> |
| * འ ག་པ ་ ་ ར་ ག་ར་ ན་ ང་ ང་ཁ་ ས་ད ། |
| * Drupai Miser Gara Enrung Dzongkha ShegÔ |
| * 'Every Bhutanese must know Dzongkha' |
| * </pre> |
| * |
| * <br> |
| * (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) |
| */ |
| DifferentialPronoun(Pronoun), |
| /** |
| * When the subject is conjoined, the reflexive cannot refer to only one of them. The proform has to be a |
| * distributive pronoun, i.e., the reduplicated form, when it has coreference to respective subjects, |
| * e.g., kumaarum_i/Kumar.and umaavum_j/Uma.and tan_i+j/self-poss puunekki/cat.to paalu/milk |
| * kuDuttaanaanga/give-pst-aggr. "*Kumar_i and Uma gave milk to his_i/her_j cat." (Annamalai 2000, p. 189, |
| * on Tamil) |
| * <p> |
| * Unlike reciprocals, the two parts of a distributive pronoun cannot be considered as two full, |
| * independent NPs. In "awar/1 awar/2", only "awar/2" is case marked; "awar/1" is its citation form. Also, |
| * the two parts cannot be separated by intervening material (cf. English "one another"). (Jayaseelan |
| * 2000, p. 149, on Malayalam) |
| * <p> |
| * (K.A. Jayaseelan, 2000, Lexical anaphors and pronouns in Malayalam, In: Barbara C. Lust, Kashi Wali, |
| * James W. Gair, K.V.Subharao (eds.), Lexical Anaphors and Pronouns in Selected South Asian Languages. A |
| * Principled Typology, Mouton de Gruyter, Berlin, p. 113-168) (E. Annamalai, 2000, Lexical anaphors and |
| * pronouns in Tamil, , In: Barbara C. Lust, Kashi Wali, James W. Gair, K.V.Subharao (eds.), Lexical |
| * Anaphors and Pronouns in Selected South Asian Languages. A Principled Typology, Mouton de Gruyter, |
| * Berlin, p. 169-216) |
| */ |
| DistributivePronoun(Pronoun), |
| /** |
| * An indefinite pronoun is a pronoun that belongs to a class whose members indicate indefinite reference. |
| * Examples in English are "anybody", "one", "somebody". <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnIndefinitePronoun.htm 19.09.06) |
| */ |
| IndefinitePronoun(Pronoun), |
| /** |
| * In the Russian MTE v4 specs, Pronoun/Type="nonspecific" marks the following Russian words: весь 'all', |
| * всякий 'any, every', сам 'oneself', самый 'the very', каждый 'every, each', иной 'other', любой 'any', |
| * другой 'other'. The name "nonspecific" follows Halliday (1985, Section 6.2.1.1). (MTE v4) |
| * <p> |
| * A nonspecific pronoun refers to an unidentified or general entity (e.g., "I saw *someone*", |
| * "I saw *everyone*"). A nonspecific pronoun is not, therefore, a personal pronoun, but an indefinite |
| * one. (Andrews 2003). |
| * <p> |
| * Andrews, Richard J. (2003), Introduction to Classical Nahuatl. University of Oklahoma Press. Halliday, |
| * M.A.K. (1985), An introduction to Functional Grammar, London: Edward Arnold <br> |
| * (http://purl.org/olia/mte/multext-east.owl#NonspecificPronoun) |
| */ |
| NonspecificPronoun(IndefinitePronoun), |
| /** |
| * Pronoun lacking person referent. (Gil Francopoulo; http://www.isocat.org/datcat/DC-1426) |
| * <p> |
| * More precisely, a form of pronoun that denotes the absence of a concrete or specific referent, e.g., |
| * German "man". |
| * <p> |
| * As opposed to IndefinitePronoun, this referent is not just discourse-new, but generic or hypothetical. |
| */ |
| ImpersonalPronoun(IndefinitePronoun), |
| /** |
| * Pronoun used in a context of a negation or for expressing a negation. <br> |
| * (http://www.isocat.org/datcat/DC-1925) |
| */ |
| NegativePronoun(IndefinitePronoun), |
| /** |
| * A Locative pronoun is a pronoun, which locates the object of a noun or place of anything. |
| * |
| * <pre> |
| * ་ ན་ གས་ ང་ ་ ག། |
| * Nâ[LP] PhÜntsho'ling-lu ShÔ |
| * 'Come here at Phuntsholing' |
| * </pre> |
| * |
| * <br> |
| * (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) |
| */ |
| LocativePronoun(Pronoun), |
| /** |
| * In Eagles personal and reflexive pronouns are brought together as a single value Pers./Refl. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node17.html#recp 19.09.06) |
| */ |
| PersReflPronoun(Pronoun), |
| /** |
| * The Estonian determinal pronouns _ise_, _end(a)_ `(one)self'." combine aspects of emphatic pronouns and |
| * reflexive pronouns. It could also be described as an intensifier that is formally identical with the |
| * reflexive pronoun or as an emphatic reflexive pronoun. (Ivan A. Derzhanski, Heiki-Jaan Kaalep, |
| * http://purl.org/olia/mte/multext-east.owl#DeterminalPronoun; |
| * <p> |
| * Insa Gülzow (2006), The acquisition of intensifiers: Emphatic reflexives in English and German child |
| * language, Mouton de Gruyter, Berlin, p. 258) |
| */ |
| DeterminalPronoun(PersReflPronoun), |
| /** |
| * A FirstPersonPronoun refers to the speaker, or to both the speaker and referents grouped with the |
| * speaker.<br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsFirstPersonDeixis.htm 19.09.06) |
| */ |
| FirstPersonPronoun(PersReflPronoun), |
| /** |
| * A personal pronoun is a pronoun that expresses a distinction of person deixis. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPersonalPronoun.htm 19.09.06) |
| */ |
| PersonalPronoun(PersReflPronoun), |
| /** |
| * *|An asterisk represents a zero pronoun; it may need to be deleted. ... is used to represent the empty |
| * subject of gerunds, imperatives and to-infinitive clauses. (Santorini 1991) |
| * <p> |
| * (NP *) â ´ arbitrary PRO, controlled PRO, and trace of A-movement (Bies et al. 1995) |
| */ |
| ZeroPronoun(PersonalPronoun), |
| /** |
| * Personnal pronoun that is affixed. (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2221) |
| */ |
| AffixedPersonalPronoun(PersonalPronoun), |
| /** |
| * Personal pronoun that can occupy the position after a preposition and/or reinforce a weak personal |
| * pronoun. (Eagles; http://www.isocat.org/datcat/DC-1390) |
| */ |
| StrongPersonalPronoun(PersonalPronoun), |
| /** |
| * Personal pronoun that cannot occupy the position after a preposition and/or reinforce a strong personal |
| * pronoun.<br> |
| * (http://www.isocat.org/datcat/DC-1414) |
| */ |
| WeakPersonalPronoun(PersonalPronoun), |
| /** |
| * A reciprocal pronoun is a pronoun that expresses a mutual feeling or action among the referents of a |
| * plural subject.<br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAReciprocalPronoun.htm 19.09.06) |
| */ |
| ReciprocalPronoun(PersReflPronoun), |
| /** |
| * A reflexive pronoun is a pronoun that has coreference with the subject. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAReflexivePronoun.htm 19.09.06) |
| */ |
| ReflexivePronoun(PersReflPronoun), |
| /** |
| * Second person deixis means deictic reference to a person or persons identified as addressee. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsSecondPersonDeixis.htm 19.09.06) |
| */ |
| SecondPersonPronoun(PersReflPronoun), |
| /** |
| * In several European languages exist special forms of pronouns for polite or respectful reference, e.g. |
| * Dutch u and Spanish usted. The concept FamiliarSecondPersonPronoun applies to the corresponding |
| * unmarked forms for informal conversiation in such languages. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1p 19.09.06) |
| */ |
| FamiliarSecondPersonPronoun(SecondPersonPronoun), |
| /** |
| * In several European languages exist special forms of pronouns for polite or respectful reference, e.g. |
| * Dutch u and Spanish usted.<br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1p 19.09.06) |
| */ |
| PoliteSecondPersonPronoun(SecondPersonPronoun), |
| /** |
| * Third person reference is a deictic reference to a referent(s) not identified as the speaker or |
| * addressee.<br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsThirdPersonDeixis.htm 19.09.06) |
| */ |
| ThirdPersonPronoun(PersReflPronoun), |
| /** |
| * A possessive pronoun is a pronoun that expresses relationships like ownership, such as kinship, and |
| * other forms of association. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPossessivePronoun.htm 19.09.06) |
| */ |
| PossessivePronoun(Pronoun), |
| /** |
| * A possessive determiner is a part of speech that modifies a noun by attributing ownership to someone or |
| * something.<br> |
| * (http://en.wikipedia.org/wiki/Possessive_adjective 19.09.06) |
| */ |
| PossessiveDeterminer(AttributivePronoun, PossessivePronoun), |
| /** |
| * Attributive possessive pronoun form of the reflexive pronoun, e.g., Russian свой: |
| * <p> |
| * Обама на свой день рождения угощал гостей стейками и хот-догами. Obama on his day of.birth entertained |
| * guests with.steaks and hot.dogs |
| * "On his birthday, Obama entertained his guests with steaks and hot dogs." <br> |
| * (http://ua.rian.ru/world_news/20110805/78815136.html) |
| * <p> |
| * The antecedent of a possessive reflexive is not determined by its gender, but by its syntactic |
| * prominence. |
| */ |
| ReflexivePossessiveDeterminer(ReflexiveDeterminer, PossessiveDeterminer), |
| /** |
| * non-attributive pronoun |
| */ |
| SubstitutivePronoun(Pronoun), |
| /** |
| * @deprecated to be replaced with InterrogativePronoun or #RelativePronoun |
| */ |
| @Deprecated |
| WHPronoun(Pronoun), |
| /** |
| * An exclamative pronoun is a word which marks an exclamation. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnExclamative.htm 19.09.06) |
| */ |
| ExclamatoryPronoun(WHPronoun), |
| /** |
| * A interrogative pronoun is a pro-form that is used in questions in place of the item questioned for. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnInterrogativeProForm.htm 19.09.06) |
| */ |
| InterrogativePronoun(WHPronoun), |
| /** |
| * A relative pronoun is a pronoun that marks a relative clause, functions grammatically within the |
| * relative clause, and is coreferential to the word modified by the relative clause. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsARelativePronoun.htm 19.09.06) |
| */ |
| RelativePronoun(WHPronoun), |
| /** |
| * pronoun that have reference to something characterized by allusions. (MIRACL & LSCA; |
| * http://www.isocat.org/datcat/DC-2223) |
| * <p> |
| * an invariable pronoun expressing a specific intention by means of unclear term (Khemakhem Aida, |
| * 2010-05-10 via isocat-morpho@loria.fr) |
| * <p> |
| * examples from Arabic (Monica Monachini 2010-05-06 via isocat-morpho@loria.fr): "kam nahaituhu" (how |
| * often I forbade him, Hans Wehr), "baas Saar `amra `ashr isniin, gam (= kam) yriid paysikil" (He just |
| * turned ten, and here [how] he wants a bicycle, Georgetown University Iraqi Arabic-English Dictionary), |
| * "gam (= kam) yurguS imnil-faraH" ([how] he jumped for joy, Georgetown University Iraqi Arabic-English |
| * Dictionary) |
| */ |
| AllusivePronoun(Pronoun), |
| /** |
| * conditional pronoun (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2222) |
| */ |
| ConditionalPronoun(Pronoun), |
| /** |
| * Pronoun marked to show its importance.<br> |
| * (http://www.isocat.org/datcat/DC-1941) |
| */ |
| EmphaticPronoun(Pronoun), |
| /** |
| * Punctuation that is more important than a secondary punctuation with regards to sentence splitting in a |
| * text.<br> |
| * (http://www.isocat.org/datcat/DC-2075) |
| */ |
| MainPunctuation(LexicalCategory.Punctuation), |
| /** |
| * SentenceFinalPunctuation are . ? !.<br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node17.html#recv 19.09.06) |
| */ |
| SentenceFinalPunctuation(MainPunctuation), |
| /** |
| * Sign used to express a question.<br> |
| * (http://www.isocat.org/datcat/DC-1444) |
| */ |
| QuestionMark(SentenceFinalPunctuation), |
| /** |
| * Sign (.) used to expresses the end of a sentence or an abbreviation. <br> |
| * (http://www.isocat.org/datcat/DC-1445) |
| */ |
| Point(SentenceFinalPunctuation), |
| /** |
| * Special sign (!) usually used in writing to mark exclamation.<br> |
| * (http://www.isocat.org/datcat/DC-1441) |
| */ |
| ExclamativePoint(MainPunctuation), |
| /** |
| * Punctuation used when the sentence is interrogative.<br> |
| * (http://www.isocat.org/datcat/DC-2087) |
| */ |
| InterrogativePunctuation(MainPunctuation), |
| /** |
| * Punctuation that is not very important with regards to sentence splitting in a text. <br> |
| * (http://www.isocat.org/datcat/DC-2076) |
| */ |
| SecondaryPunctuation(LexicalCategory.Punctuation), |
| /** |
| * Parenthetical elements are dominated by a node labeled PRN. Punctuation marks that set off a |
| * parenthetical (i.e., commas, dashes, parentheses (-LRB- and -RRB-)) are contained within the PRN node. |
| * Use of PRN is determined ultimately by individual annotator intuition, though the presence of dashes or |
| * parentheses strongly suggests a parenthetical. (Bies et al. 1995) |
| */ |
| ParentheticalPunctuation(SecondaryPunctuation), |
| /** |
| * Beginning of a paired punctuation.<br> |
| * (http://www.isocat.org/datcat/DC-2078) |
| */ |
| LeftParentheticalPunctuation(ParentheticalPunctuation), |
| /** |
| * < LAB* Left angle bracket (Santorini 1991) |
| */ |
| OpenAngleBracket(LeftParentheticalPunctuation), |
| /** |
| * [ LSB* Left square bracket (Santorini 1991) |
| */ |
| OpenSquareBracket(LeftParentheticalPunctuation), |
| /** |
| * Inverted comma.<br> |
| * (http://www.isocat.org/datcat/DC-1443) |
| */ |
| InvertedComma(LeftParentheticalPunctuation), |
| /** |
| * Punctuation used in certain languages at the beginning of an interrogative sentence. <br> |
| * (http://www.isocat.org/datcat/DC-2088) |
| */ |
| InvertedQuestionMark(LeftParentheticalPunctuation), |
| /** |
| * Punctuation that is represented graphically as [<br> |
| * (http://www.isocat.org/datcat/DC-2082) |
| */ |
| OpenBracket(LeftParentheticalPunctuation), |
| /** |
| * Punctuation that is graphically represented as {<br> |
| * (http://www.isocat.org/datcat/DC-2084) |
| */ |
| OpenCurlyBracket(LeftParentheticalPunctuation), |
| /** |
| * Beginning of a pair of parenthesis.<br> |
| * (http://www.isocat.org/datcat/DC-1442) |
| */ |
| OpenParenthesis(LeftParentheticalPunctuation), |
| /** |
| * End of a paired punctuation.<br> |
| * (http://www.isocat.org/datcat/DC-2079) |
| * |
| * RightParentheticalPunctuation is a punctuation mark which concludes a constituent whose the opening is |
| * marked by a LeftParentheticalPunctuation, e.g. ), ] and Spanish ?. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node17.html#recv 19.09.06) |
| */ |
| RightParentheticalPunctuation(ParentheticalPunctuation), |
| /** |
| * > RAB* Right angle bracket (Santorini 1991) |
| */ |
| CloseAngleBracket(RightParentheticalPunctuation), |
| /** |
| * ] RSB* Right square bracket (Santorini 1991) |
| */ |
| CloseSquareBracket(RightParentheticalPunctuation), |
| /** |
| * Punctuation that is graphically represented by ]<br> |
| * (http://www.isocat.org/datcat/DC-2083) |
| */ |
| CloseBracket(RightParentheticalPunctuation), |
| /** |
| * Punctuation that is graphically represented by }<br> |
| * (http://www.isocat.org/datcat/DC-2085) |
| */ |
| CloseCurlyBracket(RightParentheticalPunctuation), |
| /** |
| * End of a parenthesis pair.<br> |
| * (http://www.isocat.org/datcat/DC-1440) |
| */ |
| CloseParenthesis(RightParentheticalPunctuation), |
| /** |
| * SentenceMedialPunctuation are , ; : - .<br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node17.html#recv 19.09.06) |
| */ |
| SentenceMedialPunctuation(SecondaryPunctuation), |
| /** |
| * Sign with two vertical points that is used in writing and printing to introduce an explanation, example |
| * or quotation. (Gil Francopoulo; http://www.isocat.org/datcat/DC-1439) |
| */ |
| Colon(SentenceMedialPunctuation), |
| /** |
| * Mark (,) used in writing to show a short pause or to separate items in a list. (Longman DCE 2005; |
| * http://www.isocat.org/datcat/DC-1448) |
| */ |
| Comma(SentenceMedialPunctuation), |
| /** |
| * Punctuation that is graphically presented as "-".<br> |
| * (http://www.isocat.org/datcat/DC-2077) |
| */ |
| Hyphen(SentenceMedialPunctuation), |
| /** |
| * Sign (;) usually used to separate phrases.<br> |
| * (http://www.isocat.org/datcat/DC-1446) |
| */ |
| SemiColon(SentenceMedialPunctuation), |
| /** |
| * Sequence of three dots having the same meaning as "et cetera" (full form) or "etc" (abbreviated form). <br> |
| * (http://www.isocat.org/datcat/DC-1447) |
| */ |
| SuspensionPoints(SentenceMedialPunctuation), |
| /** |
| * Punctuation usually used to surround a quotation.<br> |
| * (http://www.isocat.org/datcat/DC-2081) |
| */ |
| Quote(SecondaryPunctuation), |
| /** |
| * quotation mark, closing |
| */ |
| CloseQuote(Quote), |
| /** |
| * quotation mark, opening |
| */ |
| OpenQuote(Quote), |
| /** |
| * The punctuation sign /<br> |
| * (http://www.isocat.org/datcat/DC-1437) |
| */ |
| Slash(SecondaryPunctuation), |
| /** |
| * Quantifiers that enforce dual agreement (i.e., as with the numeral "2"). |
| * <p> |
| * Some feminine and neuter body parts in Czech have preserved dual forms, and if the noun is dual, so are |
| * its attributes (adjectives, pronouns). So the agreement of the numeral 2 differs formally from 3-4 |
| * (Ivan A. Derzhanski, email 2010/06/16, http://purl.org/olia/mte/multext-east.owl#DualQuantifier) |
| * <p> |
| * Numeral/Class="definite", Numeral/Class="definite1", Numeral/Class="definite234" etc. refer to specific |
| * patterns of congruency with Slavic numerals that originate from the difference between Old Slavic |
| * singular (definite1), dual (definite2, definite234) and plural (definite). <br> |
| * (http://purl.org/olia/mte/multext-east.owl#DualQuantifier) |
| */ |
| DualQuantifier(LexicalCategory.Quantifier), |
| /** |
| * A numeral is a word, functioning most typically as an adjective or pronoun, that expresses a number, |
| * and relation to the number, such as one of the following: Quantity, Sequence, Frequency, Fraction. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsANumeral.htm 19.09.06) |
| */ |
| Numeral(LexicalCategory.Quantifier), |
| /** |
| * Bulgarian has Numeral/Form=approx(a), used for approximate numerals (десетина /about a ten/, стотина |
| * /about a hundred/) (Dimitrova et al. 2009, |
| * http://purl.org/olia/mte/multext-east.owl#ApproximateNumeral) |
| */ |
| ApproximateNumeral(Numeral), |
| /** |
| * A cardinal numeral is a numeral of the class whose members are considered basic in form, used in |
| * counting, and used in expressing how many objects are referred to. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsACardinalNumeral.htm 19.09.06) |
| */ |
| CardinalNumber(Numeral), |
| /** |
| * Numeral/Type="collect" (Romanian)<br/> |
| * In traditional Romanian grammars, expressions like amândoi "both", toţi trei "all three" are referred |
| * to as collective numerals. (MTE v4, http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral) |
| * <p> |
| * e.g., ambelor/ambii, ambilor/ambii, amânduror/amândoi, amândurora/amândoi, câteşipatru, tuspatru (ro, |
| * http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral) |
| * <p> |
| * e.g., czworga/czworo, czworgiem/czworo, czworgu/czworo, czworo/czworo, dwoje/dwoje, dwojga/dwoje, |
| * dwojgiem/dwoje, dwojgu/dwoje, jedenaścioro/jedenaścioro (pl, |
| * http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral) |
| * <p> |
| * e.g., dvadesetora/dvadesetoro, dvoja/dvoje, dvoje, dvoji/dvoje, dvojih/dvoje, dvojim/dvoje, oboje, |
| * tridesetora/tridesetoro, troja/troje (sr, http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral) |
| * <p> |
| * e.g., обата, обајцата, обете, шеесетминава/шеесетмина, шеесетминана/шеесетмина, |
| * шеесетмината/шеесетмина, шеснаесетминава/шеснаесетмина, шеснаесетминана/шеснаесетмина, |
| * шеснаесетмината/шеснаесетмина (mk, http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral) |
| */ |
| CollectiveNumeral(Numeral), |
| /** |
| * Nominal numbers are used to identify or refer the things. It does not show the quantity or rank. |
| * <p> |
| * Example: |
| * |
| * <pre> |
| * ངེ་གི་ འགལ་འཕིན་ ཨང་གངས་ འདི་ ༡༧༦༤༩༠༣༧ ཨིན། |
| * NGIGI DRUELTHRIN ANGDRANG 'DI 17649037 INN |
| * my mobile number is 17649037 be |
| * “ My mobile number is 17649037.” |
| * </pre> |
| * |
| * (Jurmey Rabgay, email Sep 20, 2010, http://purl.org/olia/dzongkha.owl#NominalNumber) |
| */ |
| NominalNumber(Numeral), |
| /** |
| * An ordinal number is a number belonging to a class whose members designate positions in a sequence, |
| * e.g. in English "First", "Second", "Third". <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAOrdinalNumeral.htm 19.09.06) |
| */ |
| OrdinalNumber(Numeral), |
| /** |
| * Numeral/Form="fractional" (Romanian)<br/> |
| * In traditional Romanian grammars, FractionalNumeral refers to expressions like treime-one third. (MTE |
| * v4, http://purl.org/olia/mte/multext-east.owl#FractalNumeral) |
| */ |
| Fraction(Numeral), |
| /** |
| * Quantifiers that enforce paucal agreement. In many Slavic languages, numerals between 2 and 4 (and some |
| * quantifiers) involve a specific agreement patterns that is different from that of smaller and greater |
| * numbers. In Russian, for example, genitive singular is requires. These numerals and quantifiers with |
| * the same characteristics are referred to here as "paucal quantifiers". (cf. David Pesetsky, |
| * http://www.uni-leipzig.de/~jtrommer/Harvard/pesetsky.pdf) |
| */ |
| PaucalQuantifier(LexicalCategory.Quantifier), |
| /** |
| * A PluralQuantifier is a Quantifier (or Numeral) that specifies a large multitude of entities. The |
| * agreement pattern of a plural quantifier is different from that or an singular quantifier, but as |
| * opposed to DualQuantifier and PaucalQuantifier, PluralQuantifier includes quantifiers that denote |
| * arbitrarily large sets of entities. (Chiarcos) The corresponding category in Czech, Polish and Slovak |
| * MTE v4 specs is Numeral/Class="definite", that refers to numerals larger than four. (MTE v4) |
| */ |
| PluralQuantifier(LexicalCategory.Quantifier), |
| /** |
| * A ProQuantifier is a quantifier derived from a pronominal element. ProQuantifiers thus partly |
| * characterized as pronouns (e.g., as pronominal adverbs) or quantifiers (e.g., "indefinite numeral" as |
| * in MTE v.4).<br> |
| * (http://purl.org/olia/mte/multext-east.owl#ProQuantifier) |
| */ |
| ProQuantifier(LexicalCategory.Quantifier, Pronoun), |
| /** |
| * In the Czech and Slovak MTE v4 specs, Numeral/Class="demonstrative" are items meaning `this many/much', |
| * etc. Strictly speaking, they are pronumerals (pro-quantifiers), but traditional descriptions don't |
| * recognise such a category, so they are described variously as pronouns (because they contain a |
| * demonstrative element) or as numerals (because their syntactic distribution is that of numerals, or |
| * very close)." (Ivan A Derzhanski, email 2010/06/11, |
| * http://purl.org/olia/mte/multext-east.owl#DemonstrativeQuantifier) |
| */ |
| DemonstrativeQuantifier(ProQuantifier), |
| /** |
| * In the Czech and Slovak MTE v4 specs, Numeral/Class="indefinite" are items meaning `several/some', etc. |
| * Strictly speaking, they are pronumerals (pro-quantifiers), but traditional descriptions don't recognise |
| * such a category, so they are described variously as pronouns or as numerals (because their syntactic |
| * distribution is that of numerals, or very close)." (Ivan A Derzhanski, email 2010/06/11, |
| * http://purl.org/olia/mte/multext-east.owl#IndefiniteQuantifier) |
| */ |
| IndefiniteQuantifier(ProQuantifier), |
| /** |
| * In the Czech and Slovak MTE v4 pecs, Numeral/Class="interrogative" are items meaning `how many/much', |
| * etc. Strictly speaking, they are pronumerals (pro-quantifiers), but traditional descriptions don't |
| * recognise such a category, so they are described variously as pronouns or as numerals (because their |
| * syntactic distribution is that of numerals, or very close)." (Ivan A Derzhanski, email 2010/06/11, |
| * http://purl.org/olia/mte/multext-east.owl#InterrogativeQuantifier) |
| */ |
| InterrogativeQuantifier(ProQuantifier), |
| /** |
| * In the Czech MTE v4 specs, Numeral/Class="relative" are items meaning `how many/much', `as many/much' |
| * etc. Strictly speaking, they are pronumerals (pro-quantifiers), but traditional descriptions don't |
| * recognise such a category, so they are described variously as pronouns or as numerals (because their |
| * syntactic distribution is that of numerals, or very close)." (Ivan A Derzhanski, email 2010/06/11, |
| * http://purl.org/olia/mte/multext-east.owl#RelativeQuantifier) |
| */ |
| RelativeQuantifier(ProQuantifier), |
| /** |
| * A singular quantifier is a quantifier or a numeral that specifies a single referent from a set. |
| * (Chiarcos) In Czech and Slovak MTE v4 specs, the corresponding category Numeral/Class="definite1" is |
| * applied to the numeral "one". (MTE v4) |
| */ |
| SingularQuantifier(LexicalCategory.Quantifier), |
| /** |
| * A Multiple Numeral serves to define a complex whole, with respect to the number of its parts, e.g., |
| * English "twofold", "twice" or "manyfold". Used in morphosyntactic descriptions of, e.g., Romanian, |
| * Slovak and Czech. (Joseph Ghostwick [1878], English language -- Grammar, Historical, London, Longmans, |
| * Green, and Co.; http://purl.org/olia/mte/multext-east.owl#MultipleNumeral) |
| */ |
| MultiplicativeNumeral(LexicalCategory.Quantifier), |
| /** |
| * Abbreviation (from Latin brevis "short") is strictly speaking a shorter form of a word, but more |
| * particularly, an abbreviation is a letter or group of letters, taken from a word or words, and employed |
| * to represent them for the sake of brevity. For example, the word "abbreviation" can be abbreviated as |
| * "abbr." or "abbrev."<br> |
| * (http://en.wikipedia.org/wiki/Abbreviation 19.09.06) |
| */ |
| Abbreviation(LexicalCategory.Residual), |
| /** |
| * Abbreviation/Syntactic_Type="pronominal" (Romanian), e.g., d-ta/dumneata, d-tale/dumitale, |
| * d-voastră/dumneavoastră, dv./dumneavoastră, dvs./dumneavoastră <br> |
| * (http://purl.org/olia/mte/multext-east.owl#Pronominal) |
| */ |
| AbbreviatedPronoun(Pronoun, Abbreviation), |
| /** |
| * An acronym is an abbreviation, such as NATO, laser, and ABC, written as the initial letter or letters |
| * of words, and pronounced on the basis of this abbreviated written form. Acronyms are used most often to |
| * abbreviate names of organizations and long or frequently referenced terms. <br> |
| * (http://en.wikipedia.org/wiki/Acronym 19.09.06) |
| */ |
| Acronym(LexicalCategory.Residual), |
| /** |
| * Date is a stretch of text that specifies a specific point in time and that is not further |
| * linguistically analysed. (Chiarcos) |
| */ |
| Date(LexicalCategory.Residual), |
| /** |
| * A foreign word is a text word which lies outside the traditionally accepted range of grammatical |
| * classes, it occurs quite commonly in many texts and very commonly in some. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node16.html#mr 19.09.06) |
| */ |
| Foreign(LexicalCategory.Residual), |
| /** |
| * A formula (mathematical formulae) is a text word which lies outside the traditionally accepted range of |
| * grammatical classes, it occurs quite commonly in many texts and very commonly in some. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node16.html#mr 19.09.06) |
| */ |
| Formula(LexicalCategory.Residual), |
| /** |
| * Introduced to account for Bullet http://www.isocat.org/datcat/DC-1438 |
| */ |
| LayoutElement(LexicalCategory.Residual), |
| /** |
| * LST — List marker. (Bies et al. 1995) |
| */ |
| ListMarker(LayoutElement), |
| /** |
| * |
| Sign used to mark an item in a list.<br> |
| * (http://www.isocat.org/datcat/DC-1438) |
| */ |
| Bullet(LayoutElement), |
| /** |
| * |
| graphical representation<br> |
| * (http://www.isocat.org/datcat/DC-2249) |
| */ |
| Image(LayoutElement), |
| /** |
| * In morphosyntactic annotation schemes, a symbol is a single graphical sign that occurs in a written |
| * text with a conventionalized meaning but that does not represent a phoneme (like ordinary characters), |
| * an orthogaphic sign (punctuation), or a number. (Christian Chiarcos) |
| * <p> |
| * Symbols such as alphabetic characters can vary for singular and plural (e.g. How many Ps are there in |
| * `psychopath'?), and are in this respect like common nouns. In some languages (e.g. Portuguese) such |
| * symbols also have gender.<br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node17.html#recr) |
| */ |
| Symbol(LexicalCategory.Residual), |
| /** |
| * a mis-typed word |
| */ |
| Typo(LexicalCategory.Residual), |
| /** |
| * adopted from Dzongkha tagset (Chungku et al. 2010). If its tradition of grammar description is |
| * influenced by the Indian, these case markers are variously described as case morphemes or as |
| * postpositions. Therefore introduced as a shorthand for Adposition or MorphologicalParticle |
| */ |
| CaseMarker(LexicalCategory.Unique), |
| /** |
| * A classifier is a word or affix that expresses the classification of a noun. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAClassifier.htm 19.09.06) |
| * <p> |
| * Classifiers are a very typical feature of sign languages. In some Asian languages, classifiers are used |
| * as particles to combine a noun with a numeral, e.g. chin. _san ge ren_ 'three pieces of people', 'three |
| * people' (Bußmann 2002, under Klassifikator) |
| * <p> |
| * Bharati et al. (2006, for Indian languages) group Classifiers together with Quantifiers and Numerals, |
| * but they do not provide a detailed characterization of this class. |
| * <p> |
| * Akshar Bharati, Dipti Misra Sharma, Lakshmi Bai, Rajeev Sangal (2006), AnnCorra : Annotating Corpora. |
| * Guidelines For POS And Chunk Annotation For Indian Languages, Tech. Rep., L anguage Technologies |
| * Research Centre IIIT, Hyderabad, version of 15-12-2006, http://ltrc.iiit.ac.in/tr031/posguidelines.pdf |
| */ |
| Classifier(LexicalCategory.Unique), |
| /** |
| * Generally, discourse markers are expressions or phrases of greeting, apologizing, thanking, short |
| * emotional utterances, and interjections. Their node label is DM. ... Typical discourse markers are: ja, |
| * nein, hallo, oh, aha, pst, nunja, gewiß, toll, nun ja, etc. (Telljohann et al. 2009, p. 136) |
| */ |
| DiscourseMarker(LexicalCategory.Unique), |
| /** |
| * For Hindi, words like 'bahuta', 'kama', etc. when intensifying adjectives or adverbs will be annotated |
| * as INTF. Example, h37. hEdarAbAda meM aMgUra bahuta_INTF acche milate hEM 'HyderabAd' 'in' 'grapes' |
| * 'very' 'good' 'available' 'are' “Very good grapes are available in Hyderabad” (Bharati et al. 2006) <br> |
| * Akshar Bharati, Dipti Misra Sharma, Lakshmi Bai, Rajeev Sangal (2006), AnnCorra : Annotating Corpora. |
| * Guidelines For POS And Chunk Annotation For Indian Languages, Tech. Rep., L anguage Technologies |
| * Research Centre IIIT, Hyderabad, version of 15-12-2006, http://ltrc.iiit.ac.in/tr031/posguidelines.pdf |
| */ |
| Intensifier(LexicalCategory.Unique), |
| /** |
| * The izāfat (pronounced as a shorter form of –ē–) is an enclitic of Persian origin which is used in |
| * Farsi and neighboring languages. In Urdu, it can be considered a preposition under certain |
| * circumstances: it links two nouns in a possessive relationship, although the phrase thus produced may |
| * often have a different meaning to a phrase produced with the native Urdu postposition kā. However, the |
| * izāfat may also join a noun to an adjective, in which case it is not so clearly accurate to describe it |
| * as a preposition parallel to the prepositions in European languages for which the EAGLES guidelines |
| * were compiled. A better way to treat izāfat is in the context of the Unique category of miscellaneous |
| * one-member wordclasses, discussed below. (Hardie 2003, http://purl.org/olia/emille.owl#Izafat) |
| */ |
| Izafat(LexicalCategory.Unique), |
| /** |
| * In Urdu, multiplicative numerals are formed by adding the suffix gunâ (Schmidt 1999, p. |
| * 260,http://purl.org/olia/emille.owl#MultiplicativeMarker) |
| */ |
| MultiplicativeMarker(LexicalCategory.Unique), |
| /** |
| * synonym of Unique, to be avoided because of its divergent definitions (Chiarcos) |
| */ |
| Particle(LexicalCategory.Unique), |
| /** |
| * Particle that serves to form adjective phrases, e.g., Urdu sā <br> |
| * (http://purl.org/olia/emille.owl#AdjectivalParticle) |
| */ |
| AdjectivalParticle(Particle), |
| /** |
| * Contrastive particle, e.g., (one of the uses of) Urdu tô: |
| * |
| * <pre> |
| * vo urdû parhê gâ |
| * "He will study Urdu." (simple statement) |
| * |
| * vo tô urdû parhê gâ |
| * "HE will study Urdu." (Contrast: the other students may not.) |
| * </pre> |
| * |
| * (Schmidt 1999, p. 232, see http://purl.org/olia/emille.owl#ContrastiveEmphaticParticle) |
| */ |
| ContrastiveParticle(Particle), |
| /** |
| * Emphatic particle, e.g., (one of the uses of) Urdu tô: |
| * |
| * <pre> |
| * vo urdû parhê gâ |
| * "He will study Urdu." (simple statement) |
| * |
| * vo urdû parhê gâ tô lêkin imtihân nahîm dê gâ |
| * "He will STUDY Urdu, OF COURSE, but he won't take the examination." |
| * |
| * <pre> |
| (Schmidt 1999, p. 232, see http://purl.org/olia/emille.owl#ContrastiveEmphaticParticle) |
| */ |
| EmphaticParticle(Particle, Intensifier), |
| /** |
| * adopted from EMILLE, http://purl.org/olia/emille.owl#ContrastiveEmphaticParticle, shorthand for |
| * ContrastiveParticle and EmphaticParticle |
| */ |
| ContrastiveEmphaticParticle(EmphaticParticle, ContrastiveParticle), |
| /** |
| * In Urdu, the exclusive emphatic particle hî emphasizes the preceding word and excludes something else |
| * (which may not be expressed). (Schmidt 1999, p.233, |
| * http://purl.org/olia/emille.owl#ExclusiveEmphaticParticle) <br> |
| * Compare with the inclusive emphatic particle bhî: |
| * |
| * <pre> |
| * maim *bhî* faisalâ karûm gâ |
| * "I'll *also* make a decision" |
| * |
| * maim *hî* faisalâ karûm gâ |
| * "*I'm the one who* will make the decision." |
| * </pre> |
| * |
| * (Schmidt 1999, p.237, http://purl.org/olia/emille.owl#InclusiveEmphaticParticle) |
| */ |
| ExclusiveEmphaticParticle(EmphaticParticle), |
| /** |
| * In Urdu, bhî is an emphatic particle meaning 'even'. In opposition to contrastive tô and exclusive hî, |
| * bhî is inclusive: |
| * |
| * <pre> |
| * maim *bhî* faisalâ karûm gâ |
| * "I'll *also* make a decision" |
| * |
| * maim *hî* faisalâ karûm gâ |
| * "*I'm the one who* will make the decision." |
| * </pre> |
| * |
| * (Schmidt 1999, p.237, http://purl.org/olia/emille.owl#InclusiveEmphaticParticle) |
| */ |
| InclusiveEmphaticParticle(EmphaticParticle), |
| /** |
| * English existential there is specified as a subtype of pronoun in MTE v4, i.e., Pronoun/Type="ex-there" <br> |
| * (http://purl.org/olia/mte/multext-east.owl#ExistentialThere) |
| */ |
| ExistentialParticle(Particle), |
| /** |
| * http://www.isocat.org/datcat/DC-1455 (preverbalParticleLmf) |
| */ |
| PreverbalParticle(Particle), |
| /** |
| * A verbal particle modifies the verb and carries information on the verb form (e.g., finiteness, tense |
| * and aspect). (Dimitrova et al. 2009, Dan Tufis, email 2010/06/09). |
| * |
| * In the Bulgarian MTE specs, Particle/Type=verbal(v) is used to form different type of verbal |
| * syntactical relationships, e.g. to create future tense (ще говориш), or particles like се, да. |
| * (Dimitrova et al. 2009) The Romanian MTE v4 specs provide a more fine-grained subclassification of |
| * (verbal) particles (MTE v4, http://purl.org/olia/mte/multext-east.owl#VerbalParticle) |
| */ |
| VerbalParticle(Particle), |
| /** |
| * In the Romanian MULTEXT-East scheme, a verbal particle with Particle/Type="aspect" modifies the verbs |
| * and carries information on the verb form, i.e., on its aspect (Dan Tufis, email 2010/06/09, |
| * http://purl.org/olia/mte/multext-east.owl#AspectParticle) |
| */ |
| AspectParticle(VerbalParticle), |
| /** |
| * A modality-marking adverb is a verbal particle that serves to indicate mood, aspect and/or tense (cf. |
| * Schmidt 1999). Note that this is not to be confused with the conventional meaning of "modal adverb" in |
| * the sense of "manner adverb" (cf. http://en.wiktionary.org/wiki/Category:English_modal_adverbs), hence |
| * the uncommon name. |
| * |
| * Ruth Laila Schmidt (1999) Urdu, an essential grammar, Routledge, London. |
| */ |
| ModalityMarkingAdverb(LexicalCategory.Adverb, VerbalParticle), |
| /** |
| * In the Romanian MULTEXT-East scheme, a verbal particle with Particle/Type="future" modifies the verbs |
| * and marks the verb as being subjunctive, e.g., s-/să, să (Dan Tufis, email 2010/06/09, |
| * http://purl.org/olia/mte/multext-east.owl#SubjunctiveParticle) |
| */ |
| SubjunctiveParticle(VerbalParticle), |
| /** |
| * Dzongkha has also a tense marker, which is not complicated like in other languages. It has got only six |
| * tense markers and can be used in a very simple and effective way. They are: ('Ni'+'Wong') for future, |
| * ('D'o'+'D'ä') for present and ('Ci'+'Yi') for past tense. |
| * |
| * <pre> |
| * ང་ ནངས་པ་ འ ་ ། |
| * Nga naba jo-ni[past tense] |
| * I tomorrow go-will-[past] |
| * 'I am going tomorrow' |
| * </pre> |
| * |
| * <br> |
| * (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) |
| */ |
| TenseMarkingParticle(VerbalParticle), |
| /** |
| * Particle used in order to express future.<br> |
| * (http://www.isocat.org/datcat/DC-1919) |
| */ |
| FutureParticle(TenseMarkingParticle), |
| /** |
| * E.g., the mediopassive (middle) voice marker se in the Portuguese EAGLES scheme. (Leech and Wilson |
| * 1996) |
| */ |
| VoiceParticle(VerbalParticle), |
| /** |
| * |
| Particle used to express infinitive.<br> |
| * (http://www.isocat.org/datcat/DC-1896) |
| */ |
| InfinitiveParticle(VerbalParticle), |
| /** |
| * |
| Particle used to compare.<br> |
| * (http://www.isocat.org/datcat/DC-1922) |
| */ |
| ComparativeParticle(Particle), |
| /** |
| * |
| conditional particule (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2230) |
| */ |
| ConditionalParticule(CoordinatingConjunction, Particle), |
| /** |
| * |
| particle for coordination (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2227) |
| */ |
| CoordinationParticle(Particle), |
| /** |
| * |
| distinctive particle (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2228) |
| */ |
| DistinctiveParticle(Particle), |
| /** |
| * |
| Particle used to express a question.<br> |
| * (http://www.isocat.org/datcat/DC-1921) |
| */ |
| InterrogativeParticle(Particle), |
| /** |
| * |
| Particle which functions as a modal.<br> |
| * (http://www.isocat.org/datcat/DC-1920) |
| */ |
| ModalParticle(Particle), |
| /** |
| * |
| Particle used to express negation. (Gil Francopoulo; http://www.isocat.org/datcat/DC-1894) |
| */ |
| NegativeParticle(Particle), |
| /** |
| * Particle used to express affirmation.<br> |
| * (http://www.isocat.org/datcat/DC-1918) |
| */ |
| AffirmativeParticle(Particle), |
| /** |
| * |
| Particle expressing ownship.<br> |
| * (http://www.isocat.org/datcat/DC-1895) |
| */ |
| PossessiveParticle(Particle), |
| /** |
| * relative particle (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2229) |
| */ |
| RelativeParticle(Particle), |
| /** |
| * |
| Particle expressing superlative degree. Superlative is the comparison between more than two entities |
| * and contrasts with comparative where only two entities are involved and positive where no comparison is |
| * implied. (Crystal 2003; http://www.isocat.org/datcat/DC-1923) |
| */ |
| SuperlativeParticle(Particle), |
| /** |
| * In Urdu, wālā can be added to substantives to derive nouns implying possession or general |
| * relationships, e.g., go-wāl, or go-wālā, s.m. cow-keeper, cow-herd (from go, 'cow'), or ghar-wālā, s.m. |
| * master or owner of the house (from ghar, 'house') (Plats 1884, cf. http://purl.org/olia/urdu.owl#Wala) |
| */ |
| PossessionMarker(LexicalCategory.Unique), |
| /** |
| * |
| Word which serves no grammatical function, but which fills up a sentence or gives emphasis. |
| * (www.southwestern.edu/~carlg/Latin_Web/glossary.html; http://www.isocat.org/datcat/DC-1283) |
| */ |
| Expletive(LexicalCategory.Unique), |
| /** |
| * |
| An expletive (also known as a dummy word) is a part of speech whose members have no meaning, but |
| * complete a sentence to make it grammatical [Crystal 1997, 127] <br> |
| * (http://purl.org/linguistics/gold/Expletive) |
| * <p> |
| * In European languages, expletives are pronouns. A verbal part of speech that |
| * "has no meaning, but complete a sentence to make it grammatical" is a copula (see AuxiliaryVerb). |
| */ |
| ExpletivePronoun(ThirdPersonPronoun, Expletive), |
| /** |
| * |
| Three different expletive usages [of the German expletive pronoun es] are traditionally distinguished: |
| * formal subject or object (expletive argument), correlate of an extraposed clausal argument (expletive |
| * correlate), and Vorfeld-es (structural expletive) (cf. (Eisenberg 1999 2001), (Pütz 1986)). ... |
| * <p> |
| * The formal subject obligatorily occurs with weather verbs, e.g. "Es regnet" and unpersonal or agentless |
| * constructions such as "Es gibt so eine Buchung" or "Es geht um populäre Unterhaltung." Some verbs |
| * optionally permit an expletive subject but also occur with referential subjects such as |
| * "Max/Es kopft an der Tür." A formal object is found in constructions like "jmd. legt es an auf etw." or |
| * "jmd. verdirbt es mit jmdm." In all examples mentioned, es functions as a grammatical argument without |
| * semantic contribution, i.e. it does not refer to a person, object, or event. (Telljohann et al. 2009, |
| * p.60f) |
| */ |
| ExpletiveArgument(ExpletivePronoun), |
| /** |
| * |
| Three different expletive usages [of the German expletive pronoun es] are traditionally distinguished: |
| * formal subject or object (expletive argument), correlate of an extraposed clausal argument (expletive |
| * correlate), and Vorfeld-es (structural expletive) (cf. (Eisenberg 1999 2001), (Pütz 1986)). (Telljohann |
| * et al. 2009, p.60) |
| * <p> |
| * Extraposed clausal arguments: |
| * "Aber [es] ist übertrieben zu sagen, damit bekäme die FU erst eine Identität." (Telljohann et al. 2009, |
| * p.62) |
| */ |
| ExpletiveCorrelate(ExpletivePronoun), |
| /** |
| * |
| Three different expletive usages [of the German expletive pronoun es] are traditionally distinguished: |
| * formal subject or object (expletive argument), correlate of an extraposed clausal argument (expletive |
| * correlate), and Vorfeld-es (structural expletive) (cf. (Eisenberg 1999 2001), (Pütz 1986)). (Telljohann |
| * et al. 2009, p.60) |
| * <p> |
| * In German, a purely structural dummy element ... occurs in Vorfeld position only and is not correlated |
| * with any argument of the clause. It does not agree with the verb which becomes evident if there is a |
| * plural subject in the Mittelfeld: |
| * <p> |
| * "es zahlen ihn die Völker, deren Menschenrechte angeblich verteidigt werden." |
| * <p> |
| * It is ungrammatical in the Mittelfeld, e.g. *". . . dass es ihn die Völker zahlen". |
| */ |
| StructuralExpletive(ExpletivePronoun), |
| /** |
| * |
| An auxiliary verb is a verb which accompanies the lexical verb of a verb phrase, and expresses |
| * grammatical distinctions not carried by the lexical verb, such as person, number, tense aspect, and |
| * voice.<br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnAuxiliaryVerb.htm 19.09.06) |
| * <p> |
| * Besides modal verbs ("semiauxiliary") and "strict" auxiliary verbs, also copulas are classified under |
| * auxiliary verbs here, as this is a praxis applied in practically every EAGLES-conformant |
| * morphosyntactic annotation scheme. |
| * <p> |
| * Part of speech referring to the set of verbs, subordinate to the main lexical verb which help to make |
| * distinction in mood, aspect, voice etc. (Crystal 2003; http://www.isocat.org/datcat/DC-1244) |
| */ |
| AuxiliaryVerb(LexicalCategory.Verb), |
| /** |
| * |
| A copula is an intransitivity verb which links a subject to a noun phrase, an adjective or an other |
| * constituent which expresses the predicate. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsACopula.htm 19.09.06) |
| */ |
| Copula(AuxiliaryVerb), |
| /** |
| * |
| Verb form that is usually used with another verb to express ideas such as possibilities, permission, or |
| * intention. (Gil Francopoulo; http://www.isocat.org/datcat/DC-1329) |
| * <p> |
| * A modal verb (also modal, modal auxiliary verb, modal auxiliary) is a type of auxiliary verb that is |
| * used to indicate modality. The use of auxiliary verbs to express modality is characteristic of Germanic |
| * languages.<br> |
| * (http://en.wikipedia.org/wiki/Modal_verb 19.09.06) |
| * <p> |
| * In addition to main and auxiliary verbs, it may be useful (e.g. in English) to recognise an |
| * intermediate category of semi-auxiliary for such verbs as be going to, have got to, ought to. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1v 20.09.06) |
| * <p> |
| * The auxiliaries in English subdivide into the primary verbs `be', `have', and `do', which can also |
| * function as main verbs, and the modal auxiliaries such as `can', `will', and `would', which are |
| * uninflected, and always function as auxiliaries. <br> |
| * (http://www.ilc.cnr.it/EAGLES96/morphsyn/node158.html#SECTION00054800000000000000) |
| */ |
| ModalVerb(AuxiliaryVerb), |
| /** |
| * |
| Non-modal, non-copular auxiliary verb. |
| */ |
| StrictAuxiliaryVerb(AuxiliaryVerb), |
| /** |
| * An auxiliary that marks exclusively aspect, e.g., in Urdu: |
| * <p> |
| * Auxiliaries: Based on the syntactic nature of Urdu, auxiliaries are divided into two categories. |
| * Aspectual auxiliaries always occur after main verb of the sentence. Tense auxiliaries are used to show |
| * the time of the action. They occurred at the end of the verb phrase (Sajjad 2007). |
| * <p> |
| * E.g., Urdu rahā, an auxiliary element is used to mark the durative aspect. (Hardie 2004, |
| * http://purl.org/olia/emille.owl#RahaAuxiliary) |
| */ |
| AspectMarkingAuxiliary(StrictAuxiliaryVerb), |
| /** |
| * An auxiliary that marks exclusively tense, e.g., in Urdu: |
| * <p> |
| * Auxiliaries: Based on the syntactic nature of Urdu, auxiliaries are divided into two categories. |
| * Aspectual auxiliaries always occur after main verb of the sentence. Tense auxiliaries are used to show |
| * the time of the action. They occurred at the end of the verb phrase. (Sajjad 2007). |
| * <p> |
| * In Urdu, the auxiliary gā indicates future tense when it follows a verb in the subjunctive form. <br> |
| * (http://purl.org/olia/emille.owl#GaAuxiliary) |
| */ |
| TenseMarkingAuxiliary(StrictAuxiliaryVerb), |
| /** |
| * |
| Verb used to link the subject of a sentence and its noun or adjective complement or complementing |
| * phrase in certain languages. This verb could be used also to form the passive voice. |
| * (www.wordreference.com/English/definition.asp?en=be -> 4); http://www.isocat.org/datcat/DC-1246) |
| */ |
| BeAuxiliary(StrictAuxiliaryVerb), |
| /** |
| * |
| The verb have as an auxiliary. |
| * (www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnAuxiliaryVerb.htm; |
| * http://www.isocat.org/datcat/DC-1299) |
| */ |
| HaveAuxiliary(StrictAuxiliaryVerb), |
| /** |
| * |
| A finite verb is a verb form that occurs in an independent clause, and is fully inflected according to |
| * the inflectional categories marked on verbs in the language. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAFiniteVerb.htm 19.09.06) |
| * <p> |
| * Property applied to a verb form that can occur on its own in an independent sentence. (Crystal 2003; |
| * http://www.isocat.org/datcat/DC-1287) |
| */ |
| FiniteVerb(LexicalCategory.Verb), |
| /** |
| * |
| A conditional verb is a verb form in many languages. It is used to express degrees of certainty or |
| * uncertainty and hypothesis about past, present, or future. Such forms often occur in conditional |
| * sentences.<br> |
| * (http://en.wikipedia.org/wiki/Conditional_mood 19.09.06) |
| */ |
| ConditionalVerb(FiniteVerb), |
| /** |
| * |
| An imperative verb is used to express commands, direct requests, and prohibitions. Often, direct use of |
| * the imperative mood may appear blunt or even rude, so it is often used with care. Example: "Paul, read |
| * that book".<br> |
| * (http://en.wikipedia.org/wiki/Grammatical_mood#Imperative_mood 19.09.06) |
| */ |
| ImperativeVerb(FiniteVerb), |
| /** |
| * |
| Indicative mood is used in factual statements. All intentions in speaking that a particular language |
| * does not put into another mood use the indicative. It is the most commonly used mood and is found in |
| * all languages.<br> |
| * (http://en.wikipedia.org/wiki/Grammatical_mood#Indicative_mood 19.09.06) |
| */ |
| IndicativeVerb(FiniteVerb), |
| /** |
| * |
| A subjunctive verb is typically used to expresses wishes, commands (in subordinate clauses), emotion, |
| * possibility, judgment, necessity, and statements that are contrary to fact at present. <br> |
| * (http://en.wikipedia.org/wiki/Subjunctive_mood 19.09.06) |
| */ |
| SubjunctiveVerb(FiniteVerb), |
| /** |
| * In linguistics, a light verb is a verb participating in complex predication that has little semantic |
| * content of its own, but provides through inflection some details on the event semantics, such as |
| * aspect, mood, or tense. The semantics of the compound, as well as its argument structure, are |
| * determined by the head or primary component of the compound, which may be a verb or noun (V+V or V+N |
| * compounds). Other names for "light verb" include: vector verb or explicator verb, emphasising its role |
| * within the compound; or thin verb or semantically weak verb, emphasising (as with "light") its lack of |
| * semantics. A "semantically weak" verb is not to be confused with a "weak verb" as in the Germanic weak |
| * inflection. Light verbs are similar to auxiliary verbs in some ways. |
| * <p> |
| * Most English light verbs occur in V+N forms sometimes called "stretched verbs": for example, take in |
| * take a nap, where the primary sense is provided by "nap", and "take" is the light verb. The light verbs |
| * most common in these constructions are also common in phrasal verbs. A verb which is "light" in one |
| * context may be "heavy" in another: as with "take" in I will take a book to read. |
| * <p> |
| * Examples in other languages include the Yiddish geb in geb a helf (literally give a help, "help"); the |
| * French faire in faire semblant (lit. make seeming, "pretend"); the Hindi nikal paRA (lit. leave fall, |
| * "start to leave"); and the bǎ construction in Chinese.[1] Some verbs are found in many such |
| * expressions; to reuse an earlier example, take is found in take a nap, take a shower, take a sip, take |
| * a bow, take turns, and so on. Light verbs are extremely common in Indo-Iranian languages, Japanese, and |
| * other languages in which verb compounding is a primary mechanism for marking aspectual distinctions. <br> |
| * (http://en.wikipedia.org/wiki/Light_verb) |
| */ |
| LightVerb(LexicalCategory.Verb), |
| /** |
| * Verb forms occurring on their own only in dependent clauses and lacking tense and mood contrasts. |
| * (adapted from Crystal 2003; http://www.isocat.org/datcat/DC-1332) |
| * <p> |
| * A non-finite verb is a verb that is not fully inflected for categories that are marked inflectionally |
| * in a language, such as the following: Tense, Aspect, Modality, Number, Person. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsANonfiniteVerb.htm 19.09.06) |
| */ |
| NonFiniteVerb(LexicalCategory.Verb), |
| /** |
| * property for a non-finite form of a verb other than the infinitive. <br> |
| * (http://www.isocat.org/datcat/DC-2243) |
| * <p> |
| * A gerund is a kind of verbal noun that exists in some languages. In today's English, gerunds are nouns |
| * built from a verb with an '-ing' suffix. They can be used as the subject of a sentence, an object, or |
| * an object of preposition. They can also be used to complement a subject. Often, gerunds exist |
| * side-by-side with nouns that come from the same root but the gerund and the common noun have different |
| * shades of meaning.<br> |
| * (http://en.wikipedia.org/wiki/Gerund, http://en.wikibooks.org/wiki/English:Gerund 19.09.06) |
| * <p> |
| * The term _gerund_ is ambiguous: with respect to Latin, in whose grammatical tradition it originates, it |
| * refers to a deverbal noun, and is needed in this function for Polish as well; in descriptions of some |
| * other languages, however, it has been used for an adverbial participle. The two meanings have nothing |
| * in common, except that the English _ing_-form can translate both. (Ivan A Derzhanski, email 2010/06/09) |
| * Here, it is assumed that Gerund refers only to deverbal nouns, cf. NominalNonfiniteVerb in the IIIT |
| * tagset<br> |
| * (http://purl.org/olia/iiit.owl#NominalNonFiniteVerb) |
| */ |
| Gerund(NonFiniteVerb), |
| /** |
| * An infinitive is the base form of a verb. It is unmarked for inflectional categories such as the |
| * following: Aspect, Modality, Number, Person and Tense. <br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnInfinitive.htm 19.09.06) |
| */ |
| Infinitive(NonFiniteVerb), |
| /** |
| * |
| A participle is a lexical item, derived from a verb that has some of the characteristics and functions |
| * of both verbs and adjectives. In English, participles may be used as adjectives, and in non-finite |
| * forms of verbs.<br> |
| * (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAParticiple.htm 19.09.06) |
| */ |
| Participle(NonFiniteVerb), |
| /** |
| * Adverb/Type="participle" is used in the Slovene MTE v4 specs, e.g., 'leže' / lying. Slovenian adverbial |
| * participles are, however, not attested for Resian. (MTE |
| * v4)(http://purl.org/olia/mte/multext-east.owl#AdverbialParticiple) |
| */ |
| AdverbialParticiple(LexicalCategory.Adverb, Participle), |
| /** |
| * [In Bengali, t]he Conditional Participle is widely used to convey |
| * "if a certain action [pertaining to the parent verb] is done,...". The logic is: "in the case or |
| * condition of a certain action being done". Being impersonal, without regard for the doer of the action |
| * that caused the condition, it is not declined to suit number or gender. If this doer is not defined in |
| * the Bengali condition clause but needs to be stated in a natural-sounding English translation, this is |
| * identified and drawn from the second clause. For example:- Student: Teaching Truth in Bengali |
| * <p> |
| * If you pay attention,* you will learn. manoyog kar-*le* tumi shikh-be. [or, If attention is paid] |
| * <p> |
| * <br> |
| * (http://www.jaspell.co.uk/bengalicourse2007/wb149study49.pdf) |
| */ |
| ConditionalParticiple(Participle), |
| /** |
| * Participle and hasTense some Past |
| */ |
| PastParticiple(Participle), |
| /** |
| * Participle and hasTense some Present |
| */ |
| PresentParticiple(Participle), |
| /** |
| * English verb forms ending in '-ing' that represent either Gerunds or Participles. |
| */ |
| Ing("ing", Gerund, Participle), |
| /** |
| * Adjective based on a verb.<br> |
| * (http://www.isocat.org/datcat/DC-1598) |
| */ |
| ParticipleAdjective(LexicalCategory.Adjective, Participle), |
| /** |
| * |
| Adjective based on a past participle.<br> |
| * (http://www.isocat.org/datcat/DC-1596) |
| */ |
| PastParticipleAdjective(ParticipleAdjective, PastParticiple), |
| /** |
| * |
| Adjective based on a present participle.<br> |
| * (http://www.isocat.org/datcat/DC-1597) |
| */ |
| PresentParticipleAdjective(ParticipleAdjective, PresentParticiple), |
| /** |
| * |
| Supine is a nonfinite form of motion verbs with functions similar to that of an infinitive (Angelika |
| * Adams) |
| */ |
| Supine(NonFiniteVerb), |
| /** |
| * A verbal noun is a noun formed directly as an inflexion of a verb or a verb stem, sharing at least in |
| * part its constructions. This term is applied especially to gerunds, and sometimes also to infinitives |
| * and supines.<br> |
| * (http://en.wikipedia.org/wiki/Verbal_noun 19.09.06) |
| */ |
| VerbalNoun(CommonNoun, NonFiniteVerb), |
| /** |
| * Main verb in contrast to a modal or an auxiliary.<br> |
| * (http://www.isocat.org/datcat/DC-1400) |
| */ |
| MainVerb(LexicalCategory.Verb), |
| /** |
| * An agentive verb marks the semantic role of agent or the doer of an action. |
| * <p> |
| * Example: |
| * |
| * <pre> |
| * ་ ་ ས་ ་ ་ བསད་ ག། |
| * Dorji-gi jele sänu |
| * 'Dorji killed the cat' |
| * </pre> |
| * |
| * <br> |
| * (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) |
| */ |
| AgentiveVerb(MainVerb), |
| /** |
| * It is a verb, which indicates a strong desire to achieve something, without the doer. |
| * |
| * <pre> |
| * དག་པ ་ ང་ ་ ་བར་ ག། |
| * dag-pai zhing-lu kewa shÔ |
| * 'May i be born in pure land' |
| * </pre> |
| * |
| * <br> |
| * (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) |
| */ |
| AspirationalVerb(MainVerb), |
| /** |
| * Dzongkha uses honorific forms: ན་བཟའ་/nam za/ (cloths) is the honorific form of the noun གོ་ |
| * ལ་/gola/(cloths), གསངས་/sung/(tell) the honorific form of the verb སབ་/lab/(tell). We opted to mark |
| * them by adding the tag NNH (honorific common noun) and VBH (honorific verb) to enable future research |
| * on this specific usage of Dzongkha language. A number of tags were added to the set, of which we |
| * describe four in more detail: two of the additional tags are subclasses of verbs: VBH (honorific verb |
| * form), and VBN which describes past participle forms, like, e.g. བངམ་/jun/(created), the past particle |
| * form of བང་/jung/(create). |
| */ |
| HonorificVerb(MainVerb), |
| /** |
| * (of a verb) having no logical subject. Usually in English the pronoun it is used in such cases as a |
| * grammatical subject, as for example in It is raining. (of a pronoun) not denoting a person |
| * (www.wordreference.com/English/definition.asp?en=impersonal; http://www.isocat.org/datcat/DC-1306) |
| */ |
| Impersonal(MainVerb), |
| /** |
| * A non-agentive verb is a type of verb, which indicates an action without the doer. |
| * <p> |
| * Example: ང་མ་ འ ར་ ས། 'lungma phur-dä 'A wind is blowing' <br> |
| * (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) |
| */ |
| NonAgentiveVerb(MainVerb), ; |
| static final String OLIA_NAMESPACE = "http://purl.org/olia/olia.owl#"; |
| |
| private final Set<LexicalCategory> categories; |
| private final Collection<Pos> parents; |
| private final UriRef uri; |
| |
| Pos(LexicalCategory category) { |
| this(null, category, (LexicalCategory) null); |
| } |
| |
| Pos(LexicalCategory category, LexicalCategory additional) { |
| this(null, category, additional); |
| } |
| |
| Pos(String name, LexicalCategory category, LexicalCategory additional) { |
| this.uri = new UriRef(OLIA_NAMESPACE + (name == null ? name() : name)); |
| categories = EnumSet.of(category); |
| if (additional != null) { |
| categories.add(additional); |
| } |
| parents = Collections.emptySet(); |
| } |
| |
| Pos(Pos... parent) { |
| this(null, null, parent); |
| } |
| |
| Pos(String name, Pos... parent) { |
| this(name, null, parent); |
| } |
| |
| Pos(LexicalCategory category, Pos... parent) { |
| this(null, category, parent); |
| } |
| |
| Pos(String name, LexicalCategory category, Pos... parent) { |
| this.uri = new UriRef(OLIA_NAMESPACE + (name == null ? name() : name)); |
| this.parents = parent == null || parent.length < 1 ? Collections.EMPTY_SET : Arrays.asList(parent); |
| categories = category == null ? EnumSet.noneOf(LexicalCategory.class) : EnumSet.of(category); |
| Set<Pos> toProcess = new HashSet<Pos>(parents); |
| while (!toProcess.isEmpty()) { |
| Iterator<Pos> it = toProcess.iterator(); |
| Pos p = it.next(); |
| it.remove(); |
| categories.addAll(p.categories); |
| toProcess.addAll(p.parents); |
| } |
| } |
| |
| public Set<LexicalCategory> categories() { |
| return categories; |
| } |
| |
| public boolean isParent() { |
| return parents.isEmpty(); |
| } |
| |
| public Collection<Pos> parents() { |
| return parents; |
| } |
| |
| public UriRef getUri() { |
| return uri; |
| } |
| |
| public Set<Pos> hierarchy() { |
| return transitiveClosureMap.get(this); |
| } |
| |
| @Override |
| public String toString() { |
| return String.format("olia:%s", |
| uri.getUnicodeString().substring(OLIA_NAMESPACE.length())); |
| } |
| |
| /** |
| * This is needed because one can not create EnumSet instances before the |
| * initialization of an Enum has finished.<p> |
| * To keep using the much faster {@link EnumSet} a static member initialised |
| * in an static {} block is used as a workaround. The {@link Tense#getTenses()} |
| * method does use this static member instead of a member variable |
| */ |
| private static final Map<Pos,Set<Pos>> transitiveClosureMap; |
| |
| static { |
| transitiveClosureMap = new EnumMap<Pos,Set<Pos>>(Pos.class); |
| for(Pos pos : Pos.values()){ |
| Set<Pos> parents = EnumSet.of(pos); |
| for(Pos posParent : pos.parents()){ |
| Set<Pos> transParents = transitiveClosureMap.get(posParent); |
| if(transParents != null){ |
| parents.addAll(transParents); |
| } else if(posParent != null){ |
| parents.add(posParent); |
| } // else no parent |
| } |
| transitiveClosureMap.put(pos, parents); |
| } |
| } |
| |
| } |