/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.stanbol.enhancer.nlp.pos; import java.util.Arrays; import java.util.Collection; import java.util.Collections; import java.util.EnumMap; import java.util.EnumSet; import java.util.HashSet; import java.util.Iterator; import java.util.List; import java.util.Map; import java.util.Set; import org.apache.clerezza.commons.rdf.IRI; import org.apache.stanbol.enhancer.nlp.morpho.Tense; import com.ibm.icu.impl.Punycode; /** * Enumeration over all POS (Part of Speach) categories as defined by the * MorphosyntacticCategory class hierarchy og the * Olia Ontology.
* The top-level morphosyntactic categories are not defined by this enum, but link * to the {@link LexicalCategory} enumeration. The multi-sub-class hierarchy of the * morphosyntactic categories is also reflected by this enumeration and accessible * via the
* ང་འ ་ ང ་ འ ག། * Shing-di rim du * 'The tree is tall' ** *
* ན་ ང་ ང་ ་ ལ་ ་ འ ་ ། * Nahing Nga chigyel-lu joyi * 'I went abroad last year' ** *
* Adjective/Type="possessive" are denominal, not pronominal expressions of possession (Ivan A Derzhanski, * email 2010/06/09). Therefore not to be confused with Pronoun/Type=adjectival(a) (Bulgarian only), for * words like умно /cleverly, wisely, sensibly/, which are derived from adjectives. (Dimitrova et al. * 2009) *
* e.g., Slovene dušikovima/dušikov, Marsovi/Marsov, *
* Slovak vojvodova/vojvodov, vojvodove/vojvodov, vojvodovej/vojvodov, vojvodovho/vojvodov, * vojvodovi/vojvodov, vojvodovmu/vojvodov, vojvodovo/vojvodov, vojvodovom/vojvodov, vojvodovou/vojvodov, *
* Serbian evroazijske/evroazijska, evroazijskih/evroazijski, Goldštajnov, govornikov, Jehovine/Jehovin, * malabarskom/malabarski, O'Brajenov, O'Brajenovog/O'Brajenov, oficirov, *
* Czech Riegrovými/Riegrův, Stradellovými/Stradellův, Tristanovou/Tristanův, Wagnerových/Wagnerův,
* Wagnerovým/Wagnerův, Weberovi/Weberův, Weberových/Weberův, Wertherovi/Wertherův, Winstonovi/Winstonův
* (http://purl.org/olia/mte/multext-east.owl#PossessiveAdjective)
*/
PossessiveAdjective(LexicalCategory.Adjective),
/**
*
A predicative adjective is one which functions as part of the predicate of a sentence. This means that
* it is linked to the noun by a verb, often a copula (such as to be).
* (http://en.wikipedia.org/wiki/Adjective 18.09.06)
*/
PredicativeAdjective(LexicalCategory.Adjective),
/**
* Relative adjectives express similarity or a comparison. (Schmidt 1999, p.218,
* http://purl.org/olia/emille.owl#RelativeAdjective)
*/
RelativeAdjective(LexicalCategory.Adjective),
/**
*
An adjective that modifies an implied, but not expressed, noun. When translating such an adjective into
* English, you must supply the missing noun. (www.southwestern.edu/~carlg/Latin_Web/glossary.html;
* http://www.isocat.org/datcat/DC-1394)
*
* (Chiarcos: this seems to pertain to nominalization)
*/
SubstantiveAdjective(LexicalCategory.Adjective),
/**
*
Adjective expressing a numeric ranking.
* (http://www.isocat.org/datcat/DC-1338)
*
* Cf. "second", "next", "last"
*
* @deprecated The DCR definition and this term are incorrect. "Ordinal adjective" entered ISOcat from
* MULTEXT-East, where it was originally applied to relational adjectives (Slovene, Resian,
* Ukrainian, Czech). "Ordinal adjective" is a mistranslation from Slovene _vrstni pridevniki_
* that should be properly rendered in English as "relational adjective" (Derzhanski and
* Kotsyba 2009). However, the Macedonian MULTEXT v.4 guidelines use this category for ordinal
* numerals. Due to its inherent ambiguity, this category is to be avoided.
*/
OrdinalAdjective(LexicalCategory.Adjective),
/**
* Adjective used to qualify.
* (http://www.isocat.org/datcat/DC-1477)
*/
QualifierAdjective(LexicalCategory.Adjective, LexicalCategory.Quantifier),
/**
* The Slovene adjective expresses three main ideas: quality (qualitative adjectives, kakovostni
* pridevniki), relation (relational adjectives, vrstni pridevniki) and possession (possessive adjectives,
* svojilni pridevniki). Relational adjectives express type, class or numerical sequence of a noun. For
* instance: kemijska in fizikalna sprememba (chemical and physical change), fotografski aparat
* (photographic device (=camera)).
* (http://en.wikipedia.org/wiki/Slovene_grammar)
*/
RelationalAdjective(LexicalCategory.Adjective),
/**
* A circumposition is an adposition with a part before the noun phrase and a part after. It is much less
* common than prepositions or postpositions.
* (http://en.wikipedia.org/wiki/Circumposition 19.09.06)
*/
Circumposition(LexicalCategory.Adposition),
/**
* A postposition is an adposition that occurs after its complement.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPostposition.htm 19.09.06)
*/
Postposition(LexicalCategory.Adposition),
/**
* A preposition is an adposition that occurs before its complement.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPreposition.htm 19.09.06)
*/
Preposition(LexicalCategory.Adposition),
/**
* Preposition that is a aggregation of words
* (http://www.isocat.org/datcat/DC-1934)
*/
CompoundPreposition(Preposition),
/**
* Preposition that is the result of a morphological merge from at least two words.
* (http://www.isocat.org/datcat/DC-1901)
*/
FusedPreposition(Preposition),
/**
* Preposition that is a pure simple word in contrast with the notion of fused preposition.
* (http://www.isocat.org/datcat/DC-1900)
*/
SimplePreposition(Preposition),
/**
* An adjectival adverb is an adverb that is formally identical to an adjective.
* MULTEXT-East Adverb/Type="adjectival" (Serbian, Macedonian, Bulgarian)
* Bulgarian AdjectivalAdverbs have the same form as adjectives in Gender = neuter, Person = 3, Number =
* singular. (MTE v4, http://purl.org/olia/mte/multext-east.owl#AdjectivalAdverb)
*/
AdjectivalAdverb(LexicalCategory.Adverb),
/**
* Adverb/Type="causal" is used in the Hungarian MTE v4, but no examples are provided.
* (http://purl.org/olia/mte/multext-east.owl#CausalAdverb)
*
* @deprecated equivalent to Adverb and hasSemanticRole some CauseRole
*/
CausalAdverb(LexicalCategory.Adverb),
/**
* Any adverb which modifies an adjective, an adverb, a verbal particle, a preposition, a conjunction or a
* determiner is a degree adverb.
* (http://xlex.uni-muenster.de/Portal/MTPE/tagsetDescriptionEN.doc, p. 113, 8.1 Degree Adverbs 23.09.06)
*
* Also known as specifier adverb
* (http://www.unlweb.net/unlarium/dictionary/export_tagset.php)
*/
DegreeAdverb(LexicalCategory.Adverb),
/**
* equivalent to Adverb and hasSemanticRole some LocationRole
*/
LocationAdverb(LexicalCategory.Adverb),
/**
* equivalent to Adverb and hasSemanticRole some MannerRole
*/
MannerAdverb(LexicalCategory.Adverb),
/**
* Adverb/Type="modifier" is used in the English, Romanian and Hungarian MTE v4 specs. For Romanian,
* Adverb/Type="modifier" applies to adverbs which can have predicative role, that is they can govern a
* subordinate sentence (ex. Fireşte că o ştiu -- Certainly I know it). Here (for uniformity within a
* multilingual environment), they are squeezed into the modifier class. (MTE v4) e.g., better (en)
* (http://purl.org/olia/mte/multext-east.owl#ModifierAdverb)
*/
ModifierAdverb(LexicalCategory.Adverb),
/**
* Adverb/Type="negative" are used in the Serbian and Romanian MTE v4 specs, e.g., for Romanian nicăieri -
* nowhere, niciodată - never. (MTE v4)
* (http://purl.org/olia/mte/multext-east.owl#NegativeAdverb)
*/
NegativeAdverb(LexicalCategory.Adverb),
/**
* Pronominal adverbs substitute for a preposition (which is incorporated into them) and an NP, cf.
* English therefore lit. "for this (reason, ...)", German deswegen lit. "because of this (reason, ...)".
* (http://www.ilc.cnr.it/EAGLES96/elm_de/node235.html 21.09.06, examples Ch. Chiarcos)
*/
PronominalAdverb(LexicalCategory.Adverb),
/**
* Pronominal adverb derived from a demonstrative stem (Ch. Chiarcos)
*/
DemonstrativeAdverb(PronominalAdverb),
/**
* Adverb/Type="verbal" applies to adverbs derived from from verbs (verbal adverbs) in the Serbian,
* Macedonian and Hungarian MTE v4 specs. Macedonian verbal adverbs (gerunds) like odejkji are thus not
* considered as verbal forms, but as Adverb/Type="verbal". (MTE v4)
* (http://purl.org/olia/mte/multext-east.owl#VerbalAdverb)
*/
VerbalAdverb(LexicalCategory.Adverb),
/**
* Adverb that serves to express interrogativity, exclamation or that serves to link a subordinate clause
* to the matrix clause. (Ch. Chiarcos)
*/
WHTypeAdverbs(LexicalCategory.Adverb),
/**
* An ExclamatoryAdverb seves to express exclamation, cf. how in "How well everyone played!"
*
* Exclamative sentences or exclamatives An exclamatory sentence or exclamation is generally a more
* emphatic form of statement, in particular, they are used are used to express strong feelings (Latin
* exclamare : "to call out, to cry out").
* (http://english.unitecnology.ac.nz/resources/resources/exp_lang/sentence.html 07.05.07,
* http://en.wikipedia.org/wiki/Sentence_(linguistics) 07.05.07)
*/
ExclamatoryAdverb(WHTypeAdverbs),
/**
* Interrogative adverbs are used to introduce questions, e.g. "When are you coming?" (Angelika Adam)
*/
InterrogativeAdverb(WHTypeAdverbs),
/**
* The value relative is used for adverbs in clear relative cases as in: "The place 'where' I met you.",
* "The reason 'why' I did it."
* (http://www.ilc.cnr.it/EAGLES96/pub/eagles/lexicons/elm_en.ps.gz, p.33, 07.05.07)
*/
RelativeAdverb(WHTypeAdverbs),
/**
* Multi-word conjunction
*
* Besides the usual and, or, but, etc., certain prepositions and subordinating conjunctions can be used
* as coordinating conjunctions. Multi-word coordinating conjunctions are labeled CONJP (see section 7
* [Coordination]). ... CONJP — Conjunction Phrase. Used to mark certain “multi-word” conjunctions, such
* as as well as, instead of. (Bies et al. 1995)
*/
ConjunctionPhrase(LexicalCategory.Conjuction),
/**
* Coordinating conjunctions, also called coordinators, are conjunctions that join two items of equal
* syntactic importance.
* (http://en.wikipedia.org/wiki/Grammatical_conjunction 19.09.06)
*/
CoordinatingConjunction(LexicalCategory.Conjuction),
/**
* When the same word is also placed before the first conjunct, as in French "ou...ou...", the former
* occurrence is given the Correlative value and the latter the Simple value.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1av 17.11.06)
*
* Conjunction/Coord_Type="correlat" (Romanian). In Romanian, there are three kinds of conjunctions
* depending on their usage: as such or together with other conjunctions or adverbs: (1) simple, between
* conjuncts: Ion ori Maria (John or Mary); (2) repetitive, before each conjunct: fie Ion fie Maria fie...
* (either John or Mary or...) (3) correlative, before a conjoined phrase, it requires specific
* coordinators between conjuncts: atât mama cât şi tata (both mother and father). (MTE v4,
* http://purl.org/olia/mte/multext-east.owl#CorrelativeCoordinatingConjunction)
*/
CorrelativeCoordinatingConjunction(CoordinatingConjunction),
/**
* When two distinct words occur, as in German "weder...noch...", then the first is given the Initial
* value.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1av 17.11.06)
*/
InitialCoordinatingConjunction(CoordinatingConjunction),
/**
* When two distinct words occur, as in German weder...noch..., then the second is given the Non-initial
* value.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1av 17.11.06)
*/
NonInitialCoordinatingConjunction(CoordinatingConjunction),
/**
* Conjunction/Coord_Type="repetit" (Romanian). In Romanian, there are three kinds of conjunctions
* depending on their usage: as such or together with other conjunctions or adverbs: (1) simple, between
* conjuncts: Ion ori Maria (John or Mary); (2) repetitive, before each conjunct: fie Ion fie Maria fie...
* (either John or Mary or...) (3) correlative, before a conjoined phrase, it requires specific
* coordinators between conjuncts: atât mama cât şi tata (both mother and father). (MTE v4,
* http://purl.org/olia/mte/multext-east.owl#RepetitiveCoordinatingConjunction)
*/
RepetitiveCoordinatingConjunction(CoordinatingConjunction),
/**
* Simple applies to the regular type of coordinator occurring between conjuncts: German und, for example.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1av 17.11.06)
*
* In the Romanian MTE v4 specs, Conjunction/Coord_Type="simple" is defined in contrast to repetitive and
* correlative coordinating conjunctions. In Romanian, there are three kinds of conjunctions depending on
* their usage: as such or together with other conjunctions or adverbs: (1) simple, between conjuncts: Ion
* ori Maria (John or Mary); (2) repetitive, before each conjunct: fie Ion fie Maria fie... (either John
* or Mary or...) (3) correlative, before a conjoined phrase, it requires specific coordinators between
* conjuncts: atât mama cât şi tata (both mother and father). (MTE v4), e.g., aşa_că, va_să_zică (ro)
* (http://purl.org/olia/mte/multext-east.owl#SimpleCoordinatingConjunction)
*/
SimpleCoordinatingConjunction(CoordinatingConjunction),
/**
* Subordinating conjunctions, also called subordinators, are conjunctions that introduce a dependent
* clause.
* (http://en.wikipedia.org/wiki/Grammatical_conjunction 19.09.06)
*/
SubordinatingConjunction(LexicalCategory.Conjuction),
/**
*
For example, in German the subordinating conjunction "als" is followed by various kinds of comparative
* clause (including clauses without finite verbs).
* (http://www.ilc.cnr.it/EAGLES96/annotate/node19.html#oav2u 17.11.06)
*/
SubordinatingConjunctionWithComparative(SubordinatingConjunction),
/**
* For example, in German the subordinating conjunction "weil" introduces a clause with a finite verb.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node19.html#oav2u 17.11.06)
*/
SubordinatingConjunctionWithFiniteClause(SubordinatingConjunction),
/**
* For example, in German the subordinating conjunction "ohne" ("zu"...) is followed by an infinitive.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node19.html#oav2u 17.11.06)
*/
SubordinatingConjunctionWithInfinite(SubordinatingConjunction),
/**
* Conjunction/Sub_Type="negative" (Romanian, Serbian, Russian) In Romanian, each conjunction requires
* another mood, so that the diversity may be controlled by subcategorisation rules. The attribute
* Sub_Type distinguishes among the positive and negative conjunctions, providing means to control verbal
* double negation, (as in case of the negative pronouns, determiners and adverbs): nici NU am venit,
* nimeni NU vorbeşte, nici_un tren N-a trecut, nicăieri N-am văzut (MTE v4,
* http://purl.org/olia/mte/multext-east.owl#NegativeSubordinatingConjunction)
*/
SubordinatingConjunctionWithNegation(SubordinatingConjunction),
/**
* Conjunction/Sub_Type="negative" (Romanian, Serbian, Russian) In Romanian, each conjunction requires
* another mood, so that the diversity may be controlled by subcategorisation rules. The attribute
* Sub_Type distinguishes among the positive and negative conjunctions, providing means to control verbal
* double negation, (as in case of the negative pronouns, determiners and adverbs): nici NU am venit,
* nimeni NU vorbeşte, nici_un tren N-a trecut, nicăieri N-am văzut (MTE v4,
* http://purl.org/olia/mte/multext-east.owl#PositiveSubordinatingConjunction)
*/
SubordinatingConjunctionWithoutNegation(SubordinatingConjunction),
/**
* 0|Zero represents a zero complementizer (= subordinating conjunction); it may need to be deleted. The
* zero complementizer is generally the counterpart of the overt complementizer that. Example: Iâ ¹m
* sure 0 heâ ¹ll be here any minute. ...
*
* 0 stands in for overt subordinating conjunctions like that in tensed subordinate clauses, including
* relative clauses. So the relative clause the man I saw should be bracketed as follows: (NP (NP the man)
* (SBAR 0 (S (NP I) (VP saw) (NP T)))))
*
* (Santorini 1991)
*/
ZeroComplementizer(SubordinatingConjunction),
/**
*
An interjection is a form, typically brief, such as one syllable or word, which is used most often as
* an exclamation or part of an exclamation. It typically expresses an emotional reaction, often with
* respect to an accompanying sentence and may include a combination of sounds not otherwise found in the
* language, e.g. in English: psst; ugh; well, well
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnInterjection.htm 19.09.06)
*/
Interjection(LexicalCategory.Conjuction),
/**
* A common noun is a noun that signifies a non-specific member of a group.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsACommonNoun.htm 19.09.06)
*/
CommonNoun(LexicalCategory.Noun),
/**
* Dzongkha uses honorific forms: ན་བཟའ་/nam za/ (cloths) is the honorific form of the noun གོ་
* ལ་/gola/(cloths), གསངས་/sung/(tell) the honorific form of the verb སབ་/lab/(tell). We opted to mark
* them by adding the tag NNH (honorific common noun) and VBH (honorific verb) to enable future research
* on this specific usage of Dzongkha language. A number of tags were added to the set, of which we
* describe four in more detail: two of the additional tags are subclasses of verbs: VBH (honorific verb
* form), and VBN which describes past participle forms, like, e.g. བངམ་/jun/(created), the past particle
* form of བང་/jung/(create). (Chungku et al. 2010)
*
* A noun, which indicates respect for the person being addressed, e.g., Miwang Gel-poi Yab “A king's
* father” [Though father=Apa, but colloquially we say YAB in Dzongkha]
* (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf)
*/
HonorificCommonNoun(CommonNoun),
/**
* A title designates the function or the social status of an individual. Often, it accompanies a proper
* noun, but it can also be used in place of a proper noun (if the bearer of the title is contextually
* unambiguous). E.g. "The/Det German/Adj Chancellor/Title Angela/Name Merkel/Name said ..." can be used
* besides "the German Chancellor said ...". Accordingly, some schemes (e.g., Chungku et al. 2010, for
* Dzongkha) group titles together with proper names
* (http://purl.org/olia/dzongkha.owl#ParticularPersonNoun).
*
* However, if multiple people hold the same title, they can be referred to as a group, e.g., * "Since WWII, the politics of the German chancellors always followed ...", and in this usage, titles are * more comparable to common nouns. Functionally, titles are thus an intermediate category between * CommonNoun and ProperNoun (cf. also Mulkern 1996). *
* Titles do, however, share important characteristics with common nouns. In English, for example, titles * generally require a definite determiner (unlike proper nouns), even if unambiguous ("the pope"). They * are thus classified here as a subtype of CommonNoun. *
* (Ann E. Mulkern. The name of the game. In Jeanette Gundel and Thorstein Fretheim, editors. Reference * and Referent Accessibility: Pragmatics and Beyond. John Benjamins, Amsterdam and Philadelphia, 1996, * pages 235–250.) */ TitleNoun(CommonNoun), /** * Measuring units are frequently used with numerals. However, they have a different syntactic structure * than numerals (Sajjad 2007). *
* In European languages, Units are generally expressed as nouns, e.g., English
* "ten/Numeral kilogram/Unit". "Kilogram" can also be used as a common noun:
* "The kilogram is losing weight"
* (http://www.bbc.co.uk/news/science-environment-12276822)
*
* Hassan Sajjad (2007), Urdu Part of Speech Tagset, version 1.0.0.0, 07-12-2007, Center for research in * Urdu Language Processing. National University of Computer and Emerging Sciences, Lahore, Pakistan, * http://www.crulp.org/Downloads/langproc/UrduPOStagger/UrduPOStagset.pdf */ UnitNoun(CommonNoun), /** * NLOC Noun Location This is an entirely new tag introduced to cover an important phenomenon of Indian * Languages. Words like 'Age', 'upara', 'pahele', 'bAda', etc. are used in various ways in Hindi. *
* But we feel that these words are more like nouns as is evident from 3. and 4. above, and also if we * consider for examples, 'aage', 'upara', etc. as places which are in front, up, etc then we can tag them * as nouns. *
* But these are not pure nouns. They are nouns which indicate a location or time. These also function as * adverbs or prepositions in a context. So a new tag NLOC is introduced for such words. This tag will * cater to a finite set of such words. set: (Age, piche, upara, nIce, bAda, pahele) ("front", "behind", * "above", "below", "before") Such words if tagged according to their syntactic function, it will hamper * machine learning. So a single tag, NLOC has been devised for such words which indicate location and * time. *
* e.g., (upara, Age, pahele, bAda) (IIIT (2007), A Part of Speech Tagger for Indian Languages (POS
* tagger), Tagset developed at IIIT - Hyderabad after consultations with several institutions through two
* workshops. available under http://shiva.iiit.ac.in/SPSAL2007/iiit_tagset_guidelines.pdf)
*/
SpatiotemporalNoun(CommonNoun),
/**
* relation noun (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2226)
*/
RelationNoun(CommonNoun),
/**
*
A countable noun (also count noun) is a noun which can be modified by a numeral and occur in both
* singular and plural form, as well as co-occurring with quantificational determiners like every, each,
* several, most, etc..
* (http://en.wikipedia.org/wiki/Countable_noun 19.09.06)
*/
CountableNoun(LexicalCategory.Noun),
/**
* A mass noun (also uncountable noun or non-count noun) can't be modified by a numeral, occur in
* singular/plural or co-occur with the relevant kind of determiner.
* (http://en.wikipedia.org/wiki/Mass_noun 19.09.06)
*/
MassNoun(LexicalCategory.Noun),
/**
* Proper nouns (also called proper names) are the names of unique entities.
* (http://en.wikipedia.org/wiki/Noun 19.09.06)
*/
ProperNoun(LexicalCategory.Noun),
/**
* diminutive noun (MIRACL LSCA; http://www.isocat.org/datcat/DC-2225)
*/
DiminutiveNoun(LexicalCategory.Noun),
/**
* A noun which quantifies one or more things, regardless of subject and an object.
*
*
* ང་གིས་ བམོ་ ལ་ དང་ ཕད་ཅི། * NGAGI BUM 'NGA 'DA CHECI * I girl five with met * “I met with five girls.” ** * (Jurmey Rabgay, email Sep 20, 2010) */ NominalQuantifier(LexicalCategory.Noun, LexicalCategory.Quantifier), /** * noun of a voice
* (3) Iʼm looking for a deer. *
* In the specific reading there is a particular deer, say Bambi, that I am looking for. In the * non-specific reading I will be happy to find any deer. Von Heusinger (2002) likes the test in English * of inserting ʻcertainʼ after the ʻaʼ to fix the specific reading. In either reading of (3) a deer is * being introduced as a new discourse referent. This is opposed to ʻdefiniteʼ which requires a previous * pragmatic instantiation as in ʻIʼm looking for the deer.ʼ In English both the readings of (3) are * indefinite. In Klallam, the specific demonstratives are neither definite nor indefinite." *
* (Montler, Timothy. 2007. Klallam demonstratives. Papers ICSNL XLVII. The 42nd International Conference * on Salish and Neighbouring Language, pp. 409-425. University of British Columbia Working Papers in * Linguistics, Volume 20; on specific vs. nonspecific determiners in Klallam, a Salish language, * http://montler.net/papers/KlallamDemons.pdf) */ NonspecificDeterminer(Article), /** * "By ʻspecificʼ and ʻnon-specificʼ I intend the difference between the two readings of English * indefinites like (3): *
* (3) Iʼm looking for a deer. *
* In the specific reading there is a particular deer, say Bambi, that I am looking for. In the * non-specific reading I will be happy to find any deer. Von Heusinger (2002) likes the test in English * of inserting ʻcertainʼ after the ʻaʼ to fix the specific reading. In either reading of (3) a deer is * being introduced as a new discourse referent. This is opposed to ʻdefiniteʼ which requires a previous * pragmatic instantiation as in ʻIʼm looking for the deer.ʼ In English both the readings of (3) are * indefinite. In Klallam, the specific demonstratives are neither definite nor indefinite." *
* (Montler, Timothy. 2007. Klallam demonstratives. Papers ICSNL XLVII. The 42nd International Conference
* on Salish and Neighbouring Language, pp. 409-425. University of British Columbia Working Papers in
* Linguistics, Volume 20; on specific vs. nonspecific determiners in Klallam, a Salish language,
* http://montler.net/papers/KlallamDemons.pdf)
*/
SpecificArticle(Article),
/**
* Persian does have an article, but it marks specificity rather than definiteness. The Persian article is
* similar to the Balkan one (a clitic of pronominal origin that's written together with the word), except
* that it isn't exactly definite (you can even see it described as an indefinite article). (Ivan A.
* Derzhanski, p.c. 2010/06/18)
*/
CliticSpecificArticle(SpecificArticle),
/**
* Determiner/Type="emphatic" (Romanian)
*
* In Romanian, there are specific forms for the so-called emphatic determiner, which may accompany both a
* noun and a personal pronoun: fata însăşi (the girl herself), also ea însăşi (she herself). e.g.,
* însele/însumi, însemi/însumi, însene/însumi, însevă/însumi, înseşi/însumi, înseţi/însumi, însumi,
* însuşi/însumi, însuţi/însumi
* (http://purl.org/olia/mte/multext-east.owl#EmphaticDeterminer)
*/
EmphaticDeterminer(Determiner),
/**
* An indefinite determiner is a determiner that expresses a referent's indefinite number or amount, i.e.
* "some", "any", "many".
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAQuantifier.htm 22.09.06)
*
* Note that here, a separate top-level class Quantifier has been introduced that covers expressions of
* number and amount as *semantic* concepts. Plural indefinite determiners are thus to be modeled as
* IndefiniteDeteriner and Quantifier.
*/
IndefiniteDeterminer(Determiner),
/**
* Determiner/Type="negative" (Romanian)
* In Romanian the negative determiner is expressed by the unit nici + indefinite article (e.g. nici un,
* nici o). (MTE v4)
*
* e.g., nici-o/nici_un, nici_o/nici_un, nici_un, nici_unei/nici_un, nici_unii/nici_un, nici_unor/nici_un,
* nici_unui/nici_un
* (http://purl.org/olia/mte/multext-east.owl#NegativeDeterminer)
*/
NegativeDeterminer(IndefiniteDeterminer),
/**
* A partitive determiner indicates an indefinite quantity of a mass noun; there is no partitive article
* in English, though the words some or any often have that function. (Wilson and Leech 1996)
*/
PartitiveDeterminer(Determiner),
/**
* Determiner/Type="exceptional" is applied to the Persian uniquitive determiner تنها i.e., "the only"
* (MTE v4; Hamidreza Kobdani, email 2010/06/15,
* http://purl.org/olia/mte/multext-east.owl#UniquitiveDeterminer)
*/
UniquitiveDeterminer(Determiner),
/**
* @deprecated to be replaced by InterrogativeDeterminer or RelativeDeterminer
*/
WHDeterminer(Determiner),
/**
* A exclamatory determiner is used in combination with a Nominal Phrase in order to create an exclamation
* (a more emphatic form of statement), e.g. "What a lovely colour!", "What a wonderful day this is!"
* (http://www.ilc.cnr.it/EAGLES96/pub/eagles/lexicons/elm_en.ps.gz, p.27, 07.05.07;
* http://en.wikipedia.org/wiki/Sentence_(linguistics), 07.05.07)
*/
ExclamatoryDeterminer(WHDeterminer),
/**
* A interrogative is a function word used to introduce an interrogative clause. E.g. "which", "what",
* "whose" (interrogative possessive determiner) are interrogative determiner in English.
* (http://en.wikipedia.org/wiki/Interrogative_word 02.05.07)
*/
InterrogativeDeterminer(WHDeterminer),
/**
* The relative determiner describes a attributive relative pronoun. In German "wessen" in
* "Ich weiss nicht, wessen Auto das ist." or the English "whose" in "The man whose daughter became ill.".
*
* The relative determiner needs a noun to complete a NP (Nominal Phrase).
* (http://www.ilc.cnr.it/EAGLES96/pub/eagles/lexicons/elm_en.ps.gz, p.28, 07.05.07)
*/
RelativeDeterminer(WHDeterminer),
/**
* Determiner that refers to the same entity.
* (http://www.isocat.org/datcat/DC-1377)
*/
ReflexiveDeterminer(Determiner),
/**
* A pronoun is a pro-form which functions like a noun and substitutes for a noun or a noun-phrase. A
* language may have several classes of pronouns.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPronoun.htm 19.09.06)
*
* A pronominal is a phrase that functions as a pronoun
* (www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPronominal.htm;
* http://www.isocat.org/datcat/DC-1369)
*/
Pronoun(LexicalCategory.PronounOrDeterminer),
/**
* An attributive pronoun is a pronoun that modifies an NP.
*/
AttributivePronoun(Determiner, Pronoun),
/**
* Demonstratives are deictic expressions (they depend on an external frame of reference) which indicate
* entities a speaker refers to, and distinguishes those entities from others. Demonstratives are usually
* employed for spatial deixis (using the context of the physical surroundings), but in many languages
* they double as discourse deictics, referring not to concrete objects but to words, phrases and
* propositions mentioned in speech.
* (http://en.wikipedia.org/wiki/Demonstrative 19.09.06)
*/
DemonstrativeDeterminer(AttributivePronoun),
/**
* Demonstrative pronouns are deictic words (they depend on an external frame of reference). They indicate
* which entities a speaker refers to, and distinguishes those entities from others.
* (http://en.wikipedia.org/wiki/Demonstrative_pronoun 19.09.06)
*/
DemonstrativePronoun(Pronoun),
/**
* A pronoun, which classifies or differentiates(pronoun) by a single basis, like everybody; each;
* individual etc.
*
*
* འ ག་པ ་ ་ ར་ ག་ར་ ན་ ང་ ང་ཁ་ ས་ད ། * Drupai Miser Gara Enrung Dzongkha ShegÔ * 'Every Bhutanese must know Dzongkha' ** *
* Unlike reciprocals, the two parts of a distributive pronoun cannot be considered as two full, * independent NPs. In "awar/1 awar/2", only "awar/2" is case marked; "awar/1" is its citation form. Also, * the two parts cannot be separated by intervening material (cf. English "one another"). (Jayaseelan * 2000, p. 149, on Malayalam) *
* (K.A. Jayaseelan, 2000, Lexical anaphors and pronouns in Malayalam, In: Barbara C. Lust, Kashi Wali,
* James W. Gair, K.V.Subharao (eds.), Lexical Anaphors and Pronouns in Selected South Asian Languages. A
* Principled Typology, Mouton de Gruyter, Berlin, p. 113-168) (E. Annamalai, 2000, Lexical anaphors and
* pronouns in Tamil, , In: Barbara C. Lust, Kashi Wali, James W. Gair, K.V.Subharao (eds.), Lexical
* Anaphors and Pronouns in Selected South Asian Languages. A Principled Typology, Mouton de Gruyter,
* Berlin, p. 169-216)
*/
DistributivePronoun(Pronoun),
/**
* An indefinite pronoun is a pronoun that belongs to a class whose members indicate indefinite reference.
* Examples in English are "anybody", "one", "somebody".
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnIndefinitePronoun.htm 19.09.06)
*/
IndefinitePronoun(Pronoun),
/**
* In the Russian MTE v4 specs, Pronoun/Type="nonspecific" marks the following Russian words: весь 'all',
* всякий 'any, every', сам 'oneself', самый 'the very', каждый 'every, each', иной 'other', любой 'any',
* другой 'other'. The name "nonspecific" follows Halliday (1985, Section 6.2.1.1). (MTE v4)
*
* A nonspecific pronoun refers to an unidentified or general entity (e.g., "I saw *someone*", * "I saw *everyone*"). A nonspecific pronoun is not, therefore, a personal pronoun, but an indefinite * one. (Andrews 2003). *
* Andrews, Richard J. (2003), Introduction to Classical Nahuatl. University of Oklahoma Press. Halliday,
* M.A.K. (1985), An introduction to Functional Grammar, London: Edward Arnold
* (http://purl.org/olia/mte/multext-east.owl#NonspecificPronoun)
*/
NonspecificPronoun(IndefinitePronoun),
/**
* Pronoun lacking person referent. (Gil Francopoulo; http://www.isocat.org/datcat/DC-1426)
*
* More precisely, a form of pronoun that denotes the absence of a concrete or specific referent, e.g., * German "man". *
* As opposed to IndefinitePronoun, this referent is not just discourse-new, but generic or hypothetical.
*/
ImpersonalPronoun(IndefinitePronoun),
/**
* Pronoun used in a context of a negation or for expressing a negation.
* (http://www.isocat.org/datcat/DC-1925)
*/
NegativePronoun(IndefinitePronoun),
/**
* A Locative pronoun is a pronoun, which locates the object of a noun or place of anything.
*
*
* ་ ན་ གས་ ང་ ་ ག། * Nâ[LP] PhÜntsho'ling-lu ShÔ * 'Come here at Phuntsholing' ** *
* Insa Gülzow (2006), The acquisition of intensifiers: Emphatic reflexives in English and German child
* language, Mouton de Gruyter, Berlin, p. 258)
*/
DeterminalPronoun(PersReflPronoun),
/**
* A FirstPersonPronoun refers to the speaker, or to both the speaker and referents grouped with the
* speaker.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsFirstPersonDeixis.htm 19.09.06)
*/
FirstPersonPronoun(PersReflPronoun),
/**
* A personal pronoun is a pronoun that expresses a distinction of person deixis.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPersonalPronoun.htm 19.09.06)
*/
PersonalPronoun(PersReflPronoun),
/**
* *|An asterisk represents a zero pronoun; it may need to be deleted. ... is used to represent the empty
* subject of gerunds, imperatives and to-infinitive clauses. (Santorini 1991)
*
* (NP *) â ´ arbitrary PRO, controlled PRO, and trace of A-movement (Bies et al. 1995)
*/
ZeroPronoun(PersonalPronoun),
/**
* Personnal pronoun that is affixed. (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2221)
*/
AffixedPersonalPronoun(PersonalPronoun),
/**
* Personal pronoun that can occupy the position after a preposition and/or reinforce a weak personal
* pronoun. (Eagles; http://www.isocat.org/datcat/DC-1390)
*/
StrongPersonalPronoun(PersonalPronoun),
/**
* Personal pronoun that cannot occupy the position after a preposition and/or reinforce a strong personal
* pronoun.
* (http://www.isocat.org/datcat/DC-1414)
*/
WeakPersonalPronoun(PersonalPronoun),
/**
* A reciprocal pronoun is a pronoun that expresses a mutual feeling or action among the referents of a
* plural subject.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAReciprocalPronoun.htm 19.09.06)
*/
ReciprocalPronoun(PersReflPronoun),
/**
* A reflexive pronoun is a pronoun that has coreference with the subject.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAReflexivePronoun.htm 19.09.06)
*/
ReflexivePronoun(PersReflPronoun),
/**
* Second person deixis means deictic reference to a person or persons identified as addressee.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsSecondPersonDeixis.htm 19.09.06)
*/
SecondPersonPronoun(PersReflPronoun),
/**
* In several European languages exist special forms of pronouns for polite or respectful reference, e.g.
* Dutch u and Spanish usted. The concept FamiliarSecondPersonPronoun applies to the corresponding
* unmarked forms for informal conversiation in such languages.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1p 19.09.06)
*/
FamiliarSecondPersonPronoun(SecondPersonPronoun),
/**
* In several European languages exist special forms of pronouns for polite or respectful reference, e.g.
* Dutch u and Spanish usted.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1p 19.09.06)
*/
PoliteSecondPersonPronoun(SecondPersonPronoun),
/**
* Third person reference is a deictic reference to a referent(s) not identified as the speaker or
* addressee.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsThirdPersonDeixis.htm 19.09.06)
*/
ThirdPersonPronoun(PersReflPronoun),
/**
* A possessive pronoun is a pronoun that expresses relationships like ownership, such as kinship, and
* other forms of association.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAPossessivePronoun.htm 19.09.06)
*/
PossessivePronoun(Pronoun),
/**
* A possessive determiner is a part of speech that modifies a noun by attributing ownership to someone or
* something.
* (http://en.wikipedia.org/wiki/Possessive_adjective 19.09.06)
*/
PossessiveDeterminer(AttributivePronoun, PossessivePronoun),
/**
* Attributive possessive pronoun form of the reflexive pronoun, e.g., Russian свой:
*
* Обама на свой день рождения угощал гостей стейками и хот-догами. Obama on his day of.birth entertained
* guests with.steaks and hot.dogs
* "On his birthday, Obama entertained his guests with steaks and hot dogs."
* (http://ua.rian.ru/world_news/20110805/78815136.html)
*
* The antecedent of a possessive reflexive is not determined by its gender, but by its syntactic
* prominence.
*/
ReflexivePossessiveDeterminer(ReflexiveDeterminer, PossessiveDeterminer),
/**
* non-attributive pronoun
*/
SubstitutivePronoun(Pronoun),
/**
* @deprecated to be replaced with InterrogativePronoun or #RelativePronoun
*/
@Deprecated
WHPronoun(Pronoun),
/**
* An exclamative pronoun is a word which marks an exclamation.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnExclamative.htm 19.09.06)
*/
ExclamatoryPronoun(WHPronoun),
/**
* A interrogative pronoun is a pro-form that is used in questions in place of the item questioned for.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnInterrogativeProForm.htm 19.09.06)
*/
InterrogativePronoun(WHPronoun),
/**
* A relative pronoun is a pronoun that marks a relative clause, functions grammatically within the
* relative clause, and is coreferential to the word modified by the relative clause.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsARelativePronoun.htm 19.09.06)
*/
RelativePronoun(WHPronoun),
/**
* pronoun that have reference to something characterized by allusions. (MIRACL & LSCA;
* http://www.isocat.org/datcat/DC-2223)
*
* an invariable pronoun expressing a specific intention by means of unclear term (Khemakhem Aida, * 2010-05-10 via isocat-morpho@loria.fr) *
* examples from Arabic (Monica Monachini 2010-05-06 via isocat-morpho@loria.fr): "kam nahaituhu" (how
* often I forbade him, Hans Wehr), "baas Saar `amra `ashr isniin, gam (= kam) yriid paysikil" (He just
* turned ten, and here [how] he wants a bicycle, Georgetown University Iraqi Arabic-English Dictionary),
* "gam (= kam) yurguS imnil-faraH" ([how] he jumped for joy, Georgetown University Iraqi Arabic-English
* Dictionary)
*/
AllusivePronoun(Pronoun),
/**
* conditional pronoun (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2222)
*/
ConditionalPronoun(Pronoun),
/**
* Pronoun marked to show its importance.
* (http://www.isocat.org/datcat/DC-1941)
*/
EmphaticPronoun(Pronoun),
/**
* Punctuation that is more important than a secondary punctuation with regards to sentence splitting in a
* text.
* (http://www.isocat.org/datcat/DC-2075)
*/
MainPunctuation(LexicalCategory.Punctuation),
/**
* SentenceFinalPunctuation are . ? !.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node17.html#recv 19.09.06)
*/
SentenceFinalPunctuation(MainPunctuation),
/**
* Sign used to express a question.
* (http://www.isocat.org/datcat/DC-1444)
*/
QuestionMark(SentenceFinalPunctuation),
/**
* Sign (.) used to expresses the end of a sentence or an abbreviation.
* (http://www.isocat.org/datcat/DC-1445)
*/
Point(SentenceFinalPunctuation),
/**
* Special sign (!) usually used in writing to mark exclamation.
* (http://www.isocat.org/datcat/DC-1441)
*/
ExclamativePoint(MainPunctuation),
/**
* Punctuation used when the sentence is interrogative.
* (http://www.isocat.org/datcat/DC-2087)
*/
InterrogativePunctuation(MainPunctuation),
/**
* Punctuation that is not very important with regards to sentence splitting in a text.
* (http://www.isocat.org/datcat/DC-2076)
*/
SecondaryPunctuation(LexicalCategory.Punctuation),
/**
* Parenthetical elements are dominated by a node labeled PRN. Punctuation marks that set off a
* parenthetical (i.e., commas, dashes, parentheses (-LRB- and -RRB-)) are contained within the PRN node.
* Use of PRN is determined ultimately by individual annotator intuition, though the presence of dashes or
* parentheses strongly suggests a parenthetical. (Bies et al. 1995)
*/
ParentheticalPunctuation(SecondaryPunctuation),
/**
* Beginning of a paired punctuation.
* (http://www.isocat.org/datcat/DC-2078)
*/
LeftParentheticalPunctuation(ParentheticalPunctuation),
/**
* < LAB* Left angle bracket (Santorini 1991)
*/
OpenAngleBracket(LeftParentheticalPunctuation),
/**
* [ LSB* Left square bracket (Santorini 1991)
*/
OpenSquareBracket(LeftParentheticalPunctuation),
/**
* Inverted comma.
* (http://www.isocat.org/datcat/DC-1443)
*/
InvertedComma(LeftParentheticalPunctuation),
/**
* Punctuation used in certain languages at the beginning of an interrogative sentence.
* (http://www.isocat.org/datcat/DC-2088)
*/
InvertedQuestionMark(LeftParentheticalPunctuation),
/**
* Punctuation that is represented graphically as [
* (http://www.isocat.org/datcat/DC-2082)
*/
OpenBracket(LeftParentheticalPunctuation),
/**
* Punctuation that is graphically represented as {
* (http://www.isocat.org/datcat/DC-2084)
*/
OpenCurlyBracket(LeftParentheticalPunctuation),
/**
* Beginning of a pair of parenthesis.
* (http://www.isocat.org/datcat/DC-1442)
*/
OpenParenthesis(LeftParentheticalPunctuation),
/**
* End of a paired punctuation.
* (http://www.isocat.org/datcat/DC-2079)
*
* RightParentheticalPunctuation is a punctuation mark which concludes a constituent whose the opening is
* marked by a LeftParentheticalPunctuation, e.g. ), ] and Spanish ?.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node17.html#recv 19.09.06)
*/
RightParentheticalPunctuation(ParentheticalPunctuation),
/**
* > RAB* Right angle bracket (Santorini 1991)
*/
CloseAngleBracket(RightParentheticalPunctuation),
/**
* ] RSB* Right square bracket (Santorini 1991)
*/
CloseSquareBracket(RightParentheticalPunctuation),
/**
* Punctuation that is graphically represented by ]
* (http://www.isocat.org/datcat/DC-2083)
*/
CloseBracket(RightParentheticalPunctuation),
/**
* Punctuation that is graphically represented by }
* (http://www.isocat.org/datcat/DC-2085)
*/
CloseCurlyBracket(RightParentheticalPunctuation),
/**
* End of a parenthesis pair.
* (http://www.isocat.org/datcat/DC-1440)
*/
CloseParenthesis(RightParentheticalPunctuation),
/**
* SentenceMedialPunctuation are , ; : - .
* (http://www.ilc.cnr.it/EAGLES96/annotate/node17.html#recv 19.09.06)
*/
SentenceMedialPunctuation(SecondaryPunctuation),
/**
* Sign with two vertical points that is used in writing and printing to introduce an explanation, example
* or quotation. (Gil Francopoulo; http://www.isocat.org/datcat/DC-1439)
*/
Colon(SentenceMedialPunctuation),
/**
* Mark (,) used in writing to show a short pause or to separate items in a list. (Longman DCE 2005;
* http://www.isocat.org/datcat/DC-1448)
*/
Comma(SentenceMedialPunctuation),
/**
* Punctuation that is graphically presented as "-".
* (http://www.isocat.org/datcat/DC-2077)
*/
Hyphen(SentenceMedialPunctuation),
/**
* Sign (;) usually used to separate phrases.
* (http://www.isocat.org/datcat/DC-1446)
*/
SemiColon(SentenceMedialPunctuation),
/**
* Sequence of three dots having the same meaning as "et cetera" (full form) or "etc" (abbreviated form).
* (http://www.isocat.org/datcat/DC-1447)
*/
SuspensionPoints(SentenceMedialPunctuation),
/**
* Punctuation usually used to surround a quotation.
* (http://www.isocat.org/datcat/DC-2081)
*/
Quote(SecondaryPunctuation),
/**
* quotation mark, closing
*/
CloseQuote(Quote),
/**
* quotation mark, opening
*/
OpenQuote(Quote),
/**
* The punctuation sign /
* (http://www.isocat.org/datcat/DC-1437)
*/
Slash(SecondaryPunctuation),
/**
* Quantifiers that enforce dual agreement (i.e., as with the numeral "2").
*
* Some feminine and neuter body parts in Czech have preserved dual forms, and if the noun is dual, so are * its attributes (adjectives, pronouns). So the agreement of the numeral 2 differs formally from 3-4 * (Ivan A. Derzhanski, email 2010/06/16, http://purl.org/olia/mte/multext-east.owl#DualQuantifier) *
* Numeral/Class="definite", Numeral/Class="definite1", Numeral/Class="definite234" etc. refer to specific
* patterns of congruency with Slavic numerals that originate from the difference between Old Slavic
* singular (definite1), dual (definite2, definite234) and plural (definite).
* (http://purl.org/olia/mte/multext-east.owl#DualQuantifier)
*/
DualQuantifier(LexicalCategory.Quantifier),
/**
* A numeral is a word, functioning most typically as an adjective or pronoun, that expresses a number,
* and relation to the number, such as one of the following: Quantity, Sequence, Frequency, Fraction.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsANumeral.htm 19.09.06)
*/
Numeral(LexicalCategory.Quantifier),
/**
* Bulgarian has Numeral/Form=approx(a), used for approximate numerals (десетина /about a ten/, стотина
* /about a hundred/) (Dimitrova et al. 2009,
* http://purl.org/olia/mte/multext-east.owl#ApproximateNumeral)
*/
ApproximateNumeral(Numeral),
/**
* A cardinal numeral is a numeral of the class whose members are considered basic in form, used in
* counting, and used in expressing how many objects are referred to.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsACardinalNumeral.htm 19.09.06)
*/
CardinalNumber(Numeral),
/**
* Numeral/Type="collect" (Romanian)
* In traditional Romanian grammars, expressions like amândoi "both", toţi trei "all three" are referred
* to as collective numerals. (MTE v4, http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral)
*
* e.g., ambelor/ambii, ambilor/ambii, amânduror/amândoi, amândurora/amândoi, câteşipatru, tuspatru (ro, * http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral) *
* e.g., czworga/czworo, czworgiem/czworo, czworgu/czworo, czworo/czworo, dwoje/dwoje, dwojga/dwoje, * dwojgiem/dwoje, dwojgu/dwoje, jedenaścioro/jedenaścioro (pl, * http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral) *
* e.g., dvadesetora/dvadesetoro, dvoja/dvoje, dvoje, dvoji/dvoje, dvojih/dvoje, dvojim/dvoje, oboje, * tridesetora/tridesetoro, troja/troje (sr, http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral) *
* e.g., обата, обајцата, обете, шеесетминава/шеесетмина, шеесетминана/шеесетмина, * шеесетмината/шеесетмина, шеснаесетминава/шеснаесетмина, шеснаесетминана/шеснаесетмина, * шеснаесетмината/шеснаесетмина (mk, http://purl.org/olia/mte/multext-east.owl#CollectiveNumeral) */ CollectiveNumeral(Numeral), /** * Nominal numbers are used to identify or refer the things. It does not show the quantity or rank. *
* Example: * *
* ངེ་གི་ འགལ་འཕིན་ ཨང་གངས་ འདི་ ༡༧༦༤༩༠༣༧ ཨིན། * NGIGI DRUELTHRIN ANGDRANG 'DI 17649037 INN * my mobile number is 17649037 be * “ My mobile number is 17649037.” ** * (Jurmey Rabgay, email Sep 20, 2010, http://purl.org/olia/dzongkha.owl#NominalNumber) */ NominalNumber(Numeral), /** * An ordinal number is a number belonging to a class whose members designate positions in a sequence, * e.g. in English "First", "Second", "Third".
* Symbols such as alphabetic characters can vary for singular and plural (e.g. How many Ps are there in
* `psychopath'?), and are in this respect like common nouns. In some languages (e.g. Portuguese) such
* symbols also have gender.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node17.html#recr)
*/
Symbol(LexicalCategory.Residual),
/**
* a mis-typed word
*/
Typo(LexicalCategory.Residual),
/**
* adopted from Dzongkha tagset (Chungku et al. 2010). If its tradition of grammar description is
* influenced by the Indian, these case markers are variously described as case morphemes or as
* postpositions. Therefore introduced as a shorthand for Adposition or MorphologicalParticle
*/
CaseMarker(LexicalCategory.Unique),
/**
* A classifier is a word or affix that expresses the classification of a noun.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAClassifier.htm 19.09.06)
*
* Classifiers are a very typical feature of sign languages. In some Asian languages, classifiers are used * as particles to combine a noun with a numeral, e.g. chin. _san ge ren_ 'three pieces of people', 'three * people' (Bußmann 2002, under Klassifikator) *
* Bharati et al. (2006, for Indian languages) group Classifiers together with Quantifiers and Numerals, * but they do not provide a detailed characterization of this class. *
* Akshar Bharati, Dipti Misra Sharma, Lakshmi Bai, Rajeev Sangal (2006), AnnCorra : Annotating Corpora.
* Guidelines For POS And Chunk Annotation For Indian Languages, Tech. Rep., L anguage Technologies
* Research Centre IIIT, Hyderabad, version of 15-12-2006, http://ltrc.iiit.ac.in/tr031/posguidelines.pdf
*/
Classifier(LexicalCategory.Unique),
/**
* Generally, discourse markers are expressions or phrases of greeting, apologizing, thanking, short
* emotional utterances, and interjections. Their node label is DM. ... Typical discourse markers are: ja,
* nein, hallo, oh, aha, pst, nunja, gewiß, toll, nun ja, etc. (Telljohann et al. 2009, p. 136)
*/
DiscourseMarker(LexicalCategory.Unique),
/**
* For Hindi, words like 'bahuta', 'kama', etc. when intensifying adjectives or adverbs will be annotated
* as INTF. Example, h37. hEdarAbAda meM aMgUra bahuta_INTF acche milate hEM 'HyderabAd' 'in' 'grapes'
* 'very' 'good' 'available' 'are' “Very good grapes are available in Hyderabad” (Bharati et al. 2006)
* Akshar Bharati, Dipti Misra Sharma, Lakshmi Bai, Rajeev Sangal (2006), AnnCorra : Annotating Corpora.
* Guidelines For POS And Chunk Annotation For Indian Languages, Tech. Rep., L anguage Technologies
* Research Centre IIIT, Hyderabad, version of 15-12-2006, http://ltrc.iiit.ac.in/tr031/posguidelines.pdf
*/
Intensifier(LexicalCategory.Unique),
/**
* The izāfat (pronounced as a shorter form of –ē–) is an enclitic of Persian origin which is used in
* Farsi and neighboring languages. In Urdu, it can be considered a preposition under certain
* circumstances: it links two nouns in a possessive relationship, although the phrase thus produced may
* often have a different meaning to a phrase produced with the native Urdu postposition kā. However, the
* izāfat may also join a noun to an adjective, in which case it is not so clearly accurate to describe it
* as a preposition parallel to the prepositions in European languages for which the EAGLES guidelines
* were compiled. A better way to treat izāfat is in the context of the Unique category of miscellaneous
* one-member wordclasses, discussed below. (Hardie 2003, http://purl.org/olia/emille.owl#Izafat)
*/
Izafat(LexicalCategory.Unique),
/**
* In Urdu, multiplicative numerals are formed by adding the suffix gunâ (Schmidt 1999, p.
* 260,http://purl.org/olia/emille.owl#MultiplicativeMarker)
*/
MultiplicativeMarker(LexicalCategory.Unique),
/**
* synonym of Unique, to be avoided because of its divergent definitions (Chiarcos)
*/
Particle(LexicalCategory.Unique),
/**
* Particle that serves to form adjective phrases, e.g., Urdu sā
* (http://purl.org/olia/emille.owl#AdjectivalParticle)
*/
AdjectivalParticle(Particle),
/**
* Contrastive particle, e.g., (one of the uses of) Urdu tô:
*
*
* vo urdû parhê gâ * "He will study Urdu." (simple statement) * * vo tô urdû parhê gâ * "HE will study Urdu." (Contrast: the other students may not.) ** * (Schmidt 1999, p. 232, see http://purl.org/olia/emille.owl#ContrastiveEmphaticParticle) */ ContrastiveParticle(Particle), /** * Emphatic particle, e.g., (one of the uses of) Urdu tô: * *
* vo urdû parhê gâ * "He will study Urdu." (simple statement) * * vo urdû parhê gâ tô lêkin imtihân nahîm dê gâ * "He will STUDY Urdu, OF COURSE, but he won't take the examination." * *(Schmidt 1999, p. 232, see http://purl.org/olia/emille.owl#ContrastiveEmphaticParticle) */ EmphaticParticle(Particle, Intensifier), /** * adopted from EMILLE, http://purl.org/olia/emille.owl#ContrastiveEmphaticParticle, shorthand for * ContrastiveParticle and EmphaticParticle */ ContrastiveEmphaticParticle(EmphaticParticle, ContrastiveParticle), /** * In Urdu, the exclusive emphatic particle hî emphasizes the preceding word and excludes something else * (which may not be expressed). (Schmidt 1999, p.233, * http://purl.org/olia/emille.owl#ExclusiveEmphaticParticle)
* Compare with the inclusive emphatic particle bhî: * ** maim *bhî* faisalâ karûm gâ * "I'll *also* make a decision" * * maim *hî* faisalâ karûm gâ * "*I'm the one who* will make the decision." ** * (Schmidt 1999, p.237, http://purl.org/olia/emille.owl#InclusiveEmphaticParticle) */ ExclusiveEmphaticParticle(EmphaticParticle), /** * In Urdu, bhî is an emphatic particle meaning 'even'. In opposition to contrastive tô and exclusive hî, * bhî is inclusive: * ** maim *bhî* faisalâ karûm gâ * "I'll *also* make a decision" * * maim *hî* faisalâ karûm gâ * "*I'm the one who* will make the decision." ** * (Schmidt 1999, p.237, http://purl.org/olia/emille.owl#InclusiveEmphaticParticle) */ InclusiveEmphaticParticle(EmphaticParticle), /** * English existential there is specified as a subtype of pronoun in MTE v4, i.e., Pronoun/Type="ex-there"
* (http://purl.org/olia/mte/multext-east.owl#ExistentialThere) */ ExistentialParticle(Particle), /** * http://www.isocat.org/datcat/DC-1455 (preverbalParticleLmf) */ PreverbalParticle(Particle), /** * A verbal particle modifies the verb and carries information on the verb form (e.g., finiteness, tense * and aspect). (Dimitrova et al. 2009, Dan Tufis, email 2010/06/09). * * In the Bulgarian MTE specs, Particle/Type=verbal(v) is used to form different type of verbal * syntactical relationships, e.g. to create future tense (ще говориш), or particles like се, да. * (Dimitrova et al. 2009) The Romanian MTE v4 specs provide a more fine-grained subclassification of * (verbal) particles (MTE v4, http://purl.org/olia/mte/multext-east.owl#VerbalParticle) */ VerbalParticle(Particle), /** * In the Romanian MULTEXT-East scheme, a verbal particle with Particle/Type="aspect" modifies the verbs * and carries information on the verb form, i.e., on its aspect (Dan Tufis, email 2010/06/09, * http://purl.org/olia/mte/multext-east.owl#AspectParticle) */ AspectParticle(VerbalParticle), /** * A modality-marking adverb is a verbal particle that serves to indicate mood, aspect and/or tense (cf. * Schmidt 1999). Note that this is not to be confused with the conventional meaning of "modal adverb" in * the sense of "manner adverb" (cf. http://en.wiktionary.org/wiki/Category:English_modal_adverbs), hence * the uncommon name. * * Ruth Laila Schmidt (1999) Urdu, an essential grammar, Routledge, London. */ ModalityMarkingAdverb(LexicalCategory.Adverb, VerbalParticle), /** * In the Romanian MULTEXT-East scheme, a verbal particle with Particle/Type="future" modifies the verbs * and marks the verb as being subjunctive, e.g., s-/să, să (Dan Tufis, email 2010/06/09, * http://purl.org/olia/mte/multext-east.owl#SubjunctiveParticle) */ SubjunctiveParticle(VerbalParticle), /** * Dzongkha has also a tense marker, which is not complicated like in other languages. It has got only six * tense markers and can be used in a very simple and effective way. They are: ('Ni'+'Wong') for future, * ('D'o'+'D'ä') for present and ('Ci'+'Yi') for past tense. * ** ང་ ནངས་པ་ འ ་ ། * Nga naba jo-ni[past tense] * I tomorrow go-will-[past] * 'I am going tomorrow' ** *
* (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) */ TenseMarkingParticle(VerbalParticle), /** * Particle used in order to express future.
* (http://www.isocat.org/datcat/DC-1919) */ FutureParticle(TenseMarkingParticle), /** * E.g., the mediopassive (middle) voice marker se in the Portuguese EAGLES scheme. (Leech and Wilson * 1996) */ VoiceParticle(VerbalParticle), /** * Particle used to express infinitive.
* (http://www.isocat.org/datcat/DC-1896) */ InfinitiveParticle(VerbalParticle), /** * Particle used to compare.
* (http://www.isocat.org/datcat/DC-1922) */ ComparativeParticle(Particle), /** * conditional particule (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2230) */ ConditionalParticule(CoordinatingConjunction, Particle), /** * particle for coordination (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2227) */ CoordinationParticle(Particle), /** * distinctive particle (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2228) */ DistinctiveParticle(Particle), /** * Particle used to express a question.
* (http://www.isocat.org/datcat/DC-1921) */ InterrogativeParticle(Particle), /** * Particle which functions as a modal.
* (http://www.isocat.org/datcat/DC-1920) */ ModalParticle(Particle), /** * Particle used to express negation. (Gil Francopoulo; http://www.isocat.org/datcat/DC-1894) */ NegativeParticle(Particle), /** * Particle used to express affirmation.
* (http://www.isocat.org/datcat/DC-1918) */ AffirmativeParticle(Particle), /** * Particle expressing ownship.
* (http://www.isocat.org/datcat/DC-1895) */ PossessiveParticle(Particle), /** * relative particle (MIRACL & LSCA; http://www.isocat.org/datcat/DC-2229) */ RelativeParticle(Particle), /** * Particle expressing superlative degree. Superlative is the comparison between more than two entities * and contrasts with comparative where only two entities are involved and positive where no comparison is * implied. (Crystal 2003; http://www.isocat.org/datcat/DC-1923) */ SuperlativeParticle(Particle), /** * In Urdu, wālā can be added to substantives to derive nouns implying possession or general * relationships, e.g., go-wāl, or go-wālā, s.m. cow-keeper, cow-herd (from go, 'cow'), or ghar-wālā, s.m. * master or owner of the house (from ghar, 'house') (Plats 1884, cf. http://purl.org/olia/urdu.owl#Wala) */ PossessionMarker(LexicalCategory.Unique), /** * Word which serves no grammatical function, but which fills up a sentence or gives emphasis. * (www.southwestern.edu/~carlg/Latin_Web/glossary.html; http://www.isocat.org/datcat/DC-1283) */ Expletive(LexicalCategory.Unique), /** * An expletive (also known as a dummy word) is a part of speech whose members have no meaning, but * complete a sentence to make it grammatical [Crystal 1997, 127]
* (http://purl.org/linguistics/gold/Expletive) ** In European languages, expletives are pronouns. A verbal part of speech that * "has no meaning, but complete a sentence to make it grammatical" is a copula (see AuxiliaryVerb). */ ExpletivePronoun(ThirdPersonPronoun, Expletive), /** * Three different expletive usages [of the German expletive pronoun es] are traditionally distinguished: * formal subject or object (expletive argument), correlate of an extraposed clausal argument (expletive * correlate), and Vorfeld-es (structural expletive) (cf. (Eisenberg 1999 2001), (Pütz 1986)). ... *
* The formal subject obligatorily occurs with weather verbs, e.g. "Es regnet" and unpersonal or agentless * constructions such as "Es gibt so eine Buchung" or "Es geht um populäre Unterhaltung." Some verbs * optionally permit an expletive subject but also occur with referential subjects such as * "Max/Es kopft an der Tür." A formal object is found in constructions like "jmd. legt es an auf etw." or * "jmd. verdirbt es mit jmdm." In all examples mentioned, es functions as a grammatical argument without * semantic contribution, i.e. it does not refer to a person, object, or event. (Telljohann et al. 2009, * p.60f) */ ExpletiveArgument(ExpletivePronoun), /** * Three different expletive usages [of the German expletive pronoun es] are traditionally distinguished: * formal subject or object (expletive argument), correlate of an extraposed clausal argument (expletive * correlate), and Vorfeld-es (structural expletive) (cf. (Eisenberg 1999 2001), (Pütz 1986)). (Telljohann * et al. 2009, p.60) *
* Extraposed clausal arguments: * "Aber [es] ist übertrieben zu sagen, damit bekäme die FU erst eine Identität." (Telljohann et al. 2009, * p.62) */ ExpletiveCorrelate(ExpletivePronoun), /** * Three different expletive usages [of the German expletive pronoun es] are traditionally distinguished: * formal subject or object (expletive argument), correlate of an extraposed clausal argument (expletive * correlate), and Vorfeld-es (structural expletive) (cf. (Eisenberg 1999 2001), (Pütz 1986)). (Telljohann * et al. 2009, p.60) *
* In German, a purely structural dummy element ... occurs in Vorfeld position only and is not correlated * with any argument of the clause. It does not agree with the verb which becomes evident if there is a * plural subject in the Mittelfeld: *
* "es zahlen ihn die Völker, deren Menschenrechte angeblich verteidigt werden." *
* It is ungrammatical in the Mittelfeld, e.g. *". . . dass es ihn die Völker zahlen". */ StructuralExpletive(ExpletivePronoun), /** * An auxiliary verb is a verb which accompanies the lexical verb of a verb phrase, and expresses * grammatical distinctions not carried by the lexical verb, such as person, number, tense aspect, and * voice.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnAuxiliaryVerb.htm 19.09.06) ** Besides modal verbs ("semiauxiliary") and "strict" auxiliary verbs, also copulas are classified under * auxiliary verbs here, as this is a praxis applied in practically every EAGLES-conformant * morphosyntactic annotation scheme. *
* Part of speech referring to the set of verbs, subordinate to the main lexical verb which help to make * distinction in mood, aspect, voice etc. (Crystal 2003; http://www.isocat.org/datcat/DC-1244) */ AuxiliaryVerb(LexicalCategory.Verb), /** * A copula is an intransitivity verb which links a subject to a noun phrase, an adjective or an other * constituent which expresses the predicate.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsACopula.htm 19.09.06) */ Copula(AuxiliaryVerb), /** * Verb form that is usually used with another verb to express ideas such as possibilities, permission, or * intention. (Gil Francopoulo; http://www.isocat.org/datcat/DC-1329) ** A modal verb (also modal, modal auxiliary verb, modal auxiliary) is a type of auxiliary verb that is * used to indicate modality. The use of auxiliary verbs to express modality is characteristic of Germanic * languages.
* (http://en.wikipedia.org/wiki/Modal_verb 19.09.06) ** In addition to main and auxiliary verbs, it may be useful (e.g. in English) to recognise an * intermediate category of semi-auxiliary for such verbs as be going to, have got to, ought to.
* (http://www.ilc.cnr.it/EAGLES96/annotate/node18.html#oav1v 20.09.06) ** The auxiliaries in English subdivide into the primary verbs `be', `have', and `do', which can also * function as main verbs, and the modal auxiliaries such as `can', `will', and `would', which are * uninflected, and always function as auxiliaries.
* (http://www.ilc.cnr.it/EAGLES96/morphsyn/node158.html#SECTION00054800000000000000) */ ModalVerb(AuxiliaryVerb), /** * Non-modal, non-copular auxiliary verb. */ StrictAuxiliaryVerb(AuxiliaryVerb), /** * An auxiliary that marks exclusively aspect, e.g., in Urdu: ** Auxiliaries: Based on the syntactic nature of Urdu, auxiliaries are divided into two categories. * Aspectual auxiliaries always occur after main verb of the sentence. Tense auxiliaries are used to show * the time of the action. They occurred at the end of the verb phrase (Sajjad 2007). *
* E.g., Urdu rahā, an auxiliary element is used to mark the durative aspect. (Hardie 2004, * http://purl.org/olia/emille.owl#RahaAuxiliary) */ AspectMarkingAuxiliary(StrictAuxiliaryVerb), /** * An auxiliary that marks exclusively tense, e.g., in Urdu: *
* Auxiliaries: Based on the syntactic nature of Urdu, auxiliaries are divided into two categories. * Aspectual auxiliaries always occur after main verb of the sentence. Tense auxiliaries are used to show * the time of the action. They occurred at the end of the verb phrase. (Sajjad 2007). *
* In Urdu, the auxiliary gā indicates future tense when it follows a verb in the subjunctive form.
* (http://purl.org/olia/emille.owl#GaAuxiliary) */ TenseMarkingAuxiliary(StrictAuxiliaryVerb), /** * Verb used to link the subject of a sentence and its noun or adjective complement or complementing * phrase in certain languages. This verb could be used also to form the passive voice. * (www.wordreference.com/English/definition.asp?en=be -> 4); http://www.isocat.org/datcat/DC-1246) */ BeAuxiliary(StrictAuxiliaryVerb), /** * The verb have as an auxiliary. * (www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnAuxiliaryVerb.htm; * http://www.isocat.org/datcat/DC-1299) */ HaveAuxiliary(StrictAuxiliaryVerb), /** * A finite verb is a verb form that occurs in an independent clause, and is fully inflected according to * the inflectional categories marked on verbs in the language.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAFiniteVerb.htm 19.09.06) ** Property applied to a verb form that can occur on its own in an independent sentence. (Crystal 2003; * http://www.isocat.org/datcat/DC-1287) */ FiniteVerb(LexicalCategory.Verb), /** * A conditional verb is a verb form in many languages. It is used to express degrees of certainty or * uncertainty and hypothesis about past, present, or future. Such forms often occur in conditional * sentences.
* (http://en.wikipedia.org/wiki/Conditional_mood 19.09.06) */ ConditionalVerb(FiniteVerb), /** * An imperative verb is used to express commands, direct requests, and prohibitions. Often, direct use of * the imperative mood may appear blunt or even rude, so it is often used with care. Example: "Paul, read * that book".
* (http://en.wikipedia.org/wiki/Grammatical_mood#Imperative_mood 19.09.06) */ ImperativeVerb(FiniteVerb), /** * Indicative mood is used in factual statements. All intentions in speaking that a particular language * does not put into another mood use the indicative. It is the most commonly used mood and is found in * all languages.
* (http://en.wikipedia.org/wiki/Grammatical_mood#Indicative_mood 19.09.06) */ IndicativeVerb(FiniteVerb), /** * A subjunctive verb is typically used to expresses wishes, commands (in subordinate clauses), emotion, * possibility, judgment, necessity, and statements that are contrary to fact at present.
* (http://en.wikipedia.org/wiki/Subjunctive_mood 19.09.06) */ SubjunctiveVerb(FiniteVerb), /** * In linguistics, a light verb is a verb participating in complex predication that has little semantic * content of its own, but provides through inflection some details on the event semantics, such as * aspect, mood, or tense. The semantics of the compound, as well as its argument structure, are * determined by the head or primary component of the compound, which may be a verb or noun (V+V or V+N * compounds). Other names for "light verb" include: vector verb or explicator verb, emphasising its role * within the compound; or thin verb or semantically weak verb, emphasising (as with "light") its lack of * semantics. A "semantically weak" verb is not to be confused with a "weak verb" as in the Germanic weak * inflection. Light verbs are similar to auxiliary verbs in some ways. ** Most English light verbs occur in V+N forms sometimes called "stretched verbs": for example, take in * take a nap, where the primary sense is provided by "nap", and "take" is the light verb. The light verbs * most common in these constructions are also common in phrasal verbs. A verb which is "light" in one * context may be "heavy" in another: as with "take" in I will take a book to read. *
* Examples in other languages include the Yiddish geb in geb a helf (literally give a help, "help"); the * French faire in faire semblant (lit. make seeming, "pretend"); the Hindi nikal paRA (lit. leave fall, * "start to leave"); and the bǎ construction in Chinese.[1] Some verbs are found in many such * expressions; to reuse an earlier example, take is found in take a nap, take a shower, take a sip, take * a bow, take turns, and so on. Light verbs are extremely common in Indo-Iranian languages, Japanese, and * other languages in which verb compounding is a primary mechanism for marking aspectual distinctions.
* (http://en.wikipedia.org/wiki/Light_verb) */ LightVerb(LexicalCategory.Verb), /** * Verb forms occurring on their own only in dependent clauses and lacking tense and mood contrasts. * (adapted from Crystal 2003; http://www.isocat.org/datcat/DC-1332) ** A non-finite verb is a verb that is not fully inflected for categories that are marked inflectionally * in a language, such as the following: Tense, Aspect, Modality, Number, Person.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsANonfiniteVerb.htm 19.09.06) */ NonFiniteVerb(LexicalCategory.Verb), /** * property for a non-finite form of a verb other than the infinitive.
* (http://www.isocat.org/datcat/DC-2243) ** A gerund is a kind of verbal noun that exists in some languages. In today's English, gerunds are nouns * built from a verb with an '-ing' suffix. They can be used as the subject of a sentence, an object, or * an object of preposition. They can also be used to complement a subject. Often, gerunds exist * side-by-side with nouns that come from the same root but the gerund and the common noun have different * shades of meaning.
* (http://en.wikipedia.org/wiki/Gerund, http://en.wikibooks.org/wiki/English:Gerund 19.09.06) ** The term _gerund_ is ambiguous: with respect to Latin, in whose grammatical tradition it originates, it * refers to a deverbal noun, and is needed in this function for Polish as well; in descriptions of some * other languages, however, it has been used for an adverbial participle. The two meanings have nothing * in common, except that the English _ing_-form can translate both. (Ivan A Derzhanski, email 2010/06/09) * Here, it is assumed that Gerund refers only to deverbal nouns, cf. NominalNonfiniteVerb in the IIIT * tagset
* (http://purl.org/olia/iiit.owl#NominalNonFiniteVerb) */ Gerund(NonFiniteVerb), /** * An infinitive is the base form of a verb. It is unmarked for inflectional categories such as the * following: Aspect, Modality, Number, Person and Tense.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAnInfinitive.htm 19.09.06) */ Infinitive(NonFiniteVerb), /** * A participle is a lexical item, derived from a verb that has some of the characteristics and functions * of both verbs and adjectives. In English, participles may be used as adjectives, and in non-finite * forms of verbs.
* (http://www.sil.org/linguistics/GlossaryOfLinguisticTerms/WhatIsAParticiple.htm 19.09.06) */ Participle(NonFiniteVerb), /** * Adverb/Type="participle" is used in the Slovene MTE v4 specs, e.g., 'leže' / lying. Slovenian adverbial * participles are, however, not attested for Resian. (MTE * v4)(http://purl.org/olia/mte/multext-east.owl#AdverbialParticiple) */ AdverbialParticiple(LexicalCategory.Adverb, Participle), /** * [In Bengali, t]he Conditional Participle is widely used to convey * "if a certain action [pertaining to the parent verb] is done,...". The logic is: "in the case or * condition of a certain action being done". Being impersonal, without regard for the doer of the action * that caused the condition, it is not declined to suit number or gender. If this doer is not defined in * the Bengali condition clause but needs to be stated in a natural-sounding English translation, this is * identified and drawn from the second clause. For example:- Student: Teaching Truth in Bengali ** If you pay attention,* you will learn. manoyog kar-*le* tumi shikh-be. [or, If attention is paid] *
*
* (http://www.jaspell.co.uk/bengalicourse2007/wb149study49.pdf) */ ConditionalParticiple(Participle), /** * Participle and hasTense some Past */ PastParticiple(Participle), /** * Participle and hasTense some Present */ PresentParticiple(Participle), /** * English verb forms ending in '-ing' that represent either Gerunds or Participles. */ Ing("ing", Gerund, Participle), /** * Adjective based on a verb.
* (http://www.isocat.org/datcat/DC-1598) */ ParticipleAdjective(LexicalCategory.Adjective, Participle), /** * Adjective based on a past participle.
* (http://www.isocat.org/datcat/DC-1596) */ PastParticipleAdjective(ParticipleAdjective, PastParticiple), /** * Adjective based on a present participle.
* (http://www.isocat.org/datcat/DC-1597) */ PresentParticipleAdjective(ParticipleAdjective, PresentParticiple), /** * Supine is a nonfinite form of motion verbs with functions similar to that of an infinitive (Angelika * Adams) */ Supine(NonFiniteVerb), /** * A verbal noun is a noun formed directly as an inflexion of a verb or a verb stem, sharing at least in * part its constructions. This term is applied especially to gerunds, and sometimes also to infinitives * and supines.
* (http://en.wikipedia.org/wiki/Verbal_noun 19.09.06) */ VerbalNoun(CommonNoun, NonFiniteVerb), /** * Main verb in contrast to a modal or an auxiliary.
* (http://www.isocat.org/datcat/DC-1400) */ MainVerb(LexicalCategory.Verb), /** * An agentive verb marks the semantic role of agent or the doer of an action. ** Example: * *
* ་ ་ ས་ ་ ་ བསད་ ག། * Dorji-gi jele sänu * 'Dorji killed the cat' ** *
* (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) */ AgentiveVerb(MainVerb), /** * It is a verb, which indicates a strong desire to achieve something, without the doer. * ** དག་པ ་ ང་ ་ ་བར་ ག། * dag-pai zhing-lu kewa shÔ * 'May i be born in pure land' ** *
* (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) */ AspirationalVerb(MainVerb), /** * Dzongkha uses honorific forms: ན་བཟའ་/nam za/ (cloths) is the honorific form of the noun གོ་ * ལ་/gola/(cloths), གསངས་/sung/(tell) the honorific form of the verb སབ་/lab/(tell). We opted to mark * them by adding the tag NNH (honorific common noun) and VBH (honorific verb) to enable future research * on this specific usage of Dzongkha language. A number of tags were added to the set, of which we * describe four in more detail: two of the additional tags are subclasses of verbs: VBH (honorific verb * form), and VBN which describes past participle forms, like, e.g. བངམ་/jun/(created), the past particle * form of བང་/jung/(create). */ HonorificVerb(MainVerb), /** * (of a verb) having no logical subject. Usually in English the pronoun it is used in such cases as a * grammatical subject, as for example in It is raining. (of a pronoun) not denoting a person * (www.wordreference.com/English/definition.asp?en=impersonal; http://www.isocat.org/datcat/DC-1306) */ Impersonal(MainVerb), /** * A non-agentive verb is a type of verb, which indicates an action without the doer. ** Example: ང་མ་ འ ར་ ས། 'lungma phur-dä 'A wind is blowing'
* (http://panl10n.net/english/Outputs%20Phase%202/CCs/Bhutan/Papers/2007/0701/PartOfSpeech.pdf) */ NonAgentiveVerb(MainVerb), ; static final String OLIA_NAMESPACE = "http://purl.org/olia/olia.owl#"; private final Setcategories; private final Collection parents; private final IRI uri; Pos(LexicalCategory category) { this(null, category, (LexicalCategory) null); } Pos(LexicalCategory category, LexicalCategory additional) { this(null, category, additional); } Pos(String name, LexicalCategory category, LexicalCategory additional) { this.uri = new IRI(OLIA_NAMESPACE + (name == null ? name() : name)); categories = EnumSet.of(category); if (additional != null) { categories.add(additional); } parents = Collections.emptySet(); } Pos(Pos... parent) { this(null, null, parent); } Pos(String name, Pos... parent) { this(name, null, parent); } Pos(LexicalCategory category, Pos... parent) { this(null, category, parent); } Pos(String name, LexicalCategory category, Pos... parent) { this.uri = new IRI(OLIA_NAMESPACE + (name == null ? name() : name)); this.parents = parent == null || parent.length < 1 ? Collections.EMPTY_SET : Arrays.asList(parent); categories = category == null ? EnumSet.noneOf(LexicalCategory.class) : EnumSet.of(category); Set toProcess = new HashSet (parents); while (!toProcess.isEmpty()) { Iterator it = toProcess.iterator(); Pos p = it.next(); it.remove(); categories.addAll(p.categories); toProcess.addAll(p.parents); } } public Set categories() { return categories; } public boolean isParent() { return parents.isEmpty(); } public Collection parents() { return parents; } public IRI getUri() { return uri; } public Set hierarchy() { return transitiveClosureMap.get(this); } @Override public String toString() { return String.format("olia:%s", uri.getUnicodeString().substring(OLIA_NAMESPACE.length())); } /** * This is needed because one can not create EnumSet instances before the * initialization of an Enum has finished. * To keep using the much faster {@link EnumSet} a static member initialised * in an static {} block is used as a workaround. The {@link Tense#getTenses()} * method does use this static member instead of a member variable */ private static final Map
> transitiveClosureMap; static { transitiveClosureMap = new EnumMap >(Pos.class); for(Pos pos : Pos.values()){ Set parents = EnumSet.of(pos); for(Pos posParent : pos.parents()){ Set transParents = transitiveClosureMap.get(posParent); if(transParents != null){ parents.addAll(transParents); } else if(posParent != null){ parents.add(posParent); } // else no parent } transitiveClosureMap.put(pos, parents); } } }