blob: a720c78feafa46906b260594696b858d97965002 [file] [log] [blame]
// Rule script that annotates author lists: it marks first names, initials,
// complete names, name-plus-separator parts, and finally Author spans.
// Rules are applied in the order written; later rules depend on the
// annotations created by earlier ones (see the PARTOF conditions).
PACKAGE uima.ruta.example;
// import the types of this type system:
// NOTE(review): Author is used below but not declared in this script, so it
// presumably comes from this type system - confirm.
TYPESYSTEM types.BibtexTypeSystem;
// define and import an external dictionary containing first names
WORDLIST FirstNameList = 'FirstNames.txt';
// define some useful annotations
DECLARE FirstName, FirstNameInitial, Name, NameListPart;
// find the first names: annotate every FirstNameList entry that occurs
// within the document as FirstName
Document{-> MARKFAST(FirstName, FirstNameList)};
// something that may link names: the word "and", a comma, or "&"
DECLARE NameLinker;
// the second REGEXP argument is the ignore-case flag; false keeps the match
// case-sensitive
W{REGEXP("and", false) -> MARK(NameLinker)};
COMMA{ -> MARK(NameLinker)};
SPECIAL{REGEXP("&") -> MARK(NameLinker)};
// first name initials: a capitalized word whose text matches the regex "."
// followed by a period; the annotation covers rule elements 1 and 2
CW{REGEXP(".") -> MARK(FirstNameInitial,1,2)} PERIOD;
// maybe a name
// first name(s), optional initials, then a capitalized word
FirstName+ FirstNameInitial* CW{-> MARK(Name, 1, 2, 3)};
// initials that are not yet part of a Name, then a capitalized word
// NOTE(review): this rule has only two rule elements, yet MARK lists index 3;
// presumably the extra index is ignored - confirm.
FirstNameInitial+{-PARTOF(Name)} CW{-> MARK(Name, 1, 2, 3)};
// a capitalized word that is not part of a Name and does not match the
// regex ".", an optional comma, then initials
CW{-PARTOF(Name), -REGEXP(".")} COMMA? FirstNameInitial+{-> MARK(Name, 1, 2, 3)};
// list of names
// a Name not yet part of a NameListPart, followed by one or two NameLinkers;
// the NameListPart covers the name and its linker(s)
Name{-PARTOF(NameListPart)} NameLinker[1,2]{-> MARK(NameListPart,1,2)};
// one or more NameListParts followed by a Name that is part of neither an
// Author nor a NameListPart
// NOTE(review): only two rule elements here as well, but MARK lists index 3 -
// confirm that the extra index is harmless.
NameListPart+ Name{-PARTOF(Author),-PARTOF(NameListPart) -> MARK(Author,1,2,3)} ;
// NameListPart sequences that are still not part of an Author become one
NameListPart+{-PARTOF(Author) -> MARK(Author)};
// expand the author to the following punctuation mark
Author{-> SHIFT(Author,1,2)} PM;