@@ -474,6 +474,8 @@ EY_ADJS = "cag"|"cak"|"clay"|"cliqu"|"crep"|"dic"|"dop"|"glu"|"goo"|"grip"|"hok"
474
474
475
475
COMP_SUP = "JJR" | "JJS" | "RBR" | "RBS"
476
476
477
+ SINGULAR_DEMONYMS = "Bantu" | "Bengalese" | "Beninese" | "British" | "Boche" | "Burmese" | "Chinese" | "Congolese" | "Danish" | "English" | "Finnish" | "Flemish" | "Gabonese" | "Guyanese" | "Irish" | "Japanese" | "Javanese" | "Jewish" | "Lebanese" | "Maltese" | "Moorish" | "Nepalese" | "Nipponese" | "Polish" | "Portuguese" | "Rhenish" | "Romish" | "Scottish" | "Senegalese" | "Siamese" | "Singhalese" | "Sinhalese" | "Sioux" | "Spanish" | "Sudanese" | "Swedish" | "Swiss" | "Taiwanese" | "Togolese" | "Turkish" | "Vietnamese" | "Yiddish"
478
+
477
479
%%
478
480
479
481
/* "can" and "will" are not always modals, so they can be inflected */
@@ -1160,7 +1162,7 @@ COMP_SUP = "JJR"|"JJS"|"RBR"|"RBS"
1160
1162
<noun,any> ( "Brahman" | "German" | "dragoman" | "ottoman" | "shaman" | "talisman" | "Norman" | "Pullman" | "Roman" ) "s" { return (stem(1 ," " ," s" )); }
1161
1163
<noun,any> ( "Czech" | "diptych" | "Sassenach" | "abdomen" | "alibi" | "aria" | "bandit" | "begonia" | "bikini" | "caryatid" | "colon" | "cornucopia" | "cromlech" | "cupola" | "dryad" | "eisteddfod" | "encyclopaedia" | "epoch" | "eunuch" | "flotilla" | "gardenia" | "gestalt" | "gondola" | "hierarch" | "hose" | "impediment" | "koala" | "loch" | "mania" | "manservant" | "martini" | "matriarch" | "monarch" | "oligarch" | "omen" | "parabola" | "pastorale" | "patriarch" | "pea" | "peninsula" | "pfennig" | "phantasmagoria" | "pibroch" | "poly" | "real" | "safari" | "sari" | "specimen" | "standby" | "stomach" | "swami" | "taxi" | "tech" | "toccata" | "triptych" | "villa" | "yogi" | "zloty" ) "s" { return (stem(1 ," " ," s" )); }
1162
1164
<noun,any> ( "asyl" | "sanct" | "rect" | "pl" | "pendul" | "mausole" | "hoodl" | "for" ) "ums" { return (stem(1 ," " ," s" )); }
1163
- <noun,any>("Bantu"|"Bengalese"|"Beninese"|"Boche"|"Burmese"|"Chinese"|"Congolese"|"Gabonese"|"Guyanese"|"Japanese"|"Javanese"|"Lebanese"|"Maltese"|"Olympics"|"Portuguese"|"Senegalese"|"Siamese"|"Singhalese"|"Sinhalese"|"Sioux"|"Sudanese"|"Swiss"|"Taiwanese"|"Togolese"|"Vietnamese"|"aircraft"|"anopheles"|"apparatus"|"asparagus"|"barracks"|"bellows"|"bison"|"bluefish"|"bob"|"bourgeois"|"bream"|"brill"|"butterfingers"|"carp"|"catfish"|"chassis"|"chub"|"cod"|"codfish"|"coley"|"contretemps"|"corps"|"crawfish"|"crayfish"|"crossroads"|"cuttlefish"|"dace"|"dice"|"dogfish"|"doings"|"dory"|"downstairs"|"eldest"|"feces"|"finnan"|"firstborn"|"fish"|"flatfish"|"flounder"|"fowl"|"fry"|"fries"|{A}+"-works"|"gasworks"|"glassworks"|"globefish"|"goldfish"|"grand"|"gudgeon"|"gulden"|"haddock"|"hake"|"halibut"|"headquarters"|"herring"|"hertz"|"horsepower"|"hovercraft"|"hundredweight"|"ironworks"|"jackanapes"|"kilohertz"|"kurus"|"kwacha"|"ling"|"lungfish"|"mackerel"|"means"|"megahertz"|"moorfowl"|"moorgame"|"mullet"|"offspring"|"pampas"|"parr"|"patois"|"pekinese"|"penn'orth"|"perch"|"pickerel"|"pike"|"pince-nez"|"plaice"|"precis"|"quid"|"rand"|"rendezvous"|"revers"|"roach"|"roux"|"salmon"|"samurai"|"series"|"shad"|"sheep"|"shellfish"|"smelt"|"spacecraft"|"species"|"starfish"|"stockfish"|"sunfish"|"superficies"|"sweepstakes"|"swordfish"|"tench"|"tope"|"triceps"|"trout"|"tuna"|"tunafish"|"tunny"|"turbot"|"undersigned"|"veg"|"waterfowl"|"waterworks"|"waxworks"|"whiting"|"wildfowl"|"woodworm"|"yen") { return(xnull_stem()); }
1165
+ <noun,any>("aircraft"|"anopheles"|"apparatus"|"asparagus"|"barracks"|"bellows"|"bison"|"bluefish"|"bob"|"bourgeois"|"bream"|"brill"|"butterfingers"|"carp"|"catfish"|"chassis"|"chub"|"cod"|"codfish"|"coley"|"contretemps"|"corps"|"crawfish"|"crayfish"|"crossroads"|"cuttlefish"|"dace"|"dice"|"dogfish"|"doings"|"dory"|"downstairs"|"eldest"|"feces"|"finnan"|"firstborn"|"fish"|"flatfish"|"flounder"|"fowl"|"fry"|"fries"|{A}+"-works"|"gasworks"|"glassworks"|"globefish"|"goldfish"|"grand"|"gudgeon"|"gulden"|"haddock"|"hake"|"halibut"|"headquarters"|"herring"|"hertz"|"horsepower"|"hovercraft"|"hundredweight"|"ironworks"|"jackanapes"|"kilohertz"|"kurus"|"kwacha"|"ling"|"lungfish"|"mackerel"|"means"|"megahertz"|"moorfowl"|"moorgame"|"mullet"|"offspring"|"pampas"|"parr"|"patois"|"pekinese"|"penn'orth"|"perch"|"pickerel"|"pike"|"pince-nez"|"plaice"|"precis"|"quid"|"rand"|"rendezvous"|"revers"|"roach"|"roux"|"salmon"|"samurai"|"series"|"shad"|"sheep"|"shellfish"|"smelt"|"spacecraft"|"species"|"starfish"|"stockfish"|"sunfish"|"superficies"|"sweepstakes"|"swordfish"|"tench"|"tope"|"triceps"|"trout"|"tuna"|"tunafish"|"tunny"|"turbot"|"undersigned"|"veg"|"waterfowl"|"waterworks"|"waxworks"|"whiting"|"wildfowl"|"woodworm"|"yen") { return(xnull_stem()); }
1164
1166
<noun,any> "Aries" { return (stem(1 ," s" ," s" )); }
1165
1167
<noun,any> "Pisces" { return (stem(1 ," s" ," s" )); }
1166
1168
<noun,any> "Bengali" { return (stem(1 ," i" ," s" )); }
@@ -1835,7 +1837,7 @@ COMP_SUP = "JJR"|"JJS"|"RBR"|"RBS"
1835
1837
<verb,any> ( "accret" | "clon" | "deplet" | "dethron" | "dup" | "excret" | "expedit" | "extradit" | "fet" | "finetun" | "gor" | "hing" | "massacr" | "obsolet" | "reconven" | "recreat" | "recus" | "reignit" | "swip" | "videotap" | "zon" ) {ESEDING} { return (semi_reg_stem(0 ," e" )); }
1836
1838
<verb,any> ( "backpedal" | "bankroll" | "bequeath" | "blackball" | "bottom" | "clang" | "debut" | "doctor" | "eyeball" | "factor" | "imperil" | "landfill" | "margin" | "multihull" | "occur" | "overbill" | "pilot" | "prong" | "pyramid" | "reinstall" | "relabel" | "remodel" | "snowball" | "socall" | "squirrel" | "stonewall" | "wrong" ) {EDING} { return (semi_reg_stem(0 ," " )); } /* disprefer */
1837
1839
<noun,any> ( "beasti" | "browni" | "cach" | "cadr" | "calori" | "champagn" | "cologn" | "cooki" | "druggi" | "eateri" | "emigr" | "emigre" | "employe" | "freebi" | "genr" | "kiddi" | "massacr" | "mooni" | "neckti" | "nich" | "prairi" | "softi" | "toothpast" | "willi" ) "es" { return (stem(1 ," " ," s" )); }
1838
- <noun,any> (( {A} * "phobia" )| "accompli" | "aegis" | "alias" | "anorexia" | "anti" | "artemisia" | "ataxia" | "beatlemania" | "blini" | "cafeteria" | "capita" | "cola" | "coli" | "deli" | "dementia" | "downstairs" | "upstairs" | "dyslexia" | "jakes" | "dystopia" | "encyclopedia" | "estancia" | "euphoria" | "euthanasia" | "fracas" | "fuss" | "gala" | "gorilla" | "GI" | "habeas" | "haemophilia" | "hemophilia" | "hoopla" | "hula" | "impatiens" | "informatics" | "intelligentsia" | "jacuzzi" | "kiwi" | "mafia" | "magnolia" | "malaria" | "maquila" | "marginalia" | "megalomania" | "mercedes" | "militia" | "mufti" | "muni" | "olympics" | " pancreas"| "paranoia" | "pastoris" | "pastrami" | "pepperoni" | "pepsi" | "pi" | "piroghi" | "pizzeria" | "pneumocystis" | "potpourri" | "proboscis" | "rabies" | "reggae" | "regimen" | "rigatoni" | "salmonella" | "sarsaparilla" | "semen" | "ski" | "sonata" | "spatula" | "stats" | "subtilis" | "sushi" | "tachyarrhythmia" | "tachycardia" | "tequila" | "tetris" | "thrips" | "timpani" | "tsunami" | "vaccinia" | "vanilla" ) { return (cnull_stem()); }
1840
+ <noun,any> (( {A} * "phobia" )| "accompli" | "aegis" | "alias" | "anorexia" | "anti" | "artemisia" | "ataxia" | "beatlemania" | "blini" | "cafeteria" | "capita" | "cola" | "coli" | "deli" | "dementia" | "downstairs" | "upstairs" | "dyslexia" | "jakes" | "dystopia" | "encyclopedia" | "estancia" | "euphoria" | "euthanasia" | "fracas" | "fuss" | "gala" | "gorilla" | "GI" | "habeas" | "haemophilia" | "hemophilia" | "hoopla" | "hula" | "impatiens" | "informatics" | "intelligentsia" | "jacuzzi" | "kiwi" | "mafia" | "magnolia" | "malaria" | "maquila" | "marginalia" | "megalomania" | "mercedes" | "militia" | "mufti" | "muni" | "pancreas" | "paranoia" | "pastoris" | "pastrami" | "pepperoni" | "pepsi" | "pi" | "piroghi" | "pizzeria" | "pneumocystis" | "potpourri" | "proboscis" | "rabies" | "reggae" | "regimen" | "rigatoni" | "salmonella" | "sarsaparilla" | "semen" | "ski" | "sonata" | "spatula" | "stats" | "subtilis" | "sushi" | "tachyarrhythmia" | "tachycardia" | "tequila" | "tetris" | "thrips" | "timpani" | "tsunami" | "vaccinia" | "vanilla" ) { return (cnull_stem()); }
1839
1841
/* Plural-form nouns (e.g. "pliers", "tweezers", "tongs") handed to xnull_stem() in the noun/any states.
   NOTE(review): xnull_stem() presumably leaves the word uninflected - confirm against its definition.
   "sunglasses" was previously misspelled "sunglasss", so the real word was not matched by this rule. */
<noun,any> ( "acrobatics" | "athletics" | "basics" | "betters" | "bifocals" | "bowels" | "briefs" | "checkers" | "cognoscenti" | "denims" | "doldrums" | "dramatics" | "dungarees" | "ergonomics" | "genetics" | "gravitas" | "gymnastics" | "hackles" | "haves" | "hubris" | "ides" | "incidentals" | "ironworks" | "jinks" | "leavings" | "leftovers" | "logistics" | "makings" | "microelectronics" | "miniseries" | "mips" | "mores" | "oodles" | "pajamas" | "pampas" | "panties" | "payola" | "pickings" | "plainclothes" | "pliers" | "ravings" | "reparations" | "rudiments" | "scads" | "splits" | "stays" | "subtitles" | "sunglasses" | "sweepstakes" | "tatters" | "toiletries" | "tongs" | "trivia" | "tweezers" | "waterworks" | "woolens" ) { return (xnull_stem()); }
1840
1842
<noun,any> ( "biggi" | "bourgeoisi" | "bri" | "camaraderi" | "chinoiseri" | "coteri" | "doggi" | "geni" | "hippi" | "junki" | "lingeri" | "moxi" | "preppi" | "rooki" | "yuppi" ) "es" { return (stem(1 ," " ," s" )); }
1841
1843
<verb,any> ( "chor" | "sepulchr" | "silhouett" | "telescop" ) {ESEDING} { return (semi_reg_stem(0 ," e" )); }
@@ -2098,6 +2100,9 @@ COMP_SUP = "JJR"|"JJS"|"RBR"|"RBS"
2098
2100
<scan> {A} * "people" / _NNS { return (stem(5 , " erson" , " " )); } /* any word ending in "people" that is followed by an _NNS tag; NOTE(review): stem(5, ...) presumably replaces the last 5 characters to give "...person" - confirm */
2099
2101
<scan> "ppl" / _NNS { return (stem(3 , " person" , " " )); } /* the abbreviation "ppl" followed by an _NNS tag; NOTE(review): stem(3, ...) presumably replaces the whole token with "person" - confirm */
2100
2102
2103
+ <scan> "Olympics" / _NN( P?)( S?) { return (capitalise(xnull_stem())); } /* "Olympics" followed by a _NN, _NNP, _NNS or _NNPS tag; the result of xnull_stem() is passed through capitalise(). NOTE(review): presumably keeps the word unstemmed and capitalised - confirm */
2104
+ <scan> {SINGULAR_DEMONYMS} / _( NN( P?)( S?)| JJ) { return (capitalise(xnull_stem())); } /* any SINGULAR_DEMONYMS word followed by a _NN, _NNP, _NNS, _NNPS or _JJ tag; the result of xnull_stem() is passed through capitalise(). NOTE(review): presumably keeps the demonym unstemmed and capitalised - confirm */
2105
+
2101
2106
<scan> "worse" / _JJR { return (stem(5 , " bad" , " " )); }
2102
2107
<scan> "worst" / _JJS { return (stem(5 , " bad" , " " )); }
2103
2108
<scan> "worse" / _RBR { return (stem(5 , " badly" , " " )); }
0 commit comments