You cannot select more than 25 topics
Topics must start with a letter or number, can include dashes ('-') and can be up to 35 characters long.
8 lines
916 KiB
Plaintext
8 lines
916 KiB
Plaintext
1 month ago
|
/*
|
||
|
* Javascript version of Eric Brill's English lexicon, compressed by Toby Rahilly.
|
||
|
*/
|
||
|
|
||
|
var POSTAGGER_LEXICON = {Ranavan:0,"pro-Soviet":1,"Hydro-Electric":2,"waste-disposal":3,chameleons:4,clotted:1,spiders:4,verses:4,hanging:5,"Hawaiian\\/Japanese":1,hastily:6,comically:6,REIS:2,localized:7,spidery:1,disobeying:8,"marketing-wise":1,"plant-closing":1,Archuleta:2,refunding:9,Western:10,"wrought-iron":1,Gravesend:2,"government-to-government":1,Euro:2,slothful:1,Valle:2,Famed:1,Blade:2,Poetry:11,Mizell:2,"plant-modernization":1,Rizopolous:2,seamier:12,wooded:1,grueling:13,Muniz:2,Amparano:2,Saco:2,Sack:2,virtuosos:4,Raptopoulos:2,Multilateral:2,immunities:4,"all-news":1,Pinkerton:2,gaskets:4,Kibbutzim:4,Shocked:14,deadheads:4,Dixiecrat:2,Honorable:2,Olde:2,"":15,snuggled:16,inanimate:1,errors:4,Initially:6,"self-reliant":1,defenses:4,Hamilton:2,HCFA:2,designing:8,pawed:17,Kosonen:2,Designcraft:2,mailings:4,perforations:4,Sussman:2,affiliates:18,"advanced-ceramics":19,perfunctorily:6,affiliated:14,Footnotes:4,confronts:20,"small-screen":1,Manger:2,Manges:2,Bereuter:2,kids:18,uplifting:13,Downfall:2,deferring:8,Keillor:2,"electric-power":1,orthographies:4,Hafiz:2,"sheep-lined":1,"inflation-induced":1,Harvey:2,stern:3,Vernor:2,inevitable:1,Vernon:2,distortions:4,reasserting:8,sermons:4,"grounds-care":1,populations:4,exuberantly:6,Sindona:2,Hardshell:2,"whole-heartedly":6,Pedone:2,"pay-movie":1,"co-marketing":1,morally:6,Indigo:2,"non-advertising":1,Reichhold:2,Gastronomy:2,"old-guard":1,wiretapping:21,deputy:22,"R.G.":2,"grass-fed":1,Darling:23,Tippecanoe:2,nondiscretionary:1,"well-armed":1,Editorials:4,"electrical-engineering":1,McCamant:2,travel:24,Attention:25,Businessland:2,Nussbaum:2,Bates:2,exposited:17,Feelers:4,assimilated:14,dinosaurs:4,iodocompounds:4,Fogg:2,stipulate:26,sentencing:27,Tenants:28,CFM:2,FINANCIAL:2,CFD:2,CFC:11,subplots:4,"b-Current":29,Shimon:2,CFP:2,Retention:2,sprawling:30,snugly:6,Capistrano:2,Blackstone:31,Sabreliner:2,benefited:32,Robertson:2,"Soviet-trained":1,activating:8,"gay-ess":33,"H.L.":2,WPS:2,"ex-dividend":34,His:35,Hit:36,fit:37,Albrights:28,Schroeder:2,screaming:5,Admirers:4,Bischofberger:2,Kavanagh:2,Walesa:2,Hid:2,Rubins:4,reentered:16,Ciminero:2,Him:38,Galanter:2,effecte:39,Plebian:1,Aloe:2,vouchers:4,"top-quality":1,Civics:28,Pavlovitch:2,effects:18,Specialized:40,McArtor:2,whacking:8,castigating:8,wooden:1,Pergamon:2,Combine:39,uninfluenced:17,Weakening:8,Dairies:41,Eyewear:2,parasites:4,Bullocks:2,Pamorex:2,Crowds:4,ANNOUNCED:16,Pomerania:2,Denizens:4,Susie:11,Sidestepping:8,adapt:42,Chivas:2,Kahler:2,Impressionists:28,MEDIA:2,underfoot:6,Schwarz:2,Corinne:2,Argabright:2,elsewhere:43,stereotypical:1,Bergelt:2,Transformers:28,estimate:44,obliterans:4,Egg:11,silent:1,Nigel:2,nucleoli:4,Woodberry:2,Domestically:6,SIGNED:17,disturbed:45,"dinner-hour":1,Facts:46,Niger:2,breed:44,Varadero:2,Activity:47,Gingerly:6,megabytes:4,Nerves:4,Lurie:2,olds:4,LAND:2,renovated:14,needed:48,master:49,specters:4,"Russo-American":1,Hammerstein:2,Aztar:2,scrapes:4,yield:50,"mid-June":11,mutilated:14,Daddy:2,heftiest:51,positively:6,Guardsmen:28,SPAN:2,anniversaries:4,"ozone-destroying":1,Moonlighting:47,Zeta:2,feeling:21,"movie-themed":1,Escadrille:2,"third-round":1,"value-story":1,neuroselective:1,Chicago:2,"straight-from-the-shoulder":1,"index-options":4,consenting:30,pecs:4,brawny:1,recapitalized:17,Theo:2,Then:6,Them:52,scraped:32,wholesome:1,Ashenberg:2,Grodnik:2,Thee:53,Tschilwyk:2,Myron:2,They:38,"v-senv5":2,shipments:4,diminishing:8,resonates:20,Jessye:2,tensely:6,Hubacher:2,Pandora:2,resonated:16,transverse:3,KEARNEY:2,Encore:2,semicircular:1,Pastern:2,Lanvin:2,"state-directed":1,"Journal-Bulletin":2,willinge:1,Civilized:1,fugitives:4,"conservative-led":1,purged:54,saying:55,ffreind:39,"U-2":2,Euralliance:2,Mignanelli:2,Jacobson:2,padded:7,Butterfinger:2,Cunha:2,Basinger:2,hounded:16,apace:6,Taiyo:2,clicked:32,Rizvi:2,Geste:2,TEACH:39,"L.C.":2,familistical:1,"photo-montage":1,INSEAD:2,Warnke:2,Sibson:2,outfielders:4,Dionne:2,Comenico:2,"Bancorp.":2,affronted:17,Senators:56,Ecology:47,"Baden-Wuerttemburg":2,nicely:6,Andover:2,succumb:39,Dances:57,Dancer:2,pipers:4,Jabe:2,program
|
||
|
|
||
|
var LEXICON_TAG_MAP = [["NNP"],["JJ"],["NNP"],["JJ","NN"],["NNS"],["VBG","JJ","NN"],["RB"],["JJ","VBN"],["VBG"],["VBG","VBG|NN","JJ","NN"],["JJ","NN","NNP"],["NNP","NN"],["JJR"],["JJ","VBG"],["VBN","JJ"],[],["VBD"],["VBN"],["NNS","VBZ"],["NN","NNS"],["VBZ"],["NN","VBG"],["NN","JJ"],["NNP","JJ","NN","UH"],["NN","VBP","VB"],["NN","VB"],["VBP","JJ","VB"],["NN","VBG","JJ"],["NNPS"],["JJ","LS|JJ"],["VBG","JJ"],["NNP","VBP"],["VBD","VBN"],["VBP"],["JJ","NN","RB"],["PRP$","NNP"],["VBN","VBP","NN","VB"],["VB","VBN","VBP","JJ","NN","RB","VBD"],["PRP","NNP"],["VB"],["NNP","JJ"],["NNPS","NNP","NNS"],["VB","VBP"],["RB","NN"],["NN","VB","VBP"],["VBN","VBD","JJ"],["NNP","NNPS","NNS"],["NN","NNP"],["VBN","VBN|JJ","JJ","VBD"],["NN","JJ","VB","JJR"],["VB","VBP","JJ","NN"],["JJS"],["PRP","NNP","DT"],["PRP"],["VBN","VBD"],["VBG","NN"],["NNS","NNP","NNPS"],["NNS","NNPS"],["VB","VBP","VBZ"],["NNP","VB"],["."],["JJ","DT","NN","RB","RB|JJ"],["VB","NN","VBD"],["VB","NN"],["FW"],["NNPS","NNS"],["JJ","NNP"],["RB","UH"],["RBR"],["VBZ","VBN","."],["NN","JJ","VB"],["NNP","JJ","VBN"],["VBZ","NNS"],["NNS","VBZ","NNPS"],["NNP","NNPS"],["NNS","UH"],["WP","NNP"],["NNP","NN","NNPS"],["NN","VBP"],["WP"],["NN","FW"],["VBN","JJ","VBD"],["JJ","VB"],["VB","JJ"],["$"],["VBD","JJ","VBN"],["PRP","NNP","VBP"],["NNP","FW"],["PRP$","NN","NNP"],["DT","NNP"],["VBP","VB","NN"],["NNS","NN"],["NNS","NNPS","NNP"],["NNS","JJ","NN"],["JJ","IN","NN"],["VB","VBP","NN"],["NN","JJ","RB","JJS"],["JJ","RB"],["NNP","VBN","JJ"],["NNP","JJ","NN","VB"],["NNP","MD"],["VBG","JJ","NN","VBG|JJ"],[":"],["JJ","VBD","VBN"],["JJ","NN","VB"],["IN","JJ","RB","RP"],["UH"],["JJ","RB","RBR"],["IN","RB","NNP"],["VBZ","NNP"],["VBD","FW"],["NNPS","NNP"],["VBD","VBN","JJ"],["NNP","NNS"],["VBN","VBD","NNP"],["NNP","NN","VB","VBP"],["NNP","VBG"],["JJ","NNP","NN"],["VBN","VB","VBD"],["CC"],["NNP","VB","VBP","NN"],["JJ","RB","VB"],["NN","JJ","VBG"],["NNS","NNP"],["IN","NNP"],["UH","NNP"],["JJ","RB","UH"],["IN"],["NNP","NN","VB"],["NNP","JJ","NN"],["NNP","NNS","NNPS"],["JJ","NNP","RB","VB"],["VBZ","NNS","NN"],["``"],["NNS","NNPS|NNS","NNPS"],["JJ","NNS","NN"],["JJR","RBR"],["IN","RB|IN","JJ","NN","RB","RP"],["JJS","JJ"],["NN","JJ","VB","VBP"],["VB","VBD","VBN","VBP"],["NNP","JJR"],["NN",","],["RB","NNP","NN"],["NNP","NNPS","NN"],["FW","JJ"],["JJ","IN","NN","RB","VBN","VBP"],["FW","NN"],["JJ","VBN","NNP"],["VBP","VB"],["RB","NNP"],["VBD","VBN","VBP"],["NNS","JJ"],["NN","JJ","VB","NNP","NN|JJ"],["JJR","RB"],["NNP|NP"],["DT","JJ","NN"],["NNP","VBN"],["NNP","VBP","NN"],["VBN|JJ"],["VBN","NN"],["NNS","VBZ","VB","UH"],["JJ","NN","RB","VB","VBP"],["NN","RB"],["NNP","FW","NN"],["RB|VBG"],["DT","NNP","RB"],[")"],["NN","JJ","RB"],["NN","VB","NNP"],["NNS","NN","VBZ"],["NNP","JJ","NNPS","NNS"],["NNP","VBD"],["RB","JJ","NN","VB"],["VBP","NN"],["UH","NN"],["JJ","NNS"],["VBG","JJ","RB"],["NN","JJ","RB","NN|JJ","NN|RB","NN|JJ|RB","RB|NN|JJ"],["NNPS","NNS","NN"],["NNP","JJ","NN","RB"],["NN","VBD","VBN","VBP","VB"],["VB","NN","VBP"],["NNP","UH"],["NNP","RBR","RB","JJR"],["VBN","JJ","NN"],["JJ","JJS"],["VBD","JJ"],["VB","NNP","VBP"],["NN","VB","JJR","VBP"],["MD"],["NN","VBG","VBG|NN"],["NNP","JJS"],["NNP","VBG","JJ","NN"],["RB","NNP","CC","IN","UH"],["JJR","NNP"],["VB","VBN"],["RB","JJ","NNP"],["JJ","NNP","NNS","NNPS"],["VBG","JJ","VBG|JJ"],["JJ","JJR"],["NNP|VBN"],["JJ","NN","NN|JJ"],["RB","NNP","DT"],["NN","JJ","VB","NNP"],["NN","VBP","JJ","VB"],["IN","RB"],["RB","NN","RP","NNP","VBP","JJ"],["NNS","VBZ","NN"],["NNP","JJ","NNPS"],["VBG","NNP","NN"],["NNS","VBZ","CC","RB"],["VBN","VBN|JJ","VBD","JJ"],["NN","JJ","NNP"],["VBD","NN","NNS","VBN"],["NN","JJR"],["VB","NNP"],["VBG","NN","NNP"],["RB","JJ"],["NNS","VBP","VBZ"],["RB","NN","JJS","JJ"],["IN","RB","RP","NNP"],["NNP","NNPS","PRP"],["IN","RP","NNP"],["JJS","RB","RBS"],["NN","NN|VBG","VBG|NN","JJ","VBG"],["NN","NN|JJ","JJ","VB"],["PRP","JJ"],["NNP","VBZ","NN"],["VBG","NNP"],["VBP","NNP"],["VBN","NNP"],["JJ","NN","RB","UH"],["RB","IN|RB","RBR","VBP","IN","JJ","NN","RP","VB"],["VBP","JJ","NN","VB"],["NN","UH"],["JJR","JJ","NN"],["NN","VB","NNS"],["NN","NNP","LS"],["NNP","NN
|