|
{ |
|
"lang":"en", |
|
"name":"data_dev_spacy_lg_1", |
|
"version":"3.7.1", |
|
"description":"English pipeline optimized for CPU. Components: tok2vec, tagger, parser, senter, ner, attribute_ruler, lemmatizer.", |
|
"author":"Explosion", |
|
"email":"contact@explosion.ai", |
|
"url":"https://explosion.ai", |
|
"license":"MIT", |
|
"spacy_version":">=3.7.2,<3.8.0", |
|
"spacy_git_version":"bd2c17e20", |
|
"vectors":{ |
|
"width":300, |
|
"vectors":514157, |
|
"keys":514157, |
|
"name":"en_vectors" |
|
}, |
|
"labels":{ |
|
"tok2vec":[ |
|
|
|
], |
|
"tagger":[ |
|
"$", |
|
"''", |
|
",", |
|
"-LRB-", |
|
"-RRB-", |
|
".", |
|
":", |
|
"ADD", |
|
"AFX", |
|
"CC", |
|
"CD", |
|
"DT", |
|
"EX", |
|
"FW", |
|
"HYPH", |
|
"IN", |
|
"JJ", |
|
"JJR", |
|
"JJS", |
|
"LS", |
|
"MD", |
|
"NFP", |
|
"NN", |
|
"NNP", |
|
"NNPS", |
|
"NNS", |
|
"PDT", |
|
"POS", |
|
"PRP", |
|
"PRP$", |
|
"RB", |
|
"RBR", |
|
"RBS", |
|
"RP", |
|
"SYM", |
|
"TO", |
|
"UH", |
|
"VB", |
|
"VBD", |
|
"VBG", |
|
"VBN", |
|
"VBP", |
|
"VBZ", |
|
"WDT", |
|
"WP", |
|
"WP$", |
|
"WRB", |
|
"XX", |
|
"_SP", |
|
"``" |
|
], |
|
"parser":[ |
|
"ROOT", |
|
"acl", |
|
"acomp", |
|
"advcl", |
|
"advmod", |
|
"agent", |
|
"amod", |
|
"appos", |
|
"attr", |
|
"aux", |
|
"auxpass", |
|
"case", |
|
"cc", |
|
"ccomp", |
|
"compound", |
|
"conj", |
|
"csubj", |
|
"csubjpass", |
|
"dative", |
|
"dep", |
|
"det", |
|
"dobj", |
|
"expl", |
|
"intj", |
|
"mark", |
|
"meta", |
|
"neg", |
|
"nmod", |
|
"npadvmod", |
|
"nsubj", |
|
"nsubjpass", |
|
"nummod", |
|
"oprd", |
|
"parataxis", |
|
"pcomp", |
|
"pobj", |
|
"poss", |
|
"preconj", |
|
"predet", |
|
"prep", |
|
"prt", |
|
"punct", |
|
"quantmod", |
|
"relcl", |
|
"xcomp" |
|
], |
|
"attribute_ruler":[ |
|
|
|
], |
|
"lemmatizer":[ |
|
|
|
], |
|
"ner":[ |
|
"CARDINAL", |
|
"DATE", |
|
"EVENT", |
|
"FAC", |
|
"GPE", |
|
"LANGUAGE", |
|
"LAW", |
|
"LOC", |
|
"MONEY", |
|
"NORP", |
|
"ORDINAL", |
|
"ORG", |
|
"PERCENT", |
|
"PERSON", |
|
"PRODUCT", |
|
"QUANTITY", |
|
"TIME", |
|
"WORK_OF_ART" |
|
] |
|
}, |
|
"pipeline":[ |
|
"tok2vec", |
|
"tagger", |
|
"parser", |
|
"attribute_ruler", |
|
"lemmatizer", |
|
"ner" |
|
], |
|
"components":[ |
|
"tok2vec", |
|
"tagger", |
|
"parser", |
|
"senter", |
|
"attribute_ruler", |
|
"lemmatizer", |
|
"ner" |
|
], |
|
"disabled":[ |
|
"senter" |
|
], |
|
"performance":{ |
|
"token_acc":0.9986194413, |
|
"token_p":0.9956819193, |
|
"token_r":0.9957659295, |
|
"token_f":0.9957239226, |
|
"tag_acc":0.9734810915, |
|
"sents_p":0.9219292867, |
|
"sents_r":0.8927369879, |
|
"sents_f":0.907098331, |
|
"dep_uas":0.9208198801, |
|
"dep_las":0.9027174273, |
|
"dep_las_per_type":{ |
|
"prep":{ |
|
"p":0.8601948321, |
|
"r":0.8677670271, |
|
"f":0.8639643383 |
|
}, |
|
"det":{ |
|
"p":0.9792625789, |
|
"r":0.980021202, |
|
"f":0.9796417436 |
|
}, |
|
"pobj":{ |
|
"p":0.9637052664, |
|
"r":0.9686628706, |
|
"f":0.966177709 |
|
}, |
|
"nsubj":{ |
|
"p":0.9559814937, |
|
"r":0.9505366922, |
|
"f":0.9532513181 |
|
}, |
|
"aux":{ |
|
"p":0.9805627052, |
|
"r":0.9835306686, |
|
"f":0.9820444444 |
|
}, |
|
"advmod":{ |
|
"p":0.8575647625, |
|
"r":0.8550395423, |
|
"f":0.8563002907 |
|
}, |
|
"relcl":{ |
|
"p":0.7582954942, |
|
"r":0.7877358491, |
|
"f":0.7727353622 |
|
}, |
|
"root":{ |
|
"p":0.9225318526, |
|
"r":0.8931987598, |
|
"f":0.9076283684 |
|
}, |
|
"xcomp":{ |
|
"p":0.8885734564, |
|
"r":0.8987796123, |
|
"f":0.8936473947 |
|
}, |
|
"amod":{ |
|
"p":0.9205863192, |
|
"r":0.9155166829, |
|
"f":0.9180445022 |
|
}, |
|
"compound":{ |
|
"p":0.9182062387, |
|
"r":0.9327801292, |
|
"f":0.9254358096 |
|
}, |
|
"poss":{ |
|
"p":0.9745235707, |
|
"r":0.9778582931, |
|
"f":0.976188084 |
|
}, |
|
"ccomp":{ |
|
"p":0.779082774, |
|
"r":0.8511201629, |
|
"f":0.8135098306 |
|
}, |
|
"attr":{ |
|
"p":0.9063777596, |
|
"r":0.9322960471, |
|
"f":0.9191542289 |
|
}, |
|
"case":{ |
|
"p":0.9806835067, |
|
"r":0.990990991, |
|
"f":0.9858103062 |
|
}, |
|
"mark":{ |
|
"p":0.9073055774, |
|
"r":0.9181240064, |
|
"f":0.9126827341 |
|
}, |
|
"intj":{ |
|
"p":0.6783762685, |
|
"r":0.6366300366, |
|
"f":0.656840514 |
|
}, |
|
"advcl":{ |
|
"p":0.6740684022, |
|
"r":0.6650717703, |
|
"f":0.6695398656 |
|
}, |
|
"cc":{ |
|
"p":0.8397405094, |
|
"r":0.836024399, |
|
"f":0.8378783338 |
|
}, |
|
"neg":{ |
|
"p":0.9455272364, |
|
"r":0.9493226292, |
|
"f":0.9474211317 |
|
}, |
|
"conj":{ |
|
"p":0.7754289978, |
|
"r":0.7849949648, |
|
"f":0.7801826598 |
|
}, |
|
"nsubjpass":{ |
|
"p":0.9282744283, |
|
"r":0.9158974359, |
|
"f":0.9220443986 |
|
}, |
|
"auxpass":{ |
|
"p":0.9508709245, |
|
"r":0.9699316629, |
|
"f":0.9603067208 |
|
}, |
|
"dobj":{ |
|
"p":0.9274010192, |
|
"r":0.9426249104, |
|
"f":0.9349509959 |
|
}, |
|
"nummod":{ |
|
"p":0.9397865854, |
|
"r":0.9340909091, |
|
"f":0.9369300912 |
|
}, |
|
"npadvmod":{ |
|
"p":0.7832009081, |
|
"r":0.7353463588, |
|
"f":0.7585196043 |
|
}, |
|
"prt":{ |
|
"p":0.8146622735, |
|
"r":0.8862007168, |
|
"f":0.8489270386 |
|
}, |
|
"pcomp":{ |
|
"p":0.8859957776, |
|
"r":0.8816526611, |
|
"f":0.8838188838 |
|
}, |
|
"expl":{ |
|
"p":0.9808917197, |
|
"r":0.9892933619, |
|
"f":0.9850746269 |
|
}, |
|
"acl":{ |
|
"p":0.7584170112, |
|
"r":0.7004909984, |
|
"f":0.7283040272 |
|
}, |
|
"agent":{ |
|
"p":0.9045996593, |
|
"r":0.9516129032, |
|
"f":0.927510917 |
|
}, |
|
"dative":{ |
|
"p":0.7577319588, |
|
"r":0.6743119266, |
|
"f":0.713592233 |
|
}, |
|
"acomp":{ |
|
"p":0.9089655172, |
|
"r":0.8965986395, |
|
"f":0.902739726 |
|
}, |
|
"dep":{ |
|
"p":0.3837638376, |
|
"r":0.1688311688, |
|
"f":0.2344983089 |
|
}, |
|
"csubj":{ |
|
"p":0.7043010753, |
|
"r":0.775147929, |
|
"f":0.738028169 |
|
}, |
|
"quantmod":{ |
|
"p":0.8682101514, |
|
"r":0.7920389927, |
|
"f":0.8283772302 |
|
}, |
|
"nmod":{ |
|
"p":0.7549407115, |
|
"r":0.5819622182, |
|
"f":0.6572608396 |
|
}, |
|
"appos":{ |
|
"p":0.6977283264, |
|
"r":0.6529284165, |
|
"f":0.6745853877 |
|
}, |
|
"predet":{ |
|
"p":0.8467741935, |
|
"r":0.9012875536, |
|
"f":0.8731808732 |
|
}, |
|
"preconj":{ |
|
"p":0.5462962963, |
|
"r":0.6860465116, |
|
"f":0.6082474227 |
|
}, |
|
"oprd":{ |
|
"p":0.8321678322, |
|
"r":0.7104477612, |
|
"f":0.7665056361 |
|
}, |
|
"parataxis":{ |
|
"p":0.6071428571, |
|
"r":0.4793926247, |
|
"f":0.5357575758 |
|
}, |
|
"meta":{ |
|
"p":0.7428571429, |
|
"r":0.5, |
|
"f":0.5977011494 |
|
}, |
|
"csubjpass":{ |
|
"p":0.3846153846, |
|
"r":0.8333333333, |
|
"f":0.5263157895 |
|
} |
|
}, |
|
"ents_p":0.8516398746, |
|
"ents_r":0.8569711538, |
|
"ents_f":0.8542971968, |
|
"ents_per_type":{ |
|
"DATE":{ |
|
"p":0.8649149923, |
|
"r":0.8882539683, |
|
"f":0.8764291308 |
|
}, |
|
"GPE":{ |
|
"p":0.9244532803, |
|
"r":0.9079497908, |
|
"f":0.9161272164 |
|
}, |
|
"ORDINAL":{ |
|
"p":0.7805555556, |
|
"r":0.8726708075, |
|
"f":0.8240469208 |
|
}, |
|
"ORG":{ |
|
"p":0.8132576735, |
|
"r":0.8358960764, |
|
"f":0.824421493 |
|
}, |
|
"QUANTITY":{ |
|
"p":0.8066666667, |
|
"r":0.6648351648, |
|
"f":0.7289156627 |
|
}, |
|
"PERSON":{ |
|
"p":0.8767166042, |
|
"r":0.9167754569, |
|
"f":0.8962986599 |
|
}, |
|
"NORP":{ |
|
"p":0.9072164948, |
|
"r":0.9152, |
|
"f":0.9111907607 |
|
}, |
|
"FAC":{ |
|
"p":0.4028776978, |
|
"r":0.4307692308, |
|
"f":0.4163568773 |
|
}, |
|
"EVENT":{ |
|
"p":0.5181818182, |
|
"r":0.3275862069, |
|
"f":0.4014084507 |
|
}, |
|
"CARDINAL":{ |
|
"p":0.8147123894, |
|
"r":0.8757431629, |
|
"f":0.8441260745 |
|
}, |
|
"LOC":{ |
|
"p":0.6677852349, |
|
"r":0.6337579618, |
|
"f":0.6503267974 |
|
}, |
|
"TIME":{ |
|
"p":0.7257142857, |
|
"r":0.7426900585, |
|
"f":0.7341040462 |
|
}, |
|
"MONEY":{ |
|
"p":0.9160671463, |
|
"r":0.9020070838, |
|
"f":0.9089827484 |
|
}, |
|
"WORK_OF_ART":{ |
|
"p":0.4647887324, |
|
"r":0.3402061856, |
|
"f":0.3928571429 |
|
}, |
|
"LAW":{ |
|
"p":0.5740740741, |
|
"r":0.484375, |
|
"f":0.5254237288 |
|
}, |
|
"PERCENT":{ |
|
"p":0.9197431782, |
|
"r":0.8774885145, |
|
"f":0.8981191223 |
|
}, |
|
"LANGUAGE":{ |
|
"p":0.76, |
|
"r":0.59375, |
|
"f":0.6666666667 |
|
}, |
|
"PRODUCT":{ |
|
"p":0.5784313725, |
|
"r":0.2796208531, |
|
"f":0.3769968051 |
|
} |
|
}, |
|
"speed":8276.0958055731 |
|
}, |
|
"sources":[ |
|
{ |
|
"name":"OntoNotes 5", |
|
"url":"https://catalog.ldc.upenn.edu/LDC2013T19", |
|
"license":"commercial (licensed by Explosion)", |
|
"author":"Ralph Weischedel, Martha Palmer, Mitchell Marcus, Eduard Hovy, Sameer Pradhan, Lance Ramshaw, Nianwen Xue, Ann Taylor, Jeff Kaufman, Michelle Franchini, Mohammed El-Bachouti, Robert Belvin, Ann Houston" |
|
}, |
|
{ |
|
"name":"ClearNLP Constituent-to-Dependency Conversion", |
|
"url":"https://github.com/clir/clearnlp-guidelines/blob/master/md/components/dependency_conversion.md", |
|
"license":"Citation provided for reference, no code packaged with model", |
|
"author":"Emory University" |
|
}, |
|
{ |
|
"name":"WordNet 3.0", |
|
"url":"https://wordnet.princeton.edu/", |
|
"author":"Princeton University", |
|
"license":"WordNet 3.0 License" |
|
}, |
|
{ |
|
"name":"Explosion Vectors (OSCAR 2109 + Wikipedia + OpenSubtitles + WMT News Crawl)", |
|
"url":"https://github.com/explosion/spacy-vectors-builder", |
|
"license":"CC0", |
|
"author":"Explosion" |
|
} |
|
], |
|
"requirements":[ |
|
|
|
] |
|
} |