Adriane Boyd committed on
Commit
2230db5
1 Parent(s): 182612e

Update spaCy pipeline

Browse files
README.md CHANGED
@@ -14,62 +14,62 @@ model-index:
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
- value: 0.8079331942
18
  - name: NER Recall
19
  type: recall
20
- value: 0.80625
21
  - name: NER F Score
22
  type: f_score
23
- value: 0.8070907195
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
- value: 0.9641646489
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
- value: 0.9641646489
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
- value: 0.9505084746
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
- value: 0.9481840194
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
- value: 0.8130063132
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
- value: 0.7723336499
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
- value: 0.9112107623
73
  ---
74
  ### Details: https://spacy.io/models/da#da_core_news_md
75
 
@@ -78,8 +78,8 @@ Danish pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, l
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `da_core_news_md` |
81
- | **Version** | `3.3.0` |
82
- | **spaCy** | `>=3.3.0.dev0,<3.4.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 500000 keys, 20000 unique vectors (300 dimensions) |
@@ -91,11 +91,11 @@ Danish pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, l
91
 
92
  <details>
93
 
94
- <summary>View label scheme (193 labels for 3 components)</summary>
95
 
96
  | Component | Labels |
97
  | --- | --- |
98
- | **`morphologizer`** | `AdpType=Prep\|POS=ADP`, `Definite=Ind\|Gender=Com\|Number=Sing\|POS=NOUN`, `Mood=Ind\|POS=AUX\|Tense=Pres\|VerbForm=Fin\|Voice=Act`, `POS=PROPN`, `Definite=Ind\|Number=Sing\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Definite=Def\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=SCONJ`, `Definite=Def\|Gender=Com\|Number=Sing\|POS=NOUN`, `Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin\|Voice=Act`, `POS=ADV`, `Number=Plur\|POS=DET\|PronType=Dem`, `Degree=Pos\|Number=Plur\|POS=ADJ`, `Definite=Ind\|Gender=Com\|Number=Plur\|POS=NOUN`, `POS=PUNCT`, `POS=CCONJ`, `Definite=Ind\|Degree=Cmp\|Number=Sing\|POS=ADJ`, `Degree=Cmp\|POS=ADJ`, `POS=PRON\|PartType=Inf`, `Gender=Com\|Number=Sing\|POS=DET\|PronType=Ind`, `Definite=Ind\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Case=Acc\|Gender=Neut\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Definite=Ind\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Definite=Def\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem`, `Degree=Pos\|POS=ADV`, `Definite=Def\|Number=Sing\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=PRON\|PronType=Dem`, `NumType=Card\|POS=NUM`, `Definite=Ind\|Degree=Pos\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Case=Acc\|Gender=Com\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Degree=Pos\|Gender=Com\|Number=Sing\|POS=ADJ`, `Case=Nom\|Gender=Com\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `NumType=Ord\|POS=ADJ`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Mood=Ind\|POS=AUX\|Tense=Past\|VerbForm=Fin\|Voice=Act`, `POS=VERB\|VerbForm=Inf\|Voice=Act`, `Mood=Ind\|POS=VERB\|Tense=Past\|VerbForm=Fin\|Voice=Act`, `POS=NOUN`, `Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin\|Voice=Pass`, `POS=ADP\|PartType=Inf`, `Degree=Pos\|POS=ADJ`, `Definite=Def\|Gender=Com\|Number=Plur\|POS=NOUN`, `Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, 
`Case=Gen\|Definite=Def\|Gender=Com\|Number=Sing\|POS=NOUN`, `POS=AUX\|VerbForm=Inf\|Voice=Act`, `Definite=Ind\|Degree=Pos\|Gender=Com\|Number=Sing\|POS=ADJ`, `Gender=Com\|Number=Sing\|POS=DET\|PronType=Dem`, `Number=Plur\|POS=DET\|PronType=Ind`, `Gender=Com\|Number=Sing\|POS=PRON\|PronType=Ind`, `Case=Acc\|POS=PRON\|Person=3\|PronType=Prs\|Reflex=Yes`, `POS=PART\|PartType=Inf`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Ind`, `Case=Acc\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Neut\|Number=Sing\|POS=NOUN`, `Case=Nom\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Case=Nom\|Gender=Com\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Nom\|Gender=Com\|POS=PRON\|PronType=Ind`, `Gender=Neut\|Number=Sing\|POS=PRON\|PronType=Ind`, `Mood=Imp\|POS=VERB`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Definite=Ind\|Number=Sing\|POS=AUX\|Tense=Past\|VerbForm=Part`, `POS=X`, `Case=Nom\|Gender=Com\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Com\|Number=Plur\|POS=NOUN`, `POS=VERB\|Tense=Pres\|VerbForm=Part`, `Number=Plur\|POS=PRON\|PronType=Int,Rel`, `POS=VERB\|VerbForm=Inf\|Voice=Pass`, `Case=Gen\|Definite=Ind\|Gender=Com\|Number=Sing\|POS=NOUN`, `Degree=Cmp\|POS=ADV`, `POS=ADV\|PartType=Inf`, `Degree=Sup\|POS=ADV`, `Number=Plur\|POS=PRON\|PronType=Dem`, `Number=Plur\|POS=PRON\|PronType=Ind`, `Definite=Def\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Case=Acc\|Gender=Com\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Gen\|POS=PROPN`, `POS=ADP`, `Degree=Cmp\|Number=Plur\|POS=ADJ`, `Definite=Def\|Degree=Sup\|POS=ADJ`, `Gender=Neut\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Degree=Pos\|Number=Sing\|POS=ADJ`, `Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Gender=Com\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs\|Style=Form`, 
`Number=Plur\|POS=PRON\|PronType=Rcp`, `Case=Gen\|Degree=Cmp\|POS=ADJ`, `Case=Gen\|Definite=Def\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Number[psor]=Plur\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=INTJ`, `Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Degree=Pos\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Gender=Neut\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs\|Style=Form`, `Case=Acc\|Gender=Com\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Number=Sing\|POS=PRON\|PronType=Int,Rel`, `Number=Plur\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs\|Style=Form`, `Gender=Neut\|Number=Sing\|POS=PRON\|PronType=Int,Rel`, `Definite=Def\|Degree=Sup\|Number=Plur\|POS=ADJ`, `Case=Nom\|Gender=Com\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `Gender=Neut\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Definite=Ind\|Number=Sing\|POS=NOUN`, `Number=Plur\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Number=Plur\|Number[psor]=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `POS=SYM`, `Case=Nom\|Gender=Com\|POS=PRON\|Person=2\|Polite=Form\|PronType=Prs`, `Degree=Sup\|POS=ADJ`, `Number=Plur\|POS=DET\|PronType=Ind\|Style=Arch`, `Case=Gen\|Gender=Com\|Number=Sing\|POS=DET\|PronType=Dem`, `Foreign=Yes\|POS=X`, `POS=DET\|Person=2\|Polite=Form\|Poss=Yes\|PronType=Prs`, `Gender=Neut\|Number=Sing\|POS=PRON\|PronType=Dem`, `Case=Acc\|Gender=Com\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Gender=Neut\|Number=Sing\|POS=NOUN`, `Case=Gen\|POS=PRON\|PronType=Int,Rel`, `Gender=Com\|Number=Sing\|POS=PRON\|PronType=Dem`, `Abbr=Yes\|POS=X`, `Case=Gen\|Definite=Ind\|Gender=Com\|Number=Plur\|POS=NOUN`, `Definite=Def\|Degree=Abs\|POS=ADJ`, `Definite=Ind\|Degree=Sup\|Number=Sing\|POS=ADJ`, 
`Definite=Ind\|POS=NOUN`, `Gender=Com\|Number=Plur\|POS=NOUN`, `Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Gender=Com\|POS=PRON\|PronType=Int,Rel`, `Case=Nom\|Gender=Com\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Degree=Abs\|POS=ADV`, `POS=VERB\|VerbForm=Ger`, `POS=VERB\|Tense=Past\|VerbForm=Part`, `Definite=Def\|Degree=Sup\|Number=Sing\|POS=ADJ`, `Number=Plur\|Number[psor]=Plur\|POS=PRON\|Person=1\|Poss=Yes\|PronType=Prs\|Style=Form`, `Case=Gen\|Definite=Def\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Case=Gen\|Degree=Pos\|Number=Plur\|POS=ADJ`, `Case=Acc\|Gender=Com\|POS=PRON\|Person=2\|Polite=Form\|PronType=Prs`, `Gender=Com\|Number=Sing\|POS=PRON\|PronType=Int,Rel`, `POS=VERB\|Tense=Pres`, `Case=Gen\|Number=Plur\|POS=DET\|PronType=Ind`, `Number[psor]=Plur\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `POS=PRON\|Person=2\|Polite=Form\|Poss=Yes\|PronType=Prs`, `Gender=Neut\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `POS=AUX\|Tense=Pres\|VerbForm=Part`, `Mood=Ind\|POS=VERB\|Tense=Past\|VerbForm=Fin\|Voice=Pass`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Degree=Sup\|Number=Plur\|POS=ADJ`, `Case=Acc\|Gender=Com\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Gender=Neut\|Number=Sing\|Number[psor]=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Definite=Ind\|Number=Plur\|POS=NOUN`, `Case=Gen\|Number=Plur\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Mood=Imp\|POS=AUX`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=PRON\|Person=1\|Poss=Yes\|PronType=Prs`, `Number[psor]=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender=Com\|Number=Sing\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Case=Gen\|Gender=Com\|Number=Sing\|POS=DET\|PronType=Ind`, `Case=Gen\|POS=NOUN`, `Number[psor]=Plur\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=DET\|PronType=Dem`, 
`Definite=Def\|Number=Plur\|POS=NOUN` |
99
  | **`parser`** | `ROOT`, `acl:relcl`, `advcl`, `advmod`, `advmod:lmod`, `amod`, `appos`, `aux`, `case`, `cc`, `ccomp`, `compound:prt`, `conj`, `cop`, `dep`, `det`, `expl`, `fixed`, `flat`, `iobj`, `list`, `mark`, `nmod`, `nmod:poss`, `nsubj`, `nummod`, `obj`, `obl`, `obl:lmod`, `obl:tmod`, `punct`, `xcomp` |
100
  | **`ner`** | `LOC`, `MISC`, `ORG`, `PER` |
101
 
@@ -109,18 +109,18 @@ Danish pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, l
109
  | `TOKEN_P` | 99.78 |
110
  | `TOKEN_R` | 99.75 |
111
  | `TOKEN_F` | 99.76 |
112
- | `POS_ACC` | 96.42 |
113
- | `MORPH_ACC` | 95.05 |
114
- | `MORPH_MICRO_P` | 96.69 |
115
- | `MORPH_MICRO_R` | 96.16 |
116
- | `MORPH_MICRO_F` | 96.42 |
117
- | `SENTS_P` | 92.20 |
118
  | `SENTS_R` | 90.07 |
119
- | `SENTS_F` | 91.12 |
120
- | `DEP_UAS` | 81.30 |
121
- | `DEP_LAS` | 77.23 |
122
- | `LEMMA_ACC` | 94.82 |
123
- | `TAG_ACC` | 96.42 |
124
- | `ENTS_P` | 80.79 |
125
- | `ENTS_R` | 80.62 |
126
- | `ENTS_F` | 80.71 |
 
14
  metrics:
15
  - name: NER Precision
16
  type: precision
17
+ value: 0.8063829787
18
  - name: NER Recall
19
  type: recall
20
+ value: 0.7895833333
21
  - name: NER F Score
22
  type: f_score
23
+ value: 0.7978947368
24
  - task:
25
  name: TAG
26
  type: token-classification
27
  metrics:
28
  - name: TAG (XPOS) Accuracy
29
  type: accuracy
30
+ value: 0.9618401937
31
  - task:
32
  name: POS
33
  type: token-classification
34
  metrics:
35
  - name: POS (UPOS) Accuracy
36
  type: accuracy
37
+ value: 0.9618401937
38
  - task:
39
  name: MORPH
40
  type: token-classification
41
  metrics:
42
  - name: Morph (UFeats) Accuracy
43
  type: accuracy
44
+ value: 0.948377724
45
  - task:
46
  name: LEMMA
47
  type: token-classification
48
  metrics:
49
  - name: Lemma Accuracy
50
  type: accuracy
51
+ value: 0.9497336562
52
  - task:
53
  name: UNLABELED_DEPENDENCIES
54
  type: token-classification
55
  metrics:
56
  - name: Unlabeled Attachment Score (UAS)
57
  type: f_score
58
+ value: 0.8215642458
59
  - task:
60
  name: LABELED_DEPENDENCIES
61
  type: token-classification
62
  metrics:
63
  - name: Labeled Attachment Score (LAS)
64
  type: f_score
65
+ value: 0.7802234637
66
  - task:
67
  name: SENTS
68
  type: token-classification
69
  metrics:
70
  - name: Sentences F-Score
71
  type: f_score
72
+ value: 0.9103942652
73
  ---
74
  ### Details: https://spacy.io/models/da#da_core_news_md
75
 
 
78
  | Feature | Description |
79
  | --- | --- |
80
  | **Name** | `da_core_news_md` |
81
+ | **Version** | `3.4.0` |
82
+ | **spaCy** | `>=3.4.0,<3.5.0` |
83
  | **Default Pipeline** | `tok2vec`, `morphologizer`, `parser`, `lemmatizer`, `attribute_ruler`, `ner` |
84
  | **Components** | `tok2vec`, `morphologizer`, `parser`, `lemmatizer`, `senter`, `attribute_ruler`, `ner` |
85
  | **Vectors** | 500000 keys, 20000 unique vectors (300 dimensions) |
 
91
 
92
  <details>
93
 
94
+ <summary>View label scheme (194 labels for 3 components)</summary>
95
 
96
  | Component | Labels |
97
  | --- | --- |
98
+ | **`morphologizer`** | `AdpType=Prep\|POS=ADP`, `Definite=Ind\|Gender=Com\|Number=Sing\|POS=NOUN`, `Mood=Ind\|POS=AUX\|Tense=Pres\|VerbForm=Fin\|Voice=Act`, `POS=PROPN`, `Definite=Ind\|Number=Sing\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Definite=Def\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=SCONJ`, `Definite=Def\|Gender=Com\|Number=Sing\|POS=NOUN`, `Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin\|Voice=Act`, `POS=ADV`, `Number=Plur\|POS=DET\|PronType=Dem`, `Degree=Pos\|Number=Plur\|POS=ADJ`, `Definite=Ind\|Gender=Com\|Number=Plur\|POS=NOUN`, `POS=PUNCT`, `POS=CCONJ`, `Definite=Ind\|Degree=Cmp\|Number=Sing\|POS=ADJ`, `Degree=Cmp\|POS=ADJ`, `POS=PRON\|PartType=Inf`, `Gender=Com\|Number=Sing\|POS=DET\|PronType=Ind`, `Definite=Ind\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Case=Acc\|Gender=Neut\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Definite=Ind\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Definite=Def\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Dem`, `Degree=Pos\|POS=ADV`, `Definite=Def\|Number=Sing\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Definite=Ind\|Gender=Neut\|Number=Sing\|POS=NOUN`, `POS=PRON\|PronType=Dem`, `NumType=Card\|POS=NUM`, `Definite=Ind\|Degree=Pos\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Case=Acc\|Gender=Com\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `Degree=Pos\|Gender=Com\|Number=Sing\|POS=ADJ`, `Case=Nom\|Gender=Com\|Number=Sing\|POS=PRON\|Person=3\|PronType=Prs`, `NumType=Ord\|POS=ADJ`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Mood=Ind\|POS=AUX\|Tense=Past\|VerbForm=Fin\|Voice=Act`, `POS=VERB\|VerbForm=Inf\|Voice=Act`, `Mood=Ind\|POS=VERB\|Tense=Past\|VerbForm=Fin\|Voice=Act`, `POS=NOUN`, `Mood=Ind\|POS=VERB\|Tense=Pres\|VerbForm=Fin\|Voice=Pass`, `POS=ADP\|PartType=Inf`, `Degree=Pos\|POS=ADJ`, `Definite=Def\|Gender=Com\|Number=Plur\|POS=NOUN`, `Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, 
`Case=Gen\|Definite=Def\|Gender=Com\|Number=Sing\|POS=NOUN`, `POS=AUX\|VerbForm=Inf\|Voice=Act`, `Definite=Ind\|Degree=Pos\|Gender=Com\|Number=Sing\|POS=ADJ`, `Gender=Com\|Number=Sing\|POS=DET\|PronType=Dem`, `Number=Plur\|POS=DET\|PronType=Ind`, `Gender=Com\|Number=Sing\|POS=PRON\|PronType=Ind`, `Case=Acc\|POS=PRON\|Person=3\|PronType=Prs\|Reflex=Yes`, `POS=PART\|PartType=Inf`, `Gender=Neut\|Number=Sing\|POS=DET\|PronType=Ind`, `Case=Acc\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Neut\|Number=Sing\|POS=NOUN`, `Case=Nom\|Number=Plur\|POS=PRON\|Person=3\|PronType=Prs`, `Case=Nom\|Gender=Com\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Nom\|Gender=Com\|POS=PRON\|PronType=Ind`, `Gender=Neut\|Number=Sing\|POS=PRON\|PronType=Ind`, `Mood=Imp\|POS=VERB`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Definite=Ind\|Number=Sing\|POS=AUX\|Tense=Past\|VerbForm=Part`, `POS=X`, `Case=Nom\|Gender=Com\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Gen\|Definite=Def\|Gender=Com\|Number=Plur\|POS=NOUN`, `POS=VERB\|Tense=Pres\|VerbForm=Part`, `Number=Plur\|POS=PRON\|PronType=Int,Rel`, `POS=VERB\|VerbForm=Inf\|Voice=Pass`, `Case=Gen\|Definite=Ind\|Gender=Com\|Number=Sing\|POS=NOUN`, `Degree=Cmp\|POS=ADV`, `POS=ADV\|PartType=Inf`, `Degree=Sup\|POS=ADV`, `Number=Plur\|POS=PRON\|PronType=Dem`, `Number=Plur\|POS=PRON\|PronType=Ind`, `Definite=Def\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Case=Acc\|Gender=Com\|Number=Sing\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Gen\|POS=PROPN`, `POS=ADP`, `Degree=Cmp\|Number=Plur\|POS=ADJ`, `Definite=Def\|Degree=Sup\|POS=ADJ`, `Gender=Neut\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Degree=Pos\|Number=Sing\|POS=ADJ`, `Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Gender=Com\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs\|Style=Form`, 
`Number=Plur\|POS=PRON\|PronType=Rcp`, `Case=Gen\|Degree=Cmp\|POS=ADJ`, `POS=SPACE`, `Case=Gen\|Definite=Def\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Number[psor]=Plur\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=INTJ`, `Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Degree=Pos\|Gender=Neut\|Number=Sing\|POS=ADJ`, `Gender=Neut\|Number=Sing\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs\|Style=Form`, `Case=Acc\|Gender=Com\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Gender=Neut\|Number=Plur\|POS=NOUN`, `Number=Sing\|POS=PRON\|PronType=Int,Rel`, `Number=Plur\|Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs\|Style=Form`, `Gender=Neut\|Number=Sing\|POS=PRON\|PronType=Int,Rel`, `Definite=Def\|Degree=Sup\|Number=Plur\|POS=ADJ`, `Case=Nom\|Gender=Com\|Number=Sing\|POS=PRON\|Person=2\|PronType=Prs`, `Gender=Neut\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Definite=Ind\|Number=Sing\|POS=NOUN`, `Number=Plur\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Number=Plur\|Number[psor]=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `POS=SYM`, `Case=Nom\|Gender=Com\|POS=PRON\|Person=2\|Polite=Form\|PronType=Prs`, `Degree=Sup\|POS=ADJ`, `Number=Plur\|POS=DET\|PronType=Ind\|Style=Arch`, `Case=Gen\|Gender=Com\|Number=Sing\|POS=DET\|PronType=Dem`, `Foreign=Yes\|POS=X`, `POS=DET\|Person=2\|Polite=Form\|Poss=Yes\|PronType=Prs`, `Gender=Neut\|Number=Sing\|POS=PRON\|PronType=Dem`, `Case=Acc\|Gender=Com\|Number=Plur\|POS=PRON\|Person=1\|PronType=Prs`, `Case=Gen\|Definite=Ind\|Gender=Neut\|Number=Sing\|POS=NOUN`, `Case=Gen\|POS=PRON\|PronType=Int,Rel`, `Gender=Com\|Number=Sing\|POS=PRON\|PronType=Dem`, `Abbr=Yes\|POS=X`, `Case=Gen\|Definite=Ind\|Gender=Com\|Number=Plur\|POS=NOUN`, `Definite=Def\|Degree=Abs\|POS=ADJ`, 
`Definite=Ind\|Degree=Sup\|Number=Sing\|POS=ADJ`, `Definite=Ind\|POS=NOUN`, `Gender=Com\|Number=Plur\|POS=NOUN`, `Number[psor]=Plur\|POS=DET\|Person=1\|Poss=Yes\|PronType=Prs`, `Gender=Com\|POS=PRON\|PronType=Int,Rel`, `Case=Nom\|Gender=Com\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Degree=Abs\|POS=ADV`, `POS=VERB\|VerbForm=Ger`, `POS=VERB\|Tense=Past\|VerbForm=Part`, `Definite=Def\|Degree=Sup\|Number=Sing\|POS=ADJ`, `Number=Plur\|Number[psor]=Plur\|POS=PRON\|Person=1\|Poss=Yes\|PronType=Prs\|Style=Form`, `Case=Gen\|Definite=Def\|Degree=Pos\|Number=Sing\|POS=ADJ`, `Case=Gen\|Degree=Pos\|Number=Plur\|POS=ADJ`, `Case=Acc\|Gender=Com\|POS=PRON\|Person=2\|Polite=Form\|PronType=Prs`, `Gender=Com\|Number=Sing\|POS=PRON\|PronType=Int,Rel`, `POS=VERB\|Tense=Pres`, `Case=Gen\|Number=Plur\|POS=DET\|PronType=Ind`, `Number[psor]=Plur\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `POS=PRON\|Person=2\|Polite=Form\|Poss=Yes\|PronType=Prs`, `Gender=Neut\|Number=Sing\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `POS=AUX\|Tense=Pres\|VerbForm=Part`, `Mood=Ind\|POS=VERB\|Tense=Past\|VerbForm=Fin\|Voice=Pass`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Degree=Sup\|Number=Plur\|POS=ADJ`, `Case=Acc\|Gender=Com\|Number=Plur\|POS=PRON\|Person=2\|PronType=Prs`, `Gender=Neut\|Number=Sing\|Number[psor]=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs\|Reflex=Yes`, `Definite=Ind\|Number=Plur\|POS=NOUN`, `Case=Gen\|Number=Plur\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Mood=Imp\|POS=AUX`, `Gender=Com\|Number=Sing\|Number[psor]=Sing\|POS=PRON\|Person=1\|Poss=Yes\|PronType=Prs`, `Number[psor]=Sing\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs`, `Definite=Def\|Gender=Com\|Number=Sing\|POS=VERB\|Tense=Past\|VerbForm=Part`, `Number=Plur\|Number[psor]=Sing\|POS=DET\|Person=2\|Poss=Yes\|PronType=Prs`, `Case=Gen\|Gender=Com\|Number=Sing\|POS=DET\|PronType=Ind`, `Case=Gen\|POS=NOUN`, 
`Number[psor]=Plur\|POS=PRON\|Person=3\|Poss=Yes\|PronType=Prs`, `POS=DET\|PronType=Dem`, `Definite=Def\|Number=Plur\|POS=NOUN` |
99
  | **`parser`** | `ROOT`, `acl:relcl`, `advcl`, `advmod`, `advmod:lmod`, `amod`, `appos`, `aux`, `case`, `cc`, `ccomp`, `compound:prt`, `conj`, `cop`, `dep`, `det`, `expl`, `fixed`, `flat`, `iobj`, `list`, `mark`, `nmod`, `nmod:poss`, `nsubj`, `nummod`, `obj`, `obl`, `obl:lmod`, `obl:tmod`, `punct`, `xcomp` |
100
  | **`ner`** | `LOC`, `MISC`, `ORG`, `PER` |
101
 
 
109
  | `TOKEN_P` | 99.78 |
110
  | `TOKEN_R` | 99.75 |
111
  | `TOKEN_F` | 99.76 |
112
+ | `POS_ACC` | 96.18 |
113
+ | `MORPH_ACC` | 94.84 |
114
+ | `MORPH_MICRO_P` | 96.75 |
115
+ | `MORPH_MICRO_R` | 96.22 |
116
+ | `MORPH_MICRO_F` | 96.49 |
117
+ | `SENTS_P` | 92.03 |
118
  | `SENTS_R` | 90.07 |
119
+ | `SENTS_F` | 91.04 |
120
+ | `DEP_UAS` | 82.16 |
121
+ | `DEP_LAS` | 78.02 |
122
+ | `LEMMA_ACC` | 94.97 |
123
+ | `TAG_ACC` | 96.18 |
124
+ | `ENTS_P` | 80.64 |
125
+ | `ENTS_R` | 78.96 |
126
+ | `ENTS_F` | 79.79 |
accuracy.json CHANGED
@@ -3,51 +3,51 @@
3
  "token_p": 0.9977732598,
4
  "token_r": 0.9974835463,
5
  "token_f": 0.997628382,
6
- "pos_acc": 0.9641646489,
7
- "morph_acc": 0.9505084746,
8
- "morph_micro_p": 0.9668578389,
9
- "morph_micro_r": 0.9615869971,
10
- "morph_micro_f": 0.9642152149,
11
  "morph_per_feat": {
12
  "Mood": {
13
- "p": 0.9723809524,
14
- "r": 0.9733079123,
15
- "f": 0.9728442115
16
  },
17
  "Tense": {
18
- "p": 0.9669172932,
19
- "r": 0.968373494,
20
- "f": 0.9676448457
21
  },
22
  "VerbForm": {
23
- "p": 0.9583588487,
24
- "r": 0.9577723378,
25
- "f": 0.9580655035
26
  },
27
  "Voice": {
28
- "p": 0.9739195231,
29
- "r": 0.9768310912,
30
- "f": 0.9753731343
31
  },
32
  "Definite": {
33
- "p": 0.964940239,
34
- "r": 0.9569340182,
35
- "f": 0.9609204523
36
  },
37
  "Gender": {
38
- "p": 0.9487608841,
39
- "r": 0.9415088069,
40
- "f": 0.9451209341
41
  },
42
  "Number": {
43
- "p": 0.9608615708,
44
- "r": 0.95409494,
45
- "f": 0.9574663002
46
  },
47
  "AdpType": {
48
- "p": 1.0,
49
  "r": 0.9920424403,
50
- "f": 0.9960053262
51
  },
52
  "PartType": {
53
  "p": 1.0,
@@ -55,29 +55,29 @@
55
  "f": 1.0
56
  },
57
  "Case": {
58
- "p": 0.9775641026,
59
- "r": 0.9636650869,
60
- "f": 0.9705648369
61
  },
62
  "Person": {
63
- "p": 0.9788359788,
64
- "r": 0.9857904085,
65
- "f": 0.982300885
66
  },
67
  "PronType": {
68
- "p": 0.9851607585,
69
- "r": 0.9827302632,
70
- "f": 0.9839440099
71
  },
72
  "NumType": {
73
- "p": 0.9863013699,
74
  "r": 0.9536423841,
75
- "f": 0.9696969697
76
  },
77
  "Degree": {
78
- "p": 0.9548229548,
79
- "r": 0.9421686747,
80
- "f": 0.9484536082
81
  },
82
  "Reflex": {
83
  "p": 1.0,
@@ -85,19 +85,19 @@
85
  "f": 1.0
86
  },
87
  "Number[psor]": {
88
- "p": 0.988372093,
89
- "r": 0.988372093,
90
- "f": 0.988372093
91
  },
92
  "Poss": {
93
- "p": 0.9886363636,
94
- "r": 0.9886363636,
95
- "f": 0.9886363636
96
  },
97
  "Foreign": {
98
- "p": 0.6666666667,
99
  "r": 0.4,
100
- "f": 0.5
101
  },
102
  "Abbr": {
103
  "p": 0.0,
@@ -110,151 +110,146 @@
110
  "f": 1.0
111
  },
112
  "Polite": {
113
- "p": 1.0,
114
  "r": 0.75,
115
- "f": 0.8571428571
116
  }
117
  },
118
- "sents_p": 0.9219600726,
119
  "sents_r": 0.9007092199,
120
- "sents_f": 0.9112107623,
121
- "dep_uas": 0.8130063132,
122
- "dep_las": 0.7723336499,
123
  "dep_las_per_type": {
124
  "advmod": {
125
- "p": 0.6868965517,
126
- "r": 0.7033898305,
127
- "f": 0.6950453594
128
  },
129
  "root": {
130
- "p": 0.8381818182,
131
- "r": 0.8173758865,
132
- "f": 0.8276481149
133
  },
134
  "nsubj": {
135
- "p": 0.8317460317,
136
- "r": 0.8291139241,
137
- "f": 0.8304278922
138
  },
139
  "case": {
140
- "p": 0.883218842,
141
- "r": 0.8875739645,
142
- "f": 0.8853910477
143
  },
144
  "obl": {
145
- "p": 0.6935483871,
146
- "r": 0.6677018634,
147
- "f": 0.6803797468
148
  },
149
  "cc": {
150
- "p": 0.7797101449,
151
- "r": 0.7819767442,
152
- "f": 0.7808417997
153
  },
154
  "conj": {
155
- "p": 0.6305555556,
156
- "r": 0.6053333333,
157
- "f": 0.6176870748
158
  },
159
  "obj": {
160
- "p": 0.7667269439,
161
- "r": 0.8233009709,
162
- "f": 0.7940074906
163
  },
164
  "aux": {
165
- "p": 0.8797653959,
166
- "r": 0.8746355685,
167
- "f": 0.8771929825
168
  },
169
  "acl:relcl": {
170
- "p": 0.6011235955,
171
- "r": 0.5783783784,
172
- "f": 0.5895316804
173
  },
174
  "advmod:lmod": {
175
- "p": 0.6388888889,
176
- "r": 0.6865671642,
177
- "f": 0.6618705036
178
  },
179
  "det": {
180
- "p": 0.9143327842,
181
- "r": 0.9143327842,
182
- "f": 0.9143327842
183
  },
184
  "amod": {
185
- "p": 0.7954173486,
186
- "r": 0.8293515358,
187
- "f": 0.8120300752
188
  },
189
  "nmod:poss": {
190
- "p": 0.6593406593,
191
- "r": 0.5940594059,
192
- "f": 0.625
193
  },
194
  "ccomp": {
195
- "p": 0.5890410959,
196
- "r": 0.6935483871,
197
- "f": 0.637037037
198
  },
199
  "nummod": {
200
- "p": 0.8512396694,
201
- "r": 0.8583333333,
202
- "f": 0.8547717842
203
  },
204
  "flat": {
205
- "p": 0.7514450867,
206
- "r": 0.8609271523,
207
- "f": 0.8024691358
208
  },
209
  "compound:prt": {
210
- "p": 0.4285714286,
211
- "r": 0.2195121951,
212
- "f": 0.2903225806
213
  },
214
  "advcl": {
215
- "p": 0.5909090909,
216
- "r": 0.5603448276,
217
- "f": 0.5752212389
218
  },
219
  "mark": {
220
- "p": 0.8742138365,
221
- "r": 0.8562628337,
222
- "f": 0.8651452282
223
  },
224
  "cop": {
225
- "p": 0.7891891892,
226
- "r": 0.8342857143,
227
- "f": 0.8111111111
228
  },
229
  "dep": {
230
- "p": 0.1538461538,
231
- "r": 0.2641509434,
232
- "f": 0.1944444444
233
  },
234
  "nmod": {
235
- "p": 0.6551724138,
236
- "r": 0.630859375,
237
- "f": 0.6427860697
238
  },
239
  "iobj": {
240
- "p": 0.7272727273,
241
- "r": 0.3636363636,
242
- "f": 0.4848484848
243
  },
244
  "xcomp": {
245
- "p": 0.5833333333,
246
- "r": 0.3559322034,
247
- "f": 0.4421052632
248
- },
249
- "appos": {
250
- "p": 0.4375,
251
- "r": 0.4242424242,
252
- "f": 0.4307692308
253
  },
254
  "list": {
255
- "p": 0.375,
256
- "r": 0.1666666667,
257
- "f": 0.2307692308
258
  },
259
  "vocative": {
260
  "p": 0.0,
@@ -262,57 +257,62 @@
262
  "f": 0.0
263
  },
264
  "fixed": {
265
- "p": 0.8918918919,
266
  "r": 0.8048780488,
267
- "f": 0.8461538462
268
  },
269
  "expl": {
270
- "p": 0.8181818182,
271
- "r": 0.7941176471,
272
- "f": 0.8059701493
 
 
 
 
 
273
  },
274
  "obl:tmod": {
275
- "p": 0.7777777778,
276
- "r": 0.3888888889,
277
- "f": 0.5185185185
278
  },
279
- "obl:lmod": {
280
  "p": 0.0,
281
  "r": 0.0,
282
  "f": 0.0
283
  },
284
- "discourse": {
285
  "p": 0.0,
286
  "r": 0.0,
287
  "f": 0.0
288
  }
289
  },
290
- "lemma_acc": 0.9481840194,
291
- "tag_acc": 0.9641646489,
292
- "ents_p": 0.8079331942,
293
- "ents_r": 0.80625,
294
- "ents_f": 0.8070907195,
295
  "ents_per_type": {
296
  "PER": {
297
- "p": 0.88125,
298
  "r": 0.8493975904,
299
- "f": 0.8650306748
300
  },
301
  "ORG": {
302
- "p": 0.7294117647,
303
- "r": 0.6888888889,
304
- "f": 0.7085714286
305
  },
306
  "MISC": {
307
- "p": 0.6991869919,
308
- "r": 0.7610619469,
309
- "f": 0.7288135593
310
  },
311
  "LOC": {
312
- "p": 0.8828828829,
313
- "r": 0.8828828829,
314
- "f": 0.8828828829
315
  }
316
  },
317
- "speed": 11453.5916881723
318
  }
 
3
  "token_p": 0.9977732598,
4
  "token_r": 0.9974835463,
5
  "token_f": 0.997628382,
6
+ "pos_acc": 0.9618401937,
7
+ "morph_acc": 0.948377724,
8
+ "morph_micro_p": 0.9675176369,
9
+ "morph_micro_r": 0.9622431982,
10
+ "morph_micro_f": 0.9648732095,
11
  "morph_per_feat": {
12
  "Mood": {
13
+ "p": 0.9799235182,
14
+ "r": 0.9771210677,
15
+ "f": 0.9785202864
16
  },
17
  "Tense": {
18
+ "p": 0.9743396226,
19
+ "r": 0.9721385542,
20
+ "f": 0.973237844
21
  },
22
  "VerbForm": {
23
+ "p": 0.9643953346,
24
+ "r": 0.9614443084,
25
+ "f": 0.9629175605
26
  },
27
  "Voice": {
28
+ "p": 0.976083707,
29
+ "r": 0.976083707,
30
+ "f": 0.976083707
31
  },
32
  "Definite": {
33
+ "p": 0.9622716442,
34
+ "r": 0.9573291189,
35
+ "f": 0.9597940186
36
  },
37
  "Gender": {
38
+ "p": 0.9466310874,
39
+ "r": 0.9431704885,
40
+ "f": 0.9448976194
41
  },
42
  "Number": {
43
+ "p": 0.9613361389,
44
+ "r": 0.9533124674,
45
+ "f": 0.9573074908
46
  },
47
  "AdpType": {
48
+ "p": 0.9982206406,
49
  "r": 0.9920424403,
50
+ "f": 0.9951219512
51
  },
52
  "PartType": {
53
  "p": 1.0,
 
55
  "f": 1.0
56
  },
57
  "Case": {
58
+ "p": 0.9741935484,
59
+ "r": 0.9541864139,
60
+ "f": 0.9640861931
61
  },
62
  "Person": {
63
+ "p": 0.9788732394,
64
+ "r": 0.9875666075,
65
+ "f": 0.9832007073
66
  },
67
  "PronType": {
68
+ "p": 0.9860197368,
69
+ "r": 0.9860197368,
70
+ "f": 0.9860197368
71
  },
72
  "NumType": {
73
+ "p": 0.9931034483,
74
  "r": 0.9536423841,
75
+ "f": 0.972972973
76
  },
77
  "Degree": {
78
+ "p": 0.9545454545,
79
+ "r": 0.9361445783,
80
+ "f": 0.9452554745
81
  },
82
  "Reflex": {
83
  "p": 1.0,
 
85
  "f": 1.0
86
  },
87
  "Number[psor]": {
88
+ "p": 0.9772727273,
89
+ "r": 1.0,
90
+ "f": 0.9885057471
91
  },
92
  "Poss": {
93
+ "p": 0.9887640449,
94
+ "r": 1.0,
95
+ "f": 0.9943502825
96
  },
97
  "Foreign": {
98
+ "p": 0.5,
99
  "r": 0.4,
100
+ "f": 0.4444444444
101
  },
102
  "Abbr": {
103
  "p": 0.0,
 
110
  "f": 1.0
111
  },
112
  "Polite": {
113
+ "p": 0.75,
114
  "r": 0.75,
115
+ "f": 0.75
116
  }
117
  },
118
+ "sents_p": 0.9202898551,
119
  "sents_r": 0.9007092199,
120
+ "sents_f": 0.9103942652,
121
+ "dep_uas": 0.8215642458,
122
+ "dep_las": 0.7802234637,
123
  "dep_las_per_type": {
124
  "advmod": {
125
+ "p": 0.7128851541,
126
+ "r": 0.7189265537,
127
+ "f": 0.7158931083
128
  },
129
  "root": {
130
+ "p": 0.8483754513,
131
+ "r": 0.8333333333,
132
+ "f": 0.8407871199
133
  },
134
  "nsubj": {
135
+ "p": 0.8333333333,
136
+ "r": 0.8333333333,
137
+ "f": 0.8333333333
138
  },
139
  "case": {
140
+ "p": 0.8933859822,
141
+ "r": 0.892504931,
142
+ "f": 0.8929452393
143
  },
144
  "obl": {
145
+ "p": 0.6905901116,
146
+ "r": 0.6723602484,
147
+ "f": 0.6813532651
148
  },
149
  "cc": {
150
+ "p": 0.7803468208,
151
+ "r": 0.7848837209,
152
+ "f": 0.7826086957
153
  },
154
  "conj": {
155
+ "p": 0.6422764228,
156
+ "r": 0.632,
157
+ "f": 0.6370967742
158
  },
159
  "obj": {
160
+ "p": 0.7892791128,
161
+ "r": 0.8291262136,
162
+ "f": 0.8087121212
163
  },
164
  "aux": {
165
+ "p": 0.8858858859,
166
+ "r": 0.860058309,
167
+ "f": 0.8727810651
168
  },
169
  "acl:relcl": {
170
+ "p": 0.5837837838,
171
+ "r": 0.5837837838,
172
+ "f": 0.5837837838
173
  },
174
  "advmod:lmod": {
175
+ "p": 0.7164179104,
176
+ "r": 0.7164179104,
177
+ "f": 0.7164179104
178
  },
179
  "det": {
180
+ "p": 0.9126853377,
181
+ "r": 0.9126853377,
182
+ "f": 0.9126853377
183
  },
184
  "amod": {
185
+ "p": 0.8155668359,
186
+ "r": 0.8225255973,
187
+ "f": 0.8190314359
188
  },
189
  "nmod:poss": {
190
+ "p": 0.6730769231,
191
+ "r": 0.6930693069,
192
+ "f": 0.6829268293
193
  },
194
  "ccomp": {
195
+ "p": 0.5967741935,
196
+ "r": 0.5967741935,
197
+ "f": 0.5967741935
198
  },
199
  "nummod": {
200
+ "p": 0.8416666667,
201
+ "r": 0.8416666667,
202
+ "f": 0.8416666667
203
  },
204
  "flat": {
205
+ "p": 0.765060241,
206
+ "r": 0.8410596026,
207
+ "f": 0.8012618297
208
  },
209
  "compound:prt": {
210
+ "p": 0.625,
211
+ "r": 0.3658536585,
212
+ "f": 0.4615384615
213
  },
214
  "advcl": {
215
+ "p": 0.6126126126,
216
+ "r": 0.5862068966,
217
+ "f": 0.5991189427
218
  },
219
  "mark": {
220
+ "p": 0.8553719008,
221
+ "r": 0.8501026694,
222
+ "f": 0.8527291452
223
  },
224
  "cop": {
225
+ "p": 0.825136612,
226
+ "r": 0.8628571429,
227
+ "f": 0.843575419
228
  },
229
  "dep": {
230
+ "p": 0.1875,
231
+ "r": 0.2830188679,
232
+ "f": 0.2255639098
233
  },
234
  "nmod": {
235
+ "p": 0.6581532417,
236
+ "r": 0.654296875,
237
+ "f": 0.6562193928
238
  },
239
  "iobj": {
240
+ "p": 0.7692307692,
241
+ "r": 0.4545454545,
242
+ "f": 0.5714285714
243
  },
244
  "xcomp": {
245
+ "p": 0.4705882353,
246
+ "r": 0.406779661,
247
+ "f": 0.4363636364
 
 
 
 
 
248
  },
249
  "list": {
250
+ "p": 0.4615384615,
251
+ "r": 0.3333333333,
252
+ "f": 0.3870967742
253
  },
254
  "vocative": {
255
  "p": 0.0,
 
257
  "f": 0.0
258
  },
259
  "fixed": {
260
+ "p": 0.9166666667,
261
  "r": 0.8048780488,
262
+ "f": 0.8571428571
263
  },
264
  "expl": {
265
+ "p": 0.8,
266
+ "r": 0.8235294118,
267
+ "f": 0.8115942029
268
+ },
269
+ "appos": {
270
+ "p": 0.4166666667,
271
+ "r": 0.4545454545,
272
+ "f": 0.4347826087
273
  },
274
  "obl:tmod": {
275
+ "p": 0.75,
276
+ "r": 0.3333333333,
277
+ "f": 0.4615384615
278
  },
279
+ "discourse": {
280
  "p": 0.0,
281
  "r": 0.0,
282
  "f": 0.0
283
  },
284
+ "obl:lmod": {
285
  "p": 0.0,
286
  "r": 0.0,
287
  "f": 0.0
288
  }
289
  },
290
+ "lemma_acc": 0.9497336562,
291
+ "tag_acc": 0.9618401937,
292
+ "ents_p": 0.8063829787,
293
+ "ents_r": 0.7895833333,
294
+ "ents_f": 0.7978947368,
295
  "ents_per_type": {
296
  "PER": {
297
+ "p": 0.8924050633,
298
  "r": 0.8493975904,
299
+ "f": 0.8703703704
300
  },
301
  "ORG": {
302
+ "p": 0.7073170732,
303
+ "r": 0.6444444444,
304
+ "f": 0.6744186047
305
  },
306
  "MISC": {
307
+ "p": 0.7142857143,
308
+ "r": 0.7079646018,
309
+ "f": 0.7111111111
310
  },
311
  "LOC": {
312
+ "p": 0.8474576271,
313
+ "r": 0.9009009009,
314
+ "f": 0.8733624454
315
  }
316
  },
317
+ "speed": 12214.1305450038
318
  }
da_core_news_md-any-py3-none-any.whl CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:25dcaba4499ac19b4f1d23884cc5896401eb1e2c896c6a49c10a6f8fe6190398
3
- size 42193668
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9ab33cc4d15f68126d012a01c972736fd789a76a7ade79425877a58f9f10797a
3
+ size 42193115
lemmatizer/cfg CHANGED
@@ -68,382 +68,379 @@
68
  145,
69
  147,
70
  148,
71
- 149,
72
- 153,
73
- 155,
74
- 158,
75
- 161,
76
- 164,
77
- 166,
78
- 168,
79
- 170,
80
- 172,
81
  174,
82
- 175,
83
- 177,
84
- 179,
85
- 182,
86
- 184,
87
- 186,
88
- 188,
89
- 190,
90
- 192,
91
- 194,
92
- 196,
93
- 199,
94
- 201,
95
  203,
96
- 204,
97
  207,
98
- 208,
99
  209,
 
100
  211,
101
  213,
102
- 214,
103
- 216,
104
- 218,
105
  220,
106
  222,
107
  224,
108
- 226,
109
  229,
110
- 231,
111
  232,
112
  233,
113
  235,
114
  236,
115
- 238,
116
- 239,
117
- 243,
118
- 249,
119
- 253,
120
- 255,
121
- 257,
122
- 259,
123
  261,
124
  262,
125
  263,
126
- 264,
127
- 267,
128
  269,
129
- 270,
130
- 272,
131
- 274,
132
- 276,
133
- 278,
134
- 280,
135
- 282,
136
  284,
137
  286,
 
138
  290,
139
- 291,
140
  293,
141
  295,
 
142
  297,
143
  299,
144
- 300,
145
- 302,
146
- 303,
147
  304,
148
- 306,
149
- 308,
150
- 311,
151
- 314,
152
  315,
153
- 317,
 
 
154
  320,
155
- 321,
156
  323,
157
- 324,
158
  326,
159
- 327,
160
- 328,
161
  330,
162
- 331,
163
  333,
164
  337,
165
  339,
166
- 340,
167
- 344,
168
  346,
169
- 350,
170
- 353,
 
 
171
  354,
172
  355,
173
- 358,
 
174
  360,
175
- 361,
176
  363,
177
- 365,
178
- 366,
179
- 369,
180
  372,
181
  373,
 
 
182
  376,
183
- 380,
184
- 382,
 
185
  383,
186
- 384,
187
- 386,
188
  387,
 
189
  389,
190
  391,
191
- 392,
192
- 394,
193
  395,
194
- 398,
195
  400,
196
  402,
 
197
  404,
 
198
  406,
 
199
  409,
200
- 411,
201
  412,
202
  413,
203
  415,
204
- 417,
205
- 420,
 
206
  421,
207
  423,
208
- 424,
209
  425,
210
  427,
211
  429,
212
  431,
213
  433,
214
- 434,
215
- 436,
216
  437,
217
  439,
218
- 440,
219
  442,
220
  444,
221
- 445,
222
- 449,
223
- 450,
224
  452,
225
  454,
226
- 457,
227
- 459,
 
 
228
  462,
229
  465,
230
  466,
231
- 468,
232
  470,
233
- 471,
234
  474,
235
  475,
236
  478,
237
- 480,
238
- 483,
239
- 485,
240
- 486,
241
  487,
242
  489,
 
243
  491,
244
  492,
245
  493,
246
- 495,
247
  496,
248
- 498,
249
- 500,
250
  501,
251
  502,
252
  503,
253
  504,
254
  505,
255
- 507,
256
  508,
257
  509,
258
- 510,
259
  511,
260
- 512,
261
- 514,
262
  515,
263
- 516,
264
- 518,
265
  519,
266
  520,
267
  521,
268
  523,
 
269
  525,
270
  526,
271
  528,
 
272
  531,
273
- 533,
274
- 535,
275
- 453,
276
- 536,
277
  538,
278
  539,
279
- 541,
280
- 545,
281
- 547,
282
  548,
283
- 549,
284
  550,
285
  551,
 
286
  553,
287
  554,
288
- 555,
289
- 557,
290
  559,
291
  560,
292
- 561,
293
- 563,
294
  565,
295
  566,
296
  567,
297
- 568,
298
  570,
299
- 571,
300
- 575,
301
- 577,
302
  578,
303
- 579,
304
- 582,
305
- 585,
306
  587,
307
- 589,
308
- 593,
309
  594,
310
- 596,
311
- 597,
312
  601,
 
313
  603,
314
- 605,
315
  609,
316
  611,
317
- 612,
318
- 613,
319
- 614,
320
  615,
321
- 616,
322
  617,
 
323
  619,
 
324
  621,
325
- 622,
326
- 624,
327
  625,
328
- 627,
329
  628,
330
- 629,
331
- 632,
332
- 634,
333
- 638,
 
334
  639,
335
- 640,
336
- 642,
337
- 644,
338
  647,
339
  649,
340
- 650,
341
- 651,
342
- 653,
343
  654,
344
  655,
345
  657,
346
  658,
347
- 659,
348
  661,
349
- 663,
350
- 665,
351
- 667,
352
- 669,
353
  670,
354
- 672,
355
- 674,
 
356
  676,
357
- 677,
358
  678,
359
  680,
360
- 682,
361
  683,
362
  685,
363
- 686,
364
  688,
365
- 689,
366
  690,
367
  691,
368
- 694,
369
- 695,
370
  696,
371
  697,
 
372
  699,
373
- 700,
374
  701,
375
  703,
 
376
  705,
377
  706,
378
- 707,
379
- 708,
380
- 712,
381
  715,
382
  716,
383
- 718,
384
  720,
385
- 724,
 
386
  726,
 
387
  729,
388
  730,
389
  732,
390
- 733,
391
  734,
392
  736,
393
- 738,
394
  739,
395
  740,
396
  741,
397
  742,
398
- 743,
399
- 744,
400
- 747,
401
- 749,
402
- 753,
403
- 756,
404
- 758,
405
  759,
 
406
  761,
407
- 762,
408
  763,
409
  764,
410
- 766,
411
- 768,
412
  769,
 
413
  771,
 
414
  773,
415
  774,
416
  775,
417
  776,
418
- 777,
419
- 781,
420
- 783,
421
  784,
422
  785,
423
- 788,
424
- 791,
 
425
  792,
426
- 794,
427
  796,
428
- 797,
429
  798,
430
- 799,
431
  800,
432
- 802,
433
  803,
434
  804,
435
  805,
436
  806,
437
  808,
438
  809,
439
- 810,
440
  811,
441
  812,
 
442
  814,
443
  815,
444
  817,
445
  819,
446
- 820,
447
  822,
448
  824,
449
  825,
@@ -452,6 +449,8 @@
452
  831,
453
  833,
454
  835,
455
- 837
 
 
456
  ]
457
  }
 
68
  145,
69
  147,
70
  148,
71
+ 152,
72
+ 154,
73
+ 157,
74
+ 160,
75
+ 163,
76
+ 165,
77
+ 167,
78
+ 169,
79
+ 171,
80
+ 173,
81
  174,
82
+ 176,
83
+ 178,
84
+ 181,
85
+ 183,
86
+ 185,
87
+ 187,
88
+ 189,
89
+ 191,
90
+ 193,
91
+ 195,
92
+ 198,
93
+ 200,
94
+ 202,
95
  203,
96
+ 206,
97
  207,
 
98
  209,
99
+ 210,
100
  211,
101
  213,
102
+ 215,
103
+ 217,
104
+ 219,
105
  220,
106
  222,
107
  224,
108
+ 227,
109
  229,
110
+ 230,
111
  232,
112
  233,
113
  235,
114
  236,
115
+ 240,
116
+ 246,
117
+ 250,
118
+ 252,
119
+ 254,
120
+ 256,
121
+ 258,
122
+ 260,
123
  261,
124
  262,
125
  263,
126
+ 266,
127
+ 268,
128
  269,
129
+ 271,
130
+ 273,
131
+ 275,
132
+ 277,
133
+ 279,
134
+ 283,
 
135
  284,
136
  286,
137
+ 288,
138
  290,
139
+ 292,
140
  293,
141
  295,
142
+ 296,
143
  297,
144
  299,
145
+ 301,
 
 
146
  304,
147
+ 307,
148
+ 309,
149
+ 312,
150
+ 313,
151
  315,
152
+ 316,
153
+ 318,
154
+ 319,
155
  320,
156
+ 322,
157
  323,
158
+ 325,
159
  326,
 
 
160
  330,
161
+ 332,
162
  333,
163
  337,
164
  339,
165
+ 343,
 
166
  346,
167
+ 347,
168
+ 348,
169
+ 351,
170
+ 352,
171
  354,
172
  355,
173
+ 356,
174
+ 359,
175
  360,
 
176
  363,
177
+ 364,
178
+ 367,
179
+ 371,
180
  372,
181
  373,
182
+ 374,
183
+ 375,
184
  376,
185
+ 377,
186
+ 379,
187
+ 381,
188
  383,
189
+ 385,
 
190
  387,
191
+ 388,
192
  389,
193
  391,
194
+ 393,
 
195
  395,
196
+ 397,
197
  400,
198
  402,
199
+ 403,
200
  404,
201
+ 405,
202
  406,
203
+ 408,
204
  409,
 
205
  412,
206
  413,
207
  415,
208
+ 416,
209
+ 418,
210
+ 419,
211
  421,
212
  423,
 
213
  425,
214
  427,
215
  429,
216
  431,
217
  433,
218
+ 435,
 
219
  437,
220
  439,
221
+ 441,
222
  442,
223
  444,
224
+ 446,
225
+ 447,
226
+ 451,
227
  452,
228
  454,
229
+ 455,
230
+ 456,
231
+ 458,
232
+ 461,
233
  462,
234
  465,
235
  466,
236
+ 469,
237
  470,
238
+ 472,
239
  474,
240
  475,
241
  478,
242
+ 479,
243
+ 482,
244
+ 484,
 
245
  487,
246
  489,
247
+ 490,
248
  491,
249
  492,
250
  493,
251
+ 494,
252
  496,
253
+ 497,
254
+ 499,
255
  501,
256
  502,
257
  503,
258
  504,
259
  505,
260
+ 506,
261
  508,
262
  509,
 
263
  511,
264
+ 513,
 
265
  515,
266
+ 517,
 
267
  519,
268
  520,
269
  521,
270
  523,
271
+ 524,
272
  525,
273
  526,
274
  528,
275
+ 529,
276
  531,
277
+ 532,
278
+ 534,
279
+ 537,
 
280
  538,
281
  539,
282
+ 540,
283
+ 542,
284
+ 544,
285
  548,
 
286
  550,
287
  551,
288
+ 552,
289
  553,
290
  554,
291
+ 556,
292
+ 558,
293
  559,
294
  560,
295
+ 562,
296
+ 564,
297
  565,
298
  566,
299
  567,
300
+ 569,
301
  570,
302
+ 574,
303
+ 576,
 
304
  578,
305
+ 581,
306
+ 583,
307
+ 584,
308
  587,
309
+ 590,
310
+ 592,
311
  594,
312
+ 598,
313
+ 599,
314
  601,
315
+ 602,
316
  603,
317
+ 607,
318
  609,
319
  611,
 
 
 
320
  615,
 
321
  617,
322
+ 618,
323
  619,
324
+ 620,
325
  621,
326
+ 623,
 
327
  625,
328
+ 626,
329
  628,
330
+ 630,
331
+ 631,
332
+ 633,
333
+ 635,
334
+ 636,
335
  639,
336
+ 641,
337
+ 645,
338
+ 646,
339
  647,
340
  649,
341
+ 652,
 
 
342
  654,
343
  655,
344
  657,
345
  658,
346
+ 660,
347
  661,
348
+ 662,
349
+ 664,
350
+ 666,
351
+ 668,
352
  670,
353
+ 671,
354
+ 673,
355
+ 675,
356
  676,
 
357
  678,
358
  680,
359
+ 681,
360
  683,
361
  685,
362
+ 687,
363
  688,
 
364
  690,
365
  691,
366
+ 692,
367
+ 693,
368
  696,
369
  697,
370
+ 698,
371
  699,
 
372
  701,
373
  703,
374
+ 704,
375
  705,
376
  706,
377
+ 710,
378
+ 713,
 
379
  715,
380
  716,
 
381
  720,
382
+ 722,
383
+ 725,
384
  726,
385
+ 728,
386
  729,
387
  730,
388
  732,
 
389
  734,
390
  736,
391
+ 737,
392
  739,
393
  740,
394
  741,
395
  742,
396
+ 745,
397
+ 746,
398
+ 748,
399
+ 752,
400
+ 755,
401
+ 757,
 
402
  759,
403
+ 760,
404
  761,
 
405
  763,
406
  764,
407
+ 765,
408
+ 767,
409
  769,
410
+ 770,
411
  771,
412
+ 772,
413
  773,
414
  774,
415
  775,
416
  776,
417
+ 780,
418
+ 782,
 
419
  784,
420
  785,
421
+ 786,
422
+ 787,
423
+ 790,
424
  792,
425
+ 795,
426
  796,
 
427
  798,
 
428
  800,
429
+ 801,
430
  803,
431
  804,
432
  805,
433
  806,
434
  808,
435
  809,
 
436
  811,
437
  812,
438
+ 813,
439
  814,
440
  815,
441
  817,
442
  819,
443
+ 821,
444
  822,
445
  824,
446
  825,
 
449
  831,
450
  833,
451
  835,
452
+ 837,
453
+ 839,
454
+ 841
455
  ]
456
  }
lemmatizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5dbaeda1129c701ac9da038242ad1d176d2d9b00e1b9fdaaefa9fd25435920f3
3
- size 176206
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:356c369c9c50b0510e9dfab74689db20b2e0cb65718095e901e600f4d74aa9b0
3
+ size 175818
lemmatizer/trees CHANGED
Binary files a/lemmatizer/trees and b/lemmatizer/trees differ
 
meta.json CHANGED
@@ -1,14 +1,14 @@
1
  {
2
  "lang":"da",
3
  "name":"core_news_md",
4
- "version":"3.3.0",
5
  "description":"Danish pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
- "spacy_version":">=3.3.0.dev0,<3.4.0",
11
- "spacy_git_version":"849bef2de",
12
  "vectors":{
13
  "width":300,
14
  "vectors":20000,
@@ -106,6 +106,7 @@
106
  "Gender=Com|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs|Style=Form",
107
  "Number=Plur|POS=PRON|PronType=Rcp",
108
  "Case=Gen|Degree=Cmp|POS=ADJ",
 
109
  "Case=Gen|Definite=Def|Gender=Neut|Number=Plur|POS=NOUN",
110
  "Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs",
111
  "POS=INTJ",
@@ -247,51 +248,51 @@
247
  "token_p":0.9977732598,
248
  "token_r":0.9974835463,
249
  "token_f":0.997628382,
250
- "pos_acc":0.9641646489,
251
- "morph_acc":0.9505084746,
252
- "morph_micro_p":0.9668578389,
253
- "morph_micro_r":0.9615869971,
254
- "morph_micro_f":0.9642152149,
255
  "morph_per_feat":{
256
  "Mood":{
257
- "p":0.9723809524,
258
- "r":0.9733079123,
259
- "f":0.9728442115
260
  },
261
  "Tense":{
262
- "p":0.9669172932,
263
- "r":0.968373494,
264
- "f":0.9676448457
265
  },
266
  "VerbForm":{
267
- "p":0.9583588487,
268
- "r":0.9577723378,
269
- "f":0.9580655035
270
  },
271
  "Voice":{
272
- "p":0.9739195231,
273
- "r":0.9768310912,
274
- "f":0.9753731343
275
  },
276
  "Definite":{
277
- "p":0.964940239,
278
- "r":0.9569340182,
279
- "f":0.9609204523
280
  },
281
  "Gender":{
282
- "p":0.9487608841,
283
- "r":0.9415088069,
284
- "f":0.9451209341
285
  },
286
  "Number":{
287
- "p":0.9608615708,
288
- "r":0.95409494,
289
- "f":0.9574663002
290
  },
291
  "AdpType":{
292
- "p":1.0,
293
  "r":0.9920424403,
294
- "f":0.9960053262
295
  },
296
  "PartType":{
297
  "p":1.0,
@@ -299,29 +300,29 @@
299
  "f":1.0
300
  },
301
  "Case":{
302
- "p":0.9775641026,
303
- "r":0.9636650869,
304
- "f":0.9705648369
305
  },
306
  "Person":{
307
- "p":0.9788359788,
308
- "r":0.9857904085,
309
- "f":0.982300885
310
  },
311
  "PronType":{
312
- "p":0.9851607585,
313
- "r":0.9827302632,
314
- "f":0.9839440099
315
  },
316
  "NumType":{
317
- "p":0.9863013699,
318
  "r":0.9536423841,
319
- "f":0.9696969697
320
  },
321
  "Degree":{
322
- "p":0.9548229548,
323
- "r":0.9421686747,
324
- "f":0.9484536082
325
  },
326
  "Reflex":{
327
  "p":1.0,
@@ -329,19 +330,19 @@
329
  "f":1.0
330
  },
331
  "Number[psor]":{
332
- "p":0.988372093,
333
- "r":0.988372093,
334
- "f":0.988372093
335
  },
336
  "Poss":{
337
- "p":0.9886363636,
338
- "r":0.9886363636,
339
- "f":0.9886363636
340
  },
341
  "Foreign":{
342
- "p":0.6666666667,
343
  "r":0.4,
344
- "f":0.5
345
  },
346
  "Abbr":{
347
  "p":0.0,
@@ -354,151 +355,146 @@
354
  "f":1.0
355
  },
356
  "Polite":{
357
- "p":1.0,
358
  "r":0.75,
359
- "f":0.8571428571
360
  }
361
  },
362
- "sents_p":0.9219600726,
363
  "sents_r":0.9007092199,
364
- "sents_f":0.9112107623,
365
- "dep_uas":0.8130063132,
366
- "dep_las":0.7723336499,
367
  "dep_las_per_type":{
368
  "advmod":{
369
- "p":0.6868965517,
370
- "r":0.7033898305,
371
- "f":0.6950453594
372
  },
373
  "root":{
374
- "p":0.8381818182,
375
- "r":0.8173758865,
376
- "f":0.8276481149
377
  },
378
  "nsubj":{
379
- "p":0.8317460317,
380
- "r":0.8291139241,
381
- "f":0.8304278922
382
  },
383
  "case":{
384
- "p":0.883218842,
385
- "r":0.8875739645,
386
- "f":0.8853910477
387
  },
388
  "obl":{
389
- "p":0.6935483871,
390
- "r":0.6677018634,
391
- "f":0.6803797468
392
  },
393
  "cc":{
394
- "p":0.7797101449,
395
- "r":0.7819767442,
396
- "f":0.7808417997
397
  },
398
  "conj":{
399
- "p":0.6305555556,
400
- "r":0.6053333333,
401
- "f":0.6176870748
402
  },
403
  "obj":{
404
- "p":0.7667269439,
405
- "r":0.8233009709,
406
- "f":0.7940074906
407
  },
408
  "aux":{
409
- "p":0.8797653959,
410
- "r":0.8746355685,
411
- "f":0.8771929825
412
  },
413
  "acl:relcl":{
414
- "p":0.6011235955,
415
- "r":0.5783783784,
416
- "f":0.5895316804
417
  },
418
  "advmod:lmod":{
419
- "p":0.6388888889,
420
- "r":0.6865671642,
421
- "f":0.6618705036
422
  },
423
  "det":{
424
- "p":0.9143327842,
425
- "r":0.9143327842,
426
- "f":0.9143327842
427
  },
428
  "amod":{
429
- "p":0.7954173486,
430
- "r":0.8293515358,
431
- "f":0.8120300752
432
  },
433
  "nmod:poss":{
434
- "p":0.6593406593,
435
- "r":0.5940594059,
436
- "f":0.625
437
  },
438
  "ccomp":{
439
- "p":0.5890410959,
440
- "r":0.6935483871,
441
- "f":0.637037037
442
  },
443
  "nummod":{
444
- "p":0.8512396694,
445
- "r":0.8583333333,
446
- "f":0.8547717842
447
  },
448
  "flat":{
449
- "p":0.7514450867,
450
- "r":0.8609271523,
451
- "f":0.8024691358
452
  },
453
  "compound:prt":{
454
- "p":0.4285714286,
455
- "r":0.2195121951,
456
- "f":0.2903225806
457
  },
458
  "advcl":{
459
- "p":0.5909090909,
460
- "r":0.5603448276,
461
- "f":0.5752212389
462
  },
463
  "mark":{
464
- "p":0.8742138365,
465
- "r":0.8562628337,
466
- "f":0.8651452282
467
  },
468
  "cop":{
469
- "p":0.7891891892,
470
- "r":0.8342857143,
471
- "f":0.8111111111
472
  },
473
  "dep":{
474
- "p":0.1538461538,
475
- "r":0.2641509434,
476
- "f":0.1944444444
477
  },
478
  "nmod":{
479
- "p":0.6551724138,
480
- "r":0.630859375,
481
- "f":0.6427860697
482
  },
483
  "iobj":{
484
- "p":0.7272727273,
485
- "r":0.3636363636,
486
- "f":0.4848484848
487
  },
488
  "xcomp":{
489
- "p":0.5833333333,
490
- "r":0.3559322034,
491
- "f":0.4421052632
492
- },
493
- "appos":{
494
- "p":0.4375,
495
- "r":0.4242424242,
496
- "f":0.4307692308
497
  },
498
  "list":{
499
- "p":0.375,
500
- "r":0.1666666667,
501
- "f":0.2307692308
502
  },
503
  "vocative":{
504
  "p":0.0,
@@ -506,59 +502,64 @@
506
  "f":0.0
507
  },
508
  "fixed":{
509
- "p":0.8918918919,
510
  "r":0.8048780488,
511
- "f":0.8461538462
512
  },
513
  "expl":{
514
- "p":0.8181818182,
515
- "r":0.7941176471,
516
- "f":0.8059701493
 
 
 
 
 
517
  },
518
  "obl:tmod":{
519
- "p":0.7777777778,
520
- "r":0.3888888889,
521
- "f":0.5185185185
522
  },
523
- "obl:lmod":{
524
  "p":0.0,
525
  "r":0.0,
526
  "f":0.0
527
  },
528
- "discourse":{
529
  "p":0.0,
530
  "r":0.0,
531
  "f":0.0
532
  }
533
  },
534
- "lemma_acc":0.9481840194,
535
- "tag_acc":0.9641646489,
536
- "ents_p":0.8079331942,
537
- "ents_r":0.80625,
538
- "ents_f":0.8070907195,
539
  "ents_per_type":{
540
  "PER":{
541
- "p":0.88125,
542
  "r":0.8493975904,
543
- "f":0.8650306748
544
  },
545
  "ORG":{
546
- "p":0.7294117647,
547
- "r":0.6888888889,
548
- "f":0.7085714286
549
  },
550
  "MISC":{
551
- "p":0.6991869919,
552
- "r":0.7610619469,
553
- "f":0.7288135593
554
  },
555
  "LOC":{
556
- "p":0.8828828829,
557
- "r":0.8828828829,
558
- "f":0.8828828829
559
  }
560
  },
561
- "speed":11453.5916881723
562
  },
563
  "sources":[
564
  {
 
1
  {
2
  "lang":"da",
3
  "name":"core_news_md",
4
+ "version":"3.4.0",
5
  "description":"Danish pipeline optimized for CPU. Components: tok2vec, morphologizer, parser, lemmatizer (trainable_lemmatizer), senter, ner, attribute_ruler.",
6
  "author":"Explosion",
7
  "email":"contact@explosion.ai",
8
  "url":"https://explosion.ai",
9
  "license":"CC BY-SA 4.0",
10
+ "spacy_version":">=3.4.0,<3.5.0",
11
+ "spacy_git_version":"dd038b536",
12
  "vectors":{
13
  "width":300,
14
  "vectors":20000,
 
106
  "Gender=Com|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs|Style=Form",
107
  "Number=Plur|POS=PRON|PronType=Rcp",
108
  "Case=Gen|Degree=Cmp|POS=ADJ",
109
+ "POS=SPACE",
110
  "Case=Gen|Definite=Def|Gender=Neut|Number=Plur|POS=NOUN",
111
  "Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs",
112
  "POS=INTJ",
 
248
  "token_p":0.9977732598,
249
  "token_r":0.9974835463,
250
  "token_f":0.997628382,
251
+ "pos_acc":0.9618401937,
252
+ "morph_acc":0.948377724,
253
+ "morph_micro_p":0.9675176369,
254
+ "morph_micro_r":0.9622431982,
255
+ "morph_micro_f":0.9648732095,
256
  "morph_per_feat":{
257
  "Mood":{
258
+ "p":0.9799235182,
259
+ "r":0.9771210677,
260
+ "f":0.9785202864
261
  },
262
  "Tense":{
263
+ "p":0.9743396226,
264
+ "r":0.9721385542,
265
+ "f":0.973237844
266
  },
267
  "VerbForm":{
268
+ "p":0.9643953346,
269
+ "r":0.9614443084,
270
+ "f":0.9629175605
271
  },
272
  "Voice":{
273
+ "p":0.976083707,
274
+ "r":0.976083707,
275
+ "f":0.976083707
276
  },
277
  "Definite":{
278
+ "p":0.9622716442,
279
+ "r":0.9573291189,
280
+ "f":0.9597940186
281
  },
282
  "Gender":{
283
+ "p":0.9466310874,
284
+ "r":0.9431704885,
285
+ "f":0.9448976194
286
  },
287
  "Number":{
288
+ "p":0.9613361389,
289
+ "r":0.9533124674,
290
+ "f":0.9573074908
291
  },
292
  "AdpType":{
293
+ "p":0.9982206406,
294
  "r":0.9920424403,
295
+ "f":0.9951219512
296
  },
297
  "PartType":{
298
  "p":1.0,
 
300
  "f":1.0
301
  },
302
  "Case":{
303
+ "p":0.9741935484,
304
+ "r":0.9541864139,
305
+ "f":0.9640861931
306
  },
307
  "Person":{
308
+ "p":0.9788732394,
309
+ "r":0.9875666075,
310
+ "f":0.9832007073
311
  },
312
  "PronType":{
313
+ "p":0.9860197368,
314
+ "r":0.9860197368,
315
+ "f":0.9860197368
316
  },
317
  "NumType":{
318
+ "p":0.9931034483,
319
  "r":0.9536423841,
320
+ "f":0.972972973
321
  },
322
  "Degree":{
323
+ "p":0.9545454545,
324
+ "r":0.9361445783,
325
+ "f":0.9452554745
326
  },
327
  "Reflex":{
328
  "p":1.0,
 
330
  "f":1.0
331
  },
332
  "Number[psor]":{
333
+ "p":0.9772727273,
334
+ "r":1.0,
335
+ "f":0.9885057471
336
  },
337
  "Poss":{
338
+ "p":0.9887640449,
339
+ "r":1.0,
340
+ "f":0.9943502825
341
  },
342
  "Foreign":{
343
+ "p":0.5,
344
  "r":0.4,
345
+ "f":0.4444444444
346
  },
347
  "Abbr":{
348
  "p":0.0,
 
355
  "f":1.0
356
  },
357
  "Polite":{
358
+ "p":0.75,
359
  "r":0.75,
360
+ "f":0.75
361
  }
362
  },
363
+ "sents_p":0.9202898551,
364
  "sents_r":0.9007092199,
365
+ "sents_f":0.9103942652,
366
+ "dep_uas":0.8215642458,
367
+ "dep_las":0.7802234637,
368
  "dep_las_per_type":{
369
  "advmod":{
370
+ "p":0.7128851541,
371
+ "r":0.7189265537,
372
+ "f":0.7158931083
373
  },
374
  "root":{
375
+ "p":0.8483754513,
376
+ "r":0.8333333333,
377
+ "f":0.8407871199
378
  },
379
  "nsubj":{
380
+ "p":0.8333333333,
381
+ "r":0.8333333333,
382
+ "f":0.8333333333
383
  },
384
  "case":{
385
+ "p":0.8933859822,
386
+ "r":0.892504931,
387
+ "f":0.8929452393
388
  },
389
  "obl":{
390
+ "p":0.6905901116,
391
+ "r":0.6723602484,
392
+ "f":0.6813532651
393
  },
394
  "cc":{
395
+ "p":0.7803468208,
396
+ "r":0.7848837209,
397
+ "f":0.7826086957
398
  },
399
  "conj":{
400
+ "p":0.6422764228,
401
+ "r":0.632,
402
+ "f":0.6370967742
403
  },
404
  "obj":{
405
+ "p":0.7892791128,
406
+ "r":0.8291262136,
407
+ "f":0.8087121212
408
  },
409
  "aux":{
410
+ "p":0.8858858859,
411
+ "r":0.860058309,
412
+ "f":0.8727810651
413
  },
414
  "acl:relcl":{
415
+ "p":0.5837837838,
416
+ "r":0.5837837838,
417
+ "f":0.5837837838
418
  },
419
  "advmod:lmod":{
420
+ "p":0.7164179104,
421
+ "r":0.7164179104,
422
+ "f":0.7164179104
423
  },
424
  "det":{
425
+ "p":0.9126853377,
426
+ "r":0.9126853377,
427
+ "f":0.9126853377
428
  },
429
  "amod":{
430
+ "p":0.8155668359,
431
+ "r":0.8225255973,
432
+ "f":0.8190314359
433
  },
434
  "nmod:poss":{
435
+ "p":0.6730769231,
436
+ "r":0.6930693069,
437
+ "f":0.6829268293
438
  },
439
  "ccomp":{
440
+ "p":0.5967741935,
441
+ "r":0.5967741935,
442
+ "f":0.5967741935
443
  },
444
  "nummod":{
445
+ "p":0.8416666667,
446
+ "r":0.8416666667,
447
+ "f":0.8416666667
448
  },
449
  "flat":{
450
+ "p":0.765060241,
451
+ "r":0.8410596026,
452
+ "f":0.8012618297
453
  },
454
  "compound:prt":{
455
+ "p":0.625,
456
+ "r":0.3658536585,
457
+ "f":0.4615384615
458
  },
459
  "advcl":{
460
+ "p":0.6126126126,
461
+ "r":0.5862068966,
462
+ "f":0.5991189427
463
  },
464
  "mark":{
465
+ "p":0.8553719008,
466
+ "r":0.8501026694,
467
+ "f":0.8527291452
468
  },
469
  "cop":{
470
+ "p":0.825136612,
471
+ "r":0.8628571429,
472
+ "f":0.843575419
473
  },
474
  "dep":{
475
+ "p":0.1875,
476
+ "r":0.2830188679,
477
+ "f":0.2255639098
478
  },
479
  "nmod":{
480
+ "p":0.6581532417,
481
+ "r":0.654296875,
482
+ "f":0.6562193928
483
  },
484
  "iobj":{
485
+ "p":0.7692307692,
486
+ "r":0.4545454545,
487
+ "f":0.5714285714
488
  },
489
  "xcomp":{
490
+ "p":0.4705882353,
491
+ "r":0.406779661,
492
+ "f":0.4363636364
 
 
 
 
 
493
  },
494
  "list":{
495
+ "p":0.4615384615,
496
+ "r":0.3333333333,
497
+ "f":0.3870967742
498
  },
499
  "vocative":{
500
  "p":0.0,
 
502
  "f":0.0
503
  },
504
  "fixed":{
505
+ "p":0.9166666667,
506
  "r":0.8048780488,
507
+ "f":0.8571428571
508
  },
509
  "expl":{
510
+ "p":0.8,
511
+ "r":0.8235294118,
512
+ "f":0.8115942029
513
+ },
514
+ "appos":{
515
+ "p":0.4166666667,
516
+ "r":0.4545454545,
517
+ "f":0.4347826087
518
  },
519
  "obl:tmod":{
520
+ "p":0.75,
521
+ "r":0.3333333333,
522
+ "f":0.4615384615
523
  },
524
+ "discourse":{
525
  "p":0.0,
526
  "r":0.0,
527
  "f":0.0
528
  },
529
+ "obl:lmod":{
530
  "p":0.0,
531
  "r":0.0,
532
  "f":0.0
533
  }
534
  },
535
+ "lemma_acc":0.9497336562,
536
+ "tag_acc":0.9618401937,
537
+ "ents_p":0.8063829787,
538
+ "ents_r":0.7895833333,
539
+ "ents_f":0.7978947368,
540
  "ents_per_type":{
541
  "PER":{
542
+ "p":0.8924050633,
543
  "r":0.8493975904,
544
+ "f":0.8703703704
545
  },
546
  "ORG":{
547
+ "p":0.7073170732,
548
+ "r":0.6444444444,
549
+ "f":0.6744186047
550
  },
551
  "MISC":{
552
+ "p":0.7142857143,
553
+ "r":0.7079646018,
554
+ "f":0.7111111111
555
  },
556
  "LOC":{
557
+ "p":0.8474576271,
558
+ "r":0.9009009009,
559
+ "f":0.8733624454
560
  }
561
  },
562
+ "speed":12214.1305450038
563
  },
564
  "sources":[
565
  {
morphologizer/cfg CHANGED
@@ -87,6 +87,7 @@
87
  "Gender=Com|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs|Style=Form":"Gender=Com|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs|Style=Form",
88
  "Number=Plur|POS=PRON|PronType=Rcp":"Number=Plur|PronType=Rcp",
89
  "Case=Gen|Degree=Cmp|POS=ADJ":"Case=Gen|Degree=Cmp",
 
90
  "Case=Gen|Definite=Def|Gender=Neut|Number=Plur|POS=NOUN":"Case=Gen|Definite=Def|Gender=Neut|Number=Plur",
91
  "Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
92
  "POS=INTJ":"",
@@ -246,6 +247,7 @@
246
  "Gender=Com|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs|Style=Form":90,
247
  "Number=Plur|POS=PRON|PronType=Rcp":95,
248
  "Case=Gen|Degree=Cmp|POS=ADJ":84,
 
249
  "Case=Gen|Definite=Def|Gender=Neut|Number=Plur|POS=NOUN":92,
250
  "Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
251
  "POS=INTJ":91,
 
87
  "Gender=Com|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs|Style=Form":"Gender=Com|Number=Sing|Number[psor]=Plur|Person=1|Poss=Yes|PronType=Prs|Style=Form",
88
  "Number=Plur|POS=PRON|PronType=Rcp":"Number=Plur|PronType=Rcp",
89
  "Case=Gen|Degree=Cmp|POS=ADJ":"Case=Gen|Degree=Cmp",
90
+ "POS=SPACE":"",
91
  "Case=Gen|Definite=Def|Gender=Neut|Number=Plur|POS=NOUN":"Case=Gen|Definite=Def|Gender=Neut|Number=Plur",
92
  "Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":"Number[psor]=Plur|Person=3|Poss=Yes|PronType=Prs",
93
  "POS=INTJ":"",
 
247
  "Gender=Com|Number=Sing|Number[psor]=Plur|POS=DET|Person=1|Poss=Yes|PronType=Prs|Style=Form":90,
248
  "Number=Plur|POS=PRON|PronType=Rcp":95,
249
  "Case=Gen|Degree=Cmp|POS=ADJ":84,
250
+ "POS=SPACE":103,
251
  "Case=Gen|Definite=Def|Gender=Neut|Number=Plur|POS=NOUN":92,
252
  "Number[psor]=Plur|POS=DET|Person=3|Poss=Yes|PronType=Prs":90,
253
  "POS=INTJ":91,
morphologizer/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:20e85c840781c0f123abc619c03c85399ed4a8bb47ae7fa1535c3b6d4d75276b
3
- size 61351
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1f3dd440cc2b2ffe48e5129e46f7874970c6979b2c57ddb362c031a7d0292ecd
3
+ size 61739
ner/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:444f9832c0b6efee7c93e41b2bd5ef98a098d6f0a71e36a62f7677a042909eda
3
  size 6496592
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a1b8f5a2faae4c56989b79b266532a0a0e010ee937865c281589fd2cf3ec912d
3
  size 6496592
ner/moves CHANGED
@@ -1 +1 @@
1
- ��moves��{"0":{},"1":{"PER":2146,"MISC":1273,"ORG":1267,"LOC":1144},"2":{"PER":2146,"MISC":1273,"ORG":1267,"LOC":1144},"3":{"PER":2146,"MISC":1273,"ORG":1267,"LOC":1144},"4":{"PER":2146,"MISC":1273,"ORG":1267,"LOC":1144,"":1},"5":{"":1}}�cfg��neg_key�
 
1
+ ��moves��{"0":{},"1":{"PER":2147,"MISC":1275,"ORG":1268,"LOC":1145},"2":{"PER":2147,"MISC":1275,"ORG":1268,"LOC":1145},"3":{"PER":2147,"MISC":1275,"ORG":1268,"LOC":1145},"4":{"PER":2147,"MISC":1275,"ORG":1268,"LOC":1145,"":1},"5":{"":1}}�cfg��neg_key�
parser/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:aae04c7eef9ac270ea79e71070b4d694069e21888c8adc6747f24c97da6c915d
3
  size 308728
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a8cc422d00dc50b0be029d66e9edd548bb761248057b597b19f8f94f5f283bcd
3
  size 308728
parser/moves CHANGED
@@ -1 +1 @@
1
- ��moves�D{"0":{"":41615},"1":{"":34382},"2":{"case":7526,"nsubj":6005,"det":4341,"amod":3967,"advmod":3662,"mark":3530,"aux":2436,"cc":2264,"punct":2187,"cop":1330,"obl":894,"nummod":834,"nmod:poss":656,"nmod":463,"expl":291,"ccomp":203,"obj":195,"xcomp":122,"case||nmod":73,"obl:tmod":53,"dep":48,"acl:relcl":43},"3":{"punct":8693,"obl":3951,"obj":3760,"nmod":3569,"conj":2747,"advmod":2087,"flat":1302,"nsubj":1169,"acl:relcl":1132,"advcl":809,"amod":622,"advmod:lmod":423,"fixed":390,"dep":322,"xcomp":272,"appos":268,"compound:prt":261,"ccomp":252,"acl:relcl||nsubj":237,"case":202,"nummod":168,"list":159,"nmod:poss":156,"punct||conj":151,"cc":135,"mark":133,"iobj":107,"expl":77,"cop":69,"nmod||case":60,"aux":48,"obl:tmod":45,"obl:lmod":44,"cc||case":43,"advcl||advmod":43,"cc||conj":40,"case||obl":38,"punct||case":33},"4":{"ROOT":4383}}�cfg��neg_key�
 
1
+ ��moves�D{"0":{"":41618},"1":{"":34694},"2":{"case":7526,"nsubj":6005,"det":4341,"amod":3967,"advmod":3662,"mark":3530,"aux":2436,"cc":2264,"punct":2187,"cop":1330,"obl":894,"nummod":834,"nmod:poss":656,"nmod":463,"expl":291,"ccomp":203,"obj":195,"xcomp":122,"case||nmod":73,"obl:tmod":53,"dep":51,"acl:relcl":43},"3":{"punct":8693,"obl":3951,"obj":3760,"nmod":3569,"conj":2747,"advmod":2087,"flat":1302,"nsubj":1169,"acl:relcl":1132,"advcl":809,"dep":634,"amod":622,"advmod:lmod":423,"fixed":390,"xcomp":272,"appos":268,"compound:prt":261,"ccomp":252,"acl:relcl||nsubj":237,"case":202,"nummod":168,"list":159,"nmod:poss":156,"punct||conj":151,"cc":135,"mark":133,"iobj":107,"expl":77,"cop":69,"nmod||case":60,"aux":48,"obl:tmod":45,"obl:lmod":44,"cc||case":43,"advcl||advmod":43,"cc||conj":40,"case||obl":38,"punct||case":33},"4":{"ROOT":4383}}�cfg��neg_key�
senter/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:4c17e994908cc6549918a2f0af54d58ec0988bc312bd7c574607b97218e51b9b
3
  size 219953
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c50f933bed18d134dc0323a61e7baf009fb0b703108ca70f0d650a03ab0f50ef
3
  size 219953
tok2vec/model CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:624296ccca73db9a8aa6cf2abbfb11dd88155ffa8c0bd55a79243c0ef4627a04
3
  size 6365604
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69f3bc3816250579fd4b1d28475510cfeeeb068570a0c765b83199b02c6d51fd
3
  size 6365604
vocab/strings.json CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:e742e4f89864a4c4e0324e2c5f25f320183d5db9dd09d3e8fa9e7260bc26ab56
3
- size 10080884
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6dd21462fbe7a706e335e3d37fcc588191e3dd92fd2cf26856583ef5adc2ea32
3
+ size 10087412