devhem committed on
Commit
d285f7e
·
verified ·
1 Parent(s): 37f5975

Training in progress, epoch 2

Browse files
Files changed (3) hide show
  1. config.json +5 -5
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "answerdotai/ModernBERT-base",
3
  "architectures": [
4
  "ModernBertForSequenceClassification"
5
  ],
@@ -19,7 +19,7 @@
19
  "global_rope_theta": 160000.0,
20
  "gradient_checkpointing": false,
21
  "hidden_activation": "gelu",
22
- "hidden_size": 768,
23
  "id2label": {
24
  "0": "Cybercrime",
25
  "1": "Drugs",
@@ -33,7 +33,7 @@
33
  },
34
  "initializer_cutoff_factor": 2.0,
35
  "initializer_range": 0.02,
36
- "intermediate_size": 1152,
37
  "label2id": {
38
  "Cybercrime": 0,
39
  "Drugs": 1,
@@ -54,8 +54,8 @@
54
  "model_type": "modernbert",
55
  "norm_bias": false,
56
  "norm_eps": 1e-05,
57
- "num_attention_heads": 12,
58
- "num_hidden_layers": 22,
59
  "pad_token_id": 50283,
60
  "position_embedding_type": "absolute",
61
  "problem_type": "single_label_classification",
 
1
  {
2
+ "_name_or_path": "answerdotai/ModernBERT-large",
3
  "architectures": [
4
  "ModernBertForSequenceClassification"
5
  ],
 
19
  "global_rope_theta": 160000.0,
20
  "gradient_checkpointing": false,
21
  "hidden_activation": "gelu",
22
+ "hidden_size": 1024,
23
  "id2label": {
24
  "0": "Cybercrime",
25
  "1": "Drugs",
 
33
  },
34
  "initializer_cutoff_factor": 2.0,
35
  "initializer_range": 0.02,
36
+ "intermediate_size": 2624,
37
  "label2id": {
38
  "Cybercrime": 0,
39
  "Drugs": 1,
 
54
  "model_type": "modernbert",
55
  "norm_bias": false,
56
  "norm_eps": 1e-05,
57
+ "num_attention_heads": 16,
58
+ "num_hidden_layers": 28,
59
  "pad_token_id": 50283,
60
  "position_embedding_type": "absolute",
61
  "problem_type": "single_label_classification",
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:10e2f0fc8ff67073748e47a2c481930d0e6e909987bb1b294b5f1e223c411542
3
- size 598461316
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9d8f17b1cad46fa95c08e2c7e65f5255438a65e86ace86fcf58e08b918ad3093
3
+ size 1583380340
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c98919011773fa79aad9d0a2f5e350ebc3d1ef31f63a789dbf08d97f95264b8c
3
  size 5368
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:064661a9a471e66faca7c0a5236df67c5db4552a1283dd08400a3e20ff809acb
3
  size 5368