{
  "architectures": [
    "OBILanguageModel"
  ],
  "auto_map": {
    "AutoConfig": "modelConfig.OBIConfig",
    "AutoModel": "modelLM.OBILanguageModel",
    "AutoModelForCausalLM": "modelLM.OBILanguageModel",
    "AutoModelForQuestionAnswering": "modelLM.OBILanguageModel"
  },
  "batch_size": 24,
  "block_size": 150,
  "device": "cuda",
  "eval_interval": 500,
  "hidden_dropout_prob": 0.1,
  "hidden_size": 256,
  "learning_rate": 0.001,
  "max_iters": 20000,
  "num_attention_heads": 32,
  "num_hidden_layers": 24,
  "torch_dtype": "float32",
  "transformers_version": "4.34.0",
  "vocab_size": 5000
}
|