Initial model upload

Files changed (5) hide show

config.json ADDED Viewed

+{
+	"attention_probs_dropout_prob": 0.1,
+	"hidden_act": "gelu",
+	"hidden_dropout_prob": 0.1,
+	"hidden_size": 768,
+	"initializer_range": 0.02,
+	"intermediate_size": 3072,
+	"max_position_embeddings": 512,
+	"relative_attention": true,
+	"position_buckets": 256,
+	"norm_rel_ebd": "layer_norm",
+	"share_att_key": true,
+	"pos_att_type": "p2c|c2p",
+	"layer_norm_eps": 1e-7,
+	"max_relative_positions": -1,
+	"position_biased_input": false,
+	"num_attention_heads": 12,
+	"attention_head_size": 64,
+	"num_hidden_layers": 12,
+	"type_vocab_size": 0,
+	"vocab_size": 50100,
+	"model_type": "deberta-v2",
+	"architectures": ["DebertaV2Model"],
+	"tokenizer_class": "DebertaV2Tokenizer"
+}

pytorch.model-230000.bin ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:188586666f4047ab4e36e7d5bb956e80c7f1d41a9f404ef7dba07d8f37ebb9da
+size 249956079

sentencepiece.model ADDED Viewed

+version https://git-lfs.github.com/spec/v1
+oid sha256:53943749cee1a32c11d02d56c2cef3420fdc42a572685d2829e1bc95f29f44d6
+size 1519783

tokenizer_config.json ADDED Viewed

+{
+  "model_max_length": 512,
+  "padding_side": "right",
+  "truncation_side": "right"
+}

vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff