elyziumm committed on Feb 27, 2024

Commit

24fabe2

verified ·

1 Parent(s): c29b083

Training in progress, epoch 1

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

model.safetensors +1 -1
run-0/checkpoint-14/config.json +25 -0
run-0/checkpoint-14/model.safetensors +3 -0
run-0/checkpoint-14/optimizer.pt +3 -0
run-0/checkpoint-14/rng_state.pth +3 -0
run-0/checkpoint-14/scheduler.pt +3 -0
run-0/checkpoint-14/special_tokens_map.json +7 -0
run-0/checkpoint-14/tokenizer.json +0 -0
run-0/checkpoint-14/tokenizer_config.json +55 -0
run-0/checkpoint-14/trainer_state.json +35 -0
run-0/checkpoint-14/training_args.bin +3 -0
run-0/checkpoint-14/vocab.txt +0 -0
run-0/checkpoint-28/config.json +25 -0
run-0/checkpoint-28/model.safetensors +3 -0
run-0/checkpoint-28/optimizer.pt +3 -0
run-0/checkpoint-28/rng_state.pth +3 -0
run-0/checkpoint-28/scheduler.pt +3 -0
run-0/checkpoint-28/special_tokens_map.json +7 -0
run-0/checkpoint-28/tokenizer.json +0 -0
run-0/checkpoint-28/tokenizer_config.json +55 -0
run-0/checkpoint-28/trainer_state.json +44 -0
run-0/checkpoint-28/training_args.bin +3 -0
run-0/checkpoint-28/vocab.txt +0 -0
run-0/checkpoint-42/config.json +25 -0
run-0/checkpoint-42/model.safetensors +3 -0
run-0/checkpoint-42/optimizer.pt +3 -0
run-0/checkpoint-42/rng_state.pth +3 -0
run-0/checkpoint-42/scheduler.pt +3 -0
run-0/checkpoint-42/special_tokens_map.json +7 -0
run-0/checkpoint-42/tokenizer.json +0 -0
run-0/checkpoint-42/tokenizer_config.json +55 -0
run-0/checkpoint-42/trainer_state.json +53 -0
run-0/checkpoint-42/training_args.bin +3 -0
run-0/checkpoint-42/vocab.txt +0 -0
run-1/checkpoint-108/config.json +25 -0
run-1/checkpoint-108/model.safetensors +3 -0
run-1/checkpoint-108/optimizer.pt +3 -0
run-1/checkpoint-108/rng_state.pth +3 -0
run-1/checkpoint-108/scheduler.pt +3 -0
run-1/checkpoint-108/special_tokens_map.json +7 -0
run-1/checkpoint-108/tokenizer.json +0 -0
run-1/checkpoint-108/tokenizer_config.json +55 -0
run-1/checkpoint-108/trainer_state.json +44 -0
run-1/checkpoint-108/training_args.bin +3 -0
run-1/checkpoint-108/vocab.txt +0 -0
run-1/checkpoint-162/config.json +25 -0
run-1/checkpoint-162/model.safetensors +3 -0
run-1/checkpoint-162/optimizer.pt +3 -0
run-1/checkpoint-162/rng_state.pth +3 -0
run-1/checkpoint-162/scheduler.pt +3 -0

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:311ad80eeced418e5b8f6bf3ce220992709c68d22449620c8792ba85dcad9937
 size 267832560

 version https://git-lfs.github.com/spec/v1
+oid sha256:0bb34911143ff7176ccd35a81ba127c7c06efc0693c31ce6ca68c573d8e935fb
 size 267832560

run-0/checkpoint-14/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-0/checkpoint-14/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:53bf9cf4a8f2d497d9b7e6d6925c26422440051f7b16bdeb792cb8546d1d4dd8
+size 267832560

run-0/checkpoint-14/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fb3ce376d006ef078685bf78acdd3f5e5b1f663aaa3fbbda7ed1baaaf086a1af
+size 535727290

run-0/checkpoint-14/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:27ecb4a31ae02b837820166556ddb603e86a471d753f4c4cf3b72ab71058338b
+size 14308

run-0/checkpoint-14/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b1240b0cc17a1c00a7f8941fbc8f6072f1feba3ab69d5a1a418614cfcf591387
+size 1064

run-0/checkpoint-14/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-14/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-14/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-14/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": -0.049473020853933444,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-0/checkpoint-14",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 14,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.693752646446228,
+      "eval_matthews_correlation": -0.049473020853933444,
+      "eval_runtime": 0.7156,
+      "eval_samples_per_second": 1457.617,
+      "eval_steps_per_second": 92.237,
+      "step": 14
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 42,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.8537810359672543e-06,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 64,
+    "seed": 24
+  }
+}

run-0/checkpoint-14/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ab15ea8b3b6e887d3f4c7d1a4a5b4259c31785b612e2554bf41e26b00703d40b
+size 4984

run-0/checkpoint-14/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-28/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-0/checkpoint-28/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c8a5ab67a0d630b790552c5f6b598c5e3912913235c419748b594ce2eabde219
+size 267832560

run-0/checkpoint-28/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:311b94f047bd7287937bf0e3f01854c48d9bd4efd4195bbddcef898e086e0eab
+size 535727290

run-0/checkpoint-28/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:565af3c076060d6c9573103827473fbcf37dcb4502a44c9fb7264192acec0e73
+size 14308

run-0/checkpoint-28/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2a6ed42a9057bb3fcc0e6542a39aa3a6063692c59f660cccf0073fa0f2570618
+size 1064

run-0/checkpoint-28/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-28/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-28/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-28/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": -0.01620482918319043,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-0/checkpoint-28",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 28,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.693752646446228,
+      "eval_matthews_correlation": -0.049473020853933444,
+      "eval_runtime": 0.7156,
+      "eval_samples_per_second": 1457.617,
+      "eval_steps_per_second": 92.237,
+      "step": 14
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.681831955909729,
+      "eval_matthews_correlation": -0.01620482918319043,
+      "eval_runtime": 0.7313,
+      "eval_samples_per_second": 1426.325,
+      "eval_steps_per_second": 90.256,
+      "step": 28
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 42,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.8537810359672543e-06,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 64,
+    "seed": 24
+  }
+}

run-0/checkpoint-28/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ab15ea8b3b6e887d3f4c7d1a4a5b4259c31785b612e2554bf41e26b00703d40b
+size 4984

run-0/checkpoint-28/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-42/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-0/checkpoint-42/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8df601be148323e1e9563e7bb60cc5d070bf81507b72724382413b689217cf89
+size 267832560

run-0/checkpoint-42/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc084385d9f3bf22dae76b60956c8f865064f28ed80642ae7f8d3bc415e97de1
+size 535727290

run-0/checkpoint-42/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:d7423ba5525b03a6c7a55b109b1a55a96190d3acd042fd60b80c775d6cce8194
+size 14308

run-0/checkpoint-42/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:3125f8bab7fa1cd2bad6911f8c822a67f2face52975dd659eb57f1516b5c6d27
+size 1064

run-0/checkpoint-42/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-42/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-42/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-42/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": -0.01620482918319043,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-0/checkpoint-28",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 42,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.693752646446228,
+      "eval_matthews_correlation": -0.049473020853933444,
+      "eval_runtime": 0.7156,
+      "eval_samples_per_second": 1457.617,
+      "eval_steps_per_second": 92.237,
+      "step": 14
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.681831955909729,
+      "eval_matthews_correlation": -0.01620482918319043,
+      "eval_runtime": 0.7313,
+      "eval_samples_per_second": 1426.325,
+      "eval_steps_per_second": 90.256,
+      "step": 28
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.6774820685386658,
+      "eval_matthews_correlation": -0.07487637328811393,
+      "eval_runtime": 0.7898,
+      "eval_samples_per_second": 1320.614,
+      "eval_steps_per_second": 83.567,
+      "step": 42
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 42,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 3,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 64,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 1.8537810359672543e-06,
+    "num_train_epochs": 3,
+    "per_device_train_batch_size": 64,
+    "seed": 24
+  }
+}

run-0/checkpoint-42/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ab15ea8b3b6e887d3f4c7d1a4a5b4259c31785b612e2554bf41e26b00703d40b
+size 4984

run-0/checkpoint-42/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-108/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-1/checkpoint-108/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fa59baf00d49c2c43f1a9e2e2e5debb4996a98ab59b4fe48b822279e0499003e
+size 267832560

run-1/checkpoint-108/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6c72146c7a6057facbbaccf5a7abe1d69d99a38f26dd6d1a67a63b981864368a
+size 535727290

run-1/checkpoint-108/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:00e7e60447fe6b0b398d23f91b0df5696220d68e25fe4da0911193612264b803
+size 14244

run-1/checkpoint-108/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4e0b353d7686c1ff2243ea07536737d287529e857de5097a25be7817f1ac6dfe
+size 1064

run-1/checkpoint-108/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-108/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-108/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "DistilBertTokenizer",
+  "unk_token": "[UNK]"
+}

run-1/checkpoint-108/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.06558874629318973,
+  "best_model_checkpoint": "distilbert-base-uncased-finetuned-cola/run-1/checkpoint-108",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 108,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.6013498306274414,
+      "eval_matthews_correlation": 0.0,
+      "eval_runtime": 0.7736,
+      "eval_samples_per_second": 1348.188,
+      "eval_steps_per_second": 85.312,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5713459849357605,
+      "eval_matthews_correlation": 0.06558874629318973,
+      "eval_runtime": 0.7811,
+      "eval_samples_per_second": 1335.339,
+      "eval_steps_per_second": 84.499,
+      "step": 108
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 216,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 4,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 9.949027266163136e-06,
+    "num_train_epochs": 4,
+    "per_device_train_batch_size": 16,
+    "seed": 28
+  }
+}

run-1/checkpoint-108/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f5bd187b1e21f30e375b298fae3a1c88f13a4d7d49c0628ce83bef9b8e92f084
+size 4984

run-1/checkpoint-108/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-1/checkpoint-162/config.json ADDED Viewed

	@@ -0,0 +1,25 @@

+{
+  "_name_or_path": "distilbert-base-uncased",
+  "activation": "gelu",
+  "architectures": [
+    "DistilBertForSequenceClassification"
+  ],
+  "attention_dropout": 0.1,
+  "dim": 768,
+  "dropout": 0.1,
+  "hidden_dim": 3072,
+  "initializer_range": 0.02,
+  "max_position_embeddings": 512,
+  "model_type": "distilbert",
+  "n_heads": 12,
+  "n_layers": 6,
+  "pad_token_id": 0,
+  "problem_type": "single_label_classification",
+  "qa_dropout": 0.1,
+  "seq_classif_dropout": 0.2,
+  "sinusoidal_pos_embds": false,
+  "tie_weights_": true,
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.1",
+  "vocab_size": 30522
+}

run-1/checkpoint-162/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b5531e0b7298af00d2a7275d87d1e219c5b8006b6ad02ae60ed18916490e1828
+size 267832560

run-1/checkpoint-162/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:57fb93d0d5e4cb45bfe34dee0c44232b0e19bb78a7eac7fe6d75c3b2b9a00e24
+size 535727290

run-1/checkpoint-162/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:210f6311babf339b2041dd94e325452cfc47bb4600ce72bcc997b3fc1f605149
+size 14244

run-1/checkpoint-162/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:64b866b7bfef3029bf9cd974b27d5fb68e9f437c380516c7eb4b6809e62483c1
+size 1064