anamelchor committed on Mar 5

Commit

229dbcd

•

1 Parent(s): b7fe036

Training in progress, epoch 4

Browse files

Files changed (47) hide show

model.safetensors +1 -1
run-0/checkpoint-108/config.json +27 -0
run-0/checkpoint-108/model.safetensors +3 -0
run-0/checkpoint-108/optimizer.pt +3 -0
run-0/checkpoint-108/rng_state.pth +3 -0
run-0/checkpoint-108/scheduler.pt +3 -0
run-0/checkpoint-108/special_tokens_map.json +7 -0
run-0/checkpoint-108/tokenizer.json +0 -0
run-0/checkpoint-108/tokenizer_config.json +55 -0
run-0/checkpoint-108/trainer_state.json +44 -0
run-0/checkpoint-108/training_args.bin +3 -0
run-0/checkpoint-108/vocab.txt +0 -0
run-0/checkpoint-162/config.json +27 -0
run-0/checkpoint-162/model.safetensors +3 -0
run-0/checkpoint-162/optimizer.pt +3 -0
run-0/checkpoint-162/rng_state.pth +3 -0
run-0/checkpoint-162/scheduler.pt +3 -0
run-0/checkpoint-162/special_tokens_map.json +7 -0
run-0/checkpoint-162/tokenizer.json +0 -0
run-0/checkpoint-162/tokenizer_config.json +55 -0
run-0/checkpoint-162/trainer_state.json +53 -0
run-0/checkpoint-162/training_args.bin +3 -0
run-0/checkpoint-162/vocab.txt +0 -0
run-0/checkpoint-216/config.json +27 -0
run-0/checkpoint-216/model.safetensors +3 -0
run-0/checkpoint-216/optimizer.pt +3 -0
run-0/checkpoint-216/rng_state.pth +3 -0
run-0/checkpoint-216/scheduler.pt +3 -0
run-0/checkpoint-216/special_tokens_map.json +7 -0
run-0/checkpoint-216/tokenizer.json +0 -0
run-0/checkpoint-216/tokenizer_config.json +55 -0
run-0/checkpoint-216/trainer_state.json +62 -0
run-0/checkpoint-216/training_args.bin +3 -0
run-0/checkpoint-216/vocab.txt +0 -0
run-0/checkpoint-54/config.json +27 -0
run-0/checkpoint-54/model.safetensors +3 -0
run-0/checkpoint-54/optimizer.pt +3 -0
run-0/checkpoint-54/rng_state.pth +3 -0
run-0/checkpoint-54/scheduler.pt +3 -0
run-0/checkpoint-54/special_tokens_map.json +7 -0
run-0/checkpoint-54/tokenizer.json +0 -0
run-0/checkpoint-54/tokenizer_config.json +55 -0
run-0/checkpoint-54/trainer_state.json +35 -0
run-0/checkpoint-54/training_args.bin +3 -0
run-0/checkpoint-54/vocab.txt +0 -0
runs/Mar05_08-21-06_22d65867544c/events.out.tfevents.1709627028.22d65867544c.687.2 +3 -0
training_args.bin +1 -1

model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:63de5e608cd3b7088c60a27fbcdcbdb0e534a91d291e0cd8d5bbc5ed3ccc9fab
+oid sha256:7ce6a4f7e7eb4cbc9bfe52e450da2cd3e0a7dd1778c413ad54dfcb3dae6ff8f8
 size 437958648

run-0/checkpoint-108/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-0/checkpoint-108/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5e2165cc9e251dead5cfd6e846a484327e47100c99a4e9f4edcca314b76e7fa9
+size 437958648

run-0/checkpoint-108/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c51bf92baf54492ccf59e7144fd46eb93b382d77fff5328dedd705915ae16b0a
+size 876038394

run-0/checkpoint-108/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8a6a90c7db61f2f3a79f110f835edf45315a90589b0a7d896fa2bf6a3cd8616c
+size 14244

run-0/checkpoint-108/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:208286f847429d5827f0b40bef044476821b45ef90411d495bc117b95392f230
+size 1064

run-0/checkpoint-108/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-108/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-108/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-108/trainer_state.json ADDED Viewed

	@@ -0,0 +1,44 @@

+{
+  "best_metric": 0.41511377999074933,
+  "best_model_checkpoint": "bert-base-uncased-finetuned-cola/run-0/checkpoint-54",
+  "epoch": 2.0,
+  "eval_steps": 500,
+  "global_step": 108,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5203360915184021,
+      "eval_matthews_correlation": 0.41511377999074933,
+      "eval_runtime": 1.9904,
+      "eval_samples_per_second": 524.008,
+      "eval_steps_per_second": 33.159,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5846976637840271,
+      "eval_matthews_correlation": 0.37671460599948314,
+      "eval_runtime": 1.6504,
+      "eval_samples_per_second": 631.971,
+      "eval_steps_per_second": 39.991,
+      "step": 108
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 270,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.1361563767542035e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 16,
+    "seed": 4
+  }
+}

run-0/checkpoint-108/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b6505b8e73320ba9e2d171cca238eeff0ac60122b6fd186ebd38cd529d9a067
+size 4920

run-0/checkpoint-108/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-162/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-0/checkpoint-162/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:be229f1c869a5493d3b04b897d7c4680ababb73731fcb02136141635eecb3bc6
+size 437958648

run-0/checkpoint-162/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:5295ec51c7b88617a633b69010ea0284e2df9c7db61563af84683b1744f87133
+size 876038394

run-0/checkpoint-162/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:71bc21f12db6819963eaaefaa8c8e498703e11ff911c1c94d1e7364780ac2ae3
+size 14244

run-0/checkpoint-162/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:97d3973a6d6cc4e8c6b19dda0e98420a27516777a8de1fee1cd336e0a735c63c
+size 1064

run-0/checkpoint-162/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-162/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-162/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-162/trainer_state.json ADDED Viewed

	@@ -0,0 +1,53 @@

+{
+  "best_metric": 0.45523070208567706,
+  "best_model_checkpoint": "bert-base-uncased-finetuned-cola/run-0/checkpoint-162",
+  "epoch": 3.0,
+  "eval_steps": 500,
+  "global_step": 162,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5203360915184021,
+      "eval_matthews_correlation": 0.41511377999074933,
+      "eval_runtime": 1.9904,
+      "eval_samples_per_second": 524.008,
+      "eval_steps_per_second": 33.159,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5846976637840271,
+      "eval_matthews_correlation": 0.37671460599948314,
+      "eval_runtime": 1.6504,
+      "eval_samples_per_second": 631.971,
+      "eval_steps_per_second": 39.991,
+      "step": 108
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.8647810816764832,
+      "eval_matthews_correlation": 0.45523070208567706,
+      "eval_runtime": 2.7002,
+      "eval_samples_per_second": 386.266,
+      "eval_steps_per_second": 24.443,
+      "step": 162
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 270,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.1361563767542035e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 16,
+    "seed": 4
+  }
+}

run-0/checkpoint-162/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b6505b8e73320ba9e2d171cca238eeff0ac60122b6fd186ebd38cd529d9a067
+size 4920

run-0/checkpoint-162/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-216/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-0/checkpoint-216/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7ce6a4f7e7eb4cbc9bfe52e450da2cd3e0a7dd1778c413ad54dfcb3dae6ff8f8
+size 437958648

run-0/checkpoint-216/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:6517fffc1f6b20359a4e2a36f31cb4818625537f027080a929277cffbe4cb00a
+size 876038394

run-0/checkpoint-216/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:08f2f5c0171cd35e37325128516ee356a2973d301ceefcd04255c7208b9a80d8
+size 14244

run-0/checkpoint-216/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c22e97f8272ec0f3ce24a5b5c4c4dff3a2cdc96d778dfec7dac51821191b0f88
+size 1064

run-0/checkpoint-216/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-216/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-216/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-216/trainer_state.json ADDED Viewed

	@@ -0,0 +1,62 @@

+{
+  "best_metric": 0.45523070208567706,
+  "best_model_checkpoint": "bert-base-uncased-finetuned-cola/run-0/checkpoint-162",
+  "epoch": 4.0,
+  "eval_steps": 500,
+  "global_step": 216,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5203360915184021,
+      "eval_matthews_correlation": 0.41511377999074933,
+      "eval_runtime": 1.9904,
+      "eval_samples_per_second": 524.008,
+      "eval_steps_per_second": 33.159,
+      "step": 54
+    },
+    {
+      "epoch": 2.0,
+      "eval_loss": 0.5846976637840271,
+      "eval_matthews_correlation": 0.37671460599948314,
+      "eval_runtime": 1.6504,
+      "eval_samples_per_second": 631.971,
+      "eval_steps_per_second": 39.991,
+      "step": 108
+    },
+    {
+      "epoch": 3.0,
+      "eval_loss": 0.8647810816764832,
+      "eval_matthews_correlation": 0.45523070208567706,
+      "eval_runtime": 2.7002,
+      "eval_samples_per_second": 386.266,
+      "eval_steps_per_second": 24.443,
+      "step": 162
+    },
+    {
+      "epoch": 4.0,
+      "eval_loss": 1.0349252223968506,
+      "eval_matthews_correlation": 0.44680434771969624,
+      "eval_runtime": 1.3792,
+      "eval_samples_per_second": 756.257,
+      "eval_steps_per_second": 47.855,
+      "step": 216
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 270,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.1361563767542035e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 16,
+    "seed": 4
+  }
+}

run-0/checkpoint-216/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b6505b8e73320ba9e2d171cca238eeff0ac60122b6fd186ebd38cd529d9a067
+size 4920

run-0/checkpoint-216/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-54/config.json ADDED Viewed

	@@ -0,0 +1,27 @@

+{
+  "_name_or_path": "bert-base-uncased",
+  "architectures": [
+    "BertForSequenceClassification"
+  ],
+  "attention_probs_dropout_prob": 0.1,
+  "classifier_dropout": null,
+  "gradient_checkpointing": false,
+  "hidden_act": "gelu",
+  "hidden_dropout_prob": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "intermediate_size": 3072,
+  "layer_norm_eps": 1e-12,
+  "max_position_embeddings": 512,
+  "model_type": "bert",
+  "num_attention_heads": 12,
+  "num_hidden_layers": 12,
+  "pad_token_id": 0,
+  "position_embedding_type": "absolute",
+  "problem_type": "single_label_classification",
+  "torch_dtype": "float32",
+  "transformers_version": "4.38.2",
+  "type_vocab_size": 2,
+  "use_cache": true,
+  "vocab_size": 30522
+}

run-0/checkpoint-54/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fc61e577a9070eb5643b470443595424828357a4640ca0aa32b47482d50c1b33
+size 437958648

run-0/checkpoint-54/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a03c93e9f8a1a57ef4642f6af8e76c086f0b96cd7d58a661baa840f522ca4a73
+size 876038394

run-0/checkpoint-54/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:36a79f5f94618b996d56800eebdc41e881c20f5d187f58d4ba4a72c27648746a
+size 14244

run-0/checkpoint-54/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04f63ee999e05fbb51074bb8cfde454feae125414a25fb4795604de77682d652
+size 1064

run-0/checkpoint-54/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,7 @@

+{
+  "cls_token": "[CLS]",
+  "mask_token": "[MASK]",
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-54/tokenizer.json ADDED Viewed

The diff for this file is too large to render. See raw diff

run-0/checkpoint-54/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,55 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "[PAD]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "100": {
+      "content": "[UNK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "101": {
+      "content": "[CLS]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "102": {
+      "content": "[SEP]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "103": {
+      "content": "[MASK]",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "clean_up_tokenization_spaces": true,
+  "cls_token": "[CLS]",
+  "do_lower_case": true,
+  "mask_token": "[MASK]",
+  "model_max_length": 512,
+  "pad_token": "[PAD]",
+  "sep_token": "[SEP]",
+  "strip_accents": null,
+  "tokenize_chinese_chars": true,
+  "tokenizer_class": "BertTokenizer",
+  "unk_token": "[UNK]"
+}

run-0/checkpoint-54/trainer_state.json ADDED Viewed

	@@ -0,0 +1,35 @@

+{
+  "best_metric": 0.41511377999074933,
+  "best_model_checkpoint": "bert-base-uncased-finetuned-cola/run-0/checkpoint-54",
+  "epoch": 1.0,
+  "eval_steps": 500,
+  "global_step": 54,
+  "is_hyper_param_search": true,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 1.0,
+      "eval_loss": 0.5203360915184021,
+      "eval_matthews_correlation": 0.41511377999074933,
+      "eval_runtime": 1.9904,
+      "eval_samples_per_second": 524.008,
+      "eval_steps_per_second": 33.159,
+      "step": 54
+    }
+  ],
+  "logging_steps": 500,
+  "max_steps": 270,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 5,
+  "save_steps": 500,
+  "total_flos": 0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": {
+    "learning_rate": 4.1361563767542035e-05,
+    "num_train_epochs": 5,
+    "per_device_train_batch_size": 16,
+    "seed": 4
+  }
+}

run-0/checkpoint-54/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4b6505b8e73320ba9e2d171cca238eeff0ac60122b6fd186ebd38cd529d9a067
+size 4920

run-0/checkpoint-54/vocab.txt ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Mar05_08-21-06_22d65867544c/events.out.tfevents.1709627028.22d65867544c.687.2 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a3edf229cfaf4af857fe680ec673251f3f23dd9c28551dbe039f3ff66a698957
+size 6653

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:acc73a60c4dd966d4cd8789cb1df3c5f4fc642580e1d5e8258be0b13f81e76cd
+oid sha256:4b6505b8e73320ba9e2d171cca238eeff0ac60122b6fd186ebd38cd529d9a067
 size 4920