pietrolesci committed
Commit 7806f40 • 1 Parent(s): 253cf88
Upload folder using huggingface_hub
- README.md +46 -0
- hparams.yaml +63 -0
- main.log +140 -0
- tb_logs/version_0/events.out.tfevents.1713881489.dev-gpu-pl487.1865581.0 +3 -0
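The commit message refers to the `huggingface_hub` upload API. A minimal sketch of pushing a run folder this way is given below; the local folder path and target repo id are illustrative assumptions, not values recorded in this commit.

```python
from huggingface_hub import HfApi

# Sketch: push a local run directory to the Hub with huggingface_hub.
# folder_path and repo_id are assumed for illustration only.
api = HfApi()
api.upload_folder(
    folder_path="outputs/roberta-base_2024-04-23T15-11-06",  # assumed local run dir
    repo_id="pietrolesci/mnli_roberta-base",                  # assumed target repo
    commit_message="Upload folder using huggingface_hub",
)
```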
README.md
ADDED
@@ -0,0 +1,46 @@
## Run info
- complete_hash: b97998c098e0d34fa00d918d670b8f9b
- short_hash: b9799b8f9b

### Configuration
```yaml
data:
  batch_size: 32
  data_seed: 42
  drop_last: false
  eval_batch_size: 128
  max_length: 512
  multiprocessing_context: null
  num_workers: 8
  persistent_workers: false
  pin_memory: true
  replacement: false
  shuffle: true
dataset: mnli
estimator:
  accelerator: gpu
  convert_to_bettertransformer: false
  deterministic: true
  precision: bf16-true
  tf32_mode: high
fit:
  enable_progress_bar: true
  limit_train_batches: null
  log_interval: 100
  max_epochs: 20
  min_epochs: null
  optimizer_kwargs:
    init_kwargs:
      fused: true
    lr: 3.0e-05
    name: adamw
  scheduler_kwargs:
    name: constant_schedule_with_warmup
    num_warmup_steps: 2000
model:
  base_model: roberta-base
  name: roberta-base
  revision: null
  seed: 42
seed: 42
```
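The `optimizer_kwargs` and `scheduler_kwargs` entries map onto standard PyTorch and `transformers` objects. The sketch below shows one way such a block could be turned into an optimizer and learning-rate schedule; it assumes the config is available as the companion `hparams.yaml` file, and the project's actual training code (not part of this commit) may differ.

```python
import yaml
import torch
from transformers import AutoModelForSequenceClassification, get_constant_schedule_with_warmup

# Load the run configuration shipped with this commit.
with open("hparams.yaml") as f:
    cfg = yaml.safe_load(f)

# MNLI has 3 labels (entailment / neutral / contradiction).
model = AutoModelForSequenceClassification.from_pretrained(cfg["model"]["name"], num_labels=3)

# adamw with lr=3e-5 and fused=True, as in the config above.
opt_cfg = cfg["fit"]["optimizer_kwargs"]
optimizer = torch.optim.AdamW(model.parameters(), lr=opt_cfg["lr"], **opt_cfg["init_kwargs"])

# constant_schedule_with_warmup with 2000 warmup steps.
sched_cfg = cfg["fit"]["scheduler_kwargs"]
scheduler = get_constant_schedule_with_warmup(optimizer, num_warmup_steps=sched_cfg["num_warmup_steps"])
```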
hparams.yaml
ADDED
@@ -0,0 +1,63 @@
experiment_group: training
run_name: roberta-base_2024-04-23T15-11-06
seed: 42
model:
  name: roberta-base
  revision: null
  seed: 42
  base_model: roberta-base
estimator:
  accelerator: gpu
  precision: bf16-true
  deterministic: true
  tf32_mode: high
  convert_to_bettertransformer: false
fit:
  max_epochs: 20
  min_epochs: null
  optimizer_kwargs:
    name: adamw
    lr: 3.0e-05
    init_kwargs:
      fused: true
  scheduler_kwargs:
    name: constant_schedule_with_warmup
    num_warmup_steps: 2000
  log_interval: 100
  enable_progress_bar: true
  limit_train_batches: null
data:
  batch_size: 32
  eval_batch_size: 128
  shuffle: true
  replacement: false
  data_seed: 42
  drop_last: false
  num_workers: 8
  pin_memory: true
  persistent_workers: false
  multiprocessing_context: null
  max_length: 512
root_path: /home/pl487/coreset-project
data_path: /home/pl487/coreset-project/data/processed
dataset: mnli
dataset_split: train
evaluation: null
loggers:
  tensorboard:
    _target_: energizer.loggers.TensorBoardLogger
    root_dir: ./
    name: tb_logs
    version: null
callbacks:
  timer:
    _target_: energizer.active_learning.callbacks.Timer
  lr_monitor:
    _target_: energizer.callbacks.lr_monitor.LearningRateMonitor
  model_checkpoint:
    _target_: energizer.callbacks.model_checkpoint.ModelCheckpoint
    dirpath: .checkpoints
    stage: train
    frequency: 1:epoch
user:
  id: pl487
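The `_target_` fields follow Hydra's instantiation convention: each block names a class that is constructed with the remaining keys as keyword arguments. A minimal sketch of that mechanism (assuming `hydra`, `omegaconf`, and the `energizer` package are installed; whether the project instantiates these blocks exactly this way is not shown in this commit):

```python
from omegaconf import OmegaConf
from hydra.utils import instantiate

# Load the hyperparameter file above and build the logger/callback objects
# from their _target_ entries. Requires the energizer package to be importable.
cfg = OmegaConf.load("hparams.yaml")

loggers = [instantiate(lg) for lg in cfg.loggers.values()]      # TensorBoardLogger(root_dir="./", name="tb_logs", ...)
callbacks = [instantiate(cb) for cb in cfg.callbacks.values()]  # Timer, LearningRateMonitor, ModelCheckpoint
```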
main.log
ADDED
@@ -0,0 +1,140 @@
[2024-04-23 15:11:06,594][hydra][INFO] -
experiment_group: training
run_name: roberta-base_2024-04-23T15-11-06
seed: 42
model:
  name: roberta-base
  revision: null
  seed: 42
  base_model: roberta-base
estimator:
  accelerator: gpu
  precision: bf16-true
  deterministic: true
  tf32_mode: high
  convert_to_bettertransformer: false
fit:
  max_epochs: 20
  min_epochs: null
  optimizer_kwargs:
    name: adamw
    lr: 3.0e-05
    init_kwargs:
      fused: true
  scheduler_kwargs:
    name: constant_schedule_with_warmup
    num_warmup_steps: 2000
  log_interval: 100
  enable_progress_bar: true
  limit_train_batches: null
data:
  batch_size: 32
  eval_batch_size: 128
  shuffle: true
  replacement: false
  data_seed: 42
  drop_last: false
  num_workers: 8
  pin_memory: true
  persistent_workers: false
  multiprocessing_context: null
  max_length: 512
root_path: /home/pl487/coreset-project
data_path: /home/pl487/coreset-project/data/processed
dataset: mnli
dataset_split: train
evaluation: null
loggers:
  tensorboard:
    _target_: energizer.loggers.TensorBoardLogger
    root_dir: ./
    name: tb_logs
    version: null
callbacks:
  timer:
    _target_: energizer.active_learning.callbacks.Timer
  lr_monitor:
    _target_: energizer.callbacks.lr_monitor.LearningRateMonitor
  model_checkpoint:
    _target_: energizer.callbacks.model_checkpoint.ModelCheckpoint
    dirpath: .checkpoints
    stage: train
    frequency: 1:epoch
user:
  id: pl487

======================================================================
[2024-04-23 15:11:06,595][hydra][INFO] - Seed enabled: 42
[2024-04-23 15:11:06,963][hydra][INFO] - Label distribution:
{<RunningStage.TRAIN: 'train'>: {'0-(entailment)': 130899, '1-(neutral)': 130900, '2-(contradiction)': 130903}}
[2024-04-23 15:11:19,109][hydra][INFO] - Loggers: [<energizer.loggers.tensorboard.TensorBoardLogger object at 0x7f86f05beb00>]
[2024-04-23 15:11:19,110][hydra][INFO] - Callbacks: [<energizer.active_learning.callbacks.Timer object at 0x7f86deae60b0>, <energizer.callbacks.lr_monitor.LearningRateMonitor object at 0x7f86deae6110>, <energizer.callbacks.model_checkpoint.ModelCheckpoint object at 0x7f86deae6620>]
[2024-04-23 15:11:19,113][hydra][INFO] - Model summary:
Total num params: 124.6M
Of which trainable: 124.6M
With a memory footprint of 0.25GB
Total memory allocated 0.77GB
[2024-04-23 15:11:19,754][hydra][INFO] - Dataloading params:
SequenceClassificationDataloaderArgs(batch_size=32, eval_batch_size=128, num_workers=8, pin_memory=True, drop_last=False, persistent_workers=False, shuffle=True, replacement=False, data_seed=42, multiprocessing_context=None, max_length=512)
[2024-04-23 15:11:19,760][hydra][INFO] - Batch:
{<InputKeys.INPUT_IDS: 'input_ids'>: tensor([[ 0, 3056, 37463, 14, 18, 761, 9, 4678, 939, 1266,
        51, 214, 190, 3406, 24, 7, 7, 147, 122, 37463,
        14, 51, 26112, 15, 1012, 47, 216, 114, 110, 114,
        47, 37463, 47, 216, 33, 626, 42, 50, 114, 47,
        240, 42, 37463, 37463, 52, 581, 14811, 13, 47, 8,
        47, 218, 75, 33, 7, 582, 201, 3867, 47, 53,
        172, 99, 51, 218, 75, 1137, 47, 16, 14, 114,
        47, 114, 51, 339, 47, 492, 106, 23, 513, 10,
        371, 9, 5, 9, 5, 631, 14, 51, 339, 98,
        1437, 939, 218, 75, 216, 24, 16, 37463, 24, 18,
        562, 7, 28, 55, 265, 122, 1195, 87, 37463, 888,
        37463, 4098, 19, 5, 1846, 87, 19, 37463, 7252, 5,
        37463, 8653, 51, 5, 5, 3969, 32, 95, 11, 24,
        13, 5, 418, 1437, 939, 437, 939, 437, 7013, 939,
        216, 939, 939, 2854, 19, 47, 939, 206, 47, 214,
        588, 47, 214, 182, 235, 14, 5, 3770, 197, 939,
        206, 51, 197, 33, 41, 3871, 1280, 9, 47, 216,
        2085, 51, 64, 33, 10, 367, 53, 939, 206, 144,
        9, 106, 197, 28, 45, 37463, 3969, 11, 5, 754,
        8, 14, 18, 169, 169, 51, 348, 5335, 88, 2302,
        24, 18, 142, 9, 5, 5, 488, 383, 47, 216,
        5, 37482, 8, 960, 53, 37463, 53, 117, 939, 216,
        52, 24, 7252, 52, 214, 11, 4788, 8, 37463, 52,
        33, 5, 276, 631, 22002, 154, 8, 8, 37463, 51,
        32, 6901, 106, 66, 939, 1266, 95, 5, 1675, 2878,
        3645, 631, 51, 905, 106, 66, 142, 9, 51, 218,
        75, 33, 143, 317, 7, 489, 7, 342, 106, 98,
        4909, 14, 115, 47, 216, 37463, 3867, 37463, 57, 10,
        538, 2970, 53, 37463, 37463, 190, 5, 181, 6502, 352,
        410, 2682, 939, 1266, 5, 5, 1669, 14, 13585, 452,
        11, 730, 16, 5, 1802, 8, 14051, 14, 189, 28,
        549, 24, 18, 10, 6279, 50, 2196, 50, 3046, 1493,
        7252, 51, 32, 5, 1980, 14, 32, 164, 7, 582,
        8, 51, 32, 5, 65, 14, 32, 164, 7, 6297,
        8, 5, 97, 621, 47, 216, 114, 51, 582, 114,
        51, 114, 51, 37463, 2237, 106, 37463, 8, 37463, 172,
        5, 47, 216, 86, 5, 488, 1239, 81, 37463, 457,
        5, 86, 37463, 51, 1169, 905, 106, 213, 50, 51,
        120, 160, 19, 10, 10, 3645, 142, 51, 348, 56,
        10, 2470, 14, 47, 216, 2653, 14, 14, 51, 3559,
        75, 70, 561, 77, 51, 222, 24, 2, 2, 100,
        206, 14, 89, 197, 28, 41, 3871, 8985, 9, 14218,
        11, 84, 3770, 4, 2]]), <InputKeys.ATT_MASK: 'attention_mask'>: tensor([[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
        1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]]), <InputKeys.LABELS: 'labels'>: tensor([0]), <InputKeys.ON_CPU: 'on_cpu'>: {<SpecialKeys.ID: 'uid'>: [221950]}}
[2024-04-23 20:57:35,566][hydra][INFO] - Training complete
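The label distribution above implies 130,899 + 130,900 + 130,903 = 392,702 training examples. A quick back-of-the-envelope check of the schedule implied by the config (a sketch only; the trainer's exact step accounting is not shown in this log):

```python
import math

# Figures taken from the label-distribution and config lines above.
num_examples = 130_899 + 130_900 + 130_903  # 392,702 MNLI training examples
batch_size = 32
max_epochs = 20
num_warmup_steps = 2_000

steps_per_epoch = math.ceil(num_examples / batch_size)  # drop_last: false -> ceil
total_steps = steps_per_epoch * max_epochs

print(steps_per_epoch)                 # 12272 optimisation steps per epoch
print(total_steps)                     # 245440 steps over 20 epochs
print(num_warmup_steps / total_steps)  # warmup covers roughly 0.8% of training
```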
tb_logs/version_0/events.out.tfevents.1713881489.dev-gpu-pl487.1865581.0
ADDED
@@ -0,0 +1,3 @@
version https://git-lfs.github.com/spec/v1
oid sha256:ce788d1e3351858236cf312c2923a9c037c088eb82249cdb01fed9520a256f5f
size 1855634
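This entry is a git-LFS pointer, so the actual TensorBoard event file has to be fetched before it can be inspected. A minimal sketch of reading it with TensorBoard's `EventAccumulator` (the repo id below is an assumed placeholder, and the scalar tag names depend on the logger, so they are not recoverable from the pointer itself):

```python
from huggingface_hub import hf_hub_download
from tensorboard.backend.event_processing.event_accumulator import EventAccumulator

# Download the LFS-backed event file from the Hub.
path = hf_hub_download(
    repo_id="pietrolesci/mnli_roberta-base",  # assumed repo id
    filename="tb_logs/version_0/events.out.tfevents.1713881489.dev-gpu-pl487.1865581.0",
)

# Load the event file and list the scalar tags it contains.
ea = EventAccumulator(path)
ea.Reload()
print(ea.Tags()["scalars"])  # e.g. loss / learning-rate curves, depending on what was logged
```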