File size: 7,742 Bytes

7806f40

[2024-04-23 15:11:06,594][hydra][INFO] - 
experiment_group: training
run_name: roberta-base_2024-04-23T15-11-06
seed: 42
model:
  name: roberta-base
  revision: null
  seed: 42
  base_model: roberta-base
estimator:
  accelerator: gpu
  precision: bf16-true
  deterministic: true
  tf32_mode: high
  convert_to_bettertransformer: false
fit:
  max_epochs: 20
  min_epochs: null
  optimizer_kwargs:
    name: adamw
    lr: 3.0e-05
    init_kwargs:
      fused: true
  scheduler_kwargs:
    name: constant_schedule_with_warmup
    num_warmup_steps: 2000
  log_interval: 100
  enable_progress_bar: true
  limit_train_batches: null
data:
  batch_size: 32
  eval_batch_size: 128
  shuffle: true
  replacement: false
  data_seed: 42
  drop_last: false
  num_workers: 8
  pin_memory: true
  persistent_workers: false
  multiprocessing_context: null
  max_length: 512
root_path: /home/pl487/coreset-project
data_path: /home/pl487/coreset-project/data/processed
dataset: mnli
dataset_split: train
evaluation: null
loggers:
  tensorboard:
    _target_: energizer.loggers.TensorBoardLogger
    root_dir: ./
    name: tb_logs
    version: null
callbacks:
  timer:
    _target_: energizer.active_learning.callbacks.Timer
  lr_monitor:
    _target_: energizer.callbacks.lr_monitor.LearningRateMonitor
  model_checkpoint:
    _target_: energizer.callbacks.model_checkpoint.ModelCheckpoint
    dirpath: .checkpoints
    stage: train
    frequency: 1:epoch
user:
  id: pl487

======================================================================
[2024-04-23 15:11:06,595][hydra][INFO] - Seed enabled: 42
[2024-04-23 15:11:06,963][hydra][INFO] - Label distribution:
{<RunningStage.TRAIN: 'train'>: {'0-(entailment)': 130899, '1-(neutral)': 130900, '2-(contradiction)': 130903}}
[2024-04-23 15:11:19,109][hydra][INFO] - Loggers: [<energizer.loggers.tensorboard.TensorBoardLogger object at 0x7f86f05beb00>]
[2024-04-23 15:11:19,110][hydra][INFO] - Callbacks: [<energizer.active_learning.callbacks.Timer object at 0x7f86deae60b0>, <energizer.callbacks.lr_monitor.LearningRateMonitor object at 0x7f86deae6110>, <energizer.callbacks.model_checkpoint.ModelCheckpoint object at 0x7f86deae6620>]
[2024-04-23 15:11:19,113][hydra][INFO] - Model summary:
Total num params: 124.6M
Of which trainable: 124.6M
With a memory footprint of 0.25GB
Total memory allocated 0.77GB
[2024-04-23 15:11:19,754][hydra][INFO] - Dataloading params:
SequenceClassificationDataloaderArgs(batch_size=32, eval_batch_size=128, num_workers=8, pin_memory=True, drop_last=False, persistent_workers=False, shuffle=True, replacement=False, data_seed=42, multiprocessing_context=None, max_length=512)
[2024-04-23 15:11:19,760][hydra][INFO] - Batch:
{<InputKeys.INPUT_IDS: 'input_ids'>: tensor([[    0,  3056, 37463,    14,    18,   761,     9,  4678,   939,  1266,
            51,   214,   190,  3406,    24,     7,     7,   147,   122, 37463,
            14,    51, 26112,    15,  1012,    47,   216,   114,   110,   114,
            47, 37463,    47,   216,    33,   626,    42,    50,   114,    47,
           240,    42, 37463, 37463,    52,   581, 14811,    13,    47,     8,
            47,   218,    75,    33,     7,   582,   201,  3867,    47,    53,
           172,    99,    51,   218,    75,  1137,    47,    16,    14,   114,
            47,   114,    51,   339,    47,   492,   106,    23,   513,    10,
           371,     9,     5,     9,     5,   631,    14,    51,   339,    98,
          1437,   939,   218,    75,   216,    24,    16, 37463,    24,    18,
           562,     7,    28,    55,   265,   122,  1195,    87, 37463,   888,
         37463,  4098,    19,     5,  1846,    87,    19, 37463,  7252,     5,
         37463,  8653,    51,     5,     5,  3969,    32,    95,    11,    24,
            13,     5,   418,  1437,   939,   437,   939,   437,  7013,   939,
           216,   939,   939,  2854,    19,    47,   939,   206,    47,   214,
           588,    47,   214,   182,   235,    14,     5,  3770,   197,   939,
           206,    51,   197,    33,    41,  3871,  1280,     9,    47,   216,
          2085,    51,    64,    33,    10,   367,    53,   939,   206,   144,
             9,   106,   197,    28,    45, 37463,  3969,    11,     5,   754,
             8,    14,    18,   169,   169,    51,   348,  5335,    88,  2302,
            24,    18,   142,     9,     5,     5,   488,   383,    47,   216,
             5, 37482,     8,   960,    53, 37463,    53,   117,   939,   216,
            52,    24,  7252,    52,   214,    11,  4788,     8, 37463,    52,
            33,     5,   276,   631, 22002,   154,     8,     8, 37463,    51,
            32,  6901,   106,    66,   939,  1266,    95,     5,  1675,  2878,
          3645,   631,    51,   905,   106,    66,   142,     9,    51,   218,
            75,    33,   143,   317,     7,   489,     7,   342,   106,    98,
          4909,    14,   115,    47,   216, 37463,  3867, 37463,    57,    10,
           538,  2970,    53, 37463, 37463,   190,     5,   181,  6502,   352,
           410,  2682,   939,  1266,     5,     5,  1669,    14, 13585,   452,
            11,   730,    16,     5,  1802,     8, 14051,    14,   189,    28,
           549,    24,    18,    10,  6279,    50,  2196,    50,  3046,  1493,
          7252,    51,    32,     5,  1980,    14,    32,   164,     7,   582,
             8,    51,    32,     5,    65,    14,    32,   164,     7,  6297,
             8,     5,    97,   621,    47,   216,   114,    51,   582,   114,
            51,   114,    51, 37463,  2237,   106, 37463,     8, 37463,   172,
             5,    47,   216,    86,     5,   488,  1239,    81, 37463,   457,
             5,    86, 37463,    51,  1169,   905,   106,   213,    50,    51,
           120,   160,    19,    10,    10,  3645,   142,    51,   348,    56,
            10,  2470,    14,    47,   216,  2653,    14,    14,    51,  3559,
            75,    70,   561,    77,    51,   222,    24,     2,     2,   100,
           206,    14,    89,   197,    28,    41,  3871,  8985,     9, 14218,
            11,    84,  3770,     4,     2]]), <InputKeys.ATT_MASK: 'attention_mask'>: tensor([[1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1,
         1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1]]), <InputKeys.LABELS: 'labels'>: tensor([0]), <InputKeys.ON_CPU: 'on_cpu'>: {<SpecialKeys.ID: 'uid'>: [221950]}}
[2024-04-23 20:57:35,566][hydra][INFO] - Training complete