{ "os": "Linux-5.4.0-147-generic-x86_64-with-glibc2.31", "python": "3.9.16", "heartbeatAt": "2023-07-25T19:29:32.638362", "startedAt": "2023-07-25T19:29:32.561287", "docker": null, "gpu": "NVIDIA A100-SXM4-80GB", "gpu_count": 8, "cpu_count": 64, "cuda": null, "args": [ "--local_rank=0", "--train_datasets", "bt", "--model_name_or_path", "cerebras/btlm-3b-8k-base", "--max_length", "8092", "--trust_remote_code", "True", "--epochs", "3", "--per_device_train_batch_size", "2", "--per_device_eval_batch_size", "82", "--gradient_accumulation_steps", "1", "--gradient_checkpointing", "--learning_rate", "2e-5", "--lr_scheduler_type", "cosine", "--num_warmup_steps", "20", "--weight_decay", "0.0", "--seed", "42", "--output_dir", "/home/paperspace/safe-rlhf/output/sft", "--log_type", "wandb", "--log_project", "BT-Training", "--zero_stage", "3", "--bf16", "True", "--tf32", "True" ], "state": "running", "program": "-m safe_rlhf.finetune.__main__", "git": { "remote": "https://github.com/robertalanm/safe-rlhf", "commit": "4b5266714a6d66aea11ec473fe29b6b57c48e40a" }, "email": null, "root": "/home/paperspace/safe-rlhf", "host": "psiohuej6", "username": "paperspace", "executable": "/usr/bin/python3.9" }