{ "os": "Linux-6.8.0-48-generic-x86_64-with-glibc2.39", "python": "3.10.0", "heartbeatAt": "2024-12-31T10:00:55.248811", "startedAt": "2024-12-31T10:00:54.766527", "docker": null, "cuda": null, "args": [ "--model_family", "llama", "--apply_instruct_masks", "--token_scaled_loss", "--seq_parallel_size", "8", "--report_to", "wandb", "--do_train", "--model_name_or_path", "/datasets/ai/llama3/meta-llama/models--meta-llama--Meta-Llama-3.1-8B-Instruct/snapshots/5206a32e0bd3067aef1ce90f5528ade7d866253f/", "--config_name", "/datasets/ai/llama3/meta-llama/models--meta-llama--Meta-Llama-3.1-8B-Instruct/snapshots/5206a32e0bd3067aef1ce90f5528ade7d866253f/", "--tokenizer_name", "/datasets/ai/llama3/meta-llama/models--meta-llama--Meta-Llama-3.1-8B-Instruct/snapshots/5206a32e0bd3067aef1ce90f5528ade7d866253f/", "--run_name", "_llama-3.1-8b-instruct_bsz-16_lr-1e-6_epochs-1_", "--output_dir", "/scratch3/workspace/ctpham_umass_edu-ft/_llama-3.1-8b-instruct_bsz-16_lr-1e-6_epochs-1_", "--config_overrides_json", "", "--gradient_accumulation_steps", "2", "--per_device_train_batch_size", "1", "--bf16", "--learning_rate", "1e-6", "--min_lr_ratio", "0.1", "--lr_scheduler_type", "cosine", "--max_grad_norm", "1.0", "--adam_beta1", "0.9", "--adam_beta2", "0.95", "--weight_decay", "0.1", "--warmup_ratio", "0.05", "--optim", "adamw_torch", "--logging_steps", "1", "--log_level", "info", "--save_steps", "200", "--dataloader_num_workers", "1", "--disable_tqdm", "true", "--use_fast_tokenizer", "false", "--remove_unused_columns", "false", "--ddp_find_unused_parameters", "false", "--fsdp", "auto_wrap offload", "--gradient_checkpointing", "--tokenized_mds_train", "/work/pi_miyyer_umass_edu/ctpham/BookClaim-dev/data/ft/bookclaim_balanced_pack_complete", "--cuda_empty_cache", "--num_train_epochs", "1" ], "state": "running", "program": "/work/pi_miyyer_umass_edu/ctpham/BookClaim-dev/prolong-final/finetune.py", "codePathLocal": "finetune.py", "codePath": "prolong-final/finetune.py", "git": { "remote": "https://github.com/chtmp223/BookGen-dev.git", "commit": "0e796521430a0f767be7c4dadba5c2fcaee1f909" }, "email": "ctpham@umass.edu", "root": "/work/pi_miyyer_umass_edu/ctpham/BookClaim-dev", "host": "gpu020", "username": "ctpham_umass_edu", "executable": "/scratch3/workspace/ctpham_umass_edu-ft/envs/prolong-final/bin/python3.10", "cpu_count": 112, "cpu_count_logical": 112, "cpu_freq": { "current": 957.8740624999999, "min": 800.0, "max": 3800.0 }, "cpu_freq_per_core": [ { "current": 2463.059, "min": 800.0, "max": 3800.0 }, { "current": 759.577, "min": 800.0, "max": 3800.0 }, { "current": 2024.63, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 2400.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 1740.158, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 1100.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 2035.036, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 1400.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 1900.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 790.179, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 1800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 1393.77, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 3800.0, "min": 800.0, "max": 3800.0 }, { "current": 1439.809, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 3800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 782.956, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 783.716, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 783.035, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 784.273, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 784.246, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 784.059, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 790.704, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 }, { "current": 800.0, "min": 800.0, "max": 3800.0 } ], "disk": { "/": { "total": 438.487850189209, "used": 18.201271057128906 } }, "gpu": "NVIDIA A100-SXM4-80GB", "gpu_count": 8, "gpu_devices": [ { "name": "NVIDIA A100-SXM4-80GB", "memory_total": 85899345920 }, { "name": "NVIDIA A100-SXM4-80GB", "memory_total": 85899345920 }, { "name": "NVIDIA A100-SXM4-80GB", "memory_total": 85899345920 }, { "name": "NVIDIA A100-SXM4-80GB", "memory_total": 85899345920 }, { "name": "NVIDIA A100-SXM4-80GB", "memory_total": 85899345920 }, { "name": "NVIDIA A100-SXM4-80GB", "memory_total": 85899345920 }, { "name": "NVIDIA A100-SXM4-80GB", "memory_total": 85899345920 }, { "name": "NVIDIA A100-SXM4-80GB", "memory_total": 85899345920 } ], "memory": { "total": 2015.3287239074707 } }