Veldrovive committed on
Commit
8d982fd
1 Parent(s): 48925c9

Upload decoder/2.4B_fp16/decoder_config.json with huggingface_hub

Browse files
decoder/2.4B_fp16/decoder_config.json CHANGED
@@ -56,16 +56,13 @@
56
  "wd": 0.0,
57
  "warmup_steps": 1000,
58
  "max_grad_norm": 0.5,
59
- "save_every_n_samples": 545400,
60
  "n_sample_images": 10,
61
  "device": "cuda:0",
62
- "epoch_samples": 2100000,
63
  "validation_samples": 100000,
64
  "use_ema": true,
65
- "ema_beta": 0.99,
66
- "save_all": false,
67
- "save_latest": true,
68
- "save_best": true,
69
  "unet_training_mask": [true],
70
  "find_unused_parameters": false
71
  },
@@ -88,7 +85,7 @@
88
 
89
  "wandb_entity": "Veldrovive",
90
  "wandb_project": "dalle2_train_decoder",
91
- "wandb_run_name": "2.4B deepspeed fp16",
92
 
93
  "auto_resume": true,
94
  "verbose": true
 
56
  "wd": 0.0,
57
  "warmup_steps": 1000,
58
  "max_grad_norm": 0.5,
59
+ "save_every_n_samples": 1500000,
60
  "n_sample_images": 10,
61
  "device": "cuda:0",
62
+ "epoch_samples": 3000000,
63
  "validation_samples": 100000,
64
  "use_ema": true,
65
+ "ema_beta": 0.9999,
 
 
 
66
  "unet_training_mask": [true],
67
  "find_unused_parameters": false
68
  },
 
85
 
86
  "wandb_entity": "Veldrovive",
87
  "wandb_project": "dalle2_train_decoder",
88
+ "wandb_run_name": "3B deepspeed fp16",
89
 
90
  "auto_resume": true,
91
  "verbose": true