|
{ |
|
"best_metric": 0.15759548544883728, |
|
"best_model_checkpoint": "smart_tv_hand_gestures_image_detection/checkpoint-15190", |
|
"epoch": 10.0, |
|
"eval_steps": 500, |
|
"global_step": 15190, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 0.32916392363396973, |
|
"grad_norm": 1.4565895795822144, |
|
"learning_rate": 9.702774108322324e-07, |
|
"loss": 2.1185, |
|
"step": 500 |
|
}, |
|
{ |
|
"epoch": 0.6583278472679395, |
|
"grad_norm": 1.595917820930481, |
|
"learning_rate": 9.372523117569352e-07, |
|
"loss": 1.8436, |
|
"step": 1000 |
|
}, |
|
{ |
|
"epoch": 0.9874917709019092, |
|
"grad_norm": 2.2012250423431396, |
|
"learning_rate": 9.04227212681638e-07, |
|
"loss": 1.4844, |
|
"step": 1500 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_accuracy": 0.9256790123456791, |
|
"eval_loss": 1.3686660528182983, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 139.1921, |
|
"eval_samples_per_second": 87.289, |
|
"eval_steps_per_second": 10.913, |
|
"step": 1519 |
|
}, |
|
{ |
|
"epoch": 1.316655694535879, |
|
"grad_norm": 1.8626253604888916, |
|
"learning_rate": 8.712021136063408e-07, |
|
"loss": 1.1357, |
|
"step": 2000 |
|
}, |
|
{ |
|
"epoch": 1.6458196181698486, |
|
"grad_norm": 1.5412793159484863, |
|
"learning_rate": 8.381770145310435e-07, |
|
"loss": 0.8734, |
|
"step": 2500 |
|
}, |
|
{ |
|
"epoch": 1.9749835418038182, |
|
"grad_norm": 1.9414352178573608, |
|
"learning_rate": 8.051519154557464e-07, |
|
"loss": 0.6898, |
|
"step": 3000 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_accuracy": 0.98559670781893, |
|
"eval_loss": 0.6899833679199219, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 140.1792, |
|
"eval_samples_per_second": 86.675, |
|
"eval_steps_per_second": 10.836, |
|
"step": 3038 |
|
}, |
|
{ |
|
"epoch": 2.3041474654377883, |
|
"grad_norm": 1.410414218902588, |
|
"learning_rate": 7.72126816380449e-07, |
|
"loss": 0.5598, |
|
"step": 3500 |
|
}, |
|
{ |
|
"epoch": 2.633311389071758, |
|
"grad_norm": 1.2400822639465332, |
|
"learning_rate": 7.391017173051519e-07, |
|
"loss": 0.4651, |
|
"step": 4000 |
|
}, |
|
{ |
|
"epoch": 2.9624753127057275, |
|
"grad_norm": 0.9760797023773193, |
|
"learning_rate": 7.060766182298547e-07, |
|
"loss": 0.3972, |
|
"step": 4500 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_accuracy": 0.9925925925925926, |
|
"eval_loss": 0.42788437008857727, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 138.4606, |
|
"eval_samples_per_second": 87.751, |
|
"eval_steps_per_second": 10.971, |
|
"step": 4557 |
|
}, |
|
{ |
|
"epoch": 3.291639236339697, |
|
"grad_norm": 0.7729864120483398, |
|
"learning_rate": 6.730515191545574e-07, |
|
"loss": 0.3433, |
|
"step": 5000 |
|
}, |
|
{ |
|
"epoch": 3.6208031599736668, |
|
"grad_norm": 0.7019414305686951, |
|
"learning_rate": 6.400264200792602e-07, |
|
"loss": 0.3052, |
|
"step": 5500 |
|
}, |
|
{ |
|
"epoch": 3.9499670836076364, |
|
"grad_norm": 0.6397891044616699, |
|
"learning_rate": 6.070013210039629e-07, |
|
"loss": 0.2739, |
|
"step": 6000 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_accuracy": 0.9956378600823045, |
|
"eval_loss": 0.3098331689834595, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 140.6468, |
|
"eval_samples_per_second": 86.387, |
|
"eval_steps_per_second": 10.8, |
|
"step": 6076 |
|
}, |
|
{ |
|
"epoch": 4.279131007241606, |
|
"grad_norm": 0.9204681515693665, |
|
"learning_rate": 5.739762219286658e-07, |
|
"loss": 0.2502, |
|
"step": 6500 |
|
}, |
|
{ |
|
"epoch": 4.6082949308755765, |
|
"grad_norm": 0.8557950854301453, |
|
"learning_rate": 5.409511228533686e-07, |
|
"loss": 0.2293, |
|
"step": 7000 |
|
}, |
|
{ |
|
"epoch": 4.937458854509546, |
|
"grad_norm": 0.5376387238502502, |
|
"learning_rate": 5.079260237780713e-07, |
|
"loss": 0.2135, |
|
"step": 7500 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_accuracy": 0.9967901234567901, |
|
"eval_loss": 0.2464514970779419, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 143.0601, |
|
"eval_samples_per_second": 84.929, |
|
"eval_steps_per_second": 10.618, |
|
"step": 7595 |
|
}, |
|
{ |
|
"epoch": 5.266622778143516, |
|
"grad_norm": 2.1749770641326904, |
|
"learning_rate": 4.749009247027741e-07, |
|
"loss": 0.1991, |
|
"step": 8000 |
|
}, |
|
{ |
|
"epoch": 5.595786701777485, |
|
"grad_norm": 0.4924432039260864, |
|
"learning_rate": 4.418758256274769e-07, |
|
"loss": 0.1887, |
|
"step": 8500 |
|
}, |
|
{ |
|
"epoch": 5.924950625411455, |
|
"grad_norm": 0.44754961133003235, |
|
"learning_rate": 4.088507265521796e-07, |
|
"loss": 0.1787, |
|
"step": 9000 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_accuracy": 0.9973662551440329, |
|
"eval_loss": 0.20901748538017273, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 143.6019, |
|
"eval_samples_per_second": 84.609, |
|
"eval_steps_per_second": 10.578, |
|
"step": 9114 |
|
}, |
|
{ |
|
"epoch": 6.254114549045425, |
|
"grad_norm": 1.0733314752578735, |
|
"learning_rate": 3.758256274768824e-07, |
|
"loss": 0.1706, |
|
"step": 9500 |
|
}, |
|
{ |
|
"epoch": 6.583278472679394, |
|
"grad_norm": 0.45371586084365845, |
|
"learning_rate": 3.428005284015852e-07, |
|
"loss": 0.1637, |
|
"step": 10000 |
|
}, |
|
{ |
|
"epoch": 6.912442396313364, |
|
"grad_norm": 0.3785471022129059, |
|
"learning_rate": 3.09775429326288e-07, |
|
"loss": 0.1571, |
|
"step": 10500 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_accuracy": 0.9988477366255144, |
|
"eval_loss": 0.1836911290884018, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 141.3146, |
|
"eval_samples_per_second": 85.978, |
|
"eval_steps_per_second": 10.749, |
|
"step": 10633 |
|
}, |
|
{ |
|
"epoch": 7.2416063199473335, |
|
"grad_norm": 0.774605393409729, |
|
"learning_rate": 2.7675033025099076e-07, |
|
"loss": 0.1517, |
|
"step": 11000 |
|
}, |
|
{ |
|
"epoch": 7.570770243581303, |
|
"grad_norm": 0.49195748567581177, |
|
"learning_rate": 2.437252311756935e-07, |
|
"loss": 0.1477, |
|
"step": 11500 |
|
}, |
|
{ |
|
"epoch": 7.899934167215273, |
|
"grad_norm": 0.32700517773628235, |
|
"learning_rate": 2.107001321003963e-07, |
|
"loss": 0.1439, |
|
"step": 12000 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_accuracy": 0.9981069958847737, |
|
"eval_loss": 0.17038238048553467, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 142.0518, |
|
"eval_samples_per_second": 85.532, |
|
"eval_steps_per_second": 10.693, |
|
"step": 12152 |
|
}, |
|
{ |
|
"epoch": 8.229098090849243, |
|
"grad_norm": 0.36188894510269165, |
|
"learning_rate": 1.7767503302509906e-07, |
|
"loss": 0.1402, |
|
"step": 12500 |
|
}, |
|
{ |
|
"epoch": 8.558262014483212, |
|
"grad_norm": 0.38871052861213684, |
|
"learning_rate": 1.4464993394980185e-07, |
|
"loss": 0.1385, |
|
"step": 13000 |
|
}, |
|
{ |
|
"epoch": 8.887425938117183, |
|
"grad_norm": 0.33406054973602295, |
|
"learning_rate": 1.1162483487450462e-07, |
|
"loss": 0.1359, |
|
"step": 13500 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_accuracy": 0.9986008230452675, |
|
"eval_loss": 0.16055729985237122, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 143.3485, |
|
"eval_samples_per_second": 84.758, |
|
"eval_steps_per_second": 10.597, |
|
"step": 13671 |
|
}, |
|
{ |
|
"epoch": 9.216589861751151, |
|
"grad_norm": 0.32042938470840454, |
|
"learning_rate": 7.85997357992074e-08, |
|
"loss": 0.1341, |
|
"step": 14000 |
|
}, |
|
{ |
|
"epoch": 9.545753785385122, |
|
"grad_norm": 0.29274484515190125, |
|
"learning_rate": 4.557463672391017e-08, |
|
"loss": 0.1333, |
|
"step": 14500 |
|
}, |
|
{ |
|
"epoch": 9.874917709019092, |
|
"grad_norm": 0.3197895288467407, |
|
"learning_rate": 1.2549537648612946e-08, |
|
"loss": 0.1331, |
|
"step": 15000 |
|
}, |
|
{ |
|
"epoch": 10.0, |
|
"eval_accuracy": 0.9990123456790123, |
|
"eval_loss": 0.15759548544883728, |
|
"eval_model_preparation_time": 0.0043, |
|
"eval_runtime": 142.0855, |
|
"eval_samples_per_second": 85.512, |
|
"eval_steps_per_second": 10.691, |
|
"step": 15190 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 15190, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 3.76634697648169e+19, |
|
"train_batch_size": 32, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|