|
{ |
|
"best_global_step": null, |
|
"best_metric": null, |
|
"best_model_checkpoint": null, |
|
"epoch": 9.9697933227345, |
|
"eval_steps": 500, |
|
"global_step": 3140, |
|
"is_hyper_param_search": false, |
|
"is_local_process_zero": true, |
|
"is_world_process_zero": true, |
|
"log_history": [ |
|
{ |
|
"epoch": 1.0, |
|
"grad_norm": 158.74639892578125, |
|
"learning_rate": 1e-05, |
|
"loss": 32.2084, |
|
"step": 315 |
|
}, |
|
{ |
|
"epoch": 1.0, |
|
"eval_loss": 24.951730728149414, |
|
"eval_map": 0.1754, |
|
"eval_map_50": 0.3241, |
|
"eval_map_75": 0.1688, |
|
"eval_map_car": 0.3414, |
|
"eval_map_large": 0.9036, |
|
"eval_map_medium": 0.3559, |
|
"eval_map_person": 0.0093, |
|
"eval_map_small": 0.0901, |
|
"eval_mar_1": 0.0848, |
|
"eval_mar_10": 0.2249, |
|
"eval_mar_100": 0.2625, |
|
"eval_mar_100_car": 0.4833, |
|
"eval_mar_100_person": 0.0417, |
|
"eval_mar_large": 0.9383, |
|
"eval_mar_medium": 0.4585, |
|
"eval_mar_small": 0.1937, |
|
"eval_runtime": 2344.5076, |
|
"eval_samples_per_second": 1.271, |
|
"eval_steps_per_second": 0.159, |
|
"step": 315 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"grad_norm": 270.61004638671875, |
|
"learning_rate": 1e-05, |
|
"loss": 26.4262, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 2.0, |
|
"eval_loss": 23.843828201293945, |
|
"eval_map": 0.1907, |
|
"eval_map_50": 0.358, |
|
"eval_map_75": 0.1793, |
|
"eval_map_car": 0.3657, |
|
"eval_map_large": 0.9182, |
|
"eval_map_medium": 0.3764, |
|
"eval_map_person": 0.0157, |
|
"eval_map_small": 0.1022, |
|
"eval_mar_1": 0.0904, |
|
"eval_mar_10": 0.2378, |
|
"eval_mar_100": 0.2851, |
|
"eval_mar_100_car": 0.5024, |
|
"eval_mar_100_person": 0.0677, |
|
"eval_mar_large": 0.9446, |
|
"eval_mar_medium": 0.4779, |
|
"eval_mar_small": 0.2184, |
|
"eval_runtime": 2137.7262, |
|
"eval_samples_per_second": 1.394, |
|
"eval_steps_per_second": 0.174, |
|
"step": 630 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"grad_norm": 71.99009704589844, |
|
"learning_rate": 1e-05, |
|
"loss": 24.7264, |
|
"step": 945 |
|
}, |
|
{ |
|
"epoch": 3.0, |
|
"eval_loss": 22.73570442199707, |
|
"eval_map": 0.197, |
|
"eval_map_50": 0.3715, |
|
"eval_map_75": 0.189, |
|
"eval_map_car": 0.3769, |
|
"eval_map_large": 0.9337, |
|
"eval_map_medium": 0.3803, |
|
"eval_map_person": 0.017, |
|
"eval_map_small": 0.1086, |
|
"eval_mar_1": 0.0912, |
|
"eval_mar_10": 0.2441, |
|
"eval_mar_100": 0.2901, |
|
"eval_mar_100_car": 0.5086, |
|
"eval_mar_100_person": 0.0716, |
|
"eval_mar_large": 0.9531, |
|
"eval_mar_medium": 0.4819, |
|
"eval_mar_small": 0.2234, |
|
"eval_runtime": 2120.9315, |
|
"eval_samples_per_second": 1.406, |
|
"eval_steps_per_second": 0.176, |
|
"step": 945 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"grad_norm": 139.4793701171875, |
|
"learning_rate": 1e-05, |
|
"loss": 23.7704, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 4.0, |
|
"eval_loss": 22.542678833007812, |
|
"eval_map": 0.2001, |
|
"eval_map_50": 0.3753, |
|
"eval_map_75": 0.1878, |
|
"eval_map_car": 0.3791, |
|
"eval_map_large": 0.9368, |
|
"eval_map_medium": 0.3902, |
|
"eval_map_person": 0.0211, |
|
"eval_map_small": 0.1092, |
|
"eval_mar_1": 0.0924, |
|
"eval_mar_10": 0.2519, |
|
"eval_mar_100": 0.2994, |
|
"eval_mar_100_car": 0.513, |
|
"eval_mar_100_person": 0.0858, |
|
"eval_mar_large": 0.9552, |
|
"eval_mar_medium": 0.4914, |
|
"eval_mar_small": 0.2332, |
|
"eval_runtime": 2105.3394, |
|
"eval_samples_per_second": 1.416, |
|
"eval_steps_per_second": 0.177, |
|
"step": 1260 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"grad_norm": 127.59090423583984, |
|
"learning_rate": 1e-05, |
|
"loss": 22.7954, |
|
"step": 1575 |
|
}, |
|
{ |
|
"epoch": 5.0, |
|
"eval_loss": 22.09284782409668, |
|
"eval_map": 0.2071, |
|
"eval_map_50": 0.3926, |
|
"eval_map_75": 0.195, |
|
"eval_map_car": 0.3906, |
|
"eval_map_large": 0.933, |
|
"eval_map_medium": 0.4043, |
|
"eval_map_person": 0.0237, |
|
"eval_map_small": 0.1184, |
|
"eval_mar_1": 0.0961, |
|
"eval_mar_10": 0.2594, |
|
"eval_mar_100": 0.3075, |
|
"eval_mar_100_car": 0.5253, |
|
"eval_mar_100_person": 0.0897, |
|
"eval_mar_large": 0.9524, |
|
"eval_mar_medium": 0.5028, |
|
"eval_mar_small": 0.2418, |
|
"eval_runtime": 2143.0597, |
|
"eval_samples_per_second": 1.391, |
|
"eval_steps_per_second": 0.174, |
|
"step": 1575 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"grad_norm": 204.32794189453125, |
|
"learning_rate": 1e-05, |
|
"loss": 22.2719, |
|
"step": 1890 |
|
}, |
|
{ |
|
"epoch": 6.0, |
|
"eval_loss": 21.853883743286133, |
|
"eval_map": 0.2135, |
|
"eval_map_50": 0.4034, |
|
"eval_map_75": 0.1965, |
|
"eval_map_car": 0.3985, |
|
"eval_map_large": 0.9446, |
|
"eval_map_medium": 0.4159, |
|
"eval_map_person": 0.0285, |
|
"eval_map_small": 0.1216, |
|
"eval_mar_1": 0.0973, |
|
"eval_mar_10": 0.265, |
|
"eval_mar_100": 0.3128, |
|
"eval_mar_100_car": 0.5309, |
|
"eval_mar_100_person": 0.0946, |
|
"eval_mar_large": 0.9608, |
|
"eval_mar_medium": 0.5031, |
|
"eval_mar_small": 0.2478, |
|
"eval_runtime": 2117.1549, |
|
"eval_samples_per_second": 1.408, |
|
"eval_steps_per_second": 0.176, |
|
"step": 1890 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"grad_norm": 294.1410217285156, |
|
"learning_rate": 1e-05, |
|
"loss": 21.6338, |
|
"step": 2205 |
|
}, |
|
{ |
|
"epoch": 7.0, |
|
"eval_loss": 21.785621643066406, |
|
"eval_map": 0.2125, |
|
"eval_map_50": 0.4048, |
|
"eval_map_75": 0.1965, |
|
"eval_map_car": 0.3956, |
|
"eval_map_large": 0.9388, |
|
"eval_map_medium": 0.4207, |
|
"eval_map_person": 0.0293, |
|
"eval_map_small": 0.1201, |
|
"eval_mar_1": 0.0967, |
|
"eval_mar_10": 0.2641, |
|
"eval_mar_100": 0.3131, |
|
"eval_mar_100_car": 0.524, |
|
"eval_mar_100_person": 0.1023, |
|
"eval_mar_large": 0.957, |
|
"eval_mar_medium": 0.5119, |
|
"eval_mar_small": 0.2466, |
|
"eval_runtime": 2136.0852, |
|
"eval_samples_per_second": 1.396, |
|
"eval_steps_per_second": 0.175, |
|
"step": 2205 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"grad_norm": 773.2018432617188, |
|
"learning_rate": 1e-05, |
|
"loss": 21.3044, |
|
"step": 2520 |
|
}, |
|
{ |
|
"epoch": 8.0, |
|
"eval_loss": 21.470380783081055, |
|
"eval_map": 0.2152, |
|
"eval_map_50": 0.4046, |
|
"eval_map_75": 0.2003, |
|
"eval_map_car": 0.4002, |
|
"eval_map_large": 0.9421, |
|
"eval_map_medium": 0.4233, |
|
"eval_map_person": 0.0301, |
|
"eval_map_small": 0.1229, |
|
"eval_mar_1": 0.0983, |
|
"eval_mar_10": 0.2663, |
|
"eval_mar_100": 0.3149, |
|
"eval_mar_100_car": 0.5274, |
|
"eval_mar_100_person": 0.1024, |
|
"eval_mar_large": 0.9592, |
|
"eval_mar_medium": 0.5109, |
|
"eval_mar_small": 0.2487, |
|
"eval_runtime": 2146.733, |
|
"eval_samples_per_second": 1.389, |
|
"eval_steps_per_second": 0.174, |
|
"step": 2520 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"grad_norm": 165.142333984375, |
|
"learning_rate": 1e-05, |
|
"loss": 20.9003, |
|
"step": 2835 |
|
}, |
|
{ |
|
"epoch": 9.0, |
|
"eval_loss": 21.556129455566406, |
|
"eval_map": 0.2151, |
|
"eval_map_50": 0.4079, |
|
"eval_map_75": 0.1994, |
|
"eval_map_car": 0.3997, |
|
"eval_map_large": 0.946, |
|
"eval_map_medium": 0.4264, |
|
"eval_map_person": 0.0304, |
|
"eval_map_small": 0.124, |
|
"eval_mar_1": 0.0977, |
|
"eval_mar_10": 0.2678, |
|
"eval_mar_100": 0.3194, |
|
"eval_mar_100_car": 0.5286, |
|
"eval_mar_100_person": 0.1102, |
|
"eval_mar_large": 0.9598, |
|
"eval_mar_medium": 0.5132, |
|
"eval_mar_small": 0.2535, |
|
"eval_runtime": 2155.2505, |
|
"eval_samples_per_second": 1.383, |
|
"eval_steps_per_second": 0.173, |
|
"step": 2835 |
|
}, |
|
{ |
|
"epoch": 9.9697933227345, |
|
"grad_norm": 129.1219024658203, |
|
"learning_rate": 1e-05, |
|
"loss": 20.5867, |
|
"step": 3140 |
|
}, |
|
{ |
|
"epoch": 9.9697933227345, |
|
"eval_loss": 21.46815299987793, |
|
"eval_map": 0.2191, |
|
"eval_map_50": 0.4214, |
|
"eval_map_75": 0.2032, |
|
"eval_map_car": 0.406, |
|
"eval_map_large": 0.9458, |
|
"eval_map_medium": 0.4299, |
|
"eval_map_person": 0.0323, |
|
"eval_map_small": 0.1293, |
|
"eval_mar_1": 0.0979, |
|
"eval_mar_10": 0.2731, |
|
"eval_mar_100": 0.3209, |
|
"eval_mar_100_car": 0.5312, |
|
"eval_mar_100_person": 0.1106, |
|
"eval_mar_large": 0.9604, |
|
"eval_mar_medium": 0.5212, |
|
"eval_mar_small": 0.2542, |
|
"eval_runtime": 2156.7988, |
|
"eval_samples_per_second": 1.382, |
|
"eval_steps_per_second": 0.173, |
|
"step": 3140 |
|
}, |
|
{ |
|
"epoch": 9.9697933227345, |
|
"step": 3140, |
|
"total_flos": 5.249371936187105e+18, |
|
"train_loss": 23.672178231986464, |
|
"train_runtime": 32632.6381, |
|
"train_samples_per_second": 1.54, |
|
"train_steps_per_second": 0.096 |
|
} |
|
], |
|
"logging_steps": 500, |
|
"max_steps": 3140, |
|
"num_input_tokens_seen": 0, |
|
"num_train_epochs": 10, |
|
"save_steps": 500, |
|
"stateful_callbacks": { |
|
"TrainerControl": { |
|
"args": { |
|
"should_epoch_stop": false, |
|
"should_evaluate": false, |
|
"should_log": false, |
|
"should_save": true, |
|
"should_training_stop": true |
|
}, |
|
"attributes": {} |
|
} |
|
}, |
|
"total_flos": 5.249371936187105e+18, |
|
"train_batch_size": 8, |
|
"trial_name": null, |
|
"trial_params": null |
|
} |
|
|