yeray142's picture
End of training
40a3487 verified
{
"best_global_step": null,
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 9.9697933227345,
"eval_steps": 500,
"global_step": 3140,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 158.74639892578125,
"learning_rate": 1e-05,
"loss": 32.2084,
"step": 315
},
{
"epoch": 1.0,
"eval_loss": 24.951730728149414,
"eval_map": 0.1754,
"eval_map_50": 0.3241,
"eval_map_75": 0.1688,
"eval_map_car": 0.3414,
"eval_map_large": 0.9036,
"eval_map_medium": 0.3559,
"eval_map_person": 0.0093,
"eval_map_small": 0.0901,
"eval_mar_1": 0.0848,
"eval_mar_10": 0.2249,
"eval_mar_100": 0.2625,
"eval_mar_100_car": 0.4833,
"eval_mar_100_person": 0.0417,
"eval_mar_large": 0.9383,
"eval_mar_medium": 0.4585,
"eval_mar_small": 0.1937,
"eval_runtime": 2344.5076,
"eval_samples_per_second": 1.271,
"eval_steps_per_second": 0.159,
"step": 315
},
{
"epoch": 2.0,
"grad_norm": 270.61004638671875,
"learning_rate": 1e-05,
"loss": 26.4262,
"step": 630
},
{
"epoch": 2.0,
"eval_loss": 23.843828201293945,
"eval_map": 0.1907,
"eval_map_50": 0.358,
"eval_map_75": 0.1793,
"eval_map_car": 0.3657,
"eval_map_large": 0.9182,
"eval_map_medium": 0.3764,
"eval_map_person": 0.0157,
"eval_map_small": 0.1022,
"eval_mar_1": 0.0904,
"eval_mar_10": 0.2378,
"eval_mar_100": 0.2851,
"eval_mar_100_car": 0.5024,
"eval_mar_100_person": 0.0677,
"eval_mar_large": 0.9446,
"eval_mar_medium": 0.4779,
"eval_mar_small": 0.2184,
"eval_runtime": 2137.7262,
"eval_samples_per_second": 1.394,
"eval_steps_per_second": 0.174,
"step": 630
},
{
"epoch": 3.0,
"grad_norm": 71.99009704589844,
"learning_rate": 1e-05,
"loss": 24.7264,
"step": 945
},
{
"epoch": 3.0,
"eval_loss": 22.73570442199707,
"eval_map": 0.197,
"eval_map_50": 0.3715,
"eval_map_75": 0.189,
"eval_map_car": 0.3769,
"eval_map_large": 0.9337,
"eval_map_medium": 0.3803,
"eval_map_person": 0.017,
"eval_map_small": 0.1086,
"eval_mar_1": 0.0912,
"eval_mar_10": 0.2441,
"eval_mar_100": 0.2901,
"eval_mar_100_car": 0.5086,
"eval_mar_100_person": 0.0716,
"eval_mar_large": 0.9531,
"eval_mar_medium": 0.4819,
"eval_mar_small": 0.2234,
"eval_runtime": 2120.9315,
"eval_samples_per_second": 1.406,
"eval_steps_per_second": 0.176,
"step": 945
},
{
"epoch": 4.0,
"grad_norm": 139.4793701171875,
"learning_rate": 1e-05,
"loss": 23.7704,
"step": 1260
},
{
"epoch": 4.0,
"eval_loss": 22.542678833007812,
"eval_map": 0.2001,
"eval_map_50": 0.3753,
"eval_map_75": 0.1878,
"eval_map_car": 0.3791,
"eval_map_large": 0.9368,
"eval_map_medium": 0.3902,
"eval_map_person": 0.0211,
"eval_map_small": 0.1092,
"eval_mar_1": 0.0924,
"eval_mar_10": 0.2519,
"eval_mar_100": 0.2994,
"eval_mar_100_car": 0.513,
"eval_mar_100_person": 0.0858,
"eval_mar_large": 0.9552,
"eval_mar_medium": 0.4914,
"eval_mar_small": 0.2332,
"eval_runtime": 2105.3394,
"eval_samples_per_second": 1.416,
"eval_steps_per_second": 0.177,
"step": 1260
},
{
"epoch": 5.0,
"grad_norm": 127.59090423583984,
"learning_rate": 1e-05,
"loss": 22.7954,
"step": 1575
},
{
"epoch": 5.0,
"eval_loss": 22.09284782409668,
"eval_map": 0.2071,
"eval_map_50": 0.3926,
"eval_map_75": 0.195,
"eval_map_car": 0.3906,
"eval_map_large": 0.933,
"eval_map_medium": 0.4043,
"eval_map_person": 0.0237,
"eval_map_small": 0.1184,
"eval_mar_1": 0.0961,
"eval_mar_10": 0.2594,
"eval_mar_100": 0.3075,
"eval_mar_100_car": 0.5253,
"eval_mar_100_person": 0.0897,
"eval_mar_large": 0.9524,
"eval_mar_medium": 0.5028,
"eval_mar_small": 0.2418,
"eval_runtime": 2143.0597,
"eval_samples_per_second": 1.391,
"eval_steps_per_second": 0.174,
"step": 1575
},
{
"epoch": 6.0,
"grad_norm": 204.32794189453125,
"learning_rate": 1e-05,
"loss": 22.2719,
"step": 1890
},
{
"epoch": 6.0,
"eval_loss": 21.853883743286133,
"eval_map": 0.2135,
"eval_map_50": 0.4034,
"eval_map_75": 0.1965,
"eval_map_car": 0.3985,
"eval_map_large": 0.9446,
"eval_map_medium": 0.4159,
"eval_map_person": 0.0285,
"eval_map_small": 0.1216,
"eval_mar_1": 0.0973,
"eval_mar_10": 0.265,
"eval_mar_100": 0.3128,
"eval_mar_100_car": 0.5309,
"eval_mar_100_person": 0.0946,
"eval_mar_large": 0.9608,
"eval_mar_medium": 0.5031,
"eval_mar_small": 0.2478,
"eval_runtime": 2117.1549,
"eval_samples_per_second": 1.408,
"eval_steps_per_second": 0.176,
"step": 1890
},
{
"epoch": 7.0,
"grad_norm": 294.1410217285156,
"learning_rate": 1e-05,
"loss": 21.6338,
"step": 2205
},
{
"epoch": 7.0,
"eval_loss": 21.785621643066406,
"eval_map": 0.2125,
"eval_map_50": 0.4048,
"eval_map_75": 0.1965,
"eval_map_car": 0.3956,
"eval_map_large": 0.9388,
"eval_map_medium": 0.4207,
"eval_map_person": 0.0293,
"eval_map_small": 0.1201,
"eval_mar_1": 0.0967,
"eval_mar_10": 0.2641,
"eval_mar_100": 0.3131,
"eval_mar_100_car": 0.524,
"eval_mar_100_person": 0.1023,
"eval_mar_large": 0.957,
"eval_mar_medium": 0.5119,
"eval_mar_small": 0.2466,
"eval_runtime": 2136.0852,
"eval_samples_per_second": 1.396,
"eval_steps_per_second": 0.175,
"step": 2205
},
{
"epoch": 8.0,
"grad_norm": 773.2018432617188,
"learning_rate": 1e-05,
"loss": 21.3044,
"step": 2520
},
{
"epoch": 8.0,
"eval_loss": 21.470380783081055,
"eval_map": 0.2152,
"eval_map_50": 0.4046,
"eval_map_75": 0.2003,
"eval_map_car": 0.4002,
"eval_map_large": 0.9421,
"eval_map_medium": 0.4233,
"eval_map_person": 0.0301,
"eval_map_small": 0.1229,
"eval_mar_1": 0.0983,
"eval_mar_10": 0.2663,
"eval_mar_100": 0.3149,
"eval_mar_100_car": 0.5274,
"eval_mar_100_person": 0.1024,
"eval_mar_large": 0.9592,
"eval_mar_medium": 0.5109,
"eval_mar_small": 0.2487,
"eval_runtime": 2146.733,
"eval_samples_per_second": 1.389,
"eval_steps_per_second": 0.174,
"step": 2520
},
{
"epoch": 9.0,
"grad_norm": 165.142333984375,
"learning_rate": 1e-05,
"loss": 20.9003,
"step": 2835
},
{
"epoch": 9.0,
"eval_loss": 21.556129455566406,
"eval_map": 0.2151,
"eval_map_50": 0.4079,
"eval_map_75": 0.1994,
"eval_map_car": 0.3997,
"eval_map_large": 0.946,
"eval_map_medium": 0.4264,
"eval_map_person": 0.0304,
"eval_map_small": 0.124,
"eval_mar_1": 0.0977,
"eval_mar_10": 0.2678,
"eval_mar_100": 0.3194,
"eval_mar_100_car": 0.5286,
"eval_mar_100_person": 0.1102,
"eval_mar_large": 0.9598,
"eval_mar_medium": 0.5132,
"eval_mar_small": 0.2535,
"eval_runtime": 2155.2505,
"eval_samples_per_second": 1.383,
"eval_steps_per_second": 0.173,
"step": 2835
},
{
"epoch": 9.9697933227345,
"grad_norm": 129.1219024658203,
"learning_rate": 1e-05,
"loss": 20.5867,
"step": 3140
},
{
"epoch": 9.9697933227345,
"eval_loss": 21.46815299987793,
"eval_map": 0.2191,
"eval_map_50": 0.4214,
"eval_map_75": 0.2032,
"eval_map_car": 0.406,
"eval_map_large": 0.9458,
"eval_map_medium": 0.4299,
"eval_map_person": 0.0323,
"eval_map_small": 0.1293,
"eval_mar_1": 0.0979,
"eval_mar_10": 0.2731,
"eval_mar_100": 0.3209,
"eval_mar_100_car": 0.5312,
"eval_mar_100_person": 0.1106,
"eval_mar_large": 0.9604,
"eval_mar_medium": 0.5212,
"eval_mar_small": 0.2542,
"eval_runtime": 2156.7988,
"eval_samples_per_second": 1.382,
"eval_steps_per_second": 0.173,
"step": 3140
},
{
"epoch": 9.9697933227345,
"step": 3140,
"total_flos": 5.249371936187105e+18,
"train_loss": 23.672178231986464,
"train_runtime": 32632.6381,
"train_samples_per_second": 1.54,
"train_steps_per_second": 0.096
}
],
"logging_steps": 500,
"max_steps": 3140,
"num_input_tokens_seen": 0,
"num_train_epochs": 10,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 5.249371936187105e+18,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}