{ "best_metric": 1.79039466381073, "best_model_checkpoint": "/scratch/skscla001/speech/results/xls-r-300m-nyagen-combined-hp-tuning-test-model/run-1/checkpoint-600", "epoch": 28.72112676056338, "eval_steps": 100, "global_step": 660, "is_hyper_param_search": true, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 4.3605633802816905, "eval_loss": 5.015230178833008, "eval_runtime": 27.3065, "eval_samples_per_second": 12.232, "eval_steps_per_second": 3.076, "eval_wer": 1.0, "step": 100 }, { "epoch": 8.721126760563381, "eval_loss": 3.2265713214874268, "eval_runtime": 27.3177, "eval_samples_per_second": 12.227, "eval_steps_per_second": 3.075, "eval_wer": 1.0, "step": 200 }, { "epoch": 13.045070422535211, "eval_loss": 2.866999387741089, "eval_runtime": 27.1809, "eval_samples_per_second": 12.288, "eval_steps_per_second": 3.09, "eval_wer": 0.9997761361092455, "step": 300 }, { "epoch": 17.4056338028169, "eval_loss": 2.18796968460083, "eval_runtime": 27.3348, "eval_samples_per_second": 12.219, "eval_steps_per_second": 3.073, "eval_wer": 0.9952988582941572, "step": 400 }, { "epoch": 21.76619718309859, "grad_norm": 13.245641708374023, "learning_rate": 7.627503725040675e-05, "loss": 65.9261, "step": 500 }, { "epoch": 21.76619718309859, "eval_loss": 1.897925853729248, "eval_runtime": 27.2806, "eval_samples_per_second": 12.243, "eval_steps_per_second": 3.079, "eval_wer": 0.9890306693530334, "step": 500 }, { "epoch": 26.090140845070422, "eval_loss": 1.79039466381073, "eval_runtime": 27.3755, "eval_samples_per_second": 12.201, "eval_steps_per_second": 3.068, "eval_wer": 0.9798522498321021, "step": 600 } ], "logging_steps": 500, "max_steps": 660, "num_input_tokens_seen": 0, "num_train_epochs": 30, "save_steps": 400, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 4, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 0 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.929126147071394e+19, "train_batch_size": 8, "trial_name": null, "trial_params": { "learning_rate": 7.720145470688942e-05, "per_device_eval_batch_size": 4, "per_device_train_batch_size": 8 } }