{ "best_global_step": 2500, "best_metric": 0.8745242401633876, "best_model_checkpoint": "models\\improved_model\\checkpoint-2500", "epoch": 5.0, "eval_steps": 500, "global_step": 3435, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.14556040756914118, "grad_norm": 5.4006147384643555, "learning_rate": 9.900000000000002e-06, "loss": 1.0779, "step": 100 }, { "epoch": 0.29112081513828236, "grad_norm": 7.964382171630859, "learning_rate": 1.9900000000000003e-05, "loss": 0.3444, "step": 200 }, { "epoch": 0.4366812227074236, "grad_norm": 6.473100185394287, "learning_rate": 2.9900000000000002e-05, "loss": 0.2621, "step": 300 }, { "epoch": 0.5822416302765647, "grad_norm": 2.3269290924072266, "learning_rate": 3.99e-05, "loss": 0.2215, "step": 400 }, { "epoch": 0.727802037845706, "grad_norm": 1.0794602632522583, "learning_rate": 4.99e-05, "loss": 0.1994, "step": 500 }, { "epoch": 0.727802037845706, "eval_accuracy": 0.8291404612159329, "eval_f1": 0.8347849048667186, "eval_f1_bearish": 0.7192982456140351, "eval_f1_bullish": 0.8773747841105354, "eval_f1_neutral": 0.7843137254901961, "eval_loss": 0.16642487049102783, "eval_precision": 0.8522584333905088, "eval_precision_bearish": 0.6212121212121212, "eval_precision_bullish": 0.9407407407407408, "eval_precision_neutral": 0.7407407407407407, "eval_recall": 0.8291404612159329, "eval_recall_bearish": 0.8541666666666666, "eval_recall_bullish": 0.8220064724919094, "eval_recall_neutral": 0.8333333333333334, "eval_runtime": 8.1987, "eval_samples_per_second": 116.359, "eval_steps_per_second": 3.659, "step": 500 }, { "epoch": 0.8733624454148472, "grad_norm": 10.456722259521484, "learning_rate": 4.831345826235094e-05, "loss": 0.1798, "step": 600 }, { "epoch": 1.0189228529839884, "grad_norm": 0.8317745327949524, "learning_rate": 4.660988074957411e-05, "loss": 0.1477, "step": 700 }, { "epoch": 1.1644832605531295, "grad_norm": 13.93519401550293, "learning_rate": 4.490630323679728e-05, "loss": 0.1027, "step": 800 }, { "epoch": 1.3100436681222707, "grad_norm": 5.650792598724365, "learning_rate": 4.320272572402044e-05, "loss": 0.1093, "step": 900 }, { "epoch": 1.455604075691412, "grad_norm": 2.2038004398345947, "learning_rate": 4.1499148211243615e-05, "loss": 0.1091, "step": 1000 }, { "epoch": 1.455604075691412, "eval_accuracy": 0.8542976939203354, "eval_f1": 0.854962642061992, "eval_f1_bearish": 0.7436823104693141, "eval_f1_bullish": 0.9034369885433715, "eval_f1_neutral": 0.78239608801956, "eval_loss": 0.22784079611301422, "eval_precision": 0.85731689649448, "eval_precision_bearish": 0.7744360902255639, "eval_precision_bullish": 0.9139072847682119, "eval_precision_neutral": 0.7373271889400922, "eval_recall": 0.8542976939203354, "eval_recall_bearish": 0.7152777777777778, "eval_recall_bullish": 0.8932038834951457, "eval_recall_neutral": 0.8333333333333334, "eval_runtime": 8.8257, "eval_samples_per_second": 108.094, "eval_steps_per_second": 3.399, "step": 1000 }, { "epoch": 1.6011644832605532, "grad_norm": 4.665580749511719, "learning_rate": 3.9795570698466784e-05, "loss": 0.0851, "step": 1100 }, { "epoch": 1.7467248908296944, "grad_norm": 0.20554736256599426, "learning_rate": 3.809199318568995e-05, "loss": 0.0983, "step": 1200 }, { "epoch": 1.8922852983988356, "grad_norm": 2.3172614574432373, "learning_rate": 3.638841567291312e-05, "loss": 0.0908, "step": 1300 }, { "epoch": 2.037845705967977, "grad_norm": 0.20416907966136932, "learning_rate": 3.468483816013629e-05, "loss": 0.072, "step": 1400 }, { "epoch": 2.183406113537118, "grad_norm": 0.08527473360300064, "learning_rate": 3.298126064735946e-05, "loss": 0.0316, "step": 1500 }, { "epoch": 2.183406113537118, "eval_accuracy": 0.8616352201257862, "eval_f1": 0.8636672911856373, "eval_f1_bearish": 0.7516339869281046, "eval_f1_bullish": 0.9054726368159204, "eval_f1_neutral": 0.8131313131313131, "eval_loss": 0.24344488978385925, "eval_precision": 0.8675144411363428, "eval_precision_bearish": 0.7098765432098766, "eval_precision_bullish": 0.9285714285714286, "eval_precision_neutral": 0.7892156862745098, "eval_recall": 0.8616352201257862, "eval_recall_bearish": 0.7986111111111112, "eval_recall_bullish": 0.883495145631068, "eval_recall_neutral": 0.8385416666666666, "eval_runtime": 8.6074, "eval_samples_per_second": 110.835, "eval_steps_per_second": 3.485, "step": 1500 }, { "epoch": 2.328966521106259, "grad_norm": 7.853630065917969, "learning_rate": 3.1277683134582626e-05, "loss": 0.0363, "step": 1600 }, { "epoch": 2.4745269286754, "grad_norm": 0.3771085739135742, "learning_rate": 2.957410562180579e-05, "loss": 0.0347, "step": 1700 }, { "epoch": 2.6200873362445414, "grad_norm": 3.0605719089508057, "learning_rate": 2.787052810902896e-05, "loss": 0.0319, "step": 1800 }, { "epoch": 2.7656477438136826, "grad_norm": 3.2105116844177246, "learning_rate": 2.616695059625213e-05, "loss": 0.0359, "step": 1900 }, { "epoch": 2.911208151382824, "grad_norm": 3.7454285621643066, "learning_rate": 2.44633730834753e-05, "loss": 0.0361, "step": 2000 }, { "epoch": 2.911208151382824, "eval_accuracy": 0.8584905660377359, "eval_f1": 0.8593807235316668, "eval_f1_bearish": 0.7571428571428571, "eval_f1_bullish": 0.9074529074529074, "eval_f1_neutral": 0.7813267813267813, "eval_loss": 0.2744849622249603, "eval_precision": 0.8616426481335732, "eval_precision_bearish": 0.7794117647058824, "eval_precision_bullish": 0.9187396351575456, "eval_precision_neutral": 0.7395348837209302, "eval_recall": 0.8584905660377359, "eval_recall_bearish": 0.7361111111111112, "eval_recall_bullish": 0.8964401294498382, "eval_recall_neutral": 0.828125, "eval_runtime": 8.1534, "eval_samples_per_second": 117.007, "eval_steps_per_second": 3.679, "step": 2000 }, { "epoch": 3.056768558951965, "grad_norm": 0.04752872511744499, "learning_rate": 2.2759795570698465e-05, "loss": 0.0169, "step": 2100 }, { "epoch": 3.2023289665211063, "grad_norm": 3.445439100265503, "learning_rate": 2.1056218057921637e-05, "loss": 0.0094, "step": 2200 }, { "epoch": 3.3478893740902476, "grad_norm": 1.7491494417190552, "learning_rate": 1.9352640545144805e-05, "loss": 0.0084, "step": 2300 }, { "epoch": 3.493449781659389, "grad_norm": 1.3558599948883057, "learning_rate": 1.7649063032367974e-05, "loss": 0.0155, "step": 2400 }, { "epoch": 3.6390101892285296, "grad_norm": 0.7178720235824585, "learning_rate": 1.5945485519591142e-05, "loss": 0.0166, "step": 2500 }, { "epoch": 3.6390101892285296, "eval_accuracy": 0.8752620545073375, "eval_f1": 0.8745242401633876, "eval_f1_bearish": 0.7612456747404844, "eval_f1_bullish": 0.9131474103585657, "eval_f1_neutral": 0.8351648351648352, "eval_loss": 0.27798759937286377, "eval_precision": 0.8750783502197678, "eval_precision_bearish": 0.7586206896551724, "eval_precision_bullish": 0.8995290423861853, "eval_precision_neutral": 0.8837209302325582, "eval_recall": 0.8752620545073375, "eval_recall_bearish": 0.7638888888888888, "eval_recall_bullish": 0.9271844660194175, "eval_recall_neutral": 0.7916666666666666, "eval_runtime": 8.5538, "eval_samples_per_second": 111.529, "eval_steps_per_second": 3.507, "step": 2500 }, { "epoch": 3.7845705967976713, "grad_norm": 0.5409824252128601, "learning_rate": 1.424190800681431e-05, "loss": 0.0072, "step": 2600 }, { "epoch": 3.930131004366812, "grad_norm": 0.007624503690749407, "learning_rate": 1.253833049403748e-05, "loss": 0.0051, "step": 2700 }, { "epoch": 4.075691411935954, "grad_norm": 0.03979913145303726, "learning_rate": 1.0834752981260648e-05, "loss": 0.0106, "step": 2800 }, { "epoch": 4.2212518195050945, "grad_norm": 0.025390487164258957, "learning_rate": 9.131175468483816e-06, "loss": 0.003, "step": 2900 }, { "epoch": 4.366812227074236, "grad_norm": 8.90622615814209, "learning_rate": 7.427597955706985e-06, "loss": 0.0066, "step": 3000 }, { "epoch": 4.366812227074236, "eval_accuracy": 0.8742138364779874, "eval_f1": 0.8740584051302639, "eval_f1_bearish": 0.7659574468085106, "eval_f1_bullish": 0.9174757281553398, "eval_f1_neutral": 0.8153846153846154, "eval_loss": 0.3259490132331848, "eval_precision": 0.8740853986957351, "eval_precision_bearish": 0.782608695652174, "eval_precision_bullish": 0.9174757281553398, "eval_precision_neutral": 0.803030303030303, "eval_recall": 0.8742138364779874, "eval_recall_bearish": 0.75, "eval_recall_bullish": 0.9174757281553398, "eval_recall_neutral": 0.828125, "eval_runtime": 9.0626, "eval_samples_per_second": 105.268, "eval_steps_per_second": 3.31, "step": 3000 }, { "epoch": 4.512372634643377, "grad_norm": 0.0042578354477882385, "learning_rate": 5.724020442930154e-06, "loss": 0.0021, "step": 3100 }, { "epoch": 4.657933042212518, "grad_norm": 0.0550072155892849, "learning_rate": 4.0204429301533224e-06, "loss": 0.0065, "step": 3200 }, { "epoch": 4.8034934497816595, "grad_norm": 0.019497277215123177, "learning_rate": 2.3168654173764905e-06, "loss": 0.0023, "step": 3300 }, { "epoch": 4.9490538573508, "grad_norm": 0.012889917939901352, "learning_rate": 6.132879045996593e-07, "loss": 0.0031, "step": 3400 } ], "logging_steps": 100, "max_steps": 3435, "num_input_tokens_seen": 0, "num_train_epochs": 5, "save_steps": 500, "stateful_callbacks": { "EarlyStoppingCallback": { "args": { "early_stopping_patience": 3, "early_stopping_threshold": 0.0 }, "attributes": { "early_stopping_patience_counter": 1 } }, "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.444624220035584e+16, "train_batch_size": 16, "trial_name": null, "trial_params": null }