codealchemist01's picture
Upload financial-sentiment-improved model
345d0ac verified
{
"best_global_step": 2500,
"best_metric": 0.8745242401633876,
"best_model_checkpoint": "models\\improved_model\\checkpoint-2500",
"epoch": 5.0,
"eval_steps": 500,
"global_step": 3435,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.14556040756914118,
"grad_norm": 5.4006147384643555,
"learning_rate": 9.900000000000002e-06,
"loss": 1.0779,
"step": 100
},
{
"epoch": 0.29112081513828236,
"grad_norm": 7.964382171630859,
"learning_rate": 1.9900000000000003e-05,
"loss": 0.3444,
"step": 200
},
{
"epoch": 0.4366812227074236,
"grad_norm": 6.473100185394287,
"learning_rate": 2.9900000000000002e-05,
"loss": 0.2621,
"step": 300
},
{
"epoch": 0.5822416302765647,
"grad_norm": 2.3269290924072266,
"learning_rate": 3.99e-05,
"loss": 0.2215,
"step": 400
},
{
"epoch": 0.727802037845706,
"grad_norm": 1.0794602632522583,
"learning_rate": 4.99e-05,
"loss": 0.1994,
"step": 500
},
{
"epoch": 0.727802037845706,
"eval_accuracy": 0.8291404612159329,
"eval_f1": 0.8347849048667186,
"eval_f1_bearish": 0.7192982456140351,
"eval_f1_bullish": 0.8773747841105354,
"eval_f1_neutral": 0.7843137254901961,
"eval_loss": 0.16642487049102783,
"eval_precision": 0.8522584333905088,
"eval_precision_bearish": 0.6212121212121212,
"eval_precision_bullish": 0.9407407407407408,
"eval_precision_neutral": 0.7407407407407407,
"eval_recall": 0.8291404612159329,
"eval_recall_bearish": 0.8541666666666666,
"eval_recall_bullish": 0.8220064724919094,
"eval_recall_neutral": 0.8333333333333334,
"eval_runtime": 8.1987,
"eval_samples_per_second": 116.359,
"eval_steps_per_second": 3.659,
"step": 500
},
{
"epoch": 0.8733624454148472,
"grad_norm": 10.456722259521484,
"learning_rate": 4.831345826235094e-05,
"loss": 0.1798,
"step": 600
},
{
"epoch": 1.0189228529839884,
"grad_norm": 0.8317745327949524,
"learning_rate": 4.660988074957411e-05,
"loss": 0.1477,
"step": 700
},
{
"epoch": 1.1644832605531295,
"grad_norm": 13.93519401550293,
"learning_rate": 4.490630323679728e-05,
"loss": 0.1027,
"step": 800
},
{
"epoch": 1.3100436681222707,
"grad_norm": 5.650792598724365,
"learning_rate": 4.320272572402044e-05,
"loss": 0.1093,
"step": 900
},
{
"epoch": 1.455604075691412,
"grad_norm": 2.2038004398345947,
"learning_rate": 4.1499148211243615e-05,
"loss": 0.1091,
"step": 1000
},
{
"epoch": 1.455604075691412,
"eval_accuracy": 0.8542976939203354,
"eval_f1": 0.854962642061992,
"eval_f1_bearish": 0.7436823104693141,
"eval_f1_bullish": 0.9034369885433715,
"eval_f1_neutral": 0.78239608801956,
"eval_loss": 0.22784079611301422,
"eval_precision": 0.85731689649448,
"eval_precision_bearish": 0.7744360902255639,
"eval_precision_bullish": 0.9139072847682119,
"eval_precision_neutral": 0.7373271889400922,
"eval_recall": 0.8542976939203354,
"eval_recall_bearish": 0.7152777777777778,
"eval_recall_bullish": 0.8932038834951457,
"eval_recall_neutral": 0.8333333333333334,
"eval_runtime": 8.8257,
"eval_samples_per_second": 108.094,
"eval_steps_per_second": 3.399,
"step": 1000
},
{
"epoch": 1.6011644832605532,
"grad_norm": 4.665580749511719,
"learning_rate": 3.9795570698466784e-05,
"loss": 0.0851,
"step": 1100
},
{
"epoch": 1.7467248908296944,
"grad_norm": 0.20554736256599426,
"learning_rate": 3.809199318568995e-05,
"loss": 0.0983,
"step": 1200
},
{
"epoch": 1.8922852983988356,
"grad_norm": 2.3172614574432373,
"learning_rate": 3.638841567291312e-05,
"loss": 0.0908,
"step": 1300
},
{
"epoch": 2.037845705967977,
"grad_norm": 0.20416907966136932,
"learning_rate": 3.468483816013629e-05,
"loss": 0.072,
"step": 1400
},
{
"epoch": 2.183406113537118,
"grad_norm": 0.08527473360300064,
"learning_rate": 3.298126064735946e-05,
"loss": 0.0316,
"step": 1500
},
{
"epoch": 2.183406113537118,
"eval_accuracy": 0.8616352201257862,
"eval_f1": 0.8636672911856373,
"eval_f1_bearish": 0.7516339869281046,
"eval_f1_bullish": 0.9054726368159204,
"eval_f1_neutral": 0.8131313131313131,
"eval_loss": 0.24344488978385925,
"eval_precision": 0.8675144411363428,
"eval_precision_bearish": 0.7098765432098766,
"eval_precision_bullish": 0.9285714285714286,
"eval_precision_neutral": 0.7892156862745098,
"eval_recall": 0.8616352201257862,
"eval_recall_bearish": 0.7986111111111112,
"eval_recall_bullish": 0.883495145631068,
"eval_recall_neutral": 0.8385416666666666,
"eval_runtime": 8.6074,
"eval_samples_per_second": 110.835,
"eval_steps_per_second": 3.485,
"step": 1500
},
{
"epoch": 2.328966521106259,
"grad_norm": 7.853630065917969,
"learning_rate": 3.1277683134582626e-05,
"loss": 0.0363,
"step": 1600
},
{
"epoch": 2.4745269286754,
"grad_norm": 0.3771085739135742,
"learning_rate": 2.957410562180579e-05,
"loss": 0.0347,
"step": 1700
},
{
"epoch": 2.6200873362445414,
"grad_norm": 3.0605719089508057,
"learning_rate": 2.787052810902896e-05,
"loss": 0.0319,
"step": 1800
},
{
"epoch": 2.7656477438136826,
"grad_norm": 3.2105116844177246,
"learning_rate": 2.616695059625213e-05,
"loss": 0.0359,
"step": 1900
},
{
"epoch": 2.911208151382824,
"grad_norm": 3.7454285621643066,
"learning_rate": 2.44633730834753e-05,
"loss": 0.0361,
"step": 2000
},
{
"epoch": 2.911208151382824,
"eval_accuracy": 0.8584905660377359,
"eval_f1": 0.8593807235316668,
"eval_f1_bearish": 0.7571428571428571,
"eval_f1_bullish": 0.9074529074529074,
"eval_f1_neutral": 0.7813267813267813,
"eval_loss": 0.2744849622249603,
"eval_precision": 0.8616426481335732,
"eval_precision_bearish": 0.7794117647058824,
"eval_precision_bullish": 0.9187396351575456,
"eval_precision_neutral": 0.7395348837209302,
"eval_recall": 0.8584905660377359,
"eval_recall_bearish": 0.7361111111111112,
"eval_recall_bullish": 0.8964401294498382,
"eval_recall_neutral": 0.828125,
"eval_runtime": 8.1534,
"eval_samples_per_second": 117.007,
"eval_steps_per_second": 3.679,
"step": 2000
},
{
"epoch": 3.056768558951965,
"grad_norm": 0.04752872511744499,
"learning_rate": 2.2759795570698465e-05,
"loss": 0.0169,
"step": 2100
},
{
"epoch": 3.2023289665211063,
"grad_norm": 3.445439100265503,
"learning_rate": 2.1056218057921637e-05,
"loss": 0.0094,
"step": 2200
},
{
"epoch": 3.3478893740902476,
"grad_norm": 1.7491494417190552,
"learning_rate": 1.9352640545144805e-05,
"loss": 0.0084,
"step": 2300
},
{
"epoch": 3.493449781659389,
"grad_norm": 1.3558599948883057,
"learning_rate": 1.7649063032367974e-05,
"loss": 0.0155,
"step": 2400
},
{
"epoch": 3.6390101892285296,
"grad_norm": 0.7178720235824585,
"learning_rate": 1.5945485519591142e-05,
"loss": 0.0166,
"step": 2500
},
{
"epoch": 3.6390101892285296,
"eval_accuracy": 0.8752620545073375,
"eval_f1": 0.8745242401633876,
"eval_f1_bearish": 0.7612456747404844,
"eval_f1_bullish": 0.9131474103585657,
"eval_f1_neutral": 0.8351648351648352,
"eval_loss": 0.27798759937286377,
"eval_precision": 0.8750783502197678,
"eval_precision_bearish": 0.7586206896551724,
"eval_precision_bullish": 0.8995290423861853,
"eval_precision_neutral": 0.8837209302325582,
"eval_recall": 0.8752620545073375,
"eval_recall_bearish": 0.7638888888888888,
"eval_recall_bullish": 0.9271844660194175,
"eval_recall_neutral": 0.7916666666666666,
"eval_runtime": 8.5538,
"eval_samples_per_second": 111.529,
"eval_steps_per_second": 3.507,
"step": 2500
},
{
"epoch": 3.7845705967976713,
"grad_norm": 0.5409824252128601,
"learning_rate": 1.424190800681431e-05,
"loss": 0.0072,
"step": 2600
},
{
"epoch": 3.930131004366812,
"grad_norm": 0.007624503690749407,
"learning_rate": 1.253833049403748e-05,
"loss": 0.0051,
"step": 2700
},
{
"epoch": 4.075691411935954,
"grad_norm": 0.03979913145303726,
"learning_rate": 1.0834752981260648e-05,
"loss": 0.0106,
"step": 2800
},
{
"epoch": 4.2212518195050945,
"grad_norm": 0.025390487164258957,
"learning_rate": 9.131175468483816e-06,
"loss": 0.003,
"step": 2900
},
{
"epoch": 4.366812227074236,
"grad_norm": 8.90622615814209,
"learning_rate": 7.427597955706985e-06,
"loss": 0.0066,
"step": 3000
},
{
"epoch": 4.366812227074236,
"eval_accuracy": 0.8742138364779874,
"eval_f1": 0.8740584051302639,
"eval_f1_bearish": 0.7659574468085106,
"eval_f1_bullish": 0.9174757281553398,
"eval_f1_neutral": 0.8153846153846154,
"eval_loss": 0.3259490132331848,
"eval_precision": 0.8740853986957351,
"eval_precision_bearish": 0.782608695652174,
"eval_precision_bullish": 0.9174757281553398,
"eval_precision_neutral": 0.803030303030303,
"eval_recall": 0.8742138364779874,
"eval_recall_bearish": 0.75,
"eval_recall_bullish": 0.9174757281553398,
"eval_recall_neutral": 0.828125,
"eval_runtime": 9.0626,
"eval_samples_per_second": 105.268,
"eval_steps_per_second": 3.31,
"step": 3000
},
{
"epoch": 4.512372634643377,
"grad_norm": 0.0042578354477882385,
"learning_rate": 5.724020442930154e-06,
"loss": 0.0021,
"step": 3100
},
{
"epoch": 4.657933042212518,
"grad_norm": 0.0550072155892849,
"learning_rate": 4.0204429301533224e-06,
"loss": 0.0065,
"step": 3200
},
{
"epoch": 4.8034934497816595,
"grad_norm": 0.019497277215123177,
"learning_rate": 2.3168654173764905e-06,
"loss": 0.0023,
"step": 3300
},
{
"epoch": 4.9490538573508,
"grad_norm": 0.012889917939901352,
"learning_rate": 6.132879045996593e-07,
"loss": 0.0031,
"step": 3400
}
],
"logging_steps": 100,
"max_steps": 3435,
"num_input_tokens_seen": 0,
"num_train_epochs": 5,
"save_steps": 500,
"stateful_callbacks": {
"EarlyStoppingCallback": {
"args": {
"early_stopping_patience": 3,
"early_stopping_threshold": 0.0
},
"attributes": {
"early_stopping_patience_counter": 1
}
},
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.444624220035584e+16,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}