| { | |
| "best_metric": null, | |
| "best_model_checkpoint": null, | |
| "epoch": 3.0, | |
| "eval_steps": 100, | |
| "global_step": 3039, | |
| "is_hyper_param_search": false, | |
| "is_local_process_zero": true, | |
| "is_world_process_zero": true, | |
| "log_history": [ | |
| { | |
| "epoch": 0.09871668311944719, | |
| "grad_norm": 7.595918655395508, | |
| "learning_rate": 6.578947368421054e-06, | |
| "loss": 0.4785, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.09871668311944719, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.48153268812956745, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.8239186253209559, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.6804266245309105, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.7476298637171638, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.6014421644194009, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.5954963687693909, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.650756003676077, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.48153268812956745, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.0823918625320956, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.22680887484363688, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.14952597274343274, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.48153268812956745, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.8239186253209559, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.6804266245309105, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.7476298637171638, | |
| "eval_loss": 0.4484286308288574, | |
| "eval_runtime": 204.03, | |
| "eval_samples_per_second": 9.925, | |
| "eval_steps_per_second": 0.622, | |
| "step": 100 | |
| }, | |
| { | |
| "epoch": 0.19743336623889438, | |
| "grad_norm": 10.92927074432373, | |
| "learning_rate": 1.3157894736842108e-05, | |
| "loss": 0.4112, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.19743336623889438, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5033083152281256, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.8463855421686747, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7041279873592732, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.772615050365396, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.624250951720462, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6187061477761295, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.6738741593374042, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5033083152281256, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.08463855421686747, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2347093291197577, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.1545230100730792, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5033083152281256, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.8463855421686747, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7041279873592732, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.772615050365396, | |
| "eval_loss": 0.3707010746002197, | |
| "eval_runtime": 203.8165, | |
| "eval_samples_per_second": 9.935, | |
| "eval_steps_per_second": 0.623, | |
| "step": 200 | |
| }, | |
| { | |
| "epoch": 0.29615004935834155, | |
| "grad_norm": 33.57826232910156, | |
| "learning_rate": 1.9736842105263158e-05, | |
| "loss": 0.2838, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 0.29615004935834155, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5243432747382974, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.860655737704918, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7234841003357693, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.7913292514319573, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.6432678473897245, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6380460561998335, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.6920347683997495, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5243432747382974, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.0860655737704918, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.24116136677858976, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.15826585028639148, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5243432747382974, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.860655737704918, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7234841003357693, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.7913292514319573, | |
| "eval_loss": 0.32815688848495483, | |
| "eval_runtime": 203.3881, | |
| "eval_samples_per_second": 9.956, | |
| "eval_steps_per_second": 0.624, | |
| "step": 300 | |
| }, | |
| { | |
| "epoch": 0.39486673247778875, | |
| "grad_norm": 2.814175605773926, | |
| "learning_rate": 1.9297989031078612e-05, | |
| "loss": 0.2422, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.39486673247778875, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5371321350977681, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.8726051747975508, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7371123839620778, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8044143788267826, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.6563831674366017, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6514166541262787, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7051169138321652, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5371321350977681, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.08726051747975509, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.24570412798735927, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.1608828757653565, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5371321350977681, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.8726051747975508, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7371123839620778, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8044143788267826, | |
| "eval_loss": 0.28870803117752075, | |
| "eval_runtime": 203.6125, | |
| "eval_samples_per_second": 9.945, | |
| "eval_steps_per_second": 0.624, | |
| "step": 400 | |
| }, | |
| { | |
| "epoch": 0.49358341559723595, | |
| "grad_norm": 7.553986072540283, | |
| "learning_rate": 1.856672760511883e-05, | |
| "loss": 0.2369, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.49358341559723595, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5465139245506616, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.8817894528935414, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7465929290934229, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8143393245111594, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.6652980546980072, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6607006284309909, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.714385034123883, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5465139245506616, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.08817894528935415, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.24886430969780762, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.16286786490223187, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5465139245506616, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.8817894528935414, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7465929290934229, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8143393245111594, | |
| "eval_loss": 0.28374621272087097, | |
| "eval_runtime": 204.4559, | |
| "eval_samples_per_second": 9.904, | |
| "eval_steps_per_second": 0.621, | |
| "step": 500 | |
| }, | |
| { | |
| "epoch": 0.5923000987166831, | |
| "grad_norm": 32.98969268798828, | |
| "learning_rate": 1.783546617915905e-05, | |
| "loss": 0.2899, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 0.5923000987166831, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5526367766146554, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.8908749753110804, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7583448548291527, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8260912502468892, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.6738304576911812, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.669296996730104, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7232271970632966, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5526367766146554, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.08908749753110803, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.25278161827638423, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.16521825004937787, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5526367766146554, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.8908749753110804, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7583448548291527, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8260912502468892, | |
| "eval_loss": 0.26842400431632996, | |
| "eval_runtime": 203.2737, | |
| "eval_samples_per_second": 9.962, | |
| "eval_steps_per_second": 0.625, | |
| "step": 600 | |
| }, | |
| { | |
| "epoch": 0.6910167818361304, | |
| "grad_norm": 9.886919021606445, | |
| "learning_rate": 1.710420475319927e-05, | |
| "loss": 0.1801, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 0.6910167818361304, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5653268812956745, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.8955164921983014, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7669365988544341, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8332510369346238, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.683737510172223, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6793955094382355, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7320247334733945, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5653268812956745, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.08955164921983014, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.255645532951478, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.16665020738692476, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5653268812956745, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.8955164921983014, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7669365988544341, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8332510369346238, | |
| "eval_loss": 0.2664617896080017, | |
| "eval_runtime": 203.9076, | |
| "eval_samples_per_second": 9.931, | |
| "eval_steps_per_second": 0.623, | |
| "step": 700 | |
| }, | |
| { | |
| "epoch": 0.7897334649555775, | |
| "grad_norm": 17.79576873779297, | |
| "learning_rate": 1.637294332723949e-05, | |
| "loss": 0.2279, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 0.7897334649555775, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5654256369741261, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.8918131542563698, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7636282836263085, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8272763183883073, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.6824116708533701, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6777940607081065, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7298590424609255, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5654256369741261, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.08918131542563698, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2545427612087695, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.16545526367766147, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5654256369741261, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.8918131542563698, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7636282836263085, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8272763183883073, | |
| "eval_loss": 0.2617240250110626, | |
| "eval_runtime": 203.217, | |
| "eval_samples_per_second": 9.965, | |
| "eval_steps_per_second": 0.625, | |
| "step": 800 | |
| }, | |
| { | |
| "epoch": 0.8884501480750246, | |
| "grad_norm": 29.348552703857422, | |
| "learning_rate": 1.564168190127971e-05, | |
| "loss": 0.2051, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 0.8884501480750246, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5677463954177365, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.8971953387319771, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7670353545328856, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8318190795970768, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.6851778091536691, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6808611691104925, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7334481505960582, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5677463954177365, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.08971953387319773, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.25567845151096186, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.16636381591941535, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5677463954177365, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.8971953387319771, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7670353545328856, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8318190795970768, | |
| "eval_loss": 0.26834186911582947, | |
| "eval_runtime": 203.4633, | |
| "eval_samples_per_second": 9.953, | |
| "eval_steps_per_second": 0.624, | |
| "step": 900 | |
| }, | |
| { | |
| "epoch": 0.9871668311944719, | |
| "grad_norm": 0.5696656703948975, | |
| "learning_rate": 1.491042047531993e-05, | |
| "loss": 0.2097, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 0.9871668311944719, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5728323128579893, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9064783725064192, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7784910132332609, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8429290934228718, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.692767963880535, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6886411963231704, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.741697294005231, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5728323128579893, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09064783725064192, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.259497004411087, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.1685858186845744, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5728323128579893, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9064783725064192, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7784910132332609, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8429290934228718, | |
| "eval_loss": 0.2445395439863205, | |
| "eval_runtime": 203.8284, | |
| "eval_samples_per_second": 9.935, | |
| "eval_steps_per_second": 0.623, | |
| "step": 1000 | |
| }, | |
| { | |
| "epoch": 1.085883514313919, | |
| "grad_norm": 5.538768291473389, | |
| "learning_rate": 1.4179159049360148e-05, | |
| "loss": 0.1047, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 1.085883514313919, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5813253012048193, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9092435315030615, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7825399960497729, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8449535848311278, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.6984402538800855, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6944231453526992, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7466897096167746, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5813253012048193, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09092435315030614, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2608466653499243, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.16899071696622553, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5813253012048193, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9092435315030615, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7825399960497729, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8449535848311278, | |
| "eval_loss": 0.23973241448402405, | |
| "eval_runtime": 203.3277, | |
| "eval_samples_per_second": 9.959, | |
| "eval_steps_per_second": 0.625, | |
| "step": 1100 | |
| }, | |
| { | |
| "epoch": 1.1846001974333662, | |
| "grad_norm": 6.3217902183532715, | |
| "learning_rate": 1.3447897623400368e-05, | |
| "loss": 0.0984, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 1.1846001974333662, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5921390479952597, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9151688722101521, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7911317400750543, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8541378629271184, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7083777420863926, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7045087061752225, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.755835586028989, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5921390479952597, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09151688722101521, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2637105800250181, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.1708275725854237, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5921390479952597, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9151688722101521, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7911317400750543, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8541378629271184, | |
| "eval_loss": 0.2229250818490982, | |
| "eval_runtime": 203.6954, | |
| "eval_samples_per_second": 9.941, | |
| "eval_steps_per_second": 0.623, | |
| "step": 1200 | |
| }, | |
| { | |
| "epoch": 1.2833168805528135, | |
| "grad_norm": 11.505134582519531, | |
| "learning_rate": 1.2716636197440586e-05, | |
| "loss": 0.0498, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 1.2833168805528135, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5782638751728224, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9055895714003556, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7789354137862927, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8386825992494569, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.6954513367155198, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.6912109797503966, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7433337553688117, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5782638751728224, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09055895714003556, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2596451379287642, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.16773651984989138, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5782638751728224, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9055895714003556, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7789354137862927, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8386825992494569, | |
| "eval_loss": 0.2586788237094879, | |
| "eval_runtime": 204.0885, | |
| "eval_samples_per_second": 9.922, | |
| "eval_steps_per_second": 0.622, | |
| "step": 1300 | |
| }, | |
| { | |
| "epoch": 1.3820335636722607, | |
| "grad_norm": 1.1614787578582764, | |
| "learning_rate": 1.1985374771480804e-05, | |
| "loss": 0.0993, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 1.3820335636722607, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.59411416156429, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9151194943709263, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7925636974126012, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8543353742840213, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7096847447019631, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.705814299351989, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7568020206373794, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.59411416156429, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09151194943709264, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2641878991375337, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17086707485680427, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.59411416156429, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9151194943709263, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7925636974126012, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8543353742840213, | |
| "eval_loss": 0.2147156298160553, | |
| "eval_runtime": 204.4732, | |
| "eval_samples_per_second": 9.903, | |
| "eval_steps_per_second": 0.621, | |
| "step": 1400 | |
| }, | |
| { | |
| "epoch": 1.4807502467917077, | |
| "grad_norm": 1.6429851055145264, | |
| "learning_rate": 1.1254113345521024e-05, | |
| "loss": 0.0621, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 1.4807502467917077, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5962867864902232, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9217855026664034, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7997234841003358, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.860853249061821, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7136002941229976, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7100783500904636, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7616828218263099, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5962867864902232, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09217855026664035, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2665744947001119, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.1721706498123642, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5962867864902232, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9217855026664034, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7997234841003358, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.860853249061821, | |
| "eval_loss": 0.20447228848934174, | |
| "eval_runtime": 204.051, | |
| "eval_samples_per_second": 9.924, | |
| "eval_steps_per_second": 0.622, | |
| "step": 1500 | |
| }, | |
| { | |
| "epoch": 1.579466929911155, | |
| "grad_norm": 15.424310684204102, | |
| "learning_rate": 1.0522851919561243e-05, | |
| "loss": 0.0922, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 1.579466929911155, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.5950029626703536, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9201560339719533, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.7980446375666601, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.858038712225953, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7121969229630567, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7085377027234775, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7601050276866773, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.5950029626703536, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09201560339719535, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.26601487918888667, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17160774244519061, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.5950029626703536, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9201560339719533, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.7980446375666601, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.858038712225953, | |
| "eval_loss": 0.20542284846305847, | |
| "eval_runtime": 203.1105, | |
| "eval_samples_per_second": 9.97, | |
| "eval_steps_per_second": 0.625, | |
| "step": 1600 | |
| }, | |
| { | |
| "epoch": 1.678183613030602, | |
| "grad_norm": 4.0268096923828125, | |
| "learning_rate": 9.791590493601464e-06, | |
| "loss": 0.1093, | |
| "step": 1700 | |
| }, | |
| { | |
| "epoch": 1.678183613030602, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6026071499111199, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9248469286984001, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8095496741062611, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8681117914280071, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7204789219182511, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7169305441908291, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7677587208908659, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6026071499111199, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09248469286984001, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.26984989136875365, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.1736223582856014, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6026071499111199, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9248469286984001, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8095496741062611, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8681117914280071, | |
| "eval_loss": 0.1992715299129486, | |
| "eval_runtime": 203.9449, | |
| "eval_samples_per_second": 9.929, | |
| "eval_steps_per_second": 0.623, | |
| "step": 1700 | |
| }, | |
| { | |
| "epoch": 1.7769002961500493, | |
| "grad_norm": 0.6978006958961487, | |
| "learning_rate": 9.060329067641682e-06, | |
| "loss": 0.0795, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 1.7769002961500493, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.605816709460794, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9286984001580091, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8117222990321944, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8722101520837449, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7237388658743508, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7203004837460861, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7712328450315743, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.605816709460794, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09286984001580093, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2705740996773981, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17444203041674897, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.605816709460794, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9286984001580091, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8117222990321944, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8722101520837449, | |
| "eval_loss": 0.19426828622817993, | |
| "eval_runtime": 204.0488, | |
| "eval_samples_per_second": 9.924, | |
| "eval_steps_per_second": 0.622, | |
| "step": 1800 | |
| }, | |
| { | |
| "epoch": 1.8756169792694966, | |
| "grad_norm": 2.5955662727355957, | |
| "learning_rate": 8.329067641681902e-06, | |
| "loss": 0.1181, | |
| "step": 1900 | |
| }, | |
| { | |
| "epoch": 1.8756169792694966, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6043353742840213, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9297847126209757, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8089077621963263, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8701362828362631, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7219374022367849, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7185761194661708, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7700958544922684, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6043353742840213, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09297847126209759, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2696359207321088, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17402725656725263, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6043353742840213, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9297847126209757, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8089077621963263, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8701362828362631, | |
| "eval_loss": 0.20659147202968597, | |
| "eval_runtime": 204.0716, | |
| "eval_samples_per_second": 9.923, | |
| "eval_steps_per_second": 0.622, | |
| "step": 1900 | |
| }, | |
| { | |
| "epoch": 1.9743336623889438, | |
| "grad_norm": 0.8803901672363281, | |
| "learning_rate": 7.597806215722121e-06, | |
| "loss": 0.0709, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 1.9743336623889438, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.603199683981829, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9302784910132332, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8102903416946474, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8703831720323919, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7214873578820934, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7181931668908422, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7699451899898953, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.603199683981829, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09302784910132333, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.27009678056488245, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.1740766344064784, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.603199683981829, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9302784910132332, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8102903416946474, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8703831720323919, | |
| "eval_loss": 0.19996753334999084, | |
| "eval_runtime": 203.9747, | |
| "eval_samples_per_second": 9.928, | |
| "eval_steps_per_second": 0.623, | |
| "step": 2000 | |
| }, | |
| { | |
| "epoch": 2.073050345508391, | |
| "grad_norm": 0.9776083827018738, | |
| "learning_rate": 6.866544789762341e-06, | |
| "loss": 0.0423, | |
| "step": 2100 | |
| }, | |
| { | |
| "epoch": 2.073050345508391, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6150503653960103, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9359075646849694, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8209065771281848, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8796168279676081, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7317976394363255, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.728681000348013, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7793256141306921, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6150503653960103, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09359075646849695, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.27363552570939487, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17592336559352165, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6150503653960103, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9359075646849694, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8209065771281848, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8796168279676081, | |
| "eval_loss": 0.19277189671993256, | |
| "eval_runtime": 203.5377, | |
| "eval_samples_per_second": 9.949, | |
| "eval_steps_per_second": 0.624, | |
| "step": 2100 | |
| }, | |
| { | |
| "epoch": 2.171767028627838, | |
| "grad_norm": 0.3466501235961914, | |
| "learning_rate": 6.13528336380256e-06, | |
| "loss": 0.0365, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 2.171767028627838, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6160379221805253, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9352162749358088, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8210547106458621, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8787280268615445, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7324401240286031, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7293587895689079, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7796830803735836, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6160379221805253, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.0935216274935809, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2736849035486207, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17574560537230893, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6160379221805253, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9352162749358088, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8210547106458621, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8787280268615445, | |
| "eval_loss": 0.2016632854938507, | |
| "eval_runtime": 203.3562, | |
| "eval_samples_per_second": 9.958, | |
| "eval_steps_per_second": 0.625, | |
| "step": 2200 | |
| }, | |
| { | |
| "epoch": 2.270483711747285, | |
| "grad_norm": 11.319628715515137, | |
| "learning_rate": 5.40402193784278e-06, | |
| "loss": 0.0488, | |
| "step": 2300 | |
| }, | |
| { | |
| "epoch": 2.270483711747285, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6060635986569227, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9303772466916848, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.810784120086905, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8715188623345842, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7233919610739875, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7200670950782208, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7713978686997449, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6060635986569227, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09303772466916849, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.27026137336230166, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17430377246691683, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6060635986569227, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9303772466916848, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.810784120086905, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8715188623345842, | |
| "eval_loss": 0.2220190316438675, | |
| "eval_runtime": 203.7981, | |
| "eval_samples_per_second": 9.936, | |
| "eval_steps_per_second": 0.623, | |
| "step": 2300 | |
| }, | |
| { | |
| "epoch": 2.3692003948667324, | |
| "grad_norm": 1.2127763032913208, | |
| "learning_rate": 4.672760511882998e-06, | |
| "loss": 0.0405, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 2.3692003948667324, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.612482717756271, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9345249851866483, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8190302192376062, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8769010468101915, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7299302543873705, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7267631415592252, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7775318729565346, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.612482717756271, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09345249851866484, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.27301007307920205, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17538020936203833, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.612482717756271, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9345249851866483, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8190302192376062, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8769010468101915, | |
| "eval_loss": 0.20903073251247406, | |
| "eval_runtime": 204.2344, | |
| "eval_samples_per_second": 9.915, | |
| "eval_steps_per_second": 0.622, | |
| "step": 2400 | |
| }, | |
| { | |
| "epoch": 2.4679170779861797, | |
| "grad_norm": 0.3473336398601532, | |
| "learning_rate": 3.941499085923218e-06, | |
| "loss": 0.0327, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 2.4679170779861797, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6181611692672329, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9379814339324511, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8215484890381197, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8832214102310882, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7347609073841157, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7317605707764854, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7821769875234544, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6181611692672329, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09379814339324512, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.27384949634603983, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17664428204621765, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6181611692672329, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9379814339324511, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8215484890381197, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8832214102310882, | |
| "eval_loss": 0.1959671527147293, | |
| "eval_runtime": 204.2804, | |
| "eval_samples_per_second": 9.913, | |
| "eval_steps_per_second": 0.622, | |
| "step": 2500 | |
| }, | |
| { | |
| "epoch": 2.566633761105627, | |
| "grad_norm": 3.084174871444702, | |
| "learning_rate": 3.210237659963437e-06, | |
| "loss": 0.0369, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 2.566633761105627, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6188524590163934, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9379814339324511, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8248568042662453, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.882678253999605, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7355447502017791, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7324816047954649, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7827478877040044, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6188524590163934, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09379814339324513, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2749522680887484, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17653565079992103, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6188524590163934, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9379814339324511, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8248568042662453, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.882678253999605, | |
| "eval_loss": 0.19852839410305023, | |
| "eval_runtime": 203.3999, | |
| "eval_samples_per_second": 9.956, | |
| "eval_steps_per_second": 0.624, | |
| "step": 2600 | |
| }, | |
| { | |
| "epoch": 2.665350444225074, | |
| "grad_norm": 0.2841149568557739, | |
| "learning_rate": 2.4789762340036565e-06, | |
| "loss": 0.0493, | |
| "step": 2700 | |
| }, | |
| { | |
| "epoch": 2.665350444225074, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6227039304760024, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9392652577523207, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8246099150701165, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8839126999802489, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7377982498848669, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7347973078888687, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7847760881684369, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6227039304760024, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.0939265257752321, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2748699716900388, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.1767825399960498, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6227039304760024, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9392652577523207, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8246099150701165, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8839126999802489, | |
| "eval_loss": 0.1986970454454422, | |
| "eval_runtime": 203.1067, | |
| "eval_samples_per_second": 9.97, | |
| "eval_steps_per_second": 0.625, | |
| "step": 2700 | |
| }, | |
| { | |
| "epoch": 2.7640671273445214, | |
| "grad_norm": 35.21987533569336, | |
| "learning_rate": 1.7477148080438758e-06, | |
| "loss": 0.0466, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 2.7640671273445214, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6232964645467114, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9393640134307722, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8262887616037922, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8854434129962473, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7388327302504635, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7358363978944812, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7856277834747031, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6232964645467114, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09393640134307724, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2754295872012641, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17708868259924945, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6232964645467114, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9393640134307722, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8262887616037922, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8854434129962473, | |
| "eval_loss": 0.20075508952140808, | |
| "eval_runtime": 203.5383, | |
| "eval_samples_per_second": 9.949, | |
| "eval_steps_per_second": 0.624, | |
| "step": 2800 | |
| }, | |
| { | |
| "epoch": 2.8627838104639682, | |
| "grad_norm": 1.2376320362091064, | |
| "learning_rate": 1.0164533820840951e-06, | |
| "loss": 0.03, | |
| "step": 2900 | |
| }, | |
| { | |
| "epoch": 2.8627838104639682, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.6220620185660676, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9396109026269011, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8248568042662453, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8844558562117322, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7376002793094979, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7346429237637674, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7847496074277119, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.6220620185660676, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09396109026269013, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2749522680887484, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17689117124234646, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.6220620185660676, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9396109026269011, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8248568042662453, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8844558562117322, | |
| "eval_loss": 0.2035462111234665, | |
| "eval_runtime": 202.781, | |
| "eval_samples_per_second": 9.986, | |
| "eval_steps_per_second": 0.626, | |
| "step": 2900 | |
| }, | |
| { | |
| "epoch": 2.9615004935834155, | |
| "grad_norm": 0.5317863821983337, | |
| "learning_rate": 2.8519195612431445e-07, | |
| "loss": 0.0633, | |
| "step": 3000 | |
| }, | |
| { | |
| "epoch": 2.9615004935834155, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@1": 0.621963262887616, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@10": 0.9401046810191586, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@3": 0.8262393837645665, | |
| "eval_custom_dataset_evaluation_cosine_accuracy@5": 0.8843077226940549, | |
| "eval_custom_dataset_evaluation_cosine_map@100": 0.7376242387041089, | |
| "eval_custom_dataset_evaluation_cosine_mrr@10": 0.7346985522104195, | |
| "eval_custom_dataset_evaluation_cosine_ndcg@10": 0.7849111131501391, | |
| "eval_custom_dataset_evaluation_cosine_precision@1": 0.621963262887616, | |
| "eval_custom_dataset_evaluation_cosine_precision@10": 0.09401046810191586, | |
| "eval_custom_dataset_evaluation_cosine_precision@3": 0.2754131279215221, | |
| "eval_custom_dataset_evaluation_cosine_precision@5": 0.17686154453881098, | |
| "eval_custom_dataset_evaluation_cosine_recall@1": 0.621963262887616, | |
| "eval_custom_dataset_evaluation_cosine_recall@10": 0.9401046810191586, | |
| "eval_custom_dataset_evaluation_cosine_recall@3": 0.8262393837645665, | |
| "eval_custom_dataset_evaluation_cosine_recall@5": 0.8843077226940549, | |
| "eval_loss": 0.20363624393939972, | |
| "eval_runtime": 203.946, | |
| "eval_samples_per_second": 9.929, | |
| "eval_steps_per_second": 0.623, | |
| "step": 3000 | |
| } | |
| ], | |
| "logging_steps": 100, | |
| "max_steps": 3039, | |
| "num_input_tokens_seen": 0, | |
| "num_train_epochs": 3, | |
| "save_steps": 500, | |
| "stateful_callbacks": { | |
| "TrainerControl": { | |
| "args": { | |
| "should_epoch_stop": false, | |
| "should_evaluate": false, | |
| "should_log": false, | |
| "should_save": true, | |
| "should_training_stop": true | |
| }, | |
| "attributes": {} | |
| } | |
| }, | |
| "total_flos": 0.0, | |
| "train_batch_size": 16, | |
| "trial_name": null, | |
| "trial_params": null | |
| } | |