Upload ./trainer_log.jsonl with huggingface_hub
Browse files- trainer_log.jsonl +28 -50
trainer_log.jsonl
CHANGED
@@ -1,50 +1,28 @@
|
|
1 |
-
{"current_steps": 1, "total_steps":
|
2 |
-
{"current_steps":
|
3 |
-
{"current_steps":
|
4 |
-
{"current_steps":
|
5 |
-
{"current_steps":
|
6 |
-
{"current_steps":
|
7 |
-
{"current_steps":
|
8 |
-
{"current_steps":
|
9 |
-
{"current_steps":
|
10 |
-
{"current_steps":
|
11 |
-
{"current_steps":
|
12 |
-
{"current_steps":
|
13 |
-
{"current_steps":
|
14 |
-
{"current_steps":
|
15 |
-
{"current_steps":
|
16 |
-
{"current_steps":
|
17 |
-
{"current_steps":
|
18 |
-
{"current_steps":
|
19 |
-
{"current_steps":
|
20 |
-
{"current_steps":
|
21 |
-
{"current_steps":
|
22 |
-
{"current_steps":
|
23 |
-
{"current_steps":
|
24 |
-
{"current_steps":
|
25 |
-
{"current_steps":
|
26 |
-
{"current_steps":
|
27 |
-
{"current_steps":
|
28 |
-
{"current_steps":
|
29 |
-
{"current_steps": 115, "total_steps": 192, "loss": 0.3573, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.329471712759216e-08, "epoch": 2.3958333333333335, "percentage": 59.9, "elapsed_time": "0:09:26", "remaining_time": "0:06:19"}
|
30 |
-
{"current_steps": 120, "total_steps": 192, "loss": 0.3982, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.161995210302015e-08, "epoch": 2.5, "percentage": 62.5, "elapsed_time": "0:09:33", "remaining_time": "0:05:43"}
|
31 |
-
{"current_steps": 120, "total_steps": 192, "loss": null, "eval_loss": 0.8576084971427917, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.5, "percentage": 62.5, "elapsed_time": "0:09:33", "remaining_time": "0:05:43"}
|
32 |
-
{"current_steps": 125, "total_steps": 192, "loss": 0.3815, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.075841465580837e-08, "epoch": 2.6041666666666665, "percentage": 65.1, "elapsed_time": "0:11:10", "remaining_time": "0:05:59"}
|
33 |
-
{"current_steps": 130, "total_steps": 192, "loss": 0.3762, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.033564114946932e-08, "epoch": 2.7083333333333335, "percentage": 67.71, "elapsed_time": "0:11:17", "remaining_time": "0:05:22"}
|
34 |
-
{"current_steps": 135, "total_steps": 192, "loss": 0.3809, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.013915282607116e-08, "epoch": 2.8125, "percentage": 70.31, "elapsed_time": "0:11:23", "remaining_time": "0:04:48"}
|
35 |
-
{"current_steps": 140, "total_steps": 192, "loss": 0.3742, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.005343402153039e-08, "epoch": 2.9166666666666665, "percentage": 72.92, "elapsed_time": "0:11:30", "remaining_time": "0:04:16"}
|
36 |
-
{"current_steps": 140, "total_steps": 192, "loss": null, "eval_loss": 0.8624204993247986, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 2.9166666666666665, "percentage": 72.92, "elapsed_time": "0:11:30", "remaining_time": "0:04:16"}
|
37 |
-
{"current_steps": 145, "total_steps": 192, "loss": 0.3793, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.001872829857116e-08, "epoch": 3.0208333333333335, "percentage": 75.52, "elapsed_time": "0:13:06", "remaining_time": "0:04:15"}
|
38 |
-
{"current_steps": 150, "total_steps": 192, "loss": 0.3734, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000587713853837e-08, "epoch": 3.125, "percentage": 78.12, "elapsed_time": "0:13:15", "remaining_time": "0:03:42"}
|
39 |
-
{"current_steps": 155, "total_steps": 192, "loss": 0.3713, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0001608748597456e-08, "epoch": 3.2291666666666665, "percentage": 80.73, "elapsed_time": "0:13:22", "remaining_time": "0:03:11"}
|
40 |
-
{"current_steps": 160, "total_steps": 192, "loss": 0.3692, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000370319656156e-08, "epoch": 3.3333333333333335, "percentage": 83.33, "elapsed_time": "0:13:29", "remaining_time": "0:02:41"}
|
41 |
-
{"current_steps": 160, "total_steps": 192, "loss": null, "eval_loss": 0.8662496209144592, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.3333333333333335, "percentage": 83.33, "elapsed_time": "0:13:29", "remaining_time": "0:02:41"}
|
42 |
-
{"current_steps": 165, "total_steps": 192, "loss": 0.3657, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000067945715855e-08, "epoch": 3.4375, "percentage": 85.94, "elapsed_time": "0:15:04", "remaining_time": "0:02:28"}
|
43 |
-
{"current_steps": 170, "total_steps": 192, "loss": 0.3513, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000009144677036e-08, "epoch": 3.5416666666666665, "percentage": 88.54, "elapsed_time": "0:15:11", "remaining_time": "0:01:57"}
|
44 |
-
{"current_steps": 175, "total_steps": 192, "loss": 0.3683, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.0000000785521776e-08, "epoch": 3.6458333333333335, "percentage": 91.15, "elapsed_time": "0:15:17", "remaining_time": "0:01:29"}
|
45 |
-
{"current_steps": 180, "total_steps": 192, "loss": 0.3667, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000000003317662e-08, "epoch": 3.75, "percentage": 93.75, "elapsed_time": "0:15:25", "remaining_time": "0:01:01"}
|
46 |
-
{"current_steps": 180, "total_steps": 192, "loss": null, "eval_loss": 0.8689968585968018, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 3.75, "percentage": 93.75, "elapsed_time": "0:15:25", "remaining_time": "0:01:01"}
|
47 |
-
{"current_steps": 185, "total_steps": 192, "loss": 0.3741, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000000000038355e-08, "epoch": 3.8541666666666665, "percentage": 96.35, "elapsed_time": "0:17:01", "remaining_time": "0:00:38"}
|
48 |
-
{"current_steps": 190, "total_steps": 192, "loss": 0.3694, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 5.000000000000018e-08, "epoch": 3.9583333333333335, "percentage": 98.96, "elapsed_time": "0:17:08", "remaining_time": "0:00:10"}
|
49 |
-
{"current_steps": 192, "total_steps": 192, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "0:17:10", "remaining_time": "0:00:00"}
|
50 |
-
{"current_steps": 3, "total_steps": 3, "loss": null, "eval_loss": 0.8514555096626282, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 4.0, "percentage": 100.0, "elapsed_time": "0:17:44", "remaining_time": "0:00:00"}
|
|
|
1 |
+
{"current_steps": 1, "total_steps": 48, "loss": 0.9436, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 0.0, "epoch": 0.020833333333333332, "percentage": 2.08, "elapsed_time": "0:00:05", "remaining_time": "0:04:25"}
|
2 |
+
{"current_steps": 3, "total_steps": 48, "loss": 0.8831, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 7.5e-07, "epoch": 0.0625, "percentage": 6.25, "elapsed_time": "0:00:07", "remaining_time": "0:01:48"}
|
3 |
+
{"current_steps": 5, "total_steps": 48, "loss": null, "eval_loss": 0.9745497703552246, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.10416666666666667, "percentage": 10.42, "elapsed_time": "0:00:08", "remaining_time": "0:01:14"}
|
4 |
+
{"current_steps": 6, "total_steps": 48, "loss": 1.005, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.25e-06, "epoch": 0.125, "percentage": 12.5, "elapsed_time": "0:00:10", "remaining_time": "0:01:11"}
|
5 |
+
{"current_steps": 9, "total_steps": 48, "loss": 0.8656, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.865909090909091e-06, "epoch": 0.1875, "percentage": 18.75, "elapsed_time": "0:00:12", "remaining_time": "0:00:53"}
|
6 |
+
{"current_steps": 10, "total_steps": 48, "loss": null, "eval_loss": 0.8130785822868347, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.20833333333333334, "percentage": 20.83, "elapsed_time": "0:00:12", "remaining_time": "0:00:49"}
|
7 |
+
{"current_steps": 12, "total_steps": 48, "loss": 0.7828, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.6647727272727274e-06, "epoch": 0.25, "percentage": 25.0, "elapsed_time": "0:01:00", "remaining_time": "0:03:02"}
|
8 |
+
{"current_steps": 15, "total_steps": 48, "loss": 0.834, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.4636363636363635e-06, "epoch": 0.3125, "percentage": 31.25, "elapsed_time": "0:01:03", "remaining_time": "0:02:18"}
|
9 |
+
{"current_steps": 15, "total_steps": 48, "loss": null, "eval_loss": 0.802370548248291, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.3125, "percentage": 31.25, "elapsed_time": "0:01:03", "remaining_time": "0:02:18"}
|
10 |
+
{"current_steps": 18, "total_steps": 48, "loss": 0.7683, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.2625e-06, "epoch": 0.375, "percentage": 37.5, "elapsed_time": "0:01:06", "remaining_time": "0:01:50"}
|
11 |
+
{"current_steps": 20, "total_steps": 48, "loss": null, "eval_loss": 0.7906376719474792, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.4166666666666667, "percentage": 41.67, "elapsed_time": "0:01:08", "remaining_time": "0:01:35"}
|
12 |
+
{"current_steps": 21, "total_steps": 48, "loss": 0.7992, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.0613636363636364e-06, "epoch": 0.4375, "percentage": 43.75, "elapsed_time": "0:01:57", "remaining_time": "0:02:30"}
|
13 |
+
{"current_steps": 24, "total_steps": 48, "loss": 0.7188, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.8602272727272725e-06, "epoch": 0.5, "percentage": 50.0, "elapsed_time": "0:01:59", "remaining_time": "0:01:59"}
|
14 |
+
{"current_steps": 25, "total_steps": 48, "loss": null, "eval_loss": 0.7848005294799805, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.5208333333333334, "percentage": 52.08, "elapsed_time": "0:01:59", "remaining_time": "0:01:50"}
|
15 |
+
{"current_steps": 27, "total_steps": 48, "loss": 0.7912, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.659090909090909e-06, "epoch": 0.5625, "percentage": 56.25, "elapsed_time": "0:02:01", "remaining_time": "0:01:34"}
|
16 |
+
{"current_steps": 30, "total_steps": 48, "loss": 0.8186, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.4579545454545454e-06, "epoch": 0.625, "percentage": 62.5, "elapsed_time": "0:02:03", "remaining_time": "0:01:14"}
|
17 |
+
{"current_steps": 30, "total_steps": 48, "loss": null, "eval_loss": 0.7805004119873047, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.625, "percentage": 62.5, "elapsed_time": "0:02:03", "remaining_time": "0:01:14"}
|
18 |
+
{"current_steps": 33, "total_steps": 48, "loss": 0.6864, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.2568181818181817e-06, "epoch": 0.6875, "percentage": 68.75, "elapsed_time": "0:02:54", "remaining_time": "0:01:19"}
|
19 |
+
{"current_steps": 35, "total_steps": 48, "loss": null, "eval_loss": 0.7762691378593445, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.7291666666666666, "percentage": 72.92, "elapsed_time": "0:02:55", "remaining_time": "0:01:05"}
|
20 |
+
{"current_steps": 36, "total_steps": 48, "loss": 0.7509, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 1.0556818181818182e-06, "epoch": 0.75, "percentage": 75.0, "elapsed_time": "0:02:57", "remaining_time": "0:00:59"}
|
21 |
+
{"current_steps": 39, "total_steps": 48, "loss": 0.7036, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 8.545454545454544e-07, "epoch": 0.8125, "percentage": 81.25, "elapsed_time": "0:02:59", "remaining_time": "0:00:41"}
|
22 |
+
{"current_steps": 40, "total_steps": 48, "loss": null, "eval_loss": 0.7741249203681946, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.8333333333333334, "percentage": 83.33, "elapsed_time": "0:02:59", "remaining_time": "0:00:35"}
|
23 |
+
{"current_steps": 42, "total_steps": 48, "loss": 0.7763, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 6.534090909090911e-07, "epoch": 0.875, "percentage": 87.5, "elapsed_time": "0:03:50", "remaining_time": "0:00:32"}
|
24 |
+
{"current_steps": 45, "total_steps": 48, "loss": 0.8125, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 4.522727272727273e-07, "epoch": 0.9375, "percentage": 93.75, "elapsed_time": "0:03:52", "remaining_time": "0:00:15"}
|
25 |
+
{"current_steps": 45, "total_steps": 48, "loss": null, "eval_loss": 0.7722158432006836, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 0.9375, "percentage": 93.75, "elapsed_time": "0:03:52", "remaining_time": "0:00:15"}
|
26 |
+
{"current_steps": 48, "total_steps": 48, "loss": 0.8029, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": 2.511363636363638e-07, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:03:55", "remaining_time": "0:00:00"}
|
27 |
+
{"current_steps": 48, "total_steps": 48, "loss": null, "eval_loss": null, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:03:55", "remaining_time": "0:00:00"}
|
28 |
+
{"current_steps": 3, "total_steps": 3, "loss": null, "eval_loss": 0.7741249203681946, "predict_loss": null, "reward": null, "learning_rate": null, "epoch": 1.0, "percentage": 100.0, "elapsed_time": "0:04:33", "remaining_time": "0:00:00"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|