Training in progress, epoch 2
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4903351912
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7ee78e249f79f3d42ca25bfdb7c3709c9b898902fba4a84e8a6bf7761ca183f3
|
| 3 |
size 4903351912
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4947570872
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ce8eab3e958c300d44844e05ee39c77c4c68e0fd408b983b67e9aa7ba8691f3e
|
| 3 |
size 4947570872
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4962221464
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:cb02e1b86c1efdd70dd86e18b87222af4946d03a828f29cb52b01df419478da4
|
| 3 |
size 4962221464
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3670322200
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:e230add5f8da9e86971db0fe6fb4245bf09df7fee6efd86fef1e09019506edcb
|
| 3 |
size 3670322200
|
trainer_log.jsonl
CHANGED
|
@@ -88,3 +88,47 @@
|
|
| 88 |
{"current_steps": 870, "total_steps": 1329, "loss": 0.5456, "learning_rate": 5e-06, "epoch": 1.9633286318758816, "percentage": 65.46, "elapsed_time": "21:40:18", "remaining_time": "11:26:01"}
|
| 89 |
{"current_steps": 880, "total_steps": 1329, "loss": 0.5439, "learning_rate": 5e-06, "epoch": 1.9858956276445698, "percentage": 66.22, "elapsed_time": "21:55:06", "remaining_time": "11:11:00"}
|
| 90 |
{"current_steps": 886, "total_steps": 1329, "eval_loss": 0.5872690677642822, "epoch": 1.9994358251057829, "percentage": 66.67, "elapsed_time": "22:15:46", "remaining_time": "11:07:53"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 88 |
{"current_steps": 870, "total_steps": 1329, "loss": 0.5456, "learning_rate": 5e-06, "epoch": 1.9633286318758816, "percentage": 65.46, "elapsed_time": "21:40:18", "remaining_time": "11:26:01"}
|
| 89 |
{"current_steps": 880, "total_steps": 1329, "loss": 0.5439, "learning_rate": 5e-06, "epoch": 1.9858956276445698, "percentage": 66.22, "elapsed_time": "21:55:06", "remaining_time": "11:11:00"}
|
| 90 |
{"current_steps": 886, "total_steps": 1329, "eval_loss": 0.5872690677642822, "epoch": 1.9994358251057829, "percentage": 66.67, "elapsed_time": "22:15:46", "remaining_time": "11:07:53"}
|
| 91 |
+
{"current_steps": 890, "total_steps": 1329, "loss": 0.5671, "learning_rate": 5e-06, "epoch": 2.008462623413258, "percentage": 66.97, "elapsed_time": "22:22:46", "remaining_time": "11:02:20"}
|
| 92 |
+
{"current_steps": 900, "total_steps": 1329, "loss": 0.4778, "learning_rate": 5e-06, "epoch": 2.0310296191819464, "percentage": 67.72, "elapsed_time": "22:37:35", "remaining_time": "10:47:07"}
|
| 93 |
+
{"current_steps": 910, "total_steps": 1329, "loss": 0.4796, "learning_rate": 5e-06, "epoch": 2.0535966149506346, "percentage": 68.47, "elapsed_time": "22:52:25", "remaining_time": "10:31:55"}
|
| 94 |
+
{"current_steps": 920, "total_steps": 1329, "loss": 0.4721, "learning_rate": 5e-06, "epoch": 2.076163610719323, "percentage": 69.22, "elapsed_time": "23:07:14", "remaining_time": "10:16:43"}
|
| 95 |
+
{"current_steps": 930, "total_steps": 1329, "loss": 0.4795, "learning_rate": 5e-06, "epoch": 2.098730606488011, "percentage": 69.98, "elapsed_time": "23:22:04", "remaining_time": "10:01:32"}
|
| 96 |
+
{"current_steps": 940, "total_steps": 1329, "loss": 0.4837, "learning_rate": 5e-06, "epoch": 2.1212976022566994, "percentage": 70.73, "elapsed_time": "23:36:54", "remaining_time": "9:46:21"}
|
| 97 |
+
{"current_steps": 950, "total_steps": 1329, "loss": 0.4853, "learning_rate": 5e-06, "epoch": 2.143864598025388, "percentage": 71.48, "elapsed_time": "23:51:43", "remaining_time": "9:31:11"}
|
| 98 |
+
{"current_steps": 960, "total_steps": 1329, "loss": 0.4816, "learning_rate": 5e-06, "epoch": 2.1664315937940763, "percentage": 72.23, "elapsed_time": "1 day, 0:06:33", "remaining_time": "9:16:01"}
|
| 99 |
+
{"current_steps": 970, "total_steps": 1329, "loss": 0.4798, "learning_rate": 5e-06, "epoch": 2.1889985895627646, "percentage": 72.99, "elapsed_time": "1 day, 0:21:23", "remaining_time": "9:00:51"}
|
| 100 |
+
{"current_steps": 980, "total_steps": 1329, "loss": 0.4748, "learning_rate": 5e-06, "epoch": 2.211565585331453, "percentage": 73.74, "elapsed_time": "1 day, 0:36:13", "remaining_time": "8:45:42"}
|
| 101 |
+
{"current_steps": 990, "total_steps": 1329, "loss": 0.4747, "learning_rate": 5e-06, "epoch": 2.234132581100141, "percentage": 74.49, "elapsed_time": "1 day, 0:51:03", "remaining_time": "8:30:34"}
|
| 102 |
+
{"current_steps": 1000, "total_steps": 1329, "loss": 0.4836, "learning_rate": 5e-06, "epoch": 2.2566995768688294, "percentage": 75.24, "elapsed_time": "1 day, 1:05:53", "remaining_time": "8:15:26"}
|
| 103 |
+
{"current_steps": 1010, "total_steps": 1329, "loss": 0.4899, "learning_rate": 5e-06, "epoch": 2.2792665726375176, "percentage": 76.0, "elapsed_time": "1 day, 1:20:43", "remaining_time": "8:00:18"}
|
| 104 |
+
{"current_steps": 1020, "total_steps": 1329, "loss": 0.4843, "learning_rate": 5e-06, "epoch": 2.301833568406206, "percentage": 76.75, "elapsed_time": "1 day, 1:35:33", "remaining_time": "7:45:10"}
|
| 105 |
+
{"current_steps": 1030, "total_steps": 1329, "loss": 0.4887, "learning_rate": 5e-06, "epoch": 2.324400564174894, "percentage": 77.5, "elapsed_time": "1 day, 1:50:22", "remaining_time": "7:30:03"}
|
| 106 |
+
{"current_steps": 1040, "total_steps": 1329, "loss": 0.4865, "learning_rate": 5e-06, "epoch": 2.3469675599435824, "percentage": 78.25, "elapsed_time": "1 day, 2:05:12", "remaining_time": "7:14:56"}
|
| 107 |
+
{"current_steps": 1050, "total_steps": 1329, "loss": 0.4844, "learning_rate": 5e-06, "epoch": 2.3695345557122707, "percentage": 79.01, "elapsed_time": "1 day, 2:20:02", "remaining_time": "6:59:50"}
|
| 108 |
+
{"current_steps": 1060, "total_steps": 1329, "loss": 0.4837, "learning_rate": 5e-06, "epoch": 2.392101551480959, "percentage": 79.76, "elapsed_time": "1 day, 2:34:52", "remaining_time": "6:44:44"}
|
| 109 |
+
{"current_steps": 1070, "total_steps": 1329, "loss": 0.4849, "learning_rate": 5e-06, "epoch": 2.414668547249647, "percentage": 80.51, "elapsed_time": "1 day, 2:49:42", "remaining_time": "6:29:38"}
|
| 110 |
+
{"current_steps": 1080, "total_steps": 1329, "loss": 0.4883, "learning_rate": 5e-06, "epoch": 2.4372355430183354, "percentage": 81.26, "elapsed_time": "1 day, 3:04:32", "remaining_time": "6:14:32"}
|
| 111 |
+
{"current_steps": 1090, "total_steps": 1329, "loss": 0.4866, "learning_rate": 5e-06, "epoch": 2.459802538787024, "percentage": 82.02, "elapsed_time": "1 day, 3:19:22", "remaining_time": "5:59:27"}
|
| 112 |
+
{"current_steps": 1100, "total_steps": 1329, "loss": 0.4897, "learning_rate": 5e-06, "epoch": 2.4823695345557124, "percentage": 82.77, "elapsed_time": "1 day, 3:34:12", "remaining_time": "5:44:22"}
|
| 113 |
+
{"current_steps": 1110, "total_steps": 1329, "loss": 0.4928, "learning_rate": 5e-06, "epoch": 2.5049365303244007, "percentage": 83.52, "elapsed_time": "1 day, 3:49:01", "remaining_time": "5:29:17"}
|
| 114 |
+
{"current_steps": 1120, "total_steps": 1329, "loss": 0.4834, "learning_rate": 5e-06, "epoch": 2.527503526093089, "percentage": 84.27, "elapsed_time": "1 day, 4:03:51", "remaining_time": "5:14:13"}
|
| 115 |
+
{"current_steps": 1130, "total_steps": 1329, "loss": 0.4884, "learning_rate": 5e-06, "epoch": 2.550070521861777, "percentage": 85.03, "elapsed_time": "1 day, 4:18:40", "remaining_time": "4:59:08"}
|
| 116 |
+
{"current_steps": 1140, "total_steps": 1329, "loss": 0.4867, "learning_rate": 5e-06, "epoch": 2.5726375176304654, "percentage": 85.78, "elapsed_time": "1 day, 4:33:30", "remaining_time": "4:44:04"}
|
| 117 |
+
{"current_steps": 1150, "total_steps": 1329, "loss": 0.4875, "learning_rate": 5e-06, "epoch": 2.5952045133991537, "percentage": 86.53, "elapsed_time": "1 day, 4:48:19", "remaining_time": "4:29:01"}
|
| 118 |
+
{"current_steps": 1160, "total_steps": 1329, "loss": 0.4911, "learning_rate": 5e-06, "epoch": 2.617771509167842, "percentage": 87.28, "elapsed_time": "1 day, 5:03:09", "remaining_time": "4:13:57"}
|
| 119 |
+
{"current_steps": 1170, "total_steps": 1329, "loss": 0.4803, "learning_rate": 5e-06, "epoch": 2.64033850493653, "percentage": 88.04, "elapsed_time": "1 day, 5:17:58", "remaining_time": "3:58:54"}
|
| 120 |
+
{"current_steps": 1180, "total_steps": 1329, "loss": 0.491, "learning_rate": 5e-06, "epoch": 2.6629055007052185, "percentage": 88.79, "elapsed_time": "1 day, 5:32:48", "remaining_time": "3:43:51"}
|
| 121 |
+
{"current_steps": 1190, "total_steps": 1329, "loss": 0.4917, "learning_rate": 5e-06, "epoch": 2.685472496473907, "percentage": 89.54, "elapsed_time": "1 day, 5:47:37", "remaining_time": "3:28:48"}
|
| 122 |
+
{"current_steps": 1200, "total_steps": 1329, "loss": 0.4903, "learning_rate": 5e-06, "epoch": 2.7080394922425954, "percentage": 90.29, "elapsed_time": "1 day, 6:02:27", "remaining_time": "3:13:45"}
|
| 123 |
+
{"current_steps": 1210, "total_steps": 1329, "loss": 0.4916, "learning_rate": 5e-06, "epoch": 2.7306064880112837, "percentage": 91.05, "elapsed_time": "1 day, 6:17:16", "remaining_time": "2:58:43"}
|
| 124 |
+
{"current_steps": 1220, "total_steps": 1329, "loss": 0.4882, "learning_rate": 5e-06, "epoch": 2.753173483779972, "percentage": 91.8, "elapsed_time": "1 day, 6:32:05", "remaining_time": "2:43:41"}
|
| 125 |
+
{"current_steps": 1230, "total_steps": 1329, "loss": 0.4947, "learning_rate": 5e-06, "epoch": 2.77574047954866, "percentage": 92.55, "elapsed_time": "1 day, 6:46:54", "remaining_time": "2:28:39"}
|
| 126 |
+
{"current_steps": 1240, "total_steps": 1329, "loss": 0.4929, "learning_rate": 5e-06, "epoch": 2.7983074753173485, "percentage": 93.3, "elapsed_time": "1 day, 7:01:44", "remaining_time": "2:13:37"}
|
| 127 |
+
{"current_steps": 1250, "total_steps": 1329, "loss": 0.4931, "learning_rate": 5e-06, "epoch": 2.8208744710860367, "percentage": 94.06, "elapsed_time": "1 day, 7:16:34", "remaining_time": "1:58:35"}
|
| 128 |
+
{"current_steps": 1260, "total_steps": 1329, "loss": 0.4949, "learning_rate": 5e-06, "epoch": 2.843441466854725, "percentage": 94.81, "elapsed_time": "1 day, 7:31:23", "remaining_time": "1:43:34"}
|
| 129 |
+
{"current_steps": 1270, "total_steps": 1329, "loss": 0.4918, "learning_rate": 5e-06, "epoch": 2.8660084626234132, "percentage": 95.56, "elapsed_time": "1 day, 7:46:13", "remaining_time": "1:28:33"}
|
| 130 |
+
{"current_steps": 1280, "total_steps": 1329, "loss": 0.4899, "learning_rate": 5e-06, "epoch": 2.8885754583921015, "percentage": 96.31, "elapsed_time": "1 day, 8:01:03", "remaining_time": "1:13:32"}
|
| 131 |
+
{"current_steps": 1290, "total_steps": 1329, "loss": 0.4937, "learning_rate": 5e-06, "epoch": 2.9111424541607898, "percentage": 97.07, "elapsed_time": "1 day, 8:15:52", "remaining_time": "0:58:31"}
|
| 132 |
+
{"current_steps": 1300, "total_steps": 1329, "loss": 0.4893, "learning_rate": 5e-06, "epoch": 2.933709449929478, "percentage": 97.82, "elapsed_time": "1 day, 8:30:42", "remaining_time": "0:43:30"}
|
| 133 |
+
{"current_steps": 1310, "total_steps": 1329, "loss": 0.4932, "learning_rate": 5e-06, "epoch": 2.9562764456981663, "percentage": 98.57, "elapsed_time": "1 day, 8:45:31", "remaining_time": "0:28:30"}
|
| 134 |
+
{"current_steps": 1320, "total_steps": 1329, "loss": 0.4896, "learning_rate": 5e-06, "epoch": 2.9788434414668545, "percentage": 99.32, "elapsed_time": "1 day, 9:00:21", "remaining_time": "0:13:30"}
|