Training in progress, step 1272
Browse files
model-00001-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4976698672
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:2bf5a33c512ef8b5c202abc4439f21ca03595e9aef8343cfbbce85291a902d84
|
| 3 |
size 4976698672
|
model-00002-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4999802720
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6f799d6013a45bc8062cde27c6610e08bda0404976fbd1b3b167b68c1f4abd12
|
| 3 |
size 4999802720
|
model-00003-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4915916176
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9b6945ec913e7df4df661cffd305a745730ab4a91d6e37307ab97bb4e8488f09
|
| 3 |
size 4915916176
|
model-00004-of-00004.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1168138808
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f376121fd93978caedc1d3f587383997618cede5c777309e87c04d84956f0c29
|
| 3 |
size 1168138808
|
runs/Feb25_22-23-30_COE-CS-sv003/events.out.tfevents.1740522241.COE-CS-sv003.325787.0
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0c9ffae8553207e289546d0218d0fcf954a966ab85d4d8552b35121d246167ae
|
| 3 |
+
size 32633
|
trainer_log.jsonl
CHANGED
|
@@ -98,3 +98,31 @@
|
|
| 98 |
{"current_steps": 980, "total_steps": 1272, "loss": 0.1121, "lr": 1.981730090920969e-06, "epoch": 2.306900102986612, "percentage": 77.04, "elapsed_time": "15:01:21", "remaining_time": "4:28:34"}
|
| 99 |
{"current_steps": 990, "total_steps": 1272, "loss": 0.1103, "lr": 1.8541198882757892e-06, "epoch": 2.330439899955863, "percentage": 77.83, "elapsed_time": "15:10:30", "remaining_time": "4:19:21"}
|
| 100 |
{"current_steps": 1000, "total_steps": 1272, "loss": 0.1111, "lr": 1.73017475120072e-06, "epoch": 2.353979696925114, "percentage": 78.62, "elapsed_time": "15:19:43", "remaining_time": "4:10:09"}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 98 |
{"current_steps": 980, "total_steps": 1272, "loss": 0.1121, "lr": 1.981730090920969e-06, "epoch": 2.306900102986612, "percentage": 77.04, "elapsed_time": "15:01:21", "remaining_time": "4:28:34"}
|
| 99 |
{"current_steps": 990, "total_steps": 1272, "loss": 0.1103, "lr": 1.8541198882757892e-06, "epoch": 2.330439899955863, "percentage": 77.83, "elapsed_time": "15:10:30", "remaining_time": "4:19:21"}
|
| 100 |
{"current_steps": 1000, "total_steps": 1272, "loss": 0.1111, "lr": 1.73017475120072e-06, "epoch": 2.353979696925114, "percentage": 78.62, "elapsed_time": "15:19:43", "remaining_time": "4:10:09"}
|
| 101 |
+
{"current_steps": 1010, "total_steps": 1272, "loss": 0.1101, "lr": 1.6099751396144142e-06, "epoch": 2.3775194938943653, "percentage": 79.4, "elapsed_time": "15:30:52", "remaining_time": "4:01:28"}
|
| 102 |
+
{"current_steps": 1020, "total_steps": 1272, "loss": 0.1085, "lr": 1.493599081999453e-06, "epoch": 2.4010592908636164, "percentage": 80.19, "elapsed_time": "15:40:03", "remaining_time": "3:52:15"}
|
| 103 |
+
{"current_steps": 1030, "total_steps": 1272, "loss": 0.109, "lr": 1.3811221247495784e-06, "epoch": 2.4245990878328674, "percentage": 80.97, "elapsed_time": "15:49:12", "remaining_time": "3:43:01"}
|
| 104 |
+
{"current_steps": 1040, "total_steps": 1272, "loss": 0.1083, "lr": 1.2726172831281898e-06, "epoch": 2.448138884802119, "percentage": 81.76, "elapsed_time": "15:58:24", "remaining_time": "3:33:47"}
|
| 105 |
+
{"current_steps": 1050, "total_steps": 1272, "loss": 0.1079, "lr": 1.1681549938699157e-06, "epoch": 2.47167868177137, "percentage": 82.55, "elapsed_time": "16:07:34", "remaining_time": "3:24:34"}
|
| 106 |
+
{"current_steps": 1060, "total_steps": 1272, "loss": 0.1084, "lr": 1.0678030694561044e-06, "epoch": 2.495218478740621, "percentage": 83.33, "elapsed_time": "16:16:44", "remaining_time": "3:15:20"}
|
| 107 |
+
{"current_steps": 1070, "total_steps": 1272, "loss": 0.1084, "lr": 9.716266540938183e-07, "epoch": 2.518758275709872, "percentage": 84.12, "elapsed_time": "16:25:57", "remaining_time": "3:06:08"}
|
| 108 |
+
{"current_steps": 1080, "total_steps": 1272, "loss": 0.106, "lr": 8.796881814269941e-07, "epoch": 2.542298072679123, "percentage": 84.91, "elapsed_time": "16:35:07", "remaining_time": "2:56:54"}
|
| 109 |
+
{"current_steps": 1090, "total_steps": 1272, "loss": 0.1037, "lr": 7.92047334007169e-07, "epoch": 2.5658378696483743, "percentage": 85.69, "elapsed_time": "16:44:17", "remaining_time": "2:47:41"}
|
| 110 |
+
{"current_steps": 1100, "total_steps": 1272, "loss": 0.1044, "lr": 7.087610045501023e-07, "epoch": 2.5893776666176254, "percentage": 86.48, "elapsed_time": "16:53:27", "remaining_time": "2:38:28"}
|
| 111 |
+
{"current_steps": 1110, "total_steps": 1272, "loss": 0.1051, "lr": 6.29883259003445e-07, "epoch": 2.612917463586877, "percentage": 87.26, "elapsed_time": "17:02:37", "remaining_time": "2:29:14"}
|
| 112 |
+
{"current_steps": 1120, "total_steps": 1272, "loss": 0.1031, "lr": 5.554653014494176e-07, "epoch": 2.636457260556128, "percentage": 88.05, "elapsed_time": "17:11:47", "remaining_time": "2:20:01"}
|
| 113 |
+
{"current_steps": 1130, "total_steps": 1272, "loss": 0.1039, "lr": 4.855554408652985e-07, "epoch": 2.659997057525379, "percentage": 88.84, "elapsed_time": "17:20:58", "remaining_time": "2:10:48"}
|
| 114 |
+
{"current_steps": 1140, "total_steps": 1272, "loss": 0.1032, "lr": 4.201990597632832e-07, "epoch": 2.68353685449463, "percentage": 89.62, "elapsed_time": "17:30:08", "remaining_time": "2:01:35"}
|
| 115 |
+
{"current_steps": 1150, "total_steps": 1272, "loss": 0.105, "lr": 3.5943858473009237e-07, "epoch": 2.707076651463881, "percentage": 90.41, "elapsed_time": "17:39:17", "remaining_time": "1:52:22"}
|
| 116 |
+
{"current_steps": 1160, "total_steps": 1272, "loss": 0.1029, "lr": 3.033134588854289e-07, "epoch": 2.7306164484331323, "percentage": 91.19, "elapsed_time": "17:48:27", "remaining_time": "1:43:09"}
|
| 117 |
+
{"current_steps": 1170, "total_steps": 1272, "loss": 0.1048, "lr": 2.518601162771755e-07, "epoch": 2.7541562454023834, "percentage": 91.98, "elapsed_time": "17:57:40", "remaining_time": "1:33:57"}
|
| 118 |
+
{"current_steps": 1180, "total_steps": 1272, "loss": 0.102, "lr": 2.0511195822997013e-07, "epoch": 2.777696042371635, "percentage": 92.77, "elapsed_time": "18:06:51", "remaining_time": "1:24:44"}
|
| 119 |
+
{"current_steps": 1190, "total_steps": 1272, "loss": 0.1028, "lr": 1.6309933166247403e-07, "epoch": 2.801235839340886, "percentage": 93.55, "elapsed_time": "18:16:04", "remaining_time": "1:15:31"}
|
| 120 |
+
{"current_steps": 1200, "total_steps": 1272, "loss": 0.1006, "lr": 1.258495093874454e-07, "epoch": 2.824775636310137, "percentage": 94.34, "elapsed_time": "18:25:13", "remaining_time": "1:06:18"}
|
| 121 |
+
{"current_steps": 1210, "total_steps": 1272, "loss": 0.1029, "lr": 9.338667240738619e-08, "epoch": 2.848315433279388, "percentage": 95.13, "elapsed_time": "18:34:24", "remaining_time": "0:57:06"}
|
| 122 |
+
{"current_steps": 1220, "total_steps": 1272, "loss": 0.102, "lr": 6.573189421726466e-08, "epoch": 2.871855230248639, "percentage": 95.91, "elapsed_time": "18:43:35", "remaining_time": "0:47:53"}
|
| 123 |
+
{"current_steps": 1230, "total_steps": 1272, "loss": 0.1032, "lr": 4.2903127124496454e-08, "epoch": 2.8953950272178903, "percentage": 96.7, "elapsed_time": "18:52:46", "remaining_time": "0:38:40"}
|
| 124 |
+
{"current_steps": 1240, "total_steps": 1272, "loss": 0.1031, "lr": 2.4915190595068415e-08, "epoch": 2.9189348241871413, "percentage": 97.48, "elapsed_time": "19:01:57", "remaining_time": "0:29:28"}
|
| 125 |
+
{"current_steps": 1250, "total_steps": 1272, "loss": 0.0998, "lr": 1.1779761633370633e-08, "epoch": 2.942474621156393, "percentage": 98.27, "elapsed_time": "19:11:09", "remaining_time": "0:20:15"}
|
| 126 |
+
{"current_steps": 1260, "total_steps": 1272, "loss": 0.1005, "lr": 3.50536720197997e-09, "epoch": 2.966014418125644, "percentage": 99.06, "elapsed_time": "19:20:21", "remaining_time": "0:11:03"}
|
| 127 |
+
{"current_steps": 1270, "total_steps": 1272, "loss": 0.1019, "lr": 9.73786863237014e-11, "epoch": 2.989554215094895, "percentage": 99.84, "elapsed_time": "19:29:30", "remaining_time": "0:01:50"}
|
| 128 |
+
{"current_steps": 1272, "total_steps": 1272, "epoch": 2.994262174488745, "percentage": 100.0, "elapsed_time": "19:33:34", "remaining_time": "0:00:00"}
|