Training in progress, epoch 1
Browse files
README.md
CHANGED
|
@@ -37,7 +37,7 @@ This model was trained with SFT.
|
|
| 37 |
- TRL: 0.23.0
|
| 38 |
- Transformers: 4.56.1
|
| 39 |
- Pytorch: 2.8.0+cu126
|
| 40 |
-
- Datasets: 4.1.
|
| 41 |
- Tokenizers: 0.22.0
|
| 42 |
|
| 43 |
## Citations
|
|
|
|
| 37 |
- TRL: 0.23.0
|
| 38 |
- Transformers: 4.56.1
|
| 39 |
- Pytorch: 2.8.0+cu126
|
| 40 |
+
- Datasets: 4.1.1
|
| 41 |
- Tokenizers: 0.22.0
|
| 42 |
|
| 43 |
## Citations
|
adapter_config.json
CHANGED
|
@@ -25,13 +25,13 @@
|
|
| 25 |
"rank_pattern": {},
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
| 28 |
-
"
|
|
|
|
| 29 |
"gate_proj",
|
| 30 |
"v_proj",
|
| 31 |
-
"
|
| 32 |
-
"o_proj",
|
| 33 |
"up_proj",
|
| 34 |
-
"
|
| 35 |
],
|
| 36 |
"target_parameters": null,
|
| 37 |
"task_type": "CAUSAL_LM",
|
|
|
|
| 25 |
"rank_pattern": {},
|
| 26 |
"revision": null,
|
| 27 |
"target_modules": [
|
| 28 |
+
"q_proj",
|
| 29 |
+
"down_proj",
|
| 30 |
"gate_proj",
|
| 31 |
"v_proj",
|
| 32 |
+
"k_proj",
|
|
|
|
| 33 |
"up_proj",
|
| 34 |
+
"o_proj"
|
| 35 |
],
|
| 36 |
"target_parameters": null,
|
| 37 |
"task_type": "CAUSAL_LM",
|
adapter_model.safetensors
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 4785795512
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:fbbd66503b7a3a062c28ab734d3e20c0e199e1225f758312ef906c40976f96fd
|
| 3 |
size 4785795512
|
runs/Sep17_07-03-03_918933b8a591/events.out.tfevents.1758092585.918933b8a591.321.1
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d3eb933eea986673ca1dad567846b90c40699db7fa8ab082cbf9caa2d3901f45
|
| 3 |
+
size 10506
|
runs/Sep18_14-24-06_6abdf55d0343/events.out.tfevents.1758205455.6abdf55d0343.1143.0
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:410e06bdd1b750b07f561b7733b7793877425537bd0b4c7a125afd421e4ab12c
|
| 3 |
+
size 6454
|
training_args.bin
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 6289
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:7df5dabb565f266c7a6a5b86a1e09cb94122ff5b3eb06c9baec9f114f2b8ed36
|
| 3 |
size 6289
|