Model save
Browse files
README.md
CHANGED
@@ -19,8 +19,6 @@ should probably proofread and complete it, then remove this comment. -->
|
|
19 |
# gemma7b-kasa-coding-11-v1
|
20 |
|
21 |
This model is a fine-tuned version of [google/gemma-7b](https://huggingface.co/google/gemma-7b) on the generator dataset.
|
22 |
-
It achieves the following results on the evaluation set:
|
23 |
-
- Loss: 9.9363
|
24 |
|
25 |
## Model description
|
26 |
|
@@ -55,9 +53,6 @@ The following hyperparameters were used during training:
|
|
55 |
|
56 |
### Training results
|
57 |
|
58 |
-
| Training Loss | Epoch | Step | Validation Loss |
|
59 |
-
|:-------------:|:-----:|:----:|:---------------:|
|
60 |
-
| 10.3696 | 1.0 | 140 | 9.9363 |
|
61 |
|
62 |
|
63 |
### Framework versions
|
|
|
19 |
# gemma7b-kasa-coding-11-v1
|
20 |
|
21 |
This model is a fine-tuned version of [google/gemma-7b](https://huggingface.co/google/gemma-7b) on the generator dataset.
|
|
|
|
|
22 |
|
23 |
## Model description
|
24 |
|
|
|
53 |
|
54 |
### Training results
|
55 |
|
|
|
|
|
|
|
56 |
|
57 |
|
58 |
### Framework versions
|
adapter_config.json
CHANGED
@@ -5,7 +5,7 @@
|
|
5 |
"bias": "none",
|
6 |
"fan_in_fan_out": false,
|
7 |
"inference_mode": true,
|
8 |
-
"init_lora_weights":
|
9 |
"layer_replication": null,
|
10 |
"layers_pattern": null,
|
11 |
"layers_to_transform": null,
|
|
|
5 |
"bias": "none",
|
6 |
"fan_in_fan_out": false,
|
7 |
"inference_mode": true,
|
8 |
+
"init_lora_weights": true,
|
9 |
"layer_replication": null,
|
10 |
"layers_pattern": null,
|
11 |
"layers_to_transform": null,
|
all_results.json
CHANGED
@@ -6,9 +6,9 @@
|
|
6 |
"eval_samples_per_second": 122.269,
|
7 |
"eval_steps_per_second": 2.061,
|
8 |
"total_flos": 4.268850850782249e+17,
|
9 |
-
"train_loss":
|
10 |
-
"train_runtime":
|
11 |
"train_samples": 51241,
|
12 |
-
"train_samples_per_second":
|
13 |
-
"train_steps_per_second":
|
14 |
}
|
|
|
6 |
"eval_samples_per_second": 122.269,
|
7 |
"eval_steps_per_second": 2.061,
|
8 |
"total_flos": 4.268850850782249e+17,
|
9 |
+
"train_loss": 0.0,
|
10 |
+
"train_runtime": 0.0104,
|
11 |
"train_samples": 51241,
|
12 |
+
"train_samples_per_second": 1725286.468,
|
13 |
+
"train_steps_per_second": 13490.846
|
14 |
}
|
runs/Nov18_17-29-16_bold-food-flourishes-fin-02/events.out.tfevents.1731951860.bold-food-flourishes-fin-02.93842.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:67123b9f4ad63877e399824e3133b426e5f1d5d6aa0f13a073f5c411afe3fec4
|
3 |
+
size 6076
|
train_results.json
CHANGED
@@ -1,9 +1,9 @@
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
"total_flos": 4.268850850782249e+17,
|
4 |
-
"train_loss":
|
5 |
-
"train_runtime":
|
6 |
"train_samples": 51241,
|
7 |
-
"train_samples_per_second":
|
8 |
-
"train_steps_per_second":
|
9 |
}
|
|
|
1 |
{
|
2 |
"epoch": 1.0,
|
3 |
"total_flos": 4.268850850782249e+17,
|
4 |
+
"train_loss": 0.0,
|
5 |
+
"train_runtime": 0.0104,
|
6 |
"train_samples": 51241,
|
7 |
+
"train_samples_per_second": 1725286.468,
|
8 |
+
"train_steps_per_second": 13490.846
|
9 |
}
|
trainer_state.json
CHANGED
@@ -211,22 +211,14 @@
|
|
211 |
"loss": 10.3696,
|
212 |
"step": 140
|
213 |
},
|
214 |
-
{
|
215 |
-
"epoch": 1.0,
|
216 |
-
"eval_loss": 9.936275482177734,
|
217 |
-
"eval_runtime": 1.4505,
|
218 |
-
"eval_samples_per_second": 122.712,
|
219 |
-
"eval_steps_per_second": 2.068,
|
220 |
-
"step": 140
|
221 |
-
},
|
222 |
{
|
223 |
"epoch": 1.0,
|
224 |
"step": 140,
|
225 |
"total_flos": 4.268850850782249e+17,
|
226 |
-
"train_loss":
|
227 |
-
"train_runtime":
|
228 |
-
"train_samples_per_second":
|
229 |
-
"train_steps_per_second":
|
230 |
}
|
231 |
],
|
232 |
"logging_steps": 5,
|
|
|
211 |
"loss": 10.3696,
|
212 |
"step": 140
|
213 |
},
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
214 |
{
|
215 |
"epoch": 1.0,
|
216 |
"step": 140,
|
217 |
"total_flos": 4.268850850782249e+17,
|
218 |
+
"train_loss": 0.0,
|
219 |
+
"train_runtime": 0.0104,
|
220 |
+
"train_samples_per_second": 1725286.468,
|
221 |
+
"train_steps_per_second": 13490.846
|
222 |
}
|
223 |
],
|
224 |
"logging_steps": 5,
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5816
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:50695091913ac2106f6db57ae23750875e32e773c2c58db582498b3010055545
|
3 |
size 5816
|