Training in progress, step 10, checkpoint
Browse files
last-checkpoint/config.json
CHANGED
@@ -40,7 +40,7 @@
|
|
40 |
"pad_token_id": 50257,
|
41 |
"scale_embedding": false,
|
42 |
"torch_dtype": "float32",
|
43 |
-
"transformers_version": "4.50.
|
44 |
"use_cache": false,
|
45 |
"use_weighted_layer_sum": false,
|
46 |
"vocab_size": 51871
|
|
|
40 |
"pad_token_id": 50257,
|
41 |
"scale_embedding": false,
|
42 |
"torch_dtype": "float32",
|
43 |
+
"transformers_version": "4.50.3",
|
44 |
"use_cache": false,
|
45 |
"use_weighted_layer_sum": false,
|
46 |
"vocab_size": 51871
|
last-checkpoint/generation_config.json
CHANGED
@@ -170,6 +170,6 @@
|
|
170 |
"transcribe": 50359,
|
171 |
"translate": 50358
|
172 |
},
|
173 |
-
"transformers_version": "4.50.
|
174 |
"use_cache": false
|
175 |
}
|
|
|
170 |
"transcribe": 50359,
|
171 |
"translate": 50358
|
172 |
},
|
173 |
+
"transformers_version": "4.50.3",
|
174 |
"use_cache": false
|
175 |
}
|
last-checkpoint/model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 967013512
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:015cd4067c182630d745f697676defa8ae8a26985817aa4f9ca4f02ae2bd786b
|
3 |
size 967013512
|
last-checkpoint/optimizer.pt
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 1925100908
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a4c54ce75022b03e1e5c9f8016fef653aa2c3761ba9375735aeb8eb95c64cdc1
|
3 |
size 1925100908
|
last-checkpoint/trainer_state.json
CHANGED
@@ -11,9 +11,9 @@
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 10.0,
|
14 |
-
"grad_norm":
|
15 |
"learning_rate": 7.000000000000001e-06,
|
16 |
-
"loss": 2.
|
17 |
"step": 10
|
18 |
}
|
19 |
],
|
|
|
11 |
"log_history": [
|
12 |
{
|
13 |
"epoch": 10.0,
|
14 |
+
"grad_norm": 19.040071487426758,
|
15 |
"learning_rate": 7.000000000000001e-06,
|
16 |
+
"loss": 2.5812,
|
17 |
"step": 10
|
18 |
}
|
19 |
],
|