Training in progress, step 30000
Browse files
config.json
CHANGED
@@ -40,7 +40,7 @@
|
|
40 |
}
|
41 |
},
|
42 |
"torch_dtype": "bfloat16",
|
43 |
-
"transformers_version": "4.44.
|
44 |
"use_cache": true,
|
45 |
"vocab_size": 50257
|
46 |
}
|
|
|
40 |
}
|
41 |
},
|
42 |
"torch_dtype": "bfloat16",
|
43 |
+
"transformers_version": "4.44.1",
|
44 |
"use_cache": true,
|
45 |
"vocab_size": 50257
|
46 |
}
|
logs/attn_norm=layernorm_teacher_only_affine, attn_projector=mlp_256_l2, attn_weight=5, learning_rate=0.0002, per_device_train_batch_size=16, warmup_ratio=0/events.out.tfevents.1725468061.e3f806ea38c9
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
-
size
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:2a92d9d85b2afc8e69655ff6cc4f40e17b586e71aaf1d9648f19b22fbf123f14
|
3 |
+
size 946271
|
model.safetensors
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 163832792
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6117cb21ba689d240b7281a26ae8cffcda5e8b1494a6692f473e01c98e9dbb45
|
3 |
size 163832792
|
training_args.bin
CHANGED
@@ -1,3 +1,3 @@
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:
|
3 |
size 5560
|
|
|
1 |
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e94eaa60413c4cf51d9a6a08dd8682d66f9ca672b582d54a821d965d88721e41
|
3 |
size 5560
|