Training in progress, step 500
Browse files
config.json
ADDED
|
@@ -0,0 +1,29 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
{
|
| 2 |
+
"_name_or_path": "huawei-noah/TinyBERT_General_4L_312D",
|
| 3 |
+
"architectures": [
|
| 4 |
+
"BertLMHeadModel"
|
| 5 |
+
],
|
| 6 |
+
"attention_probs_dropout_prob": 0.1,
|
| 7 |
+
"cell": {},
|
| 8 |
+
"classifier_dropout": null,
|
| 9 |
+
"emb_size": 312,
|
| 10 |
+
"hidden_act": "gelu",
|
| 11 |
+
"hidden_dropout_prob": 0.1,
|
| 12 |
+
"hidden_size": 312,
|
| 13 |
+
"initializer_range": 0.02,
|
| 14 |
+
"intermediate_size": 1200,
|
| 15 |
+
"layer_norm_eps": 1e-12,
|
| 16 |
+
"max_position_embeddings": 512,
|
| 17 |
+
"model_type": "bert",
|
| 18 |
+
"num_attention_heads": 12,
|
| 19 |
+
"num_hidden_layers": 4,
|
| 20 |
+
"pad_token_id": 0,
|
| 21 |
+
"position_embedding_type": "absolute",
|
| 22 |
+
"pre_trained": "",
|
| 23 |
+
"structure": [],
|
| 24 |
+
"torch_dtype": "float32",
|
| 25 |
+
"transformers_version": "4.40.0",
|
| 26 |
+
"type_vocab_size": 2,
|
| 27 |
+
"use_cache": true,
|
| 28 |
+
"vocab_size": 30522
|
| 29 |
+
}
|
model.safetensors
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1c3f73a7f4c31712817c31e7920b6808b412a8da452ba3c6449e1c47ec20f9aa
|
| 3 |
+
size 57534056
|
runs/Apr26_04-20-18_4643bc53c803/events.out.tfevents.1714105219.4643bc53c803.241.2
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:d61c91f024051ff81972d9a665300af4aad280743dac64e90ac835ddc9adc617
|
| 3 |
+
size 4184
|
runs/Apr26_04-21-20_4643bc53c803/events.out.tfevents.1714105281.4643bc53c803.241.3
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:567909d537ee10ec205e5b246b664b5655ff7ab420cf538b4d46cbb30920d158
|
| 3 |
+
size 4903
|
training_args.bin
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f36b014c9a6f6014e3273c494ac6ddbc1fbdf986897f7a154ec3c7f5c7f76c47
|
| 3 |
+
size 4984
|