Training in progress, step 200
Browse files
.gitignore
ADDED
@@ -0,0 +1 @@
|
|
|
|
|
1 |
+
checkpoint-*/
|
config.json
ADDED
@@ -0,0 +1,22 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
1 |
+
{
|
2 |
+
"activation": "gelu",
|
3 |
+
"architectures": [
|
4 |
+
"DistilBertForMaskedLM"
|
5 |
+
],
|
6 |
+
"attention_dropout": 0.1,
|
7 |
+
"dim": 768,
|
8 |
+
"dropout": 0.1,
|
9 |
+
"hidden_dim": 3072,
|
10 |
+
"initializer_range": 0.02,
|
11 |
+
"max_position_embeddings": 124,
|
12 |
+
"model_type": "distilbert",
|
13 |
+
"n_heads": 12,
|
14 |
+
"n_layers": 6,
|
15 |
+
"pad_token_id": 0,
|
16 |
+
"qa_dropout": 0.1,
|
17 |
+
"seq_classif_dropout": 0.2,
|
18 |
+
"sinusoidal_pos_embds": false,
|
19 |
+
"torch_dtype": "float32",
|
20 |
+
"transformers_version": "4.26.1",
|
21 |
+
"vocab_size": 30522
|
22 |
+
}
|
pytorch_model.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1aaa061078757b42dc1e463291030f08197b510713ab9c5081d15bc461aa3d53
|
3 |
+
size 266786097
|
runs/Mar08_10-55-15_2fae1b225e0f/1678273036.5727026/events.out.tfevents.1678273036.2fae1b225e0f.566.1
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6b421e6ef231147e8aac1cb61e90ba160a17362848a0d507de850c02b48390d6
|
3 |
+
size 5661
|
runs/Mar08_10-55-15_2fae1b225e0f/events.out.tfevents.1678273030.2fae1b225e0f.566.0
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:bfdbb4831a3433673227d993e27f2ba7cc0f19464733908ca6b18e39033f9032
|
3 |
+
size 4196
|
training_args.bin
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e262b16b89cadae40b5940580368053df5e09c8a4d8c162d52276fc3bc11d005
|
3 |
+
size 3451
|