luissattelmayer committed on
Commit
78cb6d9
·
verified ·
1 Parent(s): 8f9efa9

Training in progress, epoch 1

Browse files
Files changed (3) hide show
  1. config.json +11 -12
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -1,16 +1,15 @@
1
  {
2
- "_name_or_path": "EuroBERT/EuroBERT-610m",
3
  "architectures": [
4
  "EuroBertForSequenceClassification"
5
  ],
6
  "attention_bias": false,
7
  "attention_dropout": 0.0,
8
  "auto_map": {
9
- "AutoConfig": "EuroBERT/EuroBERT-610m--configuration_eurobert.EuroBertConfig",
10
- "AutoModel": "EuroBERT/EuroBERT-610m--modeling_eurobert.EuroBertModel",
11
- "AutoModelForMaskedLM": "EuroBERT/EuroBERT-610m--modeling_eurobert.EuroBertForMaskedLM",
12
- "AutoModelForPreTraining": "EuroBERT/EuroBERT-610m--modeling_eurobert.EuroBertPreTrainedModel",
13
- "AutoModelForSequenceClassification": "EuroBERT/EuroBERT-610m--modeling_eurobert.EuroBertForSequenceClassification"
14
  },
15
  "bos_token": "<|begin_of_text|>",
16
  "bos_token_id": 128000,
@@ -20,13 +19,13 @@
20
  "head_dim": 64,
21
  "hidden_act": "silu",
22
  "hidden_dropout": 0.0,
23
- "hidden_size": 1152,
24
  "id2label": {
25
  "0": "0",
26
  "1": "1"
27
  },
28
  "initializer_range": 0.02,
29
- "intermediate_size": 4096,
30
  "label2id": {
31
  "0": 0,
32
  "1": 1
@@ -36,9 +35,9 @@
36
  "max_position_embeddings": 8192,
37
  "mlp_bias": false,
38
  "model_type": "eurobert",
39
- "num_attention_heads": 18,
40
- "num_hidden_layers": 26,
41
- "num_key_value_heads": 6,
42
  "pad_token": "<|end_of_text|>",
43
  "pad_token_id": 128001,
44
  "pretraining_tp": 1,
@@ -48,7 +47,7 @@
48
  "rope_theta": 250000,
49
  "tie_word_embeddings": false,
50
  "torch_dtype": "float32",
51
- "transformers_version": "4.49.0",
52
  "use_cache": false,
53
  "vocab_size": 128256
54
  }
 
1
  {
 
2
  "architectures": [
3
  "EuroBertForSequenceClassification"
4
  ],
5
  "attention_bias": false,
6
  "attention_dropout": 0.0,
7
  "auto_map": {
8
+ "AutoConfig": "EuroBERT/EuroBERT-210m--configuration_eurobert.EuroBertConfig",
9
+ "AutoModel": "EuroBERT/EuroBERT-210m--modeling_eurobert.EuroBertModel",
10
+ "AutoModelForMaskedLM": "EuroBERT/EuroBERT-210m--modeling_eurobert.EuroBertForMaskedLM",
11
+ "AutoModelForPreTraining": "EuroBERT/EuroBERT-210m--modeling_eurobert.EuroBertPreTrainedModel",
12
+ "AutoModelForSequenceClassification": "EuroBERT/EuroBERT-210m--modeling_eurobert.EuroBertForSequenceClassification"
13
  },
14
  "bos_token": "<|begin_of_text|>",
15
  "bos_token_id": 128000,
 
19
  "head_dim": 64,
20
  "hidden_act": "silu",
21
  "hidden_dropout": 0.0,
22
+ "hidden_size": 768,
23
  "id2label": {
24
  "0": "0",
25
  "1": "1"
26
  },
27
  "initializer_range": 0.02,
28
+ "intermediate_size": 3072,
29
  "label2id": {
30
  "0": 0,
31
  "1": 1
 
35
  "max_position_embeddings": 8192,
36
  "mlp_bias": false,
37
  "model_type": "eurobert",
38
+ "num_attention_heads": 12,
39
+ "num_hidden_layers": 12,
40
+ "num_key_value_heads": 12,
41
  "pad_token": "<|end_of_text|>",
42
  "pad_token_id": 128001,
43
  "pretraining_tp": 1,
 
47
  "rope_theta": 250000,
48
  "tie_word_embeddings": false,
49
  "torch_dtype": "float32",
50
+ "transformers_version": "4.50.0",
51
  "use_cache": false,
52
  "vocab_size": 128256
53
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:c0289bf456b13899f07fb660197e0da334142142bcb4a98041059de9722bb88b
3
- size 2436848328
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:88215de169f7af3fbc30ea92fb1c74843b05370ed875686b7a1852e64231832d
3
+ size 849445136
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:23b7edee952c7f1a904d544feae7c382707e1ccc4e4ba403182cfeb43e266c73
3
  size 5560
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:336c23221c999b6703bd74f02883eb0888eebdbf42405639153ae63bc135718f
3
  size 5560