ponytail committed on
Commit
295bf85
·
verified ·
1 Parent(s): 62b657a

Update config.json

Browse files
Files changed (1) hide show
  1. config.json +14 -153
config.json CHANGED
@@ -33,161 +33,22 @@
33
  },
34
  "torch_dtype": "float16",
35
  "transformers_version": "4.48.0",
36
- "vision_config": {
37
- "_name_or_path": "google/siglip-so400m-patch14-384",
38
  "architectures": [
39
- "SiglipModel"
40
  ],
41
- "model_type": "siglip",
42
- "text_config": {
43
- "_attn_implementation_autoset": false,
44
- "_name_or_path": "",
45
- "add_cross_attention": false,
46
- "architectures": null,
47
- "attention_dropout": 0.0,
48
- "bad_words_ids": null,
49
- "begin_suppress_tokens": null,
50
- "bos_token_id": 49406,
51
- "chunk_size_feed_forward": 0,
52
- "cross_attention_hidden_size": null,
53
- "decoder_start_token_id": null,
54
- "diversity_penalty": 0.0,
55
- "do_sample": false,
56
- "early_stopping": false,
57
- "encoder_no_repeat_ngram_size": 0,
58
- "eos_token_id": 49407,
59
- "exponential_decay_length_penalty": null,
60
- "finetuning_task": null,
61
- "forced_bos_token_id": null,
62
- "forced_eos_token_id": null,
63
- "hidden_act": "gelu_pytorch_tanh",
64
- "hidden_size": 1152,
65
- "id2label": {
66
- "0": "LABEL_0",
67
- "1": "LABEL_1"
68
- },
69
- "intermediate_size": 4304,
70
- "is_decoder": false,
71
- "is_encoder_decoder": false,
72
- "label2id": {
73
- "LABEL_0": 0,
74
- "LABEL_1": 1
75
- },
76
- "layer_norm_eps": 1e-06,
77
- "length_penalty": 1.0,
78
- "max_length": 20,
79
- "max_position_embeddings": 64,
80
- "min_length": 0,
81
- "model_type": "siglip_text_model",
82
- "no_repeat_ngram_size": 0,
83
- "num_attention_heads": 16,
84
- "num_beam_groups": 1,
85
- "num_beams": 1,
86
- "num_hidden_layers": 27,
87
- "num_return_sequences": 1,
88
- "output_attentions": false,
89
- "output_hidden_states": false,
90
- "output_scores": false,
91
- "pad_token_id": 1,
92
- "prefix": null,
93
- "problem_type": null,
94
- "pruned_heads": {},
95
- "remove_invalid_values": false,
96
- "repetition_penalty": 1.0,
97
- "return_dict": true,
98
- "return_dict_in_generate": false,
99
- "sep_token_id": null,
100
- "suppress_tokens": null,
101
- "task_specific_params": null,
102
- "temperature": 1.0,
103
- "tf_legacy_loss": false,
104
- "tie_encoder_decoder": false,
105
- "tie_word_embeddings": true,
106
- "tokenizer_class": null,
107
- "top_k": 50,
108
- "top_p": 1.0,
109
- "torch_dtype": null,
110
- "torchscript": false,
111
- "typical_p": 1.0,
112
- "use_bfloat16": false,
113
- "vocab_size": 32000
114
- },
115
- "torch_dtype": "float32",
116
- "vision_config": {
117
- "_attn_implementation_autoset": false,
118
- "_name_or_path": "",
119
- "add_cross_attention": false,
120
- "architectures": null,
121
- "attention_dropout": 0.0,
122
- "bad_words_ids": null,
123
- "begin_suppress_tokens": null,
124
- "bos_token_id": null,
125
- "chunk_size_feed_forward": 0,
126
- "cross_attention_hidden_size": null,
127
- "decoder_start_token_id": null,
128
- "diversity_penalty": 0.0,
129
- "do_sample": false,
130
- "early_stopping": false,
131
- "encoder_no_repeat_ngram_size": 0,
132
- "eos_token_id": null,
133
- "exponential_decay_length_penalty": null,
134
- "finetuning_task": null,
135
- "forced_bos_token_id": null,
136
- "forced_eos_token_id": null,
137
- "hidden_act": "gelu_pytorch_tanh",
138
- "hidden_size": 1152,
139
- "id2label": {
140
- "0": "LABEL_0",
141
- "1": "LABEL_1"
142
- },
143
- "image_size": 384,
144
- "intermediate_size": 4304,
145
- "is_decoder": false,
146
- "is_encoder_decoder": false,
147
- "label2id": {
148
- "LABEL_0": 0,
149
- "LABEL_1": 1
150
- },
151
- "layer_norm_eps": 1e-06,
152
- "length_penalty": 1.0,
153
- "max_length": 20,
154
- "min_length": 0,
155
- "model_type": "siglip_vision_model",
156
- "no_repeat_ngram_size": 0,
157
- "num_attention_heads": 16,
158
- "num_beam_groups": 1,
159
- "num_beams": 1,
160
- "num_channels": 3,
161
- "num_hidden_layers": 27,
162
- "num_return_sequences": 1,
163
- "output_attentions": false,
164
- "output_hidden_states": false,
165
- "output_scores": false,
166
- "pad_token_id": null,
167
- "patch_size": 14,
168
- "prefix": null,
169
- "problem_type": null,
170
- "pruned_heads": {},
171
- "remove_invalid_values": false,
172
- "repetition_penalty": 1.0,
173
- "return_dict": true,
174
- "return_dict_in_generate": false,
175
- "sep_token_id": null,
176
- "suppress_tokens": null,
177
- "task_specific_params": null,
178
- "temperature": 1.0,
179
- "tf_legacy_loss": false,
180
- "tie_encoder_decoder": false,
181
- "tie_word_embeddings": true,
182
- "tokenizer_class": null,
183
- "top_k": 50,
184
- "top_p": 1.0,
185
- "torch_dtype": null,
186
- "torchscript": false,
187
- "typical_p": 1.0,
188
- "use_bfloat16": false
189
- }
190
  },
191
  "vision_feature_layer": -2,
192
- "vision_feature_select_strategy": "full"
193
  }
 
33
  },
34
  "torch_dtype": "float16",
35
  "transformers_version": "4.48.0",
36
+ "vision_config": {
37
+ "_name_or_path": "./iter_45000_ft/vit_merge_lora",
38
  "architectures": [
39
+ "SiglipVisionModel"
40
  ],
41
+ "hidden_act": "gelu_pytorch_tanh",
42
+ "hidden_size": 1152,
43
+ "image_size": 384,
44
+ "intermediate_size": 4304,
45
+ "layer_norm_eps": 1e-06,
46
+ "model_type": "siglip_vision_model",
47
+ "num_attention_heads": 16,
48
+ "num_hidden_layers": 27,
49
+ "patch_size": 14,
50
+ "torch_dtype": "float32"
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
51
  },
52
  "vision_feature_layer": -2,
53
+ "vision_feature_select_strategy": "default"
54
  }