CodCodingCode committed on
Commit
18719c3
·
verified ·
1 Parent(s): 553e553

Training in progress, step 500

Browse files
Files changed (28) hide show
  1. .gitattributes +1 -0
  2. adapter_config.json +41 -0
  3. adapter_model.safetensors +3 -0
  4. added_tokens.json +3 -0
  5. chat_template.jinja +47 -0
  6. runs/Jul12_19-24-10_192-222-50-225/events.out.tfevents.1752348251.192-222-50-225.6308.0 +3 -0
  7. runs/Jul12_19-26-47_192-222-50-225/events.out.tfevents.1752348407.192-222-50-225.6572.0 +3 -0
  8. runs/Jul12_19-29-33_192-222-50-225/events.out.tfevents.1752348573.192-222-50-225.6698.0 +3 -0
  9. runs/Jul12_19-31-33_192-222-50-225/events.out.tfevents.1752348693.192-222-50-225.6847.0 +3 -0
  10. runs/Jul12_19-38-15_192-222-50-225/events.out.tfevents.1752349095.192-222-50-225.7027.0 +3 -0
  11. runs/Jul12_19-39-22_192-222-50-225/events.out.tfevents.1752349163.192-222-50-225.7305.0 +3 -0
  12. runs/Jul12_19-41-25_192-222-50-225/events.out.tfevents.1752349285.192-222-50-225.7432.0 +3 -0
  13. runs/Jul12_19-43-12_192-222-50-225/events.out.tfevents.1752349392.192-222-50-225.7652.0 +3 -0
  14. runs/Jul12_19-44-41_192-222-50-225/events.out.tfevents.1752349481.192-222-50-225.7797.0 +3 -0
  15. runs/Jul12_19-47-45_192-222-50-225/events.out.tfevents.1752349665.192-222-50-225.8096.0 +3 -0
  16. runs/Jul12_20-19-06_192-222-50-225/events.out.tfevents.1752351546.192-222-50-225.8742.0 +3 -0
  17. runs/Jul12_20-20-25_192-222-50-225/events.out.tfevents.1752351625.192-222-50-225.8866.0 +3 -0
  18. runs/Jul12_20-31-47_192-222-50-225/events.out.tfevents.1752352308.192-222-50-225.9439.0 +3 -0
  19. runs/Jul12_21-41-52_192-222-50-225/events.out.tfevents.1752356513.192-222-50-225.11670.0 +3 -0
  20. runs/Jul12_21-58-20_192-222-50-225/events.out.tfevents.1752357500.192-222-50-225.12327.0 +3 -0
  21. runs/Jul12_22-02-49_192-222-50-225/events.out.tfevents.1752357769.192-222-50-225.12553.0 +3 -0
  22. runs/Jul12_22-06-18_192-222-50-225/events.out.tfevents.1752357978.192-222-50-225.12764.0 +3 -0
  23. runs/Jul12_22-07-56_192-222-50-225/events.out.tfevents.1752358076.192-222-50-225.12949.0 +3 -0
  24. special_tokens_map.json +33 -0
  25. tokenizer.json +3 -0
  26. tokenizer.model +3 -0
  27. tokenizer_config.json +0 -0
  28. training_args.bin +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ tokenizer.json filter=lfs diff=lfs merge=lfs -text
adapter_config.json ADDED
@@ -0,0 +1,41 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "google/medgemma-27b-text-it",
5
+ "bias": "none",
6
+ "corda_config": null,
7
+ "eva_config": null,
8
+ "exclude_modules": null,
9
+ "fan_in_fan_out": false,
10
+ "inference_mode": true,
11
+ "init_lora_weights": true,
12
+ "layer_replication": null,
13
+ "layers_pattern": null,
14
+ "layers_to_transform": null,
15
+ "loftq_config": {},
16
+ "lora_alpha": 16,
17
+ "lora_bias": false,
18
+ "lora_dropout": 0.1,
19
+ "megatron_config": null,
20
+ "megatron_core": "megatron.core",
21
+ "modules_to_save": null,
22
+ "peft_type": "LORA",
23
+ "qalora_group_size": 16,
24
+ "r": 8,
25
+ "rank_pattern": {},
26
+ "revision": null,
27
+ "target_modules": [
28
+ "down_proj",
29
+ "gate_proj",
30
+ "up_proj",
31
+ "q_proj",
32
+ "o_proj",
33
+ "k_proj",
34
+ "v_proj"
35
+ ],
36
+ "task_type": "CAUSAL_LM",
37
+ "trainable_token_indices": null,
38
+ "use_dora": false,
39
+ "use_qalora": false,
40
+ "use_rslora": false
41
+ }
adapter_model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5e05719bbf60fa0883c17f8143fc8ac368073f7e1ed01e97966d559b583f1ea3
3
+ size 227149016
added_tokens.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ {
2
+ "<image_soft_token>": 262144
3
+ }
chat_template.jinja ADDED
@@ -0,0 +1,47 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {{ bos_token }}
2
+ {%- if messages[0]['role'] == 'system' -%}
3
+ {%- if messages[0]['content'] is string -%}
4
+ {%- set first_user_prefix = messages[0]['content'] + '
5
+
6
+ ' -%}
7
+ {%- else -%}
8
+ {%- set first_user_prefix = messages[0]['content'][0]['text'] + '
9
+
10
+ ' -%}
11
+ {%- endif -%}
12
+ {%- set loop_messages = messages[1:] -%}
13
+ {%- else -%}
14
+ {%- set first_user_prefix = "" -%}
15
+ {%- set loop_messages = messages -%}
16
+ {%- endif -%}
17
+ {%- for message in loop_messages -%}
18
+ {%- if (message['role'] == 'user') != (loop.index0 % 2 == 0) -%}
19
+ {{ raise_exception("Conversation roles must alternate user/assistant/user/assistant/...") }}
20
+ {%- endif -%}
21
+ {%- if (message['role'] == 'assistant') -%}
22
+ {%- set role = "model" -%}
23
+ {%- else -%}
24
+ {%- set role = message['role'] -%}
25
+ {%- endif -%}
26
+ {{ '<start_of_turn>' + role + '
27
+ ' + (first_user_prefix if loop.first else "") }}
28
+ {%- if message['content'] is string -%}
29
+ {{ message['content'] | trim }}
30
+ {%- elif message['content'] is iterable -%}
31
+ {%- for item in message['content'] -%}
32
+ {%- if item['type'] == 'image' -%}
33
+ {{ '<start_of_image>' }}
34
+ {%- elif item['type'] == 'text' -%}
35
+ {{ item['text'] | trim }}
36
+ {%- endif -%}
37
+ {%- endfor -%}
38
+ {%- else -%}
39
+ {{ raise_exception("Invalid content type") }}
40
+ {%- endif -%}
41
+ {{ '<end_of_turn>
42
+ ' }}
43
+ {%- endfor -%}
44
+ {%- if add_generation_prompt -%}
45
+ {{'<start_of_turn>model
46
+ '}}
47
+ {%- endif -%}
runs/Jul12_19-24-10_192-222-50-225/events.out.tfevents.1752348251.192-222-50-225.6308.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b1b6be921a73aeb3ab0804fc50c9bb4580976d2c38f3125e4bedbad073cc1449
3
+ size 6891
runs/Jul12_19-26-47_192-222-50-225/events.out.tfevents.1752348407.192-222-50-225.6572.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:95ace9e21dc18f1d284383c3648a1e8630824b59323a53807400e9175588a8c9
3
+ size 6892
runs/Jul12_19-29-33_192-222-50-225/events.out.tfevents.1752348573.192-222-50-225.6698.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:c13b87871c43cbf3fb64f3ef33bf560010707d50b8b60d8b39f8abc7fc3083ae
3
+ size 6892
runs/Jul12_19-31-33_192-222-50-225/events.out.tfevents.1752348693.192-222-50-225.6847.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:00a283d76d942e13e27e2c183defb4540fd396b4820ee075a617194d29f097d5
3
+ size 6893
runs/Jul12_19-38-15_192-222-50-225/events.out.tfevents.1752349095.192-222-50-225.7027.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b4c0c0e5ea1ace7038d10cbf85c24dba577673ffe6b0cf116c0e88fd351eabf0
3
+ size 6893
runs/Jul12_19-39-22_192-222-50-225/events.out.tfevents.1752349163.192-222-50-225.7305.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3fe6a176bed126c91b92eb1ba79179450549f18aaaaa1d7f010db970e1a852bd
3
+ size 6893
runs/Jul12_19-41-25_192-222-50-225/events.out.tfevents.1752349285.192-222-50-225.7432.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5d16b1ad02e295fbcc2ef6f6084d373c1d439545bb9a9160451129b8f75d9531
3
+ size 6893
runs/Jul12_19-43-12_192-222-50-225/events.out.tfevents.1752349392.192-222-50-225.7652.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:069030f9bfe769d4cf601803a58d7465075330a934ca42bd23a4e4b6e99a1a48
3
+ size 4184
runs/Jul12_19-44-41_192-222-50-225/events.out.tfevents.1752349481.192-222-50-225.7797.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b8f047bd223586890425efc4d482769a81c215251e028cbccc4ec9759f9bbab0
3
+ size 7099
runs/Jul12_19-47-45_192-222-50-225/events.out.tfevents.1752349665.192-222-50-225.8096.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6bec3ae561a486f45efaead0b312152acc93473ba889f6d01dad0a883c84f587
3
+ size 8547
runs/Jul12_20-19-06_192-222-50-225/events.out.tfevents.1752351546.192-222-50-225.8742.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a830f99e21f86c6a3b3ec61c392633bab1c70357f96e2e92933ce7bb7f6bd669
3
+ size 6891
runs/Jul12_20-20-25_192-222-50-225/events.out.tfevents.1752351625.192-222-50-225.8866.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7aa1f058e63f2ac5ba5553b2db363d9f7feb5b2ee0a5e1f693f93047016d5a56
3
+ size 6891
runs/Jul12_20-31-47_192-222-50-225/events.out.tfevents.1752352308.192-222-50-225.9439.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:37019e27e146050f4cf1ef1805dd428507f302dcfbcc7ff34bbea0772e0df5cd
3
+ size 11445
runs/Jul12_21-41-52_192-222-50-225/events.out.tfevents.1752356513.192-222-50-225.11670.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:5f7a7fea5c133afb19f21217b51e08b0ba3f0a0b6ee3a9c514f8a3b51469a717
3
+ size 7098
runs/Jul12_21-58-20_192-222-50-225/events.out.tfevents.1752357500.192-222-50-225.12327.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0e0d74b62b8a0951d8f815d3067045b4dc97cfd48eecf42ef78aa36559989db5
3
+ size 6891
runs/Jul12_22-02-49_192-222-50-225/events.out.tfevents.1752357769.192-222-50-225.12553.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bd39d37ee5ab1f62a6737343d058da5e07b765b74e243844ca79a7d63e2a6ff4
3
+ size 6891
runs/Jul12_22-06-18_192-222-50-225/events.out.tfevents.1752357978.192-222-50-225.12764.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:98f812c151877c96db17cd630ef17047e75dd2c4deabb9ed820763fd609e1c45
3
+ size 6890
runs/Jul12_22-07-56_192-222-50-225/events.out.tfevents.1752358076.192-222-50-225.12949.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:19af3d4f61f6e93d7c64a4135ecef73ecade4c86d0371a41609e878fe3139fc7
3
+ size 27890
special_tokens_map.json ADDED
@@ -0,0 +1,33 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "boi_token": "<start_of_image>",
3
+ "bos_token": {
4
+ "content": "<bos>",
5
+ "lstrip": false,
6
+ "normalized": false,
7
+ "rstrip": false,
8
+ "single_word": false
9
+ },
10
+ "eoi_token": "<end_of_image>",
11
+ "eos_token": {
12
+ "content": "<eos>",
13
+ "lstrip": false,
14
+ "normalized": false,
15
+ "rstrip": false,
16
+ "single_word": false
17
+ },
18
+ "image_token": "<image_soft_token>",
19
+ "pad_token": {
20
+ "content": "<pad>",
21
+ "lstrip": false,
22
+ "normalized": false,
23
+ "rstrip": false,
24
+ "single_word": false
25
+ },
26
+ "unk_token": {
27
+ "content": "<unk>",
28
+ "lstrip": false,
29
+ "normalized": false,
30
+ "rstrip": false,
31
+ "single_word": false
32
+ }
33
+ }
tokenizer.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4667f2089529e8e7657cfb6d1c19910ae71ff5f28aa7ab2ff2763330affad795
3
+ size 33384568
tokenizer.model ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1299c11d7cf632ef3b4e11937501358ada021bbdf7c47638d13c0ee982f2e79c
3
+ size 4689074
tokenizer_config.json ADDED
The diff for this file is too large to render. See raw diff
 
training_args.bin ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:48572e727f9358ffb659e66e6fe98c5882313230ec3af83df5f2140596f04482
3
+ size 5905