pksx01
/

sarvam-1-it-bhojpuri

Text Generation

text-generation-inference

Model card · Files and versions · Community

pksx01 committed on Dec 18, 2024

Commit

4152687

·

verified ·

1 Parent(s): 5832bb1

One complete epoch training

Files changed (2) hide show

adapter_config.json +7 -4
adapter_model.safetensors +1 -1

adapter_config.json CHANGED Viewed

@@ -6,6 +6,8 @@
   },
   "base_model_name_or_path": "sarvamai/sarvam-1",
   "bias": "none",
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
@@ -14,6 +16,7 @@
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 128,
   "lora_dropout": 0.0,
   "megatron_config": null,
   "megatron_core": "megatron.core",
@@ -23,13 +26,13 @@
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
-    "up_proj",
-    "k_proj",
-    "gate_proj",
     "q_proj",
     "down_proj",
     "lm_head",
-    "v_projo_proj"
   ],
   "task_type": null,
   "use_dora": false,

   },
   "base_model_name_or_path": "sarvamai/sarvam-1",
   "bias": "none",
+  "eva_config": null,
+  "exclude_modules": null,
   "fan_in_fan_out": false,
   "inference_mode": true,
   "init_lora_weights": true,
   "layers_to_transform": null,
   "loftq_config": {},
   "lora_alpha": 128,
+  "lora_bias": false,
   "lora_dropout": 0.0,
   "megatron_config": null,
   "megatron_core": "megatron.core",
   "rank_pattern": {},
   "revision": null,
   "target_modules": [
     "q_proj",
+    "up_proj",
     "down_proj",
+    "gate_proj",
+    "v_projo_proj",
     "lm_head",
+    "k_proj"
   ],
   "task_type": null,
   "use_dora": false,

adapter_model.safetensors CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:913adf1373b2ca46325a115183f9f8f1eaff18b72ca55790dd9d503dd00ae53f
 size 907982296

 version https://git-lfs.github.com/spec/v1
+oid sha256:78c9c37dd4d3bee89a4d1379a7a34e16b8e3d4ff0936f3cbf8620ac7c82c4819
 size 907982296