End of training

Browse files

Files changed (11) hide show

README.md +77 -14
config.json +3 -4
generation_config.json +101 -3
model-00001-of-00002.safetensors +3 -0
model-00002-of-00002.safetensors +3 -0
model.safetensors.index.json +0 -0
runs/Jul11_12-21-48_experienced-olive-magpie-5dc9947595-7lcfb/events.out.tfevents.1752236513.experienced-olive-magpie-5dc9947595-7lcfb.1358.0 +3 -0
runs/Jul11_12-22-32_experienced-olive-magpie-5dc9947595-7lcfb/events.out.tfevents.1752236557.experienced-olive-magpie-5dc9947595-7lcfb.1358.1 +3 -0
runs/Jul11_12-24-21_experienced-olive-magpie-5dc9947595-7lcfb/events.out.tfevents.1752236665.experienced-olive-magpie-5dc9947595-7lcfb.1895.0 +3 -0
runs/Jul11_12-36-41_experienced-olive-magpie-5dc9947595-7lcfb/events.out.tfevents.1752237405.experienced-olive-magpie-5dc9947595-7lcfb.2358.0 +3 -0
training_args.bin +2 -2

README.md CHANGED Viewed

@@ -1,21 +1,84 @@
 ---
-base_model: unsloth/whisper-large-v3
-tags:
-- text-generation-inference
-- transformers
-- unsloth
-- whisper
 license: apache-2.0
-language:
-- en
 ---
-# Uploaded finetuned  model
-- **Developed by:** kingabzpro
-- **License:** apache-2.0
-- **Finetuned from model :** unsloth/whisper-large-v3
-This whisper model was trained 2x faster with [Unsloth](https://github.com/unslothai/unsloth) and Huggingface's TRL library.
-[<img src="https://raw.githubusercontent.com/unslothai/unsloth/main/images/unsloth%20made%20with%20love.png" width="200"/>](https://github.com/unslothai/unsloth)

 ---
+library_name: transformers
 license: apache-2.0
+base_model: openai/whisper-large-v3
+tags:
+- generated_from_trainer
+datasets:
+- common_voice_17_0
+metrics:
+- wer
+model-index:
+- name: whisper-large-v3-urdu
+  results:
+  - task:
+      name: Automatic Speech Recognition
+      type: automatic-speech-recognition
+    dataset:
+      name: common_voice_17_0
+      type: common_voice_17_0
+      config: ur
+      split: test[:600]
+      args: ur
+    metrics:
+    - name: Wer
+      type: wer
+      value: 21.47124719940254
 ---
+<!-- This model card has been generated automatically according to the information the Trainer had access to. You
+should probably proofread and complete it, then remove this comment. -->
+# whisper-large-v3-urdu
+This model is a fine-tuned version of [openai/whisper-large-v3](https://huggingface.co/openai/whisper-large-v3) on the Urdu (`ur`) configuration of the common_voice_17_0 dataset.
+It achieves the following results on the evaluation set (`test[:600]`) at the final training step (1500):
+- Loss: 0.0204
+- Wer: 21.4712
+- Cer: 7.1975
+## Model description
+More information needed
+## Intended uses & limitations
+More information needed
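+## Training and evaluation data
+Evaluation used the `test[:600]` slice of the `ur` configuration of common_voice_17_0. More information needed on the training data.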
+## Training procedure
+### Training hyperparameters
+The following hyperparameters were used during training:
+- learning_rate: 3e-05
+- train_batch_size: 8
+- eval_batch_size: 4
+- seed: 42
+- gradient_accumulation_steps: 2
+- total_train_batch_size: 16
+- optimizer: adamw_torch with betas=(0.9,0.999) and epsilon=1e-08 (no additional optimizer arguments)
+- lr_scheduler_type: cosine
+- lr_scheduler_warmup_steps: 100
+- training_steps: 1500
+### Training results
+| Training Loss | Epoch  | Step | Validation Loss | Wer     | Cer     |
+|:-------------:|:------:|:----:|:---------------:|:-------:|:-------:|
+| 0.0261        | 0.5089 | 300  | 0.0254          | 30.0224 | 10.3646 |
+| 0.0211        | 1.0170 | 600  | 0.0226          | 25.8588 | 8.5780  |
+| 0.0121        | 1.5259 | 900  | 0.0206          | 24.2158 | 7.9412  |
+| 0.0093        | 2.0339 | 1200 | 0.0195          | 21.3032 | 7.2018  |
+| 0.0043        | 2.5428 | 1500 | 0.0204          | 21.4712 | 7.1975  |
+### Framework versions
+- Transformers 4.52.2
+- Pytorch 2.7.1+cu126
+- Datasets 3.4.1
+- Tokenizers 0.21.2

config.json CHANGED Viewed

@@ -36,12 +36,11 @@
   "model_type": "whisper",
   "num_hidden_layers": 32,
   "num_mel_bins": 128,
-  "pad_token_id": 50257,
   "scale_embedding": false,
-  "torch_dtype": "bfloat16",
   "transformers_version": "4.52.2",
-  "unsloth_version": "2025.7.3",
-  "use_cache": true,
   "use_weighted_layer_sum": false,
   "vocab_size": 51866
 }

   "model_type": "whisper",
   "num_hidden_layers": 32,
   "num_mel_bins": 128,
+  "pad_token_id": 50256,
   "scale_embedding": false,
+  "torch_dtype": "float32",
   "transformers_version": "4.52.2",
+  "use_cache": false,
   "use_weighted_layer_sum": false,
   "vocab_size": 51866
 }

generation_config.json CHANGED Viewed

@@ -41,7 +41,6 @@
       6
     ]
   ],
-  "attn_implementation": "sdpa",
   "begin_suppress_tokens": [
     220,
     50257
@@ -49,6 +48,16 @@
   "bos_token_id": 50257,
   "decoder_start_token_id": 50258,
   "eos_token_id": 50257,
   "is_multilingual": true,
   "lang_to_id": {
     "<|af|>": 50327,
@@ -152,14 +161,103 @@
     "<|yue|>": 50358,
     "<|zh|>": 50260
   },
-  "language": "<|ur|>",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50364,
   "pad_token_id": 50257,
   "prev_sot_token_id": 50362,
   "return_timestamps": false,
-  "suppress_tokens": [],
   "task": "transcribe",
   "task_to_id": {
     "transcribe": 50360,

       6
     ]
   ],
   "begin_suppress_tokens": [
     220,
     50257
   "bos_token_id": 50257,
   "decoder_start_token_id": 50258,
   "eos_token_id": 50257,
+  "forced_decoder_ids": [
+    [
+      1,
+      null
+    ],
+    [
+      2,
+      50360
+    ]
+  ],
   "is_multilingual": true,
   "lang_to_id": {
     "<|af|>": 50327,
     "<|yue|>": 50358,
     "<|zh|>": 50260
   },
+  "language": "ur",
   "max_initial_timestamp_index": 50,
   "max_length": 448,
   "no_timestamps_token_id": 50364,
   "pad_token_id": 50257,
   "prev_sot_token_id": 50362,
   "return_timestamps": false,
+  "suppress_tokens": [
+    1,
+    2,
+    7,
+    8,
+    9,
+    10,
+    14,
+    25,
+    26,
+    27,
+    28,
+    29,
+    31,
+    58,
+    59,
+    60,
+    61,
+    62,
+    63,
+    90,
+    91,
+    92,
+    93,
+    359,
+    503,
+    522,
+    542,
+    873,
+    893,
+    902,
+    918,
+    922,
+    931,
+    1350,
+    1853,
+    1982,
+    2460,
+    2627,
+    3246,
+    3253,
+    3268,
+    3536,
+    3846,
+    3961,
+    4183,
+    4667,
+    6585,
+    6647,
+    7273,
+    9061,
+    9383,
+    10428,
+    10929,
+    11938,
+    12033,
+    12331,
+    12562,
+    13793,
+    14157,
+    14635,
+    15265,
+    15618,
+    16553,
+    16604,
+    18362,
+    18956,
+    20075,
+    21675,
+    22520,
+    26130,
+    26161,
+    26435,
+    28279,
+    29464,
+    31650,
+    32302,
+    32470,
+    36865,
+    42863,
+    47425,
+    49870,
+    50254,
+    50258,
+    50359,
+    50360,
+    50361,
+    50362,
+    50363
+  ],
   "task": "transcribe",
   "task_to_id": {
     "transcribe": 50360,

model-00001-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04e3d50d63894749f20519f76234e580187a999fe35bc497acb051ec61c51780
+size 4993448880

model-00002-of-00002.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:00022667711dccc4a4f9f767a5190c9c64633d551371e34921cedf9e493ad13f
+size 1180663192

model.safetensors.index.json ADDED Viewed

The diff for this file is too large to render. See raw diff

runs/Jul11_12-21-48_experienced-olive-magpie-5dc9947595-7lcfb/events.out.tfevents.1752236513.experienced-olive-magpie-5dc9947595-7lcfb.1358.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:06b16e109803907eb4210981d851ea1f7e1da18b4547da5fc1db08c518f64b3c
+size 5720

runs/Jul11_12-22-32_experienced-olive-magpie-5dc9947595-7lcfb/events.out.tfevents.1752236557.experienced-olive-magpie-5dc9947595-7lcfb.1358.1 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:84354cbef6a3af8605ef818eb368b6c4172edad6323081c1f9a08e7e94f151ab
+size 5719

runs/Jul11_12-24-21_experienced-olive-magpie-5dc9947595-7lcfb/events.out.tfevents.1752236665.experienced-olive-magpie-5dc9947595-7lcfb.1895.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:61a7eb3c652dd5d5807abd8ba5b391bc40e47acf2b392707208c1f89537f32ad
+size 7617

runs/Jul11_12-36-41_experienced-olive-magpie-5dc9947595-7lcfb/events.out.tfevents.1752237405.experienced-olive-magpie-5dc9947595-7lcfb.2358.0 ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:037f26127ea68f79144c3380f3d3b8674ae8b107906fed7939967581b443ea38
+size 11059

training_args.bin CHANGED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:c77f505fdacac100ce01a22a187142ff55f617edec1e36428a54e33318b9175f
-size 5496

 version https://git-lfs.github.com/spec/v1
+oid sha256:fc2b29115fcaf76108d1411838ba92d80061311ae84bb9b94fdd8429b94dd38a
+size 5905