JaparSidik4 commited on Mar 3

Commit

e9d3992

verified ·

1 Parent(s): ff0eb53

Upload folder using huggingface_hub

Browse files

Files changed (48) hide show

checkpoint-1000/added_tokens.json +4 -0
checkpoint-1000/config.json +92 -0
checkpoint-1000/model.safetensors +3 -0
checkpoint-1000/optimizer.pt +3 -0
checkpoint-1000/rng_state.pth +3 -0
checkpoint-1000/scaler.pt +3 -0
checkpoint-1000/scheduler.pt +3 -0
checkpoint-1000/special_tokens_map.json +13 -0
checkpoint-1000/spm_char.model +3 -0
checkpoint-1000/tokenizer_config.json +64 -0
checkpoint-1000/trainer_state.json +321 -0
checkpoint-1000/training_args.bin +3 -0
checkpoint-2000/added_tokens.json +4 -0
checkpoint-2000/config.json +92 -0
checkpoint-2000/model.safetensors +3 -0
checkpoint-2000/optimizer.pt +3 -0
checkpoint-2000/rng_state.pth +3 -0
checkpoint-2000/scaler.pt +3 -0
checkpoint-2000/scheduler.pt +3 -0
checkpoint-2000/special_tokens_map.json +13 -0
checkpoint-2000/spm_char.model +3 -0
checkpoint-2000/tokenizer_config.json +64 -0
checkpoint-2000/trainer_state.json +609 -0
checkpoint-2000/training_args.bin +3 -0
checkpoint-3000/added_tokens.json +4 -0
checkpoint-3000/config.json +92 -0
checkpoint-3000/model.safetensors +3 -0
checkpoint-3000/optimizer.pt +3 -0
checkpoint-3000/rng_state.pth +3 -0
checkpoint-3000/scaler.pt +3 -0
checkpoint-3000/scheduler.pt +3 -0
checkpoint-3000/special_tokens_map.json +13 -0
checkpoint-3000/spm_char.model +3 -0
checkpoint-3000/tokenizer_config.json +64 -0
checkpoint-3000/trainer_state.json +897 -0
checkpoint-3000/training_args.bin +3 -0
checkpoint-4000/added_tokens.json +4 -0
checkpoint-4000/config.json +92 -0
checkpoint-4000/model.safetensors +3 -0
checkpoint-4000/optimizer.pt +3 -0
checkpoint-4000/rng_state.pth +3 -0
checkpoint-4000/scaler.pt +3 -0
checkpoint-4000/scheduler.pt +3 -0
checkpoint-4000/special_tokens_map.json +13 -0
checkpoint-4000/spm_char.model +3 -0
checkpoint-4000/tokenizer_config.json +64 -0
checkpoint-4000/trainer_state.json +1185 -0
checkpoint-4000/training_args.bin +3 -0

checkpoint-1000/added_tokens.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+  "<ctc_blank>": 80,
+  "<mask>": 79
+}

checkpoint-1000/config.json ADDED Viewed

	@@ -0,0 +1,92 @@

+{
+  "_name_or_path": "microsoft/speecht5_tts",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": true,
+  "architectures": [
+    "SpeechT5ForTextToSpeech"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 0,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "decoder_attention_heads": 12,
+  "decoder_ffn_dim": 3072,
+  "decoder_layerdrop": 0.1,
+  "decoder_layers": 6,
+  "decoder_start_token_id": 2,
+  "encoder_attention_heads": 12,
+  "encoder_ffn_dim": 3072,
+  "encoder_layerdrop": 0.1,
+  "encoder_layers": 12,
+  "encoder_max_relative_position": 160,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "guided_attention_loss_num_heads": 2,
+  "guided_attention_loss_scale": 10.0,
+  "guided_attention_loss_sigma": 0.4,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "is_encoder_decoder": true,
+  "layer_norm_eps": 1e-05,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "max_length": 1876,
+  "max_speech_positions": 1876,
+  "max_text_positions": 600,
+  "model_type": "speecht5",
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_mel_bins": 80,
+  "pad_token_id": 1,
+  "positional_dropout": 0.1,
+  "reduction_factor": 2,
+  "scale_embedding": false,
+  "speaker_embedding_dim": 512,
+  "speech_decoder_postnet_dropout": 0.5,
+  "speech_decoder_postnet_kernel": 5,
+  "speech_decoder_postnet_layers": 5,
+  "speech_decoder_postnet_units": 256,
+  "speech_decoder_prenet_dropout": 0.5,
+  "speech_decoder_prenet_layers": 2,
+  "speech_decoder_prenet_units": 256,
+  "torch_dtype": "float32",
+  "transformers_version": "4.50.0.dev0",
+  "use_cache": false,
+  "use_guided_attention_loss": true,
+  "vocab_size": 81
+}

checkpoint-1000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:33cbbe0323c17fa0dd71cd2be9b960ae209a74e0c8e874a3d66f1b1921059f37
+size 577789320

checkpoint-1000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:f1314809864351fb28e22d1c4f0ac2574355a1164728336ff9f7690f48e444e7
+size 1155772233

checkpoint-1000/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:585ca82d8e14932ad03539b98b5915a62b45c3c2faf89e0a54708e90b136e1d0
+size 14244

checkpoint-1000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:87aa44525984371790d54d96d799fdac8e4a1fd53749608cf9dcf03ca2c78583
+size 988

checkpoint-1000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:04adfa1aca9f7b9ed4b807866282ff1495e43e68a72612345d80bdb13c2a1305
+size 1064

checkpoint-1000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

checkpoint-1000/spm_char.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7fcc48f3e225f627b1641db410ceb0c8649bd2b0c982e150b03f8be3728ab560
+size 238473

checkpoint-1000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,64 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "79": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "80": {
+      "content": "<ctc_blank>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "mask_token": "<mask>",
+  "model_max_length": 600,
+  "normalize": false,
+  "pad_token": "<pad>",
+  "processor_class": "SpeechT5Processor",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "SpeechT5Tokenizer",
+  "unk_token": "<unk>"
+}

checkpoint-1000/trainer_state.json ADDED Viewed

	@@ -0,0 +1,321 @@

+{
+  "best_metric": 0.4698790907859802,
+  "best_model_checkpoint": "./speecht5_tts_common_voice_17_0_id/checkpoint-1000",
+  "epoch": 7.142857142857143,
+  "eval_steps": 1000,
+  "global_step": 1000,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.17857142857142858,
+      "grad_norm": 4.796061038970947,
+      "learning_rate": 4.6000000000000004e-07,
+      "loss": 1.0232,
+      "step": 25
+    },
+    {
+      "epoch": 0.35714285714285715,
+      "grad_norm": 6.88640022277832,
+      "learning_rate": 9.600000000000001e-07,
+      "loss": 0.9412,
+      "step": 50
+    },
+    {
+      "epoch": 0.5357142857142857,
+      "grad_norm": 4.282207489013672,
+      "learning_rate": 1.46e-06,
+      "loss": 0.8431,
+      "step": 75
+    },
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 4.095445156097412,
+      "learning_rate": 1.9600000000000003e-06,
+      "loss": 0.7959,
+      "step": 100
+    },
+    {
+      "epoch": 0.8928571428571429,
+      "grad_norm": 6.723930835723877,
+      "learning_rate": 2.46e-06,
+      "loss": 0.7825,
+      "step": 125
+    },
+    {
+      "epoch": 1.0714285714285714,
+      "grad_norm": 2.318833589553833,
+      "learning_rate": 2.96e-06,
+      "loss": 0.7967,
+      "step": 150
+    },
+    {
+      "epoch": 1.25,
+      "grad_norm": 2.1883444786071777,
+      "learning_rate": 3.46e-06,
+      "loss": 0.7826,
+      "step": 175
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 2.7793357372283936,
+      "learning_rate": 3.96e-06,
+      "loss": 0.7238,
+      "step": 200
+    },
+    {
+      "epoch": 1.6071428571428572,
+      "grad_norm": 3.0292282104492188,
+      "learning_rate": 4.4600000000000005e-06,
+      "loss": 0.6981,
+      "step": 225
+    },
+    {
+      "epoch": 1.7857142857142856,
+      "grad_norm": 4.8227314949035645,
+      "learning_rate": 4.960000000000001e-06,
+      "loss": 0.6753,
+      "step": 250
+    },
+    {
+      "epoch": 1.9642857142857144,
+      "grad_norm": 2.781235694885254,
+      "learning_rate": 5.460000000000001e-06,
+      "loss": 0.6337,
+      "step": 275
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 2.9240171909332275,
+      "learning_rate": 5.9600000000000005e-06,
+      "loss": 0.6499,
+      "step": 300
+    },
+    {
+      "epoch": 2.3214285714285716,
+      "grad_norm": 2.0720555782318115,
+      "learning_rate": 6.460000000000001e-06,
+      "loss": 0.5995,
+      "step": 325
+    },
+    {
+      "epoch": 2.5,
+      "grad_norm": 3.025918483734131,
+      "learning_rate": 6.96e-06,
+      "loss": 0.6054,
+      "step": 350
+    },
+    {
+      "epoch": 2.678571428571429,
+      "grad_norm": 3.3047034740448,
+      "learning_rate": 7.4600000000000006e-06,
+      "loss": 0.5828,
+      "step": 375
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 2.4087064266204834,
+      "learning_rate": 7.960000000000002e-06,
+      "loss": 0.5706,
+      "step": 400
+    },
+    {
+      "epoch": 3.0357142857142856,
+      "grad_norm": 2.7837984561920166,
+      "learning_rate": 8.46e-06,
+      "loss": 0.579,
+      "step": 425
+    },
+    {
+      "epoch": 3.2142857142857144,
+      "grad_norm": 1.7530593872070312,
+      "learning_rate": 8.96e-06,
+      "loss": 0.5455,
+      "step": 450
+    },
+    {
+      "epoch": 3.392857142857143,
+      "grad_norm": 2.3677515983581543,
+      "learning_rate": 9.460000000000001e-06,
+      "loss": 0.5557,
+      "step": 475
+    },
+    {
+      "epoch": 3.571428571428571,
+      "grad_norm": 2.445343494415283,
+      "learning_rate": 9.960000000000001e-06,
+      "loss": 0.5686,
+      "step": 500
+    },
+    {
+      "epoch": 3.75,
+      "grad_norm": 4.732877731323242,
+      "learning_rate": 9.934285714285715e-06,
+      "loss": 0.5635,
+      "step": 525
+    },
+    {
+      "epoch": 3.928571428571429,
+      "grad_norm": 4.45880126953125,
+      "learning_rate": 9.862857142857144e-06,
+      "loss": 0.5477,
+      "step": 550
+    },
+    {
+      "epoch": 4.107142857142857,
+      "grad_norm": 3.9657559394836426,
+      "learning_rate": 9.791428571428571e-06,
+      "loss": 0.5563,
+      "step": 575
+    },
+    {
+      "epoch": 4.285714285714286,
+      "grad_norm": 2.676309823989868,
+      "learning_rate": 9.72e-06,
+      "loss": 0.5221,
+      "step": 600
+    },
+    {
+      "epoch": 4.464285714285714,
+      "grad_norm": 2.89937686920166,
+      "learning_rate": 9.648571428571429e-06,
+      "loss": 0.5211,
+      "step": 625
+    },
+    {
+      "epoch": 4.642857142857143,
+      "grad_norm": 2.9824204444885254,
+      "learning_rate": 9.577142857142858e-06,
+      "loss": 0.5583,
+      "step": 650
+    },
+    {
+      "epoch": 4.821428571428571,
+      "grad_norm": 3.632369041442871,
+      "learning_rate": 9.505714285714287e-06,
+      "loss": 0.526,
+      "step": 675
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 2.352837324142456,
+      "learning_rate": 9.434285714285714e-06,
+      "loss": 0.5211,
+      "step": 700
+    },
+    {
+      "epoch": 5.178571428571429,
+      "grad_norm": 1.3236348628997803,
+      "learning_rate": 9.362857142857143e-06,
+      "loss": 0.5173,
+      "step": 725
+    },
+    {
+      "epoch": 5.357142857142857,
+      "grad_norm": 1.8493444919586182,
+      "learning_rate": 9.291428571428572e-06,
+      "loss": 0.5094,
+      "step": 750
+    },
+    {
+      "epoch": 5.535714285714286,
+      "grad_norm": 1.7403544187545776,
+      "learning_rate": 9.220000000000002e-06,
+      "loss": 0.5239,
+      "step": 775
+    },
+    {
+      "epoch": 5.714285714285714,
+      "grad_norm": 4.10603666305542,
+      "learning_rate": 9.148571428571429e-06,
+      "loss": 0.5304,
+      "step": 800
+    },
+    {
+      "epoch": 5.892857142857143,
+      "grad_norm": 2.69100284576416,
+      "learning_rate": 9.077142857142858e-06,
+      "loss": 0.5224,
+      "step": 825
+    },
+    {
+      "epoch": 6.071428571428571,
+      "grad_norm": 1.956499695777893,
+      "learning_rate": 9.005714285714287e-06,
+      "loss": 0.5065,
+      "step": 850
+    },
+    {
+      "epoch": 6.25,
+      "grad_norm": 1.915540337562561,
+      "learning_rate": 8.934285714285716e-06,
+      "loss": 0.511,
+      "step": 875
+    },
+    {
+      "epoch": 6.428571428571429,
+      "grad_norm": 2.1903812885284424,
+      "learning_rate": 8.862857142857143e-06,
+      "loss": 0.5132,
+      "step": 900
+    },
+    {
+      "epoch": 6.607142857142857,
+      "grad_norm": 1.666169285774231,
+      "learning_rate": 8.791428571428572e-06,
+      "loss": 0.5362,
+      "step": 925
+    },
+    {
+      "epoch": 6.785714285714286,
+      "grad_norm": 1.6485190391540527,
+      "learning_rate": 8.720000000000001e-06,
+      "loss": 0.5115,
+      "step": 950
+    },
+    {
+      "epoch": 6.964285714285714,
+      "grad_norm": 1.7726221084594727,
+      "learning_rate": 8.64857142857143e-06,
+      "loss": 0.5183,
+      "step": 975
+    },
+    {
+      "epoch": 7.142857142857143,
+      "grad_norm": 2.7793469429016113,
+      "learning_rate": 8.577142857142858e-06,
+      "loss": 0.5133,
+      "step": 1000
+    },
+    {
+      "epoch": 7.142857142857143,
+      "eval_loss": 0.4698790907859802,
+      "eval_runtime": 10.706,
+      "eval_samples_per_second": 46.422,
+      "eval_steps_per_second": 5.885,
+      "step": 1000
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 4000,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 29,
+  "save_steps": 1000,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 2963090237724936.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-1000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a01e8c0a090b02699d5b506a30ffaf176234c63870a5a741f73db593b385337
+size 5560

checkpoint-2000/added_tokens.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+  "<ctc_blank>": 80,
+  "<mask>": 79
+}

checkpoint-2000/config.json ADDED Viewed

	@@ -0,0 +1,92 @@

+{
+  "_name_or_path": "microsoft/speecht5_tts",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": true,
+  "architectures": [
+    "SpeechT5ForTextToSpeech"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 0,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "decoder_attention_heads": 12,
+  "decoder_ffn_dim": 3072,
+  "decoder_layerdrop": 0.1,
+  "decoder_layers": 6,
+  "decoder_start_token_id": 2,
+  "encoder_attention_heads": 12,
+  "encoder_ffn_dim": 3072,
+  "encoder_layerdrop": 0.1,
+  "encoder_layers": 12,
+  "encoder_max_relative_position": 160,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "guided_attention_loss_num_heads": 2,
+  "guided_attention_loss_scale": 10.0,
+  "guided_attention_loss_sigma": 0.4,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "is_encoder_decoder": true,
+  "layer_norm_eps": 1e-05,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "max_length": 1876,
+  "max_speech_positions": 1876,
+  "max_text_positions": 600,
+  "model_type": "speecht5",
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_mel_bins": 80,
+  "pad_token_id": 1,
+  "positional_dropout": 0.1,
+  "reduction_factor": 2,
+  "scale_embedding": false,
+  "speaker_embedding_dim": 512,
+  "speech_decoder_postnet_dropout": 0.5,
+  "speech_decoder_postnet_kernel": 5,
+  "speech_decoder_postnet_layers": 5,
+  "speech_decoder_postnet_units": 256,
+  "speech_decoder_prenet_dropout": 0.5,
+  "speech_decoder_prenet_layers": 2,
+  "speech_decoder_prenet_units": 256,
+  "torch_dtype": "float32",
+  "transformers_version": "4.50.0.dev0",
+  "use_cache": false,
+  "use_guided_attention_loss": true,
+  "vocab_size": 81
+}

checkpoint-2000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8af5f93c52f7348e0dd980f2d568d4d1a57e81e501bfb716dda04491379bf257
+size 577789320

checkpoint-2000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:8db569bdc5f32ee3acb80da044109ad11a26cf8f0933e4978089b6ac2e34be34
+size 1155772233

checkpoint-2000/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ada26402e6f6f7923f2e77df566e5aa603082f9c0ae08d4066c59fd29adf6c17
+size 14244

checkpoint-2000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c0b23ed8ad30394561c40ec7ebe1b25b72685906a15189a8b49897599d008289
+size 988

checkpoint-2000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:9892f0087eb652598b43152ddd8519208d4c860334ace0372ec523095d6aebd8
+size 1064

checkpoint-2000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

checkpoint-2000/spm_char.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7fcc48f3e225f627b1641db410ceb0c8649bd2b0c982e150b03f8be3728ab560
+size 238473

checkpoint-2000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,64 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "79": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "80": {
+      "content": "<ctc_blank>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "mask_token": "<mask>",
+  "model_max_length": 600,
+  "normalize": false,
+  "pad_token": "<pad>",
+  "processor_class": "SpeechT5Processor",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "SpeechT5Tokenizer",
+  "unk_token": "<unk>"
+}

checkpoint-2000/trainer_state.json ADDED Viewed

	@@ -0,0 +1,609 @@

+{
+  "best_metric": 0.45390585064888,
+  "best_model_checkpoint": "./speecht5_tts_common_voice_17_0_id/checkpoint-2000",
+  "epoch": 14.285714285714286,
+  "eval_steps": 1000,
+  "global_step": 2000,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.17857142857142858,
+      "grad_norm": 4.796061038970947,
+      "learning_rate": 4.6000000000000004e-07,
+      "loss": 1.0232,
+      "step": 25
+    },
+    {
+      "epoch": 0.35714285714285715,
+      "grad_norm": 6.88640022277832,
+      "learning_rate": 9.600000000000001e-07,
+      "loss": 0.9412,
+      "step": 50
+    },
+    {
+      "epoch": 0.5357142857142857,
+      "grad_norm": 4.282207489013672,
+      "learning_rate": 1.46e-06,
+      "loss": 0.8431,
+      "step": 75
+    },
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 4.095445156097412,
+      "learning_rate": 1.9600000000000003e-06,
+      "loss": 0.7959,
+      "step": 100
+    },
+    {
+      "epoch": 0.8928571428571429,
+      "grad_norm": 6.723930835723877,
+      "learning_rate": 2.46e-06,
+      "loss": 0.7825,
+      "step": 125
+    },
+    {
+      "epoch": 1.0714285714285714,
+      "grad_norm": 2.318833589553833,
+      "learning_rate": 2.96e-06,
+      "loss": 0.7967,
+      "step": 150
+    },
+    {
+      "epoch": 1.25,
+      "grad_norm": 2.1883444786071777,
+      "learning_rate": 3.46e-06,
+      "loss": 0.7826,
+      "step": 175
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 2.7793357372283936,
+      "learning_rate": 3.96e-06,
+      "loss": 0.7238,
+      "step": 200
+    },
+    {
+      "epoch": 1.6071428571428572,
+      "grad_norm": 3.0292282104492188,
+      "learning_rate": 4.4600000000000005e-06,
+      "loss": 0.6981,
+      "step": 225
+    },
+    {
+      "epoch": 1.7857142857142856,
+      "grad_norm": 4.8227314949035645,
+      "learning_rate": 4.960000000000001e-06,
+      "loss": 0.6753,
+      "step": 250
+    },
+    {
+      "epoch": 1.9642857142857144,
+      "grad_norm": 2.781235694885254,
+      "learning_rate": 5.460000000000001e-06,
+      "loss": 0.6337,
+      "step": 275
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 2.9240171909332275,
+      "learning_rate": 5.9600000000000005e-06,
+      "loss": 0.6499,
+      "step": 300
+    },
+    {
+      "epoch": 2.3214285714285716,
+      "grad_norm": 2.0720555782318115,
+      "learning_rate": 6.460000000000001e-06,
+      "loss": 0.5995,
+      "step": 325
+    },
+    {
+      "epoch": 2.5,
+      "grad_norm": 3.025918483734131,
+      "learning_rate": 6.96e-06,
+      "loss": 0.6054,
+      "step": 350
+    },
+    {
+      "epoch": 2.678571428571429,
+      "grad_norm": 3.3047034740448,
+      "learning_rate": 7.4600000000000006e-06,
+      "loss": 0.5828,
+      "step": 375
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 2.4087064266204834,
+      "learning_rate": 7.960000000000002e-06,
+      "loss": 0.5706,
+      "step": 400
+    },
+    {
+      "epoch": 3.0357142857142856,
+      "grad_norm": 2.7837984561920166,
+      "learning_rate": 8.46e-06,
+      "loss": 0.579,
+      "step": 425
+    },
+    {
+      "epoch": 3.2142857142857144,
+      "grad_norm": 1.7530593872070312,
+      "learning_rate": 8.96e-06,
+      "loss": 0.5455,
+      "step": 450
+    },
+    {
+      "epoch": 3.392857142857143,
+      "grad_norm": 2.3677515983581543,
+      "learning_rate": 9.460000000000001e-06,
+      "loss": 0.5557,
+      "step": 475
+    },
+    {
+      "epoch": 3.571428571428571,
+      "grad_norm": 2.445343494415283,
+      "learning_rate": 9.960000000000001e-06,
+      "loss": 0.5686,
+      "step": 500
+    },
+    {
+      "epoch": 3.75,
+      "grad_norm": 4.732877731323242,
+      "learning_rate": 9.934285714285715e-06,
+      "loss": 0.5635,
+      "step": 525
+    },
+    {
+      "epoch": 3.928571428571429,
+      "grad_norm": 4.45880126953125,
+      "learning_rate": 9.862857142857144e-06,
+      "loss": 0.5477,
+      "step": 550
+    },
+    {
+      "epoch": 4.107142857142857,
+      "grad_norm": 3.9657559394836426,
+      "learning_rate": 9.791428571428571e-06,
+      "loss": 0.5563,
+      "step": 575
+    },
+    {
+      "epoch": 4.285714285714286,
+      "grad_norm": 2.676309823989868,
+      "learning_rate": 9.72e-06,
+      "loss": 0.5221,
+      "step": 600
+    },
+    {
+      "epoch": 4.464285714285714,
+      "grad_norm": 2.89937686920166,
+      "learning_rate": 9.648571428571429e-06,
+      "loss": 0.5211,
+      "step": 625
+    },
+    {
+      "epoch": 4.642857142857143,
+      "grad_norm": 2.9824204444885254,
+      "learning_rate": 9.577142857142858e-06,
+      "loss": 0.5583,
+      "step": 650
+    },
+    {
+      "epoch": 4.821428571428571,
+      "grad_norm": 3.632369041442871,
+      "learning_rate": 9.505714285714287e-06,
+      "loss": 0.526,
+      "step": 675
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 2.352837324142456,
+      "learning_rate": 9.434285714285714e-06,
+      "loss": 0.5211,
+      "step": 700
+    },
+    {
+      "epoch": 5.178571428571429,
+      "grad_norm": 1.3236348628997803,
+      "learning_rate": 9.362857142857143e-06,
+      "loss": 0.5173,
+      "step": 725
+    },
+    {
+      "epoch": 5.357142857142857,
+      "grad_norm": 1.8493444919586182,
+      "learning_rate": 9.291428571428572e-06,
+      "loss": 0.5094,
+      "step": 750
+    },
+    {
+      "epoch": 5.535714285714286,
+      "grad_norm": 1.7403544187545776,
+      "learning_rate": 9.220000000000002e-06,
+      "loss": 0.5239,
+      "step": 775
+    },
+    {
+      "epoch": 5.714285714285714,
+      "grad_norm": 4.10603666305542,
+      "learning_rate": 9.148571428571429e-06,
+      "loss": 0.5304,
+      "step": 800
+    },
+    {
+      "epoch": 5.892857142857143,
+      "grad_norm": 2.69100284576416,
+      "learning_rate": 9.077142857142858e-06,
+      "loss": 0.5224,
+      "step": 825
+    },
+    {
+      "epoch": 6.071428571428571,
+      "grad_norm": 1.956499695777893,
+      "learning_rate": 9.005714285714287e-06,
+      "loss": 0.5065,
+      "step": 850
+    },
+    {
+      "epoch": 6.25,
+      "grad_norm": 1.915540337562561,
+      "learning_rate": 8.934285714285716e-06,
+      "loss": 0.511,
+      "step": 875
+    },
+    {
+      "epoch": 6.428571428571429,
+      "grad_norm": 2.1903812885284424,
+      "learning_rate": 8.862857142857143e-06,
+      "loss": 0.5132,
+      "step": 900
+    },
+    {
+      "epoch": 6.607142857142857,
+      "grad_norm": 1.666169285774231,
+      "learning_rate": 8.791428571428572e-06,
+      "loss": 0.5362,
+      "step": 925
+    },
+    {
+      "epoch": 6.785714285714286,
+      "grad_norm": 1.6485190391540527,
+      "learning_rate": 8.720000000000001e-06,
+      "loss": 0.5115,
+      "step": 950
+    },
+    {
+      "epoch": 6.964285714285714,
+      "grad_norm": 1.7726221084594727,
+      "learning_rate": 8.64857142857143e-06,
+      "loss": 0.5183,
+      "step": 975
+    },
+    {
+      "epoch": 7.142857142857143,
+      "grad_norm": 2.7793469429016113,
+      "learning_rate": 8.577142857142858e-06,
+      "loss": 0.5133,
+      "step": 1000
+    },
+    {
+      "epoch": 7.142857142857143,
+      "eval_loss": 0.4698790907859802,
+      "eval_runtime": 10.706,
+      "eval_samples_per_second": 46.422,
+      "eval_steps_per_second": 5.885,
+      "step": 1000
+    },
+    {
+      "epoch": 7.321428571428571,
+      "grad_norm": 2.8019936084747314,
+      "learning_rate": 8.505714285714287e-06,
+      "loss": 0.518,
+      "step": 1025
+    },
+    {
+      "epoch": 7.5,
+      "grad_norm": 2.1961379051208496,
+      "learning_rate": 8.434285714285716e-06,
+      "loss": 0.5112,
+      "step": 1050
+    },
+    {
+      "epoch": 7.678571428571429,
+      "grad_norm": 2.5158090591430664,
+      "learning_rate": 8.362857142857143e-06,
+      "loss": 0.5091,
+      "step": 1075
+    },
+    {
+      "epoch": 7.857142857142857,
+      "grad_norm": 2.2158660888671875,
+      "learning_rate": 8.291428571428572e-06,
+      "loss": 0.5121,
+      "step": 1100
+    },
+    {
+      "epoch": 8.035714285714286,
+      "grad_norm": 2.8917131423950195,
+      "learning_rate": 8.220000000000001e-06,
+      "loss": 0.5134,
+      "step": 1125
+    },
+    {
+      "epoch": 8.214285714285714,
+      "grad_norm": 1.9233217239379883,
+      "learning_rate": 8.148571428571428e-06,
+      "loss": 0.5101,
+      "step": 1150
+    },
+    {
+      "epoch": 8.392857142857142,
+      "grad_norm": 2.437870979309082,
+      "learning_rate": 8.077142857142857e-06,
+      "loss": 0.5138,
+      "step": 1175
+    },
+    {
+      "epoch": 8.571428571428571,
+      "grad_norm": 1.7921634912490845,
+      "learning_rate": 8.005714285714286e-06,
+      "loss": 0.5155,
+      "step": 1200
+    },
+    {
+      "epoch": 8.75,
+      "grad_norm": 3.1069226264953613,
+      "learning_rate": 7.934285714285715e-06,
+      "loss": 0.5144,
+      "step": 1225
+    },
+    {
+      "epoch": 8.928571428571429,
+      "grad_norm": 1.7902675867080688,
+      "learning_rate": 7.862857142857143e-06,
+      "loss": 0.4973,
+      "step": 1250
+    },
+    {
+      "epoch": 9.107142857142858,
+      "grad_norm": 2.353273391723633,
+      "learning_rate": 7.791428571428572e-06,
+      "loss": 0.5035,
+      "step": 1275
+    },
+    {
+      "epoch": 9.285714285714286,
+      "grad_norm": 2.3287203311920166,
+      "learning_rate": 7.72e-06,
+      "loss": 0.5085,
+      "step": 1300
+    },
+    {
+      "epoch": 9.464285714285714,
+      "grad_norm": 1.6508110761642456,
+      "learning_rate": 7.64857142857143e-06,
+      "loss": 0.5116,
+      "step": 1325
+    },
+    {
+      "epoch": 9.642857142857142,
+      "grad_norm": 1.8232289552688599,
+      "learning_rate": 7.577142857142857e-06,
+      "loss": 0.5033,
+      "step": 1350
+    },
+    {
+      "epoch": 9.821428571428571,
+      "grad_norm": 2.0248517990112305,
+      "learning_rate": 7.505714285714286e-06,
+      "loss": 0.4974,
+      "step": 1375
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3.7484123706817627,
+      "learning_rate": 7.434285714285715e-06,
+      "loss": 0.4947,
+      "step": 1400
+    },
+    {
+      "epoch": 10.178571428571429,
+      "grad_norm": 1.793626308441162,
+      "learning_rate": 7.362857142857144e-06,
+      "loss": 0.5008,
+      "step": 1425
+    },
+    {
+      "epoch": 10.357142857142858,
+      "grad_norm": 1.8825795650482178,
+      "learning_rate": 7.291428571428571e-06,
+      "loss": 0.4965,
+      "step": 1450
+    },
+    {
+      "epoch": 10.535714285714286,
+      "grad_norm": 2.0584166049957275,
+      "learning_rate": 7.22e-06,
+      "loss": 0.4946,
+      "step": 1475
+    },
+    {
+      "epoch": 10.714285714285714,
+      "grad_norm": 3.3335680961608887,
+      "learning_rate": 7.148571428571429e-06,
+      "loss": 0.5048,
+      "step": 1500
+    },
+    {
+      "epoch": 10.892857142857142,
+      "grad_norm": 1.9972820281982422,
+      "learning_rate": 7.077142857142858e-06,
+      "loss": 0.5071,
+      "step": 1525
+    },
+    {
+      "epoch": 11.071428571428571,
+      "grad_norm": 2.2279226779937744,
+      "learning_rate": 7.0057142857142865e-06,
+      "loss": 0.4874,
+      "step": 1550
+    },
+    {
+      "epoch": 11.25,
+      "grad_norm": 2.168933868408203,
+      "learning_rate": 6.934285714285715e-06,
+      "loss": 0.5011,
+      "step": 1575
+    },
+    {
+      "epoch": 11.428571428571429,
+      "grad_norm": 3.186655044555664,
+      "learning_rate": 6.862857142857144e-06,
+      "loss": 0.4963,
+      "step": 1600
+    },
+    {
+      "epoch": 11.607142857142858,
+      "grad_norm": 2.6348812580108643,
+      "learning_rate": 6.791428571428572e-06,
+      "loss": 0.5007,
+      "step": 1625
+    },
+    {
+      "epoch": 11.785714285714286,
+      "grad_norm": 3.1159684658050537,
+      "learning_rate": 6.720000000000001e-06,
+      "loss": 0.4997,
+      "step": 1650
+    },
+    {
+      "epoch": 11.964285714285714,
+      "grad_norm": 4.068305492401123,
+      "learning_rate": 6.648571428571429e-06,
+      "loss": 0.4919,
+      "step": 1675
+    },
+    {
+      "epoch": 12.142857142857142,
+      "grad_norm": 2.315338134765625,
+      "learning_rate": 6.577142857142857e-06,
+      "loss": 0.4937,
+      "step": 1700
+    },
+    {
+      "epoch": 12.321428571428571,
+      "grad_norm": 1.5482977628707886,
+      "learning_rate": 6.505714285714286e-06,
+      "loss": 0.4964,
+      "step": 1725
+    },
+    {
+      "epoch": 12.5,
+      "grad_norm": 2.1527745723724365,
+      "learning_rate": 6.434285714285715e-06,
+      "loss": 0.494,
+      "step": 1750
+    },
+    {
+      "epoch": 12.678571428571429,
+      "grad_norm": 2.216703176498413,
+      "learning_rate": 6.3628571428571426e-06,
+      "loss": 0.4853,
+      "step": 1775
+    },
+    {
+      "epoch": 12.857142857142858,
+      "grad_norm": 2.939267873764038,
+      "learning_rate": 6.2914285714285716e-06,
+      "loss": 0.4978,
+      "step": 1800
+    },
+    {
+      "epoch": 13.035714285714286,
+      "grad_norm": 2.3067381381988525,
+      "learning_rate": 6.220000000000001e-06,
+      "loss": 0.5023,
+      "step": 1825
+    },
+    {
+      "epoch": 13.214285714285714,
+      "grad_norm": 2.2849552631378174,
+      "learning_rate": 6.14857142857143e-06,
+      "loss": 0.5013,
+      "step": 1850
+    },
+    {
+      "epoch": 13.392857142857142,
+      "grad_norm": 1.8568611145019531,
+      "learning_rate": 6.077142857142858e-06,
+      "loss": 0.4855,
+      "step": 1875
+    },
+    {
+      "epoch": 13.571428571428571,
+      "grad_norm": 2.784388542175293,
+      "learning_rate": 6.005714285714286e-06,
+      "loss": 0.4832,
+      "step": 1900
+    },
+    {
+      "epoch": 13.75,
+      "grad_norm": 1.718732237815857,
+      "learning_rate": 5.934285714285715e-06,
+      "loss": 0.4926,
+      "step": 1925
+    },
+    {
+      "epoch": 13.928571428571429,
+      "grad_norm": 2.3010714054107666,
+      "learning_rate": 5.862857142857143e-06,
+      "loss": 0.494,
+      "step": 1950
+    },
+    {
+      "epoch": 14.107142857142858,
+      "grad_norm": 2.0058493614196777,
+      "learning_rate": 5.791428571428572e-06,
+      "loss": 0.4901,
+      "step": 1975
+    },
+    {
+      "epoch": 14.285714285714286,
+      "grad_norm": 2.311893939971924,
+      "learning_rate": 5.72e-06,
+      "loss": 0.4774,
+      "step": 2000
+    },
+    {
+      "epoch": 14.285714285714286,
+      "eval_loss": 0.45390585064888,
+      "eval_runtime": 18.3883,
+      "eval_samples_per_second": 27.028,
+      "eval_steps_per_second": 3.426,
+      "step": 2000
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 4000,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 29,
+  "save_steps": 1000,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 5927807866030776.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-2000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a01e8c0a090b02699d5b506a30ffaf176234c63870a5a741f73db593b385337
+size 5560

checkpoint-3000/added_tokens.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+  "<ctc_blank>": 80,
+  "<mask>": 79
+}

checkpoint-3000/config.json ADDED Viewed

	@@ -0,0 +1,92 @@

+{
+  "_name_or_path": "microsoft/speecht5_tts",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": true,
+  "architectures": [
+    "SpeechT5ForTextToSpeech"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 0,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "decoder_attention_heads": 12,
+  "decoder_ffn_dim": 3072,
+  "decoder_layerdrop": 0.1,
+  "decoder_layers": 6,
+  "decoder_start_token_id": 2,
+  "encoder_attention_heads": 12,
+  "encoder_ffn_dim": 3072,
+  "encoder_layerdrop": 0.1,
+  "encoder_layers": 12,
+  "encoder_max_relative_position": 160,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "guided_attention_loss_num_heads": 2,
+  "guided_attention_loss_scale": 10.0,
+  "guided_attention_loss_sigma": 0.4,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "is_encoder_decoder": true,
+  "layer_norm_eps": 1e-05,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "max_length": 1876,
+  "max_speech_positions": 1876,
+  "max_text_positions": 600,
+  "model_type": "speecht5",
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_mel_bins": 80,
+  "pad_token_id": 1,
+  "positional_dropout": 0.1,
+  "reduction_factor": 2,
+  "scale_embedding": false,
+  "speaker_embedding_dim": 512,
+  "speech_decoder_postnet_dropout": 0.5,
+  "speech_decoder_postnet_kernel": 5,
+  "speech_decoder_postnet_layers": 5,
+  "speech_decoder_postnet_units": 256,
+  "speech_decoder_prenet_dropout": 0.5,
+  "speech_decoder_prenet_layers": 2,
+  "speech_decoder_prenet_units": 256,
+  "torch_dtype": "float32",
+  "transformers_version": "4.50.0.dev0",
+  "use_cache": false,
+  "use_guided_attention_loss": true,
+  "vocab_size": 81
+}

checkpoint-3000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1cd68e450899c334ac78ad0994af7cabde4187c89fe02b7215159c76c2bce334
+size 577789320

checkpoint-3000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:c87eef7f0e2e00cbab7038d913581ba1792c5c003d283732899044684a57c635
+size 1155772233

checkpoint-3000/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:ebd1aefed45469c63901268b01ba1869f235267cd8c436935a74b257cb260841
+size 14244

checkpoint-3000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a73b49b55d3aadf9516bb5b6bdc1d8930fb0d3a40da81083b6f1d89b5130278c
+size 988

checkpoint-3000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:30b4b82462a87716b3f11ac99d935386eaf7ea7c7ab13974e514e9689621e7eb
+size 1064

checkpoint-3000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

checkpoint-3000/spm_char.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7fcc48f3e225f627b1641db410ceb0c8649bd2b0c982e150b03f8be3728ab560
+size 238473

checkpoint-3000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,64 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "79": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "80": {
+      "content": "<ctc_blank>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "mask_token": "<mask>",
+  "model_max_length": 600,
+  "normalize": false,
+  "pad_token": "<pad>",
+  "processor_class": "SpeechT5Processor",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "SpeechT5Tokenizer",
+  "unk_token": "<unk>"
+}

checkpoint-3000/trainer_state.json ADDED Viewed

	@@ -0,0 +1,897 @@

+{
+  "best_metric": 0.44868698716163635,
+  "best_model_checkpoint": "./speecht5_tts_common_voice_17_0_id/checkpoint-3000",
+  "epoch": 21.428571428571427,
+  "eval_steps": 1000,
+  "global_step": 3000,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.17857142857142858,
+      "grad_norm": 4.796061038970947,
+      "learning_rate": 4.6000000000000004e-07,
+      "loss": 1.0232,
+      "step": 25
+    },
+    {
+      "epoch": 0.35714285714285715,
+      "grad_norm": 6.88640022277832,
+      "learning_rate": 9.600000000000001e-07,
+      "loss": 0.9412,
+      "step": 50
+    },
+    {
+      "epoch": 0.5357142857142857,
+      "grad_norm": 4.282207489013672,
+      "learning_rate": 1.46e-06,
+      "loss": 0.8431,
+      "step": 75
+    },
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 4.095445156097412,
+      "learning_rate": 1.9600000000000003e-06,
+      "loss": 0.7959,
+      "step": 100
+    },
+    {
+      "epoch": 0.8928571428571429,
+      "grad_norm": 6.723930835723877,
+      "learning_rate": 2.46e-06,
+      "loss": 0.7825,
+      "step": 125
+    },
+    {
+      "epoch": 1.0714285714285714,
+      "grad_norm": 2.318833589553833,
+      "learning_rate": 2.96e-06,
+      "loss": 0.7967,
+      "step": 150
+    },
+    {
+      "epoch": 1.25,
+      "grad_norm": 2.1883444786071777,
+      "learning_rate": 3.46e-06,
+      "loss": 0.7826,
+      "step": 175
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 2.7793357372283936,
+      "learning_rate": 3.96e-06,
+      "loss": 0.7238,
+      "step": 200
+    },
+    {
+      "epoch": 1.6071428571428572,
+      "grad_norm": 3.0292282104492188,
+      "learning_rate": 4.4600000000000005e-06,
+      "loss": 0.6981,
+      "step": 225
+    },
+    {
+      "epoch": 1.7857142857142856,
+      "grad_norm": 4.8227314949035645,
+      "learning_rate": 4.960000000000001e-06,
+      "loss": 0.6753,
+      "step": 250
+    },
+    {
+      "epoch": 1.9642857142857144,
+      "grad_norm": 2.781235694885254,
+      "learning_rate": 5.460000000000001e-06,
+      "loss": 0.6337,
+      "step": 275
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 2.9240171909332275,
+      "learning_rate": 5.9600000000000005e-06,
+      "loss": 0.6499,
+      "step": 300
+    },
+    {
+      "epoch": 2.3214285714285716,
+      "grad_norm": 2.0720555782318115,
+      "learning_rate": 6.460000000000001e-06,
+      "loss": 0.5995,
+      "step": 325
+    },
+    {
+      "epoch": 2.5,
+      "grad_norm": 3.025918483734131,
+      "learning_rate": 6.96e-06,
+      "loss": 0.6054,
+      "step": 350
+    },
+    {
+      "epoch": 2.678571428571429,
+      "grad_norm": 3.3047034740448,
+      "learning_rate": 7.4600000000000006e-06,
+      "loss": 0.5828,
+      "step": 375
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 2.4087064266204834,
+      "learning_rate": 7.960000000000002e-06,
+      "loss": 0.5706,
+      "step": 400
+    },
+    {
+      "epoch": 3.0357142857142856,
+      "grad_norm": 2.7837984561920166,
+      "learning_rate": 8.46e-06,
+      "loss": 0.579,
+      "step": 425
+    },
+    {
+      "epoch": 3.2142857142857144,
+      "grad_norm": 1.7530593872070312,
+      "learning_rate": 8.96e-06,
+      "loss": 0.5455,
+      "step": 450
+    },
+    {
+      "epoch": 3.392857142857143,
+      "grad_norm": 2.3677515983581543,
+      "learning_rate": 9.460000000000001e-06,
+      "loss": 0.5557,
+      "step": 475
+    },
+    {
+      "epoch": 3.571428571428571,
+      "grad_norm": 2.445343494415283,
+      "learning_rate": 9.960000000000001e-06,
+      "loss": 0.5686,
+      "step": 500
+    },
+    {
+      "epoch": 3.75,
+      "grad_norm": 4.732877731323242,
+      "learning_rate": 9.934285714285715e-06,
+      "loss": 0.5635,
+      "step": 525
+    },
+    {
+      "epoch": 3.928571428571429,
+      "grad_norm": 4.45880126953125,
+      "learning_rate": 9.862857142857144e-06,
+      "loss": 0.5477,
+      "step": 550
+    },
+    {
+      "epoch": 4.107142857142857,
+      "grad_norm": 3.9657559394836426,
+      "learning_rate": 9.791428571428571e-06,
+      "loss": 0.5563,
+      "step": 575
+    },
+    {
+      "epoch": 4.285714285714286,
+      "grad_norm": 2.676309823989868,
+      "learning_rate": 9.72e-06,
+      "loss": 0.5221,
+      "step": 600
+    },
+    {
+      "epoch": 4.464285714285714,
+      "grad_norm": 2.89937686920166,
+      "learning_rate": 9.648571428571429e-06,
+      "loss": 0.5211,
+      "step": 625
+    },
+    {
+      "epoch": 4.642857142857143,
+      "grad_norm": 2.9824204444885254,
+      "learning_rate": 9.577142857142858e-06,
+      "loss": 0.5583,
+      "step": 650
+    },
+    {
+      "epoch": 4.821428571428571,
+      "grad_norm": 3.632369041442871,
+      "learning_rate": 9.505714285714287e-06,
+      "loss": 0.526,
+      "step": 675
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 2.352837324142456,
+      "learning_rate": 9.434285714285714e-06,
+      "loss": 0.5211,
+      "step": 700
+    },
+    {
+      "epoch": 5.178571428571429,
+      "grad_norm": 1.3236348628997803,
+      "learning_rate": 9.362857142857143e-06,
+      "loss": 0.5173,
+      "step": 725
+    },
+    {
+      "epoch": 5.357142857142857,
+      "grad_norm": 1.8493444919586182,
+      "learning_rate": 9.291428571428572e-06,
+      "loss": 0.5094,
+      "step": 750
+    },
+    {
+      "epoch": 5.535714285714286,
+      "grad_norm": 1.7403544187545776,
+      "learning_rate": 9.220000000000002e-06,
+      "loss": 0.5239,
+      "step": 775
+    },
+    {
+      "epoch": 5.714285714285714,
+      "grad_norm": 4.10603666305542,
+      "learning_rate": 9.148571428571429e-06,
+      "loss": 0.5304,
+      "step": 800
+    },
+    {
+      "epoch": 5.892857142857143,
+      "grad_norm": 2.69100284576416,
+      "learning_rate": 9.077142857142858e-06,
+      "loss": 0.5224,
+      "step": 825
+    },
+    {
+      "epoch": 6.071428571428571,
+      "grad_norm": 1.956499695777893,
+      "learning_rate": 9.005714285714287e-06,
+      "loss": 0.5065,
+      "step": 850
+    },
+    {
+      "epoch": 6.25,
+      "grad_norm": 1.915540337562561,
+      "learning_rate": 8.934285714285716e-06,
+      "loss": 0.511,
+      "step": 875
+    },
+    {
+      "epoch": 6.428571428571429,
+      "grad_norm": 2.1903812885284424,
+      "learning_rate": 8.862857142857143e-06,
+      "loss": 0.5132,
+      "step": 900
+    },
+    {
+      "epoch": 6.607142857142857,
+      "grad_norm": 1.666169285774231,
+      "learning_rate": 8.791428571428572e-06,
+      "loss": 0.5362,
+      "step": 925
+    },
+    {
+      "epoch": 6.785714285714286,
+      "grad_norm": 1.6485190391540527,
+      "learning_rate": 8.720000000000001e-06,
+      "loss": 0.5115,
+      "step": 950
+    },
+    {
+      "epoch": 6.964285714285714,
+      "grad_norm": 1.7726221084594727,
+      "learning_rate": 8.64857142857143e-06,
+      "loss": 0.5183,
+      "step": 975
+    },
+    {
+      "epoch": 7.142857142857143,
+      "grad_norm": 2.7793469429016113,
+      "learning_rate": 8.577142857142858e-06,
+      "loss": 0.5133,
+      "step": 1000
+    },
+    {
+      "epoch": 7.142857142857143,
+      "eval_loss": 0.4698790907859802,
+      "eval_runtime": 10.706,
+      "eval_samples_per_second": 46.422,
+      "eval_steps_per_second": 5.885,
+      "step": 1000
+    },
+    {
+      "epoch": 7.321428571428571,
+      "grad_norm": 2.8019936084747314,
+      "learning_rate": 8.505714285714287e-06,
+      "loss": 0.518,
+      "step": 1025
+    },
+    {
+      "epoch": 7.5,
+      "grad_norm": 2.1961379051208496,
+      "learning_rate": 8.434285714285716e-06,
+      "loss": 0.5112,
+      "step": 1050
+    },
+    {
+      "epoch": 7.678571428571429,
+      "grad_norm": 2.5158090591430664,
+      "learning_rate": 8.362857142857143e-06,
+      "loss": 0.5091,
+      "step": 1075
+    },
+    {
+      "epoch": 7.857142857142857,
+      "grad_norm": 2.2158660888671875,
+      "learning_rate": 8.291428571428572e-06,
+      "loss": 0.5121,
+      "step": 1100
+    },
+    {
+      "epoch": 8.035714285714286,
+      "grad_norm": 2.8917131423950195,
+      "learning_rate": 8.220000000000001e-06,
+      "loss": 0.5134,
+      "step": 1125
+    },
+    {
+      "epoch": 8.214285714285714,
+      "grad_norm": 1.9233217239379883,
+      "learning_rate": 8.148571428571428e-06,
+      "loss": 0.5101,
+      "step": 1150
+    },
+    {
+      "epoch": 8.392857142857142,
+      "grad_norm": 2.437870979309082,
+      "learning_rate": 8.077142857142857e-06,
+      "loss": 0.5138,
+      "step": 1175
+    },
+    {
+      "epoch": 8.571428571428571,
+      "grad_norm": 1.7921634912490845,
+      "learning_rate": 8.005714285714286e-06,
+      "loss": 0.5155,
+      "step": 1200
+    },
+    {
+      "epoch": 8.75,
+      "grad_norm": 3.1069226264953613,
+      "learning_rate": 7.934285714285715e-06,
+      "loss": 0.5144,
+      "step": 1225
+    },
+    {
+      "epoch": 8.928571428571429,
+      "grad_norm": 1.7902675867080688,
+      "learning_rate": 7.862857142857143e-06,
+      "loss": 0.4973,
+      "step": 1250
+    },
+    {
+      "epoch": 9.107142857142858,
+      "grad_norm": 2.353273391723633,
+      "learning_rate": 7.791428571428572e-06,
+      "loss": 0.5035,
+      "step": 1275
+    },
+    {
+      "epoch": 9.285714285714286,
+      "grad_norm": 2.3287203311920166,
+      "learning_rate": 7.72e-06,
+      "loss": 0.5085,
+      "step": 1300
+    },
+    {
+      "epoch": 9.464285714285714,
+      "grad_norm": 1.6508110761642456,
+      "learning_rate": 7.64857142857143e-06,
+      "loss": 0.5116,
+      "step": 1325
+    },
+    {
+      "epoch": 9.642857142857142,
+      "grad_norm": 1.8232289552688599,
+      "learning_rate": 7.577142857142857e-06,
+      "loss": 0.5033,
+      "step": 1350
+    },
+    {
+      "epoch": 9.821428571428571,
+      "grad_norm": 2.0248517990112305,
+      "learning_rate": 7.505714285714286e-06,
+      "loss": 0.4974,
+      "step": 1375
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3.7484123706817627,
+      "learning_rate": 7.434285714285715e-06,
+      "loss": 0.4947,
+      "step": 1400
+    },
+    {
+      "epoch": 10.178571428571429,
+      "grad_norm": 1.793626308441162,
+      "learning_rate": 7.362857142857144e-06,
+      "loss": 0.5008,
+      "step": 1425
+    },
+    {
+      "epoch": 10.357142857142858,
+      "grad_norm": 1.8825795650482178,
+      "learning_rate": 7.291428571428571e-06,
+      "loss": 0.4965,
+      "step": 1450
+    },
+    {
+      "epoch": 10.535714285714286,
+      "grad_norm": 2.0584166049957275,
+      "learning_rate": 7.22e-06,
+      "loss": 0.4946,
+      "step": 1475
+    },
+    {
+      "epoch": 10.714285714285714,
+      "grad_norm": 3.3335680961608887,
+      "learning_rate": 7.148571428571429e-06,
+      "loss": 0.5048,
+      "step": 1500
+    },
+    {
+      "epoch": 10.892857142857142,
+      "grad_norm": 1.9972820281982422,
+      "learning_rate": 7.077142857142858e-06,
+      "loss": 0.5071,
+      "step": 1525
+    },
+    {
+      "epoch": 11.071428571428571,
+      "grad_norm": 2.2279226779937744,
+      "learning_rate": 7.0057142857142865e-06,
+      "loss": 0.4874,
+      "step": 1550
+    },
+    {
+      "epoch": 11.25,
+      "grad_norm": 2.168933868408203,
+      "learning_rate": 6.934285714285715e-06,
+      "loss": 0.5011,
+      "step": 1575
+    },
+    {
+      "epoch": 11.428571428571429,
+      "grad_norm": 3.186655044555664,
+      "learning_rate": 6.862857142857144e-06,
+      "loss": 0.4963,
+      "step": 1600
+    },
+    {
+      "epoch": 11.607142857142858,
+      "grad_norm": 2.6348812580108643,
+      "learning_rate": 6.791428571428572e-06,
+      "loss": 0.5007,
+      "step": 1625
+    },
+    {
+      "epoch": 11.785714285714286,
+      "grad_norm": 3.1159684658050537,
+      "learning_rate": 6.720000000000001e-06,
+      "loss": 0.4997,
+      "step": 1650
+    },
+    {
+      "epoch": 11.964285714285714,
+      "grad_norm": 4.068305492401123,
+      "learning_rate": 6.648571428571429e-06,
+      "loss": 0.4919,
+      "step": 1675
+    },
+    {
+      "epoch": 12.142857142857142,
+      "grad_norm": 2.315338134765625,
+      "learning_rate": 6.577142857142857e-06,
+      "loss": 0.4937,
+      "step": 1700
+    },
+    {
+      "epoch": 12.321428571428571,
+      "grad_norm": 1.5482977628707886,
+      "learning_rate": 6.505714285714286e-06,
+      "loss": 0.4964,
+      "step": 1725
+    },
+    {
+      "epoch": 12.5,
+      "grad_norm": 2.1527745723724365,
+      "learning_rate": 6.434285714285715e-06,
+      "loss": 0.494,
+      "step": 1750
+    },
+    {
+      "epoch": 12.678571428571429,
+      "grad_norm": 2.216703176498413,
+      "learning_rate": 6.3628571428571426e-06,
+      "loss": 0.4853,
+      "step": 1775
+    },
+    {
+      "epoch": 12.857142857142858,
+      "grad_norm": 2.939267873764038,
+      "learning_rate": 6.2914285714285716e-06,
+      "loss": 0.4978,
+      "step": 1800
+    },
+    {
+      "epoch": 13.035714285714286,
+      "grad_norm": 2.3067381381988525,
+      "learning_rate": 6.220000000000001e-06,
+      "loss": 0.5023,
+      "step": 1825
+    },
+    {
+      "epoch": 13.214285714285714,
+      "grad_norm": 2.2849552631378174,
+      "learning_rate": 6.14857142857143e-06,
+      "loss": 0.5013,
+      "step": 1850
+    },
+    {
+      "epoch": 13.392857142857142,
+      "grad_norm": 1.8568611145019531,
+      "learning_rate": 6.077142857142858e-06,
+      "loss": 0.4855,
+      "step": 1875
+    },
+    {
+      "epoch": 13.571428571428571,
+      "grad_norm": 2.784388542175293,
+      "learning_rate": 6.005714285714286e-06,
+      "loss": 0.4832,
+      "step": 1900
+    },
+    {
+      "epoch": 13.75,
+      "grad_norm": 1.718732237815857,
+      "learning_rate": 5.934285714285715e-06,
+      "loss": 0.4926,
+      "step": 1925
+    },
+    {
+      "epoch": 13.928571428571429,
+      "grad_norm": 2.3010714054107666,
+      "learning_rate": 5.862857142857143e-06,
+      "loss": 0.494,
+      "step": 1950
+    },
+    {
+      "epoch": 14.107142857142858,
+      "grad_norm": 2.0058493614196777,
+      "learning_rate": 5.791428571428572e-06,
+      "loss": 0.4901,
+      "step": 1975
+    },
+    {
+      "epoch": 14.285714285714286,
+      "grad_norm": 2.311893939971924,
+      "learning_rate": 5.72e-06,
+      "loss": 0.4774,
+      "step": 2000
+    },
+    {
+      "epoch": 14.285714285714286,
+      "eval_loss": 0.45390585064888,
+      "eval_runtime": 18.3883,
+      "eval_samples_per_second": 27.028,
+      "eval_steps_per_second": 3.426,
+      "step": 2000
+    },
+    {
+      "epoch": 14.464285714285714,
+      "grad_norm": 5.475688457489014,
+      "learning_rate": 5.6485714285714285e-06,
+      "loss": 0.479,
+      "step": 2025
+    },
+    {
+      "epoch": 14.642857142857142,
+      "grad_norm": 2.333171844482422,
+      "learning_rate": 5.5771428571428575e-06,
+      "loss": 0.487,
+      "step": 2050
+    },
+    {
+      "epoch": 14.821428571428571,
+      "grad_norm": 1.7914478778839111,
+      "learning_rate": 5.5057142857142865e-06,
+      "loss": 0.5042,
+      "step": 2075
+    },
+    {
+      "epoch": 15.0,
+      "grad_norm": 2.343949317932129,
+      "learning_rate": 5.4342857142857155e-06,
+      "loss": 0.4994,
+      "step": 2100
+    },
+    {
+      "epoch": 15.178571428571429,
+      "grad_norm": 2.7536513805389404,
+      "learning_rate": 5.362857142857143e-06,
+      "loss": 0.492,
+      "step": 2125
+    },
+    {
+      "epoch": 15.357142857142858,
+      "grad_norm": 3.5288944244384766,
+      "learning_rate": 5.291428571428572e-06,
+      "loss": 0.4878,
+      "step": 2150
+    },
+    {
+      "epoch": 15.535714285714286,
+      "grad_norm": 4.280928611755371,
+      "learning_rate": 5.220000000000001e-06,
+      "loss": 0.4908,
+      "step": 2175
+    },
+    {
+      "epoch": 15.714285714285714,
+      "grad_norm": 3.1674723625183105,
+      "learning_rate": 5.14857142857143e-06,
+      "loss": 0.4896,
+      "step": 2200
+    },
+    {
+      "epoch": 15.892857142857142,
+      "grad_norm": 1.4766712188720703,
+      "learning_rate": 5.077142857142857e-06,
+      "loss": 0.4891,
+      "step": 2225
+    },
+    {
+      "epoch": 16.071428571428573,
+      "grad_norm": 2.7163197994232178,
+      "learning_rate": 5.005714285714286e-06,
+      "loss": 0.4901,
+      "step": 2250
+    },
+    {
+      "epoch": 16.25,
+      "grad_norm": 2.2624833583831787,
+      "learning_rate": 4.934285714285715e-06,
+      "loss": 0.4841,
+      "step": 2275
+    },
+    {
+      "epoch": 16.428571428571427,
+      "grad_norm": 3.0063624382019043,
+      "learning_rate": 4.862857142857143e-06,
+      "loss": 0.4826,
+      "step": 2300
+    },
+    {
+      "epoch": 16.607142857142858,
+      "grad_norm": 1.5605120658874512,
+      "learning_rate": 4.7914285714285715e-06,
+      "loss": 0.4808,
+      "step": 2325
+    },
+    {
+      "epoch": 16.785714285714285,
+      "grad_norm": 1.8184423446655273,
+      "learning_rate": 4.7200000000000005e-06,
+      "loss": 0.4743,
+      "step": 2350
+    },
+    {
+      "epoch": 16.964285714285715,
+      "grad_norm": 1.490218162536621,
+      "learning_rate": 4.648571428571429e-06,
+      "loss": 0.4848,
+      "step": 2375
+    },
+    {
+      "epoch": 17.142857142857142,
+      "grad_norm": 2.210409641265869,
+      "learning_rate": 4.577142857142858e-06,
+      "loss": 0.4814,
+      "step": 2400
+    },
+    {
+      "epoch": 17.321428571428573,
+      "grad_norm": 1.8189564943313599,
+      "learning_rate": 4.505714285714286e-06,
+      "loss": 0.4749,
+      "step": 2425
+    },
+    {
+      "epoch": 17.5,
+      "grad_norm": 2.2493181228637695,
+      "learning_rate": 4.434285714285715e-06,
+      "loss": 0.4835,
+      "step": 2450
+    },
+    {
+      "epoch": 17.678571428571427,
+      "grad_norm": 2.454582452774048,
+      "learning_rate": 4.362857142857143e-06,
+      "loss": 0.4891,
+      "step": 2475
+    },
+    {
+      "epoch": 17.857142857142858,
+      "grad_norm": 2.0914249420166016,
+      "learning_rate": 4.291428571428572e-06,
+      "loss": 0.4774,
+      "step": 2500
+    },
+    {
+      "epoch": 18.035714285714285,
+      "grad_norm": 1.6150003671646118,
+      "learning_rate": 4.22e-06,
+      "loss": 0.4826,
+      "step": 2525
+    },
+    {
+      "epoch": 18.214285714285715,
+      "grad_norm": 2.94893217086792,
+      "learning_rate": 4.148571428571429e-06,
+      "loss": 0.4894,
+      "step": 2550
+    },
+    {
+      "epoch": 18.392857142857142,
+      "grad_norm": 1.913024663925171,
+      "learning_rate": 4.0771428571428574e-06,
+      "loss": 0.4784,
+      "step": 2575
+    },
+    {
+      "epoch": 18.571428571428573,
+      "grad_norm": 2.2716126441955566,
+      "learning_rate": 4.0057142857142864e-06,
+      "loss": 0.4709,
+      "step": 2600
+    },
+    {
+      "epoch": 18.75,
+      "grad_norm": 3.5856099128723145,
+      "learning_rate": 3.934285714285715e-06,
+      "loss": 0.4885,
+      "step": 2625
+    },
+    {
+      "epoch": 18.928571428571427,
+      "grad_norm": 4.390285015106201,
+      "learning_rate": 3.862857142857143e-06,
+      "loss": 0.4828,
+      "step": 2650
+    },
+    {
+      "epoch": 19.107142857142858,
+      "grad_norm": 3.690558910369873,
+      "learning_rate": 3.7914285714285722e-06,
+      "loss": 0.4862,
+      "step": 2675
+    },
+    {
+      "epoch": 19.285714285714285,
+      "grad_norm": 3.1892879009246826,
+      "learning_rate": 3.7200000000000004e-06,
+      "loss": 0.4798,
+      "step": 2700
+    },
+    {
+      "epoch": 19.464285714285715,
+      "grad_norm": 2.4511208534240723,
+      "learning_rate": 3.648571428571429e-06,
+      "loss": 0.4844,
+      "step": 2725
+    },
+    {
+      "epoch": 19.642857142857142,
+      "grad_norm": 1.642425537109375,
+      "learning_rate": 3.5771428571428576e-06,
+      "loss": 0.4845,
+      "step": 2750
+    },
+    {
+      "epoch": 19.821428571428573,
+      "grad_norm": 1.53347909450531,
+      "learning_rate": 3.505714285714286e-06,
+      "loss": 0.4821,
+      "step": 2775
+    },
+    {
+      "epoch": 20.0,
+      "grad_norm": 2.1212124824523926,
+      "learning_rate": 3.4342857142857143e-06,
+      "loss": 0.4756,
+      "step": 2800
+    },
+    {
+      "epoch": 20.178571428571427,
+      "grad_norm": 2.1033811569213867,
+      "learning_rate": 3.3628571428571433e-06,
+      "loss": 0.4729,
+      "step": 2825
+    },
+    {
+      "epoch": 20.357142857142858,
+      "grad_norm": 1.9785221815109253,
+      "learning_rate": 3.2914285714285715e-06,
+      "loss": 0.4783,
+      "step": 2850
+    },
+    {
+      "epoch": 20.535714285714285,
+      "grad_norm": 1.7057210206985474,
+      "learning_rate": 3.2200000000000005e-06,
+      "loss": 0.4728,
+      "step": 2875
+    },
+    {
+      "epoch": 20.714285714285715,
+      "grad_norm": 2.1187682151794434,
+      "learning_rate": 3.1485714285714287e-06,
+      "loss": 0.4765,
+      "step": 2900
+    },
+    {
+      "epoch": 20.892857142857142,
+      "grad_norm": 2.3613460063934326,
+      "learning_rate": 3.0771428571428573e-06,
+      "loss": 0.4696,
+      "step": 2925
+    },
+    {
+      "epoch": 21.071428571428573,
+      "grad_norm": 1.5449374914169312,
+      "learning_rate": 3.005714285714286e-06,
+      "loss": 0.4753,
+      "step": 2950
+    },
+    {
+      "epoch": 21.25,
+      "grad_norm": 1.9528214931488037,
+      "learning_rate": 2.9342857142857144e-06,
+      "loss": 0.4777,
+      "step": 2975
+    },
+    {
+      "epoch": 21.428571428571427,
+      "grad_norm": 1.8519726991653442,
+      "learning_rate": 2.8628571428571435e-06,
+      "loss": 0.4739,
+      "step": 3000
+    },
+    {
+      "epoch": 21.428571428571427,
+      "eval_loss": 0.44868698716163635,
+      "eval_runtime": 10.7576,
+      "eval_samples_per_second": 46.2,
+      "eval_steps_per_second": 5.856,
+      "step": 3000
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 4000,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 29,
+  "save_steps": 1000,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": false
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 8896616922279240.0,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-3000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a01e8c0a090b02699d5b506a30ffaf176234c63870a5a741f73db593b385337
+size 5560

checkpoint-4000/added_tokens.json ADDED Viewed

	@@ -0,0 +1,4 @@

+{
+  "<ctc_blank>": 80,
+  "<mask>": 79
+}

checkpoint-4000/config.json ADDED Viewed

	@@ -0,0 +1,92 @@

+{
+  "_name_or_path": "microsoft/speecht5_tts",
+  "activation_dropout": 0.1,
+  "apply_spec_augment": true,
+  "architectures": [
+    "SpeechT5ForTextToSpeech"
+  ],
+  "attention_dropout": 0.1,
+  "bos_token_id": 0,
+  "conv_bias": false,
+  "conv_dim": [
+    512,
+    512,
+    512,
+    512,
+    512,
+    512,
+    512
+  ],
+  "conv_kernel": [
+    10,
+    3,
+    3,
+    3,
+    3,
+    2,
+    2
+  ],
+  "conv_stride": [
+    5,
+    2,
+    2,
+    2,
+    2,
+    2,
+    2
+  ],
+  "decoder_attention_heads": 12,
+  "decoder_ffn_dim": 3072,
+  "decoder_layerdrop": 0.1,
+  "decoder_layers": 6,
+  "decoder_start_token_id": 2,
+  "encoder_attention_heads": 12,
+  "encoder_ffn_dim": 3072,
+  "encoder_layerdrop": 0.1,
+  "encoder_layers": 12,
+  "encoder_max_relative_position": 160,
+  "eos_token_id": 2,
+  "feat_extract_activation": "gelu",
+  "feat_extract_norm": "group",
+  "feat_proj_dropout": 0.0,
+  "guided_attention_loss_num_heads": 2,
+  "guided_attention_loss_scale": 10.0,
+  "guided_attention_loss_sigma": 0.4,
+  "hidden_act": "gelu",
+  "hidden_dropout": 0.1,
+  "hidden_size": 768,
+  "initializer_range": 0.02,
+  "is_encoder_decoder": true,
+  "layer_norm_eps": 1e-05,
+  "mask_feature_length": 10,
+  "mask_feature_min_masks": 0,
+  "mask_feature_prob": 0.0,
+  "mask_time_length": 10,
+  "mask_time_min_masks": 2,
+  "mask_time_prob": 0.05,
+  "max_length": 1876,
+  "max_speech_positions": 1876,
+  "max_text_positions": 600,
+  "model_type": "speecht5",
+  "num_conv_pos_embedding_groups": 16,
+  "num_conv_pos_embeddings": 128,
+  "num_feat_extract_layers": 7,
+  "num_mel_bins": 80,
+  "pad_token_id": 1,
+  "positional_dropout": 0.1,
+  "reduction_factor": 2,
+  "scale_embedding": false,
+  "speaker_embedding_dim": 512,
+  "speech_decoder_postnet_dropout": 0.5,
+  "speech_decoder_postnet_kernel": 5,
+  "speech_decoder_postnet_layers": 5,
+  "speech_decoder_postnet_units": 256,
+  "speech_decoder_prenet_dropout": 0.5,
+  "speech_decoder_prenet_layers": 2,
+  "speech_decoder_prenet_units": 256,
+  "torch_dtype": "float32",
+  "transformers_version": "4.50.0.dev0",
+  "use_cache": false,
+  "use_guided_attention_loss": true,
+  "vocab_size": 81
+}

checkpoint-4000/model.safetensors ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:a7f6c078a89790d6ee06ed66975fbf5180d360efd6cd656173ba550e5c4ba085
+size 577789320

checkpoint-4000/optimizer.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:2eb1e8a9ed6ee3d9b101138a9aeb165d43e422a016f1ef54cedf8a7c4fdf8c6d
+size 1155772233

checkpoint-4000/rng_state.pth ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:fa285bbb0d5868c090a0912d03b0c8f9b6ffbfc0b058d94be0776891decf5ab7
+size 14244

checkpoint-4000/scaler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:05ebaa20c6824a9fdb798c4b9ced025fecb94428858b5fc9ab59b75a52f7019a
+size 988

checkpoint-4000/scheduler.pt ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:4783d1aad67332b882158dbf71f702c2c19d09ed6c5f6dbf2a69dcc433c36f68
+size 1064

checkpoint-4000/special_tokens_map.json ADDED Viewed

	@@ -0,0 +1,13 @@

+{
+  "bos_token": "<s>",
+  "eos_token": "</s>",
+  "mask_token": {
+    "content": "<mask>",
+    "lstrip": true,
+    "normalized": true,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<pad>",
+  "unk_token": "<unk>"
+}

checkpoint-4000/spm_char.model ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:7fcc48f3e225f627b1641db410ceb0c8649bd2b0c982e150b03f8be3728ab560
+size 238473

checkpoint-4000/tokenizer_config.json ADDED Viewed

	@@ -0,0 +1,64 @@

+{
+  "added_tokens_decoder": {
+    "0": {
+      "content": "<s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "1": {
+      "content": "<pad>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "2": {
+      "content": "</s>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "3": {
+      "content": "<unk>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "79": {
+      "content": "<mask>",
+      "lstrip": true,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "80": {
+      "content": "<ctc_blank>",
+      "lstrip": false,
+      "normalized": true,
+      "rstrip": false,
+      "single_word": false,
+      "special": false
+    }
+  },
+  "bos_token": "<s>",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "</s>",
+  "extra_special_tokens": {},
+  "mask_token": "<mask>",
+  "model_max_length": 600,
+  "normalize": false,
+  "pad_token": "<pad>",
+  "processor_class": "SpeechT5Processor",
+  "sp_model_kwargs": {},
+  "tokenizer_class": "SpeechT5Tokenizer",
+  "unk_token": "<unk>"
+}

checkpoint-4000/trainer_state.json ADDED Viewed

	@@ -0,0 +1,1185 @@

+{
+  "best_metric": 0.4465157091617584,
+  "best_model_checkpoint": "./speecht5_tts_common_voice_17_0_id/checkpoint-4000",
+  "epoch": 28.571428571428573,
+  "eval_steps": 1000,
+  "global_step": 4000,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.17857142857142858,
+      "grad_norm": 4.796061038970947,
+      "learning_rate": 4.6000000000000004e-07,
+      "loss": 1.0232,
+      "step": 25
+    },
+    {
+      "epoch": 0.35714285714285715,
+      "grad_norm": 6.88640022277832,
+      "learning_rate": 9.600000000000001e-07,
+      "loss": 0.9412,
+      "step": 50
+    },
+    {
+      "epoch": 0.5357142857142857,
+      "grad_norm": 4.282207489013672,
+      "learning_rate": 1.46e-06,
+      "loss": 0.8431,
+      "step": 75
+    },
+    {
+      "epoch": 0.7142857142857143,
+      "grad_norm": 4.095445156097412,
+      "learning_rate": 1.9600000000000003e-06,
+      "loss": 0.7959,
+      "step": 100
+    },
+    {
+      "epoch": 0.8928571428571429,
+      "grad_norm": 6.723930835723877,
+      "learning_rate": 2.46e-06,
+      "loss": 0.7825,
+      "step": 125
+    },
+    {
+      "epoch": 1.0714285714285714,
+      "grad_norm": 2.318833589553833,
+      "learning_rate": 2.96e-06,
+      "loss": 0.7967,
+      "step": 150
+    },
+    {
+      "epoch": 1.25,
+      "grad_norm": 2.1883444786071777,
+      "learning_rate": 3.46e-06,
+      "loss": 0.7826,
+      "step": 175
+    },
+    {
+      "epoch": 1.4285714285714286,
+      "grad_norm": 2.7793357372283936,
+      "learning_rate": 3.96e-06,
+      "loss": 0.7238,
+      "step": 200
+    },
+    {
+      "epoch": 1.6071428571428572,
+      "grad_norm": 3.0292282104492188,
+      "learning_rate": 4.4600000000000005e-06,
+      "loss": 0.6981,
+      "step": 225
+    },
+    {
+      "epoch": 1.7857142857142856,
+      "grad_norm": 4.8227314949035645,
+      "learning_rate": 4.960000000000001e-06,
+      "loss": 0.6753,
+      "step": 250
+    },
+    {
+      "epoch": 1.9642857142857144,
+      "grad_norm": 2.781235694885254,
+      "learning_rate": 5.460000000000001e-06,
+      "loss": 0.6337,
+      "step": 275
+    },
+    {
+      "epoch": 2.142857142857143,
+      "grad_norm": 2.9240171909332275,
+      "learning_rate": 5.9600000000000005e-06,
+      "loss": 0.6499,
+      "step": 300
+    },
+    {
+      "epoch": 2.3214285714285716,
+      "grad_norm": 2.0720555782318115,
+      "learning_rate": 6.460000000000001e-06,
+      "loss": 0.5995,
+      "step": 325
+    },
+    {
+      "epoch": 2.5,
+      "grad_norm": 3.025918483734131,
+      "learning_rate": 6.96e-06,
+      "loss": 0.6054,
+      "step": 350
+    },
+    {
+      "epoch": 2.678571428571429,
+      "grad_norm": 3.3047034740448,
+      "learning_rate": 7.4600000000000006e-06,
+      "loss": 0.5828,
+      "step": 375
+    },
+    {
+      "epoch": 2.857142857142857,
+      "grad_norm": 2.4087064266204834,
+      "learning_rate": 7.960000000000002e-06,
+      "loss": 0.5706,
+      "step": 400
+    },
+    {
+      "epoch": 3.0357142857142856,
+      "grad_norm": 2.7837984561920166,
+      "learning_rate": 8.46e-06,
+      "loss": 0.579,
+      "step": 425
+    },
+    {
+      "epoch": 3.2142857142857144,
+      "grad_norm": 1.7530593872070312,
+      "learning_rate": 8.96e-06,
+      "loss": 0.5455,
+      "step": 450
+    },
+    {
+      "epoch": 3.392857142857143,
+      "grad_norm": 2.3677515983581543,
+      "learning_rate": 9.460000000000001e-06,
+      "loss": 0.5557,
+      "step": 475
+    },
+    {
+      "epoch": 3.571428571428571,
+      "grad_norm": 2.445343494415283,
+      "learning_rate": 9.960000000000001e-06,
+      "loss": 0.5686,
+      "step": 500
+    },
+    {
+      "epoch": 3.75,
+      "grad_norm": 4.732877731323242,
+      "learning_rate": 9.934285714285715e-06,
+      "loss": 0.5635,
+      "step": 525
+    },
+    {
+      "epoch": 3.928571428571429,
+      "grad_norm": 4.45880126953125,
+      "learning_rate": 9.862857142857144e-06,
+      "loss": 0.5477,
+      "step": 550
+    },
+    {
+      "epoch": 4.107142857142857,
+      "grad_norm": 3.9657559394836426,
+      "learning_rate": 9.791428571428571e-06,
+      "loss": 0.5563,
+      "step": 575
+    },
+    {
+      "epoch": 4.285714285714286,
+      "grad_norm": 2.676309823989868,
+      "learning_rate": 9.72e-06,
+      "loss": 0.5221,
+      "step": 600
+    },
+    {
+      "epoch": 4.464285714285714,
+      "grad_norm": 2.89937686920166,
+      "learning_rate": 9.648571428571429e-06,
+      "loss": 0.5211,
+      "step": 625
+    },
+    {
+      "epoch": 4.642857142857143,
+      "grad_norm": 2.9824204444885254,
+      "learning_rate": 9.577142857142858e-06,
+      "loss": 0.5583,
+      "step": 650
+    },
+    {
+      "epoch": 4.821428571428571,
+      "grad_norm": 3.632369041442871,
+      "learning_rate": 9.505714285714287e-06,
+      "loss": 0.526,
+      "step": 675
+    },
+    {
+      "epoch": 5.0,
+      "grad_norm": 2.352837324142456,
+      "learning_rate": 9.434285714285714e-06,
+      "loss": 0.5211,
+      "step": 700
+    },
+    {
+      "epoch": 5.178571428571429,
+      "grad_norm": 1.3236348628997803,
+      "learning_rate": 9.362857142857143e-06,
+      "loss": 0.5173,
+      "step": 725
+    },
+    {
+      "epoch": 5.357142857142857,
+      "grad_norm": 1.8493444919586182,
+      "learning_rate": 9.291428571428572e-06,
+      "loss": 0.5094,
+      "step": 750
+    },
+    {
+      "epoch": 5.535714285714286,
+      "grad_norm": 1.7403544187545776,
+      "learning_rate": 9.220000000000002e-06,
+      "loss": 0.5239,
+      "step": 775
+    },
+    {
+      "epoch": 5.714285714285714,
+      "grad_norm": 4.10603666305542,
+      "learning_rate": 9.148571428571429e-06,
+      "loss": 0.5304,
+      "step": 800
+    },
+    {
+      "epoch": 5.892857142857143,
+      "grad_norm": 2.69100284576416,
+      "learning_rate": 9.077142857142858e-06,
+      "loss": 0.5224,
+      "step": 825
+    },
+    {
+      "epoch": 6.071428571428571,
+      "grad_norm": 1.956499695777893,
+      "learning_rate": 9.005714285714287e-06,
+      "loss": 0.5065,
+      "step": 850
+    },
+    {
+      "epoch": 6.25,
+      "grad_norm": 1.915540337562561,
+      "learning_rate": 8.934285714285716e-06,
+      "loss": 0.511,
+      "step": 875
+    },
+    {
+      "epoch": 6.428571428571429,
+      "grad_norm": 2.1903812885284424,
+      "learning_rate": 8.862857142857143e-06,
+      "loss": 0.5132,
+      "step": 900
+    },
+    {
+      "epoch": 6.607142857142857,
+      "grad_norm": 1.666169285774231,
+      "learning_rate": 8.791428571428572e-06,
+      "loss": 0.5362,
+      "step": 925
+    },
+    {
+      "epoch": 6.785714285714286,
+      "grad_norm": 1.6485190391540527,
+      "learning_rate": 8.720000000000001e-06,
+      "loss": 0.5115,
+      "step": 950
+    },
+    {
+      "epoch": 6.964285714285714,
+      "grad_norm": 1.7726221084594727,
+      "learning_rate": 8.64857142857143e-06,
+      "loss": 0.5183,
+      "step": 975
+    },
+    {
+      "epoch": 7.142857142857143,
+      "grad_norm": 2.7793469429016113,
+      "learning_rate": 8.577142857142858e-06,
+      "loss": 0.5133,
+      "step": 1000
+    },
+    {
+      "epoch": 7.142857142857143,
+      "eval_loss": 0.4698790907859802,
+      "eval_runtime": 10.706,
+      "eval_samples_per_second": 46.422,
+      "eval_steps_per_second": 5.885,
+      "step": 1000
+    },
+    {
+      "epoch": 7.321428571428571,
+      "grad_norm": 2.8019936084747314,
+      "learning_rate": 8.505714285714287e-06,
+      "loss": 0.518,
+      "step": 1025
+    },
+    {
+      "epoch": 7.5,
+      "grad_norm": 2.1961379051208496,
+      "learning_rate": 8.434285714285716e-06,
+      "loss": 0.5112,
+      "step": 1050
+    },
+    {
+      "epoch": 7.678571428571429,
+      "grad_norm": 2.5158090591430664,
+      "learning_rate": 8.362857142857143e-06,
+      "loss": 0.5091,
+      "step": 1075
+    },
+    {
+      "epoch": 7.857142857142857,
+      "grad_norm": 2.2158660888671875,
+      "learning_rate": 8.291428571428572e-06,
+      "loss": 0.5121,
+      "step": 1100
+    },
+    {
+      "epoch": 8.035714285714286,
+      "grad_norm": 2.8917131423950195,
+      "learning_rate": 8.220000000000001e-06,
+      "loss": 0.5134,
+      "step": 1125
+    },
+    {
+      "epoch": 8.214285714285714,
+      "grad_norm": 1.9233217239379883,
+      "learning_rate": 8.148571428571428e-06,
+      "loss": 0.5101,
+      "step": 1150
+    },
+    {
+      "epoch": 8.392857142857142,
+      "grad_norm": 2.437870979309082,
+      "learning_rate": 8.077142857142857e-06,
+      "loss": 0.5138,
+      "step": 1175
+    },
+    {
+      "epoch": 8.571428571428571,
+      "grad_norm": 1.7921634912490845,
+      "learning_rate": 8.005714285714286e-06,
+      "loss": 0.5155,
+      "step": 1200
+    },
+    {
+      "epoch": 8.75,
+      "grad_norm": 3.1069226264953613,
+      "learning_rate": 7.934285714285715e-06,
+      "loss": 0.5144,
+      "step": 1225
+    },
+    {
+      "epoch": 8.928571428571429,
+      "grad_norm": 1.7902675867080688,
+      "learning_rate": 7.862857142857143e-06,
+      "loss": 0.4973,
+      "step": 1250
+    },
+    {
+      "epoch": 9.107142857142858,
+      "grad_norm": 2.353273391723633,
+      "learning_rate": 7.791428571428572e-06,
+      "loss": 0.5035,
+      "step": 1275
+    },
+    {
+      "epoch": 9.285714285714286,
+      "grad_norm": 2.3287203311920166,
+      "learning_rate": 7.72e-06,
+      "loss": 0.5085,
+      "step": 1300
+    },
+    {
+      "epoch": 9.464285714285714,
+      "grad_norm": 1.6508110761642456,
+      "learning_rate": 7.64857142857143e-06,
+      "loss": 0.5116,
+      "step": 1325
+    },
+    {
+      "epoch": 9.642857142857142,
+      "grad_norm": 1.8232289552688599,
+      "learning_rate": 7.577142857142857e-06,
+      "loss": 0.5033,
+      "step": 1350
+    },
+    {
+      "epoch": 9.821428571428571,
+      "grad_norm": 2.0248517990112305,
+      "learning_rate": 7.505714285714286e-06,
+      "loss": 0.4974,
+      "step": 1375
+    },
+    {
+      "epoch": 10.0,
+      "grad_norm": 3.7484123706817627,
+      "learning_rate": 7.434285714285715e-06,
+      "loss": 0.4947,
+      "step": 1400
+    },
+    {
+      "epoch": 10.178571428571429,
+      "grad_norm": 1.793626308441162,
+      "learning_rate": 7.362857142857144e-06,
+      "loss": 0.5008,
+      "step": 1425
+    },
+    {
+      "epoch": 10.357142857142858,
+      "grad_norm": 1.8825795650482178,
+      "learning_rate": 7.291428571428571e-06,
+      "loss": 0.4965,
+      "step": 1450
+    },
+    {
+      "epoch": 10.535714285714286,
+      "grad_norm": 2.0584166049957275,
+      "learning_rate": 7.22e-06,
+      "loss": 0.4946,
+      "step": 1475
+    },
+    {
+      "epoch": 10.714285714285714,
+      "grad_norm": 3.3335680961608887,
+      "learning_rate": 7.148571428571429e-06,
+      "loss": 0.5048,
+      "step": 1500
+    },
+    {
+      "epoch": 10.892857142857142,
+      "grad_norm": 1.9972820281982422,
+      "learning_rate": 7.077142857142858e-06,
+      "loss": 0.5071,
+      "step": 1525
+    },
+    {
+      "epoch": 11.071428571428571,
+      "grad_norm": 2.2279226779937744,
+      "learning_rate": 7.0057142857142865e-06,
+      "loss": 0.4874,
+      "step": 1550
+    },
+    {
+      "epoch": 11.25,
+      "grad_norm": 2.168933868408203,
+      "learning_rate": 6.934285714285715e-06,
+      "loss": 0.5011,
+      "step": 1575
+    },
+    {
+      "epoch": 11.428571428571429,
+      "grad_norm": 3.186655044555664,
+      "learning_rate": 6.862857142857144e-06,
+      "loss": 0.4963,
+      "step": 1600
+    },
+    {
+      "epoch": 11.607142857142858,
+      "grad_norm": 2.6348812580108643,
+      "learning_rate": 6.791428571428572e-06,
+      "loss": 0.5007,
+      "step": 1625
+    },
+    {
+      "epoch": 11.785714285714286,
+      "grad_norm": 3.1159684658050537,
+      "learning_rate": 6.720000000000001e-06,
+      "loss": 0.4997,
+      "step": 1650
+    },
+    {
+      "epoch": 11.964285714285714,
+      "grad_norm": 4.068305492401123,
+      "learning_rate": 6.648571428571429e-06,
+      "loss": 0.4919,
+      "step": 1675
+    },
+    {
+      "epoch": 12.142857142857142,
+      "grad_norm": 2.315338134765625,
+      "learning_rate": 6.577142857142857e-06,
+      "loss": 0.4937,
+      "step": 1700
+    },
+    {
+      "epoch": 12.321428571428571,
+      "grad_norm": 1.5482977628707886,
+      "learning_rate": 6.505714285714286e-06,
+      "loss": 0.4964,
+      "step": 1725
+    },
+    {
+      "epoch": 12.5,
+      "grad_norm": 2.1527745723724365,
+      "learning_rate": 6.434285714285715e-06,
+      "loss": 0.494,
+      "step": 1750
+    },
+    {
+      "epoch": 12.678571428571429,
+      "grad_norm": 2.216703176498413,
+      "learning_rate": 6.3628571428571426e-06,
+      "loss": 0.4853,
+      "step": 1775
+    },
+    {
+      "epoch": 12.857142857142858,
+      "grad_norm": 2.939267873764038,
+      "learning_rate": 6.2914285714285716e-06,
+      "loss": 0.4978,
+      "step": 1800
+    },
+    {
+      "epoch": 13.035714285714286,
+      "grad_norm": 2.3067381381988525,
+      "learning_rate": 6.220000000000001e-06,
+      "loss": 0.5023,
+      "step": 1825
+    },
+    {
+      "epoch": 13.214285714285714,
+      "grad_norm": 2.2849552631378174,
+      "learning_rate": 6.14857142857143e-06,
+      "loss": 0.5013,
+      "step": 1850
+    },
+    {
+      "epoch": 13.392857142857142,
+      "grad_norm": 1.8568611145019531,
+      "learning_rate": 6.077142857142858e-06,
+      "loss": 0.4855,
+      "step": 1875
+    },
+    {
+      "epoch": 13.571428571428571,
+      "grad_norm": 2.784388542175293,
+      "learning_rate": 6.005714285714286e-06,
+      "loss": 0.4832,
+      "step": 1900
+    },
+    {
+      "epoch": 13.75,
+      "grad_norm": 1.718732237815857,
+      "learning_rate": 5.934285714285715e-06,
+      "loss": 0.4926,
+      "step": 1925
+    },
+    {
+      "epoch": 13.928571428571429,
+      "grad_norm": 2.3010714054107666,
+      "learning_rate": 5.862857142857143e-06,
+      "loss": 0.494,
+      "step": 1950
+    },
+    {
+      "epoch": 14.107142857142858,
+      "grad_norm": 2.0058493614196777,
+      "learning_rate": 5.791428571428572e-06,
+      "loss": 0.4901,
+      "step": 1975
+    },
+    {
+      "epoch": 14.285714285714286,
+      "grad_norm": 2.311893939971924,
+      "learning_rate": 5.72e-06,
+      "loss": 0.4774,
+      "step": 2000
+    },
+    {
+      "epoch": 14.285714285714286,
+      "eval_loss": 0.45390585064888,
+      "eval_runtime": 18.3883,
+      "eval_samples_per_second": 27.028,
+      "eval_steps_per_second": 3.426,
+      "step": 2000
+    },
+    {
+      "epoch": 14.464285714285714,
+      "grad_norm": 5.475688457489014,
+      "learning_rate": 5.6485714285714285e-06,
+      "loss": 0.479,
+      "step": 2025
+    },
+    {
+      "epoch": 14.642857142857142,
+      "grad_norm": 2.333171844482422,
+      "learning_rate": 5.5771428571428575e-06,
+      "loss": 0.487,
+      "step": 2050
+    },
+    {
+      "epoch": 14.821428571428571,
+      "grad_norm": 1.7914478778839111,
+      "learning_rate": 5.5057142857142865e-06,
+      "loss": 0.5042,
+      "step": 2075
+    },
+    {
+      "epoch": 15.0,
+      "grad_norm": 2.343949317932129,
+      "learning_rate": 5.4342857142857155e-06,
+      "loss": 0.4994,
+      "step": 2100
+    },
+    {
+      "epoch": 15.178571428571429,
+      "grad_norm": 2.7536513805389404,
+      "learning_rate": 5.362857142857143e-06,
+      "loss": 0.492,
+      "step": 2125
+    },
+    {
+      "epoch": 15.357142857142858,
+      "grad_norm": 3.5288944244384766,
+      "learning_rate": 5.291428571428572e-06,
+      "loss": 0.4878,
+      "step": 2150
+    },
+    {
+      "epoch": 15.535714285714286,
+      "grad_norm": 4.280928611755371,
+      "learning_rate": 5.220000000000001e-06,
+      "loss": 0.4908,
+      "step": 2175
+    },
+    {
+      "epoch": 15.714285714285714,
+      "grad_norm": 3.1674723625183105,
+      "learning_rate": 5.14857142857143e-06,
+      "loss": 0.4896,
+      "step": 2200
+    },
+    {
+      "epoch": 15.892857142857142,
+      "grad_norm": 1.4766712188720703,
+      "learning_rate": 5.077142857142857e-06,
+      "loss": 0.4891,
+      "step": 2225
+    },
+    {
+      "epoch": 16.071428571428573,
+      "grad_norm": 2.7163197994232178,
+      "learning_rate": 5.005714285714286e-06,
+      "loss": 0.4901,
+      "step": 2250
+    },
+    {
+      "epoch": 16.25,
+      "grad_norm": 2.2624833583831787,
+      "learning_rate": 4.934285714285715e-06,
+      "loss": 0.4841,
+      "step": 2275
+    },
+    {
+      "epoch": 16.428571428571427,
+      "grad_norm": 3.0063624382019043,
+      "learning_rate": 4.862857142857143e-06,
+      "loss": 0.4826,
+      "step": 2300
+    },
+    {
+      "epoch": 16.607142857142858,
+      "grad_norm": 1.5605120658874512,
+      "learning_rate": 4.7914285714285715e-06,
+      "loss": 0.4808,
+      "step": 2325
+    },
+    {
+      "epoch": 16.785714285714285,
+      "grad_norm": 1.8184423446655273,
+      "learning_rate": 4.7200000000000005e-06,
+      "loss": 0.4743,
+      "step": 2350
+    },
+    {
+      "epoch": 16.964285714285715,
+      "grad_norm": 1.490218162536621,
+      "learning_rate": 4.648571428571429e-06,
+      "loss": 0.4848,
+      "step": 2375
+    },
+    {
+      "epoch": 17.142857142857142,
+      "grad_norm": 2.210409641265869,
+      "learning_rate": 4.577142857142858e-06,
+      "loss": 0.4814,
+      "step": 2400
+    },
+    {
+      "epoch": 17.321428571428573,
+      "grad_norm": 1.8189564943313599,
+      "learning_rate": 4.505714285714286e-06,
+      "loss": 0.4749,
+      "step": 2425
+    },
+    {
+      "epoch": 17.5,
+      "grad_norm": 2.2493181228637695,
+      "learning_rate": 4.434285714285715e-06,
+      "loss": 0.4835,
+      "step": 2450
+    },
+    {
+      "epoch": 17.678571428571427,
+      "grad_norm": 2.454582452774048,
+      "learning_rate": 4.362857142857143e-06,
+      "loss": 0.4891,
+      "step": 2475
+    },
+    {
+      "epoch": 17.857142857142858,
+      "grad_norm": 2.0914249420166016,
+      "learning_rate": 4.291428571428572e-06,
+      "loss": 0.4774,
+      "step": 2500
+    },
+    {
+      "epoch": 18.035714285714285,
+      "grad_norm": 1.6150003671646118,
+      "learning_rate": 4.22e-06,
+      "loss": 0.4826,
+      "step": 2525
+    },
+    {
+      "epoch": 18.214285714285715,
+      "grad_norm": 2.94893217086792,
+      "learning_rate": 4.148571428571429e-06,
+      "loss": 0.4894,
+      "step": 2550
+    },
+    {
+      "epoch": 18.392857142857142,
+      "grad_norm": 1.913024663925171,
+      "learning_rate": 4.0771428571428574e-06,
+      "loss": 0.4784,
+      "step": 2575
+    },
+    {
+      "epoch": 18.571428571428573,
+      "grad_norm": 2.2716126441955566,
+      "learning_rate": 4.0057142857142864e-06,
+      "loss": 0.4709,
+      "step": 2600
+    },
+    {
+      "epoch": 18.75,
+      "grad_norm": 3.5856099128723145,
+      "learning_rate": 3.934285714285715e-06,
+      "loss": 0.4885,
+      "step": 2625
+    },
+    {
+      "epoch": 18.928571428571427,
+      "grad_norm": 4.390285015106201,
+      "learning_rate": 3.862857142857143e-06,
+      "loss": 0.4828,
+      "step": 2650
+    },
+    {
+      "epoch": 19.107142857142858,
+      "grad_norm": 3.690558910369873,
+      "learning_rate": 3.7914285714285722e-06,
+      "loss": 0.4862,
+      "step": 2675
+    },
+    {
+      "epoch": 19.285714285714285,
+      "grad_norm": 3.1892879009246826,
+      "learning_rate": 3.7200000000000004e-06,
+      "loss": 0.4798,
+      "step": 2700
+    },
+    {
+      "epoch": 19.464285714285715,
+      "grad_norm": 2.4511208534240723,
+      "learning_rate": 3.648571428571429e-06,
+      "loss": 0.4844,
+      "step": 2725
+    },
+    {
+      "epoch": 19.642857142857142,
+      "grad_norm": 1.642425537109375,
+      "learning_rate": 3.5771428571428576e-06,
+      "loss": 0.4845,
+      "step": 2750
+    },
+    {
+      "epoch": 19.821428571428573,
+      "grad_norm": 1.53347909450531,
+      "learning_rate": 3.505714285714286e-06,
+      "loss": 0.4821,
+      "step": 2775
+    },
+    {
+      "epoch": 20.0,
+      "grad_norm": 2.1212124824523926,
+      "learning_rate": 3.4342857142857143e-06,
+      "loss": 0.4756,
+      "step": 2800
+    },
+    {
+      "epoch": 20.178571428571427,
+      "grad_norm": 2.1033811569213867,
+      "learning_rate": 3.3628571428571433e-06,
+      "loss": 0.4729,
+      "step": 2825
+    },
+    {
+      "epoch": 20.357142857142858,
+      "grad_norm": 1.9785221815109253,
+      "learning_rate": 3.2914285714285715e-06,
+      "loss": 0.4783,
+      "step": 2850
+    },
+    {
+      "epoch": 20.535714285714285,
+      "grad_norm": 1.7057210206985474,
+      "learning_rate": 3.2200000000000005e-06,
+      "loss": 0.4728,
+      "step": 2875
+    },
+    {
+      "epoch": 20.714285714285715,
+      "grad_norm": 2.1187682151794434,
+      "learning_rate": 3.1485714285714287e-06,
+      "loss": 0.4765,
+      "step": 2900
+    },
+    {
+      "epoch": 20.892857142857142,
+      "grad_norm": 2.3613460063934326,
+      "learning_rate": 3.0771428571428573e-06,
+      "loss": 0.4696,
+      "step": 2925
+    },
+    {
+      "epoch": 21.071428571428573,
+      "grad_norm": 1.5449374914169312,
+      "learning_rate": 3.005714285714286e-06,
+      "loss": 0.4753,
+      "step": 2950
+    },
+    {
+      "epoch": 21.25,
+      "grad_norm": 1.9528214931488037,
+      "learning_rate": 2.9342857142857144e-06,
+      "loss": 0.4777,
+      "step": 2975
+    },
+    {
+      "epoch": 21.428571428571427,
+      "grad_norm": 1.8519726991653442,
+      "learning_rate": 2.8628571428571435e-06,
+      "loss": 0.4739,
+      "step": 3000
+    },
+    {
+      "epoch": 21.428571428571427,
+      "eval_loss": 0.44868698716163635,
+      "eval_runtime": 10.7576,
+      "eval_samples_per_second": 46.2,
+      "eval_steps_per_second": 5.856,
+      "step": 3000
+    },
+    {
+      "epoch": 21.607142857142858,
+      "grad_norm": 1.5077314376831055,
+      "learning_rate": 2.7914285714285716e-06,
+      "loss": 0.4723,
+      "step": 3025
+    },
+    {
+      "epoch": 21.785714285714285,
+      "grad_norm": 1.6296398639678955,
+      "learning_rate": 2.7200000000000002e-06,
+      "loss": 0.4775,
+      "step": 3050
+    },
+    {
+      "epoch": 21.964285714285715,
+      "grad_norm": 2.155275821685791,
+      "learning_rate": 2.648571428571429e-06,
+      "loss": 0.4777,
+      "step": 3075
+    },
+    {
+      "epoch": 22.142857142857142,
+      "grad_norm": 1.4826477766036987,
+      "learning_rate": 2.5771428571428574e-06,
+      "loss": 0.4778,
+      "step": 3100
+    },
+    {
+      "epoch": 22.321428571428573,
+      "grad_norm": 4.133993148803711,
+      "learning_rate": 2.5057142857142856e-06,
+      "loss": 0.4867,
+      "step": 3125
+    },
+    {
+      "epoch": 22.5,
+      "grad_norm": 1.8221015930175781,
+      "learning_rate": 2.4342857142857146e-06,
+      "loss": 0.4843,
+      "step": 3150
+    },
+    {
+      "epoch": 22.678571428571427,
+      "grad_norm": 2.3254904747009277,
+      "learning_rate": 2.362857142857143e-06,
+      "loss": 0.4816,
+      "step": 3175
+    },
+    {
+      "epoch": 22.857142857142858,
+      "grad_norm": 1.7816497087478638,
+      "learning_rate": 2.2914285714285718e-06,
+      "loss": 0.4698,
+      "step": 3200
+    },
+    {
+      "epoch": 23.035714285714285,
+      "grad_norm": 2.3238487243652344,
+      "learning_rate": 2.2200000000000003e-06,
+      "loss": 0.4951,
+      "step": 3225
+    },
+    {
+      "epoch": 23.214285714285715,
+      "grad_norm": 2.038130044937134,
+      "learning_rate": 2.148571428571429e-06,
+      "loss": 0.4853,
+      "step": 3250
+    },
+    {
+      "epoch": 23.392857142857142,
+      "grad_norm": 2.0773870944976807,
+      "learning_rate": 2.077142857142857e-06,
+      "loss": 0.4674,
+      "step": 3275
+    },
+    {
+      "epoch": 23.571428571428573,
+      "grad_norm": 1.8331812620162964,
+      "learning_rate": 2.0057142857142857e-06,
+      "loss": 0.4748,
+      "step": 3300
+    },
+    {
+      "epoch": 23.75,
+      "grad_norm": 2.034414291381836,
+      "learning_rate": 1.9342857142857143e-06,
+      "loss": 0.4761,
+      "step": 3325
+    },
+    {
+      "epoch": 23.928571428571427,
+      "grad_norm": 2.0720574855804443,
+      "learning_rate": 1.8628571428571429e-06,
+      "loss": 0.4714,
+      "step": 3350
+    },
+    {
+      "epoch": 24.107142857142858,
+      "grad_norm": 1.5996496677398682,
+      "learning_rate": 1.7914285714285715e-06,
+      "loss": 0.4741,
+      "step": 3375
+    },
+    {
+      "epoch": 24.285714285714285,
+      "grad_norm": 1.812302827835083,
+      "learning_rate": 1.72e-06,
+      "loss": 0.4761,
+      "step": 3400
+    },
+    {
+      "epoch": 24.464285714285715,
+      "grad_norm": 3.9967708587646484,
+      "learning_rate": 1.6485714285714289e-06,
+      "loss": 0.4659,
+      "step": 3425
+    },
+    {
+      "epoch": 24.642857142857142,
+      "grad_norm": 2.3776981830596924,
+      "learning_rate": 1.5771428571428574e-06,
+      "loss": 0.4826,
+      "step": 3450
+    },
+    {
+      "epoch": 24.821428571428573,
+      "grad_norm": 2.67183780670166,
+      "learning_rate": 1.5057142857142858e-06,
+      "loss": 0.4808,
+      "step": 3475
+    },
+    {
+      "epoch": 25.0,
+      "grad_norm": 2.5007424354553223,
+      "learning_rate": 1.4342857142857144e-06,
+      "loss": 0.4744,
+      "step": 3500
+    },
+    {
+      "epoch": 25.178571428571427,
+      "grad_norm": 3.58581280708313,
+      "learning_rate": 1.362857142857143e-06,
+      "loss": 0.4861,
+      "step": 3525
+    },
+    {
+      "epoch": 25.357142857142858,
+      "grad_norm": 2.0921339988708496,
+      "learning_rate": 1.2914285714285716e-06,
+      "loss": 0.472,
+      "step": 3550
+    },
+    {
+      "epoch": 25.535714285714285,
+      "grad_norm": 1.7422988414764404,
+      "learning_rate": 1.2200000000000002e-06,
+      "loss": 0.4747,
+      "step": 3575
+    },
+    {
+      "epoch": 25.714285714285715,
+      "grad_norm": 2.5243210792541504,
+      "learning_rate": 1.1485714285714286e-06,
+      "loss": 0.4826,
+      "step": 3600
+    },
+    {
+      "epoch": 25.892857142857142,
+      "grad_norm": 1.8407930135726929,
+      "learning_rate": 1.0771428571428574e-06,
+      "loss": 0.4757,
+      "step": 3625
+    },
+    {
+      "epoch": 26.071428571428573,
+      "grad_norm": 2.1124722957611084,
+      "learning_rate": 1.0057142857142857e-06,
+      "loss": 0.4749,
+      "step": 3650
+    },
+    {
+      "epoch": 26.25,
+      "grad_norm": 2.7014122009277344,
+      "learning_rate": 9.342857142857144e-07,
+      "loss": 0.4737,
+      "step": 3675
+    },
+    {
+      "epoch": 26.428571428571427,
+      "grad_norm": 1.5146933794021606,
+      "learning_rate": 8.628571428571429e-07,
+      "loss": 0.4704,
+      "step": 3700
+    },
+    {
+      "epoch": 26.607142857142858,
+      "grad_norm": 1.398466944694519,
+      "learning_rate": 7.914285714285715e-07,
+      "loss": 0.4732,
+      "step": 3725
+    },
+    {
+      "epoch": 26.785714285714285,
+      "grad_norm": 1.5718879699707031,
+      "learning_rate": 7.2e-07,
+      "loss": 0.4715,
+      "step": 3750
+    },
+    {
+      "epoch": 26.964285714285715,
+      "grad_norm": 2.2760274410247803,
+      "learning_rate": 6.485714285714287e-07,
+      "loss": 0.4803,
+      "step": 3775
+    },
+    {
+      "epoch": 27.142857142857142,
+      "grad_norm": 1.6266584396362305,
+      "learning_rate": 5.771428571428572e-07,
+      "loss": 0.4738,
+      "step": 3800
+    },
+    {
+      "epoch": 27.321428571428573,
+      "grad_norm": 1.7928359508514404,
+      "learning_rate": 5.057142857142858e-07,
+      "loss": 0.4699,
+      "step": 3825
+    },
+    {
+      "epoch": 27.5,
+      "grad_norm": 2.1646013259887695,
+      "learning_rate": 4.342857142857143e-07,
+      "loss": 0.4752,
+      "step": 3850
+    },
+    {
+      "epoch": 27.678571428571427,
+      "grad_norm": 2.122992515563965,
+      "learning_rate": 3.6285714285714283e-07,
+      "loss": 0.4791,
+      "step": 3875
+    },
+    {
+      "epoch": 27.857142857142858,
+      "grad_norm": 2.3135998249053955,
+      "learning_rate": 2.914285714285715e-07,
+      "loss": 0.4722,
+      "step": 3900
+    },
+    {
+      "epoch": 28.035714285714285,
+      "grad_norm": 1.7877129316329956,
+      "learning_rate": 2.2e-07,
+      "loss": 0.4617,
+      "step": 3925
+    },
+    {
+      "epoch": 28.214285714285715,
+      "grad_norm": 2.576960802078247,
+      "learning_rate": 1.4857142857142857e-07,
+      "loss": 0.4693,
+      "step": 3950
+    },
+    {
+      "epoch": 28.392857142857142,
+      "grad_norm": 2.0099828243255615,
+      "learning_rate": 7.714285714285715e-08,
+      "loss": 0.4713,
+      "step": 3975
+    },
+    {
+      "epoch": 28.571428571428573,
+      "grad_norm": 1.6247307062149048,
+      "learning_rate": 5.714285714285715e-09,
+      "loss": 0.4845,
+      "step": 4000
+    },
+    {
+      "epoch": 28.571428571428573,
+      "eval_loss": 0.4465157091617584,
+      "eval_runtime": 10.9109,
+      "eval_samples_per_second": 45.551,
+      "eval_steps_per_second": 5.774,
+      "step": 4000
+    }
+  ],
+  "logging_steps": 25,
+  "max_steps": 4000,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 29,
+  "save_steps": 1000,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.186346947223592e+16,
+  "train_batch_size": 16,
+  "trial_name": null,
+  "trial_params": null
+}

checkpoint-4000/training_args.bin ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:1a01e8c0a090b02699d5b506a30ffaf176234c63870a5a741f73db593b385337
+size 5560