Upload 9 files
Browse files- .gitattributes +1 -0
- V2_10_epoches_BEST/Finished_model_files.zip +3 -0
- V2_10_epoches_BEST/Finished_model_files/config.json +159 -0
- V2_10_epoches_BEST/Finished_model_files/dataset.zip +3 -0
- V2_10_epoches_BEST/Finished_model_files/model.pth +3 -0
- V2_10_epoches_BEST/Finished_model_files/vocab.json +0 -0
- V2_10_epoches_BEST/Finished_model_files/vocab.json_ +0 -0
- V2_10_epoches_BEST/dataset.zip +3 -0
- V2_10_epoches_BEST/generated_output.wav +0 -0
- V2_10_epoches_BEST/ref.wav +3 -0
    	
        .gitattributes
    CHANGED
    
    | @@ -35,3 +35,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text | |
| 35 | 
             
            *tfevents* filter=lfs diff=lfs merge=lfs -text
         | 
| 36 | 
             
            Glory[[:space:]]Days：[[:space:]]Stories[[:space:]]by[[:space:]]Simon[[:space:]]Rich[[:space:]]·[[:space:]]Audiobook[[:space:]]preview[[:space:]]\[oOBLfNTtWNQ\].mp3 filter=lfs diff=lfs merge=lfs -text
         | 
| 37 | 
             
            V1_10Epoches/ref.wav filter=lfs diff=lfs merge=lfs -text
         | 
|  | 
|  | |
| 35 | 
             
            *tfevents* filter=lfs diff=lfs merge=lfs -text
         | 
| 36 | 
             
            Glory[[:space:]]Days：[[:space:]]Stories[[:space:]]by[[:space:]]Simon[[:space:]]Rich[[:space:]]·[[:space:]]Audiobook[[:space:]]preview[[:space:]]\[oOBLfNTtWNQ\].mp3 filter=lfs diff=lfs merge=lfs -text
         | 
| 37 | 
             
            V1_10Epoches/ref.wav filter=lfs diff=lfs merge=lfs -text
         | 
| 38 | 
            +
            V2_10_epoches_BEST/ref.wav filter=lfs diff=lfs merge=lfs -text
         | 
    	
        V2_10_epoches_BEST/Finished_model_files.zip
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:68bca750165ee9e439d819afcea069971b083999d34ed886489057da496224e8
         | 
| 3 | 
            +
            size 1842606552
         | 
    	
        V2_10_epoches_BEST/Finished_model_files/config.json
    ADDED
    
    | @@ -0,0 +1,159 @@ | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            {
         | 
| 2 | 
            +
                "output_path": "output",
         | 
| 3 | 
            +
                "logger_uri": null,
         | 
| 4 | 
            +
                "run_name": "run",
         | 
| 5 | 
            +
                "project_name": null,
         | 
| 6 | 
            +
                "run_description": "\ud83d\udc38Coqui trainer run.",
         | 
| 7 | 
            +
                "print_step": 25,
         | 
| 8 | 
            +
                "plot_step": 100,
         | 
| 9 | 
            +
                "model_param_stats": false,
         | 
| 10 | 
            +
                "wandb_entity": null,
         | 
| 11 | 
            +
                "dashboard_logger": "tensorboard",
         | 
| 12 | 
            +
                "save_on_interrupt": true,
         | 
| 13 | 
            +
                "log_model_step": null,
         | 
| 14 | 
            +
                "save_step": 10000,
         | 
| 15 | 
            +
                "save_n_checkpoints": 5,
         | 
| 16 | 
            +
                "save_checkpoints": true,
         | 
| 17 | 
            +
                "save_all_best": false,
         | 
| 18 | 
            +
                "save_best_after": 10000,
         | 
| 19 | 
            +
                "target_loss": null,
         | 
| 20 | 
            +
                "print_eval": false,
         | 
| 21 | 
            +
                "test_delay_epochs": 0,
         | 
| 22 | 
            +
                "run_eval": true,
         | 
| 23 | 
            +
                "run_eval_steps": null,
         | 
| 24 | 
            +
                "distributed_backend": "nccl",
         | 
| 25 | 
            +
                "distributed_url": "tcp://localhost:54321",
         | 
| 26 | 
            +
                "mixed_precision": false,
         | 
| 27 | 
            +
                "precision": "fp16",
         | 
| 28 | 
            +
                "epochs": 1000,
         | 
| 29 | 
            +
                "batch_size": 32,
         | 
| 30 | 
            +
                "eval_batch_size": 16,
         | 
| 31 | 
            +
                "grad_clip": 0.0,
         | 
| 32 | 
            +
                "scheduler_after_epoch": true,
         | 
| 33 | 
            +
                "lr": 0.001,
         | 
| 34 | 
            +
                "optimizer": "radam",
         | 
| 35 | 
            +
                "optimizer_params": null,
         | 
| 36 | 
            +
                "lr_scheduler": null,
         | 
| 37 | 
            +
                "lr_scheduler_params": {},
         | 
| 38 | 
            +
                "use_grad_scaler": false,
         | 
| 39 | 
            +
                "allow_tf32": false,
         | 
| 40 | 
            +
                "cudnn_enable": true,
         | 
| 41 | 
            +
                "cudnn_deterministic": false,
         | 
| 42 | 
            +
                "cudnn_benchmark": false,
         | 
| 43 | 
            +
                "training_seed": 54321,
         | 
| 44 | 
            +
                "model": "xtts",
         | 
| 45 | 
            +
                "num_loader_workers": 0,
         | 
| 46 | 
            +
                "num_eval_loader_workers": 0,
         | 
| 47 | 
            +
                "use_noise_augment": false,
         | 
| 48 | 
            +
                "audio": {
         | 
| 49 | 
            +
                    "sample_rate": 22050,
         | 
| 50 | 
            +
                    "output_sample_rate": 24000
         | 
| 51 | 
            +
                },
         | 
| 52 | 
            +
                "use_phonemes": false,
         | 
| 53 | 
            +
                "phonemizer": null,
         | 
| 54 | 
            +
                "phoneme_language": null,
         | 
| 55 | 
            +
                "compute_input_seq_cache": false,
         | 
| 56 | 
            +
                "text_cleaner": null,
         | 
| 57 | 
            +
                "enable_eos_bos_chars": false,
         | 
| 58 | 
            +
                "test_sentences_file": "",
         | 
| 59 | 
            +
                "phoneme_cache_path": null,
         | 
| 60 | 
            +
                "characters": null,
         | 
| 61 | 
            +
                "add_blank": false,
         | 
| 62 | 
            +
                "batch_group_size": 0,
         | 
| 63 | 
            +
                "loss_masking": null,
         | 
| 64 | 
            +
                "min_audio_len": 1,
         | 
| 65 | 
            +
                "max_audio_len": Infinity,
         | 
| 66 | 
            +
                "min_text_len": 1,
         | 
| 67 | 
            +
                "max_text_len": Infinity,
         | 
| 68 | 
            +
                "compute_f0": false,
         | 
| 69 | 
            +
                "compute_energy": false,
         | 
| 70 | 
            +
                "compute_linear_spec": false,
         | 
| 71 | 
            +
                "precompute_num_workers": 0,
         | 
| 72 | 
            +
                "start_by_longest": false,
         | 
| 73 | 
            +
                "shuffle": false,
         | 
| 74 | 
            +
                "drop_last": false,
         | 
| 75 | 
            +
                "datasets": [
         | 
| 76 | 
            +
                    {
         | 
| 77 | 
            +
                        "formatter": "",
         | 
| 78 | 
            +
                        "dataset_name": "",
         | 
| 79 | 
            +
                        "path": "",
         | 
| 80 | 
            +
                        "meta_file_train": "",
         | 
| 81 | 
            +
                        "ignored_speakers": null,
         | 
| 82 | 
            +
                        "language": "",
         | 
| 83 | 
            +
                        "phonemizer": "",
         | 
| 84 | 
            +
                        "meta_file_val": "",
         | 
| 85 | 
            +
                        "meta_file_attn_mask": ""
         | 
| 86 | 
            +
                    }
         | 
| 87 | 
            +
                ],
         | 
| 88 | 
            +
                "test_sentences": [],
         | 
| 89 | 
            +
                "eval_split_max_size": null,
         | 
| 90 | 
            +
                "eval_split_size": 0.01,
         | 
| 91 | 
            +
                "use_speaker_weighted_sampler": false,
         | 
| 92 | 
            +
                "speaker_weighted_sampler_alpha": 1.0,
         | 
| 93 | 
            +
                "use_language_weighted_sampler": false,
         | 
| 94 | 
            +
                "language_weighted_sampler_alpha": 1.0,
         | 
| 95 | 
            +
                "use_length_weighted_sampler": false,
         | 
| 96 | 
            +
                "length_weighted_sampler_alpha": 1.0,
         | 
| 97 | 
            +
                "model_args": {
         | 
| 98 | 
            +
                    "gpt_batch_size": 1,
         | 
| 99 | 
            +
                    "enable_redaction": false,
         | 
| 100 | 
            +
                    "kv_cache": true,
         | 
| 101 | 
            +
                    "gpt_checkpoint": null,
         | 
| 102 | 
            +
                    "clvp_checkpoint": null,
         | 
| 103 | 
            +
                    "decoder_checkpoint": null,
         | 
| 104 | 
            +
                    "num_chars": 255,
         | 
| 105 | 
            +
                    "tokenizer_file": "",
         | 
| 106 | 
            +
                    "gpt_max_audio_tokens": 605,
         | 
| 107 | 
            +
                    "gpt_max_text_tokens": 402,
         | 
| 108 | 
            +
                    "gpt_max_prompt_tokens": 70,
         | 
| 109 | 
            +
                    "gpt_layers": 30,
         | 
| 110 | 
            +
                    "gpt_n_model_channels": 1024,
         | 
| 111 | 
            +
                    "gpt_n_heads": 16,
         | 
| 112 | 
            +
                    "gpt_number_text_tokens": 6681,
         | 
| 113 | 
            +
                    "gpt_start_text_token": null,
         | 
| 114 | 
            +
                    "gpt_stop_text_token": null,
         | 
| 115 | 
            +
                    "gpt_num_audio_tokens": 1026,
         | 
| 116 | 
            +
                    "gpt_start_audio_token": 1024,
         | 
| 117 | 
            +
                    "gpt_stop_audio_token": 1025,
         | 
| 118 | 
            +
                    "gpt_code_stride_len": 1024,
         | 
| 119 | 
            +
                    "gpt_use_masking_gt_prompt_approach": true,
         | 
| 120 | 
            +
                    "gpt_use_perceiver_resampler": true,
         | 
| 121 | 
            +
                    "input_sample_rate": 22050,
         | 
| 122 | 
            +
                    "output_sample_rate": 24000,
         | 
| 123 | 
            +
                    "output_hop_length": 256,
         | 
| 124 | 
            +
                    "decoder_input_dim": 1024,
         | 
| 125 | 
            +
                    "d_vector_dim": 512,
         | 
| 126 | 
            +
                    "cond_d_vector_in_each_upsampling_layer": true,
         | 
| 127 | 
            +
                    "duration_const": 102400
         | 
| 128 | 
            +
                },
         | 
| 129 | 
            +
                "model_dir": null,
         | 
| 130 | 
            +
                "languages": [
         | 
| 131 | 
            +
                    "en",
         | 
| 132 | 
            +
                    "es",
         | 
| 133 | 
            +
                    "fr",
         | 
| 134 | 
            +
                    "de",
         | 
| 135 | 
            +
                    "it",
         | 
| 136 | 
            +
                    "pt",
         | 
| 137 | 
            +
                    "pl",
         | 
| 138 | 
            +
                    "tr",
         | 
| 139 | 
            +
                    "ru",
         | 
| 140 | 
            +
                    "nl",
         | 
| 141 | 
            +
                    "cs",
         | 
| 142 | 
            +
                    "ar",
         | 
| 143 | 
            +
                    "zh-cn",
         | 
| 144 | 
            +
                    "hu",
         | 
| 145 | 
            +
                    "ko",
         | 
| 146 | 
            +
                    "ja",
         | 
| 147 | 
            +
                    "hi"
         | 
| 148 | 
            +
                ],
         | 
| 149 | 
            +
                "temperature": 0.75,
         | 
| 150 | 
            +
                "length_penalty": 1.0,
         | 
| 151 | 
            +
                "repetition_penalty": 5.0,
         | 
| 152 | 
            +
                "top_k": 50,
         | 
| 153 | 
            +
                "top_p": 0.85,
         | 
| 154 | 
            +
                "num_gpt_outputs": 1,
         | 
| 155 | 
            +
                "gpt_cond_len": 30,
         | 
| 156 | 
            +
                "gpt_cond_chunk_len": 4,
         | 
| 157 | 
            +
                "max_ref_len": 30,
         | 
| 158 | 
            +
                "sound_norm_refs": false
         | 
| 159 | 
            +
            }
         | 
    	
        V2_10_epoches_BEST/Finished_model_files/dataset.zip
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:89d24c8c24bc3841d83ca2d1d721b9dde87ba4a592a114dcced545968e58dd2d
         | 
| 3 | 
            +
            size 110231783
         | 
    	
        V2_10_epoches_BEST/Finished_model_files/model.pth
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:5f8db4ed5378d504c1212dd0ff63cb3fb8785b8567cabb5724849f6ed701b6eb
         | 
| 3 | 
            +
            size 1868275926
         | 
    	
        V2_10_epoches_BEST/Finished_model_files/vocab.json
    ADDED
    
    | The diff for this file is too large to render. 
		See raw diff | 
|  | 
    	
        V2_10_epoches_BEST/Finished_model_files/vocab.json_
    ADDED
    
    | The diff for this file is too large to render. 
		See raw diff | 
|  | 
    	
        V2_10_epoches_BEST/dataset.zip
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:89d24c8c24bc3841d83ca2d1d721b9dde87ba4a592a114dcced545968e58dd2d
         | 
| 3 | 
            +
            size 110231783
         | 
    	
        V2_10_epoches_BEST/generated_output.wav
    ADDED
    
    | Binary file (419 kB). View file | 
|  | 
    	
        V2_10_epoches_BEST/ref.wav
    ADDED
    
    | @@ -0,0 +1,3 @@ | |
|  | |
|  | |
|  | 
|  | |
| 1 | 
            +
            version https://git-lfs.github.com/spec/v1
         | 
| 2 | 
            +
            oid sha256:7f605584ae157c40e54e8b8145267a290da705704f1e731a190ac4033dca7263
         | 
| 3 | 
            +
            size 3433040
         | 
