Spaces:
				
			
			
	
			
			
		Runtime error
		
	
	
	
			
			
	
	
	
	
		
		
		Runtime error
		
	Sync from GitHub repo
Browse files — This Space is synced from the GitHub repo: https://github.com/SWivid/F5-TTS. Please submit contributions to the Space there.
    	
        pyproject.toml
    CHANGED
    
    | @@ -4,7 +4,7 @@ build-backend = "setuptools.build_meta" | |
| 4 |  | 
| 5 | 
             
            [project]
         | 
| 6 | 
             
            name = "f5-tts"
         | 
| 7 | 
            -
            version = "0.2. | 
| 8 | 
             
            description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
         | 
| 9 | 
             
            readme = "README.md"
         | 
| 10 | 
             
            license = {text = "MIT License"}
         | 
|  | |
| 4 |  | 
| 5 | 
             
            [project]
         | 
| 6 | 
             
            name = "f5-tts"
         | 
| 7 | 
            +
            version = "0.2.1"
         | 
| 8 | 
             
            description = "F5-TTS: A Fairytaler that Fakes Fluent and Faithful Speech with Flow Matching"
         | 
| 9 | 
             
            readme = "README.md"
         | 
| 10 | 
             
            license = {text = "MIT License"}
         | 
    	
        src/f5_tts/configs/E2TTS_Base_train.yaml
    CHANGED
    
    | @@ -33,8 +33,9 @@ model: | |
| 33 | 
             
                win_length: 1024
         | 
| 34 | 
             
                n_fft: 1024
         | 
| 35 | 
             
                mel_spec_type: vocos  # 'vocos' or 'bigvgan'
         | 
| 36 | 
            -
             | 
| 37 | 
            -
                 | 
|  | |
| 38 |  | 
| 39 | 
             
            ckpts:
         | 
| 40 | 
             
              logger: wandb  # wandb | tensorboard | None
         | 
|  | |
| 33 | 
             
                win_length: 1024
         | 
| 34 | 
             
                n_fft: 1024
         | 
| 35 | 
             
                mel_spec_type: vocos  # 'vocos' or 'bigvgan'
         | 
| 36 | 
            +
              vocoder:
         | 
| 37 | 
            +
                is_local: False  # use local offline ckpt or not
         | 
| 38 | 
            +
                local_path: None  # local vocoder path
         | 
| 39 |  | 
| 40 | 
             
            ckpts:
         | 
| 41 | 
             
              logger: wandb  # wandb | tensorboard | None
         | 
    	
        src/f5_tts/configs/E2TTS_Small_train.yaml
    CHANGED
    
    | @@ -33,8 +33,9 @@ model: | |
| 33 | 
             
                win_length: 1024
         | 
| 34 | 
             
                n_fft: 1024
         | 
| 35 | 
             
                mel_spec_type: vocos  # 'vocos' or 'bigvgan'
         | 
| 36 | 
            -
             | 
| 37 | 
            -
                 | 
|  | |
| 38 |  | 
| 39 | 
             
            ckpts:
         | 
| 40 | 
             
              logger: wandb  # wandb | tensorboard | None
         | 
|  | |
| 33 | 
             
                win_length: 1024
         | 
| 34 | 
             
                n_fft: 1024
         | 
| 35 | 
             
                mel_spec_type: vocos  # 'vocos' or 'bigvgan'
         | 
| 36 | 
            +
              vocoder:
         | 
| 37 | 
            +
                is_local: False  # use local offline ckpt or not
         | 
| 38 | 
            +
                local_path: None  # local vocoder path
         | 
| 39 |  | 
| 40 | 
             
            ckpts:
         | 
| 41 | 
             
              logger: wandb  # wandb | tensorboard | None
         | 
    	
        src/f5_tts/configs/F5TTS_Base_train.yaml
    CHANGED
    
    | @@ -35,8 +35,9 @@ model: | |
| 35 | 
             
                win_length: 1024
         | 
| 36 | 
             
                n_fft: 1024
         | 
| 37 | 
             
                mel_spec_type: vocos  # 'vocos' or 'bigvgan'
         | 
| 38 | 
            -
             | 
| 39 | 
            -
                 | 
|  | |
| 40 |  | 
| 41 | 
             
            ckpts:
         | 
| 42 | 
             
              logger: wandb  # wandb | tensorboard | None
         | 
|  | |
| 35 | 
             
                win_length: 1024
         | 
| 36 | 
             
                n_fft: 1024
         | 
| 37 | 
             
                mel_spec_type: vocos  # 'vocos' or 'bigvgan'
         | 
| 38 | 
            +
              vocoder:
         | 
| 39 | 
            +
                is_local: False  # use local offline ckpt or not
         | 
| 40 | 
            +
                local_path: None  # local vocoder path
         | 
| 41 |  | 
| 42 | 
             
            ckpts:
         | 
| 43 | 
             
              logger: wandb  # wandb | tensorboard | None
         | 
    	
        src/f5_tts/configs/F5TTS_Small_train.yaml
    CHANGED
    
    | @@ -35,8 +35,9 @@ model: | |
| 35 | 
             
                win_length: 1024
         | 
| 36 | 
             
                n_fft: 1024
         | 
| 37 | 
             
                mel_spec_type: vocos  # 'vocos' or 'bigvgan'
         | 
| 38 | 
            -
             | 
| 39 | 
            -
                 | 
|  | |
| 40 |  | 
| 41 | 
             
            ckpts:
         | 
| 42 | 
             
              logger: wandb  # wandb | tensorboard | None
         | 
|  | |
| 35 | 
             
                win_length: 1024
         | 
| 36 | 
             
                n_fft: 1024
         | 
| 37 | 
             
                mel_spec_type: vocos  # 'vocos' or 'bigvgan'
         | 
| 38 | 
            +
              vocoder:
         | 
| 39 | 
            +
                is_local: False  # use local offline ckpt or not
         | 
| 40 | 
            +
                local_path: None  # local vocoder path
         | 
| 41 |  | 
| 42 | 
             
            ckpts:
         | 
| 43 | 
             
              logger: wandb  # wandb | tensorboard | None
         | 
    	
        src/f5_tts/train/train.py
    CHANGED
    
    | @@ -59,8 +59,8 @@ def main(cfg): | |
| 59 | 
             
                    log_samples=True,
         | 
| 60 | 
             
                    bnb_optimizer=cfg.optim.bnb_optimizer,
         | 
| 61 | 
             
                    mel_spec_type=mel_spec_type,
         | 
| 62 | 
            -
                    is_local_vocoder=cfg.model. | 
| 63 | 
            -
                    local_vocoder_path=cfg.model. | 
| 64 | 
             
                )
         | 
| 65 |  | 
| 66 | 
             
                train_dataset = load_dataset(cfg.datasets.name, tokenizer, mel_spec_kwargs=cfg.model.mel_spec)
         | 
|  | |
| 59 | 
             
                    log_samples=True,
         | 
| 60 | 
             
                    bnb_optimizer=cfg.optim.bnb_optimizer,
         | 
| 61 | 
             
                    mel_spec_type=mel_spec_type,
         | 
| 62 | 
            +
                    is_local_vocoder=cfg.model.vocoder.is_local,
         | 
| 63 | 
            +
                    local_vocoder_path=cfg.model.vocoder.local_path,
         | 
| 64 | 
             
                )
         | 
| 65 |  | 
| 66 | 
             
                train_dataset = load_dataset(cfg.datasets.name, tokenizer, mel_spec_kwargs=cfg.model.mel_spec)
         | 
