fix paths
- .gitignore +1 -2
- tortoise/models/arch_util.py +1 -1
- tortoise/read.py +1 -1
- tortoise/utils/audio.py +2 -2
- tortoise/utils/tokenizer.py +1 -1
.gitignore CHANGED
@@ -129,7 +129,6 @@ dmypy.json
 .pyre/
 
 .idea/*
-
-tortoise/random_voices/*
+.models/*
 .custom/*
 results/*
tortoise/models/arch_util.py CHANGED
@@ -290,7 +290,7 @@ class AudioMiniEncoder(nn.Module):
 
 class TorchMelSpectrogram(nn.Module):
     def __init__(self, filter_length=1024, hop_length=256, win_length=1024, n_mel_channels=80, mel_fmin=0, mel_fmax=8000,
-                 sampling_rate=22050, normalize=False, mel_norm_file='data/mel_norms.pth'):
+                 sampling_rate=22050, normalize=False, mel_norm_file='tortoise/data/mel_norms.pth'):
         super().__init__()
         # These are the default tacotron values for the MEL spectrogram.
         self.filter_length = filter_length
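The new default still resolves against the process's working directory, so it assumes the interpreter is launched from the repository root. A minimal sketch of an alternative, not part of this change, that resolves the file against the module's own location; the helper name default_data_path is hypothetical:

# Sketch only, not part of this change: resolve the data file relative to the
# module so the default works regardless of the current working directory.
# `default_data_path` is a hypothetical helper name.
import os

def default_data_path(filename):
    # arch_util.py lives in tortoise/models/, so data/ sits one directory up.
    module_dir = os.path.dirname(os.path.abspath(__file__))
    return os.path.join(module_dir, '..', 'data', filename)

# e.g. mel_norm_file=default_data_path('mel_norms.pth')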
tortoise/read.py CHANGED
@@ -28,7 +28,7 @@ def split_and_recombine_text(texts, desired_length=200, max_len=300):
 
 if __name__ == '__main__':
     parser = argparse.ArgumentParser()
-    parser.add_argument('--textfile', type=str, help='A file containing the text to read.', default="data/riding_hood.txt")
+    parser.add_argument('--textfile', type=str, help='A file containing the text to read.', default="tortoise/data/riding_hood.txt")
     parser.add_argument('--voice', type=str, help='Selects the voice to use for generation. See options in voices/ directory (and add your own!) '
                                                   'Use the & character to join two voices together. Use a comma to perform inference on multiple voices.', default='pat')
     parser.add_argument('--output_path', type=str, help='Where to store outputs.', default='../results/longform/')
tortoise/utils/audio.py CHANGED
@@ -82,10 +82,10 @@ def dynamic_range_decompression(x, C=1):
 
 
 def get_voices():
-    subs = os.listdir('voices')
+    subs = os.listdir('tortoise/voices')
     voices = {}
     for sub in subs:
-        subj = os.path.join('voices', sub)
+        subj = os.path.join('tortoise/voices', sub)
         if os.path.isdir(subj):
             voices[sub] = list(glob(f'{subj}/*.wav')) + list(glob(f'{subj}/*.mp3')) + list(glob(f'{subj}/*.pth'))
     return voices
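get_voices() now hard-codes 'tortoise/voices', which again assumes the repository root as the working directory. A hedged sketch of an equivalent function that takes the directory as a parameter instead; the voices_dir argument is an illustration, not from this change:

# Sketch only, not from this change: accept the voices directory as a parameter
# instead of hard-coding it; behavior otherwise mirrors get_voices() above.
import os
from glob import glob

def get_voices(voices_dir='tortoise/voices'):
    voices = {}
    for sub in os.listdir(voices_dir):
        subj = os.path.join(voices_dir, sub)
        if os.path.isdir(subj):
            # A voice is a folder of reference clips (.wav/.mp3) or saved latents (.pth).
            voices[sub] = glob(f'{subj}/*.wav') + glob(f'{subj}/*.mp3') + glob(f'{subj}/*.pth')
    return voices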
tortoise/utils/tokenizer.py CHANGED
@@ -164,7 +164,7 @@ def lev_distance(s1, s2):
     return distances[-1]
 
 class VoiceBpeTokenizer:
-    def __init__(self, vocab_file='data/tokenizer.json'):
+    def __init__(self, vocab_file='tortoise/data/tokenizer.json'):
         if vocab_file is not None:
             self.tokenizer = Tokenizer.from_file(vocab_file)
 
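With the new default, VoiceBpeTokenizer() only finds the vocab when run from the repository root; callers elsewhere can pass the path explicitly. A brief usage sketch, assuming the class's encode() method from the rest of this file; the absolute path is a placeholder:

# Usage sketch: pass vocab_file explicitly when the working directory is not
# the repository root. The absolute path below is a placeholder.
from tortoise.utils.tokenizer import VoiceBpeTokenizer

tok = VoiceBpeTokenizer(vocab_file='/path/to/tortoise/data/tokenizer.json')
ids = tok.encode("Hello world.")  # token ids for the cleaned text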