mrfakename commited on
Commit
304bc5c
1 Parent(s): b624c42

Sync from GitHub repo

Browse files

This Space is synced from the GitHub repo: https://github.com/SWivid/F5-TTS. Please submit contributions to the Space there

Files changed (1) hide show
  1. api.py +14 -2
api.py CHANGED
@@ -7,6 +7,9 @@ from model import DiT, UNetT
7
  from model.utils import save_spectrogram
8
 
9
  from model.utils_infer import load_vocoder, load_model, infer_process, remove_silence_for_generated_wav
 
 
 
10
 
11
 
12
  class F5TTS:
@@ -26,6 +29,7 @@ class F5TTS:
26
  self.n_mel_channels = 100
27
  self.hop_length = 256
28
  self.target_rms = 0.1
 
29
 
30
  # Set device
31
  self.device = device or (
@@ -56,11 +60,11 @@ class F5TTS:
56
  self.ema_model = load_model(model_cls, model_cfg, ckpt_file, vocab_file, ode_method, use_ema, self.device)
57
 
58
  def export_wav(self, wav, file_wave, remove_silence=False):
 
 
59
  if remove_silence:
60
  remove_silence_for_generated_wav(file_wave)
61
 
62
- sf.write(file_wave, wav, self.target_sample_rate)
63
-
64
  def export_spectrogram(self, spect, file_spect):
65
  save_spectrogram(spect, file_spect)
66
 
@@ -81,7 +85,12 @@ class F5TTS:
81
  remove_silence=False,
82
  file_wave=None,
83
  file_spect=None,
 
84
  ):
 
 
 
 
85
  wav, sr, spect = infer_process(
86
  ref_file,
87
  ref_text,
@@ -116,4 +125,7 @@ if __name__ == "__main__":
116
  gen_text="""I don't really care what you call me. I've been a silent spectator, watching species evolve, empires rise and fall. But always remember, I am mighty and enduring. Respect me and I'll nurture you; ignore me and you shall face the consequences.""",
117
  file_wave="tests/out.wav",
118
  file_spect="tests/out.png",
 
119
  )
 
 
 
7
  from model.utils import save_spectrogram
8
 
9
  from model.utils_infer import load_vocoder, load_model, infer_process, remove_silence_for_generated_wav
10
+ from model.utils import seed_everything
11
+ import random
12
+ import sys
13
 
14
 
15
  class F5TTS:
 
29
  self.n_mel_channels = 100
30
  self.hop_length = 256
31
  self.target_rms = 0.1
32
+ self.seed = -1
33
 
34
  # Set device
35
  self.device = device or (
 
60
  self.ema_model = load_model(model_cls, model_cfg, ckpt_file, vocab_file, ode_method, use_ema, self.device)
61
 
62
  def export_wav(self, wav, file_wave, remove_silence=False):
63
+ sf.write(file_wave, wav, self.target_sample_rate)
64
+
65
  if remove_silence:
66
  remove_silence_for_generated_wav(file_wave)
67
 
 
 
68
  def export_spectrogram(self, spect, file_spect):
69
  save_spectrogram(spect, file_spect)
70
 
 
85
  remove_silence=False,
86
  file_wave=None,
87
  file_spect=None,
88
+ seed=-1,
89
  ):
90
+ if seed == -1:
91
+ seed = random.randint(0, sys.maxsize)
92
+ seed_everything(seed)
93
+ self.seed = seed
94
  wav, sr, spect = infer_process(
95
  ref_file,
96
  ref_text,
 
125
  gen_text="""I don't really care what you call me. I've been a silent spectator, watching species evolve, empires rise and fall. But always remember, I am mighty and enduring. Respect me and I'll nurture you; ignore me and you shall face the consequences.""",
126
  file_wave="tests/out.wav",
127
  file_spect="tests/out.png",
128
+ seed=-1, # random seed = -1
129
  )
130
+
131
+ print("seed :", f5tts.seed)