Biorrith committed on
Commit
d08c04c
·
1 Parent(s): 6737d99

Set new standard voices

Browse files
Files changed (4) hide show
  1. .gitattributes +1 -0
  2. app.py +23 -2
  3. samples/mic_trimmed.wav +3 -0
  4. samples/nic_trimmed.wav +3 -0
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
 
 
33
  *.zip filter=lfs diff=lfs merge=lfs -text
34
  *.zst filter=lfs diff=lfs merge=lfs -text
35
  *tfevents* filter=lfs diff=lfs merge=lfs -text
36
+ *.wav filter=lfs diff=lfs merge=lfs -text
app.py CHANGED
@@ -97,23 +97,38 @@ def generate(
97
  return (MODEL.sr, wav.squeeze(0).cpu().numpy())
98
 
99
 
 
 
 
 
 
 
 
 
100
  with gr.Blocks(title="Chatterbox Turbo") as demo:
101
  gr.Markdown("# ⚡ Chatterbox Turbo")
102
 
103
  with gr.Row():
104
  with gr.Column():
105
  text = gr.Textbox(
106
- value="Oh, that's hilarious! [chuckle] Um anyway, we do have a new model in store. It's the SkyNet T-800 series and it's got basically everything. Including AI integration with ChatGPT and all that jazz. Would you like me to get some prices for you?",
107
  label="Text to synthesize (max chars 300)",
108
  max_lines=5,
109
  elem_id="main_textbox"
110
  )
111
 
 
 
 
 
 
 
 
112
  ref_wav = gr.Audio(
113
  sources=["upload", "microphone"],
114
  type="filepath",
115
  label="Reference Audio File",
116
- value="https://storage.googleapis.com/chatterbox-demo-samples/turbo/2.wav",
117
  )
118
 
119
  run_btn = gr.Button("Generate ⚡", variant="primary")
@@ -130,6 +145,12 @@ with gr.Blocks(title="Chatterbox Turbo") as demo:
130
  min_p = gr.Slider(0.00, 1.00, step=0.01, label="Min P (Set to 0 to disable)", value=0.00)
131
  norm_loudness = gr.Checkbox(value=True, label="Normalize Loudness (-27 LUFS)")
132
 
 
 
 
 
 
 
133
  run_btn.click(
134
  fn=generate,
135
  inputs=[
 
97
  return (MODEL.sr, wav.squeeze(0).cpu().numpy())
98
 
99
 
100
+ VOICE_OPTIONS = {
101
+ "mic": "samples/mic_trimmed.wav",
102
+ "nic": "samples/nic_trimmed.wav"
103
+ }
104
+
105
+ def update_ref_audio(voice_name):
106
+ return VOICE_OPTIONS.get(voice_name, list(VOICE_OPTIONS.values())[0])
107
+
108
  with gr.Blocks(title="Chatterbox Turbo") as demo:
109
  gr.Markdown("# ⚡ Chatterbox Turbo")
110
 
111
  with gr.Row():
112
  with gr.Column():
113
  text = gr.Textbox(
114
+ value="København er Danmarks hovedstad og ligger øerne Sjælland og Amager, hvor mange turister besøger de smukke kanaler og historiske bygninger.",
115
  label="Text to synthesize (max chars 300)",
116
  max_lines=5,
117
  elem_id="main_textbox"
118
  )
119
 
120
+ voice = gr.Dropdown(
121
+ choices=list(VOICE_OPTIONS.keys()),
122
+ value="mic",
123
+ label="Voice Selection",
124
+ info="Choose a voice or upload your own below"
125
+ )
126
+
127
  ref_wav = gr.Audio(
128
  sources=["upload", "microphone"],
129
  type="filepath",
130
  label="Reference Audio File",
131
+ value=VOICE_OPTIONS["mic"],
132
  )
133
 
134
  run_btn = gr.Button("Generate ⚡", variant="primary")
 
145
  min_p = gr.Slider(0.00, 1.00, step=0.01, label="Min P (Set to 0 to disable)", value=0.00)
146
  norm_loudness = gr.Checkbox(value=True, label="Normalize Loudness (-27 LUFS)")
147
 
148
+ voice.change(
149
+ fn=update_ref_audio,
150
+ inputs=[voice],
151
+ outputs=[ref_wav],
152
+ )
153
+
154
  run_btn.click(
155
  fn=generate,
156
  inputs=[
samples/mic_trimmed.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:9b33d20de00571adcb1b02bb6601d65c47c8013985652ac54239f7dc0e7d19c0
3
+ size 1461102
samples/nic_trimmed.wav ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6026bc4e1ef0ec9d8e6d49b601fb7960023a545577685fd556be23387ff6b462
3
+ size 1555332