Skip to content

Commit 62d9842

Browse files
authored Aug 8, 2023
Tortoise and MBD improvements (rsxdalv#118)
1 parent 8f7543f commit 62d9842

File tree

5 files changed

+15
-3
lines changed

5 files changed

+15
-3
lines changed
 

‎README.md

+10
Original file line number | Diff line number | Diff line change
@@ -34,6 +34,16 @@ Google Colab demo: [![Open In Colab](https://colab.research.google.com/assets/co
3434
https://rsxdalv.github.io/bark-speaker-directory/
3535

3636
## Changelog
37+
Aug 8:
38+
* Update AudioCraft, improving MultiBandDiffusion performance
39+
* Fix Tortoise parameter 'cond_free' mismatch with 'ultra_fast' preset
40+
41+
Aug 7:
42+
* Add Tortoise DeepSpeed fix to Colab
43+
44+
Aug 6:
45+
* Fix audiogen + mbd error, add tortoise fix for colab
46+
3747
Aug 4:
3848
* Add MultiBandDiffusion option to MusicGen https://github.com/rsxdalv/tts-generation-webui/pull/109
3949
* MusicGen/AudioGen save tokens on generation as .npz files.

‎requirements_audiocraft.txt

+1-1
Original file line number | Diff line number | Diff line change
@@ -1,2 +1,2 @@
11
# audiocraft==0.0.1 # MIT License
2-
audiocraft @ git+https://git@github.com/facebookresearch/audiocraft@c5157b5bf14bf83449c17ea1eeb66c19fb4bc7f0#egg=audiocraft # MIT License
2+
audiocraft @ git+https://git@github.com/facebookresearch/audiocraft@d6df4f0fff69a69299c5883fae4a4d6d7b8a7948#egg=audiocraft # MIT License

‎server.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -35,7 +35,7 @@ def reload_config_and_restart_ui():
3535
title="TTS Generation WebUI",
3636
analytics_enabled=False, # it broke too many times
3737
) as demo:
38-
gr.Markdown("# TTS Generation WebUI (Bark, MusicGen, Tortoise, RVC)")
38+
gr.Markdown("# TTS Generation WebUI (Bark, MusicGen + AudioGen, Tortoise, RVC)")
3939
with Joutai.singleton.tabs:
4040
from src.tortoise.generation_tab_tortoise import generation_tab_tortoise
4141
from src.settings_tab_gradio import settings_tab_gradio

‎src/tortoise/diffusion_params.py

+1-1
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,7 @@ def diffusion_params():
66
iterations = gr.Slider(
77
label="Diffusion Iterations", value=30, minimum=4, maximum=400, step=1
88
)
9-
cond_free = gr.Checkbox(label="Cond Free", value=True)
9+
cond_free = gr.Checkbox(label="Cond Free", value=False)
1010
cond_free_k = gr.Slider(
1111
label="Cond Free K", value=2, minimum=0, maximum=10, step=1
1212
)

‎src/tortoise/gen_tortoise.py

+2
Original file line number | Diff line number | Diff line change
@@ -70,6 +70,7 @@ def get_tts(
7070
kv_cache=False,
7171
use_deepspeed=False,
7272
half=False,
73+
device=None,
7374
):
7475
global MODEL
7576
if MODEL is None or force_reload:
@@ -79,6 +80,7 @@ def get_tts(
7980
kv_cache=kv_cache,
8081
use_deepspeed=use_deepspeed,
8182
half=half,
83+
device=device,
8284
)
8385
return MODEL
8486

0 commit comments

Comments
 (0)