Skip to content
This repository was archived by the owner on Feb 8, 2025. It is now read-only.

Add Italian tokenizer support #108

Open
wants to merge 2 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
1 change: 1 addition & 0 deletions .gitignore
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,7 @@ __pycache__/
*.wav
*.npy
.vs/
.idea/
/models
/bark_ui_enhanced.egg-info
/build/lib/bark
Expand Down
3 changes: 3 additions & 0 deletions bark/hubert/hubert_manager.py
Original file line number Diff line number Diff line change
Expand Up @@ -42,6 +42,9 @@ def make_sure_tokenizer_installed(model: str = 'quantifier_hubert_base_ls960_14.
elif tokenizer_lang == 'pl':
repo = 'Hobis/bark-voice-cloning-polish-HuBERT-quantizer'
model = 'polish-HuBERT-quantizer_8_epoch.pth'
elif tokenizer_lang == 'it':
repo = 'gpwr/bark-it-tokenizer'
model = 'it_tokenizer.pth'
else:
raise 'Unknown Tokenizer Language!'
print(f'{local_file} not found. Downloading HuBERT custom tokenizer')
Expand Down
6 changes: 3 additions & 3 deletions webui.py
Original file line number Diff line number Diff line change
Expand Up @@ -61,12 +61,12 @@ def generate_text_to_speech(text, selected_speaker, text_temp, waveform_temp, eo
use_last_generation_as_history = "Use last generation as history" in complete_settings
save_last_generation = "Save generation as Voice" in complete_settings
for l in range(batchcount):
currentseed = seed
currentseed = int(seed)
if seed != None and seed > 2**32 - 1:
logger.warning(f"Seed {seed} > 2**32 - 1 (max), setting to random")
currentseed = None
if currentseed == None or currentseed <= 0:
currentseed = np.random.default_rng().integers(1, 2**32 - 1)
currentseed = int(np.random.default_rng().integers(1, 2**32 - 1))
assert(0 < currentseed and currentseed < 2**32)

progress(0, desc="Generating")
Expand Down Expand Up @@ -260,7 +260,7 @@ def create_version_html():
preload_models()

available_themes = ["Default", "gradio/glass", "gradio/monochrome", "gradio/seafoam", "gradio/soft", "gstaff/xkcd", "freddyaboulton/dracula_revamped", "ysharma/steampunk"]
tokenizer_language_list = ["de","en", "es", "pl"]
tokenizer_language_list = ["en", "de", "es", "pl", "it"]
prepare_training_list = ["Step 1: Semantics from Text","Step 2: WAV from Semantics"]

seed = -1
Expand Down