From 31cd81809578c60c17f14906cee2b2d00159e185 Mon Sep 17 00:00:00 2001 From: SWivid Date: Tue, 3 Jun 2025 21:23:47 +0800 Subject: [PATCH] formatting --- src/f5_tts/infer/SHARED.md | 23 ++++++++++++----------- src/f5_tts/train/finetune_gradio.py | 4 ++-- 2 files changed, 14 insertions(+), 13 deletions(-) diff --git a/src/f5_tts/infer/SHARED.md b/src/f5_tts/infer/SHARED.md index fc8f87d..90d3dd4 100644 --- a/src/f5_tts/infer/SHARED.md +++ b/src/f5_tts/infer/SHARED.md @@ -22,6 +22,8 @@ - [F5-TTS Base @ fi @ AsmoKoskinen](#f5-tts-base--fi--asmokoskinen) - [French](#french) - [F5-TTS Base @ fr @ RASPIAUDIO](#f5-tts-base--fr--raspiaudio) +- [German](#german) + - [F5-TTS Base @ de @ hvoss-techfak](#f5-tts-base--de--hvoss-techfak) - [Hindi](#hindi) - [F5-TTS Small @ hi @ SPRINGLab](#f5-tts-small--hi--springlab) - [Italian](#italian) @@ -33,8 +35,6 @@ - [F5-TTS Base @ ru @ HotDro4illa](#f5-tts-base--ru--hotdro4illa) - [Spanish](#spanish) - [F5-TTS Base @ es @ jpgallegoar](#f5-tts-base--es--jpgallegoar) -- [German](#german) - - [F5-TTS Base @ de @ hvoss-techfak](#f5-tts-base--de--hvoss-techfak) ## Multilingual @@ -99,6 +99,16 @@ Config: {"dim": 1024, "depth": 22, "heads": 16, "ff_mult": 2, "text_dim": 512, " - [Discussion about this training can be found here](https://github.com/SWivid/F5-TTS/issues/434). +## German + +#### F5-TTS Base @ de @ hvoss-techfak +|Model|🤗Hugging Face|Data (Hours)|Model License| +|:---:|:------------:|:-----------:|:-------------:| +|F5-TTS Base|[ckpt & vocab](https://huggingface.co/hvoss-techfak/F5-TTS-German)|[Mozilla Common Voice 19.0](https://commonvoice.mozilla.org/en/datasets) & 800 hours Crowdsourced |cc-by-nc-4.0| + +- Finetuned by [@hvoss-techfak](https://github.com/hvoss-techfak) + + ## Hindi #### F5-TTS Small @ hi @ SPRINGLab @@ -175,12 +185,3 @@ Config: {"dim": 1024, "depth": 22, "heads": 16, "ff_mult": 2, "text_dim": 512, " |F5-TTS Base|[ckpt & vocab](https://huggingface.co/jpgallegoar/F5-Spanish)|[Voxpopuli](https://huggingface.co/datasets/facebook/voxpopuli) & Crowdsourced & TEDx, 218 hours|cc0-1.0| - @jpgallegoar [GitHub repo](https://github.com/jpgallegoar/Spanish-F5), Jupyter Notebook and Gradio usage for Spanish model. - -## German - -#### F5-TTS Base @ de @ hvoss-techfak -|Model|🤗Hugging Face|Data (Hours)|Model License| -|:---:|:------------:|:-----------:|:-------------:| -|F5-TTS Base|[ckpt & vocab](https://huggingface.co/hvoss-techfak/F5-TTS-German)|[Mozilla Common Voice 19.0](https://commonvoice.mozilla.org/en/datasets) & 800 hours Crowdsourced |cc-by-nc-4.0| - -- Finetuned by [@hvoss-techfak](https://github.com/hvoss-techfak) diff --git a/src/f5_tts/train/finetune_gradio.py b/src/f5_tts/train/finetune_gradio.py index 7400add..e990673 100644 --- a/src/f5_tts/train/finetune_gradio.py +++ b/src/f5_tts/train/finetune_gradio.py @@ -434,7 +434,7 @@ def start_training( fp16 = "" cmd = ( - f"accelerate launch {fp16} \"{file_train}\" --exp_name {exp_name}" + f'accelerate launch {fp16} "{file_train}" --exp_name {exp_name}' f" --learning_rate {learning_rate}" f" --batch_size_per_gpu {batch_size_per_gpu}" f" --batch_size_type {batch_size_type}" @@ -453,7 +453,7 @@ def start_training( cmd += " --finetune" if file_checkpoint_train != "": - cmd += f" --pretrain \"{file_checkpoint_train}\"" + cmd += f' --pretrain "{file_checkpoint_train}"' if tokenizer_file != "": cmd += f" --tokenizer_path {tokenizer_file}"