mirror of
https://github.com/serp-ai/bark-with-voice-clone.git
synced 2025-12-16 11:48:09 +01:00
QoL updates
This commit is contained in:
@@ -9,13 +9,10 @@
|
|||||||
"from bark.generation import load_codec_model, generate_text_semantic\n",
|
"from bark.generation import load_codec_model, generate_text_semantic\n",
|
||||||
"from encodec.utils import convert_audio\n",
|
"from encodec.utils import convert_audio\n",
|
||||||
"\n",
|
"\n",
|
||||||
"from transformers import BertTokenizer\n",
|
|
||||||
"\n",
|
|
||||||
"import torchaudio\n",
|
"import torchaudio\n",
|
||||||
"import torch\n",
|
"import torch\n",
|
||||||
"\n",
|
"\n",
|
||||||
"model = load_codec_model(use_gpu=True)\n",
|
"model = load_codec_model(use_gpu=True)"
|
||||||
"tokenizer = BertTokenizer.from_pretrained(\"bert-base-multilingual-cased\")"
|
|
||||||
]
|
]
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
@@ -119,9 +116,15 @@
|
|||||||
"outputs": [],
|
"outputs": [],
|
||||||
"source": [
|
"source": [
|
||||||
"from bark.api import generate_audio\n",
|
"from bark.api import generate_audio\n",
|
||||||
|
"from transformers import BertTokenizer\n",
|
||||||
"from bark.generation import SAMPLE_RATE, preload_models, codec_decode, generate_coarse, generate_fine, generate_text_semantic\n",
|
"from bark.generation import SAMPLE_RATE, preload_models, codec_decode, generate_coarse, generate_fine, generate_text_semantic\n",
|
||||||
|
"\n",
|
||||||
|
"# Enter your prompt and speaker here\n",
|
||||||
"text_prompt = \"Hello, my name is Serpy. And, uh — and I like pizza. [laughs]\"\n",
|
"text_prompt = \"Hello, my name is Serpy. And, uh — and I like pizza. [laughs]\"\n",
|
||||||
"voice_name = \"speaker_0\" # use your custom voice name here if you have one"
|
"voice_name = \"speaker_0\" # use your custom voice name here if you have one\n",
|
||||||
|
"\n",
|
||||||
|
"# load the tokenizer\n",
|
||||||
|
"tokenizer = BertTokenizer.from_pretrained(\"bert-base-multilingual-cased\")"
|
||||||
]
|
]
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
|
|||||||
@@ -7,9 +7,15 @@
|
|||||||
"outputs": [],
|
"outputs": [],
|
||||||
"source": [
|
"source": [
|
||||||
"from bark.api import generate_audio\n",
|
"from bark.api import generate_audio\n",
|
||||||
|
"from transformers import BertTokenizer\n",
|
||||||
"from bark.generation import SAMPLE_RATE, preload_models, codec_decode, generate_coarse, generate_fine, generate_text_semantic\n",
|
"from bark.generation import SAMPLE_RATE, preload_models, codec_decode, generate_coarse, generate_fine, generate_text_semantic\n",
|
||||||
|
"\n",
|
||||||
|
"# Enter your prompt and speaker here\n",
|
||||||
"text_prompt = \"Hello, my name is Serpy. And, uh — and I like pizza. [laughs]\"\n",
|
"text_prompt = \"Hello, my name is Serpy. And, uh — and I like pizza. [laughs]\"\n",
|
||||||
"voice_name = \"speaker_0\" # use your custom voice name here if you have one"
|
"voice_name = \"speaker_0\" # use your custom voice name here if you have one\n",
|
||||||
|
"\n",
|
||||||
|
"# load the tokenizer\n",
|
||||||
|
"tokenizer = BertTokenizer.from_pretrained(\"bert-base-multilingual-cased\")"
|
||||||
]
|
]
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
|
|||||||
Reference in New Issue
Block a user