my_utils.py

import ffmpeg
import numpy as np

# import praatio
# import praatio.praat_scripts
import os
import sys

import random

import csv

# Command name of the stftpitchshift executable for each supported platform,
# keyed by the value reported in ``sys.platform``.
platform_stft_mapping = dict(
    linux="stftpitchshift",
    darwin="stftpitchshift",
    win32="stftpitchshift.exe",
)

# Executable to invoke on the current platform; None when ``sys.platform``
# has no entry in the table above.
stft = (
    platform_stft_mapping[sys.platform]
    if sys.platform in platform_stft_mapping
    else None
)
# praatEXE = join('.',os.path.abspath(os.getcwd()) + r"\Praat.exe")


def CSVutil(file, rw, type, *args):
    """Read or write a one-row CSV settings file.

    Args:
        file: Path of the CSV file.
        rw: ``"r"`` to read a ``"formanting"`` file; any other value is
            passed to ``open()`` as the mode used for writing. For
            ``type == "stop"`` the value is always used as the write mode.
        type: ``"formanting"`` or ``"stop"``. Any other value is a no-op.
            (The name shadows the builtin but is kept for compatibility
            with existing callers.)
        *args: Values to write. For ``"formanting"``: the formant flag
            (default ``False``), quefrency (default ``1.0``) and timbre
            (default ``1.0``). For ``"stop"``: the stop flag (default
            ``False``).

    Returns:
        For a ``"formanting"`` read, a 3-tuple with the first three fields
        of the first row, as strings. ``None`` in every other case.

    Raises:
        ValueError: On a ``"formanting"`` read when the file has no rows.
        IndexError: On a ``"formanting"`` read when the first row has fewer
            than three fields.
    """
    if type == "formanting":
        if rw == "r":
            # newline="" lets the csv module do its own newline handling.
            with open(file, newline="") as csv_in:
                rows = list(csv.reader(csv_in))
            # list() never yields None, so emptiness is the real "no data"
            # condition that has to be checked here.
            if not rows:
                raise ValueError("No data")
            first_row = rows[0]
            return (first_row[0], first_row[1], first_row[2])

        doformnt = args[0] if args else False
        qfr = args[1] if len(args) > 1 else 1.0
        tmb = args[2] if len(args) > 2 else 1.0
        with open(file, rw, newline="") as csv_out:
            csv.writer(csv_out, delimiter=",").writerow([doformnt, qfr, tmb])
    elif type == "stop":
        stop = args[0] if args else False
        with open(file, rw, newline="") as csv_out:
            csv.writer(csv_out, delimiter=",").writerow([stop])


def _decode_to_f32le(path, sr):
    """Decode ``path`` via the ffmpeg CLI to mono 32-bit float PCM at ``sr`` Hz.

    Returns the raw bytes ffmpeg wrote to stdout.
    """
    # https://github.com/openai/whisper/blob/main/whisper/audio.py#L26
    # This launches a subprocess to decode audio while down-mixing and
    # resampling as necessary. Requires the ffmpeg CLI and the
    # `ffmpeg-python` package to be installed.
    pcm, _ = (
        ffmpeg.input(path, threads=0)
        .output("-", format="f32le", acodec="pcm_f32le", ac=1, ar=sr)
        .run(cmd=["ffmpeg", "-nostdin"], capture_stdout=True, capture_stderr=True)
    )
    return pcm


def _remove_temp_file(path, failure_message):
    """Best-effort delete of ``path``; print ``failure_message`` if it fails."""
    try:
        os.remove(path)
    except FileNotFoundError:
        # The file was never produced (an earlier step failed); nothing to do.
        pass
    except OSError:
        print(failure_message)


def load_audio(file, sr, DoFormant, Quefrency, Timbre):
    """Load an audio file as a mono float32 waveform, optionally formant-shifted.

    The formant settings are read from ``csvdb/formanting.csv`` on every call
    and override the ``DoFormant``, ``Quefrency`` and ``Timbre`` arguments,
    which are kept in the signature for compatibility with existing callers.

    When formant shifting is enabled, the input is first converted to wav
    with ffmpeg if its name does not end in ``.wav`` (unless ``<file>.wav``
    already exists), then processed by the platform's stftpitchshift
    executable into a temporary ``<wav>FORMANTED_<random>.wav`` file, which is
    decoded and deleted. A wav created by this call is deleted as well.

    Args:
        file: Path to the audio file. Surrounding spaces, double quotes and
            newlines are stripped.
        sr: Target sample rate passed to ffmpeg.
        DoFormant: Ignored; replaced by the value stored in the CSV file.
        Quefrency: Ignored; replaced by the value stored in the CSV file.
        Timbre: Ignored; replaced by the value stored in the CSV file.

    Returns:
        A 1-D ``numpy.float32`` array built from ffmpeg's decoded output.

    Raises:
        RuntimeError: If any step of conversion, shifting or decoding fails.
        ValueError, IndexError, OSError: Propagated from ``CSVutil`` when the
            settings file is missing, empty or malformed.
    """
    # Local import: only this function needs it, and it keeps the edit
    # independent of the module's import block.
    import subprocess

    DoFormant, Quefrency, Timbre = CSVutil("csvdb/formanting.csv", "r", "formanting")

    converted_wav = None  # wav created by this call from a non-wav input
    shifted_wav = None  # temporary output of the formant shifter
    try:
        # Guard against users pasting a path with leading/trailing spaces,
        # double quotes or newlines.
        file = file.strip(" ").strip('"').strip("\n").strip('"').strip(" ")

        # The CSV stores the flag as text: "true"/"false" (any case) map to
        # booleans, anything else falls back to string truthiness.
        setting = DoFormant.lower()
        if setting == "true":
            do_formant = True
        elif setting == "false":
            do_formant = False
        else:
            do_formant = bool(DoFormant)

        if not do_formant:
            out = _decode_to_f32le(file, sr)
        else:
            if stft is None:
                raise RuntimeError(
                    "no stftpitchshift executable is configured for this platform"
                )

            wav_path = file if file.endswith(".wav") else f"{file}.wav"
            if wav_path != file and not os.path.isfile(wav_path):
                # Mark for cleanup before running so a partial file left by a
                # failed conversion is removed too.
                converted_wav = wav_path
                (
                    ffmpeg.input(file, threads=0)
                    .output(wav_path)
                    .run(
                        cmd=["ffmpeg", "-nostdin"],
                        capture_stdout=True,
                        capture_stderr=True,
                    )
                )

            print(f" · Formanting {wav_path}...\n")

            # Random suffix keeps concurrent/batch runs on the same input
            # from writing to the same temporary file name.
            numerator = round(random.uniform(1, 4), 4)
            shifted_wav = "%sFORMANTED_%s.wav" % (wav_path, str(numerator))

            # Argument list instead of a shell string: paths containing
            # quotes or shell metacharacters are passed through verbatim.
            subprocess.run(
                [
                    stft,
                    "-i",
                    wav_path,
                    "-q",
                    str(Quefrency),
                    "-t",
                    str(Timbre),
                    "-o",
                    shifted_wav,
                ],
                check=True,
            )

            print(f" · Formanted {wav_path}!\n")

            out = _decode_to_f32le(shifted_wav, sr)
    except Exception as e:
        raise RuntimeError(f"Failed to load audio: {e}") from e
    finally:
        # Clean up temporaries on both success and failure.
        if shifted_wav is not None:
            _remove_temp_file(shifted_wav, "couldn't remove formanted type of file")
        if converted_wav is not None:
            _remove_temp_file(converted_wav, "couldn't remove converted type of file")

    return np.frombuffer(out, np.float32).flatten()
删除无用文件，增加--colab启动选项 2023-04-01 15:02:53 +08:00			`import ffmpeg`
			`import numpy as np`
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00
			`# import praatio`
			`# import praatio.praat_scripts`
Tweaked files upload and replace 2023-07-21 20:36:54 +07:00			`import os`
linux 2023-07-27 11:04:45 +07:00			`import sys`

stftpshift overhaul + fixes fixed cli traceback + implemented formant shifting fixed batch conversion 2023-07-26 06:24:23 +07:00			`import random`
Reformat and rewrite _get_name_params (#57) * Reformat * rewrite _get_name_params * Add workflow for automatic formatting * Revert "Add workflow for automatic formatting" This reverts commit 9111c5dbc1830248305fb075587a88be07ad3115. * revert Retrieval_based_Voice_Conversion_WebUI.ipynb --------- Co-authored-by: 源文雨 <41315874+fumiama@users.noreply.github.com> 2023-04-15 20:44:24 +09:00
sqldatastorage to csv 2023-07-29 00:23:52 +07:00			`import csv`
data storage overhaul switched from storing data in txt to sqlite3. no more formant.txt and stop.txt! all of the data from sql database is stored in memory of PC. 2023-07-25 05:53:47 +07:00
linux 2023-07-27 11:04:45 +07:00			`platform_stft_mapping = {`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`"linux": "stftpitchshift",`
			`"darwin": "stftpitchshift",`
			`"win32": "stftpitchshift.exe",`
linux 2023-07-27 11:04:45 +07:00			`}`
data storage overhaul switched from storing data in txt to sqlite3. no more formant.txt and stop.txt! all of the data from sql database is stored in memory of PC. 2023-07-25 05:53:47 +07:00
linux 2023-07-27 11:04:45 +07:00			`stft = platform_stft_mapping.get(sys.platform)`
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00			`# praatEXE = join('.',os.path.abspath(os.getcwd()) + r"\Praat.exe")`

Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
sqldatastorage to csv 2023-07-29 00:23:52 +07:00			`def CSVutil(file, rw, type, *args):`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`if type == "formanting":`
			`if rw == "r":`
sqldatastorage to csv 2023-07-29 00:23:52 +07:00			`with open(file) as fileCSVread:`
			`csv_reader = list(csv.reader(fileCSVread))`
			`return (`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`(csv_reader[0][0], csv_reader[0][1], csv_reader[0][2])`
			`if csv_reader is not None`
			`else (lambda: exec('raise ValueError("No data")'))()`
			`)`
sqldatastorage to csv 2023-07-29 00:23:52 +07:00			`else:`
			`if args:`
			`doformnt = args[0]`
			`else:`
			`doformnt = False`
			`qfr = args[1] if len(args) > 1 else 1.0`
			`tmb = args[2] if len(args) > 2 else 1.0`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`with open(file, rw, newline="") as fileCSVwrite:`
			`csv_writer = csv.writer(fileCSVwrite, delimiter=",")`
sqldatastorage to csv 2023-07-29 00:23:52 +07:00			`csv_writer.writerow([doformnt, qfr, tmb])`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`elif type == "stop":`
sqldatastorage to csv 2023-07-29 00:23:52 +07:00			`stop = args[0] if args else False`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`with open(file, rw, newline="") as fileCSVwrite:`
			`csv_writer = csv.writer(fileCSVwrite, delimiter=",")`
sqldatastorage to csv 2023-07-29 00:23:52 +07:00			`csv_writer.writerow([stop])`
Reformat and rewrite _get_name_params (#57) * Reformat * rewrite _get_name_params * Add workflow for automatic formatting * Revert "Add workflow for automatic formatting" This reverts commit 9111c5dbc1830248305fb075587a88be07ad3115. * revert Retrieval_based_Voice_Conversion_WebUI.ipynb --------- Co-authored-by: 源文雨 <41315874+fumiama@users.noreply.github.com> 2023-04-15 20:44:24 +09:00
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
Tweaked files upload and replace 2023-07-21 20:36:54 +07:00			`def load_audio(file, sr, DoFormant, Quefrency, Timbre):`
fixed non-formant inference 2023-07-26 23:01:10 +07:00			`converted = False`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`DoFormant, Quefrency, Timbre = CSVutil("csvdb/formanting.csv", "r", "formanting")`
Add files via upload 2023-03-31 17:54:38 +08:00			`try:`
			`# https://github.com/openai/whisper/blob/main/whisper/audio.py#L26`
			`# This launches a subprocess to decode audio while down-mixing and resampling as necessary.`
			# Requires the ffmpeg CLI and `ffmpeg-python` package to be installed.
Reformat and rewrite _get_name_params (#57) * Reformat * rewrite _get_name_params * Add workflow for automatic formatting * Revert "Add workflow for automatic formatting" This reverts commit 9111c5dbc1830248305fb075587a88be07ad3115. * revert Retrieval_based_Voice_Conversion_WebUI.ipynb --------- Co-authored-by: 源文雨 <41315874+fumiama@users.noreply.github.com> 2023-04-15 20:44:24 +09:00			`file = (`
			`file.strip(" ").strip('"').strip("\n").strip('"').strip(" ")`
			`) # 防止小白拷路径头尾带了空格和"和回车`
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00			`file_formanted = file.strip(" ").strip('"').strip("\n").strip('"').strip(" ")`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
			`# print(f"dofor={bool(DoFormant)} timbr={Timbre} quef={Quefrency}\n")`

			`if (`
			`lambda DoFormant: True`
			`if DoFormant.lower() == "true"`
			`else (False if DoFormant.lower() == "false" else DoFormant)`
			`)(DoFormant):`
			`numerator = round(random.uniform(1, 4), 4)`
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00			`# os.system(f"stftpitchshift -i {file} -q {Quefrency} -t {Timbre} -o {file_formanted}")`
			`# print('stftpitchshift -i "%s" -p 1.0 --rms -w 128 -v 8 -q %s -t %s -o "%s"' % (file, Quefrency, Timbre, file_formanted))`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
formanting fix now formanting accepts any audio, not just wavs. done with ffmpeg conversion. 2023-07-25 00:23:56 +07:00			`if not file.endswith(".wav"):`
stftpshift overhaul + fixes fixed cli traceback + implemented formant shifting fixed batch conversion 2023-07-26 06:24:23 +07:00			`if not os.path.isfile(f"{file_formanted}.wav"):`
fixed non-formant inference 2023-07-26 23:01:10 +07:00			`converted = True`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`# print(f"\nfile = {file}\n")`
			`# print(f"\nfile_formanted = {file_formanted}\n")`
stftpshift overhaul + fixes fixed cli traceback + implemented formant shifting fixed batch conversion 2023-07-26 06:24:23 +07:00			`converting = (`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`ffmpeg.input(file_formanted, threads=0)`
stftpshift overhaul + fixes fixed cli traceback + implemented formant shifting fixed batch conversion 2023-07-26 06:24:23 +07:00			`.output(f"{file_formanted}.wav")`
			`.run(`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`cmd=["ffmpeg", "-nostdin"],`
			`capture_stdout=True,`
			`capture_stderr=True,`
stftpshift overhaul + fixes fixed cli traceback + implemented formant shifting fixed batch conversion 2023-07-26 06:24:23 +07:00			`)`
formanting fix now formanting accepts any audio, not just wavs. done with ffmpeg conversion. 2023-07-25 00:23:56 +07:00			`)`
stftpshift overhaul + fixes fixed cli traceback + implemented formant shifting fixed batch conversion 2023-07-26 06:24:23 +07:00			`else:`
			`pass`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
			`file_formanted = (`
			`f"{file_formanted}.wav"`
			`if not file_formanted.endswith(".wav")`
			`else file_formanted`
			`)`

stftpshift overhaul + fixes fixed cli traceback + implemented formant shifting fixed batch conversion 2023-07-26 06:24:23 +07:00			`print(f" · Formanting {file_formanted}...\n")`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00			`os.system(`
linux 2023-07-27 11:04:45 +07:00			`'%s -i "%s" -q "%s" -t "%s" -o "%sFORMANTED_%s.wav"'`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`% (`
			`stft,`
			`file_formanted,`
			`Quefrency,`
			`Timbre,`
			`file_formanted,`
			`str(numerator),`
			`)`
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00			`)`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
stftpshift overhaul + fixes fixed cli traceback + implemented formant shifting fixed batch conversion 2023-07-26 06:24:23 +07:00			`print(f" · Formanted {file_formanted}!\n")`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00			`# filepraat = (os.path.abspath(os.getcwd()) + '\\' + file).replace('/','\\')`
			`# file_formantedpraat = ('"' + os.path.abspath(os.getcwd()) + '/' + 'formanted'.join(file_formanted) + '"').replace('/','\\')`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`# print("%sFORMANTED_%s.wav" % (file_formanted, str(numerator)))`

Tweaked files upload and replace 2023-07-21 20:36:54 +07:00			`out, _ = (`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`ffmpeg.input(`
			`"%sFORMANTED_%s.wav" % (file_formanted, str(numerator)), threads=0`
			`)`
Tweaked files upload and replace 2023-07-21 20:36:54 +07:00			`.output("-", format="f32le", acodec="pcm_f32le", ac=1, ar=sr)`
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00			`.run(`
			`cmd=["ffmpeg", "-nostdin"], capture_stdout=True, capture_stderr=True`
			`)`
Tweaked files upload and replace 2023-07-21 20:36:54 +07:00			`)`
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`try:`
			`os.remove("%sFORMANTED_%s.wav" % (file_formanted, str(numerator)))`
			`except Exception:`
			`pass`
			`print("couldn't remove formanted type of file")`

Tweaked files upload and replace 2023-07-21 20:36:54 +07:00			`else:`
			`out, _ = (`
			`ffmpeg.input(file, threads=0)`
			`.output("-", format="f32le", acodec="pcm_f32le", ac=1, ar=sr)`
Apply Code Formatter Change 2023-07-23 03:47:53 +00:00			`.run(`
			`cmd=["ffmpeg", "-nostdin"], capture_stdout=True, capture_stderr=True`
			`)`
Tweaked files upload and replace 2023-07-21 20:36:54 +07:00			`)`
fix: train step2a & add arg --port --pycmd --noparallel 2023-04-01 16:42:19 +08:00			`except Exception as e:`
			`raise RuntimeError(f"Failed to load audio: {e}")`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
fixed non-formant inference 2023-07-26 23:01:10 +07:00			`if converted:`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00			`try:`
			`os.remove(file_formanted)`
			`except Exception:`
			`pass`
			`print("couldn't remove converted type of file")`
fixed non-formant inference 2023-07-26 23:01:10 +07:00			`converted = False`
Apply Code Formatter Change 2023-07-28 23:45:47 +00:00
Format code (#142) Co-authored-by: github-actions[bot] <github-actions[bot]@users.noreply.github.com> 2023-04-24 20:35:56 +08:00			`return np.frombuffer(out, np.float32).flatten()`