From 593b740709996313fc88557adba6ab19e39f52e5 Mon Sep 17 00:00:00 2001
From: kalomaze <66376113+kalomaze@users.noreply.github.com>
Date: Sat, 22 Jul 2023 22:47:38 -0500
Subject: [PATCH] Fix training times by fixing fp16 detection

---
Review notes (text between the "---" line and the diff is ignored by git am):
* Line breaks and indentation were reconstructed from the hunk line counts;
  verify the whitespace against config.py before applying.
* usefp16 is now rebound with a function-level "global" statement; the
  module-level "global usefp16" was a no-op and the function only ever
  assigned a local of the same name.
* The duplicated fp16/fp32 branches are folded into _set_fp16_run().
* use_fp32_config() gains force_fp32=False and is called again from the
  "force to fp32" branch, so the configs are reset to fp16_run=false on
  those GPUs instead of being left untouched.
* The hunk that only removed the trailing newline of config.py was dropped.
* The post-image blob id on the "index" line is the one from the original
  patch and no longer matches the result of applying this version.

 config.py | 64 +++++++++++++++++++++++++++++++++++++++++++++----------
 1 file changed, 53 insertions(+), 11 deletions(-)

diff --git a/config.py b/config.py
index 2f64e13..9584c29 100644
--- a/config.py
+++ b/config.py
@@ -1,20 +1,61 @@
 import argparse
 import sys
 import torch
+import json
 from multiprocessing import cpu_count
 
+usefp16 = False
+
 
-def use_fp32_config():
-    for config_file in ["32k.json", "40k.json", "48k.json"]:
-        with open(f"configs/{config_file}", "r") as f:
-            strr = f.read().replace("true", "false")
-        with open(f"configs/{config_file}", "w") as f:
-            f.write(strr)
-    with open("trainset_preprocess_pipeline_print.py", "r") as f:
-        strr = f.read().replace("3.7", "3.0")
-    with open("trainset_preprocess_pipeline_print.py", "w") as f:
-        f.write(strr)
+def _set_fp16_run(enabled):
+    """Write ``fp16_run = enabled`` into the training configs.
+
+    Also swaps the matching literal in trainset_preprocess_pipeline_print.py:
+    "3.0" -> "3.7" when enabling fp16, "3.7" -> "3.0" when disabling it.
+    """
+    for config_file in ["32k.json", "40k.json", "48k.json"]:
+        with open(f"configs/{config_file}", "r", encoding="utf-8") as f:
+            data = json.load(f)
+
+        if "train" in data and "fp16_run" in data["train"]:
+            data["train"]["fp16_run"] = enabled
+
+        with open(f"configs/{config_file}", "w", encoding="utf-8") as f:
+            json.dump(data, f, indent=4)
+
+        print(f"Set fp16_run to {str(enabled).lower()} in {config_file}")
+
+    old, new = ("3.0", "3.7") if enabled else ("3.7", "3.0")
+    with open("trainset_preprocess_pipeline_print.py", "r", encoding="utf-8") as f:
+        strr = f.read()
+    with open("trainset_preprocess_pipeline_print.py", "w", encoding="utf-8") as f:
+        f.write(strr.replace(old, new))
+
+
+def use_fp32_config(force_fp32=False):
+    """Detect fp16 support on cuda:0 and sync the training configs to it.
+
+    fp16 is enabled when the GPU's major compute capability is >= 7, unless
+    force_fp32 is true (used for GPUs the caller has decided must stay fp32).
+    Without CUDA and without force_fp32, nothing is written.
+
+    Returns a (usefp16, device_capability) tuple; the module-level usefp16
+    flag is updated as well.
+    """
+    global usefp16  # rebind the module flag instead of shadowing it locally
+    usefp16 = False
+    device_capability = 0
+    if torch.cuda.is_available():
+        device = torch.device("cuda:0")  # Assuming you have only one GPU (index 0).
+        device_capability = torch.cuda.get_device_capability(device)[0]
+        usefp16 = device_capability >= 7 and not force_fp32
+        _set_fp16_run(usefp16)
+    elif force_fp32:
+        _set_fp16_run(False)
+    else:
+        print("CUDA is not available. Make sure you have an NVIDIA GPU and CUDA installed.")
+    return (usefp16, device_capability)
 
 
 class Config:
     def __init__(self):
@@ -95,9 +136,10 @@ class Config:
             ):
                 print("Found GPU", self.gpu_name, ", force to fp32")
                 self.is_half = False
-                use_fp32_config()
+                use_fp32_config(force_fp32=True)
             else:
                 print("Found GPU", self.gpu_name)
+                use_fp32_config()
             self.gpu_mem = int(
                 torch.cuda.get_device_properties(i_device).total_memory
                 / 1024