Commit Graph - TTS - Code by DblK

Mirrors/TTS

Fork 0

mirror of https://github.com/coqui-ai/TTS.git synced 2026-07-10 12:32:09 +02:00

Commit Graph

Select branches

Hide Pull Requests

1316-rebase

Edresson-patch-1

Fix-typo-workflow-text

Fix_#1380

VITS-debug-dp

VITS-upsample

add-synpaflex-formatter

add_lang_code

add_neural_hmm_model

api_model_path

attribute-extraction

audio_len_sampler

calling_hf_models

cml-recipe

cml-tts-recipe

conflict_resolve

cpu-only-docker-image

d_vector_serialization

dev

dev-emotion

dev-emotion-rebased

dev-fix-scl

dev-managers

dev-update-readme

dev-yourtts-rec

dev_bark

docs_fix

emotion-dataset

emotion_cond_module

env_tos

fairseq_port

faster-linting

finetune_bark

fix-1423

fix-asserts+mas

fix-publish

fix-xtts-download

fix_#2797

fix_aux_tests

fix_bce_loss

fix_comp_emb

fix_condition_dp_on_speaker

fix_delightfulltts

fix_doc_dataset

fix_style

fix_warn

fix_xtts_load

fix_xtts_v1.1

fix_xtts_v1.1_

fix_zoo_test

force_phonemizer_definition

hifigan

init_stt_v2

main

mp3_len_fix

p3_11

patch-print-license

print_license_info

remove_v1_doc

revert-3038-xtts_redonwload

run_ci_for_v0.20.6

thorsten_models

timeout-check-config

tortoise_fixup

tortoise_pr_fixup

unbind_trainer_ver

unified_api_forwardtts2

update-coqpit-req

update-workflows

update_checkpoint_name

update_model_save

update_trainer

update_xtts_cloning

vits-pitch-pred

vits-pitch-pred-new

xtts

xtts_demo

xtts_redonwload

xtts_trainer

yourtts_adaptive_weight

#1

#10

#1000

#1007

#1009

#1020

#1021

#1022

#1026

#1027

#1028

#1031

#1032

#1043

#1044

#1047

#1048

#1049

#1050

#1051

#1054

#1055

#1056

#1060

#1069

#1078

#1079

#1080

#11

#1125

#1162

#1162

#1190

#1191

#1195

#1207

#1216

#1224

#1225

#1227

#1228

#1238

#1251

#1265

#1274

#1276

#1279

#1280

#1282

#1288

#1303

#1315

#1316

#1324

#1337

#1346

#1347

#1348

#1349

#1353

#1354

#1363

#1365

#1367

#1370

#1374

#1386

#1391

#1395

#1397

#1399

#1402

#1403

#1404

#1405

#1406

#1409

#1411

#1418

#1419

#1422

#1424

#1431

#1434

#1435

#1436

#1437

#1441

#1451

#1452

#1456

#1459

#1461

#1463

#1469

#1470

#1478

#1498

#15

#1510

#1511

#1512

#1514

#1524

#1526

#1527

#1532

#1535

#1537

#1538

#1539

#1540

#1541

#1542

#1544

#1545

#1550

#1555

#1556

#1557

#1558

#1560

#1561

#1562

#1564

#1565

#1567

#1570

#1572

#1573

#1574

#1581

#1583

#1584

#1587

#1589

#1597

#1599

#16

#1616

#1618

#1620

#1623

#1629

#1630

#1638

#1640

#1641

#1653

#1661

#1664

#1666

#1675

#1676

#1679

#1679

#1682

#1686

#1694

#1705

#1717

#1718

#1726

#1739

#1749

#1753

#1760

#1765

#1767

#1768

#1776

#1780

#1791

#1792

#1796

#1797

#1801

#1807

#1809

#1810

#1821

#1822

#1825

#1835

#1844

#1853

#1871

#1872

#1873

#1882

#1898

#1905

#1912

#1914

#1928

#1933

#1938

#1940

#1942

#1945

#1946

#1967

#1970

#1971

#1977

#1978

#1991

#1994

#2

#2001

#2019

#2024

#2048

#2054

#2065

#2066

#2071

#2073

#2077

#2079

#2086

#2095

#2102

#2103

#2114

#2116

#2132

#2135

#2136

#2138

#2140

#2144

#2146

#2149

#2150

#2153

#2154

#2161

#2162

#2169

#2178

#2183

#2187

#2189

#2194

#2195

#2198

#2203

#2204

#2205

#2206

#2211

#2218

#2223

#2226

#2228

#2229

#2234

#2242

#2244

#2245

#2248

#2249

#2253

#2257

#2271

#2272

#2276

#2277

#2284

#2295

#2303

#2305

#2310

#2314

#2316

#2325

#2326

#2328

#2329

#2337

#2339

#2349

#2352

#2357

#2364

#2377

#2379

#2380

#2389

#2390

#2393

#2399

#2407

#2418

#2427

#2435

#2445

#2445

#2451

#2460

#2462

#2463

#2463

#2470

#2475

#2478

#2480

#2484

#2485

#2489

#2495

#2499

#2508

#2509

#2515

#2518

#2519

#2524

#2526

#2527

#2532

#2533

#2540

#2543

#2547

#2549

#2551

#2563

#2571

#2572

#2576

#2577

#2582

#2587

#2592

#2595

#2596

#2600

#2603

#2604

#2616

#2617

#2626

#2628

#2629

#2638

#2647

#2650

#2651

#2653

#2655

#2659

#2661

#2662

#2663

#2666

#2666

#2667

#2668

#2671

#2682

#2685

#2695

#2697

#2698

#2700

#2718

#2725

#2733

#2735

#2741

#2743

#2748

#2750

#2751

#2754

#2756

#2757

#2776

#2783

#2790

#2791

#2806

#2808

#2816

#2822

#2823

#2826

#2831

#2836

#2838

#2840

#2843

#2845

#2846

#2851

#2854

#2855

#2856

#2861

#2870

#2871

#2875

#2876

#2893

#2894

#2899

#2909

#2912

#2914

#2919

#2922

#2925

#2926

#2934

#2939

#2943

#2945

#2949

#2950

#2951

#2954

#2956

#2961

#2963

#2970

#2981

#2983

#2990

#2992

#2993

#2999

#3

#3001

#3003

#3004

#3009

#3010

#3011

#3012

#3021

#3027

#3035

#3036

#3038

#3048

#3057

#3058

#3061

#3062

#3065

#3066

#3070

#3071

#3081

#3082

#3086

#3089

#3090

#3092

#3093

#3094

#3096

#3103

#3105

#3108

#3109

#3115

#3117

#3120

#3126

#3127

#3128

#3129

#3130

#3133

#3137

#3138

#3149

#3150

#3151

#3154

#3156

#3158

#3159

#3160

#3168

#3169

#3170

#3172

#3173

#3176

#3179

#3182

#3183

#3195

#3201

#3203

#3207

#3208

#3210

#3214

#3215

#3216

#3226

#3227

#3230

#3238

#3239

#3241

#3242

#3243

#3247

#3248

#3249

#3251

#3263

#3273

#3275

#3279

#3281

#3286

#3294

#3296

#3297

#3300

#3318

#3319

#3329

#3336

#3341

#3349

#3351

#3352

#3353

#3355

#3368

#3373

#3381

#3385

#3390

#3391

#3392

#3404

#3405

#3412

#3414

#3422

#3423

#3437

#3442

#3446

#3450

#3469

#3471

#3476

#3476

#3487

#3492

#3497

#3500

#3502

#3504

#3509

#3511

#3523

#3528

#3547

#3547

#3561

#3582

#3589

#3594

#3597

#3615

#3622

#3625

#3625

#3632

#3633

#3634

#3651

#3652

#3660

#3666

#367

#3672

#3690

#3696

#3708

#3719

#3720

#3724

#373

#3730

#3747

#375

#3755

#3765

#3769

#3788

#3789

#379

#3792

#3809

#3832

#384

#3852

#3853

#393

#394

#395

#3963

#3963

#3969

#3973

#3977

#398

#3994

#3997

#4

#4000

#4021

#4023

#4052

#4088

#4088

#4090

#4090

#4091

#4091

#4115

#4120

#4166

#4173

#4174

#4175

#4175

#4182

#4188

#4194

#420

#4214

#422

#423

#4298

#430

#4300

#4306

#4320

#4330

#4336

#4337

#435

#4351

#4352

#4355

#4358

#4362

#4362

#4367

#4368

#4380

#4384

#4384

#4390

#4397

#4399

#4401

#4402

#4403

#4404

#4407

#441

#4413

#4414

#4421

#4423

#445

#446

#453

#454

#457

#462

#468

#476

#477

#479

#481

#487

#488

#495

#5

#501

#502

#506

#508

#510

#518

#519

#520

#523

#524

#526

#527

#532

#535

#543

#544

#545

#546

#550

#551

#552

#557

#558

#559

#561

#562

#572

#581

#586

#6

#602

#606

#609

#611

#613

#617

#619

#620

#628

#629

#630

#642

#645

#656

#658

#664

#667

#673

#674

#683

#685

#689

#694

#696

#699

#7

#701

#702

#706

#708

#713

#716

#717

#718

#719

#722

#724

#725

#726

#727

#731

#736

#742

#751

#758

#762

#766

#777

#784

#785

#787

#789

#790

#791

#792

#793

#800

#802

#803

#814

#815

#831

#847

#848

#882

#887

#888

#889

#891

#893

#898

#899

#900

#901

#914

#922

#931

#937

#943

#977

#983

#984

#995

speaker_encoder_model

v0.0.10

v0.0.11

v0.0.12

v0.0.13

v0.0.14

v0.0.15

v0.0.15.1

v0.0.9

v0.1.0

v0.1.1

v0.1.2

v0.1.3

v0.10.0

v0.10.0_models

v0.10.1

v0.10.1_models

v0.10.2

v0.11.0

v0.11.0_models

v0.11.1

v0.12.0

v0.13.0

v0.13.0_models

v0.13.1

v0.13.2

v0.13.3

v0.13.3_models

v0.14.0

v0.14.0_models

v0.14.1

v0.14.1_models

v0.14.2

v0.14.3

v0.15.0

v0.15.1

v0.15.2

v0.15.4

v0.15.5

v0.15.6

v0.16.0

v0.16.1

v0.16.2

v0.16.3

v0.16.4

v0.16.5

v0.16.6

v0.17.0

v0.17.1

v0.17.10

v0.17.2

v0.17.3

v0.17.4

v0.17.5

v0.17.6

v0.17.7

v0.17.8

v0.17.9

v0.18.0

v0.18.1

v0.18.2

v0.19.0

v0.19.1

v0.2.0

v0.2.1

v0.2.2

v0.20.0

v0.20.1

v0.20.2

v0.20.3

v0.20.4

v0.20.5

v0.20.6

v0.21.0

v0.21.1

v0.21.2

v0.21.3

v0.22.0

v0.3.0

v0.3.1

v0.4.0

v0.4.1

v0.4.2

v0.5.0

v0.5.0_models

v0.6.0

v0.6.0_models

v0.6.1

v0.6.1_models

v0.6.2

v0.6.2_models

v0.7.0

v0.7.0_models

v0.7.1

v0.7.1_models

v0.8.0

v0.8.0_models

v0.9.0

7bb45a20ec Build and publish CPU only Docker image Reuben Morais 2022-05-11 14:41:07 +02:00
27cf388a79 Update CI tests (#1572) Eren Gölge 2022-05-12 18:41:01 +02:00
4857967063 🐍 Python 3.10.x support and drop Python 3.6 support (#1565) Eren Gölge 2022-05-12 15:50:25 +02:00
a97eed696a Fix the bug in eSpeak wrapper for eSpeak version 1.48.15 (#1560) Edresson Casanova 2022-05-12 10:15:18 -03:00
e45ae57aef Merge pull request #1550 from coqui-ai/fix-upsampling-asserts Eren Gölge 2022-05-12 14:51:41 +02:00
175ca06388 Add reinit text encoder and duration predictor parameter (#1562) Edresson Casanova 2022-05-09 14:28:37 -03:00
182711043c Fix the VITS upsampling asserts Edresson Casanova 2022-05-07 14:13:05 -03:00
f9d91a55f2 Improve data_path resolvement (#1567) Taras Sereda 2022-05-12 14:10:35 +03:00
d5d590bc36 Fix Dockerfile Eren Gölge 2022-05-12 12:55:27 +02:00
6484be687c Build and publish CPU only Docker image Reuben Morais 2022-05-11 14:41:07 +02:00
2fc38f67d2 Update SpeakerManager init in Synthesizer Eren Gölge 2022-05-11 11:32:27 +02:00
c3f8c4d5eb Return default SpeakerManager if no d_vector_file Eren Gölge 2022-05-11 11:31:45 +02:00
121e9ed685 Pass use_cuda to init_encoder Eren Gölge 2022-05-11 11:31:17 +02:00
c18bd21b3f Return durations at VITS inference Eren Gölge 2022-05-11 11:30:05 +02:00
5021a03de0 Use torch.no_grad for VITS inference Eren Gölge 2022-05-11 11:29:36 +02:00
3f03e3012c Fix batch_group_size in VITS Eren Gölge 2022-05-07 13:40:34 +02:00
fa887ef5f9 Fix issue probably-meant-fstring found at https://codereview.doctor (#1532) code-review-doctor 2022-05-07 12:33:40 +01:00
a34076af35 Update documentation for multi-gpu training Arvind Suresh 2022-05-03 08:01:10 -04:00
a0a9279e4b Fix GAN optimizer order Eren Gölge 2022-05-07 13:28:22 +02:00
60034674f9 Remove audio padding before mel spec extraction Edresson Casanova 2022-04-28 15:40:16 -03:00
fbdf76b2fc returns y_mask in VITS inference (#1540) WeberJulian 2022-04-27 10:42:26 +02:00
5680b599ca Fix style fix-asserts+mas Edresson Casanova 2022-05-02 15:51:42 -03:00
39db650bdb Fix the VITS upsampling asserts Edresson Casanova 2022-05-02 15:43:23 -03:00
2f39054557 Fix unit test Edresson Casanova 2022-04-29 16:29:44 -03:00
4693d87974 Fix style Edresson Casanova 2022-04-29 07:28:39 -03:00
9fa014ce34 Change order of HIFI-GAN optimizers to be equal than the original repository Edresson Casanova 2022-04-28 17:08:04 -03:00
1ff925d558 Remove audio padding before mel spec extraction Edresson Casanova 2022-04-28 15:40:16 -03:00
b78431d7e2 Fix MAS Eren Gölge 2022-05-03 00:34:55 +02:00
76b274e690 Merge pull request #1541 from coqui-ai/comp_emb_fix Edresson Casanova 2022-04-27 07:28:48 -03:00
379ccd7ba6 returns y_mask in VITS inference (#1540) WeberJulian 2022-04-27 10:42:26 +02:00
6233f4fcd7 Bug fix in compute embedding without eval partition Edresson Casanova 2022-04-26 13:54:09 -03:00
a41e860a66 Update Coqpit requirement (#1539) Edresson Casanova 2022-04-26 12:39:36 -03:00
69c8d0b7c9 Update Coqpit requirement update-coqpit-req Edresson Casanova 2022-04-26 09:30:18 -03:00
c50a427b51 Update Coqpit requeriment VITS-upsample Edresson Casanova 2022-04-26 09:22:39 -03:00
8d228ab22a Trick to Upsampling to High sampling rates using VITS model (#1456) Edresson Casanova 2022-04-26 06:47:46 -03:00
af98ec8eb9 Move upsampling tests to test_vits.py Edresson Casanova 2022-04-25 09:06:40 -03:00
f4e53295b1 Add asserts for encoder_sample_rate part Edresson Casanova 2022-04-22 12:07:37 -03:00
ce7138d9d4 Add upsampling_init and upsampling_z methods Edresson Casanova 2022-04-22 09:03:31 -03:00
b3e2c58398 Rename TTS_part_sample_rate to encoder_sample_rate Edresson Casanova 2022-04-22 07:57:27 -03:00
3f3efe88bb Fix the docs Edresson Casanova 2022-04-22 07:49:51 -03:00
d495e4581f Add docs for VITS upsampling Edresson Casanova 2022-04-21 16:57:36 -03:00
1e75942dbc Remove useless detach_z_vocoder parameter Edresson Casanova 2022-04-21 15:59:34 -03:00
984e2d66ac Add unit tests Edresson Casanova 2022-04-21 15:57:43 -03:00
c32082a62c Bug fix in speaker encoder load in inference time Edresson Casanova 2022-04-21 15:55:49 -03:00
adcc2f8299 Add the period for VITS multi-period discriminator in model_args Edresson Casanova 2022-04-21 10:03:37 -03:00
9252b3c5bd Style fix Edresson Casanova 2022-04-21 09:03:03 -03:00
17b6486ef1 Add RMS based norm in save_wav method Edresson Casanova 2022-04-21 08:26:27 -03:00
18d110eb23 Fix lint checks Edresson Casanova 2022-03-28 22:04:49 +00:00
faec6393bc Fix the bug in inference Edresson Casanova 2022-03-28 20:01:51 +00:00
99ecf357af Add upsample VITS support Edresson Casanova 2022-03-24 15:10:02 -03:00
4d1718a19a Implement get_state_dict update_model_save Eren Gölge 2022-04-22 12:39:46 +02:00
dfc19cd3ae Remove remaned trainer functions Eren Gölge 2022-04-22 12:37:35 +02:00
21cbfe964e Add RMS based norm in save_wav method VITS-debug-dp Edresson Casanova 2022-04-21 08:26:27 -03:00
c410bc58ef Bump to v0.6.2 v0.6.2 Eren Gölge 2022-04-20 11:46:26 +02:00
5271846d9c Add Speech style balancer Edresson Casanova 2022-04-19 15:51:15 -03:00
30bea7d53c Update manage.py (#1514) WeberJulian 2022-04-19 14:27:32 +02:00
b45d5c5c60 Improve docsQA default questions (#1411) Yanlong Wang 2022-04-19 20:24:34 +08:00
7b6339f2ed Update manage.py patch-print-license WeberJulian 2022-04-19 14:23:36 +02:00
a050aa7bb7 Update manage.py print_license_info WeberJulian 2022-04-19 14:18:52 +02:00
7133f8f47d Print Model's license when downloading (#1512) Eren Gölge 2022-04-19 14:18:49 +02:00
4953636b14 Add African models (#1511) WeberJulian 2022-04-19 14:18:30 +02:00
816d375ae3 Make style Eren Gölge 2022-04-19 14:10:52 +02:00
07a56641f1 Add a new license link Eren Gölge 2022-04-19 13:59:38 +02:00
da52a45fca Make style Eren Gölge 2022-04-19 13:57:14 +02:00
5cc8e48c3a Print model license while downloading Eren Gölge 2022-04-19 11:26:02 +02:00
b6073d16fb Return duration by ForwardTTS inference Eren Gölge 2022-04-19 11:00:15 +02:00
7ce4444056 Make style Eren Gölge 2022-04-19 10:59:59 +02:00
df30f9d885 Update ForwardTTSe2e tests Eren Gölge 2022-04-19 10:58:52 +02:00
8f3552fbaa Remove redundant abstract function Eren Gölge 2022-04-19 09:23:35 +02:00
5cd7fa6228 Refactor TTSDataset to use numpy transforms Eren Gölge 2022-04-19 09:23:18 +02:00
3824838e5d Update ForwardTTSE2eLoss Eren Gölge 2022-04-19 09:22:50 +02:00
85c03c75ca Make AP optional in BaseTTS Eren Gölge 2022-04-19 09:22:08 +02:00
2457739b5e Add numpy and torch transforms Eren Gölge 2022-04-19 09:21:46 +02:00
7742c0b64e Refactor ForwardTTS to skip decoder Eren Gölge 2022-04-19 09:21:31 +02:00
518b216631 Make plot results more general Eren Gölge 2022-04-19 09:20:31 +02:00
82c2ca505d Add missing kernel size attr to transformer layer Eren Gölge 2022-04-19 09:19:57 +02:00
622ff07c45 Remove AP from FastPitchE2e Eren Gölge 2022-04-19 09:19:07 +02:00
52e86d8866 Update fastpitche2e recipe Eren Gölge 2022-04-19 09:18:49 +02:00
519ee7c776 Update import statements Eren Gölge 2022-04-19 09:16:03 +02:00
093bd07528 Add reversal classifier loss Edresson Casanova 2022-04-18 21:09:59 -03:00
8a3396d9c1 Add prosody encoder training support Edresson Casanova 2022-04-18 17:01:44 -03:00
e8573bfe3e Update CONTRIBUTING.md (#1463) v0.6.2_models jackiexiao 2022-04-15 20:43:46 +08:00
c18100d112 Merge branch 'docker-ci' into dev (Fixes #1498) Reuben Morais 2022-04-15 02:32:51 +02:00
27fcb5dabf Add Dockerfile and build/push CI Reuben Morais 2022-04-15 01:13:32 +02:00
bb7a645e7a Add debug script Edresson Casanova 2022-04-14 08:31:52 -03:00
164c7dd676 Update requirements coqui_trainer -> trainer (#1478) Eren Gölge 2022-04-08 14:47:09 +02:00
3abe75c1d3 Update requirements coqui_trainer -> trainer update_trainer Eren Gölge 2022-04-07 14:37:55 +02:00
ad24598797 Remove redundancy Eren Gölge 2022-04-04 09:46:30 +02:00
9e456e8053 Fix Vocoder logging Eren Gölge 2022-04-04 09:46:10 +02:00
e5a9902e85 Rename vars in VITS Eren Gölge 2022-04-04 09:45:46 +02:00
8f21991a84 Add cond layer in decoder Eren Gölge 2022-04-04 09:44:20 +02:00
8408b983b2 Refactor multi-speaker init in ForwardTTS Eren Gölge 2022-04-04 09:43:46 +02:00
f1b034c8b0 Implement BaseTTSE2E Eren Gölge 2022-04-04 09:43:15 +02:00
29216ff907 Implement ForwardTTSE2E Loss Eren Gölge 2022-04-04 09:42:50 +02:00
95b52a65af Implement FastPitchE2E LJSpeech recipe Eren Gölge 2022-04-04 09:41:46 +02:00
2c0cd0ddd5 Implement ForwardTTSE2E tests Eren Gölge 2022-04-04 09:41:25 +02:00
ade84aa124 Implement FastPitchE2EConfig Eren Gölge 2022-04-04 09:41:05 +02:00
c369f087ab Implement ForwardTTSE2Eg Eren Gölge 2022-04-04 09:40:36 +02:00
f31ba25233 Add emotion embedding in the encoder Edresson Casanova 2022-03-31 19:14:41 -03:00
314f95f974 Add formatter for the Emotional Speech Dataset Edresson Casanova 2022-03-31 17:27:30 +00:00

... 9 10 11 12 13 ...