{
  "train": {
    "log_interval": 200,
    "eval_interval": 1000,
    "seed": 42,
    "epochs": 10000,
    "learning_rate": 0.0002,
    "betas": [
      0.8,
      0.99
    ],
    "eps": 1e-09,
    "batch_size": 24,
    "fp16_run": false,
    "lr_decay": 0.99995,
    "segment_size": 16384,
    "init_lr_ratio": 1,
    "warmup_epochs": 0,
    "c_mel": 45,
    "c_kl": 1.0,
    "skip_optimizer": true
  },
  "data": {
    "training_files": "filelists/train.list",
    "validation_files": "filelists/val.list",
    "max_wav_value": 32768.0,
    "sampling_rate": 22050,
    "filter_length": 2048,
    "hop_length": 512,
    "win_length": 2048,
    "n_mel_channels": 128,
    "mel_fmin": 0.0,
    "mel_fmax": null,
    "add_blank": true,
    "n_speakers": 700,
    "cleaned_text": true,
    "spk2id": {
      "老克勒": 0,
      "美琳": 1,
      "Jane": 2,
      "小贝": 3,
      "SSB0005": 4,
      "SSB0009": 5,
      "SSB0011": 6,
      "SSB0012": 7,
      "SSB0016": 8,
      "SSB0018": 9,
      "SSB0033": 10,
      "SSB0038": 11,
      "SSB0043": 12,
      "SSB0057": 13,
      "SSB0073": 14,
      "SSB0080": 15,
      "SSB0112": 16,
      "SSB0122": 17,
      "SSB0133": 18,
      "SSB0139": 19,
      "SSB0145": 20,
      "SSB0149": 21,
      "SSB0193": 22,
      "SSB0197": 23,
      "SSB0200": 24,
      "SSB0241": 25,
      "SSB0246": 26,
      "SSB0261": 27,
      "SSB0267": 28,
      "SSB0273": 29,
      "SSB0287": 30,
      "SSB0288": 31,
      "SSB0299": 32,
      "SSB0307": 33,
      "SSB0309": 34,
      "SSB0315": 35,
      "SSB0316": 36,
      "SSB0323": 37,
      "SSB0338": 38,
      "SSB0339": 39,
      "SSB0341": 40,
      "SSB0342": 41,
      "SSB0354": 42,
      "SSB0366": 43,
      "SSB0375": 44,
      "SSB0379": 45,
      "SSB0380": 46,
      "SSB0382": 47,
      "SSB0385": 48,
      "SSB0393": 49,
      "SSB0394": 50,
      "SSB0395": 51,
      "SSB0407": 52,
      "SSB0415": 53,
      "SSB0426": 54,
      "SSB0427": 55,
      "SSB0434": 56,
      "SSB0435": 57,
      "SSB0470": 58,
      "SSB0482": 59,
      "SSB0502": 60,
      "SSB0534": 61,
      "SSB0535": 62,
      "SSB0539": 63,
      "SSB0544": 64,
      "SSB0565": 65,
      "SSB0570": 66,
      "SSB0578": 67,
      "SSB0588": 68,
      "SSB0590": 69,
      "SSB0594": 70,
      "SSB0599": 71,
      "SSB0601": 72,
      "SSB0603": 73,
      "SSB0606": 74,
      "SSB0607": 75,
      "SSB0609": 76,
      "SSB0614": 77,
      "SSB0623": 78,
      "SSB0629": 79,
      "SSB0631": 80,
      "SSB0632": 81,
      "SSB0666": 82,
      "SSB0668": 83,
      "SSB0671": 84,
      "SSB0686": 85,
      "SSB0700": 86,
      "SSB0710": 87,
      "SSB0720": 88,
      "SSB0723": 89,
      "SSB0737": 90,
      "SSB0746": 91,
      "SSB0748": 92,
      "SSB0751": 93,
      "SSB0758": 94,
      "SSB0760": 95,
      "SSB0762": 96,
      "SSB0778": 97,
      "SSB0780": 98,
      "SSB0784": 99,
      "SSB0786": 100,
      "SSB0794": 101,
      "SSB0817": 102,
      "SSB0851": 103,
      "SSB0863": 104,
      "SSB0871": 105,
      "SSB0887": 106,
      "SSB0913": 107,
      "SSB0915": 108,
      "SSB0919": 109,
      "SSB0935": 110,
      "SSB0966": 111,
      "SSB0987": 112,
      "SSB1008": 113,
      "SSB1020": 114,
      "SSB1024": 115,
      "SSB1050": 116,
      "SSB1055": 117,
      "SSB1056": 118,
      "SSB1064": 119,
      "SSB1072": 120,
      "SSB1091": 121,
      "SSB1096": 122,
      "SSB1100": 123,
      "SSB1108": 124,
      "SSB1115": 125,
      "SSB1125": 126,
      "SSB1131": 127,
      "SSB1136": 128,
      "SSB1138": 129,
      "SSB1161": 130,
      "SSB1203": 131,
      "SSB1204": 132,
      "SSB1218": 133,
      "SSB1221": 134,
      "SSB1253": 135,
      "SSB1320": 136,
      "SSB1341": 137,
      "SSB1366": 138,
      "SSB1377": 139,
      "SSB1383": 140,
      "SSB1385": 141,
      "SSB1392": 142,
      "SSB1393": 143,
      "SSB1408": 144,
      "SSB1431": 145,
      "SSB1437": 146,
      "SSB1448": 147,
      "SSB1555": 148,
      "SSB1563": 149,
      "SSB1567": 150,
      "SSB1575": 151,
      "SSB1585": 152,
      "SSB1593": 153,
      "SSB1607": 154,
      "SSB1624": 155,
      "SSB1625": 156,
      "SSB1630": 157,
      "SSB1650": 158,
      "SSB1670": 159,
      "SSB1684": 160,
      "SSB1686": 161,
      "SSB1699": 162,
      "SSB1711": 163,
      "SSB1759": 164,
      "SSB1806": 165,
      "SSB1828": 166,
      "SSB1831": 167,
      "SSB1832": 168,
      "SSB1837": 169,
      "SSB1846": 170,
      "SSB1863": 171,
      "SSB1878": 172,
      "SSB1891": 173,
      "SSB1918": 174,
      "SSB1935": 175,
      "SSB1939": 176,
      "SSB1956": 177,
      "SSB0693": 178,
      "SSB0711": 179,
      "SSB0716": 180,
      "SSB0717": 181,
      "SSB0736": 182,
      "SSB0749": 183,
      "SSB0809": 184,
      "SSB0702": 185,
      "SSB0822": 186,
      "SSB1110": 187,
      "SSB1215": 188,
      "SSB1399": 189,
      "SSB1728": 190,
      "SSB0993": 191,
      "SSB0997": 192,
      "SSB1000": 193,
      "SSB1001": 194,
      "SSB1002": 195,
      "SSB1126": 196,
      "SSB1135": 197,
      "SSB1176": 198,
      "SSB1187": 199,
      "SSB1197": 200,
      "SSB1216": 201,
      "SSB1219": 202,
      "SSB1239": 203,
      "SSB1274": 204,
      "SSB1302": 205,
      "SSB1322": 206,
      "SSB1328": 207,
      "SSB1340": 208,
      "SSB1365": 209,
      "SSB1382": 210,
      "SSB1402": 211,
      "SSB1452": 212,
      "SSB1457": 213,
      "SSB1739": 214,
      "SSB1745": 215,
      "SSB1781": 216,
      "SSB1782": 217,
      "SSB1809": 218,
      "SSB1810": 219,
      "SSB1872": 220,
      "SSB1902": 221,
      "小庄": 222,
      "小嘟": 223
    }
  },
  "model": {
    "use_spk_conditioned_encoder": true,
    "use_noise_scaled_mas": true,
    "use_mel_posterior_encoder": false,
    "use_duration_discriminator": true,
    "inter_channels": 192,
    "hidden_channels": 192,
    "filter_channels": 768,
    "n_heads": 2,
    "n_layers": 6,
    "kernel_size": 3,
    "p_dropout": 0.1,
    "resblock": "1",
    "resblock_kernel_sizes": [
      3,
      7,
      11
    ],
    "resblock_dilation_sizes": [
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ],
      [
        1,
        3,
        5
      ]
    ],
    "upsample_rates": [
      8,
      8,
      2,
      2,
      2
    ],
    "upsample_initial_channel": 512,
    "upsample_kernel_sizes": [
      16,
      16,
      8,
      2,
      2
    ],
    "n_layers_q": 3,
    "use_spectral_norm": false,
    "gin_channels": 256
  },
  "version": "2.0"
}