| # | text | ref | baseline |
encodec_mbr_loudnorm40k
basket_config_path: quality/tts/tortoise-baskets/en_es_mapping_1000_24Khz.json
data_meta: null
exp_name: yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud
lang: es
meta:
basket_generation_config:
basket_lang: es
basket_path: quality/tts/tortoise-baskets/en_es_mapping_1000_24Khz.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: false
diff_steps: 400
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud/
force_reference_std: -21.5
gpt_generate_args:
do_sample: true
num_return_sequences: 50
prefix_allowed_tokens_fn: encodec_interleaved_layers
repetition_penalty_span: 50.0
use_cache: true
out_sample_rate: 48000
override_conditioning_features:
snr: 100.0
reranking_options:
cdist_time_downsampling_factor: 6
mode: MBR
top_k: 1
vocoder: none
num_workers: 1
output_dir: en_es_mapping_encodec_mbr_snrc50pitchstdoverride_tgtlen0.75_24Khz/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud__2024-07-15_07-54-56
ticket: TTS-393
basket_generation_git_hash: c8fbcc9a0f18330789b7a4441a1efbeea1019935
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-07-15_07-54-56
|
|---|---|---|---|---|
|
1230
|
||||
|
1231
|
||||
|
1232
|
||||
|
1233
|
||||
|
1234
|
||||
|
1235
|
||||
|
1236
|
||||
|
1237
|
||||
|
1238
|
||||
|
1239
|
||||
|
1240
|
||||
|
1241
|
||||
|
1242
|
||||
|
1243
|
||||
|
1244
|
||||
|
1245
|
||||
|
1246
|
||||
|
1247
|
||||
|
1248
|
||||
|
1249
|
||||
|
1250
|
||||
|
1251
|
||||
|
1252
|
||||
|
1253
|
||||
|
1254
|
||||
|
1255
|
||||
|
1256
|
||||
|
1257
|
||||
|
1258
|
||||
|
1259
|