| # | uttid | text | ref |
baseline
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
gpt_generate_args:
do_sample: true
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15__yt4_wavtokenizer_16K_lossent0.15__2025-10-22_13-44-57
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-22_13-44-57
|
indextts |
indexttslike
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_indextts_v2
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_indextts_v2
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_indextts_v2__2025-12-05_07-39-35
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-12-05_07-39-35
|
indexttslike_ref
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_indextts_v2__diffusion_yt4_indextts_v2_ref
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/diffusion_yt4_indextts_v2_ref
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_indextts_v2
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_indextts_v2__diffusion_yt4_indextts_v2_ref__2025-12-05_07-49-12
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-12-05_07-49-12
|
indexttslike_tgtlen
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_indextts_v2
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_indextts_v2
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_indextts_v2__2025-12-05_07-58-41
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-12-05_07-58-41
|
indexttslike_tgtlen_ref
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_indextts_v2__diffusion_yt4_indextts_v2_ref
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/diffusion_yt4_indextts_v2_ref
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_indextts_v2
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_indextts_v2__diffusion_yt4_indextts_v2_ref__2025-12-05_08-06-50
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-12-05_08-06-50
|
|---|---|---|---|---|---|---|---|---|---|
|
DF-sbs-cc-buc-qs1m/mtohEFEZLBE-e8hl_pt/M0__17.038-17.319
|
Go on.
|
||||||||
|
ref/DF-sbs-cc-buc-qs1m/mFpCHV8M_kU-rl64_ru/F0__20.120-21.021
|
|||||||||
|
DF-sbs-cc-buc-qs1m/IspiUk6P7eM-9yhr_pt/F3__11.919-13.450
|
What are you waiting for?
|
||||||||
|
ref/DF-sbs-cc-buc-qs1m/Ll6fcDRKi9k-2pur_ru/F1__0.040-1.562
|
|||||||||
|
ref/DF-sbs-cc-buc-qs1m/mtohEFEZLBE-e8hl_pt/F1__11.002-12.132
|
|||||||||
|
DF-sbs-cc-buc-qs1m/h8Ht1PqPYMw-b6a0_ru/F0__3.680-5.720
|
One choice after another.
|
||||||||
|
DF-sbs-cc-buc-qs1m/mtohEFEZLBE-e8hl_pt/F1__11.002-12.132
|
Am I a victim?
|
||||||||
|
ref/DF-sbs-cc-buc-qs1m/xtiiG-k5ejA-uwwi_de/F0__14.674-15.934
|
|||||||||
|
ref/DF-sbs-cc-buc-qs1m/mtohEFEZLBE-e8hl_pt/M0__17.038-17.319
|
|||||||||
|
DF-sbs-cc-buc-qs1m/GLA2YCQi_Rk-f1zo_fr/M1__12.696-13.590
|
What should I get you from the bookstore?
|
||||||||
|
ref/DF-sbs-cc-buc-qs1m/K4IBuuxsKsw-dwwr_fr/F0__8.582-15.612
|
|||||||||
|
ref/DF-sbs-cc-buc-qs1m/lTa1VcbYZEE-l411_fr/M0__14.560-18.030
|
|||||||||
|
DF-sbs-cc-buc-qs1m/mtohEFEZLBE-e8hl_pt/F1__17.419-19.569
|
It might sound strange, but I am a victim.
|
||||||||
|
ref/DF-sbs-cc-buc-qs1m/UXx6zn9y2B8-jhmn_es/F0__21.454-27.100
|
|||||||||
|
DF-sbs-cc-buc-qs1m/rlR9M9QZ4Cg-h55y_de/M0__9.265-11.106
|
Everything had always been completely normal.
|
||||||||
|
DF-sbs-cc-buc-qs1m/lTa1VcbYZEE-l411_fr/F0__9.940-13.790
|
So whatever he might have told you was probably just made-up stuff.
|
||||||||
|
DF-sbs-cc-buc-qs1m/b91pBJWJDhQ-dlsj_ru/M0__7.084-8.965
|
I'll be hosting online marathons.
|
||||||||
|
ref/DF-sbs-cc-buc-qs1m/m8DHPYWvm2c-zqza_ru/M0__4.503-7.705
|
|||||||||
|
ref/DF-sbs-cc-buc-qs1m/DGbTKywfSxw-h1io_ru/F0__0.080-1.442
|
|||||||||
|
ref/DF-sbs-cc-buc-qs1m/DssUtj_qKf4-flgd_ru/M0__15.844-16.604
|