| # | uttid | text | ref |
baseline_tgtlen
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15__yt4_wavtokenizer_16K_lossent0.15__2026-01-19_14-20-36
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-19_14-20-36
|
indextts2 |
literategoggles_idxdistill
basket_config_path: /mount/s3/tts-binary-data-nb/dchebakov/metrics/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_idxdistill_1ref_emo
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: /mount/s3/tts-binary-data-nb/dchebakov/metrics/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
duplicate_reference: false
exp: /mount/s3/tts-binary-data-nb/dchebakov/models/yt4_wavtokenizer_16K_lossent0.15_idxdistill_1ref_emo
gpt_generate_args:
do_sample: true
enforce_silent_start: false
num_return_sequences: 30
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825_en-US/yt4_wavtokenizer_16K_lossent0.15_idxdistill_1ref_emo__2026-01-10_07-59-19
ref_dir: cc_20250825_en-US/ref
ticket: QUALITY-000
basket_generation_git_hash: 084ccc0c4313e646e3630e4e5a35b7e04d70fdad
model_data_type: tts-cloning
ticket: QUALITY-000
version: 2026-01-10_07-59-19
|
movies2_finetune
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_18-28-38
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_18-28-38
|
movies2_finetune_snr0
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 0.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_18-35-53
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_18-35-53
|
movies2_finetune_anim
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 1.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_18-42-42
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_18-42-42
|
movies2_finetune_en
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_18-49-55
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_18-49-55
|
movies2_finetune_all
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 1.0
pitch_std: 100.0
snr: 0.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_18-57-14
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_18-57-14
|
movies2_finetune_closest
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_17-11-09
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_17-11-09
|
movies2_finetune_closest_snr0
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 0.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_17-18-17
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_17-18-17
|
movies2_finetune_closest_anim
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 1.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_17-25-18
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_17-25-18
|
movies2_finetune_closest_en
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_17-32-27
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_17-32-27
|
movies2_finetune_closest_all
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 1.0
pitch_std: 100.0
snr: 0.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_17-39-39
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_17-39-39
|
movies2_finetune_lora
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_17-46-48
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_17-46-48
|
movies2_finetune_lora_snr0
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 0.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_17-54-50
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_17-54-50
|
movies2_finetune_lora_anim
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 1.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_18-03-26
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_18-03-26
|
movies2_finetune_lora_en
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_18-11-54
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_18-11-54
|
movies2_finetune_lora_all
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 1.0
pitch_std: 100.0
snr: 0.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_18-20-12
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_18-20-12
|
movies2_finetune_lora_closest
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_16-28-55
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_16-28-55
|
movies2_finetune_lora_closest_snr0
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 0.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_16-37-20
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_16-37-20
|
movies2_finetune_lora_closest_anim
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 1.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_16-45-44
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_16-45-44
|
movies2_finetune_lora_closest_en
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 0.0
pitch_std: 100.0
snr: 100.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_16-54-00
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_16-54-00
|
movies2_finetune_lora_closest_all
basket_config_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/cc_20250825_en-US.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
duplicate_reference: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest
gpt_generate_args:
do_sample: true
min_new_tokens: 20
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
is_animation: 1.0
pitch_std: 100.0
snr: 0.0
year: 2025.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250825/yt4_wavtokenizer_16K_lossent0.15_movies2_finetune_lora_closest__yt4_wavtokenizer_16K_lossent0.15__2026-01-14_17-02-35
ref_dir: cc_20250825/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2026-01-14_17-02-35
|
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
|
DF-creative-commons-basket/Ll6fcDRKi9k_ru/F0__0.040-1.410_spk
|
||||||||||||||||||||||||||
|
DF-creative-commons-basket/U_1cQLJKt7c_es/F0__15.250-20.940_spk
|
||||||||||||||||||||||||||
|
DF-creative-commons-basket/uTbCKWoc1YY_zh/F0__18.920-19.913
|
You're not coming home today?
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/2BJj_jAbQSw_pt/F1__5.060-6.178
|
How coward you are..
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/mQSxiD4Kp6c_es/F0__25.370-27.460_spk
|
||||||||||||||||||||||||||
|
DF-creative-commons-basket/-d9C5FyXvvw_it/M0__12.929-13.539_spk
|
||||||||||||||||||||||||||
|
DF-creative-commons-basket/-d9C5FyXvvw_it/M0__12.929-13.539
|
He did it.
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/5Ges6LpYtI0_it/M0__9.020-10.034_spk
|
||||||||||||||||||||||||||
|
DF-creative-commons-basket/qJaAnEUiO6E_it/F0__17.780-18.690
|
I'm sure.
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/5k25FVLoCyo_ru/F0__9.440-11.890
|
You know, our mom taught us to respect our father.
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/9ekEozd_9QE_ja/M0__0.000-7.503_spk
|
||||||||||||||||||||||||||
|
DF-creative-commons-basket/xB2eAA38st4_hi/M0__20.710-23.000_spk
|
||||||||||||||||||||||||||
|
DF-creative-commons-basket/QTa0hoQDonY_pt/M0__3.370-5.520
|
Luciano, I don't feel comfortable in my own home anymore.
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/OesbsUiwgo0_pt/F0__7.550-8.920
|
You can get back to work.
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/P8yVtZpEY7Y_es/F0__6.550-8.390
|
You're not going to compare that ugly woman to me.
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/2BJj_jAbQSw_pt/F0__3.050-4.300
|
What are you talking about?
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/mQSxiD4Kp6c_es/F0__10.115-14.715
|
But don't let him fool you because he's not as much of a gentleman as you are, even though he's carrying a lady in his arms.
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/P6glOSnV2gM_fr/M0__17.640-19.710
|
From the beginning, you decide everything on your own and then you run away.
|
|||||||||||||||||||||||||
|
DF-creative-commons-basket/yFfw234lX0c_zh/M0__7.020-10.740_spk
|
||||||||||||||||||||||||||
|
DF-creative-commons-basket/xtiiG-k5ejA_de/F0__0.150-3.940_spk
|