| # | uttid | text | ref |
baseline
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
gpt_generate_args:
do_sample: true
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: null
emotion: null
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15__yt4_wavtokenizer_16K_lossent0.15__2025-10-22_13-44-57
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-22_13-44-57
|
anger
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo
gpt_generate_args:
do_sample: true
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: 1.0
emotion: anger
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15__2025-10-22_13-00-14
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-22_13-00-14
|
happy
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo
gpt_generate_args:
do_sample: true
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: 2.0
emotion: happy
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15__2025-10-22_13-11-45
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-22_13-11-45
|
sad
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo
gpt_generate_args:
do_sample: true
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: 4.0
emotion: sad
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15__2025-10-22_12-42-25
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-22_12-42-25
|
surprised
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo
gpt_generate_args:
do_sample: true
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: 1.0
emotion: surprised
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15__2025-10-22_13-22-37
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-22_13-22-37
|
laughing
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo
gpt_generate_args:
do_sample: true
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
emo2vec: 1.0
emotion: laughing
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
vocoder: bigvgan
voice_samples_preprocessing: []
num_workers: 1
output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo__yt4_wavtokenizer_16K_lossent0.15__2025-10-22_13-33-29
ref_dir: cc_20250725/ref
ticket: QUALITY-41
basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-22_13-33-29
|
|---|---|---|---|---|---|---|---|---|---|
|
DF-sbs-cc-buc-qs1m/7EqatsqEI-0-ldkm_ru/F0__3.966-5.728
|
It was the only keepsake I had of her.
|
||||||||
|
DF-sbs-cc-buc-qs1m/ljsv6_fRwTU-v8c1_ru/F0__1.119-7.596
|
I think this is the most revolutionary feminist novel I've ever read.
|
||||||||
|
DF-sbs-cc-buc-qs1m/31p-0IxN0XU-4jxf_de/F1__16.592-17.722
|
And now I have three.
|
||||||||
|
DF-sbs-cc-buc-qs1m/IspiUk6P7eM-9yhr_pt/F3__7.050-8.500
|
Serve me!
|
||||||||
|
DF-sbs-cc-buc-qs1m/eN-waporon0-vu63_de/M0__9.169-17.037
|
I saw her and in the evening, I would rather let my mother yell at me than talk to Claudia Knipping.
|