Prev
# uttid text baseline
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15__2025-10-07_00-41-14
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 2e93120b8f627c0ae77d8362efadde29892d2a29
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-07_00-41-14
angry
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: 1.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15__2025-10-07_01-01-59
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 2e93120b8f627c0ae77d8362efadde29892d2a29
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-07_01-01-59
sad
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: 4.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15__2025-10-07_00-54-07
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 2e93120b8f627c0ae77d8362efadde29892d2a29
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-07_00-54-07
happy
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: 2.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15__2025-10-07_01-09-57
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 2e93120b8f627c0ae77d8362efadde29892d2a29
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-07_01-09-57
nombr
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v
      gpt_generate_args:
        do_sample: true
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        pitch_std: 100.0
        snr: 100.0
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15__2025-10-07_00-48-41
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 2e93120b8f627c0ae77d8362efadde29892d2a29
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-07_00-48-41
angry_nombr
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v
      gpt_generate_args:
        do_sample: true
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: 1.0
        pitch_std: 100.0
        snr: 100.0
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15__2025-10-07_01-22-38
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 2e93120b8f627c0ae77d8362efadde29892d2a29
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-07_01-22-38
sad_nombr
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v
      gpt_generate_args:
        do_sample: true
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: 4.0
        pitch_std: 100.0
        snr: 100.0
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15__2025-10-07_01-17-19
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 2e93120b8f627c0ae77d8362efadde29892d2a29
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-07_01-17-19
happy_nombr
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v
      gpt_generate_args:
        do_sample: true
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: 2.0
        pitch_std: 100.0
        snr: 100.0
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_emo2vec_v2v__yt4_wavtokenizer_16K_lossent0.15__2025-10-07_01-28-08
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 2e93120b8f627c0ae77d8362efadde29892d2a29
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-07_01-28-08
DF-sbs-cc-buc-qs1m/31p-0IxN0XU-4jxf_de/F0__2.682-4.812
We won't know whether to drink it all away or just leave it be.
DF-sbs-cc-buc-qs1m/DssUtj_qKf4-flgd_ru/M0__15.844-16.604
What?
DF-sbs-cc-buc-qs1m/31p-0IxN0XU-4jxf_de/F0__1.461-2.421
That's your doing.
DF-sbs-cc-buc-qs1m/ljsv6_fRwTU-v8c1_ru/F0__7.596-12.493
How a woman of that era found the strength to reject Darcy because he treated her poorly.
DF-sbs-cc-buc-qs1m/mFpCHV8M_kU-rl64_ru/F1__17.718-19.219
I didn't sing it just now.
DF-sbs-cc-buc-qs1m/DGbTKywfSxw-h1io_ru/F0__0.080-1.442
to gather strength.
DF-sbs-cc-buc-qs1m/DssUtj_qKf4-flgd_ru/F1__18.965-21.125
How am I supposed to start my life over from scratch?
DF-sbs-cc-buc-qs1m/mFpCHV8M_kU-rl64_ru/F0__10.090-12.492
Is this showing respect to the audience and the jury?
DF-sbs-cc-buc-qs1m/IspiUk6P7eM-9yhr_pt/F2__17.413-18.083
Never!
DF-sbs-cc-buc-qs1m/mtohEFEZLBE-e8hl_pt/M0__15.497-16.987
For God's sake, tell us more.
DF-sbs-cc-buc-qs1m/lTa1VcbYZEE-l411_fr/F0__4.570-5.100
Why?
DF-sbs-cc-buc-qs1m/t_GIRgw8uGo-lmu4_de/F0__0.160-3.920
The utility company has made our house stop smoking.
DF-sbs-cc-buc-qs1m/k4P0uTlDLCM-z6dd_it/F0__17.550-18.230
Bye!
DF-sbs-cc-buc-qs1m/DssUtj_qKf4-flgd_ru/F0__3.821-5.401
I'm the only one who's useless with you.
DF-sbs-cc-buc-qs1m/HibKRdG8Ie0-5q8j_es/F0__20.693-21.723
Got a problem with that?
DF-sbs-cc-buc-qs1m/b91pBJWJDhQ-dlsj_ru/F0__12.647-13.888
And please forgive me too.
DF-sbs-cc-buc-qs1m/GLA2YCQi_Rk-f1zo_fr/F1__15.589-17.119
That gives you two hours to leave the house.
DF-sbs-cc-buc-qs1m/xtiiG-k5ejA-uwwi_de/F0__14.674-15.934
I only know that it's coming.
DF-sbs-cc-buc-qs1m/DssUtj_qKf4-flgd_ru/F1__17.524-18.805
What did you expect?
DF-sbs-cc-buc-qs1m/ljsv6_fRwTU-v8c1_ru/M0__12.493-13.472
It's bait.
Next