Prev
# uttid text ref baseline
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15__yt4_wavtokenizer_16K_lossent0.15
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        emotion: null
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15__yt4_wavtokenizer_16K_lossent0.15__2025-10-22_13-44-57
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-10-22_13-44-57
indextts indexref_none
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
      gpt_generate_args:
        do_sample: true
        min_new_tokens: 5
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        emotion: null
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate__2025-11-04_12-48-48
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-11-04_12-48-48
indexref_sad
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
      gpt_generate_args:
        do_sample: true
        emo_alpha: 1.0
        emo_vector:
        - 0.0
        - 0.0
        - 1.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        min_new_tokens: 5
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        emotion: null
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate__2025-11-04_13-30-03
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-11-04_13-30-03
indexref_angry
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
      gpt_generate_args:
        do_sample: true
        emo_alpha: 1.0
        emo_vector:
        - 0.0
        - 1.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        min_new_tokens: 5
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        emotion: null
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate__2025-11-04_13-16-16
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-11-04_13-16-16
indexref_happy
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
      gpt_generate_args:
        do_sample: true
        emo_alpha: 1.0
        emo_vector:
        - 1.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        min_new_tokens: 5
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        emotion: null
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate__2025-11-04_13-02-06
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-11-04_13-02-06
indexref_surprised
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
      gpt_generate_args:
        do_sample: true
        emo_alpha: 1.0
        emo_vector:
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 1.0
        - 0.0
        min_new_tokens: 5
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        emotion: null
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate__2025-11-04_13-57-04
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-11-04_13-57-04
indexref_melancholic
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
      gpt_generate_args:
        do_sample: true
        emo_alpha: 1.0
        emo_vector:
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 1.0
        - 0.0
        - 0.0
        min_new_tokens: 5
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        emotion: null
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate__2025-11-04_13-43-42
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-11-04_13-43-42
indexref_calm
basket_config_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
data_meta: null
exp_name: yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/cc_20250729_rudefritespt_to_en.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate
      gpt_generate_args:
        do_sample: true
        emo_alpha: 1.0
        emo_vector:
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 0.0
        - 1.0
        min_new_tokens: 5
        num_return_sequences: 50
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        dmcs_flatness: 100500.0
        dmcs_roll_off_0.995: 100500.0
        emo2vec: null
        emotion: null
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      vocoder: bigvgan
      voice_samples_preprocessing: []
    num_workers: 1
    output_dir: cc_20250725/yt4_wavtokenizer_16K_lossent0.15_indexrefencoder_separate__2025-11-04_14-13-27
    ref_dir: cc_20250725/ref
    ticket: QUALITY-41
  basket_generation_git_hash: 7ba982d9bb8ddc0cb968d517f583b0227d2624ed
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-11-04_14-13-27
DF-sbs-cc-buc-qs1m/7EqatsqEI-0-ldkm_ru/F0__3.966-5.728
It was the only keepsake I had of her.
DF-sbs-cc-buc-qs1m/ljsv6_fRwTU-v8c1_ru/F0__1.119-7.596
I think this is the most revolutionary feminist novel I've ever read.
DF-sbs-cc-buc-qs1m/31p-0IxN0XU-4jxf_de/F1__16.592-17.722
And now I have three.
DF-sbs-cc-buc-qs1m/IspiUk6P7eM-9yhr_pt/F3__7.050-8.500
Serve me!
DF-sbs-cc-buc-qs1m/eN-waporon0-vu63_de/M0__9.169-17.037
I saw her and in the evening, I would rather let my mother yell at me than talk to Claudia Knipping.