Prev
# uttid text baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_diff_seed_vc_unnorm_mels_40k
lang: es
meta:
  basket_generation_config:
    basket_lang: es
    basket_path: /home/user/v2v/quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 1
    gpus: 4
    inference:
      diff_k: 3
      diff_steps: 400
      exp: /mount/s3/tts-binary-data-nb/polovick/exp/yt4_diff_seed_vc_unnorm_mels_40k
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 0.75
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_basket/yt4_diff_seed_vc_unnorm_mels_40k__2024-10-30_16-13-40
    ticket: ABC-123
  basket_generation_git_hash: b12c0445eb8945bffbe718d1db06d035ee3dc405
model_data_type: tts-cloning
ticket: ABC-123
version: 2024-10-30_16-13-40
baseline-old-diff
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_baseline_lats
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: /home/polovick/v2v_diff/ml/projects/ai-voice-cloning/dsat-basket-extended-refs-dur.json
    batch_size: 1
    gpus: 2
    inference:
      diff_steps: 400
      exp: /home/polovick/v2v_diff/ml/projects/ai-voice-cloning/yt4_baseline_lats
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
      override_conditioning_features:
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 0.75
      vocoder: univnet
    num_workers: 1
    output_dir: dsat-cleared/yt4_baseline_lats__2024-07-30_03-28-45
    ticket: QUALITY-54
  basket_generation_git_hash: e0df79f1213deffbae77e909499694944e0746da
model_data_type: tts-cloning
ticket: QUALITY-54
version: 2024-07-30_03-28-45
wavtok
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: gpt_defaultparams
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_on_codes: true
      diff_steps: 100
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_wavtok_inhouse/gpt_defaultparams/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        repetition_penalty: 3.0
        repetition_penalty_activation_span: 2.0
        repetition_penalty_span: 100.0
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        sakoe_chiba_radius: 24
        top_k: 1
      vocoder: none
    num_workers: 1
    output_dir: es_en_clean-dsat_mapping_wavtok_inhouse_nonorm/gpt_defaultparams__2024-11-26_14-11-07
    ticket: TTS-392
  basket_generation_git_hash: 7411c8d2f9b7ef2384f924f4b0f97566f8bc7899
model_data_type: tts-cloning
ticket: TTS-392
version: 2024-11-26_14-11-07
wavtok-diff
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: gpt_defaultparams__diff
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_on_codes: true
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_wavtok_inhouse/diff
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_wavtok_inhouse/gpt_defaultparams/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        repetition_penalty: 3.0
        repetition_penalty_activation_span: 2.0
        repetition_penalty_span: 100.0
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        sakoe_chiba_radius: 24
        top_k: 1
      vocoder: bigvgan
    num_workers: 1
    output_dir: es_en_clean-dsat_mapping_wavtok_inhouse_nonorm/gpt_defaultparams__diff__2024-11-26_14-13-08
    ticket: TTS-392
  basket_generation_git_hash: 7411c8d2f9b7ef2384f924f4b0f97566f8bc7899
model_data_type: tts-cloning
ticket: TTS-392
version: 2024-11-26_14-13-08
wavtok-diff_resampled
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: gpt_defaultparams__diff_resampled
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_on_codes: true
      diff_steps: 100
      diffusion_exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_wavtok_inhouse/diff_resampled/
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_wavtok_inhouse/gpt_defaultparams/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        repetition_penalty: 3.0
        repetition_penalty_activation_span: 2.0
        repetition_penalty_span: 100.0
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        sakoe_chiba_radius: 24
        top_k: 1
      vocoder: bigvgan
    num_workers: 1
    output_dir: es_en_clean-dsat_mapping_wavtok_inhouse_nonorm/gpt_defaultparams__diff_resampled__2024-11-26_14-19-35
    ticket: TTS-392
  basket_generation_git_hash: 7411c8d2f9b7ef2384f924f4b0f97566f8bc7899
model_data_type: tts-cloning
ticket: TTS-392
version: 2024-11-26_14-19-35
150
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0065
A French comrade.
151
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1_0066
Pleased to meet you.
152
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0_0067
Enchanté
153
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0068
And this bearded man is Albert, who is a contortionist in the circus.
154
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0069
He is an English journalist.
155
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2_0070
Enchanté, delighted.
156
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0_0071
Likewise.
157
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0072
Well no... we didn't see each other yesterday.
158
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1_0073
Is it true?
159
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0074
No.
160
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0075
How did you like my speech?
161
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2_0076
Well, a little too much...
162
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1_0077
I want too much!
163
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2_0078
Especially at the end. But...
164
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0079
Well... she wrote it.
165
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2_0080
Sorry, no, joke!
166
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1_0081
It was great! Really!
167
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M2_0082
It's great!
168
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F8/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F8_0083
First results.
169
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0084
Yes, let's go, let's go!
170
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M1_0085
Are you coming?
171
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0_0086
Yes.
172
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0087
It looks like we are going to win.
173
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0090
What's the matter, aren't you happy?
174
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0_0091
When are you leaving?
175
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0092
The day after tomorrow.
176
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0093
I am taking a train to Paris and from there... to Buenos Aires.
177
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0_0094
What am I going to do?
178
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_M0_0095
What?
179
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0_0096
What am I going to do?
Next