| # | uttid | text |
baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_baseline_lats
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: /home/polovick/v2v_diff/ml/projects/ai-voice-cloning/dsat-basket-extended-refs-dur.json
batch_size: 1
gpus: 2
inference:
diff_steps: 400
exp: /home/polovick/v2v_diff/ml/projects/ai-voice-cloning/yt4_baseline_lats
gpt_generate_args:
do_sample: true
num_return_sequences: 50
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 0.75
vocoder: univnet
num_workers: 1
output_dir: dsat-cleared/yt4_baseline_lats__2024-07-30_03-28-45
ticket: QUALITY-54
basket_generation_git_hash: e0df79f1213deffbae77e909499694944e0746da
model_data_type: tts-cloning
ticket: QUALITY-54
version: 2024-07-30_03-28-45
|
encodec-inhousediff-sameinfer
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes__diff_nonorm_2codes_pretrained
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: false
diff_steps: 400
diffusion_exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloudness_delaypattern8/diff_nonorm_2codes_pretrained
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes
gpt_generate_args:
do_sample: true
num_return_sequences: 50
prefix_allowed_tokens_fn: encodec_interleaved_layers
repetition_penalty_activation_span: 4.0
repetition_penalty_span: 50.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
cdist_time_downsampling_factor: 2
mode: MBR
sakoe_chiba_radius: 24
top_k: 1
vocoder: bigvgan
num_workers: 1
output_dir: es_en_clean-dsat_mapping_encodec_mbrlat_inhdiff/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes__diff_nonorm_2codes_pretrained__2024-09-18_17-36-55
ticket: TTS-393
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-09-18_17-36-55
|
xcodec160k_1code_inhdiff20k
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_xcodec-opt-bigbatch__diffusion_yt4_xcodec
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: true
diff_steps: 400
diffusion_exp: /mount/s3/tts-binary-data-nb/dimdi-y/diffusion_yt4_xcodec
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_xcodec-opt-bigbatch
gpt_generate_args:
do_sample: true
num_return_sequences: 50
repetition_penalty_activation_span: 4.0
repetition_penalty_span: 50.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
sakoe_chiba_radius: 16
top_k: 1
vocoder: bigvgan
num_workers: 1
output_dir: es_en_clean-dsat_mapping_xcodec_mbrlat_inhdiff/yt4_langbycond_revgrad1_xcodec-opt-bigbatch__diffusion_yt4_xcodec__2024-10-02_15-50-47
ticket: TTS-393
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-10-02_15-50-47
|
wavtokeniser
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: true
diff_steps: 400
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
gpt_generate_args:
do_sample: true
num_return_sequences: 50
repetition_penalty_activation_span: 1.0
repetition_penalty_span: 100.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
sakoe_chiba_radius: 24
top_k: 1
vocoder: none
num_workers: 1
output_dir: es_en_clean-dsat_mapping_xcodec_mbrlat_codecdec/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc__2024-10-29_09-42-52
ticket: TTS-392
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-392
version: 2024-10-29_09-42-52
|
wavtokeniser_normloud
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: true
diff_steps: 400
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
force_reference_std: -23
gpt_generate_args:
do_sample: true
num_return_sequences: 50
repetition_penalty_activation_span: 1.0
repetition_penalty_span: 100.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
sakoe_chiba_radius: 24
top_k: 1
vocoder: none
num_workers: 1
output_dir: es_en_clean-dsat_mapping_xcodec_mbrlat_codecdec/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc__2024-10-29_09-58-08
ticket: TTS-392
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-392
version: 2024-10-29_09-58-08
|
wavtokeniser_normloud_lesspenalty
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: true
diff_steps: 400
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
force_reference_std: -23
gpt_generate_args:
do_sample: true
num_return_sequences: 50
repetition_penalty: 1.5
repetition_penalty_activation_span: 5.0
repetition_penalty_span: 100.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
sakoe_chiba_radius: 24
top_k: 1
vocoder: none
num_workers: 1
output_dir: es_en_clean-dsat_mapping_xcodec_mbrlat_codecdec/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc__2024-10-29_13-45-07
ticket: TTS-392
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-392
version: 2024-10-29_13-45-07
|
|---|---|---|---|---|---|---|---|---|
|
630
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0059
|
I do want to be here, but not to work.
|
||||||
|
631
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0060
|
No more to scrub my mom.
|
||||||
|
632
|
Dubbing_AD_TEST_dubf-cloned_es_M2/Dubbing_AD_TEST_dubf-cloned_es_M2_0061
|
I mean, how do I want to be here as a potted plant three or what, you don't understand?
|
||||||
|
633
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0062
|
Let's see, Rey, I don't need to work.
|
||||||
|
634
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0063
|
Ok.
|
||||||
|
635
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0064
|
Let's see, understand me.
|
||||||
|
636
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0065
|
My thing, my thing is horseback riding.
|
||||||
|
637
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0066
|
It is my passion.
|
||||||
|
638
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0067
|
I love it.
|
||||||
|
639
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0068
|
It's what I've done all my life.
|
||||||
|
640
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0069
|
And I had a place to do it in the United States, I had a place to do it in Nogales, but I have no place to do it here.
|
||||||
|
641
|
Dubbing_AD_TEST_dubf-cloned_es_F2/Dubbing_AD_TEST_dubf-cloned_es_F2_0070
|
So, I want to find a good place in Chile in Holland.
|
||||||
|
642
|
Dubbing_AD_TEST_dubf-cloned_es_M2/Dubbing_AD_TEST_dubf-cloned_es_M2_0071
|
Well, let's look for it.
|
||||||
|
643
|
Dubbing_AD_TEST_dubf-cloned_es_M2/Dubbing_AD_TEST_dubf-cloned_es_M2_0072
|
There must be thousands of places.
|
||||||
|
644
|
Dubbing_AD_TEST_dubf-cloned_es_F0/Dubbing_AD_TEST_dubf-cloned_es_F0_0073
|
So, why don't we go straight against Gómez Labrador?
|
||||||
|
645
|
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0074
|
You know what I'm talking about, you're a smart woman.
|
||||||
|
646
|
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0075
|
Look, just stop spreading terror in the news.
|
||||||
|
647
|
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0076
|
Look, if we agree, I can help you with your political aspirations.
|
||||||
|
648
|
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0077
|
Here.
|
||||||
|
649
|
Dubbing_AD_TEST_dubf-cloned_es_F0/Dubbing_AD_TEST_dubf-cloned_es_F0_0078
|
Really?
|
||||||
|
650
|
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0079
|
What?
|
||||||
|
651
|
Dubbing_AD_TEST_dubf-cloned_es_F0/Dubbing_AD_TEST_dubf-cloned_es_F0_0080
|
I don't know.
|
||||||
|
652
|
Dubbing_AD_TEST_dubf-cloned_es_F0/Dubbing_AD_TEST_dubf-cloned_es_F0_0081
|
It is that.
|
||||||
|
653
|
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0082
|
What?
|
||||||
|
654
|
Dubbing_AD_TEST_dubf-cloned_es_F0/Dubbing_AD_TEST_dubf-cloned_es_F0_0083
|
I do not like to be associated with corruption.
|
||||||
|
655
|
Dubbing_AD_TEST_dubf-cloned_es_F0/Dubbing_AD_TEST_dubf-cloned_es_F0_0084
|
I can't believe you have this here.
|
||||||
|
656
|
Dubbing_AD_TEST_dubf-cloned_es_F0/Dubbing_AD_TEST_dubf-cloned_es_F0_0085
|
It is a marvel.
|
||||||
|
657
|
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0086
|
Yes.
|
||||||
|
658
|
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0087
|
In fact, the president gave it to me as a gift.
|
||||||
|
659
|
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0088
|
Allow me.
|