| # | text |
baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_baseline_lats
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: /home/polovick/v2v_diff/ml/projects/ai-voice-cloning/projects-bucket-pack.json
batch_size: 1
gpus: 2
inference:
diff_steps: 400
exp: yt4_baseline_lats/
gpt_generate_args:
do_sample: true
num_return_sequences: 50
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 0.75
vocoder: univnet
num_workers: 1
output_dir: projects_pack_1/yt4_baseline_lats__2024-06-27_12-43-45
ticket: TTS-388
basket_generation_git_hash: 3ad347e2f731481af82dafbe72aa4daa136f907b
model_data_type: tts-cloning
ticket: TTS-388
version: 2024-06-27_12-43-45
|
encodec_mbr_dsat
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
batch_size: 1
gpus: 2
inference:
condition_sample_rate: 24000
diff_on_codes: false
diff_steps: 400
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch
gpt_generate_args:
do_sample: true
num_return_sequences: 50
prefix_allowed_tokens_fn: encodec_interleaved_layers
repetition_penalty_span: 50.0
use_cache: true
override_conditioning_features:
c50: 0.0
snr: 100.0
reranking_options:
cdist_time_downsampling_factor: 6
mode: MBR
top_k: 1
vocoder: none
num_workers: 1
output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1_encodec-opt-bigbatch__2024-07-09_23-56-02
ticket: TTS-393
basket_generation_git_hash: c8fbcc9a0f18330789b7a4441a1efbeea1019935
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-07-09_23-56-02
|
encodec_mbr_normloud-contr-oversnr-dfnet
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: false
diff_steps: 400
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud/
force_reference_std: -21.5
gpt_generate_args:
do_sample: true
num_return_sequences: 50
prefix_allowed_tokens_fn: encodec_interleaved_layers
repetition_penalty_span: 50.0
use_cache: true
out_sample_rate: 48000
override_conditioning_features:
snr: 100.0
reranking_options:
cdist_time_downsampling_factor: 6
mode: MBR
top_k: 1
vocoder: none
num_workers: 1
output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud__2024-07-14_18-13-45
ticket: TTS-393
basket_generation_git_hash: c8fbcc9a0f18330789b7a4441a1efbeea1019935
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-07-14_18-13-45
|
|---|---|---|---|---|
|
690
|
Let's change, it's ours.
|
|||
|
691
|
As much as I love press appearances, as much as they fascinate me.
|
|||
|
692
|
Great dog.
|
|||
|
693
|
No.
|
|||
|
694
|
And well, for you.
|
|||
|
695
|
Your mom sends you her best regards, she sends you lots of hugs and she will be watching over you.
|
|||
|
696
|
Why didn't she come?
|
|||
|
697
|
Look, the important thing is that he's coming, eh?
|
|||
|
698
|
It is what is already to come.
|
|||
|
699
|
You saw it.
|
|||
|
700
|
And it's good, huh.
|
|||
|
701
|
It's the only one that matters.
|
|||
|
702
|
And why the hell didn't you get attracted to you?
|