| # | uttid | text |
baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_baseline_lats
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: /home/polovick/v2v_diff/ml/projects/ai-voice-cloning/dsat-basket-extended-refs-dur.json
batch_size: 1
gpus: 2
inference:
diff_steps: 400
exp: /home/polovick/v2v_diff/ml/projects/ai-voice-cloning/yt4_baseline_lats
gpt_generate_args:
do_sample: true
num_return_sequences: 50
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 0.75
vocoder: univnet
num_workers: 1
output_dir: dsat-cleared/yt4_baseline_lats__2024-07-30_03-28-45
ticket: QUALITY-54
basket_generation_git_hash: e0df79f1213deffbae77e909499694944e0746da
model_data_type: tts-cloning
ticket: QUALITY-54
version: 2024-07-30_03-28-45
|
encodec-inhousediff-sameinfer
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes__diff_nonorm_2codes_pretrained
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: false
diff_steps: 400
diffusion_exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloudness_delaypattern8/diff_nonorm_2codes_pretrained
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes
gpt_generate_args:
do_sample: true
num_return_sequences: 50
prefix_allowed_tokens_fn: encodec_interleaved_layers
repetition_penalty_activation_span: 4.0
repetition_penalty_span: 50.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
cdist_time_downsampling_factor: 2
mode: MBR
sakoe_chiba_radius: 24
top_k: 1
vocoder: bigvgan
num_workers: 1
output_dir: es_en_clean-dsat_mapping_encodec_mbrlat_inhdiff/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes__diff_nonorm_2codes_pretrained__2024-09-18_17-36-55
ticket: TTS-393
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-09-18_17-36-55
|
xcodec160k_1code_inhdiff20k
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_xcodec-opt-bigbatch__diffusion_yt4_xcodec
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: true
diff_steps: 400
diffusion_exp: /mount/s3/tts-binary-data-nb/dimdi-y/diffusion_yt4_xcodec
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_xcodec-opt-bigbatch
gpt_generate_args:
do_sample: true
num_return_sequences: 50
repetition_penalty_activation_span: 4.0
repetition_penalty_span: 50.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
sakoe_chiba_radius: 16
top_k: 1
vocoder: bigvgan
num_workers: 1
output_dir: es_en_clean-dsat_mapping_xcodec_mbrlat_inhdiff/yt4_langbycond_revgrad1_xcodec-opt-bigbatch__diffusion_yt4_xcodec__2024-10-02_15-50-47
ticket: TTS-393
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-10-02_15-50-47
|
wavtokeniser
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: true
diff_steps: 400
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
gpt_generate_args:
do_sample: true
num_return_sequences: 50
repetition_penalty_activation_span: 1.0
repetition_penalty_span: 100.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
sakoe_chiba_radius: 24
top_k: 1
vocoder: none
num_workers: 1
output_dir: es_en_clean-dsat_mapping_xcodec_mbrlat_codecdec/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc__2024-10-29_09-42-52
ticket: TTS-392
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-392
version: 2024-10-29_09-42-52
|
wavtokeniser_normloud
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: true
diff_steps: 400
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
force_reference_std: -23
gpt_generate_args:
do_sample: true
num_return_sequences: 50
repetition_penalty_activation_span: 1.0
repetition_penalty_span: 100.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
sakoe_chiba_radius: 24
top_k: 1
vocoder: none
num_workers: 1
output_dir: es_en_clean-dsat_mapping_xcodec_mbrlat_codecdec/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc__2024-10-29_09-58-08
ticket: TTS-392
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-392
version: 2024-10-29_09-58-08
|
wavtokeniser_normloud_lesspenalty
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
lang: en
meta:
basket_generation_config:
basket_lang: en
basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_cleared_721.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_on_codes: true
diff_steps: 400
exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc
force_reference_std: -23
gpt_generate_args:
do_sample: true
num_return_sequences: 50
repetition_penalty: 1.5
repetition_penalty_activation_span: 5.0
repetition_penalty_span: 100.0
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
c50: 0.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
sakoe_chiba_radius: 24
top_k: 1
vocoder: none
num_workers: 1
output_dir: es_en_clean-dsat_mapping_xcodec_mbrlat_codecdec/yt4_langbycond_revgrad1_wavtokenizer-opt-bigbatch_t5enc__2024-10-29_13-45-07
ticket: TTS-392
basket_generation_git_hash: 75e464c6d886d92ef5b904f41695658ca2bc7545
model_data_type: tts-cloning
ticket: TTS-392
version: 2024-10-29_13-45-07
|
|---|---|---|---|---|---|---|---|---|
|
0
|
bardot_fr_F0/bardot_fr_F0_0000
|
Here!
|
||||||
|
1
|
bardot_fr_F0/bardot_fr_F0_0001
|
Here's the new version of Babette.
|
||||||
|
2
|
bardot_fr_F0/bardot_fr_F0_0002
|
Oury has changed everything, it's night and day!
|
||||||
|
3
|
bardot_fr_F1/bardot_fr_F1_0003
|
Isn't he an actor?
|
||||||
|
4
|
bardot_fr_F0/bardot_fr_F0_0004
|
Now he writes, he's very talented.
|
||||||
|
5
|
bardot_fr_F0/bardot_fr_F0_0005
|
You read fast, don't you, please?
|
||||||
|
6
|
bardot_fr_F1/bardot_fr_F1_0006
|
That's a cute one.
|
||||||
|
7
|
bardot_fr_F1/bardot_fr_F1_0007
|
Ah, it's Charrier...
|
||||||
|
8
|
bardot_fr_F0/bardot_fr_F0_0008
|
He's the up-and-coming actor.
|
||||||
|
9
|
bardot_fr_F0/bardot_fr_F0_0009
|
Didn't you see Carné's Les Tricheurs?
|
||||||
|
10
|
bardot_fr_F1/bardot_fr_F1_0010
|
Not yet.
|
||||||
|
11
|
bardot_fr_F0/bardot_fr_F0_0011
|
This one is very interesting...
|
||||||
|
12
|
bardot_fr_F1/bardot_fr_F1_0012
|
A mouthful... Beautiful mouth.
|
||||||
|
13
|
bardot_fr_F1/bardot_fr_F1_0013
|
We'll have to see.
|
||||||
|
14
|
bardot_fr_F0/bardot_fr_F0_0014
|
He is currently filming with a young man, the same band...
|
||||||
|
15
|
bardot_fr_F1/bardot_fr_F1_0015
|
Who?
|
||||||
|
16
|
bardot_fr_F0/bardot_fr_F0_0016
|
Jean Luc quelque chose, a first film.
|
||||||
|
17
|
bardot_fr_F1/bardot_fr_F1_0017
|
Why do you make me meet only old directors?
|
||||||
|
18
|
bardot_fr_F1/bardot_fr_F1_0018
|
I am 24 years old.
|
||||||
|
19
|
bardot_fr_F1/bardot_fr_F1_0019
|
Am I already too old for young people?
|
||||||
|
20
|
bardot_fr_F0/bardot_fr_F0_0020
|
Everyone wants to meet you!
|
||||||
|
21
|
bardot_fr_F1/bardot_fr_F1_0021
|
Yes, well, meeting me, looking at me like I'm a freak.
|
||||||
|
22
|
bardot_fr_F1/bardot_fr_F1_0022
|
"The new wave."
|
||||||
|
23
|
bardot_fr_F1/bardot_fr_F1_0023
|
Am I already at the Musée Grévin for them?
|
||||||
|
24
|
bardot_fr_F0/bardot_fr_F0_0024
|
Waves come and go.
|
||||||
|
25
|
bardot_fr_F0/bardot_fr_F0_0025
|
Look, Carné.
|
||||||
|
26
|
bardot_fr_F0/bardot_fr_F0_0026
|
He's almost 60 and his film about young people is a triumph.
|
||||||
|
27
|
bardot_fr_F1/bardot_fr_F1_0027
|
What's his actor's name again?
|
||||||
|
28
|
bardot_fr_F0/bardot_fr_F0_0028
|
Jacques Charrier.
|
||||||
|
29
|
bardot_fr_F0/bardot_fr_F0_0029
|
Let me know what you think...
|