| # | uttid | text |
baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_042025_to_en_mini_100.json
data_meta: null
exp_name: gpt_yt4_langbycond_25freq_fsq_entropy__noclearvoice
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/dsat_042025_to_en_mini_100.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
disable_optimized_diffusion: true
exp: /mount/s3/tts-binary-data-nb/dchebakov/models/gpt_yt4_langbycond_25freq_fsq_entropy__noclearvoice/
gpt_generate_args:
do_sample: true
enforce_silent_start: wavtokenizer
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing:
- deepfilternet
num_workers: 1
output_dir: dsat_042025_to_en_mini/gpt_yt4_langbycond_25freq_fsq_entropy__noclearvoice__2025-07-07_09-23-19
ref_dir: dsat_042025_to_en_mini/ref
ticket: QUALITY-41
basket_generation_git_hash: e961ea383299ff424f66fd9505a4c7b12ba65799
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-07-07_09-23-19
|
freq_feats
basket_config_path: quality/tts/tortoise-baskets/dsat_042025_to_en_mini_100.json
data_meta: null
exp_name: gpt_yt4_langbycond_25freq_fsq_entropy__noclearvoice__diffusion_yt4_wavtokenizer_freq_feats_noref
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/dsat_042025_to_en_mini_100.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/diffusion_yt4_wavtokenizer_freq_feats_noref/
disable_optimized_diffusion: true
exp: /mount/s3/tts-binary-data-nb/dchebakov/models/gpt_yt4_langbycond_25freq_fsq_entropy__noclearvoice/
gpt_generate_args:
do_sample: true
enforce_silent_start: wavtokenizer
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing:
- deepfilternet
num_workers: 1
output_dir: dsat_042025_to_en_mini/gpt_yt4_langbycond_25freq_fsq_entropy__noclearvoice__diffusion_yt4_wavtokenizer_freq_feats_noref__2025-07-07_09-23-20
ref_dir: dsat_042025_to_en_mini/ref
ticket: QUALITY-41
basket_generation_git_hash: e961ea383299ff424f66fd9505a4c7b12ba65799
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-07-07_09-23-20
|
freq_feats_cv
basket_config_path: quality/tts/tortoise-baskets/dsat_042025_to_en_mini_100.json
data_meta: null
exp_name: gpt_yt4_langbycond_25freq_fsq_entropy__noclearvoice__diffusion_yt4_wavtokenizer_freq_feats_noref_condcv
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/dsat_042025_to_en_mini_100.json
batch_size: 1
gpus: 1
inference:
condition_sample_rate: 24000
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/diffusion_yt4_wavtokenizer_freq_feats_noref_condcv/
disable_optimized_diffusion: true
exp: /mount/s3/tts-binary-data-nb/dchebakov/models/gpt_yt4_langbycond_25freq_fsq_entropy__noclearvoice/
gpt_generate_args:
do_sample: true
enforce_silent_start: wavtokenizer
num_return_sequences: 50
use_cache: true
out_sample_rate: 24000
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
pitch_std: 100.0
snr: 100.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing:
- deepfilternet
num_workers: 1
output_dir: dsat_042025_to_en_mini/gpt_yt4_langbycond_25freq_fsq_entropy__noclearvoice__diffusion_yt4_wavtokenizer_freq_feats_noref_condcv__2025-07-07_09-23-19
ref_dir: dsat_042025_to_en_mini/ref
ticket: QUALITY-41
basket_generation_git_hash: e961ea383299ff424f66fd9505a4c7b12ba65799
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-07-07_09-23-19
|
dvae_freq_feats
basket_config_path: quality/tts/tortoise-baskets/dsat_042025_to_en_mini_100.json
data_meta: null
exp_name: yt4_en_accent_clf_entropy_t5__diffusion_yt4_en_accent_clf_entropy_t5_freq_feats_EN_noref
lang: en-us
meta:
basket_generation_config:
basket_lang: en-us
basket_path: quality/tts/tortoise-baskets/dsat_042025_to_en_mini_100.json
batch_size: 1
gpus: 1
inference:
diff_k: 3
diff_steps: 100
diffusion_exp: /mount/s3/tts-binary-data-nb/eg/exp/diffusion_yt4_en_accent_clf_entropy_t5_freq_feats_EN_noref/
disable_optimized_diffusion: true
exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_en_accent_clf_entropy_t5/
gpt_generate_args:
do_sample: true
enforce_silent_start: true
num_return_sequences: 50
use_cache: true
override_conditioning_features:
bad_text_proba: 0.0
c50: 0.0
dmcs_flatness: 100500.0
dmcs_roll_off_0.995: 100500.0
pitch_std: 100500.0
snr: 100500.0
reranking_options:
mode: MBR
top_k: 1
target_len_rate: 1.0
vocoder: bigvgan
voice_samples_preprocessing:
- deepfilternet
num_workers: 1
output_dir: dsat_042025_to_en_mini/yt4_en_accent_clf_entropy_t5__diffusion_yt4_en_accent_clf_entropy_t5_freq_feats_EN_noref__2025-06-02_13-57-41
ref_dir: dsat_042025_to_en_mini/ref
ticket: QUALITY-41
basket_generation_git_hash: c185fc1cf93b68974cf48ed189a1c77d4535cc35
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-06-02_13-57-41
|
|---|---|---|---|---|---|---|
|
IYUNOBokyeom-TV-od3h__Bo-chelin-at-Mingles_Final-29-6euy_ko/M0__220.223-220.893
|
however.
|
|||||
|
IYUNOKonrev_Bla-5xua__Soul-Scandal-Season-1_250310-z2ow_ko/F1__454.166-454.549
|
What
|
|||||
|
IYUNOBokyeom-TV-r1be__Bo-chelin-at-Mingles_Final-29-kvq3_ko/M0__538.075-539.937
|
You'll know what kind of murder it is when you chew on it.
|
|||||
|
IYUNOTTS-Manage-wvxp__Unmaksed-sample-2-video-2xs8_ko/M2__45.717-47.411
|
He was at a motel with his church member.
|
|||||
|
CB-4-min-test-onmv__H_MAGISSA_S01_E004-part1-lowre-d632_el/M0__71.011-71.525
|
Cry??
|
|||||
|
NETFLIX-test-proje-698i__JP-test-clip-1f6q_pt/M1__259.693-261.327
|
I got a test for Formula Ford.
|
|||||
|
CSHARP-DEMO-SAMPL-gnpv__Hindi-Low-Sample-79ll_zh/F0__57.918-59.659
|
when I wear these kinds of stockings?
|
|||||
|
MELSDerniere_s-s478__DerniereSeconde_S01-E01_SansPa-cs7j_fr/M1__15.142-16.859
|
Are you still in shock this morning?
|
|||||
|
DC-Test-Russe-alk2__Test-Russe-en-Chinois-9eow_ru/M0__101.681-105.305
|
you wouldn't guess it, but tonight you'll see L. A. like you've never seen it before.
|
|||||
|
CB-Chinese-mi-idgm__CHINESE_DUBBING_VIDEO-kni9_zh/F0__4.668-7.364
|
Grandma...I've barely said anything, and you…
|
|||||
|
DC-Profession-nwje__Folge-5-Vanessa-djwo_de/F0__28.009-34.399
|
When I was invited to come in for an interview with Hoffmann-Personal, I have to say that I immediately felt at home.
|
|||||
|
IYUNOWoowakgood-23lu__Woowakgood_Sample-58g4_ko/M2__83.010-85.272
|
I don't think we're gonna be able to punch our way through this.
|
|||||
|
IYUNOKonrev_Bla-5xua__Blah-Season-1_250310-hdwk_ko/F2__541.448-543.772
|
But I'm just not sure yet if I actually want to date you.
|
|||||
|
DC-Profession-nwje__Folge-1-Astar-yejb_de/F0__35.297-38.083
|
And that kind of stuff just didn't fit into their worldview at all.
|
|||||
|
IYUNOKonrev_Bla-5xua__Blah-Season-1_250310-hdwk_ko/M2__500.656-501.472
|
she would be it.
|
|||||
|
DC-Profession-nwje__Folge-5-Vanessa-djwo_de/F0__88.349-93.100
|
When the valves open up and you get that engine sound and you have loud music blaring on the stereo...
|
|||||
|
IYUNOKonrev_Bla-5xua__Blah-Season-1_250310-hdwk_ko/F1__86.167-88.550
|
I can't get fired again, but things aren't looking great.
|
|||||
|
CB-WINGED-TES-1jcc__vlc-record-2025-03-31-09h49m41-06pp_pt/F3__144.965-151.035
|
Exactly! In our families, everyone is connected to each other by a cord of love.
|
|||||
|
CB-4-min-test-onmv__H_MAGISSA_S01_E004-part1-lowre-d632_el/M1__130.863-132.713
|
You want us to slaughter each other over a stranger?
|
|||||
|
IYUNOKonrev_Bla-5xua__Blah-Season-1_250310-hdwk_ko/F1__85.423-85.670
|
Yup.
|