# | text |
baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json data_meta: null exp_name: yt4_baseline_lats lang: en meta: basket_generation_config: basket_lang: en basket_path: /home/polovick/v2v_diff/ml/projects/ai-voice-cloning/projects-bucket-pack.json batch_size: 1 gpus: 2 inference: diff_steps: 400 exp: yt4_baseline_lats/ gpt_generate_args: do_sample: true num_return_sequences: 50 override_conditioning_features: c50: 0.0 pitch_std: 100.0 snr: 100.0 reranking_options: mode: MBR top_k: 1 target_len_rate: 0.75 vocoder: univnet num_workers: 1 output_dir: projects_pack_1/yt4_baseline_lats__2024-06-27_12-43-45 ticket: TTS-388 basket_generation_git_hash: 3ad347e2f731481af82dafbe72aa4daa136f907b model_data_type: tts-cloning ticket: TTS-388 version: 2024-06-27_12-43-45 |
encodec_mbr
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json data_meta: null exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch lang: en meta: basket_generation_config: basket_lang: en basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json batch_size: 1 gpus: 2 inference: condition_sample_rate: 24000 diff_on_codes: false diff_steps: 400 exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch gpt_generate_args: do_sample: true num_return_sequences: 50 prefix_allowed_tokens_fn: encodec_interleaved_layers repetition_penalty_span: 50.0 use_cache: true override_conditioning_features: c50: 0.0 snr: 100.0 reranking_options: cdist_time_downsampling_factor: 6 mode: MBR top_k: 1 vocoder: none num_workers: 1 output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1_encodec-opt-bigbatch__2024-07-09_23-56-02 ticket: TTS-393 basket_generation_git_hash: c8fbcc9a0f18330789b7a4441a1efbeea1019935 model_data_type: tts-cloning ticket: TTS-393 version: 2024-07-09_23-56-02 |
encodec_mbr_24kfix
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json data_meta: null exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch lang: en meta: basket_generation_config: basket_lang: en basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json batch_size: 1 gpus: 1 inference: condition_sample_rate: 24000 diff_on_codes: false diff_steps: 400 exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch/ gpt_generate_args: do_sample: true num_return_sequences: 50 prefix_allowed_tokens_fn: encodec_interleaved_layers repetition_penalty_span: 50.0 use_cache: true out_sample_rate: 48000 override_conditioning_features: snr: 100.0 reranking_options: cdist_time_downsampling_factor: 6 mode: MBR top_k: 1 vocoder: none num_workers: 1 output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1_encodec-opt-bigbatch__2024-07-22_14-21-18 ticket: TTS-393 basket_generation_git_hash: 37cb3542e38cc2685aebaf1d162ad5a0b7140f8e model_data_type: tts-cloning ticket: TTS-393 version: 2024-07-22_14-21-18 |
encodec_mbr_24kfix-inhousediff-overrides
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json data_meta: null exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes lang: en meta: basket_generation_config: basket_lang: en basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json batch_size: 1 gpus: 1 inference: condition_sample_rate: 24000 diff_on_codes: false diff_steps: 400 exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes gpt_generate_args: do_sample: true num_return_sequences: 50 prefix_allowed_tokens_fn: encodec_interleaved_layers repetition_penalty_span: 50.0 use_cache: true out_sample_rate: 24000 override_conditioning_features: c50: 0.0 pitch_std: 100.0 snr: 100.0 reranking_options: cdist_time_downsampling_factor: 2 mode: MBR sakoe_chiba_radius: 24 top_k: 1 vocoder: bigvgan num_workers: 1 output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness_inhdiff/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes__2024-08-02_03-20-48 ticket: TTS-393 basket_generation_git_hash: 5707d4c683a4b30e1858324363726a1e6d05bdd8 model_data_type: tts-cloning ticket: TTS-393 version: 2024-08-02_03-20-48 |
encodec_mbr_24kfix-normref
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json data_meta: null exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch lang: en meta: basket_generation_config: basket_lang: en basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json batch_size: 1 gpus: 1 inference: condition_sample_rate: 24000 diff_on_codes: false diff_steps: 400 exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch/ force_reference_std: -23 gpt_generate_args: do_sample: true num_return_sequences: 50 prefix_allowed_tokens_fn: encodec_interleaved_layers repetition_penalty_span: 50.0 use_cache: true out_sample_rate: 48000 override_conditioning_features: snr: 100.0 reranking_options: cdist_time_downsampling_factor: 6 mode: MBR top_k: 1 vocoder: none num_workers: 1 output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1_encodec-opt-bigbatch__2024-07-22_16-15-37 ticket: TTS-393 basket_generation_git_hash: 37cb3542e38cc2685aebaf1d162ad5a0b7140f8e model_data_type: tts-cloning ticket: TTS-393 version: 2024-07-22_16-15-37 |
encodec_mbr_24kfix-inhousediff-overrides-normloud
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json data_meta: null exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes lang: en meta: basket_generation_config: basket_lang: en basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json batch_size: 1 gpus: 1 inference: condition_sample_rate: 24000 diff_on_codes: false diff_steps: 400 exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes force_reference_std: -23 gpt_generate_args: do_sample: true num_return_sequences: 50 prefix_allowed_tokens_fn: encodec_interleaved_layers repetition_penalty_span: 50.0 use_cache: true out_sample_rate: 24000 override_conditioning_features: c50: 0.0 pitch_std: 100.0 snr: 100.0 reranking_options: cdist_time_downsampling_factor: 2 mode: MBR sakoe_chiba_radius: 24 top_k: 1 vocoder: bigvgan num_workers: 1 output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness_inhdiff/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes__2024-08-02_10-29-24 ticket: TTS-393 basket_generation_git_hash: 5707d4c683a4b30e1858324363726a1e6d05bdd8 model_data_type: tts-cloning ticket: TTS-393 version: 2024-08-02_10-29-24 |
encodec_mbr_normloud-contr-oversnr-dfnet
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json data_meta: null exp_name: yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud lang: en meta: basket_generation_config: basket_lang: en basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json batch_size: 1 gpus: 1 inference: condition_sample_rate: 24000 diff_on_codes: false diff_steps: 400 exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud/ force_reference_std: -21.5 gpt_generate_args: do_sample: true num_return_sequences: 50 prefix_allowed_tokens_fn: encodec_interleaved_layers repetition_penalty_span: 50.0 use_cache: true out_sample_rate: 48000 override_conditioning_features: snr: 100.0 reranking_options: cdist_time_downsampling_factor: 6 mode: MBR top_k: 1 vocoder: none num_workers: 1 output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud__2024-07-14_18-13-45 ticket: TTS-393 basket_generation_git_hash: c8fbcc9a0f18330789b7a4441a1efbeea1019935 model_data_type: tts-cloning ticket: TTS-393 version: 2024-07-14_18-13-45 |
encodec_mbr_normloud-contr-oversnr-dfnet-24kfix
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json data_meta: null exp_name: yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud lang: en meta: basket_generation_config: basket_lang: en basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json batch_size: 1 gpus: 1 inference: condition_sample_rate: 24000 diff_on_codes: false diff_steps: 400 exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud/ force_reference_std: -21.5 gpt_generate_args: do_sample: true num_return_sequences: 50 prefix_allowed_tokens_fn: encodec_interleaved_layers repetition_penalty_span: 50.0 use_cache: true out_sample_rate: 48000 override_conditioning_features: snr: 100.0 reranking_options: cdist_time_downsampling_factor: 6 mode: MBR top_k: 1 vocoder: none num_workers: 1 output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud__2024-07-22_14-43-07 ticket: TTS-393 basket_generation_git_hash: 37cb3542e38cc2685aebaf1d162ad5a0b7140f8e model_data_type: tts-cloning ticket: TTS-393 version: 2024-07-22_14-43-07 |
---|---|---|---|---|---|---|---|---|---|
240
|
Well... it's a bit crooked,
|
||||||||
241
|
But you can't see the pillow.
|
||||||||
242
|
Oh my! Well, I see it very well!
|
||||||||
243
|
The truth is that I had never done a girl's hair before, Chelita.
|
||||||||
244
|
That's why I relied on the internet video, the one you see there, look.
|
||||||||
245
|
But it kept you from going to your first day of school as a listener.
|
||||||||
246
|
Thank you for making me pretty, Emmanuel.
|
||||||||
247
|
No Chelita, I didn't do anything.
|
||||||||
248
|
You were born beautiful!
|
||||||||
249
|
I just combed your hair.
|
||||||||
250
|
That's it!
|
||||||||
251
|
It starts without any fuss.
|
||||||||
252
|
You are number one in the Escandon.
|
||||||||
253
|
We only do our job well, Chelita, so that the customer leaves happy and comes back.
|
||||||||
254
|
When I get a car, I'm sure I'll bring it with you so it's in range.
|
||||||||
255
|
You are still too young to think about that.
|
||||||||
256
|
Hey...
|
||||||||
257
|
but would you like to maneuver the steering wheel?
|
||||||||
258
|
Yes, yes, yes!
|
||||||||
259
|
Yes?
|
||||||||
260
|
Come here then!
|
||||||||
261
|
Be careful, eh? Don't go throwing a cow.
|
||||||||
262
|
Look, like this...
|
||||||||
263
|
You will grip the steering wheel with both hands.
|
||||||||
264
|
Yes?
|
||||||||
265
|
And you hit it one way, and you hit it the other.
|
||||||||
266
|
Come on, huh?
|
||||||||
267
|
At some point, I even become a racing driver.
|
||||||||
268
|
I'm sure it is.
|
||||||||
269
|
Look, come on.
|