Prev
# text baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_baseline_lats
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: /home/polovick/v2v_diff/ml/projects/ai-voice-cloning/projects-bucket-pack.json
    batch_size: 1
    gpus: 2
    inference:
      diff_steps: 400
      exp: yt4_baseline_lats/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
      override_conditioning_features:
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 0.75
      vocoder: univnet
    num_workers: 1
    output_dir: projects_pack_1/yt4_baseline_lats__2024-06-27_12-43-45
    ticket: TTS-388
  basket_generation_git_hash: 3ad347e2f731481af82dafbe72aa4daa136f907b
model_data_type: tts-cloning
ticket: TTS-388
version: 2024-06-27_12-43-45
encodec_mbr
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
    batch_size: 1
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_on_codes: false
      diff_steps: 400
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        prefix_allowed_tokens_fn: encodec_interleaved_layers
        repetition_penalty_span: 50.0
        use_cache: true
      override_conditioning_features:
        c50: 0.0
        snr: 100.0
      reranking_options:
        cdist_time_downsampling_factor: 6
        mode: MBR
        top_k: 1
      vocoder: none
    num_workers: 1
    output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1_encodec-opt-bigbatch__2024-07-09_23-56-02
    ticket: TTS-393
  basket_generation_git_hash: c8fbcc9a0f18330789b7a4441a1efbeea1019935
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-07-09_23-56-02
encodec_mbr_24kfix
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_on_codes: false
      diff_steps: 400
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        prefix_allowed_tokens_fn: encodec_interleaved_layers
        repetition_penalty_span: 50.0
        use_cache: true
      out_sample_rate: 48000
      override_conditioning_features:
        snr: 100.0
      reranking_options:
        cdist_time_downsampling_factor: 6
        mode: MBR
        top_k: 1
      vocoder: none
    num_workers: 1
    output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1_encodec-opt-bigbatch__2024-07-22_14-21-18
    ticket: TTS-393
  basket_generation_git_hash: 37cb3542e38cc2685aebaf1d162ad5a0b7140f8e
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-07-22_14-21-18
encodec_mbr_24kfix-inhousediff-overrides
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_on_codes: false
      diff_steps: 400
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        prefix_allowed_tokens_fn: encodec_interleaved_layers
        repetition_penalty_span: 50.0
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        cdist_time_downsampling_factor: 2
        mode: MBR
        sakoe_chiba_radius: 24
        top_k: 1
      vocoder: bigvgan
    num_workers: 1
    output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness_inhdiff/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes__2024-08-02_03-20-48
    ticket: TTS-393
  basket_generation_git_hash: 5707d4c683a4b30e1858324363726a1e6d05bdd8
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-08-02_03-20-48
encodec_mbr_24kfix-normref
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_on_codes: false
      diff_steps: 400
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch/
      force_reference_std: -23
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        prefix_allowed_tokens_fn: encodec_interleaved_layers
        repetition_penalty_span: 50.0
        use_cache: true
      out_sample_rate: 48000
      override_conditioning_features:
        snr: 100.0
      reranking_options:
        cdist_time_downsampling_factor: 6
        mode: MBR
        top_k: 1
      vocoder: none
    num_workers: 1
    output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1_encodec-opt-bigbatch__2024-07-22_16-15-37
    ticket: TTS-393
  basket_generation_git_hash: 37cb3542e38cc2685aebaf1d162ad5a0b7140f8e
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-07-22_16-15-37
encodec_mbr_24kfix-inhousediff-overrides-normloud
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_on_codes: false
      diff_steps: 400
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes
      force_reference_std: -23
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        prefix_allowed_tokens_fn: encodec_interleaved_layers
        repetition_penalty_span: 50.0
        use_cache: true
      out_sample_rate: 24000
      override_conditioning_features:
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        cdist_time_downsampling_factor: 2
        mode: MBR
        sakoe_chiba_radius: 24
        top_k: 1
      vocoder: bigvgan
    num_workers: 1
    output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness_inhdiff/yt4_langbycond_revgrad1_encodec-opt-bigbatch-diffcodes__2024-08-02_10-29-24
    ticket: TTS-393
  basket_generation_git_hash: 5707d4c683a4b30e1858324363726a1e6d05bdd8
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-08-02_10-29-24
encodec_mbr_normloud-contr-oversnr-dfnet
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_on_codes: false
      diff_steps: 400
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud/
      force_reference_std: -21.5
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        prefix_allowed_tokens_fn: encodec_interleaved_layers
        repetition_penalty_span: 50.0
        use_cache: true
      out_sample_rate: 48000
      override_conditioning_features:
        snr: 100.0
      reranking_options:
        cdist_time_downsampling_factor: 6
        mode: MBR
        top_k: 1
      vocoder: none
    num_workers: 1
    output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud__2024-07-14_18-13-45
    ticket: TTS-393
  basket_generation_git_hash: c8fbcc9a0f18330789b7a4441a1efbeea1019935
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-07-14_18-13-45
encodec_mbr_normloud-contr-oversnr-dfnet-24kfix
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
data_meta: null
exp_name: yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_5projects_704_fixedref.json
    batch_size: 1
    gpus: 1
    inference:
      condition_sample_rate: 24000
      diff_on_codes: false
      diff_steps: 400
      exp: /mount/s3/tts-binary-data-nb/dimdi-y/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud/
      force_reference_std: -21.5
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        prefix_allowed_tokens_fn: encodec_interleaved_layers
        repetition_penalty_span: 50.0
        use_cache: true
      out_sample_rate: 48000
      override_conditioning_features:
        snr: 100.0
      reranking_options:
        cdist_time_downsampling_factor: 6
        mode: MBR
        top_k: 1
      vocoder: none
    num_workers: 1
    output_dir: es_en_dsat_mapping_encodec_mbrlat_override_optimizeloudness/yt4_langbycond_revgrad1-contrastive_encodec-opt-bigbatch_normloud__2024-07-22_14-43-07
    ticket: TTS-393
  basket_generation_git_hash: 37cb3542e38cc2685aebaf1d162ad5a0b7140f8e
model_data_type: tts-cloning
ticket: TTS-393
version: 2024-07-22_14-43-07
180
The day after tomorrow.
181
I am taking a train to Paris and from there... to Buenos Aires.
182
What am I going to do?
183
What?
184
What am I going to do?
185
Well, come with me... To fight for our dreams.
186
Say something.
187
Have you already told him you will go?
188
How long have you known him?
189
I don't know, Laura, what do I know, I don't know.
190
Yes, fifteen days...
191
Fifteen days and he asks you to leave your family and child and go with him.
192
But how can you trust someone who asks you something like that?
193
Can't you see it?
194
It's crazy!
195
If you leave, it is not because of the revolution.
196
No, don't be fooled.
197
If you leave, it's because of him.
198
And for me, Laura, and for me.
199
Because he represents everything I have always dreamed of living.
200
But here is your son who needs you.
201
You have your family, you have me.
202
Really, you want to stop all that?
203
How do you want me to want to?
204
Then stay, Amelia.
205
And not see him again?
206
Look! I already know how to measure the oil in cars.
207
I saw that you are very smart, huh?
208
And you learn very quickly.
209
You, very good.
Next