Prev
# uttid text ref baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_bad_text_proba
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/slave/exp/yt4_bad_text_proba/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_bad_text_proba__2025-01-20_17-25-48
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-25-48
esesla_enusgbcain
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_consistency_esesla_3_enusgbcainau_revgrad
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_consistency_esesla_3_enusgbcainau_revgrad/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_consistency_esesla_3_enusgbcainau_revgrad__2025-01-20_17-21-38
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-21-38
newlangs
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: gpt_text_consistency_newlangs
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/gpt_text_consistency_newlangs/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/gpt_text_consistency_newlangs__2025-01-20_17-29-59
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-29-59
enonly
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: text_consistency_enonly
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/text_consistency_enonly/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/text_consistency_enonly__2025-01-20_17-34-11
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-34-11
1900
PT2m9lkGhvM_001/871507f0
1901
5Ln6XFAv1sw_001/a1bbef7c
1902
tgvSpNSj6qw_001/00efa6f2_24Khz
1903
LA6_Full_ProresHQ-2-_it_F1/LA6_Full_ProresHQ-2-_it_F1_0019
1904
Rosa_de_Guadalupe_-_-56007d_es_M1/Rosa_de_Guadalupe_-_-56007d_es_M1_0136
1905
CIaSavesB5U_001/45f4f834
1906
cS8FRUZyBXk_001/1379206f_24Khz
1907
A4hPsqqQ8vk_001/52740925
1908
sx8LqpClLIk_001/206af549_24Khz
1909
tihtx5AS_k8_001/b0f3c90f
1910
TEDX_M_006/TEDX_M_006_SPA_0021
1911
LA6_Full_ProresHQ-2-_it_F1/LA6_Full_ProresHQ-2-_it_F1_0060
1912
Rosa_de_Guadalupe_-_-56007d_es_M0/Rosa_de_Guadalupe_-_-56007d_es_M0_0056
1913
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0_0035
1914
qbaByMHJs3w_002/ccd99f3c
1915
Je8YcXQhaT4_001/6c30ebe8
1916
9PSW2HI3Kng_001/83d7f709_24Khz
1917
-w7wUs30OXk_001/5ba79dac_24Khz
1918
8x6EsAnAGXs_001/2212d26b_24Khz
1919
BoAU6fkv0dg_001/87fa6d64_24Khz
Next