Prev
# uttid text ref baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_bad_text_proba
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/slave/exp/yt4_bad_text_proba/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_bad_text_proba__2025-01-20_17-25-48
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-25-48
esesla_enusgbcain
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_consistency_esesla_3_enusgbcainau_revgrad
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_consistency_esesla_3_enusgbcainau_revgrad/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_consistency_esesla_3_enusgbcainau_revgrad__2025-01-20_17-21-38
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-21-38
newlangs
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: gpt_text_consistency_newlangs
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/gpt_text_consistency_newlangs/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/gpt_text_consistency_newlangs__2025-01-20_17-29-59
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-29-59
enonly
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: text_consistency_enonly
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/text_consistency_enonly/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/text_consistency_enonly__2025-01-20_17-34-11
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-34-11
2000
TEDX_F_032/TEDX_F_032_SPA_0011
2001
x9z9jRybHGw_001/614a7f47_24Khz
2002
y6jOzSdTtjI_002/1405b91d
2003
9PSW2HI3Kng_001/a1ea9c76
2004
A4hPsqqQ8vk_001/7a3e3e53
2005
V5QzJTUpi3Q_001/40ad27e9_24Khz
2006
DRtXJ2ih0AI_001/481d56a3_24Khz
2007
bardot_fr_M2/bardot_fr_M2_0054
2008
dMk0yuGEnhA_001/29693c9f_24Khz
2009
Bnb-7-2wdYw_001/58fb43ac_24Khz
2010
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0095
2011
vUzxViPfNcY_001/984f9f86_24Khz
2012
k5rIMr-u0Jw_001/fcfc8f09_24Khz
2013
x9z9jRybHGw_001/5b24d284_24Khz
2014
DRtXJ2ih0AI_001/db724f1d
2015
TEDX_M_092/TEDX_M_092_SPA_0007
2016
2Rl7DrjHv5Q_001/ef02523d_24Khz
2017
x9z9jRybHGw_001/e6494f31
2018
TEDX_F_037/TEDX_F_037_SPA_0017
2019
LA6_Full_ProresHQ-2-_it_F2/LA6_Full_ProresHQ-2-_it_F2_0102
Next