Prev
# uttid text ref baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_bad_text_proba
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/slave/exp/yt4_bad_text_proba/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_bad_text_proba__2025-01-20_17-25-48
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-25-48
esesla_enusgbcain
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_consistency_esesla_3_enusgbcainau_revgrad
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_consistency_esesla_3_enusgbcainau_revgrad/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_consistency_esesla_3_enusgbcainau_revgrad__2025-01-20_17-21-38
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-21-38
newlangs
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: gpt_text_consistency_newlangs
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/gpt_text_consistency_newlangs/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/gpt_text_consistency_newlangs__2025-01-20_17-29-59
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-29-59
enonly
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: text_consistency_enonly
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/text_consistency_enonly/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/text_consistency_enonly__2025-01-20_17-34-11
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-34-11
2160
EUqqj2YWc3k_001/961238a1_24Khz
2161
7pR84McidsU_001/fdb517c9_24Khz
2162
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0003
2163
10367/30738ac7
2164
TEDX_M_037/TEDX_M_037_SPA_0041
2165
SO9KnCbBNeY_001/7386407f_24Khz
2166
Aem7LMLEWes_001/be77d0c6
2167
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0_0008
2168
7ucdqr42B0g_001/8a835115_24Khz
2169
LA6_Full_ProresHQ-2-_it_F2/LA6_Full_ProresHQ-2-_it_F2_0099
2170
r7e5rhVXaCg_001/540f9561
2171
pcEdR90tbvo_001/b6d7c391_24Khz
2172
133/819ec141
2173
Aem7LMLEWes_001/224d577d
2174
TEDX_M_040/TEDX_M_040_SPA_0017
2175
Rosa_de_Guadalupe_-_-56007d_es_M2/Rosa_de_Guadalupe_-_-56007d_es_M2_0085
2176
tihtx5AS_k8_001/be72160f
2177
oAK9SaaL6QU_001/184a1751
2178
LsAVML-w7Co_001/d3f33789_24Khz
2179
6exp02l5gpU_001/d3b3a0da_24Khz
Next