Prev
# uttid text ref baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_bad_text_proba
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/slave/exp/yt4_bad_text_proba/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_bad_text_proba__2025-01-20_17-25-48
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-25-48
esesla_enusgbcain
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_consistency_esesla_3_enusgbcainau_revgrad
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_consistency_esesla_3_enusgbcainau_revgrad/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_consistency_esesla_3_enusgbcainau_revgrad__2025-01-20_17-21-38
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-21-38
newlangs
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: gpt_text_consistency_newlangs
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/gpt_text_consistency_newlangs/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/gpt_text_consistency_newlangs__2025-01-20_17-29-59
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-29-59
enonly
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: text_consistency_enonly
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/text_consistency_enonly/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/text_consistency_enonly__2025-01-20_17-34-11
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-34-11
1140
Rosa_de_Guadalupe_-_-56007d_es_M0/Rosa_de_Guadalupe_-_-56007d_es_M0_0121
1141
-DnkFcR6vrc_001/3af8df45_24Khz
1142
wZXmot3T1ec_001/e1b1cc96
1143
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F9/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F9_0114
1144
Bnb-7-2wdYw_001/c522ac66_24Khz
1145
BHv8jT_9wig_001/6aac94ac
1146
2Rl7DrjHv5Q_001/5f97c05c
1147
tgvSpNSj6qw_001/f408a79e_24Khz
1148
6SWyBN68N-A_001/15aeabdf_24Khz
1149
CIaSavesB5U_001/918cb17f
1150
q4L86hoeWoY_001/4e83af79
1151
UxxvJldAt9o_001/7ca2d6bb_24Khz
1152
ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0/ORIGINALSPAVERSION-93a5cd-VoiceActing_es_F0_0050
1153
O514d76Hqls_001/8a96592b_24Khz
1154
SO9KnCbBNeY_001/43c0b634_24Khz
1155
TEDX_M_068/TEDX_M_068_SPA_0020
1156
A4hPsqqQ8vk_001/a257b13b_24Khz
1157
fRUC8v7M6MI_001/62b2777b_24Khz
1158
72Ops7Ymido_001/68078587
1159
AdJqgKJgS30_002/ce3d5881_24Khz
Next