Prev
# uttid text ref baseline
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_bad_text_proba
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/slave/exp/yt4_bad_text_proba/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_bad_text_proba__2025-01-20_17-25-48
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-25-48
esesla_enusgbcain
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: yt4_consistency_esesla_3_enusgbcainau_revgrad
lang: en-us
meta:
  basket_generation_config:
    basket_lang: en-us
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/yt4_consistency_esesla_3_enusgbcainau_revgrad/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/yt4_consistency_esesla_3_enusgbcainau_revgrad__2025-01-20_17-21-38
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-21-38
newlangs
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: gpt_text_consistency_newlangs
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/gpt_text_consistency_newlangs/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/gpt_text_consistency_newlangs__2025-01-20_17-29-59
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-29-59
enonly
basket_config_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
data_meta: null
exp_name: text_consistency_enonly
lang: en
meta:
  basket_generation_config:
    basket_lang: en
    basket_path: quality/tts/tortoise-baskets/dsat_to_en_mini_100.json
    batch_size: 4
    gpus: 2
    inference:
      condition_sample_rate: 24000
      diff_k: 3
      diff_steps: 100
      duplicate_reference: true
      exp: /mount/s3/tts-binary-data-nb/eg/exp/text_consistency_enonly/
      gpt_generate_args:
        do_sample: true
        num_return_sequences: 50
        use_cache: true
      override_conditioning_features:
        bad_text_proba: 0.0
        c50: 0.0
        pitch_std: 100.0
        snr: 100.0
      reranking_options:
        mode: MBR
        top_k: 1
      target_len_rate: 1.25
      vocoder: bigvgan
      voice_samples_preprocessing:
      - demucs
      - deepfilternet
    num_workers: 1
    output_dir: dsat_to_en_mini/text_consistency_enonly__2025-01-20_17-34-11
    ticket: QUALITY-41
  basket_generation_git_hash: 6f6cb768a4ef7425185fdde6d1a4eac9371eb37e
model_data_type: tts-cloning
ticket: QUALITY-41
version: 2025-01-20_17-34-11
1960
11670/e7a2ab2a
1961
zM7yp2rXjdE_001/d52a4973_24Khz
1962
iaIsNexUfOE_001/0535a33b_24Khz
1963
DRtXJ2ih0AI_001/da61275c_24Khz
1964
Rbnby149tlc_001/10a3c485_24Khz
1965
tTFPa4ub4Aw_001/1e384acd_24Khz
1966
Dubbing_AD_TEST_dubf-cloned_es_M0/Dubbing_AD_TEST_dubf-cloned_es_M0_0033
1967
2E6fOjn5ZXU_001/42a6c565_24Khz
1968
XR7cvDLveBU_001/26f500ef_24Khz
1969
1MXhLpFGe10_001/4991b36f_24Khz
1970
BdJAZyWbOoo_001/d1b7f075
1971
Aem7LMLEWes_001/c88992d6
1972
At67Oh_rxPI_001/c396b2f5
1973
sl_JoobohTY_001/63cb5ac5_24Khz
1974
UxxvJldAt9o_001/983e0c5e_24Khz
1975
YwPD61hQkr4_001/36facaf0_24Khz
1976
TEDX_M_041/TEDX_M_041_SPA_0014
1977
r7e5rhVXaCg_001/bdc3c724_24Khz
1978
woeKjuz6jlM_001/f34e9710
1979
7snYoNLkxcY_001/b407c5d3_24Khz
Next