Spaces:
Runtime error
Runtime error
File size: 5,822 Bytes
0558aa4 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47 48 49 50 51 52 53 54 55 56 57 58 59 60 61 62 63 64 65 66 67 68 69 70 71 72 73 74 75 76 77 78 79 80 81 82 83 84 85 86 87 88 89 90 91 92 93 94 95 96 97 98 99 100 101 102 103 104 105 106 107 108 109 |
#!/usr/bin/env bash
DOCKER_EXP_DIR="/checkpoints/results/25FPS_inference"
### Best for nonstreaming Great for streaming
# CKPT="/checkpoints/streaming/magpie/jason/magpieTTS--val_loss=5.1255-epoch=89-last.ckpt"
# HPARAM="/checkpoints/streaming/magpie/jason/magpietts_en_jason_inference.yaml"
# Great for nonstreaming Best for streaming with exponential weight
# CKPT="/checkpoints/streaming/magpie/sugh_BIN_F2P1E0.0/magpieTTS--val_loss=5.1851-epoch=143-last.ckpt"
# HPARAM="/checkpoints/streaming/magpie/sugh_BIN_F2P1E0.0/magpietts_en_subhankarg_BIN_F2P1E0.0.yaml"
# Good for nonstreaming
# CKPT="/checkpoints/streaming/magpie/BIN_F5P5E0_DECF1.0P1.0_wait1_strictwindowTrue/magpieTTS--val_loss=5.2150-epoch=173-last.ckpt"
# HPARAM="/checkpoints/streaming/magpie/BIN_F5P5E0_DECF1.0P1.0_wait1_strictwindowTrue/magpietts_en_subhankarg_BIN_F0P2E0.0_DECF1.0P1.0.yaml"
# CKPT="/checkpoints/streaming/magpie/sugh_BIN_F0P2E0.0_DECF1.0P1.0/magpieTTS--val_loss=5.2076-epoch=144-last.ckpt"
# HPARAM="/checkpoints/streaming/magpie/sugh_BIN_F0P2E0.0_DECF1.0P1.0/magpietts_en_subhankarg_BIN_F0P2E0.0_DECF1.0P1.0.yaml"
# 25FPS
# Non streaming ok
# CKPT="/TB/magpie2503_CE_CA_BIN_BPE_F6P2E0_DECF1.0P1.0_C25FPS_Causal_8cb_HRLLM_lr1e-4_bs12_precbf16_wait3_strictwindowTrue/magpieTTS/checkpoints/magpieTTS--val_loss=5.2386-epoch=153-last.ckpt"
# CKPT="/TB/magpie2503_CE_CA_BIN_BPE_F6P2E0_DECF1.0P1.0_C25FPS_Causal_8cb_HRLLM_lr1e-4_bs12_precbf16_NOwaitK_strictwindowTrue/magpieTTS/checkpoints/magpieTTS--val_loss=5.2388-epoch=150-last.ckpt"
#
# CKPT="/TB/magpie2503_DC_CE_CA_BIN_BPE_F5P2E0_DECF1.0P1.0_C25FPS_Causal_8cb_HRLLM_lr1e-4_bs12_precbf16_wait3_strictwindowTrue_bpe/magpieTTS/checkpoints/magpieTTS--val_loss=5.2238-epoch=229.ckpt"
# HPARAM="/workspace/NeMo/examples/tts/conf/magpietts/magpietts_en_bpe_25fps_inference.yaml"
### SMALL MAGPIE
# CKPT="/TB/DC_CE_BIN_small_C21FPS_Causal_8cb_HRLLM_lr1e-4_bs12_precbf16_lhotse/magpieTTS/checkpoints/magpieTTS.nemo"
# CKPT="/TB/DC_CE_BIN_small_C21FPS_Causal_8cb_HRLLM_lr1e-4_bs12_precbf16_lhotse/magpieTTS/checkpoints/MagpieTTS-EN-Lhotse--val_loss=5.1882-step=349010-epoch=349-last.ckpt"
# HPARAM="/workspace/NeMo/examples/tts/conf/magpietts/magpietts_lhotse_dc_en_tiny_inference.yaml"
# SMALL MAGPIE BETA-BINOMIAL
# CKPT="/TB/DC_CE_small_C21FPS_Causal_8cb_HRLLM_lr1e-4_bs12_precbf16_lhotse/magpieTTS/checkpoints/magpieTTS.nemo"
### SMALL MAGPIE WITH GRPO
# CKPT="/TB/GRPO_DC_CE_BIN_small_C21FPS_Causal_8cb_lr2e-7_bs2_prec32/magpieTTS/checkpoints/Magpie-TTS-EN--val_cer_gt=0.0237-step=1373-epoch=1.ckpt"
# CKPT="/TB/GRPO_KLDiv_infcfg0.5_DC_CE_BIN_small_C21FPS_Causal_8cb_lr2e-7_bs2_prec32/magpieTTS/checkpoints/Magpie-TTS-EN--val_cer_gt=0.0461-step=1846-epoch=2.ckpt"
# HPARAM="/workspace/NeMo/examples/tts/conf/magpietts/magpietts_lhotse_dc_en_tiny_inference.yaml"
### SMALL MAGPIE BETA-BINOMIAL WITH GRPO
# CKPT="/TB/GRPO_DC_CE_small_C21FPS_Causal_8cb_lr5e-7_bs2_prec32/magpieTTS/checkpoints/Magpie-TTS-EN--val_cer_gt=0.0250-step=1373-epoch=1.ckpt"
# CKPT="/checkpoints/streaming/magpie/shehzeen_ckpt/cer_ssim_priornull_2e7_beta001_llmservice_wcfg_wthreholds_epoch0.ckpt"
# HPARAM="/workspace/NeMo/examples/tts/conf/magpietts/magpietts_lhotse_dc_en_tiny_betabinomial_inference.yaml"
#### CICD TESTING
# CKPT="/home/TestData/tts/2506_SeenSpeaker/T5TTS--val_loss=0.3125-epoch=8.ckpt" multi_encoder_context_tts
# HPARAM="/home/TestData/tts/2506_SeenSpeaker/hparams.yaml"
# CKPT="/home/TestData/tts/2506_ZeroShot/dpo-T5TTS--val_loss=0.4513-epoch=3.ckpt" #decoder_context_tts
# HPARAM="/home/TestData/tts/2506_ZeroShot/lrhm_short_yt_prioralways_alignement_0.002_priorscale_0.1.yaml"
#### Jensen
# CKPT="/checkpoints/streaming/magpie/jensen/magpieTTS.nemo"
# decoder_context_tts
CKPT="/TB/magpie2508_DC_CE_CE_CA_TextCond_BetaBinom_C21FPS_Causal_8cb_En-Mn-Fr-Es-De-Vi-Hi_IPA_lr1e-4_bs12_prec32_corrected/magpieTTS/checkpoints/magpieTTS.nemo"
CKPT="/checkpoints/GRPO_Magpie_TTS_ML_V1_val_cer_gt_0_1014_step_800.ckpt"
# CKPT="/checkpoints/Magpie_TTS_ML_val_loss_9_7622_step_476016.ckpt"
HPARAM="/checkpoints/hparams.yaml"
# decoder_ce
# CODEC="/nemo_codec_checkpoints/AudioCodec_21Hz_no_eliz.nemo"
CODEC="/nemo_codec_checkpoints/21fps_causal_codecmodel.nemo"
# CODEC="/nemo_codec_checkpoints/Low_Frame-rate_Speech_Codec++.nemo"
# CODEC="/nemo_codec_checkpoints/Low_Frame-rate_25FPS_Speech_Codec++.nemo"
EPS=0.1
# EPS=1e-8
DATASET=local_longer_100 # riva_hard_digits,riva_hard_letters,riva_hard_money,riva_hard_short # local_longer_4 riva_challenging_nozeros # local_test_100 # local_test_20 # local_test # local_long_20 # local_longer_20 # local_longer_10
MODELTYPE=DC_CE_small_kld_cfg0.5_BIN_GRPO_2e-7_allattninf
# MODELTYPE=Shehzeen_ckpt
# OUT_DIR="/checkpoints/results/test_longer_4_GRPO_audiowav_streaming"
OUT_DIR="/checkpoints/results/${DATASET}_newGRPO_batch5_audiowav_nospace_eos_ap51822_emma_newlogic_fc3_20ws"
export CUDA_VISIBLE_DEVICES=0
export CUDA_LAUNCH_BLOCKING=1
# --nemo_files $CKPT \
# --checkpoint_files $CKPT \
# --hparams_files ${HPARAM} \
# python scripts/magpietts/infer_and_evaluate_streaming.py \
python scripts/magpietts/infer_and_evaluate_longform_batch.py \
--checkpoint_files $CKPT \
--hparams_files ${HPARAM} \
--codecmodel_path ${CODEC} \
--out_dir ${OUT_DIR} \
--datasets $DATASET \
--use_cfg \
--disable_fcd \
--batch_size 5 \
--apply_attention_prior \
--apply_prior_to_layers "0,1,2,3,4,5,6,7,8,9,10,11" \
--estimate_alignment_from_layers "4,5,6,7"
# python scripts/dataset_processing/tts/preprocess_text.py \
# --input_manifest="/workspace/NeMo/long_manifests/test_long_100_claude4-5sonnet.json" \
# --output_manifest="/workspace/NeMo/long_manifests/test_long_100_claude4-5sonnet_normalized.json" \
# --normalizer_config_path="examples/tts/conf/text/normalizer_en.yaml" \
# --num_workers=4 \
# --joblib_batch_size=16
|