├── .gitattributes ├── .gitignore ├── Dockerfile ├── Dockerfile-vllm ├── LICENSE ├── README.md ├── README_CN.md ├── README_JP.md ├── __init__.py ├── app.py ├── assets ├── Step-Audio.pdf ├── architecture.png ├── logo.png ├── pipeline.png ├── rlhf.png ├── stepeval_radar_chart.png └── yuewen.jpeg ├── call_vllm_chat.py ├── cosyvoice ├── __init__.py ├── cli │ ├── __init__.py │ ├── cosyvoice.py │ ├── frontend.py │ └── model.py ├── flow │ ├── decoder.py │ ├── flow.py │ ├── flow_matching.py │ └── length_regulator.py ├── hifigan │ ├── f0_predictor.py │ └── generator.py ├── matcha │ ├── audio.py │ ├── decoder.py │ ├── flow_matching.py │ └── transformer.py ├── transformer │ ├── __init__.py │ ├── activation.py │ ├── attention.py │ ├── convolution.py │ ├── decoder.py │ ├── decoder_layer.py │ ├── embedding.py │ ├── encoder.py │ ├── encoder_layer.py │ ├── label_smoothing_loss.py │ ├── positionwise_feed_forward.py │ └── subsampling.py └── utils │ ├── __init__.py │ ├── audio.py │ ├── class_utils.py │ ├── common.py │ ├── executor.py │ ├── file_utils.py │ ├── frontend_utils.py │ ├── mask.py │ ├── scheduler.py │ └── train_utils.py ├── examples ├── clone_wav_lixueqin.wav ├── clone_wav_yuqian.wav ├── emotional_control1.wav ├── emotional_control2.wav ├── multilingual1.wav ├── multilingual2.wav ├── multilingual_singing.wav ├── prompt_wav_lixueqin.wav ├── prompt_wav_yuqian.wav ├── prompt_wav_zhaobenshan.wav ├── rap.wav ├── singing.wav ├── speed_control1.wav ├── speed_control2.wav └── tone_control.wav ├── funasr_detach ├── __init__.py ├── auto │ ├── __init__.py │ ├── auto_frontend.py │ ├── auto_model.py │ └── auto_tokenizer.py ├── bin │ ├── __init__.py │ ├── compute_audio_cmvn.py │ ├── inference.py │ ├── tokenize_text.py │ └── train.py ├── datasets │ ├── __init__.py │ └── audio_datasets │ │ ├── __init__.py │ │ ├── datasets.py │ │ ├── index_ds.py │ │ ├── preprocessor.py │ │ ├── samplers.py │ │ └── scp2jsonl.py ├── download │ ├── __init__.py │ ├── download_dataset_from_hub.py │ ├── download_from_hub.py │ ├── file.py │ ├── name_maps_from_hub.py │ └── runtime_sdk_download_tool.py ├── frontends │ ├── __init__.py │ ├── default.py │ ├── eend_ola_feature.py │ ├── fused.py │ ├── s3prl.py │ ├── utils │ │ ├── __init__.py │ │ ├── beamformer.py │ │ ├── complex_utils.py │ │ ├── dnn_beamformer.py │ │ ├── dnn_wpe.py │ │ ├── feature_transform.py │ │ ├── frontend.py │ │ ├── log_mel.py │ │ ├── mask_estimator.py │ │ └── stft.py │ ├── wav_frontend.py │ └── windowing.py ├── losses │ ├── __init__.py │ └── label_smoothing_loss.py ├── metrics │ ├── __init__.py │ ├── common.py │ ├── compute_acc.py │ ├── compute_eer.py │ ├── compute_min_dcf.py │ └── compute_wer.py ├── models │ ├── __init__.py │ ├── bat │ │ ├── __init__.py │ │ └── model.py │ ├── bicif_paraformer │ │ ├── __init__.py │ │ ├── cif_predictor.py │ │ ├── model.py │ │ └── template.yaml │ ├── branchformer │ │ ├── __init__.py │ │ ├── cgmlp.py │ │ ├── encoder.py │ │ ├── fastformer.py │ │ ├── model.py │ │ └── template.yaml │ ├── campplus │ │ ├── __init__.py │ │ ├── cluster_backend.py │ │ ├── components.py │ │ ├── model.py │ │ ├── template.yaml │ │ └── utils.py │ ├── conformer │ │ ├── __init__.py │ │ ├── encoder.py │ │ ├── model.py │ │ └── template.yaml │ ├── contextual_paraformer │ │ ├── __init__.py │ │ ├── decoder.py │ │ ├── model.py │ │ └── template.yaml │ ├── ct_transformer │ │ ├── __init__.py │ │ ├── model.py │ │ ├── template.yaml │ │ └── utils.py │ ├── ct_transformer_streaming │ │ ├── __init__.py │ │ ├── attention.py │ │ ├── encoder.py │ │ ├── model.py │ │ └── template.yaml │ ├── ctc │ │ ├── __init__.py │ │ └── ctc.py │ ├── data2vec │ │ ├── __init__.py │ │ ├── data2vec.py │ │ ├── data2vec_encoder.py │ │ ├── data_utils.py │ │ ├── ema_module.py │ │ ├── grad_multiply.py │ │ ├── multihead_attention.py │ │ ├── quant_noise.py │ │ ├── utils.py │ │ └── wav2vec2.py │ ├── e_branchformer │ │ ├── __init__.py │ │ ├── encoder.py │ │ ├── model.py │ │ └── template.yaml │ ├── eend │ │ ├── __init__.py │ │ ├── e2e_diar_eend_ola.py │ │ ├── eend_ola_dataloader.py │ │ ├── encoder.py │ │ ├── encoder_decoder_attractor.py │ │ └── utils │ │ │ ├── __init__.py │ │ │ ├── feature.py │ │ │ ├── kaldi_data.py │ │ │ ├── losses.py │ │ │ ├── power.py │ │ │ └── report.py │ ├── emotion2vec │ │ ├── __init__.py │ │ ├── audio.py │ │ ├── base.py │ │ ├── fairseq_modules.py │ │ ├── model.py │ │ ├── modules.py │ │ ├── template.yaml │ │ └── timm_modules.py │ ├── eres2net │ │ ├── __init__.py │ │ ├── eres2net.py │ │ ├── eres2net_aug.py │ │ └── fusion.py │ ├── fsmn_vad_streaming │ │ ├── __init__.py │ │ ├── encoder.py │ │ ├── model.py │ │ └── template.yaml │ ├── language_model │ │ ├── __init__.py │ │ ├── rnn │ │ │ ├── __init__.py │ │ │ ├── argument.py │ │ │ ├── attentions.py │ │ │ ├── decoders.py │ │ │ └── encoders.py │ │ ├── seq_rnn_lm.py │ │ ├── transformer_encoder.py │ │ └── transformer_lm.py │ ├── lora │ │ ├── __init__.py │ │ ├── layers.py │ │ └── utils.py │ ├── mfcca │ │ ├── __init__.py │ │ ├── e2e_asr_mfcca.py │ │ ├── encoder_layer_mfcca.py │ │ └── mfcca_encoder.py │ ├── model_hf │ │ └── __init__.py │ ├── monotonic_aligner │ │ ├── __init__.py │ │ ├── model.py │ │ └── template.yaml │ ├── mossformer │ │ ├── __init__.py │ │ ├── e2e_ss.py │ │ ├── mossformer.py │ │ ├── mossformer_decoder.py │ │ └── mossformer_encoder.py │ ├── normalize │ │ ├── __init__.py │ │ ├── global_mvn.py │ │ └── utterance_mvn.py │ ├── paraformer │ │ ├── __init__.py │ │ ├── cif_predictor.py │ │ ├── decoder.py │ │ ├── model.py │ │ ├── search.py │ │ └── template.yaml │ ├── paraformer_streaming │ │ ├── __init__.py │ │ ├── model.py │ │ └── template.yaml │ ├── rwkv_bat │ │ ├── __init__.py │ │ ├── cuda_decoder │ │ │ ├── wkv_cuda.cu │ │ │ └── wkv_op.cpp │ │ ├── cuda_encoder │ │ │ ├── wkv_cuda.cu │ │ │ └── wkv_op.cpp │ │ ├── rwkv.py │ │ ├── rwkv_attention.py │ │ ├── rwkv_encoder.py │ │ ├── rwkv_feed_forward.py │ │ └── rwkv_subsampling.py │ ├── sa_asr │ │ ├── __init__.py │ │ ├── attention.py │ │ ├── beam_search_sa_asr.py │ │ ├── e2e_sa_asr.py │ │ └── transformer_decoder.py │ ├── sanm │ │ ├── __init__.py │ │ ├── attention.py │ │ ├── decoder.py │ │ ├── encoder.py │ │ ├── model.py │ │ ├── positionwise_feed_forward.py │ │ └── template.yaml │ ├── scama │ │ ├── __init__.py │ │ ├── beam_search.py │ │ ├── chunk_utilis.py │ │ ├── decoder.py │ │ ├── encoder.py │ │ ├── model.py │ │ ├── template.yaml │ │ └── utils.py │ ├── seaco_paraformer │ │ ├── __init__.py │ │ ├── model.py │ │ └── template.yaml │ ├── sond │ │ ├── __init__.py │ │ ├── attention.py │ │ ├── e2e_diar_sond.py │ │ ├── encoder │ │ │ ├── __init__.py │ │ │ ├── ci_scorers.py │ │ │ ├── conv_encoder.py │ │ │ ├── ecapa_tdnn_encoder.py │ │ │ ├── fsmn_encoder.py │ │ │ ├── resnet34_encoder.py │ │ │ └── self_attention_encoder.py │ │ ├── label_aggregation.py │ │ ├── pooling │ │ │ ├── __init__.py │ │ │ ├── pooling_layers.py │ │ │ └── statistic_pooling.py │ │ └── sv_decoder.py │ ├── specaug │ │ ├── __init__.py │ │ ├── mask_along_axis.py │ │ ├── profileaug.py │ │ ├── specaug.py │ │ └── time_warp.py │ ├── transducer │ │ ├── __init__.py │ │ ├── beam_search_transducer.py │ │ ├── joint_network.py │ │ ├── model.py │ │ ├── rnn_decoder.py │ │ └── rnnt_decoder.py │ ├── transformer │ │ ├── __init__.py │ │ ├── attention.py │ │ ├── decoder.py │ │ ├── embedding.py │ │ ├── encoder.py │ │ ├── layer_norm.py │ │ ├── model.py │ │ ├── positionwise_feed_forward.py │ │ ├── scorers │ │ │ ├── __init__.py │ │ │ ├── ctc.py │ │ │ ├── ctc_prefix_score.py │ │ │ ├── length_bonus.py │ │ │ └── scorer_interface.py │ │ ├── search.py │ │ ├── template.yaml │ │ └── utils │ │ │ ├── __init__.py │ │ │ ├── add_sos_eos.py │ │ │ ├── dynamic_conv.py │ │ │ ├── dynamic_conv2d.py │ │ │ ├── lightconv.py │ │ │ ├── lightconv2d.py │ │ │ ├── mask.py │ │ │ ├── multi_layer_conv.py │ │ │ ├── nets_utils.py │ │ │ ├── repeat.py │ │ │ ├── subsampling.py │ │ │ ├── subsampling_without_posenc.py │ │ │ └── vgg2l.py │ ├── uniasr │ │ ├── __init__.py │ │ ├── beam_search.py │ │ ├── model.py │ │ └── template.yaml │ ├── whisper │ │ ├── __init__.py │ │ ├── model.py │ │ └── utils │ │ │ ├── __init__.py │ │ │ ├── assets │ │ │ ├── gpt2 │ │ │ │ ├── merges.txt │ │ │ │ ├── special_tokens_map.json │ │ │ │ ├── tokenizer_config.json │ │ │ │ └── vocab.json │ │ │ ├── mel_filters.npz │ │ │ └── multilingual │ │ │ │ ├── added_tokens.json │ │ │ │ ├── merges.txt │ │ │ │ ├── special_tokens_map.json │ │ │ │ ├── tokenizer_config.json │ │ │ │ └── vocab.json │ │ │ ├── audio.py │ │ │ ├── decoding.py │ │ │ ├── tokenizer.py │ │ │ ├── transcribe.py │ │ │ └── utils.py │ └── xvector │ │ ├── __init__.py │ │ └── e2e_sv.py ├── optimizers │ ├── __init__.py │ ├── fairseq_adam.py │ └── sgd.py ├── register.py ├── schedulers │ ├── __init__.py │ ├── abs_scheduler.py │ ├── noam_lr.py │ ├── tri_stage_scheduler.py │ └── warmup_lr.py ├── tokenizer │ ├── __init__.py │ ├── abs_tokenizer.py │ ├── build_tokenizer.py │ ├── char_tokenizer.py │ ├── cleaner.py │ ├── korean_cleaner.py │ ├── phoneme_tokenizer.py │ ├── sentencepiece_tokenizer.py │ ├── token_id_converter.py │ └── word_tokenizer.py ├── train_utils │ ├── __init__.py │ ├── add_gradient_noise.py │ ├── average_nbest_models.py │ ├── device_funcs.py │ ├── forward_adaptor.py │ ├── initialize.py │ ├── load_pretrained_model.py │ ├── model_summary.py │ ├── recursive_op.py │ ├── set_all_random_seed.py │ └── trainer.py ├── utils │ ├── __init__.py │ ├── datadir_writer.py │ ├── load_utils.py │ ├── misc.py │ ├── postprocess_utils.py │ ├── prepare_data.py │ ├── speaker_utils.py │ ├── timestamp_tools.py │ ├── types.py │ └── vad_utils.py └── version.txt ├── offline_inference.py ├── requirements-vllm.txt ├── requirements.txt ├── speakers ├── TingtingRAP_prompt.wav ├── Tingting_prompt.wav ├── Tingting哼唱_prompt.wav └── speakers_info.json ├── stepaudio.py ├── tokenizer.py ├── tts.py ├── tts_app.py ├── tts_inference.py └── utils.py /.gitattributes: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/.gitattributes -------------------------------------------------------------------------------- /.gitignore: -------------------------------------------------------------------------------- 1 | __pycache__/ 2 | output/ -------------------------------------------------------------------------------- /Dockerfile: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/Dockerfile -------------------------------------------------------------------------------- /Dockerfile-vllm: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/Dockerfile-vllm -------------------------------------------------------------------------------- /LICENSE: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/LICENSE -------------------------------------------------------------------------------- /README.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/README.md -------------------------------------------------------------------------------- /README_CN.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/README_CN.md -------------------------------------------------------------------------------- /README_JP.md: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/README_JP.md -------------------------------------------------------------------------------- /__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/app.py -------------------------------------------------------------------------------- /assets/Step-Audio.pdf: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/assets/Step-Audio.pdf -------------------------------------------------------------------------------- /assets/architecture.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/assets/architecture.png -------------------------------------------------------------------------------- /assets/logo.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/assets/logo.png -------------------------------------------------------------------------------- /assets/pipeline.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/assets/pipeline.png -------------------------------------------------------------------------------- /assets/rlhf.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/assets/rlhf.png -------------------------------------------------------------------------------- /assets/stepeval_radar_chart.png: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/assets/stepeval_radar_chart.png -------------------------------------------------------------------------------- /assets/yuewen.jpeg: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/assets/yuewen.jpeg -------------------------------------------------------------------------------- /call_vllm_chat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/call_vllm_chat.py -------------------------------------------------------------------------------- /cosyvoice/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /cosyvoice/cli/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /cosyvoice/cli/cosyvoice.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/cli/cosyvoice.py -------------------------------------------------------------------------------- /cosyvoice/cli/frontend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/cli/frontend.py -------------------------------------------------------------------------------- /cosyvoice/cli/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/cli/model.py -------------------------------------------------------------------------------- /cosyvoice/flow/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/flow/decoder.py -------------------------------------------------------------------------------- /cosyvoice/flow/flow.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/flow/flow.py -------------------------------------------------------------------------------- /cosyvoice/flow/flow_matching.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/flow/flow_matching.py -------------------------------------------------------------------------------- /cosyvoice/flow/length_regulator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/flow/length_regulator.py -------------------------------------------------------------------------------- /cosyvoice/hifigan/f0_predictor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/hifigan/f0_predictor.py -------------------------------------------------------------------------------- /cosyvoice/hifigan/generator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/hifigan/generator.py -------------------------------------------------------------------------------- /cosyvoice/matcha/audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/matcha/audio.py -------------------------------------------------------------------------------- /cosyvoice/matcha/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/matcha/decoder.py -------------------------------------------------------------------------------- /cosyvoice/matcha/flow_matching.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/matcha/flow_matching.py -------------------------------------------------------------------------------- /cosyvoice/matcha/transformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/matcha/transformer.py -------------------------------------------------------------------------------- /cosyvoice/transformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /cosyvoice/transformer/activation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/activation.py -------------------------------------------------------------------------------- /cosyvoice/transformer/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/attention.py -------------------------------------------------------------------------------- /cosyvoice/transformer/convolution.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/convolution.py -------------------------------------------------------------------------------- /cosyvoice/transformer/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/decoder.py -------------------------------------------------------------------------------- /cosyvoice/transformer/decoder_layer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/decoder_layer.py -------------------------------------------------------------------------------- /cosyvoice/transformer/embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/embedding.py -------------------------------------------------------------------------------- /cosyvoice/transformer/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/encoder.py -------------------------------------------------------------------------------- /cosyvoice/transformer/encoder_layer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/encoder_layer.py -------------------------------------------------------------------------------- /cosyvoice/transformer/label_smoothing_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/label_smoothing_loss.py -------------------------------------------------------------------------------- /cosyvoice/transformer/positionwise_feed_forward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/positionwise_feed_forward.py -------------------------------------------------------------------------------- /cosyvoice/transformer/subsampling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/transformer/subsampling.py -------------------------------------------------------------------------------- /cosyvoice/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /cosyvoice/utils/audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/utils/audio.py -------------------------------------------------------------------------------- /cosyvoice/utils/class_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/utils/class_utils.py -------------------------------------------------------------------------------- /cosyvoice/utils/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/utils/common.py -------------------------------------------------------------------------------- /cosyvoice/utils/executor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/utils/executor.py -------------------------------------------------------------------------------- /cosyvoice/utils/file_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/utils/file_utils.py -------------------------------------------------------------------------------- /cosyvoice/utils/frontend_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/utils/frontend_utils.py -------------------------------------------------------------------------------- /cosyvoice/utils/mask.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/utils/mask.py -------------------------------------------------------------------------------- /cosyvoice/utils/scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/utils/scheduler.py -------------------------------------------------------------------------------- /cosyvoice/utils/train_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/cosyvoice/utils/train_utils.py -------------------------------------------------------------------------------- /examples/clone_wav_lixueqin.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/clone_wav_lixueqin.wav -------------------------------------------------------------------------------- /examples/clone_wav_yuqian.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/clone_wav_yuqian.wav -------------------------------------------------------------------------------- /examples/emotional_control1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/emotional_control1.wav -------------------------------------------------------------------------------- /examples/emotional_control2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/emotional_control2.wav -------------------------------------------------------------------------------- /examples/multilingual1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/multilingual1.wav -------------------------------------------------------------------------------- /examples/multilingual2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/multilingual2.wav -------------------------------------------------------------------------------- /examples/multilingual_singing.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/multilingual_singing.wav -------------------------------------------------------------------------------- /examples/prompt_wav_lixueqin.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/prompt_wav_lixueqin.wav -------------------------------------------------------------------------------- /examples/prompt_wav_yuqian.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/prompt_wav_yuqian.wav -------------------------------------------------------------------------------- /examples/prompt_wav_zhaobenshan.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/prompt_wav_zhaobenshan.wav -------------------------------------------------------------------------------- /examples/rap.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/rap.wav -------------------------------------------------------------------------------- /examples/singing.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/singing.wav -------------------------------------------------------------------------------- /examples/speed_control1.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/speed_control1.wav -------------------------------------------------------------------------------- /examples/speed_control2.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/speed_control2.wav -------------------------------------------------------------------------------- /examples/tone_control.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/examples/tone_control.wav -------------------------------------------------------------------------------- /funasr_detach/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/__init__.py -------------------------------------------------------------------------------- /funasr_detach/auto/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/auto/auto_frontend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/auto/auto_frontend.py -------------------------------------------------------------------------------- /funasr_detach/auto/auto_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/auto/auto_model.py -------------------------------------------------------------------------------- /funasr_detach/auto/auto_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/auto/auto_tokenizer.py -------------------------------------------------------------------------------- /funasr_detach/bin/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/bin/compute_audio_cmvn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/bin/compute_audio_cmvn.py -------------------------------------------------------------------------------- /funasr_detach/bin/inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/bin/inference.py -------------------------------------------------------------------------------- /funasr_detach/bin/tokenize_text.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/bin/tokenize_text.py -------------------------------------------------------------------------------- /funasr_detach/bin/train.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/bin/train.py -------------------------------------------------------------------------------- /funasr_detach/datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/datasets/audio_datasets/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/datasets/audio_datasets/datasets.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/datasets/audio_datasets/datasets.py -------------------------------------------------------------------------------- /funasr_detach/datasets/audio_datasets/index_ds.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/datasets/audio_datasets/index_ds.py -------------------------------------------------------------------------------- /funasr_detach/datasets/audio_datasets/preprocessor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/datasets/audio_datasets/preprocessor.py -------------------------------------------------------------------------------- /funasr_detach/datasets/audio_datasets/samplers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/datasets/audio_datasets/samplers.py -------------------------------------------------------------------------------- /funasr_detach/datasets/audio_datasets/scp2jsonl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/datasets/audio_datasets/scp2jsonl.py -------------------------------------------------------------------------------- /funasr_detach/download/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/download/download_dataset_from_hub.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/download/download_dataset_from_hub.py -------------------------------------------------------------------------------- /funasr_detach/download/download_from_hub.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/download/download_from_hub.py -------------------------------------------------------------------------------- /funasr_detach/download/file.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/download/file.py -------------------------------------------------------------------------------- /funasr_detach/download/name_maps_from_hub.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/download/name_maps_from_hub.py -------------------------------------------------------------------------------- /funasr_detach/download/runtime_sdk_download_tool.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/download/runtime_sdk_download_tool.py -------------------------------------------------------------------------------- /funasr_detach/frontends/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/frontends/default.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/default.py -------------------------------------------------------------------------------- /funasr_detach/frontends/eend_ola_feature.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/eend_ola_feature.py -------------------------------------------------------------------------------- /funasr_detach/frontends/fused.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/fused.py -------------------------------------------------------------------------------- /funasr_detach/frontends/s3prl.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/s3prl.py -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/__init__.py: -------------------------------------------------------------------------------- 1 | """Initialize sub package.""" 2 | -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/beamformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/utils/beamformer.py -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/complex_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/utils/complex_utils.py -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/dnn_beamformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/utils/dnn_beamformer.py -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/dnn_wpe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/utils/dnn_wpe.py -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/feature_transform.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/utils/feature_transform.py -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/frontend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/utils/frontend.py -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/log_mel.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/utils/log_mel.py -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/mask_estimator.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/utils/mask_estimator.py -------------------------------------------------------------------------------- /funasr_detach/frontends/utils/stft.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/utils/stft.py -------------------------------------------------------------------------------- /funasr_detach/frontends/wav_frontend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/wav_frontend.py -------------------------------------------------------------------------------- /funasr_detach/frontends/windowing.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/frontends/windowing.py -------------------------------------------------------------------------------- /funasr_detach/losses/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/losses/label_smoothing_loss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/losses/label_smoothing_loss.py -------------------------------------------------------------------------------- /funasr_detach/metrics/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/metrics/common.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/metrics/common.py -------------------------------------------------------------------------------- /funasr_detach/metrics/compute_acc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/metrics/compute_acc.py -------------------------------------------------------------------------------- /funasr_detach/metrics/compute_eer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/metrics/compute_eer.py -------------------------------------------------------------------------------- /funasr_detach/metrics/compute_min_dcf.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/metrics/compute_min_dcf.py -------------------------------------------------------------------------------- /funasr_detach/metrics/compute_wer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/metrics/compute_wer.py -------------------------------------------------------------------------------- /funasr_detach/models/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/bat/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/bat/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/bat/model.py -------------------------------------------------------------------------------- /funasr_detach/models/bicif_paraformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/bicif_paraformer/cif_predictor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/bicif_paraformer/cif_predictor.py -------------------------------------------------------------------------------- /funasr_detach/models/bicif_paraformer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/bicif_paraformer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/bicif_paraformer/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/bicif_paraformer/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/branchformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/branchformer/cgmlp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/branchformer/cgmlp.py -------------------------------------------------------------------------------- /funasr_detach/models/branchformer/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/branchformer/encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/branchformer/fastformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/branchformer/fastformer.py -------------------------------------------------------------------------------- /funasr_detach/models/branchformer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/branchformer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/branchformer/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/branchformer/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/campplus/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/campplus/cluster_backend.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/campplus/cluster_backend.py -------------------------------------------------------------------------------- /funasr_detach/models/campplus/components.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/campplus/components.py -------------------------------------------------------------------------------- /funasr_detach/models/campplus/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/campplus/model.py -------------------------------------------------------------------------------- /funasr_detach/models/campplus/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/campplus/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/campplus/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/campplus/utils.py -------------------------------------------------------------------------------- /funasr_detach/models/conformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/conformer/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/conformer/encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/conformer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/conformer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/conformer/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/conformer/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/contextual_paraformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/contextual_paraformer/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/contextual_paraformer/decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/contextual_paraformer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/contextual_paraformer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/contextual_paraformer/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/contextual_paraformer/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/ct_transformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/ct_transformer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/ct_transformer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/ct_transformer/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/ct_transformer/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/ct_transformer/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/ct_transformer/utils.py -------------------------------------------------------------------------------- /funasr_detach/models/ct_transformer_streaming/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/ct_transformer_streaming/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/ct_transformer_streaming/attention.py -------------------------------------------------------------------------------- /funasr_detach/models/ct_transformer_streaming/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/ct_transformer_streaming/encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/ct_transformer_streaming/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/ct_transformer_streaming/model.py -------------------------------------------------------------------------------- /funasr_detach/models/ct_transformer_streaming/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/ct_transformer_streaming/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/ctc/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/ctc/ctc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/ctc/ctc.py -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/data2vec.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/data2vec/data2vec.py -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/data2vec_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/data2vec/data2vec_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/data_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/data2vec/data_utils.py -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/ema_module.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/data2vec/ema_module.py -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/grad_multiply.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/data2vec/grad_multiply.py -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/multihead_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/data2vec/multihead_attention.py -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/quant_noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/data2vec/quant_noise.py -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/data2vec/utils.py -------------------------------------------------------------------------------- /funasr_detach/models/data2vec/wav2vec2.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/data2vec/wav2vec2.py -------------------------------------------------------------------------------- /funasr_detach/models/e_branchformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/e_branchformer/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/e_branchformer/encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/e_branchformer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/e_branchformer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/e_branchformer/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/e_branchformer/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/eend/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/eend/e2e_diar_eend_ola.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eend/e2e_diar_eend_ola.py -------------------------------------------------------------------------------- /funasr_detach/models/eend/eend_ola_dataloader.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eend/eend_ola_dataloader.py -------------------------------------------------------------------------------- /funasr_detach/models/eend/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eend/encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/eend/encoder_decoder_attractor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eend/encoder_decoder_attractor.py -------------------------------------------------------------------------------- /funasr_detach/models/eend/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/eend/utils/feature.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eend/utils/feature.py -------------------------------------------------------------------------------- /funasr_detach/models/eend/utils/kaldi_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eend/utils/kaldi_data.py -------------------------------------------------------------------------------- /funasr_detach/models/eend/utils/losses.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eend/utils/losses.py -------------------------------------------------------------------------------- /funasr_detach/models/eend/utils/power.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eend/utils/power.py -------------------------------------------------------------------------------- /funasr_detach/models/eend/utils/report.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eend/utils/report.py -------------------------------------------------------------------------------- /funasr_detach/models/emotion2vec/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/emotion2vec/audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/emotion2vec/audio.py -------------------------------------------------------------------------------- /funasr_detach/models/emotion2vec/base.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/emotion2vec/base.py -------------------------------------------------------------------------------- /funasr_detach/models/emotion2vec/fairseq_modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/emotion2vec/fairseq_modules.py -------------------------------------------------------------------------------- /funasr_detach/models/emotion2vec/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/emotion2vec/model.py -------------------------------------------------------------------------------- /funasr_detach/models/emotion2vec/modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/emotion2vec/modules.py -------------------------------------------------------------------------------- /funasr_detach/models/emotion2vec/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/emotion2vec/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/emotion2vec/timm_modules.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/emotion2vec/timm_modules.py -------------------------------------------------------------------------------- /funasr_detach/models/eres2net/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eres2net/__init__.py -------------------------------------------------------------------------------- /funasr_detach/models/eres2net/eres2net.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eres2net/eres2net.py -------------------------------------------------------------------------------- /funasr_detach/models/eres2net/eres2net_aug.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eres2net/eres2net_aug.py -------------------------------------------------------------------------------- /funasr_detach/models/eres2net/fusion.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/eres2net/fusion.py -------------------------------------------------------------------------------- /funasr_detach/models/fsmn_vad_streaming/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/fsmn_vad_streaming/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/fsmn_vad_streaming/encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/fsmn_vad_streaming/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/fsmn_vad_streaming/model.py -------------------------------------------------------------------------------- /funasr_detach/models/fsmn_vad_streaming/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/fsmn_vad_streaming/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/language_model/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/language_model/rnn/__init__.py: -------------------------------------------------------------------------------- 1 | """Initialize sub package.""" 2 | -------------------------------------------------------------------------------- /funasr_detach/models/language_model/rnn/argument.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/language_model/rnn/argument.py -------------------------------------------------------------------------------- /funasr_detach/models/language_model/rnn/attentions.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/language_model/rnn/attentions.py -------------------------------------------------------------------------------- /funasr_detach/models/language_model/rnn/decoders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/language_model/rnn/decoders.py -------------------------------------------------------------------------------- /funasr_detach/models/language_model/rnn/encoders.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/language_model/rnn/encoders.py -------------------------------------------------------------------------------- /funasr_detach/models/language_model/seq_rnn_lm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/language_model/seq_rnn_lm.py -------------------------------------------------------------------------------- /funasr_detach/models/language_model/transformer_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/language_model/transformer_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/language_model/transformer_lm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/language_model/transformer_lm.py -------------------------------------------------------------------------------- /funasr_detach/models/lora/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/lora/layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/lora/layers.py -------------------------------------------------------------------------------- /funasr_detach/models/lora/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/lora/utils.py -------------------------------------------------------------------------------- /funasr_detach/models/mfcca/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/mfcca/e2e_asr_mfcca.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/mfcca/e2e_asr_mfcca.py -------------------------------------------------------------------------------- /funasr_detach/models/mfcca/encoder_layer_mfcca.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/mfcca/encoder_layer_mfcca.py -------------------------------------------------------------------------------- /funasr_detach/models/mfcca/mfcca_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/mfcca/mfcca_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/model_hf/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/monotonic_aligner/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/monotonic_aligner/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/monotonic_aligner/model.py -------------------------------------------------------------------------------- /funasr_detach/models/monotonic_aligner/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/monotonic_aligner/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/mossformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/mossformer/e2e_ss.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/mossformer/e2e_ss.py -------------------------------------------------------------------------------- /funasr_detach/models/mossformer/mossformer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/mossformer/mossformer.py -------------------------------------------------------------------------------- /funasr_detach/models/mossformer/mossformer_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/mossformer/mossformer_decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/mossformer/mossformer_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/mossformer/mossformer_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/normalize/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/normalize/global_mvn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/normalize/global_mvn.py -------------------------------------------------------------------------------- /funasr_detach/models/normalize/utterance_mvn.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/normalize/utterance_mvn.py -------------------------------------------------------------------------------- /funasr_detach/models/paraformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/paraformer/cif_predictor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/paraformer/cif_predictor.py -------------------------------------------------------------------------------- /funasr_detach/models/paraformer/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/paraformer/decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/paraformer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/paraformer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/paraformer/search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/paraformer/search.py -------------------------------------------------------------------------------- /funasr_detach/models/paraformer/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/paraformer/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/paraformer_streaming/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/paraformer_streaming/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/paraformer_streaming/model.py -------------------------------------------------------------------------------- /funasr_detach/models/paraformer_streaming/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/paraformer_streaming/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/cuda_decoder/wkv_cuda.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/rwkv_bat/cuda_decoder/wkv_cuda.cu -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/cuda_decoder/wkv_op.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/rwkv_bat/cuda_decoder/wkv_op.cpp -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/cuda_encoder/wkv_cuda.cu: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/rwkv_bat/cuda_encoder/wkv_cuda.cu -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/cuda_encoder/wkv_op.cpp: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/rwkv_bat/cuda_encoder/wkv_op.cpp -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/rwkv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/rwkv_bat/rwkv.py -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/rwkv_attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/rwkv_bat/rwkv_attention.py -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/rwkv_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/rwkv_bat/rwkv_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/rwkv_feed_forward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/rwkv_bat/rwkv_feed_forward.py -------------------------------------------------------------------------------- /funasr_detach/models/rwkv_bat/rwkv_subsampling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/rwkv_bat/rwkv_subsampling.py -------------------------------------------------------------------------------- /funasr_detach/models/sa_asr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/sa_asr/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sa_asr/attention.py -------------------------------------------------------------------------------- /funasr_detach/models/sa_asr/beam_search_sa_asr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sa_asr/beam_search_sa_asr.py -------------------------------------------------------------------------------- /funasr_detach/models/sa_asr/e2e_sa_asr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sa_asr/e2e_sa_asr.py -------------------------------------------------------------------------------- /funasr_detach/models/sa_asr/transformer_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sa_asr/transformer_decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/sanm/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/sanm/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sanm/attention.py -------------------------------------------------------------------------------- /funasr_detach/models/sanm/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sanm/decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/sanm/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sanm/encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/sanm/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sanm/model.py -------------------------------------------------------------------------------- /funasr_detach/models/sanm/positionwise_feed_forward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sanm/positionwise_feed_forward.py -------------------------------------------------------------------------------- /funasr_detach/models/sanm/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sanm/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/scama/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/scama/beam_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/scama/beam_search.py -------------------------------------------------------------------------------- /funasr_detach/models/scama/chunk_utilis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/scama/chunk_utilis.py -------------------------------------------------------------------------------- /funasr_detach/models/scama/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/scama/decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/scama/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/scama/encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/scama/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/scama/model.py -------------------------------------------------------------------------------- /funasr_detach/models/scama/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/scama/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/scama/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/scama/utils.py -------------------------------------------------------------------------------- /funasr_detach/models/seaco_paraformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/seaco_paraformer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/seaco_paraformer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/seaco_paraformer/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/seaco_paraformer/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/sond/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/sond/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/attention.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/e2e_diar_sond.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/e2e_diar_sond.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/encoder/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/sond/encoder/ci_scorers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/encoder/ci_scorers.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/encoder/conv_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/encoder/conv_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/encoder/ecapa_tdnn_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/encoder/ecapa_tdnn_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/encoder/fsmn_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/encoder/fsmn_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/encoder/resnet34_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/encoder/resnet34_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/encoder/self_attention_encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/encoder/self_attention_encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/label_aggregation.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/label_aggregation.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/pooling/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/sond/pooling/pooling_layers.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/pooling/pooling_layers.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/pooling/statistic_pooling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/pooling/statistic_pooling.py -------------------------------------------------------------------------------- /funasr_detach/models/sond/sv_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/sond/sv_decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/specaug/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/specaug/mask_along_axis.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/specaug/mask_along_axis.py -------------------------------------------------------------------------------- /funasr_detach/models/specaug/profileaug.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/specaug/profileaug.py -------------------------------------------------------------------------------- /funasr_detach/models/specaug/specaug.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/specaug/specaug.py -------------------------------------------------------------------------------- /funasr_detach/models/specaug/time_warp.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/specaug/time_warp.py -------------------------------------------------------------------------------- /funasr_detach/models/transducer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/transducer/beam_search_transducer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transducer/beam_search_transducer.py -------------------------------------------------------------------------------- /funasr_detach/models/transducer/joint_network.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transducer/joint_network.py -------------------------------------------------------------------------------- /funasr_detach/models/transducer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transducer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/transducer/rnn_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transducer/rnn_decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/transducer/rnnt_decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transducer/rnnt_decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/transformer/attention.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/attention.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/decoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/decoder.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/embedding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/embedding.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/encoder.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/encoder.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/layer_norm.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/layer_norm.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/model.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/positionwise_feed_forward.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/positionwise_feed_forward.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/scorers/__init__.py: -------------------------------------------------------------------------------- 1 | """Initialize sub package.""" 2 | -------------------------------------------------------------------------------- /funasr_detach/models/transformer/scorers/ctc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/scorers/ctc.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/scorers/ctc_prefix_score.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/scorers/ctc_prefix_score.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/scorers/length_bonus.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/scorers/length_bonus.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/scorers/scorer_interface.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/scorers/scorer_interface.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/search.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/add_sos_eos.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/add_sos_eos.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/dynamic_conv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/dynamic_conv.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/dynamic_conv2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/dynamic_conv2d.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/lightconv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/lightconv.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/lightconv2d.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/lightconv2d.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/mask.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/mask.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/multi_layer_conv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/multi_layer_conv.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/nets_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/nets_utils.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/repeat.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/repeat.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/subsampling.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/subsampling.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/subsampling_without_posenc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/subsampling_without_posenc.py -------------------------------------------------------------------------------- /funasr_detach/models/transformer/utils/vgg2l.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/transformer/utils/vgg2l.py -------------------------------------------------------------------------------- /funasr_detach/models/uniasr/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/uniasr/beam_search.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/uniasr/beam_search.py -------------------------------------------------------------------------------- /funasr_detach/models/uniasr/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/uniasr/model.py -------------------------------------------------------------------------------- /funasr_detach/models/uniasr/template.yaml: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/uniasr/template.yaml -------------------------------------------------------------------------------- /funasr_detach/models/whisper/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/whisper/model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/model.py -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/gpt2/merges.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/assets/gpt2/merges.txt -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/gpt2/special_tokens_map.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/assets/gpt2/special_tokens_map.json -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/gpt2/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/assets/gpt2/tokenizer_config.json -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/gpt2/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/assets/gpt2/vocab.json -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/mel_filters.npz: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/assets/mel_filters.npz -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/multilingual/added_tokens.json: -------------------------------------------------------------------------------- 1 | {"<|endoftext|>": 50257} 2 | -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/multilingual/merges.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/assets/multilingual/merges.txt -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/multilingual/special_tokens_map.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/assets/multilingual/special_tokens_map.json -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/multilingual/tokenizer_config.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/assets/multilingual/tokenizer_config.json -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/assets/multilingual/vocab.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/assets/multilingual/vocab.json -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/audio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/audio.py -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/decoding.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/decoding.py -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/tokenizer.py -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/transcribe.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/transcribe.py -------------------------------------------------------------------------------- /funasr_detach/models/whisper/utils/utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/whisper/utils/utils.py -------------------------------------------------------------------------------- /funasr_detach/models/xvector/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/models/xvector/e2e_sv.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/models/xvector/e2e_sv.py -------------------------------------------------------------------------------- /funasr_detach/optimizers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/optimizers/__init__.py -------------------------------------------------------------------------------- /funasr_detach/optimizers/fairseq_adam.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/optimizers/fairseq_adam.py -------------------------------------------------------------------------------- /funasr_detach/optimizers/sgd.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/optimizers/sgd.py -------------------------------------------------------------------------------- /funasr_detach/register.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/register.py -------------------------------------------------------------------------------- /funasr_detach/schedulers/__init__.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/schedulers/__init__.py -------------------------------------------------------------------------------- /funasr_detach/schedulers/abs_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/schedulers/abs_scheduler.py -------------------------------------------------------------------------------- /funasr_detach/schedulers/noam_lr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/schedulers/noam_lr.py -------------------------------------------------------------------------------- /funasr_detach/schedulers/tri_stage_scheduler.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/schedulers/tri_stage_scheduler.py -------------------------------------------------------------------------------- /funasr_detach/schedulers/warmup_lr.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/schedulers/warmup_lr.py -------------------------------------------------------------------------------- /funasr_detach/tokenizer/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/tokenizer/abs_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/tokenizer/abs_tokenizer.py -------------------------------------------------------------------------------- /funasr_detach/tokenizer/build_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/tokenizer/build_tokenizer.py -------------------------------------------------------------------------------- /funasr_detach/tokenizer/char_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/tokenizer/char_tokenizer.py -------------------------------------------------------------------------------- /funasr_detach/tokenizer/cleaner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/tokenizer/cleaner.py -------------------------------------------------------------------------------- /funasr_detach/tokenizer/korean_cleaner.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/tokenizer/korean_cleaner.py -------------------------------------------------------------------------------- /funasr_detach/tokenizer/phoneme_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/tokenizer/phoneme_tokenizer.py -------------------------------------------------------------------------------- /funasr_detach/tokenizer/sentencepiece_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/tokenizer/sentencepiece_tokenizer.py -------------------------------------------------------------------------------- /funasr_detach/tokenizer/token_id_converter.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/tokenizer/token_id_converter.py -------------------------------------------------------------------------------- /funasr_detach/tokenizer/word_tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/tokenizer/word_tokenizer.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/train_utils/add_gradient_noise.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/add_gradient_noise.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/average_nbest_models.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/average_nbest_models.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/device_funcs.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/device_funcs.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/forward_adaptor.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/forward_adaptor.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/initialize.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/initialize.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/load_pretrained_model.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/load_pretrained_model.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/model_summary.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/model_summary.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/recursive_op.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/recursive_op.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/set_all_random_seed.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/set_all_random_seed.py -------------------------------------------------------------------------------- /funasr_detach/train_utils/trainer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/train_utils/trainer.py -------------------------------------------------------------------------------- /funasr_detach/utils/__init__.py: -------------------------------------------------------------------------------- 1 | -------------------------------------------------------------------------------- /funasr_detach/utils/datadir_writer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/utils/datadir_writer.py -------------------------------------------------------------------------------- /funasr_detach/utils/load_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/utils/load_utils.py -------------------------------------------------------------------------------- /funasr_detach/utils/misc.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/utils/misc.py -------------------------------------------------------------------------------- /funasr_detach/utils/postprocess_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/utils/postprocess_utils.py -------------------------------------------------------------------------------- /funasr_detach/utils/prepare_data.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/utils/prepare_data.py -------------------------------------------------------------------------------- /funasr_detach/utils/speaker_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/utils/speaker_utils.py -------------------------------------------------------------------------------- /funasr_detach/utils/timestamp_tools.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/utils/timestamp_tools.py -------------------------------------------------------------------------------- /funasr_detach/utils/types.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/utils/types.py -------------------------------------------------------------------------------- /funasr_detach/utils/vad_utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/funasr_detach/utils/vad_utils.py -------------------------------------------------------------------------------- /funasr_detach/version.txt: -------------------------------------------------------------------------------- 1 | 1.0.8 2 | -------------------------------------------------------------------------------- /offline_inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/offline_inference.py -------------------------------------------------------------------------------- /requirements-vllm.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/requirements-vllm.txt -------------------------------------------------------------------------------- /requirements.txt: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/requirements.txt -------------------------------------------------------------------------------- /speakers/TingtingRAP_prompt.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/speakers/TingtingRAP_prompt.wav -------------------------------------------------------------------------------- /speakers/Tingting_prompt.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/speakers/Tingting_prompt.wav -------------------------------------------------------------------------------- /speakers/Tingting哼唱_prompt.wav: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/speakers/Tingting哼唱_prompt.wav -------------------------------------------------------------------------------- /speakers/speakers_info.json: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/speakers/speakers_info.json -------------------------------------------------------------------------------- /stepaudio.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/stepaudio.py -------------------------------------------------------------------------------- /tokenizer.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/tokenizer.py -------------------------------------------------------------------------------- /tts.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/tts.py -------------------------------------------------------------------------------- /tts_app.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/tts_app.py -------------------------------------------------------------------------------- /tts_inference.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/tts_inference.py -------------------------------------------------------------------------------- /utils.py: -------------------------------------------------------------------------------- https://raw.githubusercontent.com/stepfun-ai/Step-Audio/HEAD/utils.py --------------------------------------------------------------------------------