All modules for which code is available:
- espnet.asr.asr_mix_utils
- espnet.asr.asr_utils
- espnet.asr.chainer_backend.asr
- espnet.asr.pytorch_backend.asr
- espnet.asr.pytorch_backend.asr_init
- espnet.asr.pytorch_backend.asr_mix
- espnet.asr.pytorch_backend.recog
- espnet.bin.asr_enhance
- espnet.bin.asr_recog
- espnet.bin.asr_train
- espnet.bin.lm_train
- espnet.bin.mt_train
- espnet.bin.mt_trans
- espnet.bin.st_train
- espnet.bin.st_trans
- espnet.bin.tts_decode
- espnet.bin.tts_train
- espnet.bin.vc_decode
- espnet.bin.vc_train
- espnet.lm.chainer_backend.extlm
- espnet.lm.chainer_backend.lm
- espnet.lm.lm_utils
- espnet.lm.pytorch_backend.extlm
- espnet.lm.pytorch_backend.lm
- espnet.mt.mt_utils
- espnet.mt.pytorch_backend.mt
- espnet.nets.asr_interface
- espnet.nets.batch_beam_search
- espnet.nets.batch_beam_search_online
- espnet.nets.batch_beam_search_online_sim
- espnet.nets.beam_search
- espnet.nets.beam_search_transducer
- espnet.nets.chainer_backend.asr_interface
- espnet.nets.chainer_backend.ctc
- espnet.nets.chainer_backend.deterministic_embed_id
- espnet.nets.chainer_backend.e2e_asr
- espnet.nets.chainer_backend.e2e_asr_transformer
- espnet.nets.chainer_backend.rnn.attentions
- espnet.nets.chainer_backend.rnn.decoders
- espnet.nets.chainer_backend.rnn.encoders
- espnet.nets.chainer_backend.rnn.training
- espnet.nets.chainer_backend.transformer.attention
- espnet.nets.chainer_backend.transformer.ctc
- espnet.nets.chainer_backend.transformer.decoder
- espnet.nets.chainer_backend.transformer.decoder_layer
- espnet.nets.chainer_backend.transformer.embedding
- espnet.nets.chainer_backend.transformer.encoder
- espnet.nets.chainer_backend.transformer.encoder_layer
- espnet.nets.chainer_backend.transformer.label_smoothing_loss
- espnet.nets.chainer_backend.transformer.layer_norm
- espnet.nets.chainer_backend.transformer.mask
- espnet.nets.chainer_backend.transformer.positionwise_feed_forward
- espnet.nets.chainer_backend.transformer.subsampling
- espnet.nets.chainer_backend.transformer.training
- espnet.nets.ctc_prefix_score
- espnet.nets.e2e_asr_common
- espnet.nets.e2e_mt_common
- espnet.nets.lm_interface
- espnet.nets.mt_interface
- espnet.nets.pytorch_backend.conformer.argument
- espnet.nets.pytorch_backend.conformer.contextual_block_encoder_layer
- espnet.nets.pytorch_backend.conformer.convolution
- espnet.nets.pytorch_backend.conformer.encoder
- espnet.nets.pytorch_backend.conformer.encoder_layer
- espnet.nets.pytorch_backend.conformer.swish
- espnet.nets.pytorch_backend.ctc
- espnet.nets.pytorch_backend.e2e_asr
- espnet.nets.pytorch_backend.e2e_asr_conformer
- espnet.nets.pytorch_backend.e2e_asr_maskctc
- espnet.nets.pytorch_backend.e2e_asr_mix
- espnet.nets.pytorch_backend.e2e_asr_mix_transformer
- espnet.nets.pytorch_backend.e2e_asr_mulenc
- espnet.nets.pytorch_backend.e2e_asr_transducer
- espnet.nets.pytorch_backend.e2e_asr_transformer
- espnet.nets.pytorch_backend.e2e_mt
- espnet.nets.pytorch_backend.e2e_mt_transformer
- espnet.nets.pytorch_backend.e2e_st
- espnet.nets.pytorch_backend.e2e_st_conformer
- espnet.nets.pytorch_backend.e2e_st_transformer
- espnet.nets.pytorch_backend.e2e_tts_fastspeech
- espnet.nets.pytorch_backend.e2e_tts_tacotron2
- espnet.nets.pytorch_backend.e2e_tts_transformer
- espnet.nets.pytorch_backend.e2e_vc_tacotron2
- espnet.nets.pytorch_backend.e2e_vc_transformer
- espnet.nets.pytorch_backend.fastspeech.duration_calculator
- espnet.nets.pytorch_backend.fastspeech.duration_predictor
- espnet.nets.pytorch_backend.fastspeech.length_regulator
- espnet.nets.pytorch_backend.frontends.beamformer
- espnet.nets.pytorch_backend.frontends.dnn_beamformer
- espnet.nets.pytorch_backend.frontends.dnn_wpe
- espnet.nets.pytorch_backend.frontends.feature_transform
- espnet.nets.pytorch_backend.frontends.frontend
- espnet.nets.pytorch_backend.frontends.mask_estimator
- espnet.nets.pytorch_backend.initialization
- espnet.nets.pytorch_backend.lm.default
- espnet.nets.pytorch_backend.lm.seq_rnn
- espnet.nets.pytorch_backend.lm.transformer
- espnet.nets.pytorch_backend.maskctc.add_mask_token
- espnet.nets.pytorch_backend.maskctc.mask
- espnet.nets.pytorch_backend.nets_utils
- espnet.nets.pytorch_backend.rnn.argument
- espnet.nets.pytorch_backend.rnn.attentions
- espnet.nets.pytorch_backend.rnn.decoders
- espnet.nets.pytorch_backend.rnn.encoders
- espnet.nets.pytorch_backend.streaming.segment
- espnet.nets.pytorch_backend.streaming.window
- espnet.nets.pytorch_backend.tacotron2.cbhg
- espnet.nets.pytorch_backend.tacotron2.decoder
- espnet.nets.pytorch_backend.tacotron2.encoder
- espnet.nets.pytorch_backend.transducer.arguments
- espnet.nets.pytorch_backend.transducer.blocks
- espnet.nets.pytorch_backend.transducer.conv1d_nets
- espnet.nets.pytorch_backend.transducer.custom_decoder
- espnet.nets.pytorch_backend.transducer.custom_encoder
- espnet.nets.pytorch_backend.transducer.error_calculator
- espnet.nets.pytorch_backend.transducer.initializer
- espnet.nets.pytorch_backend.transducer.joint_network
- espnet.nets.pytorch_backend.transducer.rnn_decoder
- espnet.nets.pytorch_backend.transducer.rnn_encoder
- espnet.nets.pytorch_backend.transducer.transducer_tasks
- espnet.nets.pytorch_backend.transducer.transformer_decoder_layer
- espnet.nets.pytorch_backend.transducer.utils
- espnet.nets.pytorch_backend.transducer.vgg2l
- espnet.nets.pytorch_backend.transformer.add_sos_eos
- espnet.nets.pytorch_backend.transformer.argument
- espnet.nets.pytorch_backend.transformer.attention
- espnet.nets.pytorch_backend.transformer.contextual_block_encoder_layer
- espnet.nets.pytorch_backend.transformer.decoder
- espnet.nets.pytorch_backend.transformer.decoder_layer
- espnet.nets.pytorch_backend.transformer.dynamic_conv
- espnet.nets.pytorch_backend.transformer.dynamic_conv2d
- espnet.nets.pytorch_backend.transformer.embedding
- espnet.nets.pytorch_backend.transformer.encoder
- espnet.nets.pytorch_backend.transformer.encoder_layer
- espnet.nets.pytorch_backend.transformer.encoder_mix
- espnet.nets.pytorch_backend.transformer.initializer
- espnet.nets.pytorch_backend.transformer.label_smoothing_loss
- espnet.nets.pytorch_backend.transformer.layer_norm
- espnet.nets.pytorch_backend.transformer.lightconv
- espnet.nets.pytorch_backend.transformer.lightconv2d
- espnet.nets.pytorch_backend.transformer.mask
- espnet.nets.pytorch_backend.transformer.multi_layer_conv
- espnet.nets.pytorch_backend.transformer.optimizer
- espnet.nets.pytorch_backend.transformer.plot
- espnet.nets.pytorch_backend.transformer.positionwise_feed_forward
- espnet.nets.pytorch_backend.transformer.repeat
- espnet.nets.pytorch_backend.transformer.subsampling
- espnet.nets.pytorch_backend.transformer.subsampling_without_posenc
- espnet.nets.pytorch_backend.wavenet
- espnet.nets.scorer_interface
- espnet.nets.scorers.ctc
- espnet.nets.scorers.length_bonus
- espnet.nets.st_interface
- espnet.nets.transducer_decoder_interface
- espnet.nets.tts_interface
- espnet.optimizer.chainer
- espnet.optimizer.factory
- espnet.optimizer.parser
- espnet.optimizer.pytorch
- espnet.scheduler.chainer
- espnet.scheduler.pytorch
- espnet.scheduler.scheduler
- espnet.st.pytorch_backend.st
- espnet.transform.add_deltas
- espnet.transform.channel_selector
- espnet.transform.cmvn
- espnet.transform.functional
- espnet.transform.perturb
- espnet.transform.spec_augment
- espnet.transform.spectrogram
- espnet.transform.transform_interface
- espnet.transform.transformation
- espnet.transform.wpe
- espnet.tts.pytorch_backend.tts
- espnet.utils.check_kwargs
- espnet.utils.cli_readers
- espnet.utils.cli_utils
- espnet.utils.cli_writers
- espnet.utils.dataset
- espnet.utils.deterministic_utils
- espnet.utils.dynamic_import
- espnet.utils.fill_missing_args
- espnet.utils.io_utils
- espnet.utils.spec_augment
- espnet.utils.training.batchfy
- espnet.utils.training.evaluator
- espnet.utils.training.iterators
- espnet.utils.training.tensorboard_logger
- espnet.utils.training.train_utils
- espnet.vc.pytorch_backend.vc
- espnet2.asr.ctc
- espnet2.asr.decoder.abs_decoder
- espnet2.asr.decoder.mlm_decoder
- espnet2.asr.decoder.rnn_decoder
- espnet2.asr.decoder.transformer_decoder
- espnet2.asr.encoder.abs_encoder
- espnet2.asr.encoder.conformer_encoder
- espnet2.asr.encoder.contextual_block_conformer_encoder
- espnet2.asr.encoder.contextual_block_transformer_encoder
- espnet2.asr.encoder.hubert_encoder
- espnet2.asr.encoder.longformer_encoder
- espnet2.asr.encoder.rnn_encoder
- espnet2.asr.encoder.transformer_encoder
- espnet2.asr.encoder.vgg_rnn_encoder
- espnet2.asr.encoder.wav2vec2_encoder
- espnet2.asr.espnet_model
- espnet2.asr.frontend.abs_frontend
- espnet2.asr.frontend.default
- espnet2.asr.frontend.fused
- espnet2.asr.frontend.s3prl
- espnet2.asr.frontend.windowing
- espnet2.asr.maskctc_model
- espnet2.asr.postencoder.abs_postencoder
- espnet2.asr.postencoder.hugging_face_transformers_postencoder
- espnet2.asr.preencoder.abs_preencoder
- espnet2.asr.preencoder.linear
- espnet2.asr.preencoder.sinc
- espnet2.asr.specaug.abs_specaug
- espnet2.asr.specaug.specaug
- espnet2.asr.transducer.beam_search_transducer
- espnet2.asr.transducer.error_calculator
- espnet2.asr.transducer.joint_network
- espnet2.asr.transducer.transducer_decoder
- espnet2.asr.transducer.utils
- espnet2.bin.aggregate_stats_dirs
- espnet2.bin.asr_inference
- espnet2.bin.asr_inference_maskctc
- espnet2.bin.asr_inference_streaming
- espnet2.bin.asr_train
- espnet2.bin.diar_inference
- espnet2.bin.diar_train
- espnet2.bin.enh_inference
- espnet2.bin.enh_scoring
- espnet2.bin.enh_train
- espnet2.bin.gan_tts_train
- espnet2.bin.hubert_train
- espnet2.bin.launch
- espnet2.bin.lm_calc_perplexity
- espnet2.bin.lm_train
- espnet2.bin.mt_inference
- espnet2.bin.mt_train
- espnet2.bin.pack
- espnet2.bin.split_scps
- espnet2.bin.st_inference
- espnet2.bin.st_train
- espnet2.bin.tokenize_text
- espnet2.bin.tts_inference
- espnet2.bin.tts_train
- espnet2.diar.abs_diar
- espnet2.diar.attractor.abs_attractor
- espnet2.diar.attractor.rnn_attractor
- espnet2.diar.decoder.abs_decoder
- espnet2.diar.decoder.linear_decoder
- espnet2.diar.espnet_model
- espnet2.diar.label_processor
- espnet2.enh.abs_enh
- espnet2.enh.decoder.abs_decoder
- espnet2.enh.decoder.conv_decoder
- espnet2.enh.decoder.null_decoder
- espnet2.enh.decoder.stft_decoder
- espnet2.enh.encoder.abs_encoder
- espnet2.enh.encoder.conv_encoder
- espnet2.enh.encoder.null_encoder
- espnet2.enh.encoder.stft_encoder
- espnet2.enh.espnet_model
- espnet2.enh.layers.beamformer
- espnet2.enh.layers.complex_utils
- espnet2.enh.layers.complexnn
- espnet2.enh.layers.dnn_beamformer
- espnet2.enh.layers.dnn_wpe
- espnet2.enh.layers.dprnn
- espnet2.enh.layers.mask_estimator
- espnet2.enh.layers.skim
- espnet2.enh.layers.tcn
- espnet2.enh.layers.wpe
- espnet2.enh.loss.criterions.abs_loss
- espnet2.enh.loss.criterions.tf_domain
- espnet2.enh.loss.criterions.time_domain
- espnet2.enh.loss.wrappers.abs_wrapper
- espnet2.enh.loss.wrappers.fixed_order
- espnet2.enh.loss.wrappers.pit_solver
- espnet2.enh.separator.abs_separator
- espnet2.enh.separator.asteroid_models
- espnet2.enh.separator.conformer_separator
- espnet2.enh.separator.dccrn_separator
- espnet2.enh.separator.dprnn_separator
- espnet2.enh.separator.neural_beamformer
- espnet2.enh.separator.rnn_separator
- espnet2.enh.separator.skim_separator
- espnet2.enh.separator.tcn_separator
- espnet2.enh.separator.transformer_separator
- espnet2.fileio.datadir_writer
- espnet2.fileio.npy_scp
- espnet2.fileio.rand_gen_dataset
- espnet2.fileio.read_text
- espnet2.fileio.rttm
- espnet2.fileio.sound_scp
- espnet2.gan_tts.abs_gan_tts
- espnet2.gan_tts.espnet_model
- espnet2.gan_tts.hifigan.hifigan
- espnet2.gan_tts.hifigan.loss
- espnet2.gan_tts.hifigan.residual_block
- espnet2.gan_tts.joint.joint_text2wav
- espnet2.gan_tts.melgan.melgan
- espnet2.gan_tts.melgan.pqmf
- espnet2.gan_tts.melgan.residual_stack
- espnet2.gan_tts.parallel_wavegan.parallel_wavegan
- espnet2.gan_tts.parallel_wavegan.upsample
- espnet2.gan_tts.style_melgan.style_melgan
- espnet2.gan_tts.style_melgan.tade_res_block
- espnet2.gan_tts.utils.get_random_segments
- espnet2.gan_tts.vits.duration_predictor
- espnet2.gan_tts.vits.flow
- espnet2.gan_tts.vits.generator
- espnet2.gan_tts.vits.loss
- espnet2.gan_tts.vits.monotonic_align.__init__
- espnet2.gan_tts.vits.posterior_encoder
- espnet2.gan_tts.vits.residual_coupling
- espnet2.gan_tts.vits.text_encoder
- espnet2.gan_tts.vits.transform
- espnet2.gan_tts.vits.vits
- espnet2.gan_tts.wavenet.residual_block
- espnet2.gan_tts.wavenet.wavenet
- espnet2.hubert.espnet_model
- espnet2.hubert.hubert_loss
- espnet2.iterators.abs_iter_factory
- espnet2.iterators.chunk_iter_factory
- espnet2.iterators.multiple_iter_factory
- espnet2.iterators.sequence_iter_factory
- espnet2.layers.abs_normalize
- espnet2.layers.global_mvn
- espnet2.layers.inversible_interface
- espnet2.layers.label_aggregation
- espnet2.layers.log_mel
- espnet2.layers.mask_along_axis
- espnet2.layers.sinc_conv
- espnet2.layers.stft
- espnet2.layers.time_warp
- espnet2.layers.utterance_mvn
- espnet2.lm.abs_model
- espnet2.lm.espnet_model
- espnet2.lm.seq_rnn_lm
- espnet2.lm.transformer_lm
- espnet2.main_funcs.average_nbest_models
- espnet2.main_funcs.calculate_all_attentions
- espnet2.main_funcs.collect_stats
- espnet2.main_funcs.pack_funcs
- espnet2.mt.espnet_model
- espnet2.mt.frontend.embedding
- espnet2.optimizers.sgd
- espnet2.samplers.abs_sampler
- espnet2.samplers.build_batch_sampler
- espnet2.samplers.folded_batch_sampler
- espnet2.samplers.length_batch_sampler
- espnet2.samplers.num_elements_batch_sampler
- espnet2.samplers.sorted_batch_sampler
- espnet2.samplers.unsorted_batch_sampler
- espnet2.schedulers.abs_scheduler
- espnet2.schedulers.noam_lr
- espnet2.schedulers.warmup_lr
- espnet2.st.espnet_model
- espnet2.tasks.abs_task
- espnet2.tasks.asr
- espnet2.tasks.diar
- espnet2.tasks.enh
- espnet2.tasks.gan_tts
- espnet2.tasks.hubert
- espnet2.tasks.lm
- espnet2.tasks.mt
- espnet2.tasks.st
- espnet2.tasks.tts
- espnet2.text.abs_tokenizer
- espnet2.text.build_tokenizer
- espnet2.text.char_tokenizer
- espnet2.text.cleaner
- espnet2.text.korean_cleaner
- espnet2.text.phoneme_tokenizer
- espnet2.text.sentencepiece_tokenizer
- espnet2.text.token_id_converter
- espnet2.text.word_tokenizer
- espnet2.torch_utils.add_gradient_noise
- espnet2.torch_utils.device_funcs
- espnet2.torch_utils.forward_adaptor
- espnet2.torch_utils.initialize
- espnet2.torch_utils.load_pretrained_model
- espnet2.torch_utils.model_summary
- espnet2.torch_utils.pytorch_version
- espnet2.torch_utils.recursive_op
- espnet2.torch_utils.set_all_random_seed
- espnet2.train.abs_espnet_model
- espnet2.train.abs_gan_espnet_model
- espnet2.train.class_choices
- espnet2.train.collate_fn
- espnet2.train.dataset
- espnet2.train.distributed_utils
- espnet2.train.gan_trainer
- espnet2.train.iterable_dataset
- espnet2.train.preprocessor
- espnet2.train.reporter
- espnet2.train.trainer
- espnet2.tts.abs_tts
- espnet2.tts.espnet_model
- espnet2.tts.fastspeech.fastspeech
- espnet2.tts.fastspeech2.fastspeech2
- espnet2.tts.fastspeech2.loss
- espnet2.tts.fastspeech2.variance_predictor
- espnet2.tts.feats_extract.abs_feats_extract
- espnet2.tts.feats_extract.dio
- espnet2.tts.feats_extract.energy
- espnet2.tts.feats_extract.linear_spectrogram
- espnet2.tts.feats_extract.log_mel_fbank
- espnet2.tts.feats_extract.log_spectrogram
- espnet2.tts.gst.style_encoder
- espnet2.tts.tacotron2.tacotron2
- espnet2.tts.transformer.transformer
- espnet2.tts.utils.duration_calculator
- espnet2.tts.utils.parallel_wavegan_pretrained_vocoder
- espnet2.utils.build_dataclass
- espnet2.utils.config_argparse
- espnet2.utils.get_default_kwargs
- espnet2.utils.griffin_lim
- espnet2.utils.nested_dict_action
- espnet2.utils.sized_dict
- espnet2.utils.types
- espnet2.utils.yaml_no_alias_safe_dump
- torch.utils.data._typing