ESPnet
202402
Tutorial:
Installation
Common usages
Using job scheduling system
FAQ
Docker
ESPnet1:
Usage
ESPnet2:
ESPnet2
Instruction for run.sh
Change the configuration for training
Converting audio file formats using format_wav_scp.py
Task class and data input system for training
Distributed training
Notebook:
CMU 11492/11692 Spring 2023: Data preparation
Data preparation in ESPnet
CMU 11492/11692 Spring 2023: Speech Enhancement
Contents
CMU 11492/11692 Spring 2023: Spoken Language Understanding
CMU 11492/11692 Spring 2023: Text to Speech
Speech Recognition (Recipe)
Speech Recognition (Library)
ESPNET 2 pass SLU Demonstration
ESPnet2-ASR realtime demonstration
Use transfer learning for ASR in ESPnet2
Abstract
ESPnet installation (about 10 minutes in total)
mini_an4 recipe as a transfer learning example
CMU 11751/18781 Fall 2022: ESPnet Tutorial2 (New task)
Install ESPnet (Almost same procedure as your first tutorial)
What we provide you and what you need to proceed
CMU 11751/18781 Fall 2022: ESPnet Tutorial
Install ESPnet
Run an existing recipe
Make a new recipe
Additional resources
ESPnet2 real streaming Transformer demonstration
ESPnet2-TTS realtime demonstration
CMU 11751/18781 2021: ESPnet Tutorial
Run an inference example
Full installation
Run a recipe example
ESPnet Speech Enhancement Demonstration
Contents
(1) Tutorials on the Basic Usage
(2) Tutorials on Contributing to ESPNet-SE Project
espnet_onnx demonstration
Install Dependency
Export your model
Inference with onnx
Using streaming model
Pretrained Model
ESPnet Speech Enhancement Demonstration
ESPnet Speech Translation Demonstration
Text-to-Speech (Recipe)
ESPnet real time E2E-TTS demonstration
Package Reference:
espnet.bin package
espnet.scheduler package
espnet.transform package
espnet.utils package
espnet.optimizer package
espnet.tts package
espnet.asr package
espnet.lm package
espnet.mt package
espnet.vc package
espnet.nets package
espnet.st package
espnet.distributed package
espnet2.bin package
espnet2.schedulers package
espnet2.layers package
espnet2.hubert package
espnet2.asvspoof package
espnet2.optimizers package
espnet2.fst package
espnet2.asr_transducer package
espnet2.iterators package
espnet2.text package
espnet2.utils package
espnet2.train package
espnet2.diar package
espnet2.gan_tts package
espnet2.torch_utils package
espnet2.spk package
espnet2.s2st package
espnet2.tts package
espnet2.asr package
espnet2.enh package
espnet2.lm package
espnet2.gan_svs package
espnet2.mt package
espnet2.fileio package
espnet2.samplers package
espnet2.svs package
espnet2.uasr package
espnet2.tasks package
espnet2.s2t package
espnet2.main_funcs package
espnet2.st package
espnet2.slu package
Tool Reference:
core tools
core tools (espnet2)
python utility tools
bash utility tools
ESPnet
Index
Index
A | B | C | D | E | F | G | H | I | J | K | L | M | N | O | P | R | S | T | U | V | W | X | Y | Z
A
AAMSoftmax (class in espnet2.spk.loss.aamsoftmax)
AbsASVSpoofLoss (class in espnet2.asvspoof.loss.abs_loss)
AbsAttractor (class in espnet2.diar.attractor.abs_attractor)
AbsBatchStepScheduler (class in espnet2.schedulers.abs_scheduler)
AbsDataset (class in espnet2.train.dataset)
AbsDecoder (class in espnet2.asr.decoder.abs_decoder)
(class in espnet2.asr_transducer.decoder.abs_decoder)
(class in espnet2.asvspoof.decoder.abs_decoder)
(class in espnet2.diar.decoder.abs_decoder)
(class in espnet2.enh.decoder.abs_decoder)
AbsDiarization (class in espnet2.diar.abs_diar)
AbsDiffusion (class in espnet2.enh.diffusion.abs_diffusion)
AbsDiscriminator (class in espnet2.uasr.discriminator.abs_discriminator)
AbsEncoder (class in espnet2.asr.encoder.abs_encoder)
(class in espnet2.enh.encoder.abs_encoder)
AbsEnhancement (class in espnet2.enh.abs_enh)
AbsEnhLoss (class in espnet2.enh.loss.criterions.abs_loss)
AbsEpochStepScheduler (class in espnet2.schedulers.abs_scheduler)
AbsESPnetModel (class in espnet2.train.abs_espnet_model)
AbsExtractor (class in espnet2.enh.extractor.abs_extractor)
AbsFeatsExtract (class in espnet2.tts.feats_extract.abs_feats_extract)
AbsFrontend (class in espnet2.asr.frontend.abs_frontend)
AbsGANESPnetModel (class in espnet2.train.abs_gan_espnet_model)
AbsGANSVS (class in espnet2.gan_svs.abs_gan_svs)
AbsGANTTS (class in espnet2.gan_tts.abs_gan_tts)
AbsGenerator (class in espnet2.uasr.generator.abs_generator)
AbsIterFactory (class in espnet2.iterators.abs_iter_factory)
AbsLM (class in espnet2.lm.abs_model)
AbsLoss (class in espnet2.spk.loss.abs_loss)
AbsLossWrapper (class in espnet2.enh.loss.wrappers.abs_wrapper)
AbsMask (class in espnet2.diar.layers.abs_mask)
AbsNormalize (class in espnet2.layers.abs_normalize)
AbsPooling (class in espnet2.spk.pooling.abs_pooling)
AbsPostDecoder (class in espnet2.slu.postdecoder.abs_postdecoder)
AbsPostEncoder (class in espnet2.asr.postencoder.abs_postencoder)
AbsPreEncoder (class in espnet2.asr.preencoder.abs_preencoder)
AbsPreprocessor (class in espnet2.train.preprocessor)
AbsProjector (class in espnet2.spk.projector.abs_projector)
AbsS2STAuxAttention (class in espnet2.s2st.aux_attention.abs_aux_attention)
AbsS2STLoss (class in espnet2.s2st.losses.abs_loss)
AbsSampler (class in espnet2.samplers.abs_sampler)
AbsScheduler (class in espnet2.schedulers.abs_scheduler)
AbsSegmenter (class in espnet2.uasr.segmenter.abs_segmenter)
AbsSeparator (class in espnet2.enh.separator.abs_separator)
AbsSpecAug (class in espnet2.asr.specaug.abs_specaug)
AbsSVS (class in espnet2.svs.abs_svs)
AbsSynthesizer (class in espnet2.s2st.synthesizer.abs_synthesizer)
AbsTask (class in espnet2.tasks.abs_task)
AbsTgtFeatsExtract (class in espnet2.s2st.tgt_feats_extract.abs_tgt_feats_extract)
AbsTokenizer (class in espnet2.text.abs_tokenizer)
AbsTTS (class in espnet2.tts.abs_tts)
AbsUASRLoss (class in espnet2.uasr.loss.abs_loss)
AbsValEpochStepScheduler (class in espnet2.schedulers.abs_scheduler)
accept_input() (espnet.nets.pytorch_backend.streaming.segment.SegmentStreamingE2E method)
(espnet.nets.pytorch_backend.streaming.window.WindowStreamingE2E method)
Activation() (in module espnet2.asr.state_spaces.components)
activation_dropout (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
activation_fn (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
adadelta() (in module espnet.optimizer.parser)
adadelta_eps_decay() (in module espnet.asr.asr_utils)
AdadeltaFactory (class in espnet.optimizer.chainer)
(class in espnet.optimizer.pytorch)
adam() (in module espnet.optimizer.parser)
adam_lr_decay() (in module espnet.asr.asr_utils)
AdamFactory (class in espnet.optimizer.chainer)
(class in espnet.optimizer.pytorch)
AdapterForLabelScpReader (class in espnet2.train.dataset)
AdapterForSingingScoreScpReader (class in espnet2.train.dataset)
AdapterForSoundScpReader (class in espnet2.train.dataset)
ADD (espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce.R_Op attribute)
add (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
add() (espnet.asr.pytorch_backend.asr.DistributedDictSummary method)
(espnet2.main_funcs.pack_funcs.Archiver method)
add_arguments() (espnet.lm.chainer_backend.lm.DefaultRNNLM static method)
(espnet.nets.asr_interface.ASRInterface static method)
(espnet.nets.chainer_backend.e2e_asr.E2E static method)
(espnet.nets.chainer_backend.e2e_asr_transformer.E2E static method)
(espnet.nets.lm_interface.LMInterface static method)
(espnet.nets.mt_interface.MTInterface static method)
(espnet.nets.pytorch_backend.e2e_asr.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_conformer.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_maskctc.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_mix.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_mix_transformer.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E static method)
(espnet.nets.pytorch_backend.e2e_mt.E2E static method)
(espnet.nets.pytorch_backend.e2e_mt_transformer.E2E static method)
(espnet.nets.pytorch_backend.e2e_st.E2E static method)
(espnet.nets.pytorch_backend.e2e_st_conformer.E2E static method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E static method)
(espnet.nets.pytorch_backend.e2e_tts_fastspeech.FeedForwardTransformer static method)
(espnet.nets.pytorch_backend.e2e_tts_tacotron2.Tacotron2 static method)
(espnet.nets.pytorch_backend.e2e_tts_transformer.Transformer static method)
(espnet.nets.pytorch_backend.e2e_vc_tacotron2.Tacotron2 static method)
(espnet.nets.pytorch_backend.e2e_vc_transformer.Transformer static method)
(espnet.nets.pytorch_backend.lm.default.DefaultRNNLM static method)
(espnet.nets.pytorch_backend.lm.seq_rnn.SequentialRNNLM static method)
(espnet.nets.pytorch_backend.lm.transformer.TransformerLM static method)
(espnet.nets.tts_interface.TTSInterface static method)
(espnet.optimizer.chainer.AdadeltaFactory static method)
(espnet.optimizer.chainer.AdamFactory static method)
(espnet.optimizer.chainer.SGDFactory static method)
(espnet.optimizer.factory.OptimizerFactoryInterface static method)
(espnet.optimizer.pytorch.AdadeltaFactory static method)
(espnet.optimizer.pytorch.AdamFactory static method)
(espnet.optimizer.pytorch.SGDFactory static method)
(espnet.scheduler.scheduler.SchedulerInterface class method)
(espnet.transform.functional.FuncTrans class method)
(espnet.transform.transform_interface.TransformInterface class method)
(espnet2.train.class_choices.ClassChoices method)
(espnet2.train.gan_trainer.GANTrainer class method)
(espnet2.train.trainer.Trainer class method)
(espnet2.train.uasr_trainer.UASRTrainer class method)
(in module espnet2.bin.pack)
add_arguments_conformer_common() (in module espnet.nets.pytorch_backend.conformer.argument)
add_arguments_rnn_attention_common() (in module espnet.nets.pytorch_backend.rnn.argument)
add_arguments_rnn_decoder_common() (in module espnet.nets.pytorch_backend.rnn.argument)
add_arguments_rnn_encoder_common() (in module espnet.nets.pytorch_backend.rnn.argument)
add_arguments_transformer_common() (in module espnet.nets.pytorch_backend.transformer.argument)
add_auxiliary_task_arguments() (in module espnet.nets.pytorch_backend.transducer.arguments)
add_conformer_arguments() (espnet.nets.pytorch_backend.e2e_asr_conformer.E2E static method)
(espnet.nets.pytorch_backend.e2e_st_conformer.E2E static method)
add_custom_decoder_arguments() (in module espnet.nets.pytorch_backend.transducer.arguments)
add_custom_encoder_arguments() (in module espnet.nets.pytorch_backend.transducer.arguments)
add_custom_training_arguments() (in module espnet.nets.pytorch_backend.transducer.arguments)
add_decoder_general_arguments() (in module espnet.nets.pytorch_backend.transducer.arguments)
add_deltas() (in module espnet.transform.add_deltas)
add_encoder_general_arguments() (in module espnet.nets.pytorch_backend.transducer.arguments)
add_gradient_noise() (in module espnet.asr.asr_utils)
(in module espnet2.torch_utils.add_gradient_noise)
add_maskctc_arguments() (espnet.nets.pytorch_backend.e2e_asr_maskctc.E2E static method)
add_optimizer_hooks() (in module espnet2.optimizers.optim_groups)
add_prefix_postfix() (espnet2.asr.decoder.hugging_face_transformers_decoder.HuggingFaceTransformersDecoder method)
add_results_to_json() (in module espnet.asr.asr_mix_utils)
(in module espnet.asr.asr_utils)
(in module espnet.mt.mt_utils)
add_rnn_decoder_arguments() (in module espnet.nets.pytorch_backend.transducer.arguments)
add_rnn_encoder_arguments() (in module espnet.nets.pytorch_backend.transducer.arguments)
add_sos_eos() (in module espnet.nets.pytorch_backend.transformer.add_sos_eos)
add_task_arguments() (espnet2.tasks.abs_task.AbsTask class method)
(espnet2.tasks.asr.ASRTask class method)
(espnet2.tasks.asr_transducer.ASRTransducerTask class method)
(espnet2.tasks.asvspoof.ASVSpoofTask class method)
(espnet2.tasks.diar.DiarizationTask class method)
(espnet2.tasks.enh.EnhancementTask class method)
(espnet2.tasks.enh_s2t.EnhS2TTask class method)
(espnet2.tasks.enh_tse.TargetSpeakerExtractionTask class method)
(espnet2.tasks.gan_svs.GANSVSTask class method)
(espnet2.tasks.gan_tts.GANTTSTask class method)
(espnet2.tasks.hubert.HubertTask class method)
(espnet2.tasks.lm.LMTask class method)
(espnet2.tasks.mt.MTTask class method)
(espnet2.tasks.s2st.S2STTask class method)
(espnet2.tasks.s2t.S2TTask class method)
(espnet2.tasks.slu.SLUTask class method)
(espnet2.tasks.spk.SpeakerTask class method)
(espnet2.tasks.st.STTask class method)
(espnet2.tasks.svs.SVSTask class method)
(espnet2.tasks.tts.TTSTask class method)
(espnet2.tasks.uasr.UASRTask class method)
add_transducer_arguments() (in module espnet.nets.pytorch_backend.transducer.arguments)
AddDeltas (class in espnet.transform.add_deltas)
addfile() (espnet2.main_funcs.pack_funcs.Archiver method)
Affine (class in espnet2.asr.state_spaces.residual)
AFMS (class in espnet2.spk.layers.rawnet_block)
aggregate() (espnet2.spk.espnet_model.ESPnetSpeakerModel method)
(in module espnet2.train.reporter)
aggregate_stats_dirs() (in module espnet2.bin.aggregate_stats_dirs)
alias (espnet.scheduler.scheduler.CyclicCosineScheduler attribute)
(espnet.scheduler.scheduler.NoScheduler attribute)
(espnet.scheduler.scheduler.NoamScheduler attribute)
(espnet.scheduler.scheduler.SchedulerInterface attribute)
align_length_sync_decoding() (espnet.nets.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer_streaming.BeamSearchTransducerStreaming method)
(espnet2.asr_transducer.beam_search_transducer.BeamSearchTransducer method)
AlignmentModule (class in espnet2.gan_tts.jets.alignments)
AllHeadPReLULayerNormalization4DCF (class in espnet2.enh.separator.tfgridnetv2_separator)
amp_to_impulse_response() (in module espnet2.gan_svs.visinger2.ddsp)
analysis() (espnet2.gan_tts.melgan.pqmf.PQMF method)
AnnealedLangevinDynamics (class in espnet2.enh.diffusion.sampling.correctors)
any_allzero() (in module espnet2.train.preprocessor)
append_token() (espnet.nets.beam_search.BeamSearch static method)
apply_beamforming() (espnet2.enh.layers.dnn_beamformer.DNN_Beamformer method)
apply_beamforming_vector() (in module espnet.nets.pytorch_backend.frontends.beamformer)
(in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
apply_frontend() (espnet2.bin.asr_inference_streaming.Speech2TextStreaming method)
(espnet2.bin.st_inference_streaming.Speech2TextStreaming method)
apply_interpolation() (in module espnet.utils.spec_augment)
apply_masks() (espnet2.enh.separator.dccrn_separator.DCCRNSeparator method)
apply_spectral_norm() (espnet2.gan_tts.hifigan.__init__.HiFiGANPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANScaleDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANScaleDiscriminator method)
apply_weight_norm() (espnet2.gan_svs.avocodo.__init__.AvocodoGenerator method)
(espnet2.gan_svs.avocodo.avocodo.AvocodoGenerator method)
(espnet2.gan_svs.uhifigan.__init__.UHiFiGANGenerator method)
(espnet2.gan_svs.uhifigan.uhifigan.UHiFiGANGenerator method)
(espnet2.gan_svs.visinger2.__init__.VISinger2VocoderGenerator method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.VISinger2VocoderGenerator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANGenerator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANScaleDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANGenerator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANScaleDiscriminator method)
(espnet2.gan_tts.melgan.melgan.MelGANGenerator method)
(espnet2.gan_tts.melgan.melgan.MelGANMultiScaleDiscriminator method)
(espnet2.gan_tts.parallel_wavegan.__init__.ParallelWaveGANDiscriminator method)
(espnet2.gan_tts.parallel_wavegan.__init__.ParallelWaveGANGenerator method)
(espnet2.gan_tts.parallel_wavegan.parallel_wavegan.ParallelWaveGANDiscriminator method)
(espnet2.gan_tts.parallel_wavegan.parallel_wavegan.ParallelWaveGANGenerator method)
(espnet2.gan_tts.style_melgan.style_melgan.StyleMelGANDiscriminator method)
(espnet2.gan_tts.style_melgan.style_melgan.StyleMelGANGenerator method)
(espnet2.gan_tts.wavenet.wavenet.WaveNet method)
Archiver (class in espnet2.main_funcs.pack_funcs)
ArcMarginProduct_intertopk_subcenter (class in espnet2.spk.loss.aamsoftmax_subcenter_intertopk)
argmax() (espnet.nets.pytorch_backend.ctc.CTC method)
(espnet2.asr.ctc.CTC method)
ArgsComplexMultiplicationWrapper (class in espnet2.enh.layers.dcunet)
ArgumentParser (class in espnet2.utils.config_argparse)
asdict() (espnet.nets.beam_search.Hypothesis method)
asr_pit_loss() (espnet2.enh.espnet_enh_s2t_model.ESPnetEnhS2TModel method)
ASRInterface (class in espnet.nets.asr_interface)
ASRPackedContents (class in espnet2.bin.pack)
ASRTask (class in espnet2.tasks.asr)
ASRTransducerTask (class in espnet2.tasks.asr_transducer)
assemble_hyps() (espnet.nets.batch_beam_search_online.BatchBeamSearchOnline method)
(espnet2.bin.asr_inference_streaming.Speech2TextStreaming method)
(espnet2.bin.st_inference_streaming.Speech2TextStreaming method)
assert_scipy_wav_style() (in module espnet.utils.cli_utils)
AsteroidFrontend (class in espnet2.asr.frontend.asteroid_frontend)
AsteroidModel_Converter (class in espnet2.enh.separator.asteroid_models)
ASVSpoofAMSoftmaxLoss (class in espnet2.asvspoof.loss.am_softmax_loss)
ASVSpoofBinaryLoss (class in espnet2.asvspoof.loss.binary_loss)
ASVSpoofOCSoftmaxLoss (class in espnet2.asvspoof.loss.oc_softmax_loss)
ASVSpoofTask (class in espnet2.tasks.asvspoof)
ATFBlock (class in espnet2.enh.layers.uses)
att_for() (in module espnet.nets.chainer_backend.rnn.attentions)
(in module espnet.nets.pytorch_backend.rnn.attentions)
att_to_numpy() (in module espnet.nets.pytorch_backend.rnn.attentions)
AttAdd (class in espnet.nets.pytorch_backend.rnn.attentions)
AttCov (class in espnet.nets.pytorch_backend.rnn.attentions)
AttCovLoc (class in espnet.nets.pytorch_backend.rnn.attentions)
AttDot (class in espnet.nets.chainer_backend.rnn.attentions)
(class in espnet.nets.pytorch_backend.rnn.attentions)
attention_add_arguments() (espnet.nets.pytorch_backend.e2e_asr.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E static method)
(espnet.nets.pytorch_backend.e2e_mt.E2E static method)
(espnet.nets.pytorch_backend.e2e_st.E2E static method)
attention_dropout (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
attention_plot_class() (espnet.nets.asr_interface.ASRInterface property)
(espnet.nets.chainer_backend.e2e_asr_transformer.E2E property)
(espnet.nets.mt_interface.MTInterface property)
(espnet.nets.pytorch_backend.e2e_asr_transducer.E2E property)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E property)
(espnet.nets.pytorch_backend.e2e_mt_transformer.E2E property)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E property)
(espnet.nets.pytorch_backend.e2e_tts_fastspeech.FeedForwardTransformer property)
(espnet.nets.pytorch_backend.e2e_tts_transformer.Transformer property)
(espnet.nets.pytorch_backend.e2e_vc_transformer.Transformer property)
(espnet.nets.tts_interface.TTSInterface property)
AttentionReference (class in espnet.nets.pytorch_backend.frontends.dnn_beamformer)
(class in espnet2.enh.layers.dnn_beamformer)
AttForward (class in espnet.nets.pytorch_backend.rnn.attentions)
AttForwardTA (class in espnet.nets.pytorch_backend.rnn.attentions)
AttLoc (class in espnet.nets.chainer_backend.rnn.attentions)
(class in espnet.nets.pytorch_backend.rnn.attentions)
AttLoc2D (class in espnet.nets.pytorch_backend.rnn.attentions)
AttLocRec (class in espnet.nets.pytorch_backend.rnn.attentions)
AttMultiHeadAdd (class in espnet.nets.pytorch_backend.rnn.attentions)
AttMultiHeadDot (class in espnet.nets.pytorch_backend.rnn.attentions)
AttMultiHeadLoc (class in espnet.nets.pytorch_backend.rnn.attentions)
AttMultiHeadMultiResLoc (class in espnet.nets.pytorch_backend.rnn.attentions)
AttnBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
AttnBlockpp (class in espnet2.enh.layers.ncsnpp_utils.layerspp)
attractor_loss() (espnet2.diar.espnet_model.ESPnetDiarizationModel method)
audio_dropout (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
audio_feat_dim (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
audio_melspec() (espnet2.enh.layers.dnsmos.DNSMOS_local method)
audio_only (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
auxiliary_task_add_arguments() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
Average (class in espnet2.train.reporter)
average_by_duration() (in module espnet2.gan_tts.jets.alignments)
average_nbest_models() (in module espnet2.main_funcs.average_nbest_models)
AVHubertConfig (class in espnet2.asr.encoder.avhubert_encoder)
AVHubertModel (class in espnet2.asr.encoder.avhubert_encoder)
AvocodoDiscriminator (class in espnet2.gan_svs.avocodo.__init__)
(class in espnet2.gan_svs.avocodo.avocodo)
AvocodoDiscriminatorPlus (class in espnet2.gan_svs.avocodo.__init__)
(class in espnet2.gan_svs.avocodo.avocodo)
AvocodoGenerator (class in espnet2.gan_svs.avocodo.__init__)
(class in espnet2.gan_svs.avocodo.avocodo)
B
backward() (espnet.nets.chainer_backend.deterministic_embed_id.EmbedIDFunction method)
(espnet.nets.chainer_backend.deterministic_embed_id.EmbedIDGrad method)
(espnet.nets.pytorch_backend.gtn_ctc.GTNCTCLossFunction static method)
(espnet2.asr.encoder.avhubert_encoder.GradMultiply static method)
(espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt.LogSoftmaxGradModification static method)
(espnet2.asr_transducer.decoder.modules.rwkv.attention.WKVLinearAttention static method)
bandpass_filtering() (in module espnet2.layers.augmentation)
BandpassPerturbation (class in espnet.transform.perturb)
bandreject_filtering() (in module espnet2.layers.augmentation)
bank() (espnet2.layers.sinc_conv.BarkScale class method)
(espnet2.layers.sinc_conv.MelScale class method)
BarkScale (class in espnet2.layers.sinc_conv)
base_plot_keys() (espnet.nets.pytorch_backend.e2e_tts_fastspeech.FeedForwardTransformer property)
(espnet.nets.pytorch_backend.e2e_tts_tacotron2.Tacotron2 property)
(espnet.nets.pytorch_backend.e2e_tts_transformer.Transformer property)
(espnet.nets.pytorch_backend.e2e_vc_tacotron2.Tacotron2 property)
(espnet.nets.pytorch_backend.e2e_vc_transformer.Transformer property)
(espnet.nets.tts_interface.TTSInterface property)
BaseEvaluator (class in espnet.utils.training.evaluator)
BaseFrequenceDiscriminator (class in espnet2.gan_svs.visinger2.visinger2_vocoder)
BaseTransformerDecoder (class in espnet2.asr.decoder.transformer_decoder)
BaseWriter (class in espnet.utils.cli_writers)
BasicBlock (class in espnet2.asr.encoder.avhubert_encoder)
BasicNorm (class in espnet2.asr_transducer.normalization)
batch_beam() (espnet.nets.batch_beam_search.BatchBeamSearch method)
batch_broadcast() (in module espnet2.enh.diffusion.sdes)
batch_init_state() (espnet.nets.scorer_interface.BatchScorerInterface method)
(espnet.nets.scorers.ctc.CTCPrefixScorer method)
(espnet.nets.scorers.uasr.UASRPrefixScorer method)
batch_score() (espnet.nets.pytorch_backend.lm.default.DefaultRNNLM method)
(espnet.nets.pytorch_backend.lm.transformer.TransformerLM method)
(espnet.nets.pytorch_backend.transducer.custom_decoder.CustomDecoder method)
(espnet.nets.pytorch_backend.transducer.rnn_decoder.RNNDecoder method)
(espnet.nets.pytorch_backend.transformer.decoder.Decoder method)
(espnet.nets.scorer_interface.BatchScorerInterface method)
(espnet.nets.scorers.length_bonus.LengthBonus method)
(espnet.nets.transducer_decoder_interface.TransducerDecoderInterface method)
(espnet2.asr.decoder.hugging_face_transformers_decoder.HuggingFaceTransformersDecoder method)
(espnet2.asr.decoder.s4_decoder.S4Decoder method)
(espnet2.asr.decoder.transducer_decoder.TransducerDecoder method)
(espnet2.asr.decoder.transformer_decoder.BaseTransformerDecoder method)
(espnet2.asr.decoder.transformer_decoder.TransformerMDDecoder method)
(espnet2.asr.decoder.whisper_decoder.OpenAIWhisperDecoder method)
(espnet2.asr_transducer.decoder.abs_decoder.AbsDecoder method)
(espnet2.asr_transducer.decoder.mega_decoder.MEGADecoder method)
(espnet2.asr_transducer.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr_transducer.decoder.rwkv_decoder.RWKVDecoder method)
(espnet2.asr_transducer.decoder.stateless_decoder.StatelessDecoder method)
(espnet2.bin.s2t_inference.ScoreFilter method)
(espnet2.lm.huggingface_pretrained_opt_lm.HuggingfaceOPTModel method)
(espnet2.lm.seq_rnn_lm.SequentialRNNLM method)
(espnet2.lm.transformer_lm.TransformerLM method)
(espnet2.s2st.synthesizer.discrete_synthesizer.TransformerDiscreteSynthesizer method)
batch_score_partial() (espnet.nets.scorer_interface.BatchPartialScorerInterface method)
(espnet.nets.scorers.ctc.CTCPrefixScorer method)
BatchBeamSearch (class in espnet.nets.batch_beam_search)
BatchBeamSearchOnline (class in espnet.nets.batch_beam_search_online)
BatchBeamSearchOnlineSim (class in espnet.nets.batch_beam_search_online_sim)
batchfy() (espnet.nets.batch_beam_search.BatchBeamSearch method)
batchfy_by_bin() (in module espnet.utils.training.batchfy)
batchfy_by_frame() (in module espnet.utils.training.batchfy)
batchfy_by_seq() (in module espnet.utils.training.batchfy)
batchfy_shuffle() (in module espnet.utils.training.batchfy)
BatchHypothesis (class in espnet.nets.batch_beam_search)
batchify_nll() (espnet2.asr.espnet_model.ESPnetASRModel method)
(espnet2.asr.maskctc_model.MaskCTCModel method)
(espnet2.enh.espnet_enh_s2t_model.ESPnetEnhS2TModel method)
(espnet2.lm.espnet_model.ESPnetLanguageModel method)
(espnet2.lm.espnet_model_multitask.ESPnetMultitaskLanguageModel method)
BatchNorm (class in espnet2.enh.layers.dcunet)
BatchPartialScorerInterface (class in espnet.nets.scorer_interface)
BatchScorerInterface (class in espnet.nets.scorer_interface)
beam() (espnet.nets.beam_search.BeamSearch method)
beam_search() (in module espnet.nets.beam_search)
BeamSearch (class in espnet.nets.beam_search)
BeamSearchTimeSync (class in espnet.nets.beam_search_timesync)
BeamSearchTimeSyncStreaming (class in espnet.nets.beam_search_timesync_streaming)
BeamSearchTransducer (class in espnet.nets.beam_search_transducer)
(class in espnet2.asr.transducer.beam_search_transducer)
(class in espnet2.asr_transducer.beam_search_transducer)
BeamSearchTransducerStreaming (class in espnet2.asr.transducer.beam_search_transducer_streaming)
BF_module (class in espnet2.enh.layers.fasnet)
blind_analytic_normalization() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
bn_padded_data() (espnet2.uasr.generator.conv_generator.ConvGenerator method)
Bottle2neck (class in espnet2.spk.encoder.ska_tdnn_encoder)
(class in espnet2.spk.layers.rawnet_block)
BPTTUpdater (class in espnet.lm.chainer_backend.lm)
(class in espnet.lm.pytorch_backend.lm)
Branchformer (class in espnet2.asr_transducer.encoder.blocks.branchformer)
BranchformerEncoder (class in espnet2.asr.encoder.branchformer_encoder)
BranchformerEncoderLayer (class in espnet2.asr.encoder.branchformer_encoder)
buff_predict() (espnet.nets.pytorch_backend.lm.default.ClassifierWithState method)
build() (espnet.nets.asr_interface.ASRInterface class method)
(espnet.nets.lm_interface.LMInterface class method)
(espnet.nets.mt_interface.MTInterface class method)
(espnet.optimizer.factory.OptimizerFactoryInterface class method)
(espnet.scheduler.scheduler.SchedulerInterface class method)
build_attention_list() (in module espnet2.asr.decoder.rnn_decoder)
build_batch_sampler() (in module espnet2.samplers.build_batch_sampler)
build_blocks() (in module espnet.nets.pytorch_backend.transducer.blocks)
build_body_blocks() (in module espnet2.asr_transducer.encoder.building)
build_branchformer_block() (in module espnet2.asr_transducer.encoder.building)
build_category_iter_factory() (espnet2.tasks.abs_task.AbsTask class method)
build_chunk_iter_factory() (espnet2.tasks.abs_task.AbsTask class method)
build_collate_fn() (espnet2.tasks.abs_task.AbsTask class method)
(espnet2.tasks.asr.ASRTask class method)
(espnet2.tasks.asr_transducer.ASRTransducerTask class method)
(espnet2.tasks.asvspoof.ASVSpoofTask class method)
(espnet2.tasks.diar.DiarizationTask class method)
(espnet2.tasks.enh.EnhancementTask class method)
(espnet2.tasks.enh_s2t.EnhS2TTask class method)
(espnet2.tasks.enh_tse.TargetSpeakerExtractionTask class method)
(espnet2.tasks.gan_svs.GANSVSTask class method)
(espnet2.tasks.gan_tts.GANTTSTask class method)
(espnet2.tasks.hubert.HubertTask class method)
(espnet2.tasks.lm.LMTask class method)
(espnet2.tasks.mt.MTTask class method)
(espnet2.tasks.s2st.S2STTask class method)
(espnet2.tasks.s2t.S2TTask class method)
(espnet2.tasks.spk.SpeakerTask class method)
(espnet2.tasks.st.STTask class method)
(espnet2.tasks.svs.SVSTask class method)
(espnet2.tasks.tts.TTSTask class method)
(espnet2.tasks.uasr.UASRTask class method)
build_conformer_block() (in module espnet.nets.pytorch_backend.transducer.blocks)
(in module espnet2.asr_transducer.encoder.building)
build_conv1d_block() (in module espnet.nets.pytorch_backend.transducer.blocks)
(in module espnet2.asr_transducer.encoder.building)
build_dataclass() (in module espnet2.utils.build_dataclass)
build_ebranchformer_block() (in module espnet2.asr_transducer.encoder.building)
build_input_block() (in module espnet2.asr_transducer.encoder.building)
build_input_layer() (in module espnet.nets.pytorch_backend.transducer.blocks)
build_iter() (espnet2.iterators.abs_iter_factory.AbsIterFactory method)
(espnet2.iterators.category_iter_factory.CategoryIterFactory method)
(espnet2.iterators.chunk_iter_factory.ChunkIterFactory method)
(espnet2.iterators.multiple_iter_factory.MultipleIterFactory method)
(espnet2.iterators.sequence_iter_factory.SequenceIterFactory method)
build_iter_factory() (espnet2.tasks.abs_task.AbsTask class method)
(espnet2.tasks.enh.EnhancementTask class method)
build_iter_options() (espnet2.tasks.abs_task.AbsTask class method)
build_main_parameters() (in module espnet2.asr_transducer.encoder.building)
build_model() (espnet2.asr.encoder.avhubert_encoder.AVHubertModel class method)
(espnet2.tasks.abs_task.AbsTask class method)
(espnet2.tasks.asr.ASRTask class method)
(espnet2.tasks.asr_transducer.ASRTransducerTask class method)
(espnet2.tasks.asvspoof.ASVSpoofTask class method)
(espnet2.tasks.diar.DiarizationTask class method)
(espnet2.tasks.enh.EnhancementTask class method)
(espnet2.tasks.enh_s2t.EnhS2TTask class method)
(espnet2.tasks.enh_tse.TargetSpeakerExtractionTask class method)
(espnet2.tasks.gan_svs.GANSVSTask class method)
(espnet2.tasks.gan_tts.GANTTSTask class method)
(espnet2.tasks.hubert.HubertTask class method)
(espnet2.tasks.lm.LMTask class method)
(espnet2.tasks.mt.MTTask class method)
(espnet2.tasks.s2st.S2STTask class method)
(espnet2.tasks.s2t.S2TTask class method)
(espnet2.tasks.slu.SLUTask class method)
(espnet2.tasks.spk.SpeakerTask class method)
(espnet2.tasks.st.STTask class method)
(espnet2.tasks.svs.SVSTask class method)
(espnet2.tasks.tts.TTSTask class method)
(espnet2.tasks.uasr.UASRTask class method)
build_model_from_args_and_file() (in module espnet2.bin.enh_inference)
(in module espnet2.bin.enh_tse_inference)
build_model_from_file() (espnet2.tasks.abs_task.AbsTask class method)
build_multiple_iter_factory() (espnet2.tasks.abs_task.AbsTask class method)
build_optimizers() (espnet2.tasks.abs_task.AbsTask class method)
(espnet2.tasks.gan_svs.GANSVSTask class method)
(espnet2.tasks.gan_tts.GANTTSTask class method)
(espnet2.tasks.uasr.UASRTask class method)
build_options() (espnet2.train.gan_trainer.GANTrainer class method)
(espnet2.train.trainer.Trainer class method)
(espnet2.train.uasr_trainer.UASRTrainer class method)
build_positional_encoding() (in module espnet2.asr_transducer.encoder.building)
build_preprocess_fn() (espnet2.tasks.abs_task.AbsTask class method)
(espnet2.tasks.asr.ASRTask class method)
(espnet2.tasks.asr_transducer.ASRTransducerTask class method)
(espnet2.tasks.asvspoof.ASVSpoofTask class method)
(espnet2.tasks.diar.DiarizationTask class method)
(espnet2.tasks.enh.EnhancementTask class method)
(espnet2.tasks.enh_s2t.EnhS2TTask class method)
(espnet2.tasks.enh_tse.TargetSpeakerExtractionTask class method)
(espnet2.tasks.gan_svs.GANSVSTask class method)
(espnet2.tasks.gan_tts.GANTTSTask class method)
(espnet2.tasks.hubert.HubertTask class method)
(espnet2.tasks.lm.LMTask class method)
(espnet2.tasks.mt.MTTask class method)
(espnet2.tasks.s2st.S2STTask class method)
(espnet2.tasks.s2t.S2TTask class method)
(espnet2.tasks.slu.SLUTask class method)
(espnet2.tasks.spk.SpeakerTask class method)
(espnet2.tasks.st.STTask class method)
(espnet2.tasks.svs.SVSTask class method)
(espnet2.tasks.tts.TTSTask class method)
(espnet2.tasks.uasr.UASRTask class method)
build_sequence_iter_factory() (espnet2.tasks.abs_task.AbsTask class method)
build_streaming_iterator() (espnet2.tasks.abs_task.AbsTask class method)
build_task_iter_factory() (espnet2.tasks.abs_task.AbsTask class method)
build_tokenizer() (in module espnet2.text.build_tokenizer)
build_transformer_block() (in module espnet.nets.pytorch_backend.transducer.blocks)
build_vocoder_from_file() (espnet2.tasks.s2st.S2STTask class method)
(espnet2.tasks.svs.SVSTask class method)
(espnet2.tasks.tts.TTSTask class method)
C
cached_score() (espnet.nets.beam_search_timesync.BeamSearchTimeSync method)
(espnet.nets.beam_search_timesync_streaming.BeamSearchTimeSyncStreaming method)
CacheItem (class in espnet.nets.beam_search_timesync)
(class in espnet.nets.beam_search_timesync_streaming)
cal_permumation() (espnet2.bin.diar_inference.DiarizeSpeech method)
(espnet2.bin.enh_inference.SeparateSpeech method)
(espnet2.bin.enh_tse_inference.SeparateSpeech method)
calc_diarization_error() (espnet2.diar.espnet_model.ESPnetDiarizationModel static method)
calc_perplexity() (in module espnet2.bin.lm_calc_perplexity)
calculate_all_attentions() (espnet.nets.asr_interface.ASRInterface method)
(espnet.nets.chainer_backend.e2e_asr.E2E method)
(espnet.nets.chainer_backend.e2e_asr_transformer.E2E method)
(espnet.nets.chainer_backend.rnn.decoders.Decoder method)
(espnet.nets.mt_interface.MTInterface method)
(espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transducer.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_mt.E2E method)
(espnet.nets.pytorch_backend.e2e_mt_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_tts_fastspeech.FeedForwardTransformer method)
(espnet.nets.pytorch_backend.e2e_tts_tacotron2.Tacotron2 method)
(espnet.nets.pytorch_backend.e2e_tts_transformer.Transformer method)
(espnet.nets.pytorch_backend.e2e_vc_tacotron2.Tacotron2 method)
(espnet.nets.pytorch_backend.e2e_vc_transformer.Transformer method)
(espnet.nets.pytorch_backend.rnn.decoders.Decoder method)
(espnet.nets.pytorch_backend.tacotron2.decoder.Decoder method)
(espnet.nets.tts_interface.TTSInterface method)
(in module espnet2.main_funcs.calculate_all_attentions)
calculate_all_ctc_probs() (espnet.nets.asr_interface.ASRInterface method)
(espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
calculate_attentions() (espnet.nets.chainer_backend.e2e_asr_transformer.E2E method)
calculate_bleu_ctc() (espnet.nets.e2e_mt_common.ErrorCalculator method)
calculate_cer() (espnet.nets.e2e_asr_common.ErrorCalculator method)
(espnet.nets.pytorch_backend.transducer.error_calculator.ErrorCalculator method)
(espnet2.asr.transducer.error_calculator.ErrorCalculatorTransducer method)
(espnet2.asr_transducer.error_calculator.ErrorCalculator method)
calculate_cer_ctc() (espnet.nets.e2e_asr_common.ErrorCalculator method)
calculate_corpus_bleu() (espnet.nets.e2e_mt_common.ErrorCalculator method)
calculate_wer() (espnet.nets.e2e_asr_common.ErrorCalculator method)
(espnet.nets.pytorch_backend.transducer.error_calculator.ErrorCalculator method)
(espnet2.asr.transducer.error_calculator.ErrorCalculatorTransducer method)
(espnet2.asr_transducer.error_calculator.ErrorCalculator method)
cast_mask_emb() (espnet2.asr.encoder.hubert_encoder.FairseqHubertPretrainEncoder method)
cat() (in module espnet2.enh.layers.complex_utils)
CategoryBalancedSampler (class in espnet2.samplers.category_balanced_sampler)
CategoryIterFactory (class in espnet2.iterators.category_iter_factory)
cauchy_naive() (in module espnet2.asr.state_spaces.s4)
CausalConv1d (class in espnet.nets.pytorch_backend.transducer.conv1d_nets)
(class in espnet.nets.pytorch_backend.wavenet)
CBHG (class in espnet.nets.pytorch_backend.tacotron2.cbhg)
CBHGLoss (class in espnet.nets.pytorch_backend.tacotron2.cbhg)
chainer_load() (in module espnet.asr.asr_utils)
ChainerASRInterface (class in espnet.nets.chainer_backend.asr_interface)
ChainerDataLoader (class in espnet.utils.dataset)
ChainerScheduler (class in espnet.scheduler.chainer)
ChannelAttention (class in espnet2.enh.layers.uses)
ChannelSelector (class in espnet.transform.channel_selector)
ChannelTAC (class in espnet2.enh.layers.uses)
ChannelwiseLayerNorm (class in espnet2.diar.layers.tcn_nomask)
(class in espnet2.enh.layers.tcn)
char_probs (espnet2.bin.asr_align.CTCSegmentationTask attribute)
CharTokenizer (class in espnet2.text.char_tokenizer)
check_batch_states() (in module espnet.nets.pytorch_backend.transducer.utils)
check_early_stop() (in module espnet.utils.training.train_utils)
check_early_stopping() (espnet2.train.reporter.Reporter method)
check_kwargs() (in module espnet.utils.check_kwargs)
check_nonlinear() (in module espnet2.diar.layers.tcn_nomask)
(in module espnet2.enh.layers.tcn)
check_required_command_args() (espnet2.tasks.abs_task.AbsTask class method)
check_short_utt() (in module espnet.nets.pytorch_backend.transformer.subsampling)
(in module espnet2.asr_transducer.utils)
check_state() (in module espnet.nets.pytorch_backend.transducer.utils)
check_target_module_exists() (in module espnet2.layers.create_adapter_utils)
check_task_requirements() (espnet2.tasks.abs_task.AbsTask class method)
check_type_forward() (espnet.nets.chainer_backend.deterministic_embed_id.EmbedIDFunction method)
ChnAttnStatPooling (class in espnet2.spk.pooling.chn_attn_stat_pooling)
choices() (espnet2.train.class_choices.ClassChoices method)
choices_text_converter (espnet2.bin.asr_align.CTCSegmentation attribute)
choices_time_stamps (espnet2.bin.asr_align.CTCSegmentation attribute)
Chomp1d (class in espnet2.diar.layers.tcn_nomask)
(class in espnet2.enh.layers.tcn)
choose_norm() (in module espnet2.enh.layers.tcn)
chose_norm() (in module espnet2.diar.layers.tcn_nomask)
chunk_forward() (espnet2.asr_transducer.encoder.blocks.branchformer.Branchformer method)
(espnet2.asr_transducer.encoder.blocks.conformer.Conformer method)
(espnet2.asr_transducer.encoder.blocks.conv1d.Conv1d method)
(espnet2.asr_transducer.encoder.blocks.ebranchformer.EBranchformer method)
(espnet2.asr_transducer.encoder.encoder.Encoder method)
(espnet2.asr_transducer.encoder.modules.multi_blocks.MultiBlocks method)
ChunkIterFactory (class in espnet2.iterators.chunk_iter_factory)
CISDRLoss (class in espnet2.enh.loss.criterions.time_domain)
clamp_db (espnet2.enh.loss.criterions.time_domain.SISNRLoss attribute)
class_choices_list (espnet2.tasks.abs_task.AbsTask attribute)
(espnet2.tasks.asr.ASRTask attribute)
(espnet2.tasks.asr_transducer.ASRTransducerTask attribute)
(espnet2.tasks.asvspoof.ASVSpoofTask attribute)
(espnet2.tasks.diar.DiarizationTask attribute)
(espnet2.tasks.enh.EnhancementTask attribute)
(espnet2.tasks.enh_s2t.EnhS2TTask attribute)
(espnet2.tasks.enh_tse.TargetSpeakerExtractionTask attribute)
(espnet2.tasks.gan_svs.GANSVSTask attribute)
(espnet2.tasks.gan_tts.GANTTSTask attribute)
(espnet2.tasks.hubert.HubertTask attribute)
(espnet2.tasks.lm.LMTask attribute)
(espnet2.tasks.mt.MTTask attribute)
(espnet2.tasks.s2st.S2STTask attribute)
(espnet2.tasks.s2t.S2TTask attribute)
(espnet2.tasks.slu.SLUTask attribute)
(espnet2.tasks.spk.SpeakerTask attribute)
(espnet2.tasks.st.STTask attribute)
(espnet2.tasks.svs.SVSTask attribute)
(espnet2.tasks.tts.TTSTask attribute)
(espnet2.tasks.uasr.UASRTask attribute)
ClassChoices (class in espnet2.train.class_choices)
ClassifierWithState (class in espnet.lm.chainer_backend.lm)
(class in espnet.nets.pytorch_backend.lm.default)
clipping() (in module espnet2.layers.augmentation)
close() (espnet.utils.cli_writers.BaseWriter method)
(espnet.utils.io_utils.SoundHDF5File method)
(espnet2.fileio.datadir_writer.DatadirWriter method)
(espnet2.fileio.npy_scp.NpyScpWriter method)
(espnet2.fileio.score_scp.SingingScoreWriter method)
(espnet2.fileio.score_scp.XMLWriter method)
(espnet2.fileio.sound_scp.SoundScpWriter method)
(espnet2.fileio.vad_scp.VADScpWriter method)
(espnet2.main_funcs.pack_funcs.Archiver method)
CMVN (class in espnet.transform.cmvn)
codecs() (in module espnet2.layers.augmentation)
collect_feats() (espnet2.asr.espnet_model.ESPnetASRModel method)
(espnet2.asr_transducer.espnet_transducer_model.ESPnetASRTransducerModel method)
(espnet2.asvspoof.espnet_model.ESPnetASVSpoofModel method)
(espnet2.diar.espnet_model.ESPnetDiarizationModel method)
(espnet2.enh.diffusion_enh.ESPnetDiffusionModel method)
(espnet2.enh.espnet_enh_s2t_model.ESPnetEnhS2TModel method)
(espnet2.enh.espnet_model.ESPnetEnhancementModel method)
(espnet2.enh.espnet_model_tse.ESPnetExtractionModel method)
(espnet2.gan_svs.espnet_model.ESPnetGANSVSModel method)
(espnet2.gan_tts.espnet_model.ESPnetGANTTSModel method)
(espnet2.hubert.espnet_model.HubertPretrainModel method)
(espnet2.hubert.espnet_model.TorchAudioHubertPretrainModel method)
(espnet2.lm.espnet_model.ESPnetLanguageModel method)
(espnet2.lm.espnet_model_multitask.ESPnetMultitaskLanguageModel method)
(espnet2.mt.espnet_model.ESPnetMTModel method)
(espnet2.s2st.espnet_model.ESPnetS2STModel method)
(espnet2.s2t.espnet_model.ESPnetS2TModel method)
(espnet2.slu.espnet_model.ESPnetSLUModel method)
(espnet2.spk.espnet_model.ESPnetSpeakerModel method)
(espnet2.st.espnet_model.ESPnetSTModel method)
(espnet2.svs.espnet_model.ESPnetSVSModel method)
(espnet2.train.abs_espnet_model.AbsESPnetModel method)
(espnet2.train.abs_gan_espnet_model.AbsGANESPnetModel method)
(espnet2.tts.espnet_model.ESPnetTTSModel method)
(espnet2.uasr.espnet_model.ESPnetUASRModel method)
collect_stats() (in module espnet2.main_funcs.collect_stats)
CoMBD (class in espnet2.gan_svs.avocodo.__init__)
(class in espnet2.gan_svs.avocodo.avocodo)
CoMBDBlock (class in espnet2.gan_svs.avocodo.__init__)
(class in espnet2.gan_svs.avocodo.avocodo)
combination() (in module espnet2.asr.state_spaces.s4)
Combine (class in espnet2.enh.layers.ncsnpp_utils.layerspp)
common_collate_fn() (in module espnet2.train.collate_fn)
CommonCollateFn (class in espnet2.train.collate_fn)
CommonPreprocessor (class in espnet2.train.preprocessor)
CommonPreprocessor_multi (class in espnet2.train.preprocessor)
CompareValueTrigger (class in espnet.asr.asr_utils)
complex() (espnet2.gan_svs.visinger2.visinger2_vocoder.TorchSTFT method)
complex_cat() (in module espnet2.enh.layers.complexnn)
complex_norm() (in module espnet2.enh.layers.complex_utils)
ComplexBatchNorm (class in espnet2.enh.layers.complexnn)
(class in espnet2.enh.layers.dcunet)
ComplexConv2d (class in espnet2.enh.layers.complexnn)
ComplexConvTranspose2d (class in espnet2.enh.layers.complexnn)
ComplexLinear (class in espnet2.enh.layers.dcunet)
compute_alphas() (espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt.CPURNNT method)
compute_alphas_kernel (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt_kernel)
compute_attention_score() (espnet2.asr_transducer.encoder.modules.attention.RelPositionMultiHeadedAttention method)
compute_aux_transducer_and_symm_kl_div_losses() (espnet.nets.pytorch_backend.transducer.transducer_tasks.TransducerTasks method)
compute_betas_and_grads() (espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt.CPURNNT method)
compute_betas_kernel (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt_kernel)
compute_correct() (espnet2.hubert.espnet_model.HubertPretrainModel method)
compute_cost_and_score() (espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt.GPURNNT method)
(espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt.MultiblankGPURNNT method)
compute_costs_data (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
compute_ctc_loss() (espnet.nets.pytorch_backend.transducer.transducer_tasks.TransducerTasks method)
compute_ema_coefficients() (espnet2.asr_transducer.decoder.modules.mega.multi_head_damped_ema.MultiHeadDampedEMA method)
compute_ema_kernel() (espnet2.asr_transducer.decoder.modules.mega.multi_head_damped_ema.MultiHeadDampedEMA method)
compute_features() (espnet2.asr_transducer.frontend.online_audio_processor.OnlineAudioProcessor method)
compute_grad_kernel (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt_kernel)
compute_lm_loss() (espnet.nets.pytorch_backend.transducer.transducer_tasks.TransducerTasks method)
compute_mean() (espnet.asr.pytorch_backend.asr.DistributedDictSummary method)
compute_multiblank_alphas_kernel (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt_kernel)
compute_multiblank_betas_kernel (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt_kernel)
compute_multiblank_grad_kernel (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt_kernel)
compute_on_mask() (espnet2.enh.loss.criterions.tf_domain.FrequencyDomainAbsCoherence property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainCrossEntropy property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainDPCL property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainL1 property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainLoss property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainMSE property)
compute_perplexity() (in module espnet.lm.lm_utils)
(in module espnet.lm.pytorch_backend.lm)
compute_simplified_attention_score() (espnet2.asr_transducer.encoder.modules.attention.RelPositionMultiHeadedAttention method)
compute_transducer_loss() (espnet.nets.pytorch_backend.transducer.transducer_tasks.TransducerTasks method)
ComputeErrorRates() (in module espnet2.utils.eer)
ComputeMinDcf() (in module espnet2.utils.eer)
concat_examples() (in module espnet.lm.pytorch_backend.lm)
ConcatAdaptLayer (class in espnet2.enh.layers.adapt_layers)
CondCRPBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
ConditionalBatchNorm2d (class in espnet2.enh.layers.ncsnpp_utils.normalization)
ConditionalInstanceNorm2d (class in espnet2.enh.layers.ncsnpp_utils.normalization)
ConditionalInstanceNorm2dPlus (class in espnet2.enh.layers.ncsnpp_utils.normalization)
ConditionalNoneNorm2d (class in espnet2.enh.layers.ncsnpp_utils.normalization)
ConditionalResidualBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
ConditionalVarianceNorm2d (class in espnet2.enh.layers.ncsnpp_utils.normalization)
CondMSFBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
CondRCUBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
CondRefineBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
config (espnet2.bin.asr_align.CTCSegmentation attribute)
(espnet2.bin.asr_align.CTCSegmentationTask attribute)
configure_optimizer() (in module espnet2.optimizers.optim_groups)
Conformer (class in espnet2.asr_transducer.encoder.blocks.conformer)
ConformerConvolution (class in espnet2.asr_transducer.encoder.modules.convolution)
ConformerEncoder (class in espnet2.asr.encoder.conformer_encoder)
ConformerPostEncoder (class in espnet2.slu.postencoder.conformer_postencoder)
ConformerSeparator (class in espnet2.enh.separator.conformer_separator)
ContextualBlockConformerEncoder (class in espnet2.asr.encoder.contextual_block_conformer_encoder)
ContextualBlockEncoderLayer (class in espnet.nets.pytorch_backend.conformer.contextual_block_encoder_layer)
(class in espnet.nets.pytorch_backend.transformer.contextual_block_encoder_layer)
ContextualBlockTransformerEncoder (class in espnet2.asr.encoder.contextual_block_transformer_encoder)
contract_inner() (in module espnet2.enh.layers.ncsnpp_utils.layers)
contrast() (in module espnet2.layers.augmentation)
Conv1d (class in espnet.nets.pytorch_backend.transducer.conv1d_nets)
(class in espnet2.asr_transducer.encoder.blocks.conv1d)
(class in espnet2.gan_tts.wavenet.residual_block)
Conv1d1x1 (class in espnet2.gan_tts.wavenet.residual_block)
Conv1dLinear (class in espnet.nets.pytorch_backend.transformer.multi_layer_conv)
Conv1dSubsampling1 (class in espnet.nets.pytorch_backend.transformer.subsampling)
Conv1dSubsampling2 (class in espnet.nets.pytorch_backend.transformer.subsampling)
Conv1dSubsampling3 (class in espnet.nets.pytorch_backend.transformer.subsampling)
Conv2d (class in espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling)
(class in espnet2.gan_tts.parallel_wavegan.upsample)
conv2d_output_shape() (in module espnet2.enh.layers.conv_utils)
Conv2DActNorm (class in espnet2.enh.layers.tcndenseunet)
Conv2dSubsampling (class in espnet.nets.chainer_backend.transformer.subsampling)
(class in espnet.nets.pytorch_backend.transformer.subsampling)
Conv2dSubsampling1 (class in espnet.nets.pytorch_backend.transformer.subsampling)
Conv2dSubsampling2 (class in espnet.nets.pytorch_backend.transformer.subsampling)
Conv2dSubsampling6 (class in espnet.nets.pytorch_backend.transformer.subsampling)
Conv2dSubsampling8 (class in espnet.nets.pytorch_backend.transformer.subsampling)
Conv2dSubsamplingWOPosEnc (class in espnet.nets.pytorch_backend.transformer.subsampling_without_posenc)
conv3x3() (in module espnet2.asr.encoder.avhubert_encoder)
conv_bias (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
conv_downsample_2d() (in module espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling)
conv_feature_layers (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
conv_pos (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
conv_pos_groups (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
ConvDecoder (class in espnet2.enh.decoder.conv_decoder)
ConvDiscriminator (class in espnet2.uasr.discriminator.conv_discriminator)
ConvEncoder (class in espnet2.enh.encoder.conv_encoder)
convert() (espnet2.layers.sinc_conv.BarkScale static method)
(espnet2.layers.sinc_conv.MelScale static method)
convert_examples_to_features() (espnet2.slu.postdecoder.abs_postdecoder.AbsPostDecoder method)
(espnet2.slu.postdecoder.hugging_face_transformers_postdecoder.HuggingFaceTransformersPostDecoder method)
convert_to_char() (espnet.nets.e2e_asr_common.ErrorCalculator method)
(espnet.nets.pytorch_backend.transducer.error_calculator.ErrorCalculator method)
(espnet2.asr.transducer.error_calculator.ErrorCalculatorTransducer method)
(espnet2.asr_transducer.error_calculator.ErrorCalculator method)
ConvFlow (class in espnet2.gan_tts.vits.flow)
ConvGenerator (class in espnet2.uasr.generator.conv_generator)
ConvInput (class in espnet2.asr_transducer.encoder.blocks.conv_input)
ConvInUpsampleNetwork (class in espnet2.gan_tts.parallel_wavegan.upsample)
ConvMeanPool (class in espnet2.enh.layers.ncsnpp_utils.layers)
ConvolutionalGatingMLP (class in espnet2.asr.layers.cgmlp)
ConvolutionalSpatialGatingUnit (class in espnet2.asr.layers.cgmlp)
(class in espnet2.asr_transducer.encoder.modules.convolution)
ConvolutionModule (class in espnet.nets.pytorch_backend.conformer.convolution)
ConvReluNorm (class in espnet2.gan_svs.visinger2.visinger2_vocoder)
convtransp2d_output_shape() (in module espnet2.enh.layers.conv_utils)
copy() (espnet2.enh.diffusion.sdes.OUVESDE method)
(espnet2.enh.diffusion.sdes.OUVPSDE method)
(espnet2.enh.diffusion.sdes.SDE method)
copy_data_1d (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
Corrector (class in espnet2.enh.diffusion.sampling.__init__)
(class in espnet2.enh.diffusion.sampling.correctors)
corrupt_phase() (in module espnet2.layers.augmentation)
CosineAnnealingWarmupRestarts (class in espnet2.schedulers.cosine_anneal_warmup_restart)
cost_and_grad() (espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt.CPURNNT method)
(espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt.GPURNNT method)
(espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt.MultiblankGPURNNT method)
cost_and_grad_kernel() (espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt.CPURNNT method)
count_tokens() (in module espnet.lm.lm_utils)
CPURNNT (class in espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt)
CpuRNNT_index (class in espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt)
CpuRNNT_metadata (class in espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt)
create_adapter() (in module espnet2.layers.create_adapter)
create_batch_states() (espnet.nets.pytorch_backend.transducer.custom_decoder.CustomDecoder method)
(espnet.nets.pytorch_backend.transducer.rnn_decoder.RNNDecoder method)
(espnet.nets.transducer_decoder_interface.TransducerDecoderInterface method)
(espnet2.asr.decoder.transducer_decoder.TransducerDecoder method)
(espnet2.asr_transducer.decoder.abs_decoder.AbsDecoder method)
(espnet2.asr_transducer.decoder.mega_decoder.MEGADecoder method)
(espnet2.asr_transducer.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr_transducer.decoder.rwkv_decoder.RWKVDecoder method)
(espnet2.asr_transducer.decoder.stateless_decoder.StatelessDecoder method)
create_ctc_graph() (espnet.nets.pytorch_backend.gtn_ctc.GTNCTCLossFunction static method)
create_dataset() (espnet.utils.io_utils.SoundHDF5File method)
create_dense_flows() (in module espnet.utils.spec_augment)
create_fb_matrix() (in module espnet2.gan_svs.visinger2.visinger2_vocoder)
create_houlsby_adapter() (in module espnet2.layers.create_adapter_fn)
create_length_mask() (espnet2.diar.espnet_model.ESPnetDiarizationModel method)
create_lm_batch_inputs() (espnet2.asr_transducer.beam_search_transducer.BeamSearchTransducer method)
create_lm_batch_states() (in module espnet.nets.pytorch_backend.transducer.utils)
create_lora_adapter() (in module espnet2.layers.create_adapter_fn)
create_mask_label() (espnet2.enh.loss.criterions.tf_domain.FrequencyDomainLoss method)
create_masks() (espnet2.enh.separator.dccrn_separator.DCCRNSeparator method)
create_new_houlsby_module() (in module espnet2.layers.create_adapter_fn)
create_new_lora_module() (in module espnet2.layers.create_adapter_fn)
create_new_mask() (espnet.nets.pytorch_backend.transducer.conv1d_nets.Conv1d method)
(espnet.nets.pytorch_backend.transducer.vgg2l.VGG2L method)
(espnet2.asr_transducer.encoder.blocks.conv1d.Conv1d method)
create_new_pos_embed() (espnet.nets.pytorch_backend.transducer.conv1d_nets.Conv1d method)
create_new_pos_enc() (espnet2.asr_transducer.encoder.blocks.conv1d.Conv1d method)
create_transducer_compatible_state_dict() (in module espnet.asr.pytorch_backend.asr_init)
crop_scope() (espnet2.gan_svs.pits.ying_decoder.YingDecoder method)
(espnet2.tts.feats_extract.ying.Ying method)
cross_squared_distance_matrix() (in module espnet.utils.spec_augment)
CRPBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
CTAReduce (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce)
CTC (class in espnet.nets.chainer_backend.ctc)
(class in espnet.nets.chainer_backend.transformer.ctc)
(class in espnet.nets.pytorch_backend.ctc)
(class in espnet2.asr.ctc)
ctc_add_arguments() (espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E static method)
ctc_align() (in module espnet.bin.asr_align)
(in module espnet2.bin.asr_align)
ctc_for() (in module espnet.nets.chainer_backend.ctc)
(in module espnet.nets.pytorch_backend.ctc)
ctc_plot_class() (espnet.nets.asr_interface.ASRInterface property)
CTCPrefixScore (class in espnet.nets.ctc_prefix_score)
CTCPrefixScorer (class in espnet.nets.scorers.ctc)
CTCPrefixScoreTH (class in espnet.nets.ctc_prefix_score)
CTCSegmentation (class in espnet2.bin.asr_align)
CTCSegmentationTask (class in espnet2.bin.asr_align)
cumulativeMeanNormalizedDifferenceFunction() (in module espnet2.tts.feats_extract.yin)
cumulativeMeanNormalizedDifferenceFunctionTorch() (in module espnet2.tts.feats_extract.yin)
custom_converter() (espnet.nets.chainer_backend.asr_interface.ChainerASRInterface static method)
(espnet.nets.chainer_backend.e2e_asr.E2E static method)
(espnet.nets.chainer_backend.e2e_asr_transformer.E2E static method)
custom_parallel_updater() (espnet.nets.chainer_backend.asr_interface.ChainerASRInterface static method)
(espnet.nets.chainer_backend.e2e_asr.E2E static method)
(espnet.nets.chainer_backend.e2e_asr_transformer.E2E static method)
custom_torch_load() (in module espnet.nets.pytorch_backend.transducer.utils)
custom_updater() (espnet.nets.chainer_backend.asr_interface.ChainerASRInterface static method)
(espnet.nets.chainer_backend.e2e_asr.E2E static method)
(espnet.nets.chainer_backend.e2e_asr_transformer.E2E static method)
CustomConverter (class in espnet.asr.pytorch_backend.asr)
(class in espnet.asr.pytorch_backend.asr_mix)
(class in espnet.mt.pytorch_backend.mt)
(class in espnet.nets.chainer_backend.rnn.training)
(class in espnet.nets.chainer_backend.transformer.training)
(class in espnet.st.pytorch_backend.st)
(class in espnet.tts.pytorch_backend.tts)
(class in espnet.vc.pytorch_backend.vc)
CustomConverterMulEnc (class in espnet.asr.pytorch_backend.asr)
CustomDecoder (class in espnet.nets.pytorch_backend.transducer.custom_decoder)
CustomEncoder (class in espnet.nets.pytorch_backend.transducer.custom_encoder)
CustomEvaluator (class in espnet.asr.pytorch_backend.asr)
(class in espnet.tts.pytorch_backend.tts)
(class in espnet.vc.pytorch_backend.vc)
CustomParallelUpdater (class in espnet.nets.chainer_backend.rnn.training)
(class in espnet.nets.chainer_backend.transformer.training)
CustomUpdater (class in espnet.asr.pytorch_backend.asr)
(class in espnet.nets.chainer_backend.rnn.training)
(class in espnet.nets.chainer_backend.transformer.training)
(class in espnet.tts.pytorch_backend.tts)
(class in espnet.vc.pytorch_backend.vc)
cwSKAttention (class in espnet2.spk.encoder.ska_tdnn_encoder)
CyclicCosineScheduler (class in espnet.scheduler.scheduler)
D
d_model() (espnet2.asr.state_spaces.base.SequenceModule property)
d_output() (espnet2.asr.state_spaces.base.SequenceModule property)
(espnet2.asr.state_spaces.block.SequenceResidualBlock property)
(espnet2.asr.state_spaces.pool.DownAvgPool property)
(espnet2.asr.state_spaces.pool.DownLinearPool property)
(espnet2.asr.state_spaces.pool.DownSample property)
(espnet2.asr.state_spaces.pool.DownSpectralPool property)
(espnet2.asr.state_spaces.pool.UpPool property)
(espnet2.asr.state_spaces.pool.UpSample property)
(espnet2.asr.state_spaces.residual.Residual property)
(espnet2.asr.state_spaces.s4.S4 property)
d_state() (espnet2.asr.state_spaces.base.SequenceModule property)
(espnet2.asr.state_spaces.block.SequenceResidualBlock property)
(espnet2.asr.state_spaces.model.SequenceModel property)
DANSeparator (class in espnet2.enh.separator.dan_separator)
DataAugmentation (class in espnet2.layers.augmentation)
DatadirWriter (class in espnet2.fileio.datadir_writer)
DC_CRN (class in espnet2.enh.layers.dc_crn)
DC_CRNSeparator (class in espnet2.enh.separator.dc_crn_separator)
DCCRNSeparator (class in espnet2.enh.separator.dccrn_separator)
DCUNet (class in espnet2.enh.layers.dcunet)
DCUNetComplexDecoderBlock (class in espnet2.enh.layers.dcunet)
DCUNetComplexEncoderBlock (class in espnet2.enh.layers.dcunet)
ddpm_conv1x1() (in module espnet2.enh.layers.ncsnpp_utils.layers)
ddpm_conv3x3() (in module espnet2.enh.layers.ncsnpp_utils.layers)
debug_update_fn() (espnet2.enh.diffusion.sampling.__init__.Predictor method)
(espnet2.enh.diffusion.sampling.predictors.Predictor method)
dec_out (espnet.nets.transducer_decoder_interface.ExtendedHypothesis attribute)
(espnet2.asr.transducer.beam_search_transducer.ExtendedHypothesis attribute)
(espnet2.asr.transducer.beam_search_transducer_streaming.ExtendedHypothesis attribute)
(espnet2.asr_transducer.beam_search_transducer.ExtendedHypothesis attribute)
dec_state (espnet2.asr_transducer.beam_search_transducer.Hypothesis attribute)
DecayResidual (class in espnet2.asr.state_spaces.residual)
decode() (espnet2.bin.diar_inference.DiarizeSpeech method)
(in module espnet.tts.pytorch_backend.tts)
(in module espnet.vc.pytorch_backend.vc)
decode_long() (espnet2.bin.s2t_inference.Speech2Text method)
decode_mu_law() (in module espnet.nets.pytorch_backend.wavenet)
decode_with_attention_offline() (espnet.nets.pytorch_backend.streaming.window.WindowStreamingE2E method)
Decoder (class in espnet.nets.chainer_backend.rnn.decoders)
(class in espnet.nets.chainer_backend.transformer.decoder)
(class in espnet.nets.pytorch_backend.rnn.decoders)
(class in espnet.nets.pytorch_backend.tacotron2.decoder)
(class in espnet.nets.pytorch_backend.transformer.decoder)
(class in espnet2.enh.separator.svoice_separator)
(class in espnet2.gan_svs.vits.pitch_predictor)
(class in espnet2.svs.singing_tacotron.decoder)
decoder_activation_dropout (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
decoder_add_arguments() (espnet.nets.pytorch_backend.e2e_asr.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E static method)
(espnet.nets.pytorch_backend.e2e_mt.E2E static method)
(espnet.nets.pytorch_backend.e2e_st.E2E static method)
decoder_add_custom_arguments() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
decoder_add_general_arguments() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
decoder_add_rnn_arguments() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
decoder_and_attention() (espnet.nets.pytorch_backend.e2e_asr_mix_transformer.E2E method)
decoder_attention_dropout (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
decoder_attention_heads (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
decoder_dropout (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
decoder_embed_dim (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
decoder_ffn_embed_dim (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
decoder_for() (in module espnet.nets.chainer_backend.rnn.decoders)
(in module espnet.nets.pytorch_backend.rnn.decoders)
decoder_init() (in module espnet.nets.pytorch_backend.tacotron2.decoder)
(in module espnet2.svs.singing_tacotron.decoder)
decoder_layerdrop (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
decoder_layers (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
decoder_learned_pos (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
decoder_normalize_before (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
DecoderLayer (class in espnet.nets.chainer_backend.transformer.decoder_layer)
(class in espnet.nets.pytorch_backend.transformer.decoder_layer)
deemphasis() (in module espnet2.layers.augmentation)
default_beam_search() (espnet.nets.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer_streaming.BeamSearchTransducerStreaming method)
(espnet2.asr_transducer.beam_search_transducer.BeamSearchTransducer method)
default_init() (in module espnet2.enh.layers.ncsnpp_utils.layers)
default_name (espnet.utils.training.tensorboard_logger.TensorboardLogger attribute)
default_parameters() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E method)
default_params() (espnet.transform.functional.FuncTrans class method)
default_state() (espnet2.asr.state_spaces.base.SequenceModule method)
(espnet2.asr.state_spaces.block.SequenceResidualBlock method)
(espnet2.asr.state_spaces.model.SequenceModel method)
(espnet2.asr.state_spaces.pool.DownPool method)
(espnet2.asr.state_spaces.pool.UpPool method)
(espnet2.asr.state_spaces.s4.S4 method)
(espnet2.asr.state_spaces.s4.SSKernel method)
(espnet2.asr.state_spaces.s4.SSKernelDiag method)
(espnet2.asr.state_spaces.s4.SSKernelNPLR method)
DefaultFrontend (class in espnet2.asr.frontend.default)
DefaultRNNLM (class in espnet.lm.chainer_backend.lm)
(class in espnet.nets.pytorch_backend.lm.default)
delta() (in module espnet.transform.add_deltas)
Dense (class in espnet2.enh.layers.ncsnpp_utils.layers)
dense_image_warp() (in module espnet.utils.spec_augment)
DenseBlock (class in espnet2.enh.layers.tcndenseunet)
DenselyConnectedBlock (class in espnet2.enh.layers.dc_crn)
DepthwiseConvolution (class in espnet2.asr_transducer.encoder.modules.convolution)
DepthwiseSeparableConv (class in espnet2.diar.layers.tcn_nomask)
(class in espnet2.enh.layers.tcn)
design_prototype_filter() (in module espnet2.gan_tts.melgan.pqmf)
detect_non_silence() (in module espnet2.train.preprocessor)
DiarizationTask (class in espnet2.tasks.diar)
DiarizeSpeech (class in espnet2.bin.diar_inference)
DiarPackedContents (class in espnet2.bin.pack)
differenceFunction() (in module espnet2.tts.feats_extract.yin)
differenceFunction_np() (in module espnet2.tts.feats_extract.yin)
differenceFunctionTorch() (in module espnet2.tts.feats_extract.yin)
diffusion() (espnet2.tts.prodiff.denoiser.SpectogramDenoiser method)
DiffusionStepEmbedding (class in espnet2.enh.layers.dcunet)
DilatedDepthSeparableConv (class in espnet2.gan_tts.vits.flow)
Dio (class in espnet2.tts.feats_extract.dio)
discretize() (espnet2.enh.diffusion.sdes.SDE method)
DiscriminatorAdversarialLoss (class in espnet2.gan_tts.hifigan.loss)
dist_backend (espnet2.train.distributed_utils.DistributedOption attribute)
dist_init_method (espnet2.train.distributed_utils.DistributedOption attribute)
dist_launcher (espnet2.train.distributed_utils.DistributedOption attribute)
dist_master_addr (espnet2.train.distributed_utils.DistributedOption attribute)
dist_master_port (espnet2.train.distributed_utils.DistributedOption attribute)
dist_rank (espnet2.train.distributed_utils.DistributedOption attribute)
dist_world_size (espnet2.train.distributed_utils.DistributedOption attribute)
distributed (espnet2.train.distributed_utils.DistributedOption attribute)
DistributedDictSummary (class in espnet.asr.pytorch_backend.asr)
DistributedOption (class in espnet2.train.distributed_utils)
div_up (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
DNN_Beamformer (class in espnet.nets.pytorch_backend.frontends.dnn_beamformer)
(class in espnet2.enh.layers.dnn_beamformer)
DNN_WPE (class in espnet.nets.pytorch_backend.frontends.dnn_wpe)
(class in espnet2.enh.layers.dnn_wpe)
DNSMOS_local (class in espnet2.enh.layers.dnsmos)
DNSMOS_web (class in espnet2.enh.layers.dnsmos)
done (espnet2.bin.asr_align.CTCSegmentationTask attribute)
DownAvgPool (class in espnet2.asr.state_spaces.pool)
DownLinearPool (class in espnet2.asr.state_spaces.pool)
download_avhubert() (in module espnet2.asr.encoder.avhubert_encoder)
download_hubert() (in module espnet2.asr.encoder.hubert_encoder)
download_w2v() (in module espnet2.asr.encoder.wav2vec2_encoder)
DownPool (class in espnet2.asr.state_spaces.pool)
DownPool2d (class in espnet2.asr.state_spaces.pool)
DownSample (class in espnet2.asr.state_spaces.pool)
Downsample (class in espnet2.enh.layers.ncsnpp_utils.layers)
(class in espnet2.enh.layers.ncsnpp_utils.layerspp)
downsample() (in module espnet2.asr.state_spaces.pool)
downsample_2d() (in module espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling)
downsample_basic_block() (in module espnet2.asr.encoder.avhubert_encoder)
downsample_basic_block_v2() (in module espnet2.asr.encoder.avhubert_encoder)
DownSpectralPool (class in espnet2.asr.state_spaces.pool)
DPCLE2ESeparator (class in espnet2.enh.separator.dpcl_e2e_separator)
DPCLSeparator (class in espnet2.enh.separator.dpcl_separator)
DPCLSolver (class in espnet2.enh.loss.wrappers.dpcl_solver)
dplr() (in module espnet2.asr.state_spaces.s4)
DPMulCat (class in espnet2.enh.layers.dpmulcat)
DPRNN (class in espnet2.enh.layers.dprnn)
DPRNN_TAC (class in espnet2.enh.layers.dprnn)
DPRNNSeparator (class in espnet2.enh.separator.dprnn_separator)
DPTNet (class in espnet2.enh.layers.dptnet)
DPTNetSeparator (class in espnet2.enh.separator.dptnet_separator)
draw_attention_plot() (espnet.asr.asr_mix_utils.PlotAttentionReport method)
(espnet.asr.asr_utils.PlotAttentionReport method)
draw_ctc_plot() (espnet.asr.asr_utils.PlotCTCReport method)
draw_han_plot() (espnet.asr.asr_utils.PlotAttentionReport method)
dropout (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
dropout_features (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
dropout_input (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
DropoutNd (class in espnet2.asr.state_spaces.components)
dtype() (in module espnet2.asr.transducer.rnnt_multi_blank.utils.global_constants)
Duration_Encoder (class in espnet2.svs.singing_tacotron.encoder)
DurationCalculator (class in espnet.nets.pytorch_backend.fastspeech.duration_calculator)
(class in espnet2.tts.utils.__init__)
(class in espnet2.tts.utils.duration_calculator)
DurationPredictor (class in espnet.nets.pytorch_backend.fastspeech.duration_predictor)
(class in espnet2.gan_svs.vits.duration_predictor)
(class in espnet2.s2st.synthesizer.translatotron2)
DurationPredictorLoss (class in espnet.nets.pytorch_backend.fastspeech.duration_predictor)
dynamic_import() (in module espnet.utils.dynamic_import)
dynamic_import_asr() (in module espnet.nets.asr_interface)
dynamic_import_lm() (in module espnet.nets.lm_interface)
dynamic_import_optimizer() (in module espnet.optimizer.factory)
dynamic_import_scheduler() (in module espnet.scheduler.scheduler)
dynamic_import_st() (in module espnet.nets.st_interface)
DynamicConvolution (class in espnet.nets.pytorch_backend.transformer.dynamic_conv)
DynamicConvolution2D (class in espnet.nets.pytorch_backend.transformer.dynamic_conv2d)
DynamicConvolution2DTransformerDecoder (class in espnet2.asr.decoder.transformer_decoder)
DynamicConvolutionTransformerDecoder (class in espnet2.asr.decoder.transformer_decoder)
DynamicMixingPreprocessor (class in espnet2.train.preprocessor)
E
E2E (class in espnet.nets.chainer_backend.e2e_asr)
(class in espnet.nets.chainer_backend.e2e_asr_transformer)
(class in espnet.nets.pytorch_backend.e2e_asr)
(class in espnet.nets.pytorch_backend.e2e_asr_conformer)
(class in espnet.nets.pytorch_backend.e2e_asr_maskctc)
(class in espnet.nets.pytorch_backend.e2e_asr_mix)
(class in espnet.nets.pytorch_backend.e2e_asr_mix_transformer)
(class in espnet.nets.pytorch_backend.e2e_asr_mulenc)
(class in espnet.nets.pytorch_backend.e2e_asr_transducer)
(class in espnet.nets.pytorch_backend.e2e_asr_transformer)
(class in espnet.nets.pytorch_backend.e2e_mt)
(class in espnet.nets.pytorch_backend.e2e_mt_transformer)
(class in espnet.nets.pytorch_backend.e2e_st)
(class in espnet.nets.pytorch_backend.e2e_st_conformer)
(class in espnet.nets.pytorch_backend.e2e_st_transformer)
EBranchformer (class in espnet2.asr_transducer.encoder.blocks.ebranchformer)
EBranchformerEncoder (class in espnet2.asr.encoder.e_branchformer_encoder)
EBranchformerEncoderLayer (class in espnet2.asr.encoder.e_branchformer_encoder)
EcapaBlock (class in espnet2.spk.layers.ecapa_block)
EcapaTdnnEncoder (class in espnet2.spk.encoder.ecapa_tdnn_encoder)
einsum() (in module espnet2.enh.layers.complex_utils)
ElementwiseAffineFlow (class in espnet2.gan_tts.vits.flow)
ema_one_step() (espnet2.asr_transducer.decoder.modules.mega.multi_head_damped_ema.MultiHeadDampedEMA method)
embed_id() (in module espnet.nets.chainer_backend.deterministic_embed_id)
Embedding (class in espnet2.mt.frontend.embedding)
EmbedID (class in espnet.nets.chainer_backend.deterministic_embed_id)
EmbedIDFunction (class in espnet.nets.chainer_backend.deterministic_embed_id)
EmbedIDGrad (class in espnet.nets.chainer_backend.deterministic_embed_id)
encode() (espnet.nets.asr_interface.ASRInterface method)
(espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_mt_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
(espnet2.asr.discrete_asr_espnet_model.ESPnetDiscreteASRModel method)
(espnet2.asr.espnet_model.ESPnetASRModel method)
(espnet2.asr_transducer.espnet_transducer_model.ESPnetASRTransducerModel method)
(espnet2.asvspoof.espnet_model.ESPnetASVSpoofModel method)
(espnet2.bin.diar_inference.DiarizeSpeech method)
(espnet2.diar.espnet_model.ESPnetDiarizationModel method)
(espnet2.enh.espnet_enh_s2t_model.ESPnetEnhS2TModel method)
(espnet2.hubert.espnet_model.HubertPretrainModel method)
(espnet2.hubert.espnet_model.TorchAudioHubertPretrainModel method)
(espnet2.mt.espnet_model.ESPnetMTModel method)
(espnet2.s2st.espnet_model.ESPnetS2STModel method)
(espnet2.s2t.espnet_model.ESPnetS2TModel method)
(espnet2.slu.espnet_model.ESPnetSLUModel method)
(espnet2.st.espnet_model.ESPnetSTModel method)
(espnet2.uasr.espnet_model.ESPnetUASRModel method)
encode_custom() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E method)
encode_diar() (espnet2.enh.espnet_enh_s2t_model.ESPnetEnhS2TModel method)
encode_frame() (espnet2.spk.espnet_model.ESPnetSpeakerModel method)
encode_mu_law() (in module espnet.nets.pytorch_backend.wavenet)
encode_rnn() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E method)
Encoder (class in espnet.nets.chainer_backend.rnn.encoders)
(class in espnet.nets.chainer_backend.transformer.encoder)
(class in espnet.nets.pytorch_backend.conformer.encoder)
(class in espnet.nets.pytorch_backend.rnn.encoders)
(class in espnet.nets.pytorch_backend.tacotron2.encoder)
(class in espnet.nets.pytorch_backend.transducer.rnn_encoder)
(class in espnet.nets.pytorch_backend.transformer.encoder)
(class in espnet2.asr_transducer.encoder.encoder)
(class in espnet2.enh.separator.svoice_separator)
(class in espnet2.svs.singing_tacotron.encoder)
encoder_add_arguments() (espnet.nets.pytorch_backend.e2e_asr.E2E static method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E static method)
(espnet.nets.pytorch_backend.e2e_mt.E2E static method)
(espnet.nets.pytorch_backend.e2e_st.E2E static method)
encoder_add_custom_arguments() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
encoder_add_general_arguments() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
encoder_add_rnn_arguments() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
encoder_attention_heads (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
encoder_embed_dim (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
encoder_ffn_embed_dim (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
encoder_for() (in module espnet.nets.chainer_backend.rnn.encoders)
(in module espnet.nets.pytorch_backend.e2e_asr_mix)
(in module espnet.nets.pytorch_backend.rnn.encoders)
(in module espnet.nets.pytorch_backend.transducer.rnn_encoder)
encoder_init() (in module espnet.nets.pytorch_backend.tacotron2.encoder)
(in module espnet2.svs.singing_tacotron.encoder)
encoder_layerdrop (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
encoder_layers (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
encoder_mix_add_arguments() (espnet.nets.pytorch_backend.e2e_asr_mix.E2E static method)
EncoderLayer (class in espnet.nets.chainer_backend.transformer.encoder_layer)
(class in espnet.nets.pytorch_backend.conformer.encoder_layer)
(class in espnet.nets.pytorch_backend.transformer.encoder_layer)
EncoderMix (class in espnet.nets.pytorch_backend.e2e_asr_mix)
(class in espnet.nets.pytorch_backend.transformer.encoder_mix)
end_detect() (in module espnet.nets.e2e_asr_common)
Energy (class in espnet2.tts.feats_extract.energy)
enhance() (espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix.E2E method)
(espnet2.enh.diffusion.abs_diffusion.AbsDiffusion method)
(espnet2.enh.diffusion.score_based_diffusion.ScoreModel method)
(espnet2.enh.diffusion_enh.ESPnetDiffusionModel method)
(in module espnet.asr.pytorch_backend.asr)
EnhancementTask (class in espnet2.tasks.enh)
EnhPackedContents (class in espnet2.bin.pack)
EnhPreprocessor (class in espnet2.train.preprocessor)
EnhS2TPackedContents (class in espnet2.bin.pack)
EnhS2TTask (class in espnet2.tasks.enh_s2t)
epoch_detail() (espnet.lm.lm_utils.ParallelSentenceIterator property)
(espnet.utils.dataset.ChainerDataLoader property)
eps (espnet2.enh.loss.criterions.time_domain.MultiResL1SpecLoss attribute)
(espnet2.enh.loss.criterions.time_domain.SISNRLoss attribute)
equalization_filtering() (in module espnet2.layers.augmentation)
ErrorCalculator (class in espnet.nets.e2e_asr_common)
(class in espnet.nets.e2e_mt_common)
(class in espnet.nets.pytorch_backend.transducer.error_calculator)
(class in espnet2.asr_transducer.error_calculator)
ErrorCalculatorTransducer (class in espnet2.asr.transducer.error_calculator)
espnet.asr.__init__ (module)
espnet.asr.asr_mix_utils (module)
espnet.asr.asr_utils (module)
espnet.asr.chainer_backend.__init__ (module)
espnet.asr.chainer_backend.asr (module)
espnet.asr.pytorch_backend.__init__ (module)
espnet.asr.pytorch_backend.asr (module)
espnet.asr.pytorch_backend.asr_init (module)
espnet.asr.pytorch_backend.asr_mix (module)
espnet.asr.pytorch_backend.recog (module)
espnet.bin.__init__ (module)
espnet.bin.asr_align (module)
espnet.bin.asr_enhance (module)
espnet.bin.asr_recog (module)
espnet.bin.asr_train (module)
espnet.bin.lm_train (module)
espnet.bin.mt_train (module)
espnet.bin.mt_trans (module)
espnet.bin.st_train (module)
espnet.bin.st_trans (module)
espnet.bin.tts_decode (module)
espnet.bin.tts_train (module)
espnet.bin.vc_decode (module)
espnet.bin.vc_train (module)
espnet.distributed.__init__ (module)
espnet.distributed.pytorch_backend.launch (module)
espnet.lm.__init__ (module)
espnet.lm.chainer_backend.__init__ (module)
espnet.lm.chainer_backend.extlm (module)
espnet.lm.chainer_backend.lm (module)
espnet.lm.lm_utils (module)
espnet.lm.pytorch_backend.__init__ (module)
espnet.lm.pytorch_backend.extlm (module)
espnet.lm.pytorch_backend.lm (module)
espnet.mt.__init__ (module)
espnet.mt.mt_utils (module)
espnet.mt.pytorch_backend.__init__ (module)
espnet.mt.pytorch_backend.mt (module)
espnet.nets.__init__ (module)
espnet.nets.asr_interface (module)
espnet.nets.batch_beam_search (module)
espnet.nets.batch_beam_search_online (module)
espnet.nets.batch_beam_search_online_sim (module)
espnet.nets.beam_search (module)
espnet.nets.beam_search_timesync (module)
espnet.nets.beam_search_timesync_streaming (module)
espnet.nets.beam_search_transducer (module)
espnet.nets.chainer_backend.__init__ (module)
espnet.nets.chainer_backend.asr_interface (module)
espnet.nets.chainer_backend.ctc (module)
espnet.nets.chainer_backend.deterministic_embed_id (module)
espnet.nets.chainer_backend.e2e_asr (module)
espnet.nets.chainer_backend.e2e_asr_transformer (module)
espnet.nets.chainer_backend.nets_utils (module)
espnet.nets.chainer_backend.rnn.__init__ (module)
espnet.nets.chainer_backend.rnn.attentions (module)
espnet.nets.chainer_backend.rnn.decoders (module)
espnet.nets.chainer_backend.rnn.encoders (module)
espnet.nets.chainer_backend.rnn.training (module)
espnet.nets.chainer_backend.transformer.__init__ (module)
espnet.nets.chainer_backend.transformer.attention (module)
espnet.nets.chainer_backend.transformer.ctc (module)
espnet.nets.chainer_backend.transformer.decoder (module)
espnet.nets.chainer_backend.transformer.decoder_layer (module)
espnet.nets.chainer_backend.transformer.embedding (module)
espnet.nets.chainer_backend.transformer.encoder (module)
espnet.nets.chainer_backend.transformer.encoder_layer (module)
espnet.nets.chainer_backend.transformer.label_smoothing_loss (module)
espnet.nets.chainer_backend.transformer.layer_norm (module)
espnet.nets.chainer_backend.transformer.mask (module)
espnet.nets.chainer_backend.transformer.positionwise_feed_forward (module)
espnet.nets.chainer_backend.transformer.subsampling (module)
espnet.nets.chainer_backend.transformer.training (module)
espnet.nets.ctc_prefix_score (module)
espnet.nets.e2e_asr_common (module)
espnet.nets.e2e_mt_common (module)
espnet.nets.lm_interface (module)
espnet.nets.mt_interface (module)
espnet.nets.pytorch_backend.__init__ (module)
espnet.nets.pytorch_backend.conformer.__init__ (module)
espnet.nets.pytorch_backend.conformer.argument (module)
espnet.nets.pytorch_backend.conformer.contextual_block_encoder_layer (module)
espnet.nets.pytorch_backend.conformer.convolution (module)
espnet.nets.pytorch_backend.conformer.encoder (module)
espnet.nets.pytorch_backend.conformer.encoder_layer (module)
espnet.nets.pytorch_backend.conformer.swish (module)
espnet.nets.pytorch_backend.ctc (module)
espnet.nets.pytorch_backend.e2e_asr (module)
espnet.nets.pytorch_backend.e2e_asr_conformer (module)
espnet.nets.pytorch_backend.e2e_asr_maskctc (module)
espnet.nets.pytorch_backend.e2e_asr_mix (module)
espnet.nets.pytorch_backend.e2e_asr_mix_transformer (module)
espnet.nets.pytorch_backend.e2e_asr_mulenc (module)
espnet.nets.pytorch_backend.e2e_asr_transducer (module)
espnet.nets.pytorch_backend.e2e_asr_transformer (module)
espnet.nets.pytorch_backend.e2e_mt (module)
espnet.nets.pytorch_backend.e2e_mt_transformer (module)
espnet.nets.pytorch_backend.e2e_st (module)
espnet.nets.pytorch_backend.e2e_st_conformer (module)
espnet.nets.pytorch_backend.e2e_st_transformer (module)
espnet.nets.pytorch_backend.e2e_tts_fastspeech (module)
espnet.nets.pytorch_backend.e2e_tts_tacotron2 (module)
espnet.nets.pytorch_backend.e2e_tts_transformer (module)
espnet.nets.pytorch_backend.e2e_vc_tacotron2 (module)
espnet.nets.pytorch_backend.e2e_vc_transformer (module)
espnet.nets.pytorch_backend.fastspeech.__init__ (module)
espnet.nets.pytorch_backend.fastspeech.duration_calculator (module)
espnet.nets.pytorch_backend.fastspeech.duration_predictor (module)
espnet.nets.pytorch_backend.fastspeech.length_regulator (module)
espnet.nets.pytorch_backend.frontends.__init__ (module)
espnet.nets.pytorch_backend.frontends.beamformer (module)
espnet.nets.pytorch_backend.frontends.dnn_beamformer (module)
espnet.nets.pytorch_backend.frontends.dnn_wpe (module)
espnet.nets.pytorch_backend.frontends.feature_transform (module)
espnet.nets.pytorch_backend.frontends.frontend (module)
espnet.nets.pytorch_backend.frontends.mask_estimator (module)
espnet.nets.pytorch_backend.gtn_ctc (module)
espnet.nets.pytorch_backend.initialization (module)
espnet.nets.pytorch_backend.lm.__init__ (module)
espnet.nets.pytorch_backend.lm.default (module)
espnet.nets.pytorch_backend.lm.seq_rnn (module)
espnet.nets.pytorch_backend.lm.transformer (module)
espnet.nets.pytorch_backend.maskctc.__init__ (module)
espnet.nets.pytorch_backend.maskctc.add_mask_token (module)
espnet.nets.pytorch_backend.maskctc.mask (module)
espnet.nets.pytorch_backend.nets_utils (module)
espnet.nets.pytorch_backend.rnn.__init__ (module)
espnet.nets.pytorch_backend.rnn.argument (module)
espnet.nets.pytorch_backend.rnn.attentions (module)
espnet.nets.pytorch_backend.rnn.decoders (module)
espnet.nets.pytorch_backend.rnn.encoders (module)
espnet.nets.pytorch_backend.streaming.__init__ (module)
espnet.nets.pytorch_backend.streaming.segment (module)
espnet.nets.pytorch_backend.streaming.window (module)
espnet.nets.pytorch_backend.tacotron2.__init__ (module)
espnet.nets.pytorch_backend.tacotron2.cbhg (module)
espnet.nets.pytorch_backend.tacotron2.decoder (module)
espnet.nets.pytorch_backend.tacotron2.encoder (module)
espnet.nets.pytorch_backend.transducer.__init__ (module)
espnet.nets.pytorch_backend.transducer.arguments (module)
espnet.nets.pytorch_backend.transducer.blocks (module)
espnet.nets.pytorch_backend.transducer.conv1d_nets (module)
espnet.nets.pytorch_backend.transducer.custom_decoder (module)
espnet.nets.pytorch_backend.transducer.custom_encoder (module)
espnet.nets.pytorch_backend.transducer.error_calculator (module)
espnet.nets.pytorch_backend.transducer.initializer (module)
espnet.nets.pytorch_backend.transducer.joint_network (module)
espnet.nets.pytorch_backend.transducer.rnn_decoder (module)
espnet.nets.pytorch_backend.transducer.rnn_encoder (module)
espnet.nets.pytorch_backend.transducer.transducer_tasks (module)
espnet.nets.pytorch_backend.transducer.transformer_decoder_layer (module)
espnet.nets.pytorch_backend.transducer.utils (module)
espnet.nets.pytorch_backend.transducer.vgg2l (module)
espnet.nets.pytorch_backend.transformer.__init__ (module)
espnet.nets.pytorch_backend.transformer.add_sos_eos (module)
espnet.nets.pytorch_backend.transformer.argument (module)
espnet.nets.pytorch_backend.transformer.attention (module)
espnet.nets.pytorch_backend.transformer.contextual_block_encoder_layer (module)
espnet.nets.pytorch_backend.transformer.decoder (module)
espnet.nets.pytorch_backend.transformer.decoder_layer (module)
espnet.nets.pytorch_backend.transformer.dynamic_conv (module)
espnet.nets.pytorch_backend.transformer.dynamic_conv2d (module)
espnet.nets.pytorch_backend.transformer.embedding (module)
espnet.nets.pytorch_backend.transformer.encoder (module)
espnet.nets.pytorch_backend.transformer.encoder_layer (module)
espnet.nets.pytorch_backend.transformer.encoder_mix (module)
espnet.nets.pytorch_backend.transformer.initializer (module)
espnet.nets.pytorch_backend.transformer.label_smoothing_loss (module)
espnet.nets.pytorch_backend.transformer.layer_norm (module)
espnet.nets.pytorch_backend.transformer.lightconv (module)
espnet.nets.pytorch_backend.transformer.lightconv2d (module)
espnet.nets.pytorch_backend.transformer.longformer_attention (module)
espnet.nets.pytorch_backend.transformer.mask (module)
espnet.nets.pytorch_backend.transformer.multi_layer_conv (module)
espnet.nets.pytorch_backend.transformer.optimizer (module)
espnet.nets.pytorch_backend.transformer.plot (module)
espnet.nets.pytorch_backend.transformer.positionwise_feed_forward (module)
espnet.nets.pytorch_backend.transformer.repeat (module)
espnet.nets.pytorch_backend.transformer.subsampling (module)
espnet.nets.pytorch_backend.transformer.subsampling_without_posenc (module)
espnet.nets.pytorch_backend.wavenet (module)
espnet.nets.scorer_interface (module)
espnet.nets.scorers.__init__ (module)
espnet.nets.scorers.ctc (module)
espnet.nets.scorers.length_bonus (module)
espnet.nets.scorers.ngram (module)
espnet.nets.scorers.uasr (module)
espnet.nets.st_interface (module)
espnet.nets.transducer_decoder_interface (module)
espnet.nets.tts_interface (module)
espnet.optimizer.__init__ (module)
espnet.optimizer.chainer (module)
espnet.optimizer.factory (module)
espnet.optimizer.parser (module)
espnet.optimizer.pytorch (module)
espnet.scheduler.__init__ (module)
espnet.scheduler.chainer (module)
espnet.scheduler.pytorch (module)
espnet.scheduler.scheduler (module)
espnet.st.__init__ (module)
espnet.st.pytorch_backend.__init__ (module)
espnet.st.pytorch_backend.st (module)
espnet.transform.__init__ (module)
espnet.transform.add_deltas (module)
espnet.transform.channel_selector (module)
espnet.transform.cmvn (module)
espnet.transform.functional (module)
espnet.transform.perturb (module)
espnet.transform.spec_augment (module)
espnet.transform.spectrogram (module)
espnet.transform.transform_interface (module)
espnet.transform.transformation (module)
espnet.transform.wpe (module)
espnet.tts.__init__ (module)
espnet.tts.pytorch_backend.__init__ (module)
espnet.tts.pytorch_backend.tts (module)
espnet.utils.__init__ (module)
espnet.utils.check_kwargs (module)
espnet.utils.cli_readers (module)
espnet.utils.cli_utils (module)
espnet.utils.cli_writers (module)
espnet.utils.dataset (module)
espnet.utils.deterministic_utils (module)
espnet.utils.dynamic_import (module)
espnet.utils.fill_missing_args (module)
espnet.utils.io_utils (module)
espnet.utils.spec_augment (module)
espnet.utils.training.__init__ (module)
espnet.utils.training.batchfy (module)
espnet.utils.training.evaluator (module)
espnet.utils.training.iterators (module)
espnet.utils.training.tensorboard_logger (module)
espnet.utils.training.train_utils (module)
espnet.vc.pytorch_backend.vc (module)
espnet2.asr.__init__ (module)
espnet2.asr.ctc (module)
espnet2.asr.decoder.__init__ (module)
espnet2.asr.decoder.abs_decoder (module)
espnet2.asr.decoder.hugging_face_transformers_decoder (module)
espnet2.asr.decoder.mlm_decoder (module)
espnet2.asr.decoder.rnn_decoder (module)
espnet2.asr.decoder.s4_decoder (module)
espnet2.asr.decoder.transducer_decoder (module)
espnet2.asr.decoder.transformer_decoder (module)
espnet2.asr.decoder.whisper_decoder (module)
espnet2.asr.discrete_asr_espnet_model (module)
espnet2.asr.encoder.__init__ (module)
espnet2.asr.encoder.abs_encoder (module)
espnet2.asr.encoder.avhubert_encoder (module)
espnet2.asr.encoder.branchformer_encoder (module)
espnet2.asr.encoder.conformer_encoder (module)
espnet2.asr.encoder.contextual_block_conformer_encoder (module)
espnet2.asr.encoder.contextual_block_transformer_encoder (module)
espnet2.asr.encoder.e_branchformer_encoder (module)
espnet2.asr.encoder.hubert_encoder (module)
espnet2.asr.encoder.hugging_face_transformers_encoder (module)
espnet2.asr.encoder.linear_encoder (module)
espnet2.asr.encoder.longformer_encoder (module)
espnet2.asr.encoder.rnn_encoder (module)
espnet2.asr.encoder.transformer_encoder (module)
espnet2.asr.encoder.transformer_encoder_multispkr (module)
espnet2.asr.encoder.vgg_rnn_encoder (module)
espnet2.asr.encoder.wav2vec2_encoder (module)
espnet2.asr.encoder.whisper_encoder (module)
espnet2.asr.espnet_model (module)
espnet2.asr.frontend.__init__ (module)
espnet2.asr.frontend.abs_frontend (module)
espnet2.asr.frontend.asteroid_frontend (module)
espnet2.asr.frontend.default (module)
espnet2.asr.frontend.fused (module)
espnet2.asr.frontend.melspec_torch (module)
espnet2.asr.frontend.s3prl (module)
espnet2.asr.frontend.whisper (module)
espnet2.asr.frontend.windowing (module)
espnet2.asr.layers.__init__ (module)
espnet2.asr.layers.cgmlp (module)
espnet2.asr.layers.fastformer (module)
espnet2.asr.maskctc_model (module)
espnet2.asr.pit_espnet_model (module)
espnet2.asr.postencoder.__init__ (module)
espnet2.asr.postencoder.abs_postencoder (module)
espnet2.asr.postencoder.hugging_face_transformers_postencoder (module)
espnet2.asr.postencoder.length_adaptor_postencoder (module)
espnet2.asr.preencoder.__init__ (module)
espnet2.asr.preencoder.abs_preencoder (module)
espnet2.asr.preencoder.linear (module)
espnet2.asr.preencoder.sinc (module)
espnet2.asr.specaug.__init__ (module)
espnet2.asr.specaug.abs_specaug (module)
espnet2.asr.specaug.specaug (module)
espnet2.asr.state_spaces.__init__ (module)
espnet2.asr.state_spaces.attention (module)
espnet2.asr.state_spaces.base (module)
espnet2.asr.state_spaces.block (module)
espnet2.asr.state_spaces.components (module)
espnet2.asr.state_spaces.ff (module)
espnet2.asr.state_spaces.model (module)
espnet2.asr.state_spaces.pool (module)
espnet2.asr.state_spaces.registry (module)
espnet2.asr.state_spaces.residual (module)
espnet2.asr.state_spaces.s4 (module)
espnet2.asr.state_spaces.utils (module)
espnet2.asr.transducer.__init__ (module)
espnet2.asr.transducer.beam_search_transducer (module)
espnet2.asr.transducer.beam_search_transducer_streaming (module)
espnet2.asr.transducer.error_calculator (module)
espnet2.asr.transducer.rnnt_multi_blank.__init__ (module)
espnet2.asr.transducer.rnnt_multi_blank.rnnt (module)
espnet2.asr.transducer.rnnt_multi_blank.rnnt_multi_blank (module)
espnet2.asr.transducer.rnnt_multi_blank.utils.__init__ (module)
espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.__init__ (module)
espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt (module)
espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.__init__ (module)
espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt (module)
espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt_kernel (module)
espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce (module)
espnet2.asr.transducer.rnnt_multi_blank.utils.global_constants (module)
espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper (module)
espnet2.asr_transducer.__init__ (module)
espnet2.asr_transducer.activation (module)
espnet2.asr_transducer.beam_search_transducer (module)
espnet2.asr_transducer.decoder.__init__ (module)
espnet2.asr_transducer.decoder.abs_decoder (module)
espnet2.asr_transducer.decoder.blocks.__init__ (module)
espnet2.asr_transducer.decoder.blocks.mega (module)
espnet2.asr_transducer.decoder.blocks.rwkv (module)
espnet2.asr_transducer.decoder.mega_decoder (module)
espnet2.asr_transducer.decoder.modules.__init__ (module)
espnet2.asr_transducer.decoder.modules.mega.__init__ (module)
espnet2.asr_transducer.decoder.modules.mega.feed_forward (module)
espnet2.asr_transducer.decoder.modules.mega.multi_head_damped_ema (module)
espnet2.asr_transducer.decoder.modules.mega.positional_bias (module)
espnet2.asr_transducer.decoder.modules.rwkv.__init__ (module)
espnet2.asr_transducer.decoder.modules.rwkv.attention (module)
espnet2.asr_transducer.decoder.modules.rwkv.feed_forward (module)
espnet2.asr_transducer.decoder.rnn_decoder (module)
espnet2.asr_transducer.decoder.rwkv_decoder (module)
espnet2.asr_transducer.decoder.stateless_decoder (module)
espnet2.asr_transducer.encoder.__init__ (module)
espnet2.asr_transducer.encoder.blocks.__init__ (module)
espnet2.asr_transducer.encoder.blocks.branchformer (module)
espnet2.asr_transducer.encoder.blocks.conformer (module)
espnet2.asr_transducer.encoder.blocks.conv1d (module)
espnet2.asr_transducer.encoder.blocks.conv_input (module)
espnet2.asr_transducer.encoder.blocks.ebranchformer (module)
espnet2.asr_transducer.encoder.building (module)
espnet2.asr_transducer.encoder.encoder (module)
espnet2.asr_transducer.encoder.modules.__init__ (module)
espnet2.asr_transducer.encoder.modules.attention (module)
espnet2.asr_transducer.encoder.modules.convolution (module)
espnet2.asr_transducer.encoder.modules.multi_blocks (module)
espnet2.asr_transducer.encoder.modules.positional_encoding (module)
espnet2.asr_transducer.encoder.validation (module)
espnet2.asr_transducer.error_calculator (module)
espnet2.asr_transducer.espnet_transducer_model (module)
espnet2.asr_transducer.frontend.__init__ (module)
espnet2.asr_transducer.frontend.online_audio_processor (module)
espnet2.asr_transducer.joint_network (module)
espnet2.asr_transducer.normalization (module)
espnet2.asr_transducer.utils (module)
espnet2.asvspoof.__init__ (module)
espnet2.asvspoof.decoder.__init__ (module)
espnet2.asvspoof.decoder.abs_decoder (module)
espnet2.asvspoof.decoder.linear_decoder (module)
espnet2.asvspoof.espnet_model (module)
espnet2.asvspoof.loss.__init__ (module)
espnet2.asvspoof.loss.abs_loss (module)
espnet2.asvspoof.loss.am_softmax_loss (module)
espnet2.asvspoof.loss.binary_loss (module)
espnet2.asvspoof.loss.oc_softmax_loss (module)
espnet2.bin.__init__ (module)
espnet2.bin.aggregate_stats_dirs (module)
espnet2.bin.asr_align (module)
espnet2.bin.asr_inference (module)
espnet2.bin.asr_inference_maskctc (module)
espnet2.bin.asr_inference_streaming (module)
espnet2.bin.asr_train (module)
espnet2.bin.asr_transducer_inference (module)
espnet2.bin.asr_transducer_train (module)
espnet2.bin.asvspoof_inference (module)
espnet2.bin.asvspoof_train (module)
espnet2.bin.diar_inference (module)
espnet2.bin.diar_train (module)
espnet2.bin.enh_inference (module)
espnet2.bin.enh_inference_streaming (module)
espnet2.bin.enh_s2t_train (module)
espnet2.bin.enh_scoring (module)
espnet2.bin.enh_train (module)
espnet2.bin.enh_tse_inference (module)
espnet2.bin.enh_tse_train (module)
espnet2.bin.gan_svs_train (module)
espnet2.bin.gan_tts_train (module)
espnet2.bin.hubert_train (module)
espnet2.bin.hugging_face_export_vocabulary (module)
espnet2.bin.launch (module)
espnet2.bin.lm_calc_perplexity (module)
espnet2.bin.lm_inference (module)
espnet2.bin.lm_train (module)
espnet2.bin.mt_inference (module)
espnet2.bin.mt_train (module)
espnet2.bin.pack (module)
espnet2.bin.s2st_inference (module)
espnet2.bin.s2st_train (module)
espnet2.bin.s2t_inference (module)
espnet2.bin.s2t_inference_language (module)
espnet2.bin.s2t_train (module)
espnet2.bin.slu_inference (module)
espnet2.bin.slu_train (module)
espnet2.bin.spk_embed_extract (module)
espnet2.bin.spk_inference (module)
espnet2.bin.spk_train (module)
espnet2.bin.split_scps (module)
espnet2.bin.st_inference (module)
espnet2.bin.st_inference_streaming (module)
espnet2.bin.st_train (module)
espnet2.bin.svs_inference (module)
espnet2.bin.svs_train (module)
espnet2.bin.tokenize_text (module)
espnet2.bin.tts_inference (module)
espnet2.bin.tts_train (module)
espnet2.bin.uasr_extract_feature (module)
espnet2.bin.uasr_inference (module)
espnet2.bin.uasr_inference_k2 (module)
espnet2.bin.uasr_train (module)
espnet2.bin.whisper_export_vocabulary (module)
espnet2.diar.__init__ (module)
espnet2.diar.abs_diar (module)
espnet2.diar.attractor.__init__ (module)
espnet2.diar.attractor.abs_attractor (module)
espnet2.diar.attractor.rnn_attractor (module)
espnet2.diar.decoder.__init__ (module)
espnet2.diar.decoder.abs_decoder (module)
espnet2.diar.decoder.linear_decoder (module)
espnet2.diar.espnet_model (module)
espnet2.diar.label_processor (module)
espnet2.diar.layers.__init__ (module)
espnet2.diar.layers.abs_mask (module)
espnet2.diar.layers.multi_mask (module)
espnet2.diar.layers.tcn_nomask (module)
espnet2.diar.separator.__init__ (module)
espnet2.diar.separator.tcn_separator_nomask (module)
espnet2.enh.__init__ (module)
espnet2.enh.abs_enh (module)
espnet2.enh.decoder.__init__ (module)
espnet2.enh.decoder.abs_decoder (module)
espnet2.enh.decoder.conv_decoder (module)
espnet2.enh.decoder.null_decoder (module)
espnet2.enh.decoder.stft_decoder (module)
espnet2.enh.diffusion.__init__ (module)
espnet2.enh.diffusion.abs_diffusion (module)
espnet2.enh.diffusion.sampling.__init__ (module)
espnet2.enh.diffusion.sampling.correctors (module)
espnet2.enh.diffusion.sampling.predictors (module)
espnet2.enh.diffusion.score_based_diffusion (module)
espnet2.enh.diffusion.sdes (module)
espnet2.enh.diffusion_enh (module)
espnet2.enh.encoder.__init__ (module)
espnet2.enh.encoder.abs_encoder (module)
espnet2.enh.encoder.conv_encoder (module)
espnet2.enh.encoder.null_encoder (module)
espnet2.enh.encoder.stft_encoder (module)
espnet2.enh.espnet_enh_s2t_model (module)
espnet2.enh.espnet_model (module)
espnet2.enh.espnet_model_tse (module)
espnet2.enh.extractor.__init__ (module)
espnet2.enh.extractor.abs_extractor (module)
espnet2.enh.extractor.td_speakerbeam_extractor (module)
espnet2.enh.layers.__init__ (module)
espnet2.enh.layers.adapt_layers (module)
espnet2.enh.layers.beamformer (module)
espnet2.enh.layers.beamformer_th (module)
espnet2.enh.layers.complex_utils (module)
espnet2.enh.layers.complexnn (module)
espnet2.enh.layers.conv_utils (module)
espnet2.enh.layers.dc_crn (module)
espnet2.enh.layers.dcunet (module)
espnet2.enh.layers.dnn_beamformer (module)
espnet2.enh.layers.dnn_wpe (module)
espnet2.enh.layers.dnsmos (module)
espnet2.enh.layers.dpmulcat (module)
espnet2.enh.layers.dprnn (module)
espnet2.enh.layers.dptnet (module)
espnet2.enh.layers.fasnet (module)
espnet2.enh.layers.ifasnet (module)
espnet2.enh.layers.mask_estimator (module)
espnet2.enh.layers.ncsnpp (module)
espnet2.enh.layers.ncsnpp_utils.__init__ (module)
espnet2.enh.layers.ncsnpp_utils.layers (module)
espnet2.enh.layers.ncsnpp_utils.layerspp (module)
espnet2.enh.layers.ncsnpp_utils.normalization (module)
espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling (module)
espnet2.enh.layers.ncsnpp_utils.upfirdn2d (module)
espnet2.enh.layers.skim (module)
espnet2.enh.layers.tcn (module)
espnet2.enh.layers.tcndenseunet (module)
espnet2.enh.layers.uses (module)
espnet2.enh.layers.wpe (module)
espnet2.enh.loss.__init__ (module)
espnet2.enh.loss.criterions.__init__ (module)
espnet2.enh.loss.criterions.abs_loss (module)
espnet2.enh.loss.criterions.tf_domain (module)
espnet2.enh.loss.criterions.time_domain (module)
espnet2.enh.loss.wrappers.__init__ (module)
espnet2.enh.loss.wrappers.abs_wrapper (module)
espnet2.enh.loss.wrappers.dpcl_solver (module)
espnet2.enh.loss.wrappers.fixed_order (module)
espnet2.enh.loss.wrappers.mixit_solver (module)
espnet2.enh.loss.wrappers.multilayer_pit_solver (module)
espnet2.enh.loss.wrappers.pit_solver (module)
espnet2.enh.separator.__init__ (module)
espnet2.enh.separator.abs_separator (module)
espnet2.enh.separator.asteroid_models (module)
espnet2.enh.separator.conformer_separator (module)
espnet2.enh.separator.dan_separator (module)
espnet2.enh.separator.dc_crn_separator (module)
espnet2.enh.separator.dccrn_separator (module)
espnet2.enh.separator.dpcl_e2e_separator (module)
espnet2.enh.separator.dpcl_separator (module)
espnet2.enh.separator.dprnn_separator (module)
espnet2.enh.separator.dptnet_separator (module)
espnet2.enh.separator.fasnet_separator (module)
espnet2.enh.separator.ineube_separator (module)
espnet2.enh.separator.neural_beamformer (module)
espnet2.enh.separator.rnn_separator (module)
espnet2.enh.separator.skim_separator (module)
espnet2.enh.separator.svoice_separator (module)
espnet2.enh.separator.tcn_separator (module)
espnet2.enh.separator.tfgridnet_separator (module)
espnet2.enh.separator.tfgridnetv2_separator (module)
espnet2.enh.separator.transformer_separator (module)
espnet2.enh.separator.uses_separator (module)
espnet2.fileio.__init__ (module)
espnet2.fileio.datadir_writer (module)
espnet2.fileio.multi_sound_scp (module)
espnet2.fileio.npy_scp (module)
espnet2.fileio.rand_gen_dataset (module)
espnet2.fileio.read_text (module)
espnet2.fileio.rttm (module)
espnet2.fileio.score_scp (module)
espnet2.fileio.sound_scp (module)
espnet2.fileio.vad_scp (module)
espnet2.fst.__init__ (module)
espnet2.gan_svs.__init__ (module)
espnet2.gan_svs.abs_gan_svs (module)
espnet2.gan_svs.avocodo.__init__ (module)
espnet2.gan_svs.avocodo.avocodo (module)
espnet2.gan_svs.espnet_model (module)
espnet2.gan_svs.joint.__init__ (module)
espnet2.gan_svs.joint.joint_score2wav (module)
espnet2.gan_svs.pits.modules (module)
espnet2.gan_svs.pits.ying_decoder (module)
espnet2.gan_svs.uhifigan.__init__ (module)
espnet2.gan_svs.uhifigan.sine_generator (module)
espnet2.gan_svs.uhifigan.uhifigan (module)
espnet2.gan_svs.utils.__init__ (module)
espnet2.gan_svs.utils.expand_f0 (module)
espnet2.gan_svs.visinger2.__init__ (module)
espnet2.gan_svs.visinger2.ddsp (module)
espnet2.gan_svs.visinger2.visinger2_vocoder (module)
espnet2.gan_svs.vits.__init__ (module)
espnet2.gan_svs.vits.duration_predictor (module)
espnet2.gan_svs.vits.generator (module)
espnet2.gan_svs.vits.length_regulator (module)
espnet2.gan_svs.vits.modules (module)
espnet2.gan_svs.vits.phoneme_predictor (module)
espnet2.gan_svs.vits.pitch_predictor (module)
espnet2.gan_svs.vits.prior_decoder (module)
espnet2.gan_svs.vits.text_encoder (module)
espnet2.gan_svs.vits.vits (module)
espnet2.gan_tts.__init__ (module)
espnet2.gan_tts.abs_gan_tts (module)
espnet2.gan_tts.espnet_model (module)
espnet2.gan_tts.hifigan.__init__ (module)
espnet2.gan_tts.hifigan.hifigan (module)
espnet2.gan_tts.hifigan.loss (module)
espnet2.gan_tts.hifigan.residual_block (module)
espnet2.gan_tts.jets.__init__ (module)
espnet2.gan_tts.jets.alignments (module)
espnet2.gan_tts.jets.generator (module)
espnet2.gan_tts.jets.jets (module)
espnet2.gan_tts.jets.length_regulator (module)
espnet2.gan_tts.jets.loss (module)
espnet2.gan_tts.joint.__init__ (module)
espnet2.gan_tts.joint.joint_text2wav (module)
espnet2.gan_tts.melgan.__init__ (module)
espnet2.gan_tts.melgan.melgan (module)
espnet2.gan_tts.melgan.pqmf (module)
espnet2.gan_tts.melgan.residual_stack (module)
espnet2.gan_tts.parallel_wavegan.__init__ (module)
espnet2.gan_tts.parallel_wavegan.parallel_wavegan (module)
espnet2.gan_tts.parallel_wavegan.upsample (module)
espnet2.gan_tts.style_melgan.__init__ (module)
espnet2.gan_tts.style_melgan.style_melgan (module)
espnet2.gan_tts.style_melgan.tade_res_block (module)
espnet2.gan_tts.utils.__init__ (module)
espnet2.gan_tts.utils.get_random_segments (module)
espnet2.gan_tts.vits.__init__ (module)
espnet2.gan_tts.vits.duration_predictor (module)
espnet2.gan_tts.vits.flow (module)
espnet2.gan_tts.vits.generator (module)
espnet2.gan_tts.vits.loss (module)
espnet2.gan_tts.vits.monotonic_align.__init__ (module)
espnet2.gan_tts.vits.posterior_encoder (module)
espnet2.gan_tts.vits.residual_coupling (module)
espnet2.gan_tts.vits.text_encoder (module)
espnet2.gan_tts.vits.transform (module)
espnet2.gan_tts.vits.vits (module)
espnet2.gan_tts.wavenet.__init__ (module)
espnet2.gan_tts.wavenet.residual_block (module)
espnet2.gan_tts.wavenet.wavenet (module)
espnet2.hubert.__init__ (module)
espnet2.hubert.espnet_model (module)
espnet2.hubert.hubert_loss (module)
espnet2.iterators.__init__ (module)
espnet2.iterators.abs_iter_factory (module)
espnet2.iterators.category_iter_factory (module)
espnet2.iterators.chunk_iter_factory (module)
espnet2.iterators.multiple_iter_factory (module)
espnet2.iterators.sequence_iter_factory (module)
espnet2.layers.__init__ (module)
espnet2.layers.abs_normalize (module)
espnet2.layers.augmentation (module)
espnet2.layers.create_adapter (module)
espnet2.layers.create_adapter_fn (module)
espnet2.layers.create_adapter_utils (module)
espnet2.layers.global_mvn (module)
espnet2.layers.houlsby_adapter_layer (module)
espnet2.layers.inversible_interface (module)
espnet2.layers.label_aggregation (module)
espnet2.layers.log_mel (module)
espnet2.layers.mask_along_axis (module)
espnet2.layers.sinc_conv (module)
espnet2.layers.stft (module)
espnet2.layers.time_warp (module)
espnet2.layers.utterance_mvn (module)
espnet2.lm.__init__ (module)
espnet2.lm.abs_model (module)
espnet2.lm.espnet_model (module)
espnet2.lm.espnet_model_multitask (module)
espnet2.lm.huggingface_pretrained_opt_lm (module)
espnet2.lm.seq_rnn_lm (module)
espnet2.lm.transformer_lm (module)
espnet2.main_funcs.__init__ (module)
espnet2.main_funcs.average_nbest_models (module)
espnet2.main_funcs.calculate_all_attentions (module)
espnet2.main_funcs.collect_stats (module)
espnet2.main_funcs.pack_funcs (module)
espnet2.mt.__init__ (module)
espnet2.mt.espnet_model (module)
espnet2.mt.frontend.__init__ (module)
espnet2.mt.frontend.embedding (module)
espnet2.optimizers.__init__ (module)
espnet2.optimizers.optim_groups (module)
espnet2.optimizers.sgd (module)
espnet2.s2st.__init__ (module)
espnet2.s2st.aux_attention.__init__ (module)
espnet2.s2st.aux_attention.abs_aux_attention (module)
espnet2.s2st.aux_attention.multihead (module)
espnet2.s2st.espnet_model (module)
espnet2.s2st.losses.__init__ (module)
espnet2.s2st.losses.abs_loss (module)
espnet2.s2st.losses.attention_loss (module)
espnet2.s2st.losses.ctc_loss (module)
espnet2.s2st.losses.guided_attention_loss (module)
espnet2.s2st.losses.tacotron_loss (module)
espnet2.s2st.synthesizer.__init__ (module)
espnet2.s2st.synthesizer.abs_synthesizer (module)
espnet2.s2st.synthesizer.discrete_synthesizer (module)
espnet2.s2st.synthesizer.translatotron (module)
espnet2.s2st.synthesizer.translatotron2 (module)
espnet2.s2st.synthesizer.unity_synthesizer (module)
espnet2.s2st.tgt_feats_extract.__init__ (module)
espnet2.s2st.tgt_feats_extract.abs_tgt_feats_extract (module)
espnet2.s2st.tgt_feats_extract.linear_spectrogram (module)
espnet2.s2st.tgt_feats_extract.log_mel_fbank (module)
espnet2.s2st.tgt_feats_extract.log_spectrogram (module)
espnet2.s2t.__init__ (module)
espnet2.s2t.espnet_model (module)
espnet2.samplers.__init__ (module)
espnet2.samplers.abs_sampler (module)
espnet2.samplers.build_batch_sampler (module)
espnet2.samplers.category_balanced_sampler (module)
espnet2.samplers.folded_batch_sampler (module)
espnet2.samplers.length_batch_sampler (module)
espnet2.samplers.num_elements_batch_sampler (module)
espnet2.samplers.sorted_batch_sampler (module)
espnet2.samplers.unsorted_batch_sampler (module)
espnet2.schedulers.__init__ (module)
espnet2.schedulers.abs_scheduler (module)
espnet2.schedulers.cosine_anneal_warmup_restart (module)
espnet2.schedulers.noam_lr (module)
espnet2.schedulers.piecewise_linear_warmup_lr (module)
espnet2.schedulers.warmup_lr (module)
espnet2.schedulers.warmup_reducelronplateau (module)
espnet2.schedulers.warmup_step_lr (module)
espnet2.slu.__init__ (module)
espnet2.slu.espnet_model (module)
espnet2.slu.postdecoder.__init__ (module)
espnet2.slu.postdecoder.abs_postdecoder (module)
espnet2.slu.postdecoder.hugging_face_transformers_postdecoder (module)
espnet2.slu.postencoder.__init__ (module)
espnet2.slu.postencoder.conformer_postencoder (module)
espnet2.slu.postencoder.transformer_postencoder (module)
espnet2.spk.__init__ (module)
espnet2.spk.encoder.__init__ (module)
espnet2.spk.encoder.conformer_encoder (module)
espnet2.spk.encoder.ecapa_tdnn_encoder (module)
espnet2.spk.encoder.identity_encoder (module)
espnet2.spk.encoder.rawnet3_encoder (module)
espnet2.spk.encoder.ska_tdnn_encoder (module)
espnet2.spk.encoder.xvector_encoder (module)
espnet2.spk.espnet_model (module)
espnet2.spk.layers.__init__ (module)
espnet2.spk.layers.ecapa_block (module)
espnet2.spk.layers.rawnet_block (module)
espnet2.spk.loss.__init__ (module)
espnet2.spk.loss.aamsoftmax (module)
espnet2.spk.loss.aamsoftmax_subcenter_intertopk (module)
espnet2.spk.loss.abs_loss (module)
espnet2.spk.pooling.__init__ (module)
espnet2.spk.pooling.abs_pooling (module)
espnet2.spk.pooling.chn_attn_stat_pooling (module)
espnet2.spk.pooling.mean_pooling (module)
espnet2.spk.pooling.stat_pooling (module)
espnet2.spk.projector.__init__ (module)
espnet2.spk.projector.abs_projector (module)
espnet2.spk.projector.rawnet3_projector (module)
espnet2.spk.projector.ska_tdnn_projector (module)
espnet2.spk.projector.xvector_projector (module)
espnet2.st.__init__ (module)
espnet2.st.espnet_model (module)
espnet2.svs.__init__ (module)
espnet2.svs.abs_svs (module)
espnet2.svs.espnet_model (module)
espnet2.svs.feats_extract.__init__ (module)
espnet2.svs.feats_extract.score_feats_extract (module)
espnet2.svs.naive_rnn.__init__ (module)
espnet2.svs.naive_rnn.naive_rnn (module)
espnet2.svs.naive_rnn.naive_rnn_dp (module)
espnet2.svs.singing_tacotron.__init__ (module)
espnet2.svs.singing_tacotron.decoder (module)
espnet2.svs.singing_tacotron.encoder (module)
espnet2.svs.singing_tacotron.singing_tacotron (module)
espnet2.svs.xiaoice.__init__ (module)
espnet2.svs.xiaoice.loss (module)
espnet2.svs.xiaoice.XiaoiceSing (module)
espnet2.tasks.__init__ (module)
espnet2.tasks.abs_task (module)
espnet2.tasks.asr (module)
espnet2.tasks.asr_transducer (module)
espnet2.tasks.asvspoof (module)
espnet2.tasks.diar (module)
espnet2.tasks.enh (module)
espnet2.tasks.enh_s2t (module)
espnet2.tasks.enh_tse (module)
espnet2.tasks.gan_svs (module)
espnet2.tasks.gan_tts (module)
espnet2.tasks.hubert (module)
espnet2.tasks.lm (module)
espnet2.tasks.mt (module)
espnet2.tasks.s2st (module)
espnet2.tasks.s2t (module)
espnet2.tasks.slu (module)
espnet2.tasks.spk (module)
espnet2.tasks.st (module)
espnet2.tasks.svs (module)
espnet2.tasks.tts (module)
espnet2.tasks.uasr (module)
espnet2.text.__init__ (module)
espnet2.text.abs_tokenizer (module)
espnet2.text.build_tokenizer (module)
espnet2.text.char_tokenizer (module)
espnet2.text.cleaner (module)
espnet2.text.hugging_face_token_id_converter (module)
espnet2.text.hugging_face_tokenizer (module)
espnet2.text.korean_cleaner (module)
espnet2.text.phoneme_tokenizer (module)
espnet2.text.sentencepiece_tokenizer (module)
espnet2.text.token_id_converter (module)
espnet2.text.whisper_token_id_converter (module)
espnet2.text.whisper_tokenizer (module)
espnet2.text.word_tokenizer (module)
espnet2.torch_utils.__init__ (module)
espnet2.torch_utils.add_gradient_noise (module)
espnet2.torch_utils.device_funcs (module)
espnet2.torch_utils.forward_adaptor (module)
espnet2.torch_utils.get_layer_from_string (module)
espnet2.torch_utils.initialize (module)
espnet2.torch_utils.load_pretrained_model (module)
espnet2.torch_utils.model_summary (module)
espnet2.torch_utils.pytorch_version (module)
espnet2.torch_utils.recursive_op (module)
espnet2.torch_utils.set_all_random_seed (module)
espnet2.train.__init__ (module)
espnet2.train.abs_espnet_model (module)
espnet2.train.abs_gan_espnet_model (module)
espnet2.train.class_choices (module)
espnet2.train.collate_fn (module)
espnet2.train.dataset (module)
espnet2.train.distributed_utils (module)
espnet2.train.gan_trainer (module)
espnet2.train.iterable_dataset (module)
espnet2.train.preprocessor (module)
espnet2.train.reporter (module)
espnet2.train.spk_trainer (module)
espnet2.train.trainer (module)
espnet2.train.uasr_trainer (module)
espnet2.tts.__init__ (module)
espnet2.tts.abs_tts (module)
espnet2.tts.espnet_model (module)
espnet2.tts.fastspeech.__init__ (module)
espnet2.tts.fastspeech.fastspeech (module)
espnet2.tts.fastspeech2.__init__ (module)
espnet2.tts.fastspeech2.fastspeech2 (module)
espnet2.tts.fastspeech2.loss (module)
espnet2.tts.fastspeech2.variance_predictor (module)
espnet2.tts.feats_extract.__init__ (module)
espnet2.tts.feats_extract.abs_feats_extract (module)
espnet2.tts.feats_extract.dio (module)
espnet2.tts.feats_extract.energy (module)
espnet2.tts.feats_extract.linear_spectrogram (module)
espnet2.tts.feats_extract.log_mel_fbank (module)
espnet2.tts.feats_extract.log_spectrogram (module)
espnet2.tts.feats_extract.yin (module)
espnet2.tts.feats_extract.ying (module)
espnet2.tts.gst.__init__ (module)
espnet2.tts.gst.style_encoder (module)
espnet2.tts.prodiff.__init__ (module)
espnet2.tts.prodiff.denoiser (module)
espnet2.tts.prodiff.loss (module)
espnet2.tts.prodiff.prodiff (module)
espnet2.tts.tacotron2.__init__ (module)
espnet2.tts.tacotron2.tacotron2 (module)
espnet2.tts.transformer.__init__ (module)
espnet2.tts.transformer.transformer (module)
espnet2.tts.utils.__init__ (module)
espnet2.tts.utils.duration_calculator (module)
espnet2.tts.utils.parallel_wavegan_pretrained_vocoder (module)
espnet2.uasr.__init__ (module)
espnet2.uasr.discriminator.__init__ (module)
espnet2.uasr.discriminator.abs_discriminator (module)
espnet2.uasr.discriminator.conv_discriminator (module)
espnet2.uasr.espnet_model (module)
espnet2.uasr.generator.__init__ (module)
espnet2.uasr.generator.abs_generator (module)
espnet2.uasr.generator.conv_generator (module)
espnet2.uasr.loss.__init__ (module)
espnet2.uasr.loss.abs_loss (module)
espnet2.uasr.loss.discriminator_loss (module)
espnet2.uasr.loss.gradient_penalty (module)
espnet2.uasr.loss.phoneme_diversity_loss (module)
espnet2.uasr.loss.pseudo_label_loss (module)
espnet2.uasr.loss.smoothness_penalty (module)
espnet2.uasr.segmenter.__init__ (module)
espnet2.uasr.segmenter.abs_segmenter (module)
espnet2.uasr.segmenter.join_segmenter (module)
espnet2.uasr.segmenter.random_segmenter (module)
espnet2.utils.__init__ (module)
espnet2.utils.build_dataclass (module)
espnet2.utils.config_argparse (module)
espnet2.utils.eer (module)
espnet2.utils.get_default_kwargs (module)
espnet2.utils.griffin_lim (module)
espnet2.utils.kwargs2args (module)
espnet2.utils.nested_dict_action (module)
espnet2.utils.sized_dict (module)
espnet2.utils.types (module)
espnet2.utils.yaml_no_alias_safe_dump (module)
espnet_initialization_fn() (espnet2.asr.layers.cgmlp.ConvolutionalSpatialGatingUnit method)
(espnet2.asr.layers.fastformer.FastSelfAttention method)
(espnet2.asr.preencoder.sinc.LightweightSincConvs method)
ESPnetASRModel (class in espnet2.asr.espnet_model)
(class in espnet2.asr.pit_espnet_model)
ESPnetASRTransducerModel (class in espnet2.asr_transducer.espnet_transducer_model)
ESPnetASVSpoofModel (class in espnet2.asvspoof.espnet_model)
ESPnetDataset (class in espnet2.train.dataset)
ESPnetDiarizationModel (class in espnet2.diar.espnet_model)
ESPnetDiffusionModel (class in espnet2.enh.diffusion_enh)
ESPnetDiscreteASRModel (class in espnet2.asr.discrete_asr_espnet_model)
ESPnetEnhancementModel (class in espnet2.enh.espnet_model)
ESPnetEnhS2TModel (class in espnet2.enh.espnet_enh_s2t_model)
ESPnetExtractionModel (class in espnet2.enh.espnet_model_tse)
ESPnetGANSVSModel (class in espnet2.gan_svs.espnet_model)
ESPnetGANTTSModel (class in espnet2.gan_tts.espnet_model)
ESPnetLanguageModel (class in espnet2.lm.espnet_model)
ESPnetMTModel (class in espnet2.mt.espnet_model)
ESPnetMultitaskLanguageModel (class in espnet2.lm.espnet_model_multitask)
ESPnetS2STModel (class in espnet2.s2st.espnet_model)
ESPnetS2TModel (class in espnet2.s2t.espnet_model)
ESPnetSLUModel (class in espnet2.slu.espnet_model)
ESPnetSpeakerModel (class in espnet2.spk.espnet_model)
ESPnetSTModel (class in espnet2.st.espnet_model)
ESPnetSVSModel (class in espnet2.svs.espnet_model)
ESPnetTTSModel (class in espnet2.tts.espnet_model)
ESPnetUASRModel (class in espnet2.uasr.espnet_model)
estimate_samples_to_frames_ratio() (espnet2.bin.asr_align.CTCSegmentation method)
EulerMaruyamaPredictor (class in espnet2.enh.diffusion.sampling.predictors)
evaluate() (espnet.asr.pytorch_backend.asr.CustomEvaluator method)
(espnet.lm.chainer_backend.lm.LMEvaluator method)
(espnet.lm.pytorch_backend.lm.LMEvaluator method)
(espnet.tts.pytorch_backend.tts.CustomEvaluator method)
(espnet.vc.pytorch_backend.vc.CustomEvaluator method)
exclude_opts() (espnet2.tasks.abs_task.AbsTask class method)
exitcode() (espnet.distributed.pytorch_backend.launch.WorkerError property)
expand() (espnet2.gan_svs.vits.length_regulator.LengthRegulator method)
expand_f0() (in module espnet2.gan_svs.utils.expand_f0)
expand_to_frame() (in module espnet2.svs.feats_extract.score_feats_extract)
ExpandedTokenEmbedding (class in espnet2.asr.decoder.whisper_decoder)
expansion (espnet2.asr.encoder.avhubert_encoder.BasicBlock attribute)
EXPONENTIAL (espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce.I_Op attribute)
exponential (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
export_vocabulary() (in module espnet2.bin.hugging_face_export_vocabulary)
(in module espnet2.bin.whisper_export_vocabulary)
extend() (espnet.nets.batch_beam_search_online.BatchBeamSearchOnline method)
(espnet.nets.batch_beam_search_online_sim.BatchBeamSearchOnlineSim method)
extend_pe() (espnet.nets.pytorch_backend.transformer.embedding.LearnableFourierPosEnc method)
(espnet.nets.pytorch_backend.transformer.embedding.PositionalEncoding method)
(espnet.nets.pytorch_backend.transformer.embedding.RelPositionalEncoding method)
(espnet.nets.pytorch_backend.transformer.embedding.StreamPositionalEncoding method)
(espnet2.asr_transducer.encoder.modules.positional_encoding.RelPositionalEncoding method)
extend_prob() (espnet.nets.ctc_prefix_score.CTCPrefixScoreTH method)
(espnet.nets.scorers.ctc.CTCPrefixScorer method)
extend_state() (espnet.nets.ctc_prefix_score.CTCPrefixScoreTH method)
(espnet.nets.scorers.ctc.CTCPrefixScorer method)
ExtendedHypothesis (class in espnet.nets.transducer_decoder_interface)
(class in espnet2.asr.transducer.beam_search_transducer)
(class in espnet2.asr.transducer.beam_search_transducer_streaming)
(class in espnet2.asr_transducer.beam_search_transducer)
extra_repr() (espnet.nets.pytorch_backend.frontends.feature_transform.GlobalMVN method)
(espnet.nets.pytorch_backend.frontends.feature_transform.LogMel method)
(espnet.nets.pytorch_backend.frontends.feature_transform.UtteranceMVN method)
(espnet2.enh.layers.complexnn.ComplexBatchNorm method)
(espnet2.enh.layers.dcunet.ComplexBatchNorm method)
(espnet2.enh.layers.skim.MemLSTM method)
(espnet2.layers.global_mvn.GlobalMVN method)
(espnet2.layers.label_aggregation.LabelAggregate method)
(espnet2.layers.log_mel.LogMel method)
(espnet2.layers.mask_along_axis.MaskAlongAxis method)
(espnet2.layers.mask_along_axis.MaskAlongAxisVariableMaxWidth method)
(espnet2.layers.stft.Stft method)
(espnet2.layers.time_warp.TimeWarp method)
(espnet2.layers.utterance_mvn.UtteranceMVN method)
(espnet2.svs.feats_extract.score_feats_extract.FrameScoreFeats method)
(espnet2.svs.feats_extract.score_feats_extract.SyllableScoreFeats method)
extract() (espnet2.main_funcs.pack_funcs.Archiver method)
extract_attrs_from_obj() (in module espnet2.asr.state_spaces.utils)
extract_embed() (espnet2.train.spk_trainer.SpkTrainer class method)
(in module espnet2.bin.spk_embed_extract)
extract_feats() (espnet2.spk.espnet_model.ESPnetSpeakerModel method)
extract_feature() (in module espnet2.bin.uasr_extract_feature)
extract_features() (espnet2.asr.encoder.avhubert_encoder.TransformerEncoder method)
extract_finetune() (espnet2.asr.encoder.avhubert_encoder.AVHubertModel method)
extract_loudness() (in module espnet2.gan_svs.visinger2.ddsp)
extract_pitch() (in module espnet2.gan_svs.visinger2.ddsp)
extractfile() (espnet2.main_funcs.pack_funcs.Archiver method)
F
FairseqAVHubertEncoder (class in espnet2.asr.encoder.avhubert_encoder)
FairseqHubertEncoder (class in espnet2.asr.encoder.hubert_encoder)
FairseqHubertPretrainEncoder (class in espnet2.asr.encoder.hubert_encoder)
FairSeqWav2Vec2Encoder (class in espnet2.asr.encoder.wav2vec2_encoder)
FaSNet_base (class in espnet2.enh.layers.fasnet)
FaSNet_TAC (class in espnet2.enh.layers.fasnet)
FaSNetSeparator (class in espnet2.enh.separator.fasnet_separator)
FastSelfAttention (class in espnet2.asr.layers.fastformer)
FastSpeech (class in espnet2.tts.fastspeech.fastspeech)
FastSpeech2 (class in espnet2.tts.fastspeech2.fastspeech2)
FastSpeech2Loss (class in espnet2.tts.fastspeech2.loss)
feature_grad_mult (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
feature_transform_for() (in module espnet.nets.pytorch_backend.frontends.feature_transform)
FeatureMapDense (class in espnet2.enh.layers.dcunet)
FeatureMatchLoss (class in espnet2.gan_tts.hifigan.loss)
FeatureTransform (class in espnet.nets.pytorch_backend.frontends.feature_transform)
Feedforward (class in espnet2.asr.state_spaces.residual)
FeedForward (class in espnet2.asr_transducer.decoder.modules.rwkv.feed_forward)
FeedForwardTransformer (class in espnet.nets.pytorch_backend.e2e_tts_fastspeech)
FeedForwardTransformerLoss (class in espnet.nets.pytorch_backend.e2e_tts_fastspeech)
FF (class in espnet2.asr.state_spaces.ff)
fft_convolve() (in module espnet2.gan_svs.visinger2.ddsp)
field2slice() (in module espnet2.bin.tokenize_text)
file_reader_helper() (in module espnet.utils.cli_readers)
file_writer_helper() (in module espnet.utils.cli_writers)
files (espnet2.bin.pack.ASRPackedContents attribute)
(espnet2.bin.pack.DiarPackedContents attribute)
(espnet2.bin.pack.EnhPackedContents attribute)
(espnet2.bin.pack.EnhS2TPackedContents attribute)
(espnet2.bin.pack.PackedContents attribute)
(espnet2.bin.pack.S2STPackedContents attribute)
(espnet2.bin.pack.S2TPackedContents attribute)
(espnet2.bin.pack.SSLPackedContents attribute)
(espnet2.bin.pack.STPackedContents attribute)
(espnet2.bin.pack.SVSPackedContents attribute)
(espnet2.bin.pack.SpkPackedContents attribute)
(espnet2.bin.pack.TTSPackedContents attribute)
fill_missing_args() (in module espnet.utils.fill_missing_args)
filter_modules() (in module espnet.asr.pytorch_backend.asr_init)
filter_state_dict() (in module espnet2.torch_utils.load_pretrained_model)
final() (espnet.lm.chainer_backend.extlm.LookAheadWordLM method)
(espnet.lm.chainer_backend.extlm.MultiLevelLM method)
(espnet.lm.chainer_backend.lm.ClassifierWithState method)
(espnet.lm.pytorch_backend.extlm.LookAheadWordLM method)
(espnet.lm.pytorch_backend.extlm.MultiLevelLM method)
(espnet.nets.pytorch_backend.lm.default.ClassifierWithState method)
final_dim (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
final_score() (espnet.nets.pytorch_backend.lm.default.DefaultRNNLM method)
(espnet.nets.scorer_interface.ScorerInterface method)
finalize() (espnet.utils.dataset.ChainerDataLoader method)
find_path_and_change_it_recursive() (in module espnet2.main_funcs.pack_funcs)
finish_epoch() (espnet2.train.reporter.Reporter method)
finished() (espnet2.train.reporter.SubReporter method)
fix_input_dims() (espnet2.enh.layers.dcunet.DCUNet method)
fix_output_dims() (espnet2.enh.layers.dcunet.DCUNet method)
FixedOrderSolver (class in espnet2.enh.loss.wrappers.fixed_order)
flatten_grid_locations() (in module espnet.utils.spec_augment)
flatten_parameters() (espnet2.enh.layers.complexnn.NavieComplexLSTM method)
(espnet2.enh.separator.dccrn_separator.DCCRNSeparator method)
flatten_tensor() (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
FlipFlow (class in espnet2.gan_tts.vits.flow)
float_or_none() (in module espnet2.utils.types)
FloatRandomGenerateDataset (class in espnet2.fileio.rand_gen_dataset)
FoldedBatchSampler (class in espnet2.samplers.folded_batch_sampler)
force_gatherable() (in module espnet2.torch_utils.device_funcs)
forced_align() (espnet.nets.pytorch_backend.ctc.CTC method)
format_mulenc_args() (in module espnet.asr.asr_utils)
forward() (espnet.lm.pytorch_backend.extlm.LookAheadWordLM method)
(espnet.lm.pytorch_backend.extlm.MultiLevelLM method)
(espnet.nets.asr_interface.ASRInterface method)
(espnet.nets.batch_beam_search_online.BatchBeamSearchOnline method)
(espnet.nets.batch_beam_search_online_sim.BatchBeamSearchOnlineSim method)
(espnet.nets.beam_search.BeamSearch method)
(espnet.nets.beam_search_timesync.BeamSearchTimeSync method)
(espnet.nets.beam_search_timesync_streaming.BeamSearchTimeSyncStreaming method)
(espnet.nets.chainer_backend.deterministic_embed_id.EmbedIDFunction method)
(espnet.nets.chainer_backend.deterministic_embed_id.EmbedIDGrad method)
(espnet.nets.chainer_backend.e2e_asr.E2E method)
(espnet.nets.chainer_backend.e2e_asr_transformer.E2E method)
(espnet.nets.chainer_backend.transformer.attention.MultiHeadAttention method)
(espnet.nets.chainer_backend.transformer.decoder.Decoder method)
(espnet.nets.chainer_backend.transformer.decoder_layer.DecoderLayer method)
(espnet.nets.chainer_backend.transformer.embedding.PositionalEncoding method)
(espnet.nets.chainer_backend.transformer.encoder.Encoder method)
(espnet.nets.chainer_backend.transformer.encoder_layer.EncoderLayer method)
(espnet.nets.chainer_backend.transformer.label_smoothing_loss.LabelSmoothingLoss method)
(espnet.nets.chainer_backend.transformer.subsampling.Conv2dSubsampling method)
(espnet.nets.chainer_backend.transformer.subsampling.LinearSampling method)
(espnet.nets.lm_interface.LMInterface method)
(espnet.nets.mt_interface.MTInterface method)
(espnet.nets.pytorch_backend.conformer.contextual_block_encoder_layer.ContextualBlockEncoderLayer method)
(espnet.nets.pytorch_backend.conformer.convolution.ConvolutionModule method)
(espnet.nets.pytorch_backend.conformer.encoder.Encoder method)
(espnet.nets.pytorch_backend.conformer.encoder_layer.EncoderLayer method)
(espnet.nets.pytorch_backend.conformer.swish.Swish method)
(espnet.nets.pytorch_backend.ctc.CTC method)
(espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_maskctc.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix.EncoderMix method)
(espnet.nets.pytorch_backend.e2e_asr_mix_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transducer.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_mt.E2E method)
(espnet.nets.pytorch_backend.e2e_mt_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_tts_fastspeech.FeedForwardTransformer method)
(espnet.nets.pytorch_backend.e2e_tts_fastspeech.FeedForwardTransformerLoss method)
(espnet.nets.pytorch_backend.e2e_tts_tacotron2.GuidedAttentionLoss method)
(espnet.nets.pytorch_backend.e2e_tts_tacotron2.Tacotron2 method)
(espnet.nets.pytorch_backend.e2e_tts_tacotron2.Tacotron2Loss method)
(espnet.nets.pytorch_backend.e2e_tts_transformer.GuidedMultiHeadAttentionLoss method)
(espnet.nets.pytorch_backend.e2e_tts_transformer.Transformer method)
(espnet.nets.pytorch_backend.e2e_vc_tacotron2.Tacotron2 method)
(espnet.nets.pytorch_backend.e2e_vc_transformer.Transformer method)
(espnet.nets.pytorch_backend.fastspeech.duration_calculator.DurationCalculator method)
(espnet.nets.pytorch_backend.fastspeech.duration_predictor.DurationPredictor method)
(espnet.nets.pytorch_backend.fastspeech.duration_predictor.DurationPredictorLoss method)
(espnet.nets.pytorch_backend.fastspeech.length_regulator.LengthRegulator method)
(espnet.nets.pytorch_backend.frontends.dnn_beamformer.AttentionReference method)
(espnet.nets.pytorch_backend.frontends.dnn_beamformer.DNN_Beamformer method)
(espnet.nets.pytorch_backend.frontends.dnn_wpe.DNN_WPE method)
(espnet.nets.pytorch_backend.frontends.feature_transform.FeatureTransform method)
(espnet.nets.pytorch_backend.frontends.feature_transform.GlobalMVN method)
(espnet.nets.pytorch_backend.frontends.feature_transform.LogMel method)
(espnet.nets.pytorch_backend.frontends.feature_transform.UtteranceMVN method)
(espnet.nets.pytorch_backend.frontends.frontend.Frontend method)
(espnet.nets.pytorch_backend.frontends.mask_estimator.MaskEstimator method)
(espnet.nets.pytorch_backend.gtn_ctc.GTNCTCLossFunction static method)
(espnet.nets.pytorch_backend.lm.default.ClassifierWithState method)
(espnet.nets.pytorch_backend.lm.default.DefaultRNNLM method)
(espnet.nets.pytorch_backend.lm.default.RNNLM method)
(espnet.nets.pytorch_backend.lm.seq_rnn.SequentialRNNLM method)
(espnet.nets.pytorch_backend.lm.transformer.TransformerLM method)
(espnet.nets.pytorch_backend.rnn.attentions.AttAdd method)
(espnet.nets.pytorch_backend.rnn.attentions.AttCov method)
(espnet.nets.pytorch_backend.rnn.attentions.AttCovLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.AttDot method)
(espnet.nets.pytorch_backend.rnn.attentions.AttForward method)
(espnet.nets.pytorch_backend.rnn.attentions.AttForwardTA method)
(espnet.nets.pytorch_backend.rnn.attentions.AttLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.AttLoc2D method)
(espnet.nets.pytorch_backend.rnn.attentions.AttLocRec method)
(espnet.nets.pytorch_backend.rnn.attentions.AttMultiHeadAdd method)
(espnet.nets.pytorch_backend.rnn.attentions.AttMultiHeadDot method)
(espnet.nets.pytorch_backend.rnn.attentions.AttMultiHeadLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.AttMultiHeadMultiResLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.GDCAttLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.NoAtt method)
(espnet.nets.pytorch_backend.rnn.decoders.Decoder method)
(espnet.nets.pytorch_backend.rnn.encoders.Encoder method)
(espnet.nets.pytorch_backend.rnn.encoders.RNN method)
(espnet.nets.pytorch_backend.rnn.encoders.RNNP method)
(espnet.nets.pytorch_backend.rnn.encoders.VGG2L method)
(espnet.nets.pytorch_backend.tacotron2.cbhg.CBHG method)
(espnet.nets.pytorch_backend.tacotron2.cbhg.CBHGLoss method)
(espnet.nets.pytorch_backend.tacotron2.cbhg.HighwayNet method)
(espnet.nets.pytorch_backend.tacotron2.decoder.Decoder method)
(espnet.nets.pytorch_backend.tacotron2.decoder.Postnet method)
(espnet.nets.pytorch_backend.tacotron2.decoder.Prenet method)
(espnet.nets.pytorch_backend.tacotron2.decoder.ZoneOutCell method)
(espnet.nets.pytorch_backend.tacotron2.encoder.Encoder method)
(espnet.nets.pytorch_backend.transducer.conv1d_nets.CausalConv1d method)
(espnet.nets.pytorch_backend.transducer.conv1d_nets.Conv1d method)
(espnet.nets.pytorch_backend.transducer.custom_decoder.CustomDecoder method)
(espnet.nets.pytorch_backend.transducer.custom_encoder.CustomEncoder method)
(espnet.nets.pytorch_backend.transducer.joint_network.JointNetwork method)
(espnet.nets.pytorch_backend.transducer.rnn_decoder.RNNDecoder method)
(espnet.nets.pytorch_backend.transducer.rnn_encoder.Encoder method)
(espnet.nets.pytorch_backend.transducer.rnn_encoder.RNN method)
(espnet.nets.pytorch_backend.transducer.rnn_encoder.RNNP method)
(espnet.nets.pytorch_backend.transducer.rnn_encoder.VGG2L method)
(espnet.nets.pytorch_backend.transducer.transducer_tasks.TransducerTasks method)
(espnet.nets.pytorch_backend.transducer.transformer_decoder_layer.TransformerDecoderLayer method)
(espnet.nets.pytorch_backend.transducer.vgg2l.VGG2L method)
(espnet.nets.pytorch_backend.transformer.attention.LegacyRelPositionMultiHeadedAttention method)
(espnet.nets.pytorch_backend.transformer.attention.MultiHeadedAttention method)
(espnet.nets.pytorch_backend.transformer.attention.RelPositionMultiHeadedAttention method)
(espnet.nets.pytorch_backend.transformer.contextual_block_encoder_layer.ContextualBlockEncoderLayer method)
(espnet.nets.pytorch_backend.transformer.decoder.Decoder method)
(espnet.nets.pytorch_backend.transformer.decoder_layer.DecoderLayer method)
(espnet.nets.pytorch_backend.transformer.dynamic_conv.DynamicConvolution method)
(espnet.nets.pytorch_backend.transformer.dynamic_conv2d.DynamicConvolution2D method)
(espnet.nets.pytorch_backend.transformer.embedding.LearnableFourierPosEnc method)
(espnet.nets.pytorch_backend.transformer.embedding.LegacyRelPositionalEncoding method)
(espnet.nets.pytorch_backend.transformer.embedding.PositionalEncoding method)
(espnet.nets.pytorch_backend.transformer.embedding.RelPositionalEncoding method)
(espnet.nets.pytorch_backend.transformer.embedding.ScaledPositionalEncoding method)
(espnet.nets.pytorch_backend.transformer.embedding.StreamPositionalEncoding method)
(espnet.nets.pytorch_backend.transformer.encoder.Encoder method)
(espnet.nets.pytorch_backend.transformer.encoder_layer.EncoderLayer method)
(espnet.nets.pytorch_backend.transformer.encoder_mix.EncoderMix method)
(espnet.nets.pytorch_backend.transformer.label_smoothing_loss.LabelSmoothingLoss method)
(espnet.nets.pytorch_backend.transformer.layer_norm.LayerNorm method)
(espnet.nets.pytorch_backend.transformer.lightconv.LightweightConvolution method)
(espnet.nets.pytorch_backend.transformer.lightconv2d.LightweightConvolution2D method)
(espnet.nets.pytorch_backend.transformer.longformer_attention.LongformerAttention method)
(espnet.nets.pytorch_backend.transformer.multi_layer_conv.Conv1dLinear method)
(espnet.nets.pytorch_backend.transformer.multi_layer_conv.MultiLayeredConv1d method)
(espnet.nets.pytorch_backend.transformer.positionwise_feed_forward.PositionwiseFeedForward method)
(espnet.nets.pytorch_backend.transformer.repeat.MultiSequential method)
(espnet.nets.pytorch_backend.transformer.subsampling.Conv1dSubsampling1 method)
(espnet.nets.pytorch_backend.transformer.subsampling.Conv1dSubsampling2 method)
(espnet.nets.pytorch_backend.transformer.subsampling.Conv1dSubsampling3 method)
(espnet.nets.pytorch_backend.transformer.subsampling.Conv2dSubsampling method)
(espnet.nets.pytorch_backend.transformer.subsampling.Conv2dSubsampling1 method)
(espnet.nets.pytorch_backend.transformer.subsampling.Conv2dSubsampling2 method)
(espnet.nets.pytorch_backend.transformer.subsampling.Conv2dSubsampling6 method)
(espnet.nets.pytorch_backend.transformer.subsampling.Conv2dSubsampling8 method)
(espnet.nets.pytorch_backend.transformer.subsampling_without_posenc.Conv2dSubsamplingWOPosEnc method)
(espnet.nets.pytorch_backend.wavenet.CausalConv1d method)
(espnet.nets.pytorch_backend.wavenet.OneHot method)
(espnet.nets.pytorch_backend.wavenet.UpSampling method)
(espnet.nets.pytorch_backend.wavenet.WaveNet method)
(espnet.nets.tts_interface.TTSInterface method)
(espnet2.asr.ctc.CTC method)
(espnet2.asr.decoder.abs_decoder.AbsDecoder method)
(espnet2.asr.decoder.hugging_face_transformers_decoder.HuggingFaceTransformersDecoder method)
(espnet2.asr.decoder.mlm_decoder.MLMDecoder method)
(espnet2.asr.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr.decoder.s4_decoder.S4Decoder method)
(espnet2.asr.decoder.transducer_decoder.TransducerDecoder method)
(espnet2.asr.decoder.transformer_decoder.BaseTransformerDecoder method)
(espnet2.asr.decoder.transformer_decoder.TransformerMDDecoder method)
(espnet2.asr.decoder.whisper_decoder.ExpandedTokenEmbedding method)
(espnet2.asr.decoder.whisper_decoder.OpenAIWhisperDecoder method)
(espnet2.asr.discrete_asr_espnet_model.ESPnetDiscreteASRModel method)
(espnet2.asr.encoder.abs_encoder.AbsEncoder method)
(espnet2.asr.encoder.avhubert_encoder.BasicBlock method)
(espnet2.asr.encoder.avhubert_encoder.FairseqAVHubertEncoder method)
(espnet2.asr.encoder.avhubert_encoder.GradMultiply static method)
(espnet2.asr.encoder.avhubert_encoder.ResEncoder method)
(espnet2.asr.encoder.avhubert_encoder.ResNet method)
(espnet2.asr.encoder.avhubert_encoder.SamePad method)
(espnet2.asr.encoder.avhubert_encoder.SubModel method)
(espnet2.asr.encoder.avhubert_encoder.TransformerEncoder method)
(espnet2.asr.encoder.branchformer_encoder.BranchformerEncoder method)
(espnet2.asr.encoder.branchformer_encoder.BranchformerEncoderLayer method)
(espnet2.asr.encoder.conformer_encoder.ConformerEncoder method)
(espnet2.asr.encoder.contextual_block_conformer_encoder.ContextualBlockConformerEncoder method)
(espnet2.asr.encoder.contextual_block_transformer_encoder.ContextualBlockTransformerEncoder method)
(espnet2.asr.encoder.e_branchformer_encoder.EBranchformerEncoder method)
(espnet2.asr.encoder.e_branchformer_encoder.EBranchformerEncoderLayer method)
(espnet2.asr.encoder.hubert_encoder.FairseqHubertEncoder method)
(espnet2.asr.encoder.hubert_encoder.FairseqHubertPretrainEncoder method)
(espnet2.asr.encoder.hubert_encoder.TorchAudioHuBERTPretrainEncoder method)
(espnet2.asr.encoder.hugging_face_transformers_encoder.HuggingFaceTransformersEncoder method)
(espnet2.asr.encoder.linear_encoder.LinearEncoder method)
(espnet2.asr.encoder.longformer_encoder.LongformerEncoder method)
(espnet2.asr.encoder.rnn_encoder.RNNEncoder method)
(espnet2.asr.encoder.transformer_encoder.TransformerEncoder method)
(espnet2.asr.encoder.transformer_encoder_multispkr.TransformerEncoder method)
(espnet2.asr.encoder.vgg_rnn_encoder.VGGRNNEncoder method)
(espnet2.asr.encoder.wav2vec2_encoder.FairSeqWav2Vec2Encoder method)
(espnet2.asr.encoder.whisper_encoder.OpenAIWhisperEncoder method)
(espnet2.asr.espnet_model.ESPnetASRModel method)
(espnet2.asr.frontend.abs_frontend.AbsFrontend method)
(espnet2.asr.frontend.asteroid_frontend.AsteroidFrontend method)
(espnet2.asr.frontend.default.DefaultFrontend method)
(espnet2.asr.frontend.fused.FusedFrontends method)
(espnet2.asr.frontend.melspec_torch.MelSpectrogramTorch method)
(espnet2.asr.frontend.s3prl.S3prlFrontend method)
(espnet2.asr.frontend.whisper.WhisperFrontend method)
(espnet2.asr.frontend.windowing.SlidingWindow method)
(espnet2.asr.layers.cgmlp.ConvolutionalGatingMLP method)
(espnet2.asr.layers.cgmlp.ConvolutionalSpatialGatingUnit method)
(espnet2.asr.layers.fastformer.FastSelfAttention method)
(espnet2.asr.maskctc_model.MaskCTCInference method)
(espnet2.asr.maskctc_model.MaskCTCModel method)
(espnet2.asr.pit_espnet_model.ESPnetASRModel method)
(espnet2.asr.pit_espnet_model.PITLossWrapper method)
(espnet2.asr.postencoder.abs_postencoder.AbsPostEncoder method)
(espnet2.asr.postencoder.hugging_face_transformers_postencoder.HuggingFaceTransformersPostEncoder method)
(espnet2.asr.postencoder.length_adaptor_postencoder.LengthAdaptorPostEncoder method)
(espnet2.asr.preencoder.abs_preencoder.AbsPreEncoder method)
(espnet2.asr.preencoder.linear.LinearProjection method)
(espnet2.asr.preencoder.sinc.LightweightSincConvs method)
(espnet2.asr.preencoder.sinc.SpatialDropout method)
(espnet2.asr.specaug.abs_specaug.AbsSpecAug method)
(espnet2.asr.specaug.specaug.SpecAug method)
(espnet2.asr.state_spaces.attention.MultiHeadedAttention method)
(espnet2.asr.state_spaces.base.SequenceIdentity method)
(espnet2.asr.state_spaces.base.SequenceModule method)
(espnet2.asr.state_spaces.block.SequenceResidualBlock method)
(espnet2.asr.state_spaces.components.DropoutNd method)
(espnet2.asr.state_spaces.components.Normalization method)
(espnet2.asr.state_spaces.components.ReversibleInstanceNorm1dInput method)
(espnet2.asr.state_spaces.components.ReversibleInstanceNorm1dOutput method)
(espnet2.asr.state_spaces.components.SquaredReLU method)
(espnet2.asr.state_spaces.components.StochasticDepth method)
(espnet2.asr.state_spaces.components.TSInverseNormalization method)
(espnet2.asr.state_spaces.components.TSNormalization method)
(espnet2.asr.state_spaces.components.TransposedLN method)
(espnet2.asr.state_spaces.components.TransposedLinear method)
(espnet2.asr.state_spaces.ff.FF method)
(espnet2.asr.state_spaces.model.SequenceModel method)
(espnet2.asr.state_spaces.pool.DownAvgPool method)
(espnet2.asr.state_spaces.pool.DownLinearPool method)
(espnet2.asr.state_spaces.pool.DownPool method)
(espnet2.asr.state_spaces.pool.DownPool2d method)
(espnet2.asr.state_spaces.pool.DownSample method)
(espnet2.asr.state_spaces.pool.DownSpectralPool method)
(espnet2.asr.state_spaces.pool.UpPool method)
(espnet2.asr.state_spaces.pool.UpSample method)
(espnet2.asr.state_spaces.residual.Affine method)
(espnet2.asr.state_spaces.residual.DecayResidual method)
(espnet2.asr.state_spaces.residual.Highway method)
(espnet2.asr.state_spaces.residual.Residual method)
(espnet2.asr.state_spaces.s4.S4 method)
(espnet2.asr.state_spaces.s4.SSKernel method)
(espnet2.asr.state_spaces.s4.SSKernelDiag method)
(espnet2.asr.state_spaces.s4.SSKernelNPLR method)
(espnet2.asr.transducer.rnnt_multi_blank.rnnt_multi_blank.MultiblankRNNTLossNumba method)
(espnet2.asr.transducer.rnnt_multi_blank.rnnt_multi_blank.RNNTLossNumba method)
(espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt.LogSoftmaxGradModification static method)
(espnet2.asr_transducer.activation.FTSwish method)
(espnet2.asr_transducer.activation.Mish method)
(espnet2.asr_transducer.activation.Smish method)
(espnet2.asr_transducer.activation.Swish method)
(espnet2.asr_transducer.decoder.abs_decoder.AbsDecoder method)
(espnet2.asr_transducer.decoder.blocks.mega.MEGA method)
(espnet2.asr_transducer.decoder.blocks.rwkv.RWKV method)
(espnet2.asr_transducer.decoder.mega_decoder.MEGADecoder method)
(espnet2.asr_transducer.decoder.modules.mega.feed_forward.NormalizedPositionwiseFeedForward method)
(espnet2.asr_transducer.decoder.modules.mega.multi_head_damped_ema.MultiHeadDampedEMA method)
(espnet2.asr_transducer.decoder.modules.mega.positional_bias.RelativePositionBias method)
(espnet2.asr_transducer.decoder.modules.mega.positional_bias.RotaryRelativePositionBias method)
(espnet2.asr_transducer.decoder.modules.rwkv.attention.SelfAttention method)
(espnet2.asr_transducer.decoder.modules.rwkv.attention.WKVLinearAttention static method)
(espnet2.asr_transducer.decoder.modules.rwkv.feed_forward.FeedForward method)
(espnet2.asr_transducer.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr_transducer.decoder.rwkv_decoder.RWKVDecoder method)
(espnet2.asr_transducer.decoder.stateless_decoder.StatelessDecoder method)
(espnet2.asr_transducer.encoder.blocks.branchformer.Branchformer method)
(espnet2.asr_transducer.encoder.blocks.conformer.Conformer method)
(espnet2.asr_transducer.encoder.blocks.conv1d.Conv1d method)
(espnet2.asr_transducer.encoder.blocks.conv_input.ConvInput method)
(espnet2.asr_transducer.encoder.blocks.ebranchformer.EBranchformer method)
(espnet2.asr_transducer.encoder.encoder.Encoder method)
(espnet2.asr_transducer.encoder.modules.attention.RelPositionMultiHeadedAttention method)
(espnet2.asr_transducer.encoder.modules.convolution.ConformerConvolution method)
(espnet2.asr_transducer.encoder.modules.convolution.ConvolutionalSpatialGatingUnit method)
(espnet2.asr_transducer.encoder.modules.convolution.DepthwiseConvolution method)
(espnet2.asr_transducer.encoder.modules.multi_blocks.MultiBlocks method)
(espnet2.asr_transducer.encoder.modules.positional_encoding.RelPositionalEncoding method)
(espnet2.asr_transducer.espnet_transducer_model.ESPnetASRTransducerModel method)
(espnet2.asr_transducer.joint_network.JointNetwork method)
(espnet2.asr_transducer.normalization.BasicNorm method)
(espnet2.asr_transducer.normalization.RMSNorm method)
(espnet2.asr_transducer.normalization.ScaleNorm method)
(espnet2.asvspoof.decoder.abs_decoder.AbsDecoder method)
(espnet2.asvspoof.decoder.linear_decoder.LinearDecoder method)
(espnet2.asvspoof.espnet_model.ESPnetASVSpoofModel method)
(espnet2.asvspoof.loss.abs_loss.AbsASVSpoofLoss method)
(espnet2.asvspoof.loss.am_softmax_loss.ASVSpoofAMSoftmaxLoss method)
(espnet2.asvspoof.loss.binary_loss.ASVSpoofBinaryLoss method)
(espnet2.asvspoof.loss.oc_softmax_loss.ASVSpoofOCSoftmaxLoss method)
(espnet2.diar.abs_diar.AbsDiarization method)
(espnet2.diar.attractor.abs_attractor.AbsAttractor method)
(espnet2.diar.attractor.rnn_attractor.RnnAttractor method)
(espnet2.diar.decoder.abs_decoder.AbsDecoder method)
(espnet2.diar.decoder.linear_decoder.LinearDecoder method)
(espnet2.diar.espnet_model.ESPnetDiarizationModel method)
(espnet2.diar.label_processor.LabelProcessor method)
(espnet2.diar.layers.abs_mask.AbsMask method)
(espnet2.diar.layers.multi_mask.MultiMask method)
(espnet2.diar.layers.tcn_nomask.ChannelwiseLayerNorm method)
(espnet2.diar.layers.tcn_nomask.Chomp1d method)
(espnet2.diar.layers.tcn_nomask.DepthwiseSeparableConv method)
(espnet2.diar.layers.tcn_nomask.GlobalLayerNorm method)
(espnet2.diar.layers.tcn_nomask.TemporalBlock method)
(espnet2.diar.layers.tcn_nomask.TemporalConvNet method)
(espnet2.diar.separator.tcn_separator_nomask.TCNSeparatorNomask method)
(espnet2.enh.abs_enh.AbsEnhancement method)
(espnet2.enh.decoder.abs_decoder.AbsDecoder method)
(espnet2.enh.decoder.conv_decoder.ConvDecoder method)
(espnet2.enh.decoder.null_decoder.NullDecoder method)
(espnet2.enh.decoder.stft_decoder.STFTDecoder method)
(espnet2.enh.diffusion.abs_diffusion.AbsDiffusion method)
(espnet2.enh.diffusion.score_based_diffusion.ScoreModel method)
(espnet2.enh.diffusion_enh.ESPnetDiffusionModel method)
(espnet2.enh.encoder.abs_encoder.AbsEncoder method)
(espnet2.enh.encoder.conv_encoder.ConvEncoder method)
(espnet2.enh.encoder.null_encoder.NullEncoder method)
(espnet2.enh.encoder.stft_encoder.STFTEncoder method)
(espnet2.enh.espnet_enh_s2t_model.ESPnetEnhS2TModel method)
(espnet2.enh.espnet_model.ESPnetEnhancementModel method)
(espnet2.enh.espnet_model_tse.ESPnetExtractionModel method)
(espnet2.enh.extractor.abs_extractor.AbsExtractor method)
(espnet2.enh.extractor.td_speakerbeam_extractor.TDSpeakerBeamExtractor method)
(espnet2.enh.layers.adapt_layers.ConcatAdaptLayer method)
(espnet2.enh.layers.adapt_layers.MulAddAdaptLayer method)
(espnet2.enh.layers.complexnn.ComplexBatchNorm method)
(espnet2.enh.layers.complexnn.ComplexConv2d method)
(espnet2.enh.layers.complexnn.ComplexConvTranspose2d method)
(espnet2.enh.layers.complexnn.NavieComplexLSTM method)
(espnet2.enh.layers.dc_crn.DC_CRN method)
(espnet2.enh.layers.dc_crn.DenselyConnectedBlock method)
(espnet2.enh.layers.dc_crn.GLSTM method)
(espnet2.enh.layers.dc_crn.GluConv2d method)
(espnet2.enh.layers.dc_crn.GluConvTranspose2d method)
(espnet2.enh.layers.dcunet.ArgsComplexMultiplicationWrapper method)
(espnet2.enh.layers.dcunet.ComplexBatchNorm method)
(espnet2.enh.layers.dcunet.ComplexLinear method)
(espnet2.enh.layers.dcunet.DCUNet method)
(espnet2.enh.layers.dcunet.DCUNetComplexDecoderBlock method)
(espnet2.enh.layers.dcunet.DCUNetComplexEncoderBlock method)
(espnet2.enh.layers.dcunet.DiffusionStepEmbedding method)
(espnet2.enh.layers.dcunet.FeatureMapDense method)
(espnet2.enh.layers.dcunet.GaussianFourierProjection method)
(espnet2.enh.layers.dcunet.OnReIm method)
(espnet2.enh.layers.dnn_beamformer.AttentionReference method)
(espnet2.enh.layers.dnn_beamformer.DNN_Beamformer method)
(espnet2.enh.layers.dnn_wpe.DNN_WPE method)
(espnet2.enh.layers.dpmulcat.DPMulCat method)
(espnet2.enh.layers.dpmulcat.MulCatBlock method)
(espnet2.enh.layers.dprnn.DPRNN method)
(espnet2.enh.layers.dprnn.DPRNN_TAC method)
(espnet2.enh.layers.dprnn.SingleRNN method)
(espnet2.enh.layers.dptnet.DPTNet method)
(espnet2.enh.layers.dptnet.ImprovedTransformerLayer method)
(espnet2.enh.layers.fasnet.BF_module method)
(espnet2.enh.layers.fasnet.FaSNet_TAC method)
(espnet2.enh.layers.fasnet.FaSNet_base method)
(espnet2.enh.layers.ifasnet.iFaSNet method)
(espnet2.enh.layers.mask_estimator.MaskEstimator method)
(espnet2.enh.layers.ncsnpp.NCSNpp method)
(espnet2.enh.layers.ncsnpp_utils.layers.AttnBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.CRPBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.CondCRPBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.CondMSFBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.CondRCUBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.CondRefineBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.ConditionalResidualBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.ConvMeanPool method)
(espnet2.enh.layers.ncsnpp_utils.layers.Downsample method)
(espnet2.enh.layers.ncsnpp_utils.layers.MSFBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.MeanPoolConv method)
(espnet2.enh.layers.ncsnpp_utils.layers.NIN method)
(espnet2.enh.layers.ncsnpp_utils.layers.RCUBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.RefineBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.ResidualBlock method)
(espnet2.enh.layers.ncsnpp_utils.layers.ResnetBlockDDPM method)
(espnet2.enh.layers.ncsnpp_utils.layers.Upsample method)
(espnet2.enh.layers.ncsnpp_utils.layers.UpsampleConv method)
(espnet2.enh.layers.ncsnpp_utils.layerspp.AttnBlockpp method)
(espnet2.enh.layers.ncsnpp_utils.layerspp.Combine method)
(espnet2.enh.layers.ncsnpp_utils.layerspp.Downsample method)
(espnet2.enh.layers.ncsnpp_utils.layerspp.GaussianFourierProjection method)
(espnet2.enh.layers.ncsnpp_utils.layerspp.ResnetBlockBigGANpp method)
(espnet2.enh.layers.ncsnpp_utils.layerspp.ResnetBlockDDPMpp method)
(espnet2.enh.layers.ncsnpp_utils.layerspp.Upsample method)
(espnet2.enh.layers.ncsnpp_utils.normalization.ConditionalBatchNorm2d method)
(espnet2.enh.layers.ncsnpp_utils.normalization.ConditionalInstanceNorm2d method)
(espnet2.enh.layers.ncsnpp_utils.normalization.ConditionalInstanceNorm2dPlus method)
(espnet2.enh.layers.ncsnpp_utils.normalization.ConditionalNoneNorm2d method)
(espnet2.enh.layers.ncsnpp_utils.normalization.ConditionalVarianceNorm2d method)
(espnet2.enh.layers.ncsnpp_utils.normalization.InstanceNorm2dPlus method)
(espnet2.enh.layers.ncsnpp_utils.normalization.NoneNorm2d method)
(espnet2.enh.layers.ncsnpp_utils.normalization.VarianceNorm2d method)
(espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling.Conv2d method)
(espnet2.enh.layers.skim.MemLSTM method)
(espnet2.enh.layers.skim.SegLSTM method)
(espnet2.enh.layers.skim.SkiM method)
(espnet2.enh.layers.tcn.ChannelwiseLayerNorm method)
(espnet2.enh.layers.tcn.Chomp1d method)
(espnet2.enh.layers.tcn.DepthwiseSeparableConv method)
(espnet2.enh.layers.tcn.GlobalLayerNorm method)
(espnet2.enh.layers.tcn.TemporalBlock method)
(espnet2.enh.layers.tcn.TemporalConvNet method)
(espnet2.enh.layers.tcn.TemporalConvNetInformed method)
(espnet2.enh.layers.tcndenseunet.Conv2DActNorm method)
(espnet2.enh.layers.tcndenseunet.DenseBlock method)
(espnet2.enh.layers.tcndenseunet.FreqWiseBlock method)
(espnet2.enh.layers.tcndenseunet.TCNDenseUNet method)
(espnet2.enh.layers.tcndenseunet.TCNResBlock method)
(espnet2.enh.layers.uses.ATFBlock method)
(espnet2.enh.layers.uses.ChannelAttention method)
(espnet2.enh.layers.uses.ChannelTAC method)
(espnet2.enh.layers.uses.LayerNormalization method)
(espnet2.enh.layers.uses.USES method)
(espnet2.enh.loss.criterions.abs_loss.AbsEnhLoss method)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainAbsCoherence method)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainCrossEntropy method)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainDPCL method)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainL1 method)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainMSE method)
(espnet2.enh.loss.criterions.time_domain.CISDRLoss method)
(espnet2.enh.loss.criterions.time_domain.MultiResL1SpecLoss method)
(espnet2.enh.loss.criterions.time_domain.SDRLoss method)
(espnet2.enh.loss.criterions.time_domain.SISNRLoss method)
(espnet2.enh.loss.criterions.time_domain.SNRLoss method)
(espnet2.enh.loss.criterions.time_domain.TimeDomainL1 method)
(espnet2.enh.loss.criterions.time_domain.TimeDomainMSE method)
(espnet2.enh.loss.wrappers.abs_wrapper.AbsLossWrapper method)
(espnet2.enh.loss.wrappers.dpcl_solver.DPCLSolver method)
(espnet2.enh.loss.wrappers.fixed_order.FixedOrderSolver method)
(espnet2.enh.loss.wrappers.mixit_solver.MixITSolver method)
(espnet2.enh.loss.wrappers.multilayer_pit_solver.MultiLayerPITSolver method)
(espnet2.enh.loss.wrappers.pit_solver.PITSolver method)
(espnet2.enh.separator.abs_separator.AbsSeparator method)
(espnet2.enh.separator.asteroid_models.AsteroidModel_Converter method)
(espnet2.enh.separator.conformer_separator.ConformerSeparator method)
(espnet2.enh.separator.dan_separator.DANSeparator method)
(espnet2.enh.separator.dc_crn_separator.DC_CRNSeparator method)
(espnet2.enh.separator.dccrn_separator.DCCRNSeparator method)
(espnet2.enh.separator.dpcl_e2e_separator.DPCLE2ESeparator method)
(espnet2.enh.separator.dpcl_separator.DPCLSeparator method)
(espnet2.enh.separator.dprnn_separator.DPRNNSeparator method)
(espnet2.enh.separator.dptnet_separator.DPTNetSeparator method)
(espnet2.enh.separator.fasnet_separator.FaSNetSeparator method)
(espnet2.enh.separator.ineube_separator.iNeuBe method)
(espnet2.enh.separator.neural_beamformer.NeuralBeamformer method)
(espnet2.enh.separator.rnn_separator.RNNSeparator method)
(espnet2.enh.separator.skim_separator.SkiMSeparator method)
(espnet2.enh.separator.svoice_separator.Decoder method)
(espnet2.enh.separator.svoice_separator.Encoder method)
(espnet2.enh.separator.svoice_separator.SVoiceSeparator method)
(espnet2.enh.separator.tcn_separator.TCNSeparator method)
(espnet2.enh.separator.tfgridnet_separator.GridNetBlock method)
(espnet2.enh.separator.tfgridnet_separator.LayerNormalization4D method)
(espnet2.enh.separator.tfgridnet_separator.LayerNormalization4DCF method)
(espnet2.enh.separator.tfgridnet_separator.TFGridNet method)
(espnet2.enh.separator.tfgridnetv2_separator.AllHeadPReLULayerNormalization4DCF method)
(espnet2.enh.separator.tfgridnetv2_separator.GridNetV2Block method)
(espnet2.enh.separator.tfgridnetv2_separator.LayerNormalization4DCF method)
(espnet2.enh.separator.tfgridnetv2_separator.TFGridNetV2 method)
(espnet2.enh.separator.transformer_separator.TransformerSeparator method)
(espnet2.enh.separator.uses_separator.USESSeparator method)
(espnet2.gan_svs.abs_gan_svs.AbsGANSVS method)
(espnet2.gan_svs.avocodo.__init__.AvocodoDiscriminator method)
(espnet2.gan_svs.avocodo.__init__.AvocodoDiscriminatorPlus method)
(espnet2.gan_svs.avocodo.__init__.AvocodoGenerator method)
(espnet2.gan_svs.avocodo.__init__.CoMBD method)
(espnet2.gan_svs.avocodo.__init__.CoMBDBlock method)
(espnet2.gan_svs.avocodo.__init__.MDC method)
(espnet2.gan_svs.avocodo.__init__.SBD method)
(espnet2.gan_svs.avocodo.__init__.SBDBlock method)
(espnet2.gan_svs.avocodo.avocodo.AvocodoDiscriminator method)
(espnet2.gan_svs.avocodo.avocodo.AvocodoDiscriminatorPlus method)
(espnet2.gan_svs.avocodo.avocodo.AvocodoGenerator method)
(espnet2.gan_svs.avocodo.avocodo.CoMBD method)
(espnet2.gan_svs.avocodo.avocodo.CoMBDBlock method)
(espnet2.gan_svs.avocodo.avocodo.MDC method)
(espnet2.gan_svs.avocodo.avocodo.SBD method)
(espnet2.gan_svs.avocodo.avocodo.SBDBlock method)
(espnet2.gan_svs.espnet_model.ESPnetGANSVSModel method)
(espnet2.gan_svs.joint.joint_score2wav.JointScore2Wav method)
(espnet2.gan_svs.pits.modules.WN method)
(espnet2.gan_svs.pits.ying_decoder.YingDecoder method)
(espnet2.gan_svs.uhifigan.__init__.SineGen method)
(espnet2.gan_svs.uhifigan.__init__.UHiFiGANGenerator method)
(espnet2.gan_svs.uhifigan.sine_generator.SineGen method)
(espnet2.gan_svs.uhifigan.uhifigan.UHiFiGANGenerator method)
(espnet2.gan_svs.visinger2.__init__.Generator_Harm method)
(espnet2.gan_svs.visinger2.__init__.Generator_Noise method)
(espnet2.gan_svs.visinger2.__init__.VISinger2Discriminator method)
(espnet2.gan_svs.visinger2.__init__.VISinger2VocoderGenerator method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.BaseFrequenceDiscriminator method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.ConvReluNorm method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.Generator_Harm method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.Generator_Noise method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.LayerNorm method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.MelScale method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.MultiFrequencyDiscriminator method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.VISinger2Discriminator method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.VISinger2VocoderGenerator method)
(espnet2.gan_svs.vits.duration_predictor.DurationPredictor method)
(espnet2.gan_svs.vits.generator.VISingerGenerator method)
(espnet2.gan_svs.vits.length_regulator.LengthRegulator method)
(espnet2.gan_svs.vits.modules.Projection method)
(espnet2.gan_svs.vits.phoneme_predictor.PhonemePredictor method)
(espnet2.gan_svs.vits.pitch_predictor.Decoder method)
(espnet2.gan_svs.vits.prior_decoder.PriorDecoder method)
(espnet2.gan_svs.vits.text_encoder.TextEncoder method)
(espnet2.gan_svs.vits.vits.VITS method)
(espnet2.gan_tts.abs_gan_tts.AbsGANTTS method)
(espnet2.gan_tts.espnet_model.ESPnetGANTTSModel method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANGenerator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANMultiPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANMultiScaleDiscriminator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANMultiScaleMultiPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANScaleDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANGenerator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANMultiPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANMultiScaleDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANMultiScaleMultiPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANPeriodDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANScaleDiscriminator method)
(espnet2.gan_tts.hifigan.loss.DiscriminatorAdversarialLoss method)
(espnet2.gan_tts.hifigan.loss.FeatureMatchLoss method)
(espnet2.gan_tts.hifigan.loss.GeneratorAdversarialLoss method)
(espnet2.gan_tts.hifigan.loss.MelSpectrogramLoss method)
(espnet2.gan_tts.hifigan.residual_block.ResidualBlock method)
(espnet2.gan_tts.jets.alignments.AlignmentModule method)
(espnet2.gan_tts.jets.generator.JETSGenerator method)
(espnet2.gan_tts.jets.jets.JETS method)
(espnet2.gan_tts.jets.length_regulator.GaussianUpsampling method)
(espnet2.gan_tts.jets.loss.ForwardSumLoss method)
(espnet2.gan_tts.jets.loss.VarianceLoss method)
(espnet2.gan_tts.joint.joint_text2wav.JointText2Wav method)
(espnet2.gan_tts.melgan.melgan.MelGANDiscriminator method)
(espnet2.gan_tts.melgan.melgan.MelGANGenerator method)
(espnet2.gan_tts.melgan.melgan.MelGANMultiScaleDiscriminator method)
(espnet2.gan_tts.melgan.residual_stack.ResidualStack method)
(espnet2.gan_tts.parallel_wavegan.__init__.ParallelWaveGANDiscriminator method)
(espnet2.gan_tts.parallel_wavegan.__init__.ParallelWaveGANGenerator method)
(espnet2.gan_tts.parallel_wavegan.parallel_wavegan.ParallelWaveGANDiscriminator method)
(espnet2.gan_tts.parallel_wavegan.parallel_wavegan.ParallelWaveGANGenerator method)
(espnet2.gan_tts.parallel_wavegan.upsample.ConvInUpsampleNetwork method)
(espnet2.gan_tts.parallel_wavegan.upsample.Stretch2d method)
(espnet2.gan_tts.parallel_wavegan.upsample.UpsampleNetwork method)
(espnet2.gan_tts.style_melgan.style_melgan.StyleMelGANDiscriminator method)
(espnet2.gan_tts.style_melgan.style_melgan.StyleMelGANGenerator method)
(espnet2.gan_tts.style_melgan.tade_res_block.TADELayer method)
(espnet2.gan_tts.style_melgan.tade_res_block.TADEResBlock method)
(espnet2.gan_tts.vits.duration_predictor.StochasticDurationPredictor method)
(espnet2.gan_tts.vits.flow.ConvFlow method)
(espnet2.gan_tts.vits.flow.DilatedDepthSeparableConv method)
(espnet2.gan_tts.vits.flow.ElementwiseAffineFlow method)
(espnet2.gan_tts.vits.flow.FlipFlow method)
(espnet2.gan_tts.vits.flow.LogFlow method)
(espnet2.gan_tts.vits.flow.Transpose method)
(espnet2.gan_tts.vits.generator.VITSGenerator method)
(espnet2.gan_tts.vits.loss.KLDivergenceLoss method)
(espnet2.gan_tts.vits.loss.KLDivergenceLossWithoutFlow method)
(espnet2.gan_tts.vits.posterior_encoder.PosteriorEncoder method)
(espnet2.gan_tts.vits.residual_coupling.ResidualAffineCouplingBlock method)
(espnet2.gan_tts.vits.residual_coupling.ResidualAffineCouplingLayer method)
(espnet2.gan_tts.vits.text_encoder.TextEncoder method)
(espnet2.gan_tts.vits.vits.VITS method)
(espnet2.gan_tts.wavenet.residual_block.ResidualBlock method)
(espnet2.gan_tts.wavenet.wavenet.WaveNet method)
(espnet2.hubert.espnet_model.HubertPretrainModel method)
(espnet2.hubert.espnet_model.TorchAudioHubertPretrainModel method)
(espnet2.hubert.hubert_loss.HubertPretrainLoss method)
(espnet2.layers.abs_normalize.AbsNormalize method)
(espnet2.layers.global_mvn.GlobalMVN method)
(espnet2.layers.houlsby_adapter_layer.HoulsbyTransformerSentenceEncoderLayer method)
(espnet2.layers.houlsby_adapter_layer.Houlsby_Adapter method)
(espnet2.layers.label_aggregation.LabelAggregate method)
(espnet2.layers.log_mel.LogMel method)
(espnet2.layers.mask_along_axis.MaskAlongAxis method)
(espnet2.layers.mask_along_axis.MaskAlongAxisVariableMaxWidth method)
(espnet2.layers.sinc_conv.LogCompression method)
(espnet2.layers.sinc_conv.SincConv method)
(espnet2.layers.stft.Stft method)
(espnet2.layers.time_warp.TimeWarp method)
(espnet2.layers.utterance_mvn.UtteranceMVN method)
(espnet2.lm.abs_model.AbsLM method)
(espnet2.lm.espnet_model.ESPnetLanguageModel method)
(espnet2.lm.espnet_model_multitask.ESPnetMultitaskLanguageModel method)
(espnet2.lm.huggingface_pretrained_opt_lm.HuggingfaceOPTModel method)
(espnet2.lm.seq_rnn_lm.SequentialRNNLM method)
(espnet2.lm.transformer_lm.TransformerLM method)
(espnet2.mt.espnet_model.ESPnetMTModel method)
(espnet2.mt.frontend.embedding.Embedding method)
(espnet2.s2st.aux_attention.abs_aux_attention.AbsS2STAuxAttention method)
(espnet2.s2st.aux_attention.multihead.MultiHeadAttention method)
(espnet2.s2st.espnet_model.ESPnetS2STModel method)
(espnet2.s2st.losses.abs_loss.AbsS2STLoss method)
(espnet2.s2st.losses.attention_loss.S2STAttentionLoss method)
(espnet2.s2st.losses.ctc_loss.S2STCTCLoss method)
(espnet2.s2st.losses.guided_attention_loss.S2STGuidedAttentionLoss method)
(espnet2.s2st.losses.tacotron_loss.S2STTacotron2Loss method)
(espnet2.s2st.synthesizer.abs_synthesizer.AbsSynthesizer method)
(espnet2.s2st.synthesizer.discrete_synthesizer.TransformerDiscreteSynthesizer method)
(espnet2.s2st.synthesizer.translatotron.Translatotron method)
(espnet2.s2st.synthesizer.translatotron2.DurationPredictor method)
(espnet2.s2st.synthesizer.translatotron2.GaussianUpsampling method)
(espnet2.s2st.synthesizer.translatotron2.Prenet method)
(espnet2.s2st.synthesizer.unity_synthesizer.UnitYSynthesizer method)
(espnet2.s2st.tgt_feats_extract.abs_tgt_feats_extract.AbsTgtFeatsExtract method)
(espnet2.s2st.tgt_feats_extract.linear_spectrogram.LinearSpectrogram method)
(espnet2.s2st.tgt_feats_extract.log_mel_fbank.LogMelFbank method)
(espnet2.s2st.tgt_feats_extract.log_spectrogram.LogSpectrogram method)
(espnet2.s2t.espnet_model.ESPnetS2TModel method)
(espnet2.slu.espnet_model.ESPnetSLUModel method)
(espnet2.slu.postdecoder.abs_postdecoder.AbsPostDecoder method)
(espnet2.slu.postdecoder.hugging_face_transformers_postdecoder.HuggingFaceTransformersPostDecoder method)
(espnet2.slu.postencoder.conformer_postencoder.ConformerPostEncoder method)
(espnet2.slu.postencoder.transformer_postencoder.TransformerPostEncoder method)
(espnet2.spk.encoder.conformer_encoder.MfaConformerEncoder method)
(espnet2.spk.encoder.ecapa_tdnn_encoder.EcapaTdnnEncoder method)
(espnet2.spk.encoder.identity_encoder.IdentityEncoder method)
(espnet2.spk.encoder.rawnet3_encoder.RawNet3Encoder method)
(espnet2.spk.encoder.ska_tdnn_encoder.Bottle2neck method)
(espnet2.spk.encoder.ska_tdnn_encoder.ResBlock method)
(espnet2.spk.encoder.ska_tdnn_encoder.SEModule method)
(espnet2.spk.encoder.ska_tdnn_encoder.SKAttentionModule method)
(espnet2.spk.encoder.ska_tdnn_encoder.SkaTdnnEncoder method)
(espnet2.spk.encoder.ska_tdnn_encoder.cwSKAttention method)
(espnet2.spk.encoder.ska_tdnn_encoder.fwSKAttention method)
(espnet2.spk.encoder.xvector_encoder.XvectorEncoder method)
(espnet2.spk.espnet_model.ESPnetSpeakerModel method)
(espnet2.spk.layers.ecapa_block.EcapaBlock method)
(espnet2.spk.layers.ecapa_block.SEModule method)
(espnet2.spk.layers.rawnet_block.AFMS method)
(espnet2.spk.layers.rawnet_block.Bottle2neck method)
(espnet2.spk.loss.aamsoftmax.AAMSoftmax method)
(espnet2.spk.loss.aamsoftmax_subcenter_intertopk.ArcMarginProduct_intertopk_subcenter method)
(espnet2.spk.loss.abs_loss.AbsLoss method)
(espnet2.spk.pooling.abs_pooling.AbsPooling method)
(espnet2.spk.pooling.chn_attn_stat_pooling.ChnAttnStatPooling method)
(espnet2.spk.pooling.mean_pooling.MeanPooling method)
(espnet2.spk.pooling.stat_pooling.StatsPooling method)
(espnet2.spk.projector.abs_projector.AbsProjector method)
(espnet2.spk.projector.rawnet3_projector.RawNet3Projector method)
(espnet2.spk.projector.ska_tdnn_projector.SkaTdnnProjector method)
(espnet2.spk.projector.xvector_projector.XvectorProjector method)
(espnet2.st.espnet_model.ESPnetSTModel method)
(espnet2.svs.abs_svs.AbsSVS method)
(espnet2.svs.espnet_model.ESPnetSVSModel method)
(espnet2.svs.feats_extract.score_feats_extract.FrameScoreFeats method)
(espnet2.svs.feats_extract.score_feats_extract.SyllableScoreFeats method)
(espnet2.svs.naive_rnn.naive_rnn.NaiveRNN method)
(espnet2.svs.naive_rnn.naive_rnn.NaiveRNNLoss method)
(espnet2.svs.naive_rnn.naive_rnn_dp.NaiveRNNDP method)
(espnet2.svs.singing_tacotron.decoder.Decoder method)
(espnet2.svs.singing_tacotron.encoder.Duration_Encoder method)
(espnet2.svs.singing_tacotron.encoder.Encoder method)
(espnet2.svs.singing_tacotron.singing_tacotron.singing_tacotron method)
(espnet2.svs.xiaoice.XiaoiceSing.XiaoiceSing method)
(espnet2.svs.xiaoice.loss.XiaoiceSing2Loss method)
(espnet2.torch_utils.forward_adaptor.ForwardAdaptor method)
(espnet2.train.abs_espnet_model.AbsESPnetModel method)
(espnet2.train.abs_gan_espnet_model.AbsGANESPnetModel method)
(espnet2.tts.abs_tts.AbsTTS method)
(espnet2.tts.espnet_model.ESPnetTTSModel method)
(espnet2.tts.fastspeech.fastspeech.FastSpeech method)
(espnet2.tts.fastspeech2.fastspeech2.FastSpeech2 method)
(espnet2.tts.fastspeech2.loss.FastSpeech2Loss method)
(espnet2.tts.fastspeech2.variance_predictor.VariancePredictor method)
(espnet2.tts.feats_extract.abs_feats_extract.AbsFeatsExtract method)
(espnet2.tts.feats_extract.dio.Dio method)
(espnet2.tts.feats_extract.energy.Energy method)
(espnet2.tts.feats_extract.linear_spectrogram.LinearSpectrogram method)
(espnet2.tts.feats_extract.log_mel_fbank.LogMelFbank method)
(espnet2.tts.feats_extract.log_spectrogram.LogSpectrogram method)
(espnet2.tts.feats_extract.ying.Ying method)
(espnet2.tts.gst.style_encoder.ReferenceEncoder method)
(espnet2.tts.gst.style_encoder.StyleEncoder method)
(espnet2.tts.gst.style_encoder.StyleTokenLayer method)
(espnet2.tts.prodiff.denoiser.Mish method)
(espnet2.tts.prodiff.denoiser.ResidualBlock method)
(espnet2.tts.prodiff.denoiser.SpectogramDenoiser method)
(espnet2.tts.prodiff.loss.ProDiffLoss method)
(espnet2.tts.prodiff.loss.SSimLoss method)
(espnet2.tts.prodiff.prodiff.ProDiff method)
(espnet2.tts.tacotron2.tacotron2.Tacotron2 method)
(espnet2.tts.transformer.transformer.Transformer method)
(espnet2.tts.utils.__init__.DurationCalculator method)
(espnet2.tts.utils.__init__.ParallelWaveGANPretrainedVocoder method)
(espnet2.tts.utils.duration_calculator.DurationCalculator method)
(espnet2.tts.utils.parallel_wavegan_pretrained_vocoder.ParallelWaveGANPretrainedVocoder method)
(espnet2.uasr.discriminator.abs_discriminator.AbsDiscriminator method)
(espnet2.uasr.discriminator.conv_discriminator.ConvDiscriminator method)
(espnet2.uasr.discriminator.conv_discriminator.SamePad method)
(espnet2.uasr.espnet_model.ESPnetUASRModel method)
(espnet2.uasr.generator.abs_generator.AbsGenerator method)
(espnet2.uasr.generator.conv_generator.ConvGenerator method)
(espnet2.uasr.generator.conv_generator.SamePad method)
(espnet2.uasr.generator.conv_generator.TransposeLast method)
(espnet2.uasr.loss.abs_loss.AbsUASRLoss method)
(espnet2.uasr.loss.discriminator_loss.UASRDiscriminatorLoss method)
(espnet2.uasr.loss.gradient_penalty.UASRGradientPenalty method)
(espnet2.uasr.loss.phoneme_diversity_loss.UASRPhonemeDiversityLoss method)
(espnet2.uasr.loss.pseudo_label_loss.UASRPseudoLabelLoss method)
(espnet2.uasr.loss.smoothness_penalty.UASRSmoothnessPenalty method)
forward_asr() (espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
forward_attention() (espnet.nets.pytorch_backend.transformer.attention.MultiHeadedAttention method)
(espnet2.asr.state_spaces.attention.MultiHeadedAttention method)
(espnet2.asr_transducer.encoder.modules.attention.RelPositionMultiHeadedAttention method)
forward_audio() (espnet2.asr.encoder.avhubert_encoder.AVHubertModel method)
forward_denoise() (espnet2.tts.prodiff.denoiser.SpectogramDenoiser method)
forward_enhance() (espnet2.enh.espnet_model.ESPnetEnhancementModel method)
(espnet2.enh.espnet_model_tse.ESPnetExtractionModel method)
forward_features() (espnet2.asr.encoder.avhubert_encoder.AVHubertModel method)
forward_fusion() (espnet2.asr.encoder.avhubert_encoder.FairseqAVHubertEncoder method)
forward_infer() (espnet.nets.pytorch_backend.conformer.contextual_block_encoder_layer.ContextualBlockEncoderLayer method)
(espnet.nets.pytorch_backend.transformer.contextual_block_encoder_layer.ContextualBlockEncoderLayer method)
(espnet2.asr.encoder.contextual_block_conformer_encoder.ContextualBlockConformerEncoder method)
(espnet2.asr.encoder.contextual_block_transformer_encoder.ContextualBlockTransformerEncoder method)
forward_loss() (espnet2.enh.diffusion_enh.ESPnetDiffusionModel method)
(espnet2.enh.espnet_model.ESPnetEnhancementModel method)
(espnet2.enh.espnet_model_tse.ESPnetExtractionModel method)
forward_mt() (espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
forward_one_step() (espnet.nets.pytorch_backend.transformer.decoder.Decoder method)
(espnet.nets.pytorch_backend.transformer.encoder.Encoder method)
(espnet.nets.pytorch_backend.transformer.encoder_mix.EncoderMix method)
(espnet2.asr.decoder.transformer_decoder.BaseTransformerDecoder method)
(espnet2.asr.decoder.transformer_decoder.TransformerMDDecoder method)
(espnet2.asr.decoder.whisper_decoder.OpenAIWhisperDecoder method)
(espnet2.enh.layers.skim.MemLSTM method)
(espnet2.s2st.synthesizer.discrete_synthesizer.TransformerDiscreteSynthesizer method)
forward_padding_mask() (espnet2.asr.encoder.avhubert_encoder.AVHubertModel method)
forward_qkv() (espnet.nets.pytorch_backend.transformer.attention.MultiHeadedAttention method)
(espnet2.asr.state_spaces.attention.MultiHeadedAttention method)
(espnet2.asr_transducer.encoder.modules.attention.RelPositionMultiHeadedAttention method)
forward_rawwav() (espnet2.diar.abs_diar.AbsDiarization method)
(espnet2.enh.abs_enh.AbsEnhancement method)
(espnet2.enh.separator.asteroid_models.AsteroidModel_Converter method)
forward_state() (espnet2.asr.state_spaces.s4.SSKernel method)
(espnet2.asr.state_spaces.s4.SSKernelDiag method)
forward_stream() (espnet2.enh.layers.skim.SkiM method)
forward_streaming() (espnet2.enh.decoder.abs_decoder.AbsDecoder method)
(espnet2.enh.decoder.conv_decoder.ConvDecoder method)
(espnet2.enh.decoder.stft_decoder.STFTDecoder method)
(espnet2.enh.encoder.abs_encoder.AbsEncoder method)
(espnet2.enh.encoder.conv_encoder.ConvEncoder method)
(espnet2.enh.encoder.stft_encoder.STFTEncoder method)
(espnet2.enh.separator.abs_separator.AbsSeparator method)
(espnet2.enh.separator.rnn_separator.RNNSeparator method)
(espnet2.enh.separator.skim_separator.SkiMSeparator method)
(espnet2.enh.separator.tcn_separator.TCNSeparator method)
forward_train() (espnet.nets.pytorch_backend.conformer.contextual_block_encoder_layer.ContextualBlockEncoderLayer method)
(espnet.nets.pytorch_backend.transformer.contextual_block_encoder_layer.ContextualBlockEncoderLayer method)
(espnet2.asr.encoder.contextual_block_conformer_encoder.ContextualBlockConformerEncoder method)
(espnet2.asr.encoder.contextual_block_transformer_encoder.ContextualBlockTransformerEncoder method)
forward_transformer() (espnet2.asr.encoder.avhubert_encoder.AVHubertModel method)
forward_video() (espnet2.asr.encoder.avhubert_encoder.AVHubertModel method)
ForwardAdaptor (class in espnet2.torch_utils.forward_adaptor)
ForwardSumLoss (class in espnet2.gan_tts.jets.loss)
frame() (espnet2.bin.enh_inference_streaming.SeparateSpeechStreaming method)
FrameScoreFeats (class in espnet2.svs.feats_extract.score_feats_extract)
framing() (in module espnet2.train.preprocessor)
free_port() (in module espnet.distributed.pytorch_backend.launch)
(in module espnet2.train.distributed_utils)
freeze_modules() (in module espnet.asr.pytorch_backend.asr_init)
freq_mask() (in module espnet.transform.spec_augment)
(in module espnet.utils.spec_augment)
freq_path_process() (espnet2.enh.layers.uses.ATFBlock method)
FreqMask (class in espnet.transform.spec_augment)
FrequencyDomainAbsCoherence (class in espnet2.enh.loss.criterions.tf_domain)
FrequencyDomainCrossEntropy (class in espnet2.enh.loss.criterions.tf_domain)
FrequencyDomainDPCL (class in espnet2.enh.loss.criterions.tf_domain)
FrequencyDomainL1 (class in espnet2.enh.loss.criterions.tf_domain)
FrequencyDomainLoss (class in espnet2.enh.loss.criterions.tf_domain)
FrequencyDomainMSE (class in espnet2.enh.loss.criterions.tf_domain)
FreqWiseBlock (class in espnet2.enh.layers.tcndenseunet)
from_args() (espnet.optimizer.chainer.AdadeltaFactory static method)
(espnet.optimizer.chainer.AdamFactory static method)
(espnet.optimizer.chainer.SGDFactory static method)
(espnet.optimizer.factory.OptimizerFactoryInterface static method)
(espnet.optimizer.pytorch.AdadeltaFactory static method)
(espnet.optimizer.pytorch.AdamFactory static method)
(espnet.optimizer.pytorch.SGDFactory static method)
from_pretrained() (espnet2.bin.asr_inference.Speech2Text static method)
(espnet2.bin.asr_inference_maskctc.Speech2Text static method)
(espnet2.bin.asr_transducer_inference.Speech2Text static method)
(espnet2.bin.diar_inference.DiarizeSpeech static method)
(espnet2.bin.enh_inference.SeparateSpeech static method)
(espnet2.bin.enh_inference_streaming.SeparateSpeechStreaming static method)
(espnet2.bin.enh_tse_inference.SeparateSpeech static method)
(espnet2.bin.lm_inference.GenerateText static method)
(espnet2.bin.mt_inference.Text2Text static method)
(espnet2.bin.s2st_inference.Speech2Speech static method)
(espnet2.bin.s2t_inference.Speech2Text static method)
(espnet2.bin.s2t_inference_language.Speech2Language static method)
(espnet2.bin.slu_inference.Speech2Understand static method)
(espnet2.bin.spk_inference.Speech2Embedding static method)
(espnet2.bin.st_inference.Speech2Text static method)
(espnet2.bin.svs_inference.SingingGenerate static method)
(espnet2.bin.tts_inference.Text2Speech static method)
(espnet2.bin.uasr_inference.Speech2Text static method)
(espnet2.bin.uasr_inference_k2.k2Speech2Text static method)
Frontend (class in espnet.nets.pytorch_backend.frontends.frontend)
frontend_for() (in module espnet.nets.pytorch_backend.frontends.frontend)
fs (espnet2.bin.asr_align.CTCSegmentation attribute)
fs() (espnet2.bin.s2st_inference.Speech2Speech property)
(espnet2.bin.svs_inference.SingingGenerate property)
(espnet2.bin.tts_inference.Text2Speech property)
FTSwish (class in espnet2.asr_transducer.activation)
func() (espnet.transform.functional.FuncTrans property)
(in module espnet2.utils.kwargs2args)
FuncTrans (class in espnet.transform.functional)
fused_add_tanh_sigmoid_multiply() (espnet2.gan_svs.pits.modules.WN method)
FusedFrontends (class in espnet2.asr.frontend.fused)
fwSKAttention (class in espnet2.spk.encoder.ska_tdnn_encoder)
G
G2p_en (class in espnet2.text.phoneme_tokenizer)
G2pk (class in espnet2.text.phoneme_tokenizer)
GANSVSTask (class in espnet2.tasks.gan_svs)
GANTrainer (class in espnet2.train.gan_trainer)
GANTrainerOptions (class in espnet2.train.gan_trainer)
GANTTSTask (class in espnet2.tasks.gan_tts)
gaussian() (in module espnet2.tts.prodiff.loss)
GaussianFourierProjection (class in espnet2.enh.layers.dcunet)
(class in espnet2.enh.layers.ncsnpp_utils.layerspp)
GaussianUpsampling (class in espnet2.gan_tts.jets.length_regulator)
(class in espnet2.s2st.synthesizer.translatotron2)
GDCAttLoc (class in espnet.nets.pytorch_backend.rnn.attentions)
gen_lsc_block() (espnet2.asr.preencoder.sinc.LightweightSincConvs method)
generalized_eigenvalue_decomposition() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
generate() (espnet.nets.pytorch_backend.wavenet.WaveNet method)
(espnet2.iterators.category_iter_factory.RawSampler method)
(espnet2.iterators.sequence_iter_factory.RawSampler method)
(espnet2.samplers.abs_sampler.AbsSampler method)
generate_info() (espnet2.main_funcs.pack_funcs.Archiver method)
GenerateText (class in espnet2.bin.lm_inference)
Generator_Harm (class in espnet2.gan_svs.visinger2.__init__)
(class in espnet2.gan_svs.visinger2.visinger2_vocoder)
Generator_Noise (class in espnet2.gan_svs.visinger2.__init__)
(class in espnet2.gan_svs.visinger2.visinger2_vocoder)
GeneratorAdversarialLoss (class in espnet2.gan_tts.hifigan.loss)
get_act() (in module espnet2.enh.layers.ncsnpp_utils.layers)
get_activation() (in module espnet.nets.pytorch_backend.nets_utils)
(in module espnet2.asr_transducer.activation)
(in module espnet2.enh.layers.dcunet)
get_all_keys() (espnet2.train.reporter.Reporter method)
get_arg() (espnet.scheduler.scheduler.SchedulerInterface method)
get_attention_weight() (espnet.asr.asr_mix_utils.PlotAttentionReport method)
get_attention_weights() (espnet.asr.asr_mix_utils.PlotAttentionReport method)
(espnet.asr.asr_utils.PlotAttentionReport method)
(espnet.nets.pytorch_backend.transformer.plot.PlotAttentionReport method)
get_best_epoch() (espnet2.train.reporter.Reporter method)
get_class() (espnet2.train.class_choices.ClassChoices method)
(in module espnet2.asr.state_spaces.utils)
get_commandline_args() (in module espnet.utils.cli_utils)
get_convinput_module_parameters() (in module espnet2.asr_transducer.utils)
get_correlations() (in module espnet2.enh.layers.wpe)
get_covariances() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_ctc_probs() (espnet.asr.asr_utils.PlotCTCReport method)
get_current_feats() (espnet2.asr_transducer.frontend.online_audio_processor.OnlineAudioProcessor method)
get_current_samples() (espnet2.asr_transducer.frontend.online_audio_processor.OnlineAudioProcessor method)
get_decoder_input() (in module espnet.nets.pytorch_backend.transducer.utils)
get_default_config() (espnet2.tasks.abs_task.AbsTask class method)
get_default_kwargs() (in module espnet2.utils.get_default_kwargs)
get_dict_from_cache() (in module espnet2.main_funcs.pack_funcs)
get_ema_coefficients() (espnet2.asr_transducer.decoder.modules.mega.multi_head_damped_ema.MultiHeadDampedEMA method)
get_epoch() (espnet2.train.reporter.Reporter method)
(espnet2.train.reporter.SubReporter method)
get_filter_matrix_conj() (in module espnet2.enh.layers.wpe)
get_first_element() (espnet.utils.dataset.ChainerDataLoader static method)
get_flat_grid_locations() (in module espnet.utils.spec_augment)
get_gev_vector() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_grid_locations() (in module espnet.utils.spec_augment)
get_hugging_face_model_lm_head() (in module espnet2.asr.decoder.hugging_face_transformers_decoder)
get_hugging_face_model_network() (in module espnet2.asr.decoder.hugging_face_transformers_decoder)
get_human_readable_count() (in module espnet2.torch_utils.model_summary)
get_initializer() (in module espnet2.asr.state_spaces.components)
get_keys() (espnet2.train.reporter.Reporter method)
get_keys2() (espnet2.train.reporter.Reporter method)
get_layer() (in module espnet2.torch_utils.get_layer_from_string)
get_lcmv_vector_with_rtf() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_lm_state_dict() (in module espnet.asr.pytorch_backend.asr_init)
get_local_rank() (in module espnet2.train.distributed_utils)
get_logger() (in module espnet2.asr.state_spaces.s4)
get_lpz() (espnet2.bin.asr_align.CTCSegmentation method)
get_lr() (espnet2.schedulers.cosine_anneal_warmup_restart.CosineAnnealingWarmupRestarts method)
(espnet2.schedulers.noam_lr.NoamLR method)
(espnet2.schedulers.piecewise_linear_warmup_lr.PiecewiseLinearWarmupLR method)
(espnet2.schedulers.warmup_lr.WarmupLR method)
(espnet2.schedulers.warmup_step_lr.WarmupStepLR method)
get_magnitude() (espnet2.enh.loss.criterions.time_domain.MultiResL1SpecLoss method)
get_mask_from_lengths() (espnet2.s2st.synthesizer.translatotron2.GaussianUpsampling method)
get_master_addr() (in module espnet2.train.distributed_utils)
get_master_port() (in module espnet2.train.distributed_utils)
get_model_conf() (in module espnet.asr.asr_utils)
get_mvdr_vector() (in module espnet.nets.pytorch_backend.frontends.beamformer)
(in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_mvdr_vector_with_rtf() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_mwf_vector() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_name_from_info() (espnet2.main_funcs.pack_funcs.Archiver method)
get_node_rank() (in module espnet2.train.distributed_utils)
get_normalization() (in module espnet2.asr_transducer.normalization)
(in module espnet2.enh.layers.ncsnpp_utils.normalization)
get_num_frames_writer() (in module espnet.utils.cli_writers)
get_num_nodes() (in module espnet2.train.distributed_utils)
get_num_vocabulary_size() (espnet2.text.hugging_face_token_id_converter.HuggingFaceTokenIDConverter method)
(espnet2.text.token_id_converter.TokenIDConverter method)
(espnet2.text.whisper_token_id_converter.OpenAIWhisperTokenIDConverter method)
get_ode_sampler() (espnet2.enh.diffusion.score_based_diffusion.ScoreModel method)
get_odim() (espnet2.layers.sinc_conv.SincConv method)
get_optim_index() (espnet2.uasr.espnet_model.ESPnetUASRModel method)
get_padding() (in module espnet2.gan_svs.avocodo.avocodo)
get_parameters() (espnet2.s2st.tgt_feats_extract.abs_tgt_feats_extract.AbsTgtFeatsExtract method)
(espnet2.s2st.tgt_feats_extract.linear_spectrogram.LinearSpectrogram method)
(espnet2.s2st.tgt_feats_extract.log_mel_fbank.LogMelFbank method)
(espnet2.s2st.tgt_feats_extract.log_spectrogram.LogSpectrogram method)
(espnet2.svs.feats_extract.score_feats_extract.FrameScoreFeats method)
(espnet2.svs.feats_extract.score_feats_extract.SyllableScoreFeats method)
(espnet2.tts.feats_extract.abs_feats_extract.AbsFeatsExtract method)
(espnet2.tts.feats_extract.dio.Dio method)
(espnet2.tts.feats_extract.energy.Energy method)
(espnet2.tts.feats_extract.linear_spectrogram.LinearSpectrogram method)
(espnet2.tts.feats_extract.log_mel_fbank.LogMelFbank method)
(espnet2.tts.feats_extract.log_spectrogram.LogSpectrogram method)
(espnet2.tts.feats_extract.ying.Ying method)
get_parser() (espnet2.tasks.abs_task.AbsTask class method)
(in module espnet.bin.asr_align)
(in module espnet.bin.asr_enhance)
(in module espnet.bin.asr_recog)
(in module espnet.bin.asr_train)
(in module espnet.bin.lm_train)
(in module espnet.bin.mt_train)
(in module espnet.bin.mt_trans)
(in module espnet.bin.st_train)
(in module espnet.bin.st_trans)
(in module espnet.bin.tts_decode)
(in module espnet.bin.tts_train)
(in module espnet.bin.vc_decode)
(in module espnet.bin.vc_train)
(in module espnet2.bin.aggregate_stats_dirs)
(in module espnet2.bin.asr_align)
(in module espnet2.bin.asr_inference)
(in module espnet2.bin.asr_inference_maskctc)
(in module espnet2.bin.asr_inference_streaming)
(in module espnet2.bin.asr_train)
(in module espnet2.bin.asr_transducer_inference)
(in module espnet2.bin.asr_transducer_train)
(in module espnet2.bin.asvspoof_inference)
(in module espnet2.bin.asvspoof_train)
(in module espnet2.bin.diar_inference)
(in module espnet2.bin.diar_train)
(in module espnet2.bin.enh_inference)
(in module espnet2.bin.enh_inference_streaming)
(in module espnet2.bin.enh_s2t_train)
(in module espnet2.bin.enh_scoring)
(in module espnet2.bin.enh_train)
(in module espnet2.bin.enh_tse_inference)
(in module espnet2.bin.enh_tse_train)
(in module espnet2.bin.gan_svs_train)
(in module espnet2.bin.gan_tts_train)
(in module espnet2.bin.hubert_train)
(in module espnet2.bin.hugging_face_export_vocabulary)
(in module espnet2.bin.launch)
(in module espnet2.bin.lm_calc_perplexity)
(in module espnet2.bin.lm_inference)
(in module espnet2.bin.lm_train)
(in module espnet2.bin.mt_inference)
(in module espnet2.bin.mt_train)
(in module espnet2.bin.pack)
(in module espnet2.bin.s2st_inference)
(in module espnet2.bin.s2st_train)
(in module espnet2.bin.s2t_inference)
(in module espnet2.bin.s2t_inference_language)
(in module espnet2.bin.s2t_train)
(in module espnet2.bin.slu_inference)
(in module espnet2.bin.slu_train)
(in module espnet2.bin.spk_embed_extract)
(in module espnet2.bin.spk_inference)
(in module espnet2.bin.spk_train)
(in module espnet2.bin.split_scps)
(in module espnet2.bin.st_inference)
(in module espnet2.bin.st_inference_streaming)
(in module espnet2.bin.st_train)
(in module espnet2.bin.svs_inference)
(in module espnet2.bin.svs_train)
(in module espnet2.bin.tokenize_text)
(in module espnet2.bin.tts_inference)
(in module espnet2.bin.tts_train)
(in module espnet2.bin.uasr_extract_feature)
(in module espnet2.bin.uasr_inference)
(in module espnet2.bin.uasr_inference_k2)
(in module espnet2.bin.uasr_train)
(in module espnet2.bin.whisper_export_vocabulary)
get_partial_state_dict() (in module espnet.asr.pytorch_backend.asr_init)
get_path() (espnet2.fileio.multi_sound_scp.MultiSoundScpReader method)
(espnet2.fileio.npy_scp.NpyScpReader method)
(espnet2.fileio.npy_scp.NpyScpWriter method)
(espnet2.fileio.score_scp.MIDReader method)
(espnet2.fileio.score_scp.SingingScoreReader method)
(espnet2.fileio.score_scp.SingingScoreWriter method)
(espnet2.fileio.score_scp.XMLReader method)
(espnet2.fileio.score_scp.XMLWriter method)
(espnet2.fileio.sound_scp.SoundScpReader method)
(espnet2.fileio.sound_scp.SoundScpWriter method)
get_pc_sampler() (espnet2.enh.diffusion.score_based_diffusion.ScoreModel method)
get_polyfit_val() (espnet2.enh.layers.dnsmos.DNSMOS_local method)
get_pos_enc_and_att_class() (in module espnet.nets.pytorch_backend.transducer.blocks)
get_positionwise_layer() (espnet.nets.pytorch_backend.transformer.encoder.Encoder method)
get_power() (in module espnet2.enh.layers.wpe)
get_power_spectral_density_matrix() (in module espnet.nets.pytorch_backend.frontends.beamformer)
(in module espnet2.enh.layers.beamformer)
get_random_segments() (in module espnet2.gan_tts.utils.get_random_segments)
get_rank() (in module espnet2.train.distributed_utils)
get_rank1_mwf_vector() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_readers() (in module espnet2.bin.enh_scoring)
get_rtf() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_rtf_matrix() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_sdw_mwf_vector() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_segments() (espnet2.bin.asr_align.CTCSegmentation static method)
(espnet2.svs.feats_extract.score_feats_extract.SyllableScoreFeats method)
(in module espnet2.gan_tts.utils.get_random_segments)
get_sinusoid_embeddings() (espnet2.asr_transducer.decoder.modules.mega.positional_bias.RotaryRelativePositionBias static method)
get_size() (in module espnet2.utils.sized_dict)
get_std_opt() (in module espnet.nets.pytorch_backend.transformer.optimizer)
get_submodules() (in module espnet2.layers.create_adapter_utils)
get_subsample() (in module espnet.nets.pytorch_backend.nets_utils)
get_target() (espnet.nets.pytorch_backend.transducer.transducer_tasks.TransducerTasks method)
get_timing_config() (espnet2.bin.asr_align.CTCSegmentation method)
get_total_count() (espnet2.train.reporter.SubReporter method)
get_total_subsampling_factor() (espnet.nets.asr_interface.ASRInterface method)
(espnet.nets.chainer_backend.asr_interface.ChainerASRInterface method)
(espnet.nets.chainer_backend.e2e_asr.E2E method)
(espnet.nets.chainer_backend.e2e_asr_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transducer.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
get_train_config() (in module espnet2.bin.enh_inference)
(in module espnet2.bin.enh_tse_inference)
get_trained_model_state_dict() (in module espnet.asr.pytorch_backend.asr_init)
get_transducer_task_io() (in module espnet2.asr_transducer.utils)
get_transducer_tasks_io() (espnet.nets.pytorch_backend.transducer.transducer_tasks.TransducerTasks method)
get_value() (espnet2.train.reporter.Reporter method)
get_vgg2l_odim() (in module espnet.nets.e2e_asr_common)
get_weight() (in module espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling)
get_workspace_size() (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
get_world_size() (in module espnet2.train.distributed_utils)
get_WPD_filter() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_WPD_filter_v2() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
get_WPD_filter_with_rtf() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
gev_phase_correction() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
GlobalLayerNorm (class in espnet2.diar.layers.tcn_nomask)
(class in espnet2.enh.layers.tcn)
GlobalMVN (class in espnet.nets.pytorch_backend.frontends.feature_transform)
(class in espnet2.layers.global_mvn)
GLSTM (class in espnet2.enh.layers.dc_crn)
GluConv2d (class in espnet2.enh.layers.dc_crn)
GluConvTranspose2d (class in espnet2.enh.layers.dc_crn)
GPURNNT (class in espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt)
GradMultiply (class in espnet2.asr.encoder.avhubert_encoder)
greedy_search() (espnet.nets.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer_streaming.BeamSearchTransducerStreaming method)
GridNetBlock (class in espnet2.enh.separator.tfgridnet_separator)
GridNetV2Block (class in espnet2.enh.separator.tfgridnetv2_separator)
griffin_lim() (in module espnet2.utils.griffin_lim)
ground_truth_mat (espnet2.bin.asr_align.CTCSegmentationTask attribute)
gru() (in module espnet2.gan_svs.visinger2.ddsp)
GTNCTCLossFunction (class in espnet.nets.pytorch_backend.gtn_ctc)
GuidedAttentionLoss (class in espnet.nets.pytorch_backend.e2e_tts_tacotron2)
GuidedMultiHeadAttentionLoss (class in espnet.nets.pytorch_backend.e2e_tts_transformer)
H
H5FileWrapper (class in espnet2.train.dataset)
hamming_window() (espnet2.layers.sinc_conv.SincConv static method)
harmonic_synth() (in module espnet2.gan_svs.visinger2.ddsp)
has() (espnet2.train.reporter.Reporter method)
has_name() (espnet2.train.dataset.AbsDataset method)
(espnet2.train.dataset.ESPnetDataset method)
(espnet2.train.iterable_dataset.IterableESPnetDataset method)
HDF5Reader (class in espnet.utils.cli_readers)
HDF5Writer (class in espnet.utils.cli_writers)
HiFiGANGenerator (class in espnet2.gan_tts.hifigan.__init__)
(class in espnet2.gan_tts.hifigan.hifigan)
HiFiGANMultiPeriodDiscriminator (class in espnet2.gan_tts.hifigan.__init__)
(class in espnet2.gan_tts.hifigan.hifigan)
HiFiGANMultiScaleDiscriminator (class in espnet2.gan_tts.hifigan.__init__)
(class in espnet2.gan_tts.hifigan.hifigan)
HiFiGANMultiScaleMultiPeriodDiscriminator (class in espnet2.gan_tts.hifigan.__init__)
(class in espnet2.gan_tts.hifigan.hifigan)
HiFiGANPeriodDiscriminator (class in espnet2.gan_tts.hifigan.__init__)
(class in espnet2.gan_tts.hifigan.hifigan)
HiFiGANScaleDiscriminator (class in espnet2.gan_tts.hifigan.__init__)
(class in espnet2.gan_tts.hifigan.hifigan)
highpass_filtering() (in module espnet2.layers.augmentation)
Highway (class in espnet2.asr.state_spaces.residual)
HighwayNet (class in espnet.nets.pytorch_backend.tacotron2.cbhg)
hop_sz (espnet2.enh.loss.criterions.time_domain.MultiResL1SpecLoss attribute)
Houlsby_Adapter (class in espnet2.layers.houlsby_adapter_layer)
HoulsbyTransformerSentenceEncoderLayer (class in espnet2.layers.houlsby_adapter_layer)
hs (espnet.nets.batch_beam_search.BatchHypothesis attribute)
(espnet.nets.beam_search.Hypothesis attribute)
HuBERTCollateFn (class in espnet2.train.collate_fn)
HubertPretrainLoss (class in espnet2.hubert.hubert_loss)
HubertPretrainModel (class in espnet2.hubert.espnet_model)
HubertTask (class in espnet2.tasks.hubert)
HuggingfaceOPTModel (class in espnet2.lm.huggingface_pretrained_opt_lm)
HuggingFaceTokenIDConverter (class in espnet2.text.hugging_face_token_id_converter)
HuggingFaceTokenizer (class in espnet2.text.hugging_face_tokenizer)
HuggingFaceTransformersDecoder (class in espnet2.asr.decoder.hugging_face_transformers_decoder)
HuggingFaceTransformersEncoder (class in espnet2.asr.encoder.hugging_face_transformers_encoder)
HuggingFaceTransformersPostDecoder (class in espnet2.slu.postdecoder.hugging_face_transformers_postdecoder)
HuggingFaceTransformersPostEncoder (class in espnet2.asr.postencoder.hugging_face_transformers_postencoder)
humanfriendly_or_none() (in module espnet2.bin.enh_inference)
(in module espnet2.bin.enh_inference_streaming)
(in module espnet2.bin.enh_tse_inference)
humanfriendly_parse_size_or_none() (in module espnet2.utils.types)
hypotheses_to_results() (espnet2.bin.asr_transducer_inference.Speech2Text method)
Hypothesis (class in espnet.nets.beam_search)
(class in espnet.nets.transducer_decoder_interface)
(class in espnet2.asr.transducer.beam_search_transducer)
(class in espnet2.asr.transducer.beam_search_transducer_streaming)
(class in espnet2.asr_transducer.beam_search_transducer)
I
I_Op (class in espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce)
Identity (class in espnet.transform.transform_interface)
IDENTITY (espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce.I_Op attribute)
identity (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
IdentityEncoder (class in espnet2.spk.encoder.identity_encoder)
ids2text() (espnet2.asr.maskctc_model.MaskCTCInference method)
ids2tokens() (espnet2.text.hugging_face_token_id_converter.HuggingFaceTokenIDConverter method)
(espnet2.text.token_id_converter.TokenIDConverter method)
(espnet2.text.whisper_token_id_converter.OpenAIWhisperTokenIDConverter method)
iFaSNet (class in espnet2.enh.layers.ifasnet)
ignore_aliases() (espnet2.utils.yaml_no_alias_safe_dump.NoAliasSafeDumper method)
ignore_label (espnet.nets.chainer_backend.deterministic_embed_id.EmbedID attribute)
ImprovedTransformerLayer (class in espnet2.enh.layers.dptnet)
in_cooldown() (espnet2.schedulers.warmup_reducelronplateau.WarmupReduceLROnPlateau property)
index_put() (in module espnet2.asr.encoder.avhubert_encoder)
index_select_state() (espnet.nets.ctc_prefix_score.CTCPrefixScoreTH method)
indices_to_split_size() (in module espnet2.bin.uasr_inference_k2)
iNeuBe (class in espnet2.enh.separator.ineube_separator)
infer() (espnet2.gan_svs.pits.ying_decoder.YingDecoder method)
inference() (espnet.nets.pytorch_backend.e2e_tts_fastspeech.FeedForwardTransformer method)
(espnet.nets.pytorch_backend.e2e_tts_tacotron2.Tacotron2 method)
(espnet.nets.pytorch_backend.e2e_tts_transformer.Transformer method)
(espnet.nets.pytorch_backend.e2e_vc_tacotron2.Tacotron2 method)
(espnet.nets.pytorch_backend.e2e_vc_transformer.Transformer method)
(espnet.nets.pytorch_backend.fastspeech.duration_predictor.DurationPredictor method)
(espnet.nets.pytorch_backend.tacotron2.cbhg.CBHG method)
(espnet.nets.pytorch_backend.tacotron2.decoder.Decoder method)
(espnet.nets.pytorch_backend.tacotron2.encoder.Encoder method)
(espnet.nets.tts_interface.TTSInterface method)
(espnet2.asr_transducer.decoder.mega_decoder.MEGADecoder method)
(espnet2.asr_transducer.decoder.rwkv_decoder.RWKVDecoder method)
(espnet2.gan_svs.joint.joint_score2wav.JointScore2Wav method)
(espnet2.gan_svs.uhifigan.__init__.UHiFiGANGenerator method)
(espnet2.gan_svs.uhifigan.uhifigan.UHiFiGANGenerator method)
(espnet2.gan_svs.vits.generator.VISingerGenerator method)
(espnet2.gan_svs.vits.vits.VITS method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANGenerator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANGenerator method)
(espnet2.gan_tts.jets.generator.JETSGenerator method)
(espnet2.gan_tts.jets.jets.JETS method)
(espnet2.gan_tts.joint.joint_text2wav.JointText2Wav method)
(espnet2.gan_tts.melgan.melgan.MelGANGenerator method)
(espnet2.gan_tts.parallel_wavegan.__init__.ParallelWaveGANGenerator method)
(espnet2.gan_tts.parallel_wavegan.parallel_wavegan.ParallelWaveGANGenerator method)
(espnet2.gan_tts.style_melgan.style_melgan.StyleMelGANGenerator method)
(espnet2.gan_tts.vits.generator.VITSGenerator method)
(espnet2.gan_tts.vits.vits.VITS method)
(espnet2.s2st.espnet_model.ESPnetS2STModel method)
(espnet2.s2st.synthesizer.abs_synthesizer.AbsSynthesizer method)
(espnet2.s2st.synthesizer.discrete_synthesizer.TransformerDiscreteSynthesizer method)
(espnet2.s2st.synthesizer.translatotron.Translatotron method)
(espnet2.svs.abs_svs.AbsSVS method)
(espnet2.svs.espnet_model.ESPnetSVSModel method)
(espnet2.svs.naive_rnn.naive_rnn.NaiveRNN method)
(espnet2.svs.naive_rnn.naive_rnn_dp.NaiveRNNDP method)
(espnet2.svs.singing_tacotron.decoder.Decoder method)
(espnet2.svs.singing_tacotron.encoder.Duration_Encoder method)
(espnet2.svs.singing_tacotron.encoder.Encoder method)
(espnet2.svs.singing_tacotron.singing_tacotron.singing_tacotron method)
(espnet2.svs.xiaoice.XiaoiceSing.XiaoiceSing method)
(espnet2.tts.abs_tts.AbsTTS method)
(espnet2.tts.espnet_model.ESPnetTTSModel method)
(espnet2.tts.fastspeech.fastspeech.FastSpeech method)
(espnet2.tts.fastspeech2.fastspeech2.FastSpeech2 method)
(espnet2.tts.prodiff.denoiser.SpectogramDenoiser method)
(espnet2.tts.prodiff.prodiff.ProDiff method)
(espnet2.tts.tacotron2.tacotron2.Tacotron2 method)
(espnet2.tts.transformer.transformer.Transformer method)
(espnet2.uasr.espnet_model.ESPnetUASRModel method)
(in module espnet2.bin.asr_inference)
(in module espnet2.bin.asr_inference_maskctc)
(in module espnet2.bin.asr_inference_streaming)
(in module espnet2.bin.asr_transducer_inference)
(in module espnet2.bin.asvspoof_inference)
(in module espnet2.bin.diar_inference)
(in module espnet2.bin.enh_inference)
(in module espnet2.bin.enh_inference_streaming)
(in module espnet2.bin.enh_tse_inference)
(in module espnet2.bin.lm_inference)
(in module espnet2.bin.mt_inference)
(in module espnet2.bin.s2st_inference)
(in module espnet2.bin.s2t_inference)
(in module espnet2.bin.s2t_inference_language)
(in module espnet2.bin.slu_inference)
(in module espnet2.bin.spk_inference)
(in module espnet2.bin.st_inference)
(in module espnet2.bin.st_inference_streaming)
(in module espnet2.bin.svs_inference)
(in module espnet2.bin.tts_inference)
(in module espnet2.bin.uasr_inference)
(in module espnet2.bin.uasr_inference_k2)
inherite_attributes() (espnet2.enh.espnet_enh_s2t_model.ESPnetEnhS2TModel method)
init_filters() (espnet2.layers.sinc_conv.SincConv method)
init_hyp() (espnet.nets.batch_beam_search.BatchBeamSearch method)
(espnet.nets.beam_search.BeamSearch method)
init_kernels() (in module espnet2.gan_svs.visinger2.ddsp)
init_like_chainer() (espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
init_like_fairseq() (espnet.nets.pytorch_backend.e2e_mt.E2E method)
init_lm_state() (in module espnet.nets.pytorch_backend.transducer.utils)
init_lr() (espnet2.schedulers.cosine_anneal_warmup_restart.CosineAnnealingWarmupRestarts method)
init_options() (espnet2.train.distributed_utils.DistributedOption method)
init_state() (espnet.nets.pytorch_backend.lm.seq_rnn.SequentialRNNLM method)
(espnet.nets.pytorch_backend.rnn.decoders.Decoder method)
(espnet.nets.pytorch_backend.transducer.custom_decoder.CustomDecoder method)
(espnet.nets.pytorch_backend.transducer.rnn_decoder.RNNDecoder method)
(espnet.nets.scorer_interface.ScorerInterface method)
(espnet.nets.scorers.ctc.CTCPrefixScorer method)
(espnet.nets.scorers.ngram.Ngrambase method)
(espnet.nets.scorers.uasr.UASRPrefixScorer method)
(espnet.nets.transducer_decoder_interface.TransducerDecoderInterface method)
(espnet2.asr.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr.decoder.s4_decoder.S4Decoder method)
(espnet2.asr.decoder.transducer_decoder.TransducerDecoder method)
(espnet2.asr_transducer.decoder.abs_decoder.AbsDecoder method)
(espnet2.asr_transducer.decoder.mega_decoder.MEGADecoder method)
(espnet2.asr_transducer.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr_transducer.decoder.rwkv_decoder.RWKVDecoder method)
(espnet2.asr_transducer.decoder.stateless_decoder.StatelessDecoder method)
init_torch_distributed() (espnet2.train.distributed_utils.DistributedOption method)
init_weights() (espnet2.asr.layers.fastformer.FastSelfAttention method)
initial_att() (in module espnet.nets.pytorch_backend.rnn.attentions)
initial_state() (espnet.nets.ctc_prefix_score.CTCPrefixScore method)
initialize() (espnet.nets.chainer_backend.transformer.training.VaswaniRule method)
(in module espnet.nets.pytorch_backend.transformer.initializer)
(in module espnet.nets.pytorch_backend.wavenet)
(in module espnet2.torch_utils.initialize)
initializer() (in module espnet.nets.pytorch_backend.transducer.initializer)
InstanceNorm2dPlus (class in espnet2.enh.layers.ncsnpp_utils.normalization)
instantiate() (in module espnet2.asr.state_spaces.utils)
int_or_none() (in module espnet2.utils.types)
inter_chunk_process() (espnet2.enh.layers.dptnet.DPTNet method)
interpolate_bilinear() (in module espnet.utils.spec_augment)
interpolate_spline() (in module espnet.utils.spec_augment)
into_orig_type() (in module espnet2.enh.layers.adapt_layers)
into_tuple() (in module espnet2.enh.layers.adapt_layers)
intra_chunk_process() (espnet2.enh.layers.dptnet.DPTNet method)
IntRandomGenerateDataset (class in espnet2.fileio.rand_gen_dataset)
Invalid (class in espnet2.utils.get_default_kwargs)
inverse() (espnet2.layers.global_mvn.GlobalMVN method)
(espnet2.layers.inversible_interface.InversibleInterface method)
(espnet2.layers.stft.Stft method)
(in module espnet2.enh.layers.complex_utils)
InversibleInterface (class in espnet2.layers.inversible_interface)
invert() (espnet2.layers.sinc_conv.BarkScale static method)
(espnet2.layers.sinc_conv.MelScale static method)
is_better() (espnet2.schedulers.warmup_reducelronplateau.WarmupReduceLROnPlateau method)
is_complex() (in module espnet2.enh.layers.complex_utils)
is_dereverb_loss() (espnet2.enh.loss.criterions.tf_domain.FrequencyDomainLoss property)
(espnet2.enh.loss.criterions.time_domain.TimeDomainLoss property)
is_dict() (in module espnet2.asr.state_spaces.utils)
is_discriminative_step() (espnet2.uasr.espnet_model.ESPnetUASRModel method)
is_in_slurm_job() (in module espnet2.train.distributed_utils)
is_in_slurm_step() (in module espnet2.train.distributed_utils)
is_list() (in module espnet2.asr.state_spaces.utils)
is_noise_loss() (espnet2.enh.loss.criterions.tf_domain.FrequencyDomainLoss property)
(espnet2.enh.loss.criterions.time_domain.TimeDomainLoss property)
is_prefix() (in module espnet.nets.pytorch_backend.transducer.utils)
is_scipy_wav_style() (in module espnet.utils.cli_utils)
is_torch_1_9_plus (in module espnet2.enh.layers.wpe)
is_torch_complex_tensor() (in module espnet2.enh.layers.complex_utils)
is_writable_process() (in module espnet.asr.pytorch_backend.asr)
is_xla_tensor() (in module espnet2.asr.encoder.avhubert_encoder)
IsG2p (class in espnet2.text.phoneme_tokenizer)
IStft (class in espnet.transform.spectrogram)
istft() (in module espnet.transform.spectrogram)
items() (espnet.utils.io_utils.SoundHDF5File method)
IterableESPnetDataset (class in espnet2.train.iterable_dataset)
IteratorOptions (class in espnet2.tasks.abs_task)
J
JAMO_LEADS (espnet2.text.phoneme_tokenizer.Jaso attribute)
JAMO_TAILS (espnet2.text.phoneme_tokenizer.Jaso attribute)
JAMO_VOWELS (espnet2.text.phoneme_tokenizer.Jaso attribute)
Jaso (class in espnet2.text.phoneme_tokenizer)
JETS (class in espnet2.gan_tts.jets.jets)
JETSGenerator (class in espnet2.gan_tts.jets.generator)
JoinSegmenter (class in espnet2.uasr.segmenter.join_segmenter)
joint_score() (espnet.nets.beam_search_timesync.BeamSearchTimeSync method)
(espnet.nets.beam_search_timesync_streaming.BeamSearchTimeSyncStreaming method)
JointNetwork (class in espnet.nets.pytorch_backend.transducer.joint_network)
(class in espnet2.asr_transducer.joint_network)
JointScore2Wav (class in espnet2.gan_svs.joint.joint_score2wav)
JointText2Wav (class in espnet2.gan_tts.joint.joint_text2wav)
K
k2Speech2Text (class in espnet2.bin.uasr_inference_k2)
kaldi_loader() (in module espnet2.train.dataset)
KaldiReader (class in espnet.utils.cli_readers)
KaldiWriter (class in espnet.utils.cli_writers)
keys() (espnet.utils.io_utils.SoundHDF5File method)
(espnet2.fileio.multi_sound_scp.MultiSoundScpReader method)
(espnet2.fileio.npy_scp.NpyScpReader method)
(espnet2.fileio.read_text.RandomTextReader method)
(espnet2.fileio.rttm.RttmReader method)
(espnet2.fileio.score_scp.MIDReader method)
(espnet2.fileio.score_scp.SingingScoreReader method)
(espnet2.fileio.score_scp.XMLReader method)
(espnet2.fileio.sound_scp.SoundScpReader method)
(espnet2.fileio.vad_scp.VADScpReader method)
(espnet2.train.dataset.AdapterForLabelScpReader method)
(espnet2.train.dataset.AdapterForSingingScoreScpReader method)
(espnet2.train.dataset.AdapterForSoundScpReader method)
KLDivergenceLoss (class in espnet2.gan_tts.vits.loss)
KLDivergenceLossWithoutFlow (class in espnet2.gan_tts.vits.loss)
KoreanCleaner (class in espnet2.text.korean_cleaner)
kwargs2args() (in module espnet2.utils.kwargs2args)
L
label_aggregate() (espnet2.svs.feats_extract.score_feats_extract.FrameScoreFeats method)
label_loader() (in module espnet2.train.dataset)
label_rate (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
label_smoothing_dist() (in module espnet.nets.e2e_asr_common)
LabelAggregate (class in espnet2.layers.label_aggregation)
LabelProcessor (class in espnet2.diar.label_processor)
LabelSmoothingLoss (class in espnet.nets.chainer_backend.transformer.label_smoothing_loss)
(class in espnet.nets.pytorch_backend.transformer.label_smoothing_loss)
LangevinCorrector (class in espnet2.enh.diffusion.sampling.correctors)
latent_temp (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
launch() (in module espnet.distributed.pytorch_backend.launch)
layer_norm_first (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
LayerNorm (class in espnet.nets.chainer_backend.transformer.layer_norm)
(class in espnet.nets.pytorch_backend.transformer.layer_norm)
(class in espnet2.gan_svs.visinger2.visinger2_vocoder)
LayerNormalization (class in espnet2.enh.layers.uses)
LayerNormalization4D (class in espnet2.enh.separator.tfgridnet_separator)
LayerNormalization4DCF (class in espnet2.enh.separator.tfgridnet_separator)
(class in espnet2.enh.separator.tfgridnetv2_separator)
LearnableFourierPosEnc (class in espnet.nets.pytorch_backend.transformer.embedding)
lecun_normal_init_parameters() (in module espnet.nets.pytorch_backend.initialization)
LegacyRelPositionalEncoding (class in espnet.nets.pytorch_backend.transformer.embedding)
LegacyRelPositionMultiHeadedAttention (class in espnet.nets.pytorch_backend.transformer.attention)
length (espnet.nets.batch_beam_search.BatchHypothesis attribute)
LengthAdaptorPostEncoder (class in espnet2.asr.postencoder.length_adaptor_postencoder)
LengthBatchSampler (class in espnet2.samplers.length_batch_sampler)
LengthBonus (class in espnet.nets.scorers.length_bonus)
LengthRegulator (class in espnet.nets.pytorch_backend.fastspeech.length_regulator)
(class in espnet2.gan_svs.vits.length_regulator)
LightweightConvolution (class in espnet.nets.pytorch_backend.transformer.lightconv)
LightweightConvolution2D (class in espnet.nets.pytorch_backend.transformer.lightconv2d)
LightweightConvolution2DTransformerDecoder (class in espnet2.asr.decoder.transformer_decoder)
LightweightConvolutionTransformerDecoder (class in espnet2.asr.decoder.transformer_decoder)
LightweightSincConvs (class in espnet2.asr.preencoder.sinc)
LinearActivation() (in module espnet2.asr.state_spaces.components)
LinearDecoder (class in espnet2.asvspoof.decoder.linear_decoder)
(class in espnet2.diar.decoder.linear_decoder)
LinearEncoder (class in espnet2.asr.encoder.linear_encoder)
LinearProjection (class in espnet2.asr.preencoder.linear)
LinearSampling (class in espnet.nets.chainer_backend.transformer.subsampling)
LinearSpectrogram (class in espnet2.s2st.tgt_feats_extract.linear_spectrogram)
(class in espnet2.tts.feats_extract.linear_spectrogram)
ListsToTensor() (in module espnet2.svs.feats_extract.score_feats_extract)
lm_score (espnet2.asr_transducer.beam_search_transducer.ExtendedHypothesis attribute)
lm_scores (espnet.nets.transducer_decoder_interface.ExtendedHypothesis attribute)
(espnet2.asr.transducer.beam_search_transducer.ExtendedHypothesis attribute)
(espnet2.asr.transducer.beam_search_transducer_streaming.ExtendedHypothesis attribute)
lm_state (espnet.nets.transducer_decoder_interface.Hypothesis attribute)
(espnet2.asr.transducer.beam_search_transducer.Hypothesis attribute)
(espnet2.asr.transducer.beam_search_transducer_streaming.Hypothesis attribute)
(espnet2.asr_transducer.beam_search_transducer.Hypothesis attribute)
LMEvaluator (class in espnet.lm.chainer_backend.lm)
(class in espnet.lm.pytorch_backend.lm)
LMInterface (class in espnet.nets.lm_interface)
LMTask (class in espnet2.tasks.lm)
load_dataset() (in module espnet.lm.lm_utils)
load_kaldi() (in module espnet2.train.iterable_dataset)
load_num_sequence_text() (in module espnet2.fileio.read_text)
load_pretrained_model() (espnet.nets.tts_interface.TTSInterface method)
(in module espnet2.torch_utils.load_pretrained_model)
load_rttm_text() (in module espnet2.fileio.rttm)
load_state_dict() (espnet.nets.pytorch_backend.lm.default.DefaultRNNLM method)
(espnet.nets.pytorch_backend.transformer.optimizer.NoamOpt method)
(espnet2.schedulers.abs_scheduler.AbsBatchStepScheduler method)
(espnet2.schedulers.abs_scheduler.AbsEpochStepScheduler method)
(espnet2.schedulers.abs_scheduler.AbsScheduler method)
(espnet2.schedulers.abs_scheduler.AbsValEpochStepScheduler method)
(espnet2.schedulers.warmup_reducelronplateau.WarmupReduceLROnPlateau method)
(espnet2.train.reporter.Reporter method)
load_trained_model() (in module espnet.asr.pytorch_backend.asr_init)
load_trained_modules() (in module espnet.asr.pytorch_backend.asr_init)
load_wkv_kernel() (in module espnet2.asr_transducer.decoder.modules.rwkv.attention)
LoadInputsAndTargets (class in espnet.utils.io_utils)
local_rank (espnet2.train.distributed_utils.DistributedOption attribute)
log (in module espnet2.asr.state_spaces.s4)
log_attentions() (espnet.asr.asr_mix_utils.PlotAttentionReport method)
(espnet.asr.asr_utils.PlotAttentionReport method)
(espnet.nets.pytorch_backend.transformer.plot.PlotAttentionReport method)
log_ctc_probs() (espnet.asr.asr_utils.PlotCTCReport method)
log_mel_spectrogram() (espnet2.asr.encoder.whisper_encoder.OpenAIWhisperEncoder method)
(espnet2.asr.frontend.whisper.WhisperFrontend method)
log_message() (espnet2.train.reporter.Reporter method)
(espnet2.train.reporter.SubReporter method)
log_plus (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
log_softmax() (espnet.nets.chainer_backend.ctc.CTC method)
(espnet.nets.chainer_backend.transformer.ctc.CTC method)
(espnet.nets.pytorch_backend.ctc.CTC method)
(espnet2.asr.ctc.CTC method)
(espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt.GPURNNT method)
log_sum_exp (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
log_sum_exp() (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt)
log_vandermonde() (in module espnet2.asr.state_spaces.s4)
log_vandermonde_transpose() (in module espnet2.asr.state_spaces.s4)
LogCompression (class in espnet2.layers.sinc_conv)
LogFlow (class in espnet2.gan_tts.vits.flow)
logit_segment() (espnet2.uasr.segmenter.abs_segmenter.AbsSegmenter method)
(espnet2.uasr.segmenter.join_segmenter.JoinSegmenter method)
(espnet2.uasr.segmenter.random_segmenter.RandomSegmenter method)
logit_temp (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
LogMel (class in espnet.nets.pytorch_backend.frontends.feature_transform)
(class in espnet2.layers.log_mel)
logmel2linear() (in module espnet2.utils.griffin_lim)
LogMelFbank (class in espnet2.s2st.tgt_feats_extract.log_mel_fbank)
(class in espnet2.tts.feats_extract.log_mel_fbank)
LogMelSpectrogram (class in espnet.transform.spectrogram)
logmelspectrogram() (in module espnet.transform.spectrogram)
logp (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt_kernel)
LogSoftmaxGradModification (class in espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt)
LogSpectrogram (class in espnet2.s2st.tgt_feats_extract.log_spectrogram)
(class in espnet2.tts.feats_extract.log_spectrogram)
logzero (espnet.lm.chainer_backend.extlm.LookAheadWordLM attribute)
(espnet.lm.chainer_backend.extlm.MultiLevelLM attribute)
(espnet.lm.pytorch_backend.extlm.LookAheadWordLM attribute)
(espnet.lm.pytorch_backend.extlm.MultiLevelLM attribute)
LongformerAttention (class in espnet.nets.pytorch_backend.transformer.longformer_attention)
LongformerEncoder (class in espnet2.asr.encoder.longformer_encoder)
LookAheadWordLM (class in espnet.lm.chainer_backend.extlm)
(class in espnet.lm.pytorch_backend.extlm)
loss_fn() (espnet.nets.pytorch_backend.ctc.CTC method)
(espnet2.asr.ctc.CTC method)
lowpass_filtering() (in module espnet2.layers.augmentation)
lpz (espnet2.bin.asr_align.CTCSegmentationTask attribute)
LR() (espnet2.gan_svs.vits.length_regulator.LengthRegulator method)
lr_for_WarmupLR() (espnet2.schedulers.noam_lr.NoamLR method)
M
main() (espnet2.tasks.abs_task.AbsTask class method)
(in module espnet.bin.asr_align)
(in module espnet.bin.asr_enhance)
(in module espnet.bin.asr_recog)
(in module espnet.bin.asr_train)
(in module espnet.bin.lm_train)
(in module espnet.bin.mt_train)
(in module espnet.bin.mt_trans)
(in module espnet.bin.st_train)
(in module espnet.bin.st_trans)
(in module espnet.bin.tts_decode)
(in module espnet.bin.tts_train)
(in module espnet.bin.vc_decode)
(in module espnet.bin.vc_train)
(in module espnet2.bin.aggregate_stats_dirs)
(in module espnet2.bin.asr_align)
(in module espnet2.bin.asr_inference)
(in module espnet2.bin.asr_inference_maskctc)
(in module espnet2.bin.asr_inference_streaming)
(in module espnet2.bin.asr_train)
(in module espnet2.bin.asr_transducer_inference)
(in module espnet2.bin.asr_transducer_train)
(in module espnet2.bin.asvspoof_inference)
(in module espnet2.bin.asvspoof_train)
(in module espnet2.bin.diar_inference)
(in module espnet2.bin.diar_train)
(in module espnet2.bin.enh_inference)
(in module espnet2.bin.enh_inference_streaming)
(in module espnet2.bin.enh_s2t_train)
(in module espnet2.bin.enh_scoring)
(in module espnet2.bin.enh_train)
(in module espnet2.bin.enh_tse_inference)
(in module espnet2.bin.enh_tse_train)
(in module espnet2.bin.gan_svs_train)
(in module espnet2.bin.gan_tts_train)
(in module espnet2.bin.hubert_train)
(in module espnet2.bin.hugging_face_export_vocabulary)
(in module espnet2.bin.launch)
(in module espnet2.bin.lm_calc_perplexity)
(in module espnet2.bin.lm_inference)
(in module espnet2.bin.lm_train)
(in module espnet2.bin.mt_inference)
(in module espnet2.bin.mt_train)
(in module espnet2.bin.pack)
(in module espnet2.bin.s2st_inference)
(in module espnet2.bin.s2st_train)
(in module espnet2.bin.s2t_inference)
(in module espnet2.bin.s2t_inference_language)
(in module espnet2.bin.s2t_train)
(in module espnet2.bin.slu_inference)
(in module espnet2.bin.slu_train)
(in module espnet2.bin.spk_embed_extract)
(in module espnet2.bin.spk_inference)
(in module espnet2.bin.spk_train)
(in module espnet2.bin.split_scps)
(in module espnet2.bin.st_inference)
(in module espnet2.bin.st_inference_streaming)
(in module espnet2.bin.st_train)
(in module espnet2.bin.svs_inference)
(in module espnet2.bin.svs_train)
(in module espnet2.bin.tokenize_text)
(in module espnet2.bin.tts_inference)
(in module espnet2.bin.tts_train)
(in module espnet2.bin.uasr_extract_feature)
(in module espnet2.bin.uasr_inference)
(in module espnet2.bin.uasr_inference_k2)
(in module espnet2.bin.uasr_train)
(in module espnet2.bin.whisper_export_vocabulary)
main_worker() (espnet2.tasks.abs_task.AbsTask class method)
MainProcessError
make_adapt_layer() (in module espnet2.enh.layers.adapt_layers)
make_attention_mask() (espnet.nets.chainer_backend.transformer.decoder.Decoder method)
make_batchset() (in module espnet.utils.training.batchfy)
make_chunk_mask() (in module espnet2.asr_transducer.utils)
make_history_mask() (in module espnet.nets.chainer_backend.transformer.mask)
make_lexical_tree() (in module espnet.lm.lm_utils)
make_non_pad_mask() (in module espnet.nets.pytorch_backend.nets_utils)
make_pad_mask() (in module espnet.nets.pytorch_backend.nets_utils)
make_source_mask() (in module espnet2.asr_transducer.utils)
make_unet_encoder_decoder_args() (in module espnet2.enh.layers.dcunet)
MakeSymlinkToBestModel (class in espnet.lm.lm_utils)
marginal_prob() (espnet2.enh.diffusion.sdes.OUVESDE method)
(espnet2.enh.diffusion.sdes.OUVPSDE method)
(espnet2.enh.diffusion.sdes.SDE method)
mask_along_axis() (in module espnet2.layers.mask_along_axis)
mask_by_length() (in module espnet.nets.pytorch_backend.nets_utils)
mask_channel_length (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_channel_min_space (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_channel_other (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_channel_prob (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_channel_selection (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_length_audio (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_length_image (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_min_space (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_other (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_prob_audio (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_prob_image (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_selection (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
mask_type() (espnet2.enh.loss.criterions.tf_domain.FrequencyDomainAbsCoherence property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainCrossEntropy property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainDPCL property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainL1 property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainLoss property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainMSE property)
mask_uniform() (in module espnet.nets.pytorch_backend.maskctc.add_mask_token)
MaskAlongAxis (class in espnet2.layers.mask_along_axis)
MaskAlongAxisVariableMaxWidth (class in espnet2.layers.mask_along_axis)
MaskCTCInference (class in espnet2.asr.maskctc_model)
MaskCTCModel (class in espnet2.asr.maskctc_model)
MaskEstimator (class in espnet.nets.pytorch_backend.frontends.mask_estimator)
(class in espnet2.enh.layers.mask_estimator)
masking_type (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
matmul() (in module espnet2.enh.layers.complex_utils)
matplotlib_plot() (espnet2.train.reporter.Reporter method)
max_num_spk() (espnet2.diar.layers.abs_mask.AbsMask property)
(espnet2.diar.layers.multi_mask.MultiMask property)
max_positions() (espnet2.asr.encoder.avhubert_encoder.TransformerEncoder method)
max_target_positions (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
MAXIMUM (espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce.R_Op attribute)
maximum (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
maximum_path() (in module espnet2.gan_tts.vits.monotonic_align.__init__)
maximum_path_each_numba (in module espnet2.gan_tts.vits.monotonic_align.__init__)
maximum_path_numba (in module espnet2.gan_tts.vits.monotonic_align.__init__)
MDC (class in espnet2.gan_svs.avocodo.__init__)
(class in espnet2.gan_svs.avocodo.avocodo)
MDCDConfig (class in espnet2.gan_svs.avocodo.avocodo)
mean_std_loudness() (in module espnet2.gan_svs.visinger2.ddsp)
MeanPoolConv (class in espnet2.enh.layers.ncsnpp_utils.layers)
MeanPooling (class in espnet2.spk.pooling.mean_pooling)
measure_iter_time() (espnet2.train.reporter.SubReporter method)
measure_time() (espnet2.train.reporter.SubReporter method)
MEGA (class in espnet2.asr_transducer.decoder.blocks.mega)
MEGADecoder (class in espnet2.asr_transducer.decoder.mega_decoder)
MelGANDiscriminator (class in espnet2.gan_tts.melgan.melgan)
MelGANGenerator (class in espnet2.gan_tts.melgan.melgan)
MelGANMultiScaleDiscriminator (class in espnet2.gan_tts.melgan.melgan)
MelScale (class in espnet2.gan_svs.visinger2.visinger2_vocoder)
(class in espnet2.layers.sinc_conv)
MelSpectrogramLoss (class in espnet2.gan_tts.hifigan.loss)
MelSpectrogramTorch (class in espnet2.asr.frontend.melspec_torch)
MemLSTM (class in espnet2.enh.layers.skim)
merge() (espnet2.bin.enh_inference_streaming.SeparateSpeechStreaming method)
merge_feature() (espnet2.enh.separator.dptnet_separator.DPTNetSeparator method)
(in module espnet2.enh.layers.dprnn)
merge_scores() (espnet.nets.beam_search.BeamSearch static method)
merge_states() (espnet.nets.batch_beam_search.BatchBeamSearch method)
(espnet.nets.beam_search.BeamSearch method)
MfaConformerEncoder (class in espnet2.spk.encoder.conformer_encoder)
mfmcwf() (espnet2.enh.separator.ineube_separator.iNeuBe static method)
midi_to_lag() (espnet2.tts.feats_extract.ying.Ying method)
MIDReader (class in espnet2.fileio.score_scp)
min_pit_sample() (espnet.nets.pytorch_backend.e2e_asr_mix.PIT method)
Mish (class in espnet2.asr_transducer.activation)
(class in espnet2.tts.prodiff.denoiser)
MixITSolver (class in espnet2.enh.loss.wrappers.mixit_solver)
MLMDecoder (class in espnet2.asr.decoder.mlm_decoder)
mlp() (in module espnet2.gan_svs.visinger2.ddsp)
modality_dropout (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
modality_fuse (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
modality_fusion() (espnet2.asr.encoder.avhubert_encoder.AVHubertModel method)
model_summary() (in module espnet2.torch_utils.model_summary)
modified_adaptive_expansion_search() (espnet.nets.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer_streaming.BeamSearchTransducerStreaming method)
(espnet2.asr_transducer.beam_search_transducer.BeamSearchTransducer method)
MSFBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
MTInterface (class in espnet.nets.mt_interface)
MTTask (class in espnet2.tasks.mt)
MulAddAdaptLayer (class in espnet2.enh.layers.adapt_layers)
MulCatBlock (class in espnet2.enh.layers.dpmulcat)
multi_blank_greedy_search() (espnet2.asr.transducer.beam_search_transducer.BeamSearchTransducer method)
multi_columns_sound_loader() (in module espnet2.train.dataset)
multiblank_rnnt_loss_gpu() (in module espnet2.asr.transducer.rnnt_multi_blank.rnnt)
MultiblankGPURNNT (class in espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt)
MultiblankRNNTLossNumba (class in espnet2.asr.transducer.rnnt_multi_blank.rnnt_multi_blank)
MultiBlocks (class in espnet2.asr_transducer.encoder.modules.multi_blocks)
MultiFrequencyDiscriminator (class in espnet2.gan_svs.visinger2.visinger2_vocoder)
MultiHeadAttention (class in espnet.nets.chainer_backend.transformer.attention)
(class in espnet2.s2st.aux_attention.multihead)
MultiHeadDampedEMA (class in espnet2.asr_transducer.decoder.modules.mega.multi_head_damped_ema)
MultiHeadedAttention (class in espnet.nets.pytorch_backend.transformer.attention)
(class in espnet2.asr.state_spaces.attention)
(class in espnet2.tts.gst.style_encoder)
MultiLayeredConv1d (class in espnet.nets.pytorch_backend.transformer.multi_layer_conv)
MultiLayerPITSolver (class in espnet2.enh.loss.wrappers.multilayer_pit_solver)
MultiLevelLM (class in espnet.lm.chainer_backend.extlm)
(class in espnet.lm.pytorch_backend.extlm)
MultiMask (class in espnet2.diar.layers.multi_mask)
MultipleIterFactory (class in espnet2.iterators.multiple_iter_factory)
multiprocessing_distributed (espnet2.train.distributed_utils.DistributedOption attribute)
MultiResL1SpecLoss (class in espnet2.enh.loss.criterions.time_domain)
multiscale_fft() (in module espnet2.gan_svs.visinger2.ddsp)
MultiSequential (class in espnet.nets.pytorch_backend.transformer.repeat)
MultiSoundScpReader (class in espnet2.fileio.multi_sound_scp)
MutliTokenizerCommonPreprocessor (class in espnet2.train.preprocessor)
N
naive_downsample_2d() (in module espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling)
naive_upsample_2d() (in module espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling)
NaiveRNN (class in espnet2.svs.naive_rnn.naive_rnn)
NaiveRNNDP (class in espnet2.svs.naive_rnn.naive_rnn_dp)
NaiveRNNLoss (class in espnet2.svs.naive_rnn.naive_rnn)
name (espnet2.bin.asr_align.CTCSegmentationTask attribute)
name() (espnet2.asvspoof.loss.abs_loss.AbsASVSpoofLoss property)
(espnet2.enh.loss.criterions.abs_loss.AbsEnhLoss property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainLoss property)
(espnet2.enh.loss.criterions.time_domain.MultiResL1SpecLoss property)
(espnet2.enh.loss.criterions.time_domain.TimeDomainLoss property)
(espnet2.enh.loss.wrappers.mixit_solver.MixITSolver property)
(espnet2.s2st.aux_attention.abs_aux_attention.AbsS2STAuxAttention property)
(espnet2.s2st.losses.abs_loss.AbsS2STLoss property)
(espnet2.uasr.loss.abs_loss.AbsUASRLoss property)
names() (espnet2.train.dataset.AbsDataset method)
(espnet2.train.dataset.ESPnetDataset method)
(espnet2.train.iterable_dataset.IterableESPnetDataset method)
NavieComplexLSTM (class in espnet2.enh.layers.complexnn)
ncsn_conv1x1() (in module espnet2.enh.layers.ncsnpp_utils.layers)
ncsn_conv3x3() (in module espnet2.enh.layers.ncsnpp_utils.layers)
NCSNpp (class in espnet2.enh.layers.ncsnpp)
negate (in module espnet2.asr.transducer.rnnt_multi_blank.utils.rnnt_helper)
NestedDictAction (class in espnet2.utils.nested_dict_action)
NeuralBeamformer (class in espnet2.enh.separator.neural_beamformer)
new_complex_like() (in module espnet2.enh.layers.complex_utils)
next() (espnet.utils.dataset.ChainerDataLoader method)
(espnet2.train.reporter.SubReporter method)
ngpu (espnet2.train.distributed_utils.DistributedOption attribute)
Ngrambase (class in espnet.nets.scorers.ngram)
NgramFullScorer (class in espnet.nets.scorers.ngram)
NgramPartScorer (class in espnet.nets.scorers.ngram)
NIN (class in espnet2.enh.layers.ncsnpp_utils.layers)
nll() (espnet2.asr.espnet_model.ESPnetASRModel method)
(espnet2.asr.maskctc_model.MaskCTCModel method)
(espnet2.enh.espnet_enh_s2t_model.ESPnetEnhS2TModel method)
(espnet2.lm.espnet_model.ESPnetLanguageModel method)
(espnet2.lm.espnet_model_multitask.ESPnetMultitaskLanguageModel method)
no_mask_channel_overlap (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
no_mask_overlap (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
no_scale_embedding (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
no_token_positional_embeddings (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
NoAliasSafeDumper (class in espnet2.utils.yaml_no_alias_safe_dump)
NoamLR (class in espnet2.schedulers.noam_lr)
NoamOpt (class in espnet.nets.pytorch_backend.transformer.optimizer)
NoamScheduler (class in espnet.scheduler.scheduler)
NoAtt (class in espnet.nets.chainer_backend.rnn.attentions)
(class in espnet.nets.pytorch_backend.rnn.attentions)
noise_scheduler() (in module espnet2.tts.prodiff.denoiser)
NoiseInjection (class in espnet.transform.perturb)
none_window() (espnet2.layers.sinc_conv.SincConv static method)
NoneCorrector (class in espnet2.enh.diffusion.sampling.correctors)
NoneNorm2d (class in espnet2.enh.layers.ncsnpp_utils.normalization)
NonePredictor (class in espnet2.enh.diffusion.sampling.predictors)
Normalization (class in espnet2.asr.state_spaces.components)
normalize_text() (espnet2.text.korean_cleaner.KoreanCleaner class method)
normalize_variance (espnet2.enh.loss.criterions.time_domain.MultiResL1SpecLoss attribute)
NormalizedPositionwiseFeedForward (class in espnet2.asr_transducer.decoder.modules.mega.feed_forward)
NoScheduler (class in espnet.scheduler.scheduler)
NOTE (class in espnet2.fileio.score_scp)
nplr() (in module espnet2.asr.state_spaces.s4)
NpyScpReader (class in espnet2.fileio.npy_scp)
NpyScpWriter (class in espnet2.fileio.npy_scp)
nsc_beam_search() (espnet.nets.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer_streaming.BeamSearchTransducerStreaming method)
NullDecoder (class in espnet2.enh.decoder.null_decoder)
NullEncoder (class in espnet2.enh.encoder.null_encoder)
num2tuple() (in module espnet2.enh.layers.conv_utils)
num_optimizers (espnet2.tasks.abs_task.AbsTask attribute)
(espnet2.tasks.asr.ASRTask attribute)
(espnet2.tasks.asr_transducer.ASRTransducerTask attribute)
(espnet2.tasks.asvspoof.ASVSpoofTask attribute)
(espnet2.tasks.diar.DiarizationTask attribute)
(espnet2.tasks.enh.EnhancementTask attribute)
(espnet2.tasks.enh_s2t.EnhS2TTask attribute)
(espnet2.tasks.enh_tse.TargetSpeakerExtractionTask attribute)
(espnet2.tasks.gan_svs.GANSVSTask attribute)
(espnet2.tasks.gan_tts.GANTTSTask attribute)
(espnet2.tasks.hubert.HubertTask attribute)
(espnet2.tasks.lm.LMTask attribute)
(espnet2.tasks.mt.MTTask attribute)
(espnet2.tasks.s2st.S2STTask attribute)
(espnet2.tasks.s2t.S2TTask attribute)
(espnet2.tasks.slu.SLUTask attribute)
(espnet2.tasks.spk.SpeakerTask attribute)
(espnet2.tasks.st.STTask attribute)
(espnet2.tasks.svs.SVSTask attribute)
(espnet2.tasks.tts.TTSTask attribute)
(espnet2.tasks.uasr.UASRTask attribute)
num_spk() (espnet2.diar.decoder.abs_decoder.AbsDecoder property)
(espnet2.diar.decoder.linear_decoder.LinearDecoder property)
(espnet2.diar.separator.tcn_separator_nomask.TCNSeparatorNomask property)
(espnet2.enh.separator.abs_separator.AbsSeparator property)
(espnet2.enh.separator.asteroid_models.AsteroidModel_Converter property)
(espnet2.enh.separator.conformer_separator.ConformerSeparator property)
(espnet2.enh.separator.dan_separator.DANSeparator property)
(espnet2.enh.separator.dc_crn_separator.DC_CRNSeparator property)
(espnet2.enh.separator.dccrn_separator.DCCRNSeparator property)
(espnet2.enh.separator.dpcl_e2e_separator.DPCLE2ESeparator property)
(espnet2.enh.separator.dpcl_separator.DPCLSeparator property)
(espnet2.enh.separator.dprnn_separator.DPRNNSeparator property)
(espnet2.enh.separator.dptnet_separator.DPTNetSeparator property)
(espnet2.enh.separator.fasnet_separator.FaSNetSeparator property)
(espnet2.enh.separator.ineube_separator.iNeuBe property)
(espnet2.enh.separator.neural_beamformer.NeuralBeamformer property)
(espnet2.enh.separator.rnn_separator.RNNSeparator property)
(espnet2.enh.separator.skim_separator.SkiMSeparator property)
(espnet2.enh.separator.svoice_separator.SVoiceSeparator property)
(espnet2.enh.separator.tcn_separator.TCNSeparator property)
(espnet2.enh.separator.tfgridnet_separator.TFGridNet property)
(espnet2.enh.separator.tfgridnetv2_separator.TFGridNetV2 property)
(espnet2.enh.separator.transformer_separator.TransformerSeparator property)
(espnet2.enh.separator.uses_separator.USESSeparator property)
number_updates() (espnet2.uasr.espnet_model.ESPnetUASRModel property)
NumElementsBatchSampler (class in espnet2.samplers.num_elements_batch_sampler)
O
observe() (espnet2.train.reporter.Reporter method)
omegaconf_filter_keys() (in module espnet2.asr.state_spaces.utils)
OneHot (class in espnet.nets.pytorch_backend.wavenet)
OnlineAudioProcessor (class in espnet2.asr_transducer.frontend.online_audio_processor)
only_for_test() (espnet2.enh.loss.criterions.abs_loss.AbsEnhLoss property)
(espnet2.enh.loss.criterions.tf_domain.FrequencyDomainLoss property)
(espnet2.enh.loss.criterions.time_domain.TimeDomainLoss property)
OnReIm (class in espnet2.enh.layers.dcunet)
OpenAIWhisperDecoder (class in espnet2.asr.decoder.whisper_decoder)
OpenAIWhisperEncoder (class in espnet2.asr.encoder.whisper_encoder)
OpenAIWhisperTokenIDConverter (class in espnet2.text.whisper_token_id_converter)
OpenAIWhisperTokenizer (class in espnet2.text.whisper_tokenizer)
OptimizerFactoryInterface (class in espnet.optimizer.factory)
OptimModule (class in espnet2.asr.state_spaces.s4)
optional_data_names() (espnet2.tasks.abs_task.AbsTask class method)
(espnet2.tasks.asr.ASRTask class method)
(espnet2.tasks.asr_transducer.ASRTransducerTask class method)
(espnet2.tasks.asvspoof.ASVSpoofTask class method)
(espnet2.tasks.diar.DiarizationTask class method)
(espnet2.tasks.enh.EnhancementTask class method)
(espnet2.tasks.enh_s2t.EnhS2TTask class method)
(espnet2.tasks.enh_tse.TargetSpeakerExtractionTask class method)
(espnet2.tasks.gan_svs.GANSVSTask class method)
(espnet2.tasks.gan_tts.GANTTSTask class method)
(espnet2.tasks.hubert.HubertTask class method)
(espnet2.tasks.lm.LMTask class method)
(espnet2.tasks.mt.MTTask class method)
(espnet2.tasks.s2st.S2STTask class method)
(espnet2.tasks.s2t.S2TTask class method)
(espnet2.tasks.slu.SLUTask class method)
(espnet2.tasks.spk.SpeakerTask class method)
(espnet2.tasks.st.STTask class method)
(espnet2.tasks.svs.SVSTask class method)
(espnet2.tasks.tts.TTSTask class method)
(espnet2.tasks.uasr.UASRTask class method)
output_dim() (espnet2.diar.separator.tcn_separator_nomask.TCNSeparatorNomask property)
(espnet2.enh.encoder.abs_encoder.AbsEncoder property)
(espnet2.enh.encoder.conv_encoder.ConvEncoder property)
(espnet2.enh.encoder.null_encoder.NullEncoder property)
(espnet2.enh.encoder.stft_encoder.STFTEncoder property)
output_size() (espnet2.asr.encoder.abs_encoder.AbsEncoder method)
(espnet2.asr.encoder.avhubert_encoder.FairseqAVHubertEncoder method)
(espnet2.asr.encoder.branchformer_encoder.BranchformerEncoder method)
(espnet2.asr.encoder.conformer_encoder.ConformerEncoder method)
(espnet2.asr.encoder.contextual_block_conformer_encoder.ContextualBlockConformerEncoder method)
(espnet2.asr.encoder.contextual_block_transformer_encoder.ContextualBlockTransformerEncoder method)
(espnet2.asr.encoder.e_branchformer_encoder.EBranchformerEncoder method)
(espnet2.asr.encoder.hubert_encoder.FairseqHubertEncoder method)
(espnet2.asr.encoder.hubert_encoder.FairseqHubertPretrainEncoder method)
(espnet2.asr.encoder.hubert_encoder.TorchAudioHuBERTPretrainEncoder method)
(espnet2.asr.encoder.hugging_face_transformers_encoder.HuggingFaceTransformersEncoder method)
(espnet2.asr.encoder.linear_encoder.LinearEncoder method)
(espnet2.asr.encoder.longformer_encoder.LongformerEncoder method)
(espnet2.asr.encoder.rnn_encoder.RNNEncoder method)
(espnet2.asr.encoder.transformer_encoder.TransformerEncoder method)
(espnet2.asr.encoder.transformer_encoder_multispkr.TransformerEncoder method)
(espnet2.asr.encoder.vgg_rnn_encoder.VGGRNNEncoder method)
(espnet2.asr.encoder.wav2vec2_encoder.FairSeqWav2Vec2Encoder method)
(espnet2.asr.encoder.whisper_encoder.OpenAIWhisperEncoder method)
(espnet2.asr.frontend.abs_frontend.AbsFrontend method)
(espnet2.asr.frontend.asteroid_frontend.AsteroidFrontend method)
(espnet2.asr.frontend.default.DefaultFrontend method)
(espnet2.asr.frontend.fused.FusedFrontends method)
(espnet2.asr.frontend.melspec_torch.MelSpectrogramTorch method)
(espnet2.asr.frontend.s3prl.S3prlFrontend method)
(espnet2.asr.frontend.whisper.WhisperFrontend method)
(espnet2.asr.frontend.windowing.SlidingWindow method)
(espnet2.asr.postencoder.abs_postencoder.AbsPostEncoder method)
(espnet2.asr.postencoder.hugging_face_transformers_postencoder.HuggingFaceTransformersPostEncoder method)
(espnet2.asr.postencoder.length_adaptor_postencoder.LengthAdaptorPostEncoder method)
(espnet2.asr.preencoder.abs_preencoder.AbsPreEncoder method)
(espnet2.asr.preencoder.linear.LinearProjection method)
(espnet2.asr.preencoder.sinc.LightweightSincConvs method)
(espnet2.mt.frontend.embedding.Embedding method)
(espnet2.s2st.tgt_feats_extract.abs_tgt_feats_extract.AbsTgtFeatsExtract method)
(espnet2.s2st.tgt_feats_extract.linear_spectrogram.LinearSpectrogram method)
(espnet2.s2st.tgt_feats_extract.log_mel_fbank.LogMelFbank method)
(espnet2.s2st.tgt_feats_extract.log_spectrogram.LogSpectrogram method)
(espnet2.slu.postdecoder.abs_postdecoder.AbsPostDecoder method)
(espnet2.slu.postdecoder.hugging_face_transformers_postdecoder.HuggingFaceTransformersPostDecoder method)
(espnet2.slu.postencoder.conformer_postencoder.ConformerPostEncoder method)
(espnet2.slu.postencoder.transformer_postencoder.TransformerPostEncoder method)
(espnet2.spk.encoder.conformer_encoder.MfaConformerEncoder method)
(espnet2.spk.encoder.ecapa_tdnn_encoder.EcapaTdnnEncoder method)
(espnet2.spk.encoder.identity_encoder.IdentityEncoder method)
(espnet2.spk.encoder.rawnet3_encoder.RawNet3Encoder method)
(espnet2.spk.encoder.ska_tdnn_encoder.SkaTdnnEncoder method)
(espnet2.spk.encoder.xvector_encoder.XvectorEncoder method)
(espnet2.spk.pooling.abs_pooling.AbsPooling method)
(espnet2.spk.pooling.chn_attn_stat_pooling.ChnAttnStatPooling method)
(espnet2.spk.pooling.mean_pooling.MeanPooling method)
(espnet2.spk.pooling.stat_pooling.StatsPooling method)
(espnet2.spk.projector.abs_projector.AbsProjector method)
(espnet2.spk.projector.rawnet3_projector.RawNet3Projector method)
(espnet2.spk.projector.ska_tdnn_projector.SkaTdnnProjector method)
(espnet2.spk.projector.xvector_projector.XvectorProjector method)
(espnet2.svs.feats_extract.score_feats_extract.FrameScoreFeats method)
(espnet2.svs.feats_extract.score_feats_extract.SyllableScoreFeats method)
(espnet2.tts.feats_extract.abs_feats_extract.AbsFeatsExtract method)
(espnet2.tts.feats_extract.dio.Dio method)
(espnet2.tts.feats_extract.energy.Energy method)
(espnet2.tts.feats_extract.linear_spectrogram.LinearSpectrogram method)
(espnet2.tts.feats_extract.log_mel_fbank.LogMelFbank method)
(espnet2.tts.feats_extract.log_spectrogram.LogSpectrogram method)
(espnet2.tts.feats_extract.ying.Ying method)
(espnet2.uasr.generator.abs_generator.AbsGenerator method)
(espnet2.uasr.generator.conv_generator.ConvGenerator method)
OUVESDE (class in espnet2.enh.diffusion.sdes)
OUVPSDE (class in espnet2.enh.diffusion.sdes)
overlap_and_add() (in module espnet2.enh.separator.svoice_separator)
P
pack() (in module espnet2.main_funcs.pack_funcs)
PackedContents (class in espnet2.bin.pack)
pad2() (espnet2.enh.separator.ineube_separator.iNeuBe static method)
(espnet2.enh.separator.tfgridnet_separator.TFGridNet static method)
(espnet2.enh.separator.tfgridnetv2_separator.TFGridNetV2 static method)
pad_input() (espnet2.enh.layers.fasnet.FaSNet_base method)
pad_list() (in module espnet.nets.pytorch_backend.nets_utils)
pad_or_trim() (espnet2.asr.encoder.whisper_encoder.OpenAIWhisperEncoder method)
pad_sequence() (in module espnet.nets.pytorch_backend.transducer.utils)
pad_spec() (espnet2.enh.layers.ncsnpp.NCSNpp method)
pad_to_same_length() (espnet2.fileio.multi_sound_scp.MultiSoundScpReader method)
ParallelSentenceIterator (class in espnet.lm.lm_utils)
ParallelWaveGANDiscriminator (class in espnet2.gan_tts.parallel_wavegan.__init__)
(class in espnet2.gan_tts.parallel_wavegan.parallel_wavegan)
ParallelWaveGANGenerator (class in espnet2.gan_tts.parallel_wavegan.__init__)
(class in espnet2.gan_tts.parallel_wavegan.parallel_wavegan)
ParallelWaveGANPretrainedVocoder (class in espnet2.tts.utils.__init__)
(class in espnet2.tts.utils.parallel_wavegan_pretrained_vocoder)
param_groups() (espnet.nets.pytorch_backend.transformer.optimizer.NoamOpt property)
parse_hypothesis() (in module espnet.asr.asr_utils)
(in module espnet.mt.mt_utils)
parse_known_args() (espnet2.utils.config_argparse.ArgumentParser method)
parse_wspecifier() (in module espnet.utils.cli_writers)
PartialScorerInterface (class in espnet.nets.scorer_interface)
perform_filter_operation() (in module espnet2.enh.layers.wpe)
perform_WPD_filtering() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
permutate() (espnet2.asr.pit_espnet_model.PITLossWrapper class method)
permutation_invariant_training() (espnet2.enh.espnet_enh_s2t_model.ESPnetEnhS2TModel method)
permutationDFS() (espnet.nets.pytorch_backend.e2e_asr_mix.PIT method)
permute_diar() (espnet2.bin.diar_inference.DiarizeSpeech method)
phi() (in module espnet.utils.spec_augment)
PhonemePredictor (class in espnet2.gan_svs.vits.phoneme_predictor)
PhonemeTokenizer (class in espnet2.text.phoneme_tokenizer)
Phonemizer (class in espnet2.text.phoneme_tokenizer)
piecewise_rational_quadratic_transform() (in module espnet2.gan_tts.vits.transform)
PiecewiseLinearWarmupLR (class in espnet2.schedulers.piecewise_linear_warmup_lr)
PIT (class in espnet.nets.pytorch_backend.e2e_asr_mix)
pit_loss() (espnet2.diar.espnet_model.ESPnetDiarizationModel method)
pit_loss_single_permute() (espnet2.diar.espnet_model.ESPnetDiarizationModel method)
pit_process() (espnet.nets.pytorch_backend.e2e_asr_mix.PIT method)
pitch_shift() (in module espnet2.layers.augmentation)
PITLossWrapper (class in espnet2.asr.pit_espnet_model)
PITSolver (class in espnet2.enh.loss.wrappers.pit_solver)
plot_attention() (espnet2.train.trainer.Trainer class method)
plot_multi_head_attention() (in module espnet.nets.pytorch_backend.transformer.plot)
plot_spectrogram() (in module espnet.asr.asr_utils)
PlotAttentionReport (class in espnet.asr.asr_mix_utils)
(class in espnet.asr.asr_utils)
(class in espnet.nets.pytorch_backend.transformer.plot)
PlotCTCReport (class in espnet.asr.asr_utils)
plotfn() (espnet.nets.pytorch_backend.e2e_tts_transformer.TTSPlot method)
(espnet.nets.pytorch_backend.transformer.plot.PlotAttentionReport method)
polarity_inverse() (in module espnet2.layers.augmentation)
poly1d() (in module espnet2.enh.layers.dnsmos)
PositionalEncoding (class in espnet.nets.chainer_backend.transformer.embedding)
(class in espnet.nets.pytorch_backend.transformer.embedding)
PositionwiseFeedForward (class in espnet.nets.chainer_backend.transformer.positionwise_feed_forward)
(class in espnet.nets.pytorch_backend.transformer.positionwise_feed_forward)
post_process() (espnet.nets.batch_beam_search.BatchBeamSearch method)
(espnet.nets.beam_search.BeamSearch method)
PosteriorEncoder (class in espnet2.gan_tts.vits.posterior_encoder)
Postnet (class in espnet.nets.pytorch_backend.tacotron2.decoder)
power() (in module espnet2.asr.state_spaces.s4)
PQMF (class in espnet2.gan_tts.melgan.pqmf)
pre_segment() (espnet2.uasr.segmenter.abs_segmenter.AbsSegmenter method)
(espnet2.uasr.segmenter.join_segmenter.JoinSegmenter method)
(espnet2.uasr.segmenter.random_segmenter.RandomSegmenter method)
predict() (espnet.lm.chainer_backend.lm.ClassifierWithState method)
(espnet.nets.pytorch_backend.lm.default.ClassifierWithState method)
predict_mask() (espnet2.enh.layers.dnn_beamformer.DNN_Beamformer method)
(espnet2.enh.layers.dnn_wpe.DNN_WPE method)
Predictor (class in espnet2.enh.diffusion.sampling.__init__)
(class in espnet2.enh.diffusion.sampling.predictors)
preemphasis() (in module espnet2.layers.augmentation)
prefix_search() (espnet.nets.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer_streaming.BeamSearchTransducerStreaming method)
Prenet (class in espnet.nets.pytorch_backend.tacotron2.decoder)
(class in espnet2.s2st.synthesizer.translatotron2)
prepare_beamformer_stats() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
prepare_body_model() (in module espnet.nets.pytorch_backend.transducer.blocks)
prepare_input_layer() (in module espnet.nets.pytorch_backend.transducer.blocks)
prepare_segmentation_task() (espnet2.bin.asr_align.CTCSegmentation method)
previous_epoch_detail() (espnet.lm.lm_utils.ParallelSentenceIterator property)
print_confidence_score (espnet2.bin.asr_align.CTCSegmentationTask attribute)
print_config() (espnet2.tasks.abs_task.AbsTask class method)
print_utterance_text (espnet2.bin.asr_align.CTCSegmentationTask attribute)
prior_logp() (espnet2.enh.diffusion.sdes.OUVESDE method)
(espnet2.enh.diffusion.sdes.OUVPSDE method)
(espnet2.enh.diffusion.sdes.SDE method)
prior_sampling() (espnet2.enh.diffusion.sdes.OUVESDE method)
(espnet2.enh.diffusion.sdes.OUVPSDE method)
(espnet2.enh.diffusion.sdes.SDE method)
PriorDecoder (class in espnet2.gan_svs.vits.prior_decoder)
process_one_block() (espnet.nets.batch_beam_search_online.BatchBeamSearchOnline method)
process_one_block_time_sync() (espnet.nets.batch_beam_search_online.BatchBeamSearchOnline method)
ProDiff (class in espnet2.tts.prodiff.prodiff)
ProDiffLoss (class in espnet2.tts.prodiff.loss)
project_spk_embd() (espnet2.spk.espnet_model.ESPnetSpeakerModel method)
Projection (class in espnet2.gan_svs.vits.modules)
PUNC (espnet2.text.phoneme_tokenizer.Jaso attribute)
pyopenjtalk_g2p() (in module espnet2.text.phoneme_tokenizer)
pyopenjtalk_g2p_accent() (in module espnet2.text.phoneme_tokenizer)
pyopenjtalk_g2p_accent_with_pause() (in module espnet2.text.phoneme_tokenizer)
pyopenjtalk_g2p_kana() (in module espnet2.text.phoneme_tokenizer)
pyopenjtalk_g2p_prosody() (in module espnet2.text.phoneme_tokenizer)
pypinyin_g2p() (in module espnet2.text.phoneme_tokenizer)
pypinyin_g2p_phone() (in module espnet2.text.phoneme_tokenizer)
pypinyin_g2p_phone_without_prosody() (in module espnet2.text.phoneme_tokenizer)
pytorch_cudnn_version() (in module espnet2.torch_utils.pytorch_version)
PyTorchScheduler (class in espnet.scheduler.pytorch)
R
R_Op (class in espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce)
rand_int_loader() (in module espnet2.train.dataset)
RandomSegmenter (class in espnet2.uasr.segmenter.random_segmenter)
RandomTextReader (class in espnet2.fileio.read_text)
rank_correction() (in module espnet2.asr.state_spaces.s4)
rank_zero_only() (in module espnet2.asr.state_spaces.s4)
rate() (espnet.nets.pytorch_backend.transformer.optimizer.NoamOpt method)
rational_quadratic_spline() (in module espnet2.gan_tts.vits.transform)
RawNet3Encoder (class in espnet2.spk.encoder.rawnet3_encoder)
RawNet3Projector (class in espnet2.spk.projector.rawnet3_projector)
RawSampler (class in espnet2.iterators.category_iter_factory)
(class in espnet2.iterators.sequence_iter_factory)
RCUBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
read_2columns_text() (in module espnet2.fileio.read_text)
read_audio() (in module espnet2.bin.enh_scoring)
read_label() (in module espnet2.fileio.read_text)
read_multi_columns_text() (in module espnet2.fileio.read_text)
read_tokens() (in module espnet.lm.lm_utils)
receptive_field_size() (espnet2.gan_tts.parallel_wavegan.__init__.ParallelWaveGANGenerator property)
(espnet2.gan_tts.parallel_wavegan.parallel_wavegan.ParallelWaveGANGenerator property)
(espnet2.gan_tts.wavenet.wavenet.WaveNet property)
recog() (espnet.nets.pytorch_backend.e2e_asr_mix_transformer.E2E method)
(in module espnet.asr.chainer_backend.asr)
(in module espnet.asr.pytorch_backend.asr)
(in module espnet.asr.pytorch_backend.asr_mix)
recog_v2() (in module espnet.asr.pytorch_backend.recog)
recognize() (espnet.nets.asr_interface.ASRInterface method)
(espnet.nets.chainer_backend.e2e_asr.E2E method)
(espnet.nets.chainer_backend.e2e_asr_transformer.E2E method)
(espnet.nets.chainer_backend.transformer.decoder.Decoder method)
(espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_maskctc.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transducer.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E method)
recognize_batch() (espnet.nets.asr_interface.ASRInterface method)
(espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mix.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E method)
recognize_beam() (espnet.nets.chainer_backend.e2e_asr_transformer.E2E method)
(espnet.nets.chainer_backend.rnn.decoders.Decoder method)
(espnet.nets.pytorch_backend.rnn.decoders.Decoder method)
recognize_beam_batch() (espnet.nets.pytorch_backend.rnn.decoders.Decoder method)
recombine_hyps() (espnet2.asr_transducer.beam_search_transducer.BeamSearchTransducer method)
(in module espnet.nets.pytorch_backend.transducer.utils)
recursive_average() (in module espnet2.torch_utils.recursive_op)
recursive_dict_update() (in module espnet2.bin.enh_inference)
(in module espnet2.bin.enh_tse_inference)
recursive_divide() (in module espnet2.torch_utils.recursive_op)
recursive_sum() (in module espnet2.torch_utils.recursive_op)
reduce_exp() (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce)
reduce_max() (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce)
ReduceHelper() (in module espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.reduce)
reduction (espnet2.enh.loss.criterions.time_domain.MultiResL1SpecLoss attribute)
ReferenceEncoder (class in espnet2.tts.gst.style_encoder)
RefineBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
register() (espnet2.asr.state_spaces.s4.OptimModule method)
(espnet2.train.reporter.SubReporter method)
register_scheduler() (in module espnet.scheduler.scheduler)
register_stats() (espnet2.gan_svs.uhifigan.__init__.UHiFiGANGenerator method)
(espnet2.gan_svs.uhifigan.uhifigan.UHiFiGANGenerator method)
rel_shift() (espnet.nets.pytorch_backend.transformer.attention.LegacyRelPositionMultiHeadedAttention method)
(espnet.nets.pytorch_backend.transformer.attention.RelPositionMultiHeadedAttention method)
(espnet2.asr_transducer.encoder.modules.attention.RelPositionMultiHeadedAttention method)
RelativePositionBias (class in espnet2.asr_transducer.decoder.modules.mega.positional_bias)
reload_pretrained_parameters() (espnet2.asr.decoder.hugging_face_transformers_decoder.HuggingFaceTransformersDecoder method)
(espnet2.asr.encoder.avhubert_encoder.FairseqAVHubertEncoder method)
(espnet2.asr.encoder.hubert_encoder.FairseqHubertEncoder method)
(espnet2.asr.encoder.hubert_encoder.FairseqHubertPretrainEncoder method)
(espnet2.asr.encoder.hubert_encoder.TorchAudioHuBERTPretrainEncoder method)
(espnet2.asr.encoder.hugging_face_transformers_encoder.HuggingFaceTransformersEncoder method)
(espnet2.asr.encoder.wav2vec2_encoder.FairSeqWav2Vec2Encoder method)
(espnet2.asr.frontend.s3prl.S3prlFrontend method)
(espnet2.asr.postencoder.hugging_face_transformers_postencoder.HuggingFaceTransformersPostEncoder method)
(espnet2.lm.huggingface_pretrained_opt_lm.HuggingfaceOPTModel method)
RelPositionalEncoding (class in espnet.nets.pytorch_backend.transformer.embedding)
(class in espnet2.asr_transducer.encoder.modules.positional_encoding)
RelPositionMultiHeadedAttention (class in espnet.nets.pytorch_backend.transformer.attention)
(class in espnet2.asr_transducer.encoder.modules.attention)
remove_above_nyquist() (in module espnet2.gan_svs.visinger2.ddsp)
remove_parenthesis() (in module espnet2.utils.types)
remove_quotes() (in module espnet2.utils.types)
remove_spectral_norm() (espnet2.gan_tts.hifigan.__init__.HiFiGANScaleDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANScaleDiscriminator method)
remove_weight_norm() (espnet2.gan_svs.avocodo.__init__.AvocodoGenerator method)
(espnet2.gan_svs.avocodo.avocodo.AvocodoGenerator method)
(espnet2.gan_svs.pits.modules.WN method)
(espnet2.gan_svs.uhifigan.__init__.UHiFiGANGenerator method)
(espnet2.gan_svs.uhifigan.uhifigan.UHiFiGANGenerator method)
(espnet2.gan_svs.visinger2.__init__.VISinger2VocoderGenerator method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.VISinger2VocoderGenerator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANGenerator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANScaleDiscriminator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANGenerator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANScaleDiscriminator method)
(espnet2.gan_tts.melgan.melgan.MelGANGenerator method)
(espnet2.gan_tts.melgan.melgan.MelGANMultiScaleDiscriminator method)
(espnet2.gan_tts.parallel_wavegan.__init__.ParallelWaveGANDiscriminator method)
(espnet2.gan_tts.parallel_wavegan.__init__.ParallelWaveGANGenerator method)
(espnet2.gan_tts.parallel_wavegan.parallel_wavegan.ParallelWaveGANDiscriminator method)
(espnet2.gan_tts.parallel_wavegan.parallel_wavegan.ParallelWaveGANGenerator method)
(espnet2.gan_tts.style_melgan.style_melgan.StyleMelGANGenerator method)
(espnet2.gan_tts.wavenet.wavenet.WaveNet method)
rename_state_dict() (in module espnet.nets.pytorch_backend.nets_utils)
repeat() (in module espnet.nets.pytorch_backend.transformer.repeat)
replace_module() (in module espnet2.layers.create_adapter_utils)
report() (espnet.lm.pytorch_backend.lm.Reporter method)
(espnet.nets.pytorch_backend.e2e_asr.Reporter method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.Reporter method)
(espnet.nets.pytorch_backend.e2e_asr_transducer.Reporter method)
(espnet.nets.pytorch_backend.e2e_mt.Reporter method)
(espnet.nets.pytorch_backend.e2e_st.Reporter method)
(espnet.nets.tts_interface.Reporter method)
ReportedValue (class in espnet2.train.reporter)
Reporter (class in espnet.lm.pytorch_backend.lm)
(class in espnet.nets.pytorch_backend.e2e_asr)
(class in espnet.nets.pytorch_backend.e2e_asr_mulenc)
(class in espnet.nets.pytorch_backend.e2e_asr_transducer)
(class in espnet.nets.pytorch_backend.e2e_mt)
(class in espnet.nets.pytorch_backend.e2e_st)
(class in espnet.nets.tts_interface)
(class in espnet2.train.reporter)
require_raw_singing() (espnet2.gan_svs.joint.joint_score2wav.JointScore2Wav property)
(espnet2.gan_svs.vits.vits.VITS property)
(espnet2.svs.abs_svs.AbsSVS property)
require_raw_speech() (espnet2.gan_tts.jets.jets.JETS property)
(espnet2.gan_tts.joint.joint_text2wav.JointText2Wav property)
(espnet2.gan_tts.vits.vits.VITS property)
(espnet2.s2st.synthesizer.abs_synthesizer.AbsSynthesizer property)
(espnet2.tts.abs_tts.AbsTTS property)
require_vocoder() (espnet2.gan_svs.joint.joint_score2wav.JointScore2Wav property)
(espnet2.gan_svs.vits.vits.VITS property)
(espnet2.gan_tts.jets.jets.JETS property)
(espnet2.gan_tts.joint.joint_text2wav.JointText2Wav property)
(espnet2.gan_tts.vits.vits.VITS property)
(espnet2.s2st.espnet_model.ESPnetS2STModel property)
(espnet2.s2st.synthesizer.abs_synthesizer.AbsSynthesizer property)
(espnet2.svs.abs_svs.AbsSVS property)
(espnet2.tts.abs_tts.AbsTTS property)
required_data_names() (espnet2.tasks.abs_task.AbsTask class method)
(espnet2.tasks.asr.ASRTask class method)
(espnet2.tasks.asr_transducer.ASRTransducerTask class method)
(espnet2.tasks.asvspoof.ASVSpoofTask class method)
(espnet2.tasks.diar.DiarizationTask class method)
(espnet2.tasks.enh.EnhancementTask class method)
(espnet2.tasks.enh_s2t.EnhS2TTask class method)
(espnet2.tasks.enh_tse.TargetSpeakerExtractionTask class method)
(espnet2.tasks.gan_svs.GANSVSTask class method)
(espnet2.tasks.gan_tts.GANTTSTask class method)
(espnet2.tasks.hubert.HubertTask class method)
(espnet2.tasks.lm.LMTask class method)
(espnet2.tasks.mt.MTTask class method)
(espnet2.tasks.s2st.S2STTask class method)
(espnet2.tasks.s2t.S2TTask class method)
(espnet2.tasks.slu.SLUTask class method)
(espnet2.tasks.spk.SpeakerTask class method)
(espnet2.tasks.st.STTask class method)
(espnet2.tasks.svs.SVSTask class method)
(espnet2.tasks.tts.TTSTask class method)
(espnet2.tasks.uasr.UASRTask class method)
resample() (in module espnet2.gan_svs.visinger2.ddsp)
ResBlock (class in espnet2.spk.encoder.ska_tdnn_encoder)
ResEncoder (class in espnet2.asr.encoder.avhubert_encoder)
reset() (espnet.nets.batch_beam_search_online.BatchBeamSearchOnline method)
(espnet.nets.beam_search_timesync.BeamSearchTimeSync method)
(espnet.nets.beam_search_timesync_streaming.BeamSearchTimeSyncStreaming method)
(espnet.nets.chainer_backend.rnn.attentions.AttDot method)
(espnet.nets.chainer_backend.rnn.attentions.AttLoc method)
(espnet.nets.chainer_backend.rnn.attentions.NoAtt method)
(espnet.nets.pytorch_backend.rnn.attentions.AttAdd method)
(espnet.nets.pytorch_backend.rnn.attentions.AttCov method)
(espnet.nets.pytorch_backend.rnn.attentions.AttCovLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.AttDot method)
(espnet.nets.pytorch_backend.rnn.attentions.AttForward method)
(espnet.nets.pytorch_backend.rnn.attentions.AttForwardTA method)
(espnet.nets.pytorch_backend.rnn.attentions.AttLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.AttLoc2D method)
(espnet.nets.pytorch_backend.rnn.attentions.AttLocRec method)
(espnet.nets.pytorch_backend.rnn.attentions.AttMultiHeadAdd method)
(espnet.nets.pytorch_backend.rnn.attentions.AttMultiHeadDot method)
(espnet.nets.pytorch_backend.rnn.attentions.AttMultiHeadLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.AttMultiHeadMultiResLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.GDCAttLoc method)
(espnet.nets.pytorch_backend.rnn.attentions.NoAtt method)
(espnet2.asr.transducer.beam_search_transducer_streaming.BeamSearchTransducerStreaming method)
(espnet2.bin.asr_inference_streaming.Speech2TextStreaming method)
(espnet2.bin.enh_inference_streaming.SeparateSpeechStreaming method)
(espnet2.bin.st_inference_streaming.Speech2TextStreaming method)
reset_backward_rnn_state() (in module espnet.nets.pytorch_backend.rnn.encoders)
(in module espnet.nets.pytorch_backend.transducer.rnn_encoder)
reset_cache() (espnet2.asr_transducer.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr_transducer.encoder.encoder.Encoder method)
(espnet2.asr_transducer.frontend.online_audio_processor.OnlineAudioProcessor method)
reset_parameters() (espnet.nets.chainer_backend.e2e_asr_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_mt_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
(espnet.nets.pytorch_backend.transformer.embedding.ScaledPositionalEncoding method)
(espnet2.asr_transducer.decoder.blocks.mega.MEGA method)
(espnet2.asr_transducer.decoder.modules.mega.feed_forward.NormalizedPositionwiseFeedForward method)
(espnet2.asr_transducer.decoder.modules.mega.multi_head_damped_ema.MultiHeadDampedEMA method)
(espnet2.asr_transducer.decoder.modules.mega.positional_bias.RelativePositionBias method)
(espnet2.asr_transducer.decoder.modules.mega.positional_bias.RotaryRelativePositionBias method)
(espnet2.asr_transducer.decoder.modules.rwkv.attention.SelfAttention method)
(espnet2.asr_transducer.decoder.modules.rwkv.feed_forward.FeedForward method)
(espnet2.diar.layers.tcn_nomask.ChannelwiseLayerNorm method)
(espnet2.diar.layers.tcn_nomask.GlobalLayerNorm method)
(espnet2.enh.layers.complexnn.ComplexBatchNorm method)
(espnet2.enh.layers.dcunet.ComplexBatchNorm method)
(espnet2.enh.layers.tcn.ChannelwiseLayerNorm method)
(espnet2.enh.layers.tcn.GlobalLayerNorm method)
(espnet2.gan_svs.avocodo.__init__.AvocodoGenerator method)
(espnet2.gan_svs.avocodo.avocodo.AvocodoGenerator method)
(espnet2.gan_svs.uhifigan.__init__.UHiFiGANGenerator method)
(espnet2.gan_svs.uhifigan.uhifigan.UHiFiGANGenerator method)
(espnet2.gan_svs.visinger2.__init__.VISinger2VocoderGenerator method)
(espnet2.gan_svs.visinger2.visinger2_vocoder.VISinger2VocoderGenerator method)
(espnet2.gan_tts.hifigan.__init__.HiFiGANGenerator method)
(espnet2.gan_tts.hifigan.hifigan.HiFiGANGenerator method)
(espnet2.gan_tts.melgan.melgan.MelGANGenerator method)
(espnet2.gan_tts.melgan.melgan.MelGANMultiScaleDiscriminator method)
(espnet2.gan_tts.parallel_wavegan.upsample.Conv2d method)
(espnet2.gan_tts.style_melgan.style_melgan.StyleMelGANDiscriminator method)
(espnet2.gan_tts.style_melgan.style_melgan.StyleMelGANGenerator method)
(espnet2.gan_tts.wavenet.residual_block.Conv1d method)
reset_running_stats() (espnet2.enh.layers.complexnn.ComplexBatchNorm method)
(espnet2.enh.layers.dcunet.ComplexBatchNorm method)
reset_streaming_cache() (espnet2.asr_transducer.encoder.blocks.branchformer.Branchformer method)
(espnet2.asr_transducer.encoder.blocks.conformer.Conformer method)
(espnet2.asr_transducer.encoder.blocks.conv1d.Conv1d method)
(espnet2.asr_transducer.encoder.blocks.ebranchformer.EBranchformer method)
(espnet2.asr_transducer.encoder.modules.multi_blocks.MultiBlocks method)
(espnet2.bin.asr_transducer_inference.Speech2Text method)
Residual (class in espnet2.asr.state_spaces.residual)
ResidualAffineCouplingBlock (class in espnet2.gan_tts.vits.residual_coupling)
ResidualAffineCouplingLayer (class in espnet2.gan_tts.vits.residual_coupling)
ResidualBlock (class in espnet2.enh.layers.ncsnpp_utils.layers)
(class in espnet2.gan_tts.hifigan.residual_block)
(class in espnet2.gan_tts.wavenet.residual_block)
(class in espnet2.tts.prodiff.denoiser)
ResidualStack (class in espnet2.gan_tts.melgan.residual_stack)
ResNet (class in espnet2.asr.encoder.avhubert_encoder)
resnet_relu_type (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
resnet_weights (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
ResnetBlockBigGANpp (class in espnet2.enh.layers.ncsnpp_utils.layerspp)
ResnetBlockDDPM (class in espnet2.enh.layers.ncsnpp_utils.layers)
ResnetBlockDDPMpp (class in espnet2.enh.layers.ncsnpp_utils.layerspp)
resolve_distributed_mode() (in module espnet2.train.distributed_utils)
restore_snapshot() (in module espnet.asr.asr_utils)
resume() (espnet2.train.trainer.Trainer static method)
reverse() (espnet2.enh.diffusion.sdes.SDE method)
(in module espnet2.enh.layers.complex_utils)
(in module espnet2.layers.augmentation)
ReverseDiffusionPredictor (class in espnet2.enh.diffusion.sampling.predictors)
ReversibleInstanceNorm1dInput (class in espnet2.asr.state_spaces.components)
ReversibleInstanceNorm1dOutput (class in espnet2.asr.state_spaces.components)
RIRConvolve (class in espnet.transform.perturb)
RMSNorm (class in espnet2.asr_transducer.normalization)
RNN (class in espnet.nets.chainer_backend.rnn.encoders)
(class in espnet.nets.pytorch_backend.rnn.encoders)
(class in espnet.nets.pytorch_backend.transducer.rnn_encoder)
rnn_forward() (espnet.nets.chainer_backend.rnn.decoders.Decoder method)
(espnet.nets.pytorch_backend.rnn.decoders.Decoder method)
(espnet.nets.pytorch_backend.transducer.rnn_decoder.RNNDecoder method)
(espnet2.asr.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr.decoder.transducer_decoder.TransducerDecoder method)
(espnet2.asr_transducer.decoder.rnn_decoder.RNNDecoder method)
RnnAttractor (class in espnet2.diar.attractor.rnn_attractor)
RNNDecoder (class in espnet.nets.pytorch_backend.transducer.rnn_decoder)
(class in espnet2.asr.decoder.rnn_decoder)
(class in espnet2.asr_transducer.decoder.rnn_decoder)
RNNEncoder (class in espnet2.asr.encoder.rnn_encoder)
RNNLM (class in espnet.lm.chainer_backend.lm)
(class in espnet.nets.pytorch_backend.lm.default)
RNNP (class in espnet.nets.chainer_backend.rnn.encoders)
(class in espnet.nets.pytorch_backend.rnn.encoders)
(class in espnet.nets.pytorch_backend.transducer.rnn_encoder)
RNNSeparator (class in espnet2.enh.separator.rnn_separator)
rnnt_loss() (in module espnet2.asr.transducer.rnnt_multi_blank.rnnt_multi_blank)
rnnt_loss_cpu() (in module espnet2.asr.transducer.rnnt_multi_blank.rnnt)
rnnt_loss_gpu() (in module espnet2.asr.transducer.rnnt_multi_blank.rnnt)
RNNT_STATUS_INVALID_VALUE (espnet2.asr.transducer.rnnt_multi_blank.utils.global_constants.RNNTStatus attribute)
RNNT_STATUS_SUCCESS (espnet2.asr.transducer.rnnt_multi_blank.utils.global_constants.RNNTStatus attribute)
RNNTLossNumba (class in espnet2.asr.transducer.rnnt_multi_blank.rnnt_multi_blank)
RNNTStatus (class in espnet2.asr.transducer.rnnt_multi_blank.utils.global_constants)
rotary() (espnet2.asr_transducer.decoder.modules.mega.positional_bias.RotaryRelativePositionBias method)
RotaryRelativePositionBias (class in espnet2.asr_transducer.decoder.modules.mega.positional_bias)
round_down() (in module espnet2.samplers.category_balanced_sampler)
RttmReader (class in espnet2.fileio.rttm)
run() (espnet2.train.trainer.Trainer class method)
RWKV (class in espnet2.asr_transducer.decoder.blocks.rwkv)
RWKVDecoder (class in espnet2.asr_transducer.decoder.rwkv_decoder)
S
S2STAttentionLoss (class in espnet2.s2st.losses.attention_loss)
S2STCTCLoss (class in espnet2.s2st.losses.ctc_loss)
S2STGuidedAttentionLoss (class in espnet2.s2st.losses.guided_attention_loss)
S2STPackedContents (class in espnet2.bin.pack)
S2STTacotron2Loss (class in espnet2.s2st.losses.tacotron_loss)
S2STTask (class in espnet2.tasks.s2st)
S2TPackedContents (class in espnet2.bin.pack)
S2TPreprocessor (class in espnet2.train.preprocessor)
S2TTask (class in espnet2.tasks.s2t)
S3prlFrontend (class in espnet2.asr.frontend.s3prl)
S4 (class in espnet2.asr.state_spaces.s4)
S4Decoder (class in espnet2.asr.decoder.s4_decoder)
safe_log() (in module espnet2.gan_svs.visinger2.ddsp)
SamePad (class in espnet2.asr.encoder.avhubert_encoder)
(class in espnet2.uasr.discriminator.conv_discriminator)
(class in espnet2.uasr.generator.conv_generator)
sample_rate (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
samples_to_frames_ratio (espnet2.bin.asr_align.CTCSegmentation attribute)
savefig() (in module espnet.nets.pytorch_backend.transformer.plot)
SBD (class in espnet2.gan_svs.avocodo.__init__)
(class in espnet2.gan_svs.avocodo.avocodo)
SBDBlock (class in espnet2.gan_svs.avocodo.__init__)
(class in espnet2.gan_svs.avocodo.avocodo)
scale() (espnet.scheduler.scheduler.CyclicCosineScheduler method)
(espnet.scheduler.scheduler.NoScheduler method)
(espnet.scheduler.scheduler.NoamScheduler method)
(espnet.scheduler.scheduler.SchedulerInterface method)
scale_function() (in module espnet2.gan_svs.visinger2.ddsp)
ScaledPositionalEncoding (class in espnet.nets.pytorch_backend.transformer.embedding)
ScaleNorm (class in espnet2.asr_transducer.normalization)
SchedulerInterface (class in espnet.scheduler.scheduler)
score (espnet.nets.batch_beam_search.BatchHypothesis attribute)
(espnet.nets.beam_search.Hypothesis attribute)
score() (espnet.nets.pytorch_backend.lm.default.DefaultRNNLM method)
(espnet.nets.pytorch_backend.lm.seq_rnn.SequentialRNNLM method)
(espnet.nets.pytorch_backend.lm.transformer.TransformerLM method)
(espnet.nets.pytorch_backend.rnn.decoders.Decoder method)
(espnet.nets.pytorch_backend.transducer.custom_decoder.CustomDecoder method)
(espnet.nets.pytorch_backend.transducer.rnn_decoder.RNNDecoder method)
(espnet.nets.pytorch_backend.transformer.decoder.Decoder method)
(espnet.nets.scorer_interface.ScorerInterface method)
(espnet.nets.scorers.length_bonus.LengthBonus method)
(espnet.nets.scorers.ngram.NgramFullScorer method)
(espnet.nets.transducer_decoder_interface.TransducerDecoderInterface method)
(espnet2.asr.decoder.hugging_face_transformers_decoder.HuggingFaceTransformersDecoder method)
(espnet2.asr.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr.decoder.s4_decoder.S4Decoder method)
(espnet2.asr.decoder.transducer_decoder.TransducerDecoder method)
(espnet2.asr.decoder.transformer_decoder.BaseTransformerDecoder method)
(espnet2.asr.decoder.transformer_decoder.TransformerMDDecoder method)
(espnet2.asr.decoder.whisper_decoder.OpenAIWhisperDecoder method)
(espnet2.asr_transducer.decoder.abs_decoder.AbsDecoder method)
(espnet2.asr_transducer.decoder.mega_decoder.MEGADecoder method)
(espnet2.asr_transducer.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr_transducer.decoder.rwkv_decoder.RWKVDecoder method)
(espnet2.asr_transducer.decoder.stateless_decoder.StatelessDecoder method)
(espnet2.asvspoof.loss.abs_loss.AbsASVSpoofLoss method)
(espnet2.asvspoof.loss.am_softmax_loss.ASVSpoofAMSoftmaxLoss method)
(espnet2.asvspoof.loss.binary_loss.ASVSpoofBinaryLoss method)
(espnet2.asvspoof.loss.oc_softmax_loss.ASVSpoofOCSoftmaxLoss method)
(espnet2.bin.s2t_inference.ScoreFilter method)
(espnet2.lm.huggingface_pretrained_opt_lm.HuggingfaceOPTModel method)
(espnet2.lm.seq_rnn_lm.SequentialRNNLM method)
(espnet2.lm.transformer_lm.TransformerLM method)
(espnet2.s2st.synthesizer.discrete_synthesizer.TransformerDiscreteSynthesizer method)
score_fn() (espnet2.enh.diffusion.score_based_diffusion.ScoreModel method)
score_forward() (espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt.CPURNNT method)
(espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt.GPURNNT method)
(espnet2.asr.transducer.rnnt_multi_blank.utils.cuda_utils.gpu_rnnt.MultiblankGPURNNT method)
score_full() (espnet.nets.batch_beam_search.BatchBeamSearch method)
(espnet.nets.batch_beam_search_online.BatchBeamSearchOnline method)
(espnet.nets.beam_search.BeamSearch method)
score_loader() (in module espnet2.train.dataset)
score_partial() (espnet.nets.batch_beam_search.BatchBeamSearch method)
(espnet.nets.beam_search.BeamSearch method)
(espnet.nets.scorer_interface.PartialScorerInterface method)
(espnet.nets.scorers.ctc.CTCPrefixScorer method)
(espnet.nets.scorers.ngram.NgramPartScorer method)
score_partial_() (espnet.nets.scorers.ngram.Ngrambase method)
ScoreFilter (class in espnet2.bin.s2t_inference)
ScoreModel (class in espnet2.enh.diffusion.score_based_diffusion)
ScorerInterface (class in espnet.nets.scorer_interface)
scorers() (espnet.nets.asr_interface.ASRInterface method)
(espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_mulenc.E2E method)
(espnet.nets.pytorch_backend.e2e_asr_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_mt_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
scores (espnet.nets.batch_beam_search.BatchHypothesis attribute)
(espnet.nets.beam_search.Hypothesis attribute)
scoring() (in module espnet2.bin.enh_scoring)
SDE (class in espnet2.enh.diffusion.sdes)
sde() (espnet2.enh.diffusion.sdes.OUVESDE method)
(espnet2.enh.diffusion.sdes.OUVPSDE method)
(espnet2.enh.diffusion.sdes.SDE method)
SDRLoss (class in espnet2.enh.loss.criterions.time_domain)
search() (espnet.nets.batch_beam_search.BatchBeamSearch method)
(espnet.nets.beam_search.BeamSearch method)
seg_signal_context() (espnet2.enh.layers.fasnet.FaSNet_base method)
SegLSTM (class in espnet2.enh.layers.skim)
segments (espnet2.bin.asr_align.CTCSegmentationTask attribute)
SegmentStreamingE2E (class in espnet.nets.pytorch_backend.streaming.segment)
select_k_expansions() (espnet2.asr_transducer.beam_search_transducer.BeamSearchTransducer method)
(in module espnet.nets.pytorch_backend.transducer.utils)
select_lm_state() (in module espnet.nets.pytorch_backend.transducer.utils)
select_state() (espnet.nets.pytorch_backend.transducer.custom_decoder.CustomDecoder method)
(espnet.nets.pytorch_backend.transducer.rnn_decoder.RNNDecoder method)
(espnet.nets.scorer_interface.ScorerInterface method)
(espnet.nets.scorers.ctc.CTCPrefixScorer method)
(espnet.nets.scorers.ngram.NgramPartScorer method)
(espnet.nets.transducer_decoder_interface.TransducerDecoderInterface method)
(espnet2.asr.decoder.transducer_decoder.TransducerDecoder method)
(espnet2.asr_transducer.decoder.abs_decoder.AbsDecoder method)
(espnet2.asr_transducer.decoder.mega_decoder.MEGADecoder method)
(espnet2.asr_transducer.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr_transducer.decoder.rwkv_decoder.RWKVDecoder method)
(espnet2.asr_transducer.decoder.stateless_decoder.StatelessDecoder method)
selection_type (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
SelfAttention (class in espnet2.asr_transducer.decoder.modules.rwkv.attention)
SEModule (class in espnet2.spk.encoder.ska_tdnn_encoder)
(class in espnet2.spk.layers.ecapa_block)
SentencepiecesTokenizer (class in espnet2.text.sentencepiece_tokenizer)
SeparateSpeech (class in espnet2.bin.enh_inference)
(class in espnet2.bin.enh_tse_inference)
SeparateSpeechStreaming (class in espnet2.bin.enh_inference_streaming)
seq_cos_sim() (espnet2.enh.layers.fasnet.FaSNet_base method)
sequence_mask() (in module espnet2.gan_svs.vits.modules)
SequenceIdentity (class in espnet2.asr.state_spaces.base)
SequenceIterFactory (class in espnet2.iterators.sequence_iter_factory)
SequenceModel (class in espnet2.asr.state_spaces.model)
SequenceModule (class in espnet2.asr.state_spaces.base)
SequenceResidualBlock (class in espnet2.asr.state_spaces.block)
SequentialRNNLM (class in espnet.nets.pytorch_backend.lm.seq_rnn)
(class in espnet2.lm.seq_rnn_lm)
serialize() (espnet.lm.lm_utils.MakeSymlinkToBestModel method)
(espnet.lm.lm_utils.ParallelSentenceIterator method)
(espnet.nets.chainer_backend.transformer.training.VaswaniRule method)
(espnet.utils.dataset.ChainerDataLoader method)
set() (espnet2.bin.asr_align.CTCSegmentationTask method)
set_all_random_seed() (in module espnet2.torch_utils.set_all_random_seed)
set_block_size() (espnet.nets.batch_beam_search_online_sim.BatchBeamSearchOnlineSim method)
set_config() (espnet2.bin.asr_align.CTCSegmentation method)
set_deterministic_chainer() (in module espnet.utils.deterministic_utils)
set_deterministic_pytorch() (in module espnet.utils.deterministic_utils)
set_device() (espnet.nets.pytorch_backend.transducer.custom_decoder.CustomDecoder method)
(espnet.nets.pytorch_backend.transducer.rnn_decoder.RNNDecoder method)
(espnet2.asr.decoder.transducer_decoder.TransducerDecoder method)
(espnet2.asr_transducer.decoder.abs_decoder.AbsDecoder method)
(espnet2.asr_transducer.decoder.mega_decoder.MEGADecoder method)
(espnet2.asr_transducer.decoder.rnn_decoder.RNNDecoder method)
(espnet2.asr_transducer.decoder.rwkv_decoder.RWKVDecoder method)
(espnet2.asr_transducer.decoder.stateless_decoder.StatelessDecoder method)
set_early_stop() (in module espnet.utils.training.train_utils)
set_epoch() (espnet2.train.reporter.Reporter method)
set_forget_bias_to_one() (in module espnet.nets.pytorch_backend.initialization)
set_hop_size() (espnet.nets.batch_beam_search_online_sim.BatchBeamSearchOnlineSim method)
set_hyp_primer() (espnet.nets.beam_search.BeamSearch method)
set_look_ahead() (espnet.nets.batch_beam_search_online_sim.BatchBeamSearchOnlineSim method)
set_start_method() (in module espnet.distributed.pytorch_backend.launch)
set_streaming_config() (espnet.nets.batch_beam_search_online_sim.BatchBeamSearchOnlineSim method)
set_target() (espnet.nets.pytorch_backend.transducer.transducer_tasks.TransducerTasks method)
setup_logging() (in module espnet.bin.asr_train)
setup_probs() (espnet2.asr.transducer.rnnt_multi_blank.utils.cpu_utils.cpu_rnnt.CpuRNNT_metadata method)
setup_step() (espnet2.asr.state_spaces.s4.S4 method)
SGD (class in espnet2.optimizers.sgd)
sgd() (in module espnet.optimizer.parser)
SGDFactory (class in espnet.optimizer.chainer)
(class in espnet.optimizer.pytorch)
share_decoder_input_output_embed (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
ShufflingEnabler (class in espnet.utils.training.iterators)
signal_context() (espnet2.enh.layers.fasnet.FaSNet_base method)
signal_framing() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
(in module espnet2.enh.layers.wpe)
signal_no() (espnet.distributed.pytorch_backend.launch.MainProcessError property)
sim_type (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
sinc() (espnet2.layers.sinc_conv.SincConv static method)
SincConv (class in espnet2.layers.sinc_conv)
SineGen (class in espnet2.gan_svs.uhifigan.__init__)
(class in espnet2.gan_svs.uhifigan.sine_generator)
singing_tacotron (class in espnet2.svs.singing_tacotron.singing_tacotron)
SingingGenerate (class in espnet2.bin.svs_inference)
SingingScoreReader (class in espnet2.fileio.score_scp)
SingingScoreWriter (class in espnet2.fileio.score_scp)
SingleRNN (class in espnet2.enh.layers.dprnn)
SISNRLoss (class in espnet2.enh.loss.criterions.time_domain)
SizedDict (class in espnet2.utils.sized_dict)
SkaTdnnEncoder (class in espnet2.spk.encoder.ska_tdnn_encoder)
SkaTdnnProjector (class in espnet2.spk.projector.ska_tdnn_projector)
SKAttentionModule (class in espnet2.spk.encoder.ska_tdnn_encoder)
SkiM (class in espnet2.enh.layers.skim)
SkiMSeparator (class in espnet2.enh.separator.skim_separator)
skip_masked (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
skip_nomask (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
SlidingWindow (class in espnet2.asr.frontend.windowing)
SLUPreprocessor (class in espnet2.train.preprocessor)
SLUTask (class in espnet2.tasks.slu)
Smish (class in espnet2.asr_transducer.activation)
snapshot_object() (in module espnet.asr.asr_utils)
SNRLoss (class in espnet2.enh.loss.criterions.time_domain)
softmax() (espnet.nets.pytorch_backend.ctc.CTC method)
(espnet2.asr.ctc.CTC method)
softmax_attention() (espnet2.asr_transducer.decoder.blocks.mega.MEGA method)
solve() (in module espnet2.enh.layers.complex_utils)
solve_interpolation() (in module espnet.utils.spec_augment)
sort_by_perm() (espnet2.enh.espnet_model.ESPnetEnhancementModel static method)
sort_epochs() (espnet2.train.reporter.Reporter method)
sort_epochs_and_values() (espnet2.train.reporter.Reporter method)
sort_nbest() (espnet.nets.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer_streaming.BeamSearchTransducerStreaming method)
(espnet2.asr_transducer.beam_search_transducer.BeamSearchTransducer method)
sort_values() (espnet2.train.reporter.Reporter method)
SortedBatchSampler (class in espnet2.samplers.sorted_batch_sampler)
sound_loader() (in module espnet2.train.dataset)
soundfile_read() (in module espnet2.fileio.sound_scp)
SoundHDF5File (class in espnet.utils.io_utils)
SoundHDF5Reader (class in espnet.utils.cli_readers)
SoundHDF5Writer (class in espnet.utils.cli_writers)
SoundReader (class in espnet.utils.cli_readers)
SoundScpReader (class in espnet2.fileio.sound_scp)
SoundScpWriter (class in espnet2.fileio.sound_scp)
SoundWriter (class in espnet.utils.cli_writers)
SPACE (espnet2.text.phoneme_tokenizer.Jaso attribute)
sparse_image_warp() (in module espnet.utils.spec_augment)
SpatialDropout (class in espnet2.asr.preencoder.sinc)
SpeakerTask (class in espnet2.tasks.spk)
spec_augment() (in module espnet.transform.spec_augment)
spec_back() (espnet2.enh.decoder.stft_decoder.STFTDecoder method)
spec_transform_func() (espnet2.enh.encoder.stft_encoder.STFTEncoder method)
SpecAug (class in espnet2.asr.specaug.specaug)
specaug() (in module espnet.utils.spec_augment)
SpecAugment (class in espnet.transform.spec_augment)
SpectogramDenoiser (class in espnet2.tts.prodiff.denoiser)
Spectrogram (class in espnet.transform.spectrogram)
spectrogram() (espnet2.s2st.tgt_feats_extract.abs_tgt_feats_extract.AbsTgtFeatsExtract method)
(espnet2.s2st.tgt_feats_extract.linear_spectrogram.LinearSpectrogram method)
(espnet2.s2st.tgt_feats_extract.log_mel_fbank.LogMelFbank method)
(espnet2.s2st.tgt_feats_extract.log_spectrogram.LogSpectrogram method)
(in module espnet.transform.spectrogram)
Spectrogram2Waveform (class in espnet2.utils.griffin_lim)
Speech2Embedding (class in espnet2.bin.spk_inference)
Speech2Language (class in espnet2.bin.s2t_inference_language)
Speech2Speech (class in espnet2.bin.s2st_inference)
Speech2Text (class in espnet2.bin.asr_inference)
(class in espnet2.bin.asr_inference_maskctc)
(class in espnet2.bin.asr_transducer_inference)
(class in espnet2.bin.s2t_inference)
(class in espnet2.bin.st_inference)
(class in espnet2.bin.uasr_inference)
Speech2TextStreaming (class in espnet2.bin.asr_inference_streaming)
(class in espnet2.bin.st_inference_streaming)
Speech2Understand (class in espnet2.bin.slu_inference)
SpeechAntiSpoof (class in espnet2.bin.asvspoof_inference)
speed_perturb() (in module espnet2.layers.augmentation)
SpeedPerturbation (class in espnet.transform.perturb)
SpkPackedContents (class in espnet2.bin.pack)
SpkPreprocessor (class in espnet2.train.preprocessor)
SpkTrainer (class in espnet2.train.spk_trainer)
split_by_space() (in module espnet2.text.phoneme_tokenizer)
split_feature() (espnet2.enh.separator.dptnet_separator.DPTNetSeparator method)
(in module espnet2.enh.layers.dprnn)
split_scps() (in module espnet2.bin.split_scps)
square_mask() (in module espnet.nets.pytorch_backend.maskctc.mask)
SquaredReLU (class in espnet2.asr.state_spaces.components)
ssim() (espnet2.tts.prodiff.loss.SSimLoss method)
SSimLoss (class in espnet2.tts.prodiff.loss)
SSKernel (class in espnet2.asr.state_spaces.s4)
SSKernelDiag (class in espnet2.asr.state_spaces.s4)
SSKernelNPLR (class in espnet2.asr.state_spaces.s4)
SSLPackedContents (class in espnet2.bin.pack)
ssm() (in module espnet2.asr.state_spaces.s4)
stack() (in module espnet2.enh.layers.complex_utils)
stack_qk_states() (espnet2.asr_transducer.decoder.mega_decoder.MEGADecoder method)
start_epoch() (espnet2.train.reporter.Reporter method)
start_shuffle() (espnet.lm.lm_utils.ParallelSentenceIterator method)
(espnet.utils.dataset.ChainerDataLoader method)
(espnet.utils.training.iterators.ToggleableShufflingMultiprocessIterator method)
(espnet.utils.training.iterators.ToggleableShufflingSerialIterator method)
state_dict() (espnet.nets.pytorch_backend.lm.default.DefaultRNNLM method)
(espnet.nets.pytorch_backend.transformer.optimizer.NoamOpt method)
(espnet2.schedulers.abs_scheduler.AbsBatchStepScheduler method)
(espnet2.schedulers.abs_scheduler.AbsEpochStepScheduler method)
(espnet2.schedulers.abs_scheduler.AbsScheduler method)
(espnet2.schedulers.abs_scheduler.AbsValEpochStepScheduler method)
(espnet2.schedulers.warmup_reducelronplateau.WarmupReduceLROnPlateau method)
(espnet2.train.reporter.Reporter method)
state_list (espnet2.bin.asr_align.CTCSegmentationTask attribute)
state_to_tensor() (espnet2.asr.state_spaces.base.SequenceModule property)
(espnet2.asr.state_spaces.block.SequenceResidualBlock property)
(espnet2.asr.state_spaces.model.SequenceModel property)
StatelessDecoder (class in espnet2.asr_transducer.decoder.stateless_decoder)
states (espnet.nets.batch_beam_search.BatchHypothesis attribute)
(espnet.nets.beam_search.Hypothesis attribute)
StatsPooling (class in espnet2.spk.pooling.stat_pooling)
step() (espnet.nets.pytorch_backend.transformer.optimizer.NoamOpt method)
(espnet.scheduler.chainer.ChainerScheduler method)
(espnet.scheduler.pytorch.PyTorchScheduler method)
(espnet2.asr.state_spaces.attention.MultiHeadedAttention method)
(espnet2.asr.state_spaces.base.SequenceModule method)
(espnet2.asr.state_spaces.block.SequenceResidualBlock method)
(espnet2.asr.state_spaces.components.Normalization method)
(espnet2.asr.state_spaces.ff.FF method)
(espnet2.asr.state_spaces.model.SequenceModel method)
(espnet2.asr.state_spaces.pool.DownAvgPool method)
(espnet2.asr.state_spaces.pool.DownLinearPool method)
(espnet2.asr.state_spaces.pool.DownPool method)
(espnet2.asr.state_spaces.pool.DownSample method)
(espnet2.asr.state_spaces.pool.DownSpectralPool method)
(espnet2.asr.state_spaces.pool.UpPool method)
(espnet2.asr.state_spaces.pool.UpSample method)
(espnet2.asr.state_spaces.s4.S4 method)
(espnet2.asr.state_spaces.s4.SSKernel method)
(espnet2.asr.state_spaces.s4.SSKernelDiag method)
(espnet2.asr.state_spaces.s4.SSKernelNPLR method)
(espnet2.schedulers.abs_scheduler.AbsBatchStepScheduler method)
(espnet2.schedulers.abs_scheduler.AbsEpochStepScheduler method)
(espnet2.schedulers.abs_scheduler.AbsScheduler method)
(espnet2.schedulers.abs_scheduler.AbsValEpochStepScheduler method)
(espnet2.schedulers.cosine_anneal_warmup_restart.CosineAnnealingWarmupRestarts method)
(espnet2.schedulers.warmup_reducelronplateau.WarmupReduceLROnPlateau method)
Stft (class in espnet.transform.spectrogram)
(class in espnet2.layers.stft)
stft() (in module espnet.transform.spectrogram)
Stft2LogMelSpectrogram (class in espnet.transform.spectrogram)
stft2logmelspectrogram() (in module espnet.transform.spectrogram)
STFTDecoder (class in espnet2.enh.decoder.stft_decoder)
STFTEncoder (class in espnet2.enh.encoder.stft_encoder)
STInterface (class in espnet.nets.st_interface)
stochastic_depth() (in module espnet2.asr.state_spaces.components)
StochasticDepth (class in espnet2.asr.state_spaces.components)
StochasticDurationPredictor (class in espnet2.gan_tts.vits.duration_predictor)
STPackedContents (class in espnet2.bin.pack)
str2bool() (in module espnet2.utils.types)
str2pair_str() (in module espnet2.utils.types)
str2triple_str() (in module espnet2.utils.types)
str_or_int() (in module espnet2.utils.types)
str_or_none() (in module espnet2.utils.types)
streaming_decode() (espnet2.bin.asr_transducer_inference.Speech2Text method)
streaming_frame() (espnet2.enh.encoder.abs_encoder.AbsEncoder method)
(espnet2.enh.encoder.conv_encoder.ConvEncoder method)
(espnet2.enh.encoder.stft_encoder.STFTEncoder method)
streaming_merge() (espnet2.enh.decoder.abs_decoder.AbsDecoder method)
(espnet2.enh.decoder.conv_decoder.ConvDecoder method)
(espnet2.enh.decoder.stft_decoder.STFTDecoder method)
StreamPositionalEncoding (class in espnet.nets.pytorch_backend.transformer.embedding)
Stretch2d (class in espnet2.gan_tts.parallel_wavegan.upsample)
strtobool() (in module espnet.utils.cli_utils)
STTask (class in espnet2.tasks.st)
StyleEncoder (class in espnet2.tts.gst.style_encoder)
StyleMelGANDiscriminator (class in espnet2.gan_tts.style_melgan.style_melgan)
StyleMelGANGenerator (class in espnet2.gan_tts.style_melgan.style_melgan)
StyleTokenLayer (class in espnet2.tts.gst.style_encoder)
sub_encoder_layers (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
SubModel (class in espnet2.asr.encoder.avhubert_encoder)
SubReporter (class in espnet2.train.reporter)
subsample_frames() (espnet.nets.pytorch_backend.e2e_asr.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
subsequent_mask() (in module espnet.nets.pytorch_backend.transformer.mask)
subtract() (in module espnet.nets.pytorch_backend.transducer.utils)
sum_sqnorm() (in module espnet.nets.chainer_backend.rnn.training)
(in module espnet.nets.chainer_backend.transformer.training)
SVoiceSeparator (class in espnet2.enh.separator.svoice_separator)
SVSPackedContents (class in espnet2.bin.pack)
SVSPreprocessor (class in espnet2.train.preprocessor)
SVSTask (class in espnet2.tasks.svs)
Swish (class in espnet.nets.pytorch_backend.conformer.swish)
(class in espnet2.asr_transducer.activation)
SyllableScoreFeats (class in espnet2.svs.feats_extract.score_feats_extract)
synthesis() (espnet2.gan_tts.melgan.pqmf.PQMF method)
T
T() (espnet2.enh.diffusion.sdes.OUVESDE property)
(espnet2.enh.diffusion.sdes.OUVPSDE property)
(espnet2.enh.diffusion.sdes.SDE property)
Tacotron2 (class in espnet.nets.pytorch_backend.e2e_tts_tacotron2)
(class in espnet.nets.pytorch_backend.e2e_vc_tacotron2)
(class in espnet2.tts.tacotron2.tacotron2)
Tacotron2Loss (class in espnet.nets.pytorch_backend.e2e_tts_tacotron2)
TADELayer (class in espnet2.gan_tts.style_melgan.tade_res_block)
TADEResBlock (class in espnet2.gan_tts.style_melgan.tade_res_block)
target_forcing() (espnet.nets.pytorch_backend.e2e_mt_transformer.E2E method)
target_glu (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
target_language_biasing() (espnet.nets.pytorch_backend.e2e_mt.E2E method)
target_mask() (in module espnet.nets.pytorch_backend.transformer.mask)
TargetSpeakerExtractionTask (class in espnet2.tasks.enh_tse)
TCNDenseUNet (class in espnet2.enh.layers.tcndenseunet)
TCNResBlock (class in espnet2.enh.layers.tcndenseunet)
TCNSeparator (class in espnet2.enh.separator.tcn_separator)
TCNSeparatorNomask (class in espnet2.diar.separator.tcn_separator_nomask)
TDSpeakerBeamExtractor (class in espnet2.enh.extractor.td_speakerbeam_extractor)
TemporalBlock (class in espnet2.diar.layers.tcn_nomask)
(class in espnet2.enh.layers.tcn)
TemporalConvNet (class in espnet2.diar.layers.tcn_nomask)
(class in espnet2.enh.layers.tcn)
TemporalConvNetInformed (class in espnet2.enh.layers.tcn)
tensorboard_add_scalar() (espnet2.train.reporter.Reporter method)
(espnet2.train.reporter.SubReporter method)
TensorboardLogger (class in espnet.utils.training.tensorboard_logger)
test_model() (in module espnet2.enh.layers.fasnet)
(in module espnet2.enh.layers.ifasnet)
text (espnet2.bin.asr_align.CTCSegmentationTask attribute)
Text2Speech (class in espnet2.bin.tts_inference)
Text2Text (class in espnet2.bin.mt_inference)
text2tokens() (espnet2.text.abs_tokenizer.AbsTokenizer method)
(espnet2.text.char_tokenizer.CharTokenizer method)
(espnet2.text.hugging_face_tokenizer.HuggingFaceTokenizer method)
(espnet2.text.phoneme_tokenizer.PhonemeTokenizer method)
(espnet2.text.sentencepiece_tokenizer.SentencepiecesTokenizer method)
(espnet2.text.whisper_tokenizer.OpenAIWhisperTokenizer method)
(espnet2.text.word_tokenizer.WordTokenizer method)
text2tokens_svs() (espnet2.text.phoneme_tokenizer.PhonemeTokenizer method)
text_converter (espnet2.bin.asr_align.CTCSegmentation attribute)
TextCleaner (class in espnet2.text.cleaner)
TextEncoder (class in espnet2.gan_svs.vits.text_encoder)
(class in espnet2.gan_tts.vits.text_encoder)
TFGridNet (class in espnet2.enh.separator.tfgridnet_separator)
TFGridNetV2 (class in espnet2.enh.separator.tfgridnetv2_separator)
th_accuracy() (in module espnet.nets.pytorch_backend.nets_utils)
threads_per_block() (in module espnet2.asr.transducer.rnnt_multi_blank.utils.global_constants)
threeD_to_2D_tensor() (espnet2.asr.encoder.avhubert_encoder.ResEncoder method)
THRESHOLD (in module espnet2.asr.transducer.rnnt_multi_blank.utils.global_constants)
tik_reg() (in module espnet2.enh.layers.beamformer)
(in module espnet2.enh.layers.beamformer_th)
time_domain_weight (espnet2.enh.loss.criterions.time_domain.MultiResL1SpecLoss attribute)
time_mask() (in module espnet.transform.spec_augment)
(in module espnet.utils.spec_augment)
time_masking() (in module espnet2.asr.encoder.avhubert_encoder)
time_path_process() (espnet2.enh.layers.uses.ATFBlock method)
time_stamps (espnet2.bin.asr_align.CTCSegmentation attribute)
time_step() (espnet.nets.beam_search_timesync.BeamSearchTimeSync method)
(espnet.nets.beam_search_timesync_streaming.BeamSearchTimeSyncStreaming method)
time_stretch() (in module espnet2.layers.augmentation)
time_sync_decoding() (espnet.nets.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer.BeamSearchTransducer method)
(espnet2.asr.transducer.beam_search_transducer_streaming.BeamSearchTransducerStreaming method)
(espnet2.asr_transducer.beam_search_transducer.BeamSearchTransducer method)
time_warp() (in module espnet.transform.spec_augment)
(in module espnet.utils.spec_augment)
(in module espnet2.layers.time_warp)
TimeDomainL1 (class in espnet2.enh.loss.criterions.time_domain)
TimeDomainLoss (class in espnet2.enh.loss.criterions.time_domain)
TimeDomainMSE (class in espnet2.enh.loss.criterions.time_domain)
TimeMask (class in espnet.transform.spec_augment)
TimeWarp (class in espnet.transform.spec_augment)
(class in espnet2.layers.time_warp)
timings (espnet2.bin.asr_align.CTCSegmentationTask attribute)
to_bytes() (in module espnet2.torch_utils.model_summary)
to_complex() (in module espnet2.enh.layers.complex_utils)
to_device() (in module espnet.nets.pytorch_backend.nets_utils)
(in module espnet2.torch_utils.device_funcs)
to_dict() (in module espnet2.asr.state_spaces.utils)
to_double() (in module espnet2.enh.layers.complex_utils)
to_float() (in module espnet2.enh.layers.complex_utils)
to_list() (in module espnet2.asr.state_spaces.utils)
to_reported_value() (in module espnet2.train.reporter)
to_torch_tensor() (in module espnet.nets.pytorch_backend.nets_utils)
ToggleableShufflingMultiprocessIterator (class in espnet.utils.training.iterators)
ToggleableShufflingSerialIterator (class in espnet.utils.training.iterators)
TokenIDConverter (class in espnet2.text.token_id_converter)
tokenize() (in module espnet2.bin.tokenize_text)
tokens2ids() (espnet2.text.hugging_face_token_id_converter.HuggingFaceTokenIDConverter method)
(espnet2.text.token_id_converter.TokenIDConverter method)
(espnet2.text.whisper_token_id_converter.OpenAIWhisperTokenIDConverter method)
tokens2text() (espnet2.text.abs_tokenizer.AbsTokenizer method)
(espnet2.text.char_tokenizer.CharTokenizer method)
(espnet2.text.hugging_face_tokenizer.HuggingFaceTokenizer method)
(espnet2.text.phoneme_tokenizer.PhonemeTokenizer method)
(espnet2.text.sentencepiece_tokenizer.SentencepiecesTokenizer method)
(espnet2.text.whisper_tokenizer.OpenAIWhisperTokenizer method)
(espnet2.text.word_tokenizer.WordTokenizer method)
TooShortUttError, [1]
torch_complex_from_reim() (in module espnet2.enh.layers.dcunet)
torch_load() (in module espnet.asr.asr_utils)
torch_resume() (in module espnet.asr.asr_utils)
torch_save() (in module espnet.asr.asr_utils)
torch_snapshot() (in module espnet.asr.asr_utils)
TorchAudioHuBERTPretrainEncoder (class in espnet2.asr.encoder.hubert_encoder)
TorchAudioHubertPretrainModel (class in espnet2.hubert.espnet_model)
TorchSTFT (class in espnet2.gan_svs.visinger2.visinger2_vocoder)
trace() (in module espnet2.enh.layers.complex_utils)
train() (in module espnet.asr.chainer_backend.asr)
(in module espnet.asr.pytorch_backend.asr)
(in module espnet.asr.pytorch_backend.asr_mix)
(in module espnet.lm.chainer_backend.lm)
(in module espnet.lm.pytorch_backend.lm)
(in module espnet.mt.pytorch_backend.mt)
(in module espnet.st.pytorch_backend.st)
(in module espnet.tts.pytorch_backend.tts)
(in module espnet.vc.pytorch_backend.vc)
train_one_epoch() (espnet2.train.gan_trainer.GANTrainer class method)
(espnet2.train.trainer.Trainer class method)
(espnet2.train.uasr_trainer.UASRTrainer class method)
Trainer (class in espnet2.train.trainer)
trainer (espnet2.tasks.abs_task.AbsTask attribute)
(espnet2.tasks.asr.ASRTask attribute)
(espnet2.tasks.asr_transducer.ASRTransducerTask attribute)
(espnet2.tasks.asvspoof.ASVSpoofTask attribute)
(espnet2.tasks.diar.DiarizationTask attribute)
(espnet2.tasks.enh.EnhancementTask attribute)
(espnet2.tasks.enh_s2t.EnhS2TTask attribute)
(espnet2.tasks.enh_tse.TargetSpeakerExtractionTask attribute)
(espnet2.tasks.gan_svs.GANSVSTask attribute)
(espnet2.tasks.gan_tts.GANTTSTask attribute)
(espnet2.tasks.hubert.HubertTask attribute)
(espnet2.tasks.lm.LMTask attribute)
(espnet2.tasks.mt.MTTask attribute)
(espnet2.tasks.s2st.S2STTask attribute)
(espnet2.tasks.s2t.S2TTask attribute)
(espnet2.tasks.slu.SLUTask attribute)
(espnet2.tasks.spk.SpeakerTask attribute)
(espnet2.tasks.st.STTask attribute)
(espnet2.tasks.svs.SVSTask attribute)
(espnet2.tasks.tts.TTSTask attribute)
(espnet2.tasks.uasr.UASRTask attribute)
TrainerOptions (class in espnet2.train.trainer)
training_add_custom_arguments() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
trans() (in module espnet.mt.pytorch_backend.mt)
(in module espnet.st.pytorch_backend.st)
transducer_add_arguments() (espnet.nets.pytorch_backend.e2e_asr_transducer.E2E static method)
TransducerDecoder (class in espnet2.asr.decoder.transducer_decoder)
TransducerDecoderInterface (class in espnet.nets.transducer_decoder_interface)
TransducerTasks (class in espnet.nets.pytorch_backend.transducer.transducer_tasks)
transfer_verification() (in module espnet.asr.pytorch_backend.asr_init)
Transform (class in espnet.utils.dataset)
transform() (espnet2.gan_svs.visinger2.visinger2_vocoder.TorchSTFT method)
Transformation (class in espnet.transform.transformation)
TransformDataset (class in espnet.utils.dataset)
Transformer (class in espnet.nets.pytorch_backend.e2e_tts_transformer)
(class in espnet.nets.pytorch_backend.e2e_vc_transformer)
(class in espnet2.tts.transformer.transformer)
TransformerDecoder (class in espnet2.asr.decoder.transformer_decoder)
TransformerDecoderLayer (class in espnet.nets.pytorch_backend.transducer.transformer_decoder_layer)
TransformerDiscreteSynthesizer (class in espnet2.s2st.synthesizer.discrete_synthesizer)
TransformerEncoder (class in espnet2.asr.encoder.avhubert_encoder)
(class in espnet2.asr.encoder.transformer_encoder)
(class in espnet2.asr.encoder.transformer_encoder_multispkr)
TransformerLM (class in espnet.nets.pytorch_backend.lm.transformer)
(class in espnet2.lm.transformer_lm)
TransformerMDDecoder (class in espnet2.asr.decoder.transformer_decoder)
TransformerPostEncoder (class in espnet2.slu.postencoder.transformer_postencoder)
TransformerSeparator (class in espnet2.enh.separator.transformer_separator)
TransformInterface (class in espnet.transform.transform_interface)
transition() (in module espnet2.asr.state_spaces.s4)
translate() (espnet.nets.mt_interface.MTInterface method)
(espnet.nets.pytorch_backend.e2e_mt.E2E method)
(espnet.nets.pytorch_backend.e2e_mt_transformer.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.pytorch_backend.e2e_st_transformer.E2E method)
(espnet.nets.st_interface.STInterface method)
translate_batch() (espnet.nets.mt_interface.MTInterface method)
(espnet.nets.pytorch_backend.e2e_mt.E2E method)
(espnet.nets.pytorch_backend.e2e_st.E2E method)
(espnet.nets.st_interface.STInterface method)
Translatotron (class in espnet2.s2st.synthesizer.translatotron)
Translatotron2 (class in espnet2.s2st.synthesizer.translatotron2)
Transpose (class in espnet2.gan_tts.vits.flow)
transpose_for_scores() (espnet2.asr.layers.fastformer.FastSelfAttention method)
TransposedLinear (class in espnet2.asr.state_spaces.components)
TransposedLN (class in espnet2.asr.state_spaces.components)
TransposedModule() (in module espnet2.asr.state_spaces.base)
TransposeLast (class in espnet2.uasr.generator.conv_generator)
trim_attention_weight() (espnet.asr.asr_utils.PlotAttentionReport method)
trim_by_ctc_posterior() (in module espnet.nets.pytorch_backend.nets_utils)
trim_ctc_prob() (espnet.asr.asr_utils.PlotCTCReport method)
triu_onnx() (in module espnet.nets.pytorch_backend.nets_utils)
TSEPreprocessor (class in espnet2.train.preprocessor)
TSInverseNormalization (class in espnet2.asr.state_spaces.components)
TSNormalization (class in espnet2.asr.state_spaces.components)
TTSInterface (class in espnet.nets.tts_interface)
TTSPackedContents (class in espnet2.bin.pack)
TTSPlot (class in espnet.nets.pytorch_backend.e2e_tts_transformer)
TTSTask (class in espnet2.tasks.tts)
tuneThresholdfromScore() (in module espnet2.utils.eer)
U
UASRDiscriminatorLoss (class in espnet2.uasr.loss.discriminator_loss)
UASRGradientPenalty (class in espnet2.uasr.loss.gradient_penalty)
UASRPhonemeDiversityLoss (class in espnet2.uasr.loss.phoneme_diversity_loss)
UASRPrefixScorer (class in espnet.nets.scorers.uasr)
UASRPseudoLabelLoss (class in espnet2.uasr.loss.pseudo_label_loss)
UASRSmoothnessPenalty (class in espnet2.uasr.loss.smoothness_penalty)
UASRTask (class in espnet2.tasks.uasr)
UASRTrainer (class in espnet2.train.uasr_trainer)
UASRTrainerOptions (class in espnet2.train.uasr_trainer)
UHiFiGANGenerator (class in espnet2.gan_svs.uhifigan.__init__)
(class in espnet2.gan_svs.uhifigan.uhifigan)
unbatchfy() (espnet.nets.batch_beam_search.BatchBeamSearch method)
unconstrained_rational_quadratic_spline() (in module espnet2.gan_tts.vits.transform)
unet_decoder_args() (in module espnet2.enh.layers.dcunet)
unfold() (espnet2.enh.separator.ineube_separator.iNeuBe static method)
uniform_init_parameters() (in module espnet.nets.pytorch_backend.initialization)
UnitYSynthesizer (class in espnet2.s2st.synthesizer.unity_synthesizer)
unpack() (in module espnet2.main_funcs.pack_funcs)
UnsortedBatchSampler (class in espnet2.samplers.unsorted_batch_sampler)
untie_final_proj (espnet2.asr.encoder.avhubert_encoder.AVHubertConfig attribute)
update() (espnet.asr.pytorch_backend.asr.CustomUpdater method)
(espnet.nets.chainer_backend.rnn.training.CustomParallelUpdater method)
(espnet.nets.chainer_backend.rnn.training.CustomUpdater method)
(espnet.nets.chainer_backend.transformer.training.CustomParallelUpdater method)
(espnet.nets.chainer_backend.transformer.training.CustomUpdater method)
(espnet.tts.pytorch_backend.tts.CustomUpdater method)
(espnet.vc.pytorch_backend.vc.CustomUpdater method)
(espnet2.spk.loss.aamsoftmax_subcenter_intertopk.ArcMarginProduct_intertopk_subcenter method)
update_core() (espnet.asr.pytorch_backend.asr.CustomUpdater method)
(espnet.lm.chainer_backend.lm.BPTTUpdater method)
(espnet.lm.pytorch_backend.lm.BPTTUpdater method)
(espnet.nets.chainer_backend.rnn.training.CustomParallelUpdater method)
(espnet.nets.chainer_backend.rnn.training.CustomUpdater method)
(espnet.nets.chainer_backend.transformer.training.CustomParallelUpdater method)
(espnet.nets.chainer_backend.transformer.training.CustomUpdater method)
(espnet.tts.pytorch_backend.tts.CustomUpdater method)
(espnet.vc.pytorch_backend.vc.CustomUpdater method)
update_fn() (espnet2.enh.diffusion.sampling.__init__.Corrector method)
(espnet2.enh.diffusion.sampling.__init__.Predictor method)
(espnet2.enh.diffusion.sampling.correctors.AnnealedLangevinDynamics method)
(espnet2.enh.diffusion.sampling.correctors.Corrector method)
(espnet2.enh.diffusion.sampling.correctors.LangevinCorrector method)
(espnet2.enh.diffusion.sampling.correctors.NoneCorrector method)
(espnet2.enh.diffusion.sampling.predictors.EulerMaruyamaPredictor method)
(espnet2.enh.diffusion.sampling.predictors.NonePredictor method)
(espnet2.enh.diffusion.sampling.predictors.Predictor method)
(espnet2.enh.diffusion.sampling.predictors.ReverseDiffusionPredictor method)
upfirdn2d() (in module espnet2.enh.layers.ncsnpp_utils.upfirdn2d)
upfirdn2d_native() (in module espnet2.enh.layers.ncsnpp_utils.upfirdn2d)
upgrade_state_dict_named() (espnet2.asr.encoder.avhubert_encoder.TransformerEncoder method)
UpPool (class in espnet2.asr.state_spaces.pool)
UpSample (class in espnet2.asr.state_spaces.pool)
Upsample (class in espnet2.enh.layers.ncsnpp_utils.layers)
(class in espnet2.enh.layers.ncsnpp_utils.layerspp)
upsample() (in module espnet2.asr.state_spaces.pool)
(in module espnet2.gan_svs.visinger2.ddsp)
upsample_2d() (in module espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling)
upsample_conv_2d() (in module espnet2.enh.layers.ncsnpp_utils.up_or_down_sampling)
UpsampleConv (class in espnet2.enh.layers.ncsnpp_utils.layers)
UpsampleNetwork (class in espnet2.gan_tts.parallel_wavegan.upsample)
UpSampling (class in espnet.nets.pytorch_backend.wavenet)
use_lids() (espnet2.bin.s2st_inference.Speech2Speech property)
(espnet2.bin.svs_inference.SingingGenerate property)
(espnet2.bin.tts_inference.Text2Speech property)
use_sids() (espnet2.bin.s2st_inference.Speech2Speech property)
(espnet2.bin.svs_inference.SingingGenerate property)
(espnet2.bin.tts_inference.Text2Speech property)
use_speech() (espnet2.bin.s2st_inference.Speech2Speech property)
(espnet2.bin.svs_inference.SingingGenerate property)
(espnet2.bin.tts_inference.Text2Speech property)
use_spembs() (espnet2.bin.s2st_inference.Speech2Speech property)
(espnet2.bin.svs_inference.SingingGenerate property)
(espnet2.bin.tts_inference.Text2Speech property)
USES (class in espnet2.enh.layers.uses)
USESSeparator (class in espnet2.enh.separator.uses_separator)
utt_begin_indices (espnet2.bin.asr_align.CTCSegmentationTask attribute)
utt_ids (espnet2.bin.asr_align.CTCSegmentationTask attribute)
utterance_mvn() (in module espnet.nets.pytorch_backend.frontends.feature_transform)
(in module espnet2.layers.utterance_mvn)
UtteranceCMVN (class in espnet.transform.cmvn)
UtteranceMVN (class in espnet.nets.pytorch_backend.frontends.feature_transform)
(class in espnet2.layers.utterance_mvn)
V
VADScpReader (class in espnet2.fileio.vad_scp)
VADScpWriter (class in espnet2.fileio.vad_scp)
valid_aux_encoder_output_layers() (in module espnet.nets.pytorch_backend.transducer.utils)
VALID_CHARS (espnet2.text.phoneme_tokenizer.Jaso attribute)
validate_architecture() (in module espnet2.asr_transducer.encoder.validation)
validate_block_arguments() (in module espnet2.asr_transducer.encoder.validation)
validate_input_block() (in module espnet2.asr_transducer.encoder.validation)
validate_one_epoch() (espnet2.train.gan_trainer.GANTrainer class method)
(espnet2.train.spk_trainer.SpkTrainer class method)
(espnet2.train.trainer.Trainer class method)
(espnet2.train.uasr_trainer.UASRTrainer class method)
values() (espnet.utils.io_utils.SoundHDF5File method)
variable_columns_sound_loader() (in module espnet2.train.dataset)
variance_scaling() (in module espnet2.enh.layers.ncsnpp_utils.layers)
VarianceLoss (class in espnet2.gan_tts.jets.loss)
VarianceNorm2d (class in espnet2.enh.layers.ncsnpp_utils.normalization)
VariancePredictor (class in espnet2.tts.fastspeech2.variance_predictor)
VaswaniRule (class in espnet.nets.chainer_backend.transformer.training)
verify_block_arguments() (in module espnet.nets.pytorch_backend.transducer.blocks)
verify_rel_pos_type() (in module espnet.nets.pytorch_backend.conformer.argument)
VGG2L (class in espnet.nets.chainer_backend.rnn.encoders)
(class in espnet.nets.pytorch_backend.rnn.encoders)
(class in espnet.nets.pytorch_backend.transducer.rnn_encoder)
(class in espnet.nets.pytorch_backend.transducer.vgg2l)
VGGRNNEncoder (class in espnet2.asr.encoder.vgg_rnn_encoder)
VISinger2Discriminator (class in espnet2.gan_svs.visinger2.__init__)
(class in espnet2.gan_svs.visinger2.visinger2_vocoder)
VISinger2VocoderGenerator (class in espnet2.gan_svs.visinger2.__init__)
(class in espnet2.gan_svs.visinger2.visinger2_vocoder)
VISingerGenerator (class in espnet2.gan_svs.vits.generator)
viterbi_decode() (in module espnet2.gan_tts.jets.alignments)
VITS (class in espnet2.gan_svs.vits.vits)
(class in espnet2.gan_tts.vits.vits)
VITSGenerator (class in espnet2.gan_tts.vits.generator)
VolumePerturbation (class in espnet.transform.perturb)
W
W (espnet.nets.chainer_backend.deterministic_embed_id.EmbedID attribute)
wandb_get_prefix() (in module espnet2.train.reporter)
wandb_log() (espnet2.train.reporter.Reporter method)
(espnet2.train.reporter.SubReporter method)
WarmupLR (class in espnet2.schedulers.warmup_lr)
WarmupReduceLROnPlateau (class in espnet2.schedulers.warmup_reducelronplateau)
WarmupStepLR (class in espnet2.schedulers.warmup_step_lr)
warned_about_misconfiguration (espnet2.bin.asr_align.CTCSegmentation attribute)
warp_size() (in module espnet2.asr.transducer.rnnt_multi_blank.utils.global_constants)
WaveNet (class in espnet.nets.pytorch_backend.wavenet)
(class in espnet2.gan_tts.wavenet.wavenet)
weight (espnet2.enh.loss.wrappers.abs_wrapper.AbsLossWrapper attribute)
weight() (espnet2.asr.decoder.whisper_decoder.ExpandedTokenEmbedding property)
weighted_sample_without_replacement() (in module espnet2.layers.augmentation)
WeightedAverage (class in espnet2.train.reporter)
whisper_encode() (espnet2.asr.encoder.whisper_encoder.OpenAIWhisperEncoder method)
(espnet2.asr.frontend.whisper.WhisperFrontend method)
WhisperFrontend (class in espnet2.asr.frontend.whisper)
window_sz (espnet2.enh.loss.criterions.time_domain.MultiResL1SpecLoss attribute)
WindowStreamingE2E (class in espnet.nets.pytorch_backend.streaming.window)
wkv_linear_attention() (espnet2.asr_transducer.decoder.modules.rwkv.attention.SelfAttention method)
WKVLinearAttention (class in espnet2.asr_transducer.decoder.modules.rwkv.attention)
WN (class in espnet2.gan_svs.pits.modules)
WordTokenizer (class in espnet2.text.word_tokenizer)
worker_id() (espnet.distributed.pytorch_backend.launch.WorkerError property)
worker_init_fn() (in module espnet2.iterators.category_iter_factory)
(in module espnet2.iterators.sequence_iter_factory)
WorkerError
WPE (class in espnet.transform.wpe)
wpe() (in module espnet2.enh.layers.wpe)
wpe_one_iteration() (in module espnet2.enh.layers.wpe)
X
XiaoiceSing (class in espnet2.svs.xiaoice.XiaoiceSing)
XiaoiceSing2Loss (class in espnet2.svs.xiaoice.loss)
XMLReader (class in espnet2.fileio.score_scp)
XMLWriter (class in espnet2.fileio.score_scp)
XvectorEncoder (class in espnet2.spk.encoder.xvector_encoder)
XvectorProjector (class in espnet2.spk.projector.xvector_projector)
Y
yaml_files (espnet2.bin.pack.ASRPackedContents attribute)
(espnet2.bin.pack.DiarPackedContents attribute)
(espnet2.bin.pack.EnhPackedContents attribute)
(espnet2.bin.pack.EnhS2TPackedContents attribute)
(espnet2.bin.pack.PackedContents attribute)
(espnet2.bin.pack.S2STPackedContents attribute)
(espnet2.bin.pack.S2TPackedContents attribute)
(espnet2.bin.pack.SSLPackedContents attribute)
(espnet2.bin.pack.STPackedContents attribute)
(espnet2.bin.pack.SVSPackedContents attribute)
(espnet2.bin.pack.SpkPackedContents attribute)
(espnet2.bin.pack.TTSPackedContents attribute)
yaml_no_alias_safe_dump() (in module espnet2.utils.yaml_no_alias_safe_dump)
Ying (class in espnet2.tts.feats_extract.ying)
YingDecoder (class in espnet2.gan_svs.pits.ying_decoder)
yingram() (espnet2.tts.feats_extract.ying.Ying method)
yingram_from_cmndf() (espnet2.tts.feats_extract.ying.Ying method)
yseq (espnet.nets.batch_beam_search.BatchHypothesis attribute)
(espnet.nets.beam_search.Hypothesis attribute)
Z
zero (espnet.lm.chainer_backend.extlm.LookAheadWordLM attribute)
(espnet.lm.chainer_backend.extlm.MultiLevelLM attribute)
(espnet.lm.pytorch_backend.extlm.LookAheadWordLM attribute)
(espnet.lm.pytorch_backend.extlm.MultiLevelLM attribute)
zero_grad() (espnet.nets.pytorch_backend.transformer.optimizer.NoamOpt method)
zero_mean (espnet2.enh.loss.criterions.time_domain.SISNRLoss attribute)
zero_state() (espnet.nets.pytorch_backend.lm.default.RNNLM method)
(espnet.nets.pytorch_backend.rnn.decoders.Decoder method)
(espnet2.asr.decoder.rnn_decoder.RNNDecoder method)
(espnet2.lm.seq_rnn_lm.SequentialRNNLM method)
ZoneOutCell (class in espnet.nets.pytorch_backend.tacotron2.decoder)