lhotse
v1.9
Contents:
Getting started
Representing a corpus
Cuts
Feature extraction
Executing tasks in parallel
PyTorch Datasets
Kaldi Interoperability
Command-line interface
API Reference
lhotse
Docs
»
Index
Edit on GitHub
Index
Symbols
|
_
|
A
|
B
|
C
|
D
|
E
|
F
|
G
|
H
|
I
|
K
|
L
|
M
|
N
|
O
|
P
|
R
|
S
|
T
|
U
|
V
|
W
|
X
|
Z
Symbols
--absolute-paths <absolute_paths>
lhotse-prepare-callhome-egyptian command line option
lhotse-prepare-callhome-english command line option
lhotse-prepare-cmu-kids command line option
lhotse-prepare-cslu-kids command line option
lhotse-prepare-eval2000 command line option
lhotse-prepare-fisher-english command line option
lhotse-prepare-fisher-spanish command line option
lhotse-prepare-gale-arabic command line option
lhotse-prepare-gale-mandarin command line option
lhotse-prepare-switchboard command line option
--annotations <annotations>
lhotse-download-ami command line option
lhotse-prepare-ami command line option
--audio
lhotse-cut-export-to-webdataset command line option
--audio <audio>
lhotse-prepare-gale-arabic command line option
lhotse-prepare-gale-mandarin command line option
--audio-dirs <audio_dirs>
lhotse-prepare-fisher-english command line option
--audio-format <audio_format>
lhotse-cut-export-to-webdataset command line option
--batch-duration <batch_duration>
lhotse-feat-extract-cuts-batch command line option
--buck-walter
lhotse-prepare-mgb2 command line option
--bundle-name <bundle_name>
lhotse-workflows-align-with-torchaudio command line option
--compute-durations
lhotse-kaldi-import command line option
--configs <configs>
lhotse-prepare-csj command line option
--context-direction <context_direction>
lhotse-cut-trim-to-supervisions command line option
--custom
lhotse-cut-export-to-webdataset command line option
--cutids <cutids>
lhotse-subset command line option
--cuts-manifest <cuts_manifest>
lhotse-workflows-annotate-with-whisper command line option
--dataset-part <dataset_part>
lhotse-prepare-nsc command line option
--dataset-parts <dataset_parts>
lhotse-prepare-csj command line option
lhotse-prepare-librispeech command line option
lhotse-prepare-wenet-speech command line option
--dev <dev>
lhotse-prepare-dihard3 command line option
--device <device>
lhotse-workflows-align-with-torchaudio command line option
lhotse-workflows-annotate-with-whisper command line option
--discard-overflowing-supervisions
lhotse-cut-truncate command line option
--discard-overlapping
lhotse-cut-trim-to-supervisions command line option
--dont-normalize-text
lhotse-workflows-align-with-torchaudio command line option
--dont-read-data
lhotse-validate command line option
lhotse-validate-pair command line option
--duration <duration>
lhotse-cut-pad command line option
--eval <eval>
lhotse-prepare-dihard3 command line option
--extension <extension>
lhotse-workflows-annotate-with-whisper command line option
--fault-tolerant
lhotse-cut-export-to-webdataset command line option
--feature-manifest <feature_manifest>
lhotse-cut-simple command line option
lhotse-feat-extract command line option
lhotse-feat-extract-cuts command line option
lhotse-feat-extract-cuts-batch command line option
--feature-type <feature_type>
lhotse-feat-write-default-config command line option
--features
lhotse-cut-export-to-webdataset command line option
--first <first>
lhotse-subset command line option
--flac
lhotse-prepare-mls command line option
--force-download
lhotse-download-ali-meeting command line option
lhotse-download-daily-talk command line option
lhotse-download-libricss command line option
lhotse-download-voxceleb1 command line option
lhotse-download-voxceleb2 command line option
--force-download <force_download>
lhotse-download-ami command line option
lhotse-download-icsi command line option
--force-eager
lhotse-cut-simple command line option
--frame-shift <frame_shift>
lhotse-kaldi-import command line option
--full
lhotse-download-librispeech command line option
--host <host>
lhotse-download-gigaspeech command line option
--install-dir <install_dir>
lhotse-install-sph2pipe command line option
--jobs <jobs>
lhotse-workflows-annotate-with-whisper command line option
--keep-overflowing-supervisions
lhotse-cut-truncate command line option
--keep-overlapping
lhotse-cut-trim-to-supervisions command line option
--lang <lang>
lhotse-download-mtedx command line option
lhotse-prepare-mtedx command line option
--language <language>
lhotse-prepare-commonvoice command line option
lhotse-workflows-annotate-with-whisper command line option
--last <last>
lhotse-subset command line option
--lilcom-tick-power <lilcom_tick_power>
lhotse-feat-extract command line option
--link-previous-utterance
lhotse-prepare-libritts command line option
--map-string-to-underscores <map_string_to_underscores>
lhotse-kaldi-import command line option
--map-underscores-to <map_underscores_to>
lhotse-kaldi-export command line option
--max-duration <max_duration>
lhotse-cut-truncate command line option
--max-jobs <max_jobs>
lhotse-copy-feats command line option
--mer-thresh <mer_thresh>
lhotse-prepare-mgb2 command line option
--mic <mic>
lhotse-download-ami command line option
lhotse-download-icsi command line option
lhotse-prepare-ali-meeting command line option
lhotse-prepare-ami command line option
lhotse-prepare-aspire command line option
lhotse-prepare-icsi command line option
--min-duration <min_duration>
lhotse-cut-trim-to-supervisions command line option
--min-segment-seconds <min_segment_seconds>
lhotse-prepare-librimix command line option
--mini
lhotse-download-librispeech command line option
--model-name <model_name>
lhotse-workflows-annotate-with-whisper command line option
--no-audio
lhotse-cut-export-to-webdataset command line option
--no-buck-walter
lhotse-prepare-mgb2 command line option
--no-custom
lhotse-cut-export-to-webdataset command line option
--no-features
lhotse-cut-export-to-webdataset command line option
--no-normalize-text
lhotse-prepare-earnings21 command line option
lhotse-prepare-earnings22 command line option
lhotse-prepare-spgispeech command line option
--no-pad
lhotse-split command line option
--no-precomputed-mixtures
lhotse-prepare-librimix command line option
--no-previous-utterance
lhotse-prepare-libritts command line option
--no-text-cleaning
lhotse-prepare-mgb2 command line option
--no-uem
lhotse-prepare-dihard3 command line option
--no-vocals
lhotse-prepare-musan command line option
--normalize-text
lhotse-prepare-earnings21 command line option
lhotse-prepare-earnings22 command line option
lhotse-prepare-icsi command line option
lhotse-prepare-spgispeech command line option
lhotse-workflows-align-with-torchaudio command line option
--normalize-text <normalize_text>
lhotse-prepare-ami command line option
lhotse-prepare-cslu-kids command line option
--num-jobs <num_jobs>
lhotse-feat-extract command line option
lhotse-feat-extract-cuts command line option
lhotse-feat-extract-cuts-batch command line option
lhotse-feat-upload command line option
lhotse-kaldi-import command line option
lhotse-prepare-aishell2 command line option
lhotse-prepare-commonvoice command line option
lhotse-prepare-csj command line option
lhotse-prepare-daily-talk command line option
lhotse-prepare-dihard3 command line option
lhotse-prepare-fisher-english command line option
lhotse-prepare-gigaspeech command line option
lhotse-prepare-hifitts command line option
lhotse-prepare-librispeech command line option
lhotse-prepare-libritts command line option
lhotse-prepare-mgb2 command line option
lhotse-prepare-mls command line option
lhotse-prepare-mtedx command line option
lhotse-prepare-spgispeech command line option
lhotse-prepare-tal-csasr command line option
lhotse-prepare-timit command line option
lhotse-prepare-voxceleb command line option
lhotse-prepare-wenet-speech command line option
--num-phones <num_phones>
lhotse-prepare-timit command line option
--num_jobs <num_jobs>
lhotse-prepare-bvcc command line option
--offset-type <offset_type>
lhotse-cut-truncate command line option
--omit-silence
lhotse-prepare-switchboard command line option
--opus
lhotse-prepare-mls command line option
--pad
lhotse-split command line option
--partition <partition>
lhotse-prepare-ami command line option
--parts <parts>
lhotse-prepare-rir-noise command line option
--prefix-spk-id
lhotse-kaldi-export command line option
--preserve-id
lhotse-cut-truncate command line option
--read-data
lhotse-validate command line option
lhotse-validate-pair command line option
--recording-manifest <recording_manifest>
lhotse-cut-simple command line option
--recordings-dir <recordings_dir>
lhotse-workflows-annotate-with-whisper command line option
--recordings-manifest <recordings_manifest>
lhotse-workflows-annotate-with-whisper command line option
--retain-silence
lhotse-prepare-switchboard command line option
--root-dir <root_dir>
lhotse-feat-extract command line option
--rttm-dir <rttm_dir>
lhotse-prepare-callhome-english command line option
--sampling-rate <sampling_rate>
lhotse-prepare-librimix command line option
--seed <seed>
lhotse command line option
--segment-words <segment_words>
lhotse-prepare-gale-mandarin command line option
--sentiment-dir <sentiment_dir>
lhotse-prepare-switchboard command line option
--shard-size <shard_size>
lhotse-cut-export-to-webdataset command line option
--shuffle
lhotse-split command line option
--split <split>
lhotse-prepare-commonvoice command line option
--stop-on-fail
lhotse-cut-export-to-webdataset command line option
--storage-type <storage_type>
lhotse-copy-feats command line option
lhotse-feat-extract command line option
lhotse-feat-extract-cuts command line option
lhotse-feat-extract-cuts-batch command line option
--subset <subset>
lhotse-download-gigaspeech command line option
lhotse-prepare-gigaspeech command line option
--supervision-manifest <supervision_manifest>
lhotse-cut-simple command line option
--text-cleaning
lhotse-prepare-mgb2 command line option
--transcript <transcript>
lhotse-prepare-gale-arabic command line option
lhotse-prepare-gale-mandarin command line option
--transcript-dir <transcript_dir>
lhotse-prepare-callhome-english command line option
lhotse-prepare-switchboard command line option
--transcript-dirs <transcript_dirs>
lhotse-prepare-fisher-english command line option
--transcripts-dir <transcripts_dir>
lhotse-download-icsi command line option
lhotse-prepare-icsi command line option
--type <type>
lhotse-prepare-libricss command line option
--uem
lhotse-prepare-dihard3 command line option
--url <url>
lhotse-download-ami command line option
lhotse-download-icsi command line option
lhotse-install-sph2pipe command line option
--use-edinburgh-vctk-url <use_edinburgh_vctk_url>
lhotse-prepare-vctk command line option
--use-vocals
lhotse-prepare-musan command line option
--voxceleb1 <voxceleb1>
lhotse-prepare-voxceleb command line option
--voxceleb2 <voxceleb2>
lhotse-prepare-voxceleb command line option
--with-precomputed-mixtures
lhotse-prepare-librimix command line option
-ad
lhotse-prepare-fisher-english command line option
-b
lhotse-feat-extract-cuts-batch command line option
-c
lhotse-cut-trim-to-supervisions command line option
lhotse-prepare-csj command line option
lhotse-workflows-annotate-with-whisper command line option
-d
lhotse-cut-pad command line option
lhotse-cut-trim-to-supervisions command line option
lhotse-cut-truncate command line option
lhotse-kaldi-import command line option
lhotse-workflows-align-with-torchaudio command line option
lhotse-workflows-annotate-with-whisper command line option
-e
lhotse-workflows-annotate-with-whisper command line option
-f
lhotse-cut-export-to-webdataset command line option
lhotse-cut-simple command line option
lhotse-feat-extract command line option
lhotse-feat-extract-cuts command line option
lhotse-feat-extract-cuts-batch command line option
lhotse-feat-write-default-config command line option
lhotse-kaldi-import command line option
-j
lhotse-copy-feats command line option
lhotse-feat-extract command line option
lhotse-feat-extract-cuts command line option
lhotse-feat-extract-cuts-batch command line option
lhotse-feat-upload command line option
lhotse-kaldi-import command line option
lhotse-prepare-aishell2 command line option
lhotse-prepare-commonvoice command line option
lhotse-prepare-csj command line option
lhotse-prepare-dihard3 command line option
lhotse-prepare-fisher-english command line option
lhotse-prepare-gigaspeech command line option
lhotse-prepare-hifitts command line option
lhotse-prepare-librispeech command line option
lhotse-prepare-libritts command line option
lhotse-prepare-mgb2 command line option
lhotse-prepare-mls command line option
lhotse-prepare-mtedx command line option
lhotse-prepare-spgispeech command line option
lhotse-prepare-tal-csasr command line option
lhotse-prepare-timit command line option
lhotse-prepare-voxceleb command line option
lhotse-prepare-wenet-speech command line option
lhotse-workflows-annotate-with-whisper command line option
-l
lhotse-download-mtedx command line option
lhotse-prepare-commonvoice command line option
lhotse-prepare-mtedx command line option
lhotse-workflows-annotate-with-whisper command line option
-m
lhotse-workflows-annotate-with-whisper command line option
-n
lhotse-workflows-align-with-torchaudio command line option
lhotse-workflows-annotate-with-whisper command line option
-nj
lhotse-prepare-bvcc command line option
-o
lhotse-cut-truncate command line option
-p
lhotse-kaldi-export command line option
lhotse-prepare-csj command line option
lhotse-prepare-librispeech command line option
lhotse-prepare-nsc command line option
lhotse-prepare-rir-noise command line option
lhotse-prepare-timit command line option
lhotse-prepare-wenet-speech command line option
-r
lhotse-cut-simple command line option
lhotse-feat-extract command line option
lhotse-workflows-annotate-with-whisper command line option
-s
lhotse command line option
lhotse-cut-export-to-webdataset command line option
lhotse-cut-simple command line option
lhotse-prepare-commonvoice command line option
lhotse-prepare-gale-arabic command line option
lhotse-prepare-gale-mandarin command line option
lhotse-split command line option
-t
lhotse-copy-feats command line option
lhotse-feat-extract command line option
lhotse-prepare-gale-arabic command line option
lhotse-prepare-gale-mandarin command line option
-td
lhotse-prepare-fisher-english command line option
-u
lhotse-kaldi-export command line option
lhotse-kaldi-import command line option
-v1
lhotse-prepare-voxceleb command line option
-v2
lhotse-prepare-voxceleb command line option
_
__call__() (lhotse.dataset.input_strategies.AudioSamples method)
(lhotse.dataset.input_strategies.BatchIO method)
(lhotse.dataset.input_strategies.OnTheFlyFeatures method)
(lhotse.dataset.input_strategies.PrecomputedFeatures method)
__init__() (lhotse.audio.AudioLoadingError method)
(lhotse.audio.AudioMixer method)
(lhotse.audio.AudioSource method)
(lhotse.audio.CompositeAudioBackend method)
(lhotse.audio.DurationMismatchError method)
(lhotse.audio.Recording method)
(lhotse.audio.RecordingSet method)
(lhotse.dataset.collation.TokenCollater method)
(lhotse.dataset.cut_transforms.CutConcatenate method)
(lhotse.dataset.cut_transforms.CutMix method)
(lhotse.dataset.cut_transforms.ExtraPadding method)
(lhotse.dataset.cut_transforms.PerturbSpeed method)
(lhotse.dataset.cut_transforms.PerturbTempo method)
(lhotse.dataset.cut_transforms.PerturbVolume method)
(lhotse.dataset.cut_transforms.ReverbWithImpulseResponse method)
(lhotse.dataset.diarization.DiarizationDataset method)
(lhotse.dataset.input_strategies.AudioSamples method)
(lhotse.dataset.input_strategies.BatchIO method)
(lhotse.dataset.input_strategies.OnTheFlyFeatures method)
(lhotse.dataset.signal_transforms.DereverbWPE method)
(lhotse.dataset.signal_transforms.GlobalMVN method)
(lhotse.dataset.signal_transforms.RandomizedSmoothing method)
(lhotse.dataset.signal_transforms.SpecAugment method)
(lhotse.dataset.source_separation.DynamicallyMixedSourceSeparationDataset method)
(lhotse.dataset.source_separation.PreMixedSourceSeparationDataset method)
(lhotse.dataset.speech_recognition.K2SpeechRecognitionDataset method)
(lhotse.dataset.unsupervised.DynamicUnsupervisedDataset method)
(lhotse.dataset.unsupervised.UnsupervisedDataset method)
(lhotse.dataset.unsupervised.UnsupervisedWaveformDataset method)
(lhotse.dataset.vad.VadDataset method)
(lhotse.features.base.FeatureExtractor method)
(lhotse.features.base.Features method)
(lhotse.features.base.FeatureSet method)
(lhotse.features.base.FeatureSetBuilder method)
(lhotse.features.base.StatsAccumulator method)
(lhotse.features.base.TorchaudioFeatureExtractor method)
(lhotse.features.fbank.TorchaudioFbank method)
(lhotse.features.fbank.TorchaudioFbankConfig method)
(lhotse.features.io.ChunkedLilcomHdf5Reader method)
(lhotse.features.io.ChunkedLilcomHdf5Writer method)
(lhotse.features.io.KaldiReader method)
(lhotse.features.io.KaldiWriter method)
(lhotse.features.io.LilcomChunkyReader method)
(lhotse.features.io.LilcomChunkyWriter method)
(lhotse.features.io.LilcomFilesReader method)
(lhotse.features.io.LilcomFilesWriter method)
(lhotse.features.io.LilcomHdf5Reader method)
(lhotse.features.io.LilcomHdf5Writer method)
(lhotse.features.io.LilcomURLReader method)
(lhotse.features.io.LilcomURLWriter method)
(lhotse.features.io.MemoryLilcomReader method)
(lhotse.features.io.MemoryLilcomWriter method)
(lhotse.features.io.MemoryRawReader method)
(lhotse.features.io.MemoryRawWriter method)
(lhotse.features.io.NumpyFilesReader method)
(lhotse.features.io.NumpyFilesWriter method)
(lhotse.features.io.NumpyHdf5Reader method)
(lhotse.features.io.NumpyHdf5Writer method)
(lhotse.features.kaldi.extractors.Fbank method)
(lhotse.features.kaldi.extractors.Mfcc method)
(lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
(lhotse.features.librosa_fbank.LibrosaFbank method)
(lhotse.features.librosa_fbank.LibrosaFbankConfig method)
(lhotse.features.mfcc.TorchaudioMfcc method)
(lhotse.features.mfcc.TorchaudioMfccConfig method)
(lhotse.features.mixer.FeatureMixer method)
(lhotse.features.spectrogram.Spectrogram method)
(lhotse.features.spectrogram.SpectrogramConfig method)
(lhotse.supervision.SupervisionSegment method)
(lhotse.supervision.SupervisionSet method)
A
add_module() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
add_to_mix() (lhotse.audio.AudioMixer method)
(lhotse.features.mixer.FeatureMixer method)
alignment (lhotse.supervision.SupervisionSegment attribute)
AlignmentItem (class in lhotse.supervision)
append_cuts() (in module lhotse.cut)
apply() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
args (lhotse.audio.AudioLoadingError attribute)
(lhotse.audio.DurationMismatchError attribute)
assert_and_maybe_fix_num_samples() (in module lhotse.audio)
AUDIO_DIR
lhotse-download-icsi command line option
lhotse-prepare-broadcast-news command line option
lhotse-prepare-callhome-egyptian command line option
lhotse-prepare-callhome-english command line option
lhotse-prepare-fisher-spanish command line option
lhotse-prepare-icsi command line option
lhotse-prepare-switchboard command line option
audio_energy() (in module lhotse.audio)
AudioBackend (class in lhotse.audio)
AudioLoadingError
AudioMixer (class in lhotse.audio)
audioread_info() (in module lhotse.audio)
audioread_load() (in module lhotse.audio)
AudioreadBackend (class in lhotse.audio)
AudioSamples (class in lhotse.dataset.input_strategies)
AudioSource (class in lhotse.audio)
available_storage_backends() (in module lhotse.features.io)
available_windows() (in module lhotse.features.kaldi.layers)
B
BatchIO (class in lhotse.dataset.input_strategies)
bfloat16() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
buffers() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
C
cepstral_lifter (lhotse.features.mfcc.TorchaudioMfccConfig attribute)
channel (lhotse.supervision.SupervisionSegment attribute)
channel_ids (lhotse.audio.Recording attribute)
channels (lhotse.audio.AudioSource attribute)
(lhotse.audio.LibsndfileCompatibleAudioInfo property)
(lhotse.features.base.Features attribute)
check_h5py_installed() (in module lhotse.features.io)
children() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
CHUNK_SIZE
lhotse-split-lazy command line option
CHUNK_SIZE (lhotse.features.io.LilcomChunkyReader attribute)
(lhotse.features.io.LilcomChunkyWriter attribute)
ChunkedLilcomHdf5Reader (class in lhotse.features.io)
ChunkedLilcomHdf5Writer (class in lhotse.features.io)
close() (lhotse.features.io.ChunkedLilcomHdf5Writer method)
(lhotse.features.io.KaldiWriter method)
(lhotse.features.io.LilcomChunkyWriter method)
(lhotse.features.io.LilcomHdf5Writer method)
(lhotse.features.io.MemoryLilcomWriter method)
(lhotse.features.io.MemoryRawWriter method)
(lhotse.features.io.NumpyHdf5Writer method)
close_cached_file_handles() (in module lhotse.features.io)
collate_audio() (in module lhotse.dataset.collation)
collate_custom_field() (in module lhotse.dataset.collation)
collate_features() (in module lhotse.dataset.collation)
collate_matrices() (in module lhotse.dataset.collation)
collate_multi_channel_audio() (in module lhotse.dataset.collation)
collate_multi_channel_features() (in module lhotse.dataset.collation)
collate_vectors() (in module lhotse.dataset.collation)
combine() (in module lhotse.manipulation)
CompositeAudioBackend (class in lhotse.audio)
compute_energy() (lhotse.features.base.FeatureExtractor static method)
(lhotse.features.base.TorchaudioFeatureExtractor static method)
(lhotse.features.fbank.TorchaudioFbank static method)
(lhotse.features.kaldi.extractors.Fbank static method)
(lhotse.features.librosa_fbank.LibrosaFbank static method)
(lhotse.features.mfcc.TorchaudioMfcc static method)
(lhotse.features.spectrogram.Spectrogram static method)
compute_global_stats() (in module lhotse.features.base)
(lhotse.features.base.FeatureSet method)
compute_supervisions_frame_mask() (in module lhotse.cut)
config_type (lhotse.features.base.FeatureExtractor attribute)
(lhotse.features.base.TorchaudioFeatureExtractor attribute)
(lhotse.features.fbank.TorchaudioFbank attribute)
(lhotse.features.kaldi.extractors.Fbank attribute)
(lhotse.features.kaldi.extractors.Mfcc attribute)
(lhotse.features.librosa_fbank.LibrosaFbank attribute)
(lhotse.features.mfcc.TorchaudioMfcc attribute)
(lhotse.features.spectrogram.Spectrogram attribute)
copy_feats() (lhotse.features.base.Features method)
(lhotse.features.base.FeatureSet method)
CORPUS_DIR
lhotse-prepare-adept command line option
lhotse-prepare-aidatatang-200zh command line option
lhotse-prepare-aishell command line option
lhotse-prepare-aishell2 command line option
lhotse-prepare-aishell4 command line option
lhotse-prepare-ali-meeting command line option
lhotse-prepare-ami command line option
lhotse-prepare-aspire command line option
lhotse-prepare-babel command line option
lhotse-prepare-bvcc command line option
lhotse-prepare-cmu-arctic command line option
lhotse-prepare-cmu-indic command line option
lhotse-prepare-cmu-kids command line option
lhotse-prepare-commonvoice command line option
lhotse-prepare-csj command line option
lhotse-prepare-cslu-kids command line option
lhotse-prepare-daily-talk command line option
lhotse-prepare-earnings21 command line option
lhotse-prepare-earnings22 command line option
lhotse-prepare-eval2000 command line option
lhotse-prepare-fisher-english command line option
lhotse-prepare-gigaspeech command line option
lhotse-prepare-hifitts command line option
lhotse-prepare-l2-arctic command line option
lhotse-prepare-libricss command line option
lhotse-prepare-librispeech command line option
lhotse-prepare-libritts command line option
lhotse-prepare-ljspeech command line option
lhotse-prepare-magicdata command line option
lhotse-prepare-mgb2 command line option
lhotse-prepare-mls command line option
lhotse-prepare-mtedx command line option
lhotse-prepare-musan command line option
lhotse-prepare-nsc command line option
lhotse-prepare-peoples-speech command line option
lhotse-prepare-primewords command line option
lhotse-prepare-rir-noise command line option
lhotse-prepare-spgispeech command line option
lhotse-prepare-stcmds command line option
lhotse-prepare-tal-asr command line option
lhotse-prepare-tal-csasr command line option
lhotse-prepare-thchs-30 command line option
lhotse-prepare-timit command line option
lhotse-prepare-vctk command line option
lhotse-prepare-wenet-speech command line option
lhotse-prepare-yesno command line option
count() (lhotse.audio.LibsndfileCompatibleAudioInfo method)
(lhotse.supervision.AlignmentItem method)
cpu() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
create_cut_set_eager() (in module lhotse.cut)
create_cut_set_lazy() (in module lhotse.cut)
create_default_feature_extractor() (in module lhotse.features.base)
create_frame_window() (in module lhotse.features.kaldi.layers)
create_mel_scale() (in module lhotse.features.kaldi.layers)
cuda() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
custom (lhotse.supervision.SupervisionSegment attribute)
CUT_MANIFEST
lhotse-cut-pad command line option
lhotse-cut-truncate command line option
CUT_MANIFESTS
lhotse-cut-append command line option
lhotse-cut-mix-by-recording-id command line option
lhotse-cut-mix-sequential command line option
CutConcatenate (class in lhotse.dataset.cut_transforms)
CutMix (class in lhotse.dataset.cut_transforms)
CUTS
lhotse-cut-trim-to-supervisions command line option
CUTSET
lhotse-cut-decompose command line option
lhotse-cut-describe command line option
lhotse-cut-export-to-webdataset command line option
lhotse-feat-extract-cuts command line option
lhotse-feat-extract-cuts-batch command line option
D
data (lhotse.audio.RecordingSet property)
(lhotse.features.base.FeatureSet property)
(lhotse.supervision.SupervisionSet property)
DATA_DIR
lhotse-kaldi-import command line option
DereverbWPE (class in lhotse.dataset.signal_transforms)
deserialize() (lhotse.supervision.AlignmentItem static method)
device (lhotse.features.base.FeatureExtractor property)
(lhotse.features.base.TorchaudioFeatureExtractor property)
(lhotse.features.fbank.TorchaudioFbank property)
(lhotse.features.librosa_fbank.LibrosaFbank property)
(lhotse.features.mfcc.TorchaudioMfcc property)
(lhotse.features.spectrogram.Spectrogram property)
DiarizationDataset (class in lhotse.dataset.diarization)
dither (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.kaldi.layers.Wav2FFT property)
(lhotse.features.kaldi.layers.Wav2LogFilterBank property)
(lhotse.features.kaldi.layers.Wav2LogSpec property)
(lhotse.features.kaldi.layers.Wav2MFCC property)
(lhotse.features.kaldi.layers.Wav2Spec property)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
double() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
dump_patches (lhotse.features.kaldi.layers.Wav2FFT attribute)
(lhotse.features.kaldi.layers.Wav2LogFilterBank attribute)
(lhotse.features.kaldi.layers.Wav2LogSpec attribute)
(lhotse.features.kaldi.layers.Wav2MFCC attribute)
(lhotse.features.kaldi.layers.Wav2Spec attribute)
(lhotse.features.kaldi.layers.Wav2Win attribute)
duration (lhotse.audio.LibsndfileCompatibleAudioInfo property)
(lhotse.audio.Recording attribute)
(lhotse.features.base.Features attribute)
(lhotse.supervision.AlignmentItem property)
(lhotse.supervision.SupervisionSegment attribute)
duration() (lhotse.audio.RecordingSet method)
DurationMismatchError
DynamicallyMixedSourceSeparationDataset (class in lhotse.dataset.source_separation)
DynamicUnsupervisedDataset (class in lhotse.dataset.unsupervised)
E
end (lhotse.features.base.Features property)
(lhotse.supervision.AlignmentItem property)
(lhotse.supervision.SupervisionSegment property)
energy_floor (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
eval() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
export_to_kaldi() (in module lhotse.kaldi)
extra_repr() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
extract() (lhotse.features.base.FeatureExtractor method)
(lhotse.features.base.TorchaudioFeatureExtractor method)
(lhotse.features.fbank.TorchaudioFbank method)
(lhotse.features.kaldi.extractors.Fbank method)
(lhotse.features.kaldi.extractors.Mfcc method)
(lhotse.features.librosa_fbank.LibrosaFbank method)
(lhotse.features.mfcc.TorchaudioMfcc method)
(lhotse.features.spectrogram.Spectrogram method)
extract_batch() (lhotse.features.base.FeatureExtractor method)
(lhotse.features.base.TorchaudioFeatureExtractor method)
(lhotse.features.fbank.TorchaudioFbank method)
(lhotse.features.librosa_fbank.LibrosaFbank method)
(lhotse.features.mfcc.TorchaudioMfcc method)
(lhotse.features.spectrogram.Spectrogram method)
extract_from_recording_and_store() (lhotse.features.base.FeatureExtractor method)
(lhotse.features.base.TorchaudioFeatureExtractor method)
(lhotse.features.fbank.TorchaudioFbank method)
(lhotse.features.librosa_fbank.LibrosaFbank method)
(lhotse.features.mfcc.TorchaudioMfcc method)
(lhotse.features.spectrogram.Spectrogram method)
extract_from_samples_and_store() (lhotse.features.base.FeatureExtractor method)
(lhotse.features.base.TorchaudioFeatureExtractor method)
(lhotse.features.fbank.TorchaudioFbank method)
(lhotse.features.librosa_fbank.LibrosaFbank method)
(lhotse.features.mfcc.TorchaudioMfcc method)
(lhotse.features.spectrogram.Spectrogram method)
ExtraPadding (class in lhotse.dataset.cut_transforms)
F
Fbank (class in lhotse.features.kaldi.extractors)
feature_dim() (lhotse.features.base.FeatureExtractor method)
(lhotse.features.base.TorchaudioFeatureExtractor method)
(lhotse.features.fbank.TorchaudioFbank method)
(lhotse.features.kaldi.extractors.Fbank method)
(lhotse.features.kaldi.extractors.Mfcc method)
(lhotse.features.librosa_fbank.LibrosaFbank method)
(lhotse.features.mfcc.TorchaudioMfcc method)
(lhotse.features.spectrogram.Spectrogram method)
FEATURE_MANIFEST
lhotse-feat-upload command line option
FeatureExtractor (class in lhotse.features.base)
FeatureMixer (class in lhotse.features.mixer)
Features (class in lhotse.features.base)
FeatureSet (class in lhotse.features.base)
FeatureSetBuilder (class in lhotse.features.base)
FeaturesReader (class in lhotse.features.io)
FeaturesWriter (class in lhotse.features.io)
FfmpegSubprocessOpusBackend (class in lhotse.audio)
FfmpegTorchaudioStreamerBackend (class in lhotse.audio)
fft_size (lhotse.features.librosa_fbank.LibrosaFbankConfig attribute)
filter() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
find() (lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
float() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
fmax (lhotse.features.librosa_fbank.LibrosaFbankConfig attribute)
fmin (lhotse.features.librosa_fbank.LibrosaFbankConfig attribute)
forward() (lhotse.dataset.signal_transforms.DereverbWPE method)
(lhotse.dataset.signal_transforms.GlobalMVN method)
(lhotse.dataset.signal_transforms.RandomizedSmoothing method)
(lhotse.dataset.signal_transforms.SpecAugment method)
(lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
frame_length (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.kaldi.layers.Wav2FFT property)
(lhotse.features.kaldi.layers.Wav2LogFilterBank property)
(lhotse.features.kaldi.layers.Wav2LogSpec property)
(lhotse.features.kaldi.layers.Wav2MFCC property)
(lhotse.features.kaldi.layers.Wav2Spec property)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
frame_shift (lhotse.features.base.FeatureExtractor property)
(lhotse.features.base.Features attribute)
(lhotse.features.base.TorchaudioFeatureExtractor property)
(lhotse.features.fbank.TorchaudioFbank property)
(lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.kaldi.extractors.Fbank property)
(lhotse.features.kaldi.extractors.Mfcc property)
(lhotse.features.kaldi.layers.Wav2FFT property)
(lhotse.features.kaldi.layers.Wav2LogFilterBank property)
(lhotse.features.kaldi.layers.Wav2LogSpec property)
(lhotse.features.kaldi.layers.Wav2MFCC property)
(lhotse.features.kaldi.layers.Wav2Spec property)
(lhotse.features.librosa_fbank.LibrosaFbank property)
(lhotse.features.mfcc.TorchaudioMfcc property)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.Spectrogram property)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
frames (lhotse.audio.LibsndfileCompatibleAudioInfo property)
from_bytes() (lhotse.audio.Recording static method)
from_cuts() (lhotse.dataset.signal_transforms.GlobalMVN class method)
from_dict() (lhotse.audio.AudioSource static method)
(lhotse.audio.Recording static method)
(lhotse.features.base.FeatureExtractor class method)
(lhotse.features.base.Features static method)
(lhotse.features.base.TorchaudioFeatureExtractor class method)
(lhotse.features.fbank.TorchaudioFbank class method)
(lhotse.features.fbank.TorchaudioFbankConfig static method)
(lhotse.features.librosa_fbank.LibrosaFbank class method)
(lhotse.features.librosa_fbank.LibrosaFbankConfig static method)
(lhotse.features.mfcc.TorchaudioMfcc class method)
(lhotse.features.mfcc.TorchaudioMfccConfig static method)
(lhotse.features.spectrogram.Spectrogram class method)
(lhotse.features.spectrogram.SpectrogramConfig static method)
(lhotse.supervision.SupervisionSegment static method)
from_dicts() (lhotse.audio.RecordingSet static method)
(lhotse.features.base.FeatureSet static method)
(lhotse.supervision.SupervisionSet static method)
from_dir() (lhotse.audio.RecordingSet static method)
from_features() (lhotse.features.base.FeatureSet static method)
from_file() (lhotse.audio.Recording static method)
(lhotse.audio.RecordingSet class method)
(lhotse.dataset.signal_transforms.GlobalMVN class method)
(lhotse.features.base.FeatureSet class method)
(lhotse.supervision.SupervisionSet class method)
from_items() (lhotse.audio.RecordingSet static method)
(lhotse.features.base.FeatureSet static method)
(lhotse.supervision.SupervisionSet static method)
from_json() (lhotse.audio.RecordingSet class method)
(lhotse.features.base.FeatureSet class method)
(lhotse.supervision.SupervisionSet class method)
from_jsonl() (lhotse.audio.RecordingSet class method)
(lhotse.features.base.FeatureSet class method)
(lhotse.supervision.SupervisionSet class method)
from_jsonl_lazy() (lhotse.audio.RecordingSet class method)
(lhotse.features.base.FeatureSet class method)
(lhotse.supervision.SupervisionSet class method)
from_recordings() (lhotse.audio.RecordingSet static method)
from_rttm() (lhotse.supervision.SupervisionSet static method)
from_segments() (lhotse.supervision.SupervisionSet static method)
from_yaml() (lhotse.audio.RecordingSet class method)
(lhotse.features.base.FeatureExtractor class method)
(lhotse.features.base.FeatureSet class method)
(lhotse.features.base.TorchaudioFeatureExtractor class method)
(lhotse.features.fbank.TorchaudioFbank class method)
(lhotse.features.librosa_fbank.LibrosaFbank class method)
(lhotse.features.mfcc.TorchaudioMfcc class method)
(lhotse.features.spectrogram.Spectrogram class method)
(lhotse.supervision.SupervisionSet class method)
G
gender (lhotse.supervision.SupervisionSegment attribute)
get() (lhotse.features.base.StatsAccumulator method)
get_buffer() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
get_default_audio_backend() (in module lhotse.audio)
get_duration() (in module lhotse.kaldi)
get_extra_state() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
get_extractor_type() (in module lhotse.features.base)
get_memory_writer() (in module lhotse.features.io)
get_parameter() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
get_reader() (in module lhotse.features.io)
get_submodule() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
get_writer() (in module lhotse.features.io)
GlobalMVN (class in lhotse.dataset.signal_transforms)
H
half() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
handles_special_case() (lhotse.audio.AudioBackend method)
(lhotse.audio.AudioreadBackend method)
(lhotse.audio.CompositeAudioBackend method)
(lhotse.audio.FfmpegSubprocessOpusBackend method)
(lhotse.audio.FfmpegTorchaudioStreamerBackend method)
(lhotse.audio.LibsndfileBackend method)
(lhotse.audio.Sph2pipeSubprocessBackend method)
(lhotse.audio.TorchaudioDefaultBackend method)
high_freq (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
hop_size (lhotse.features.librosa_fbank.LibrosaFbankConfig attribute)
I
id (lhotse.audio.Recording attribute)
(lhotse.supervision.SupervisionSegment attribute)
ids (lhotse.audio.RecordingSet property)
(lhotse.supervision.SupervisionSet property)
IN_CUTS
lhotse-workflows-align-with-torchaudio command line option
index() (lhotse.audio.LibsndfileCompatibleAudioInfo method)
(lhotse.supervision.AlignmentItem method)
info() (in module lhotse.audio)
INPUT_MANIFEST
lhotse-copy command line option
lhotse-copy-feats command line option
inverse() (lhotse.dataset.collation.TokenCollater method)
(lhotse.dataset.signal_transforms.GlobalMVN method)
ipu() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
is_applicable() (lhotse.audio.AudioBackend method)
(lhotse.audio.AudioreadBackend method)
(lhotse.audio.CompositeAudioBackend method)
(lhotse.audio.FfmpegSubprocessOpusBackend method)
(lhotse.audio.FfmpegTorchaudioStreamerBackend method)
(lhotse.audio.LibsndfileBackend method)
(lhotse.audio.Sph2pipeSubprocessBackend method)
(lhotse.audio.TorchaudioDefaultBackend method)
is_lazy (lhotse.audio.RecordingSet property)
(lhotse.features.base.FeatureSet property)
(lhotse.supervision.SupervisionSet property)
K
K2SpeechRecognitionDataset (class in lhotse.dataset.speech_recognition)
KaldiReader (class in lhotse.features.io)
KaldiWriter (class in lhotse.features.io)
L
language (lhotse.supervision.SupervisionSegment attribute)
lhotse command line option
--seed <seed>
-s
lhotse-combine command line option
MANIFESTS
OUTPUT_MANIFEST
lhotse-copy command line option
INPUT_MANIFEST
OUTPUT_MANIFEST
lhotse-copy-feats command line option
--max-jobs <max_jobs>
--storage-type <storage_type>
-j
-t
INPUT_MANIFEST
OUTPUT_MANIFEST
STORAGE_PATH
lhotse-cut-append command line option
CUT_MANIFESTS
OUTPUT_CUT_MANIFEST
lhotse-cut-decompose command line option
CUTSET
OUTPUT
lhotse-cut-describe command line option
CUTSET
lhotse-cut-export-to-webdataset command line option
--audio
--audio-format <audio_format>
--custom
--fault-tolerant
--features
--no-audio
--no-custom
--no-features
--shard-size <shard_size>
--stop-on-fail
-f
-s
CUTSET
WSPECIFIER
lhotse-cut-mix-by-recording-id command line option
CUT_MANIFESTS
OUTPUT_CUT_MANIFEST
lhotse-cut-mix-sequential command line option
CUT_MANIFESTS
OUTPUT_CUT_MANIFEST
lhotse-cut-pad command line option
--duration <duration>
-d
CUT_MANIFEST
OUTPUT_CUT_MANIFEST
lhotse-cut-simple command line option
--feature-manifest <feature_manifest>
--force-eager
--recording-manifest <recording_manifest>
--supervision-manifest <supervision_manifest>
-f
-r
-s
OUTPUT_CUT_MANIFEST
lhotse-cut-trim-to-supervisions command line option
--context-direction <context_direction>
--discard-overlapping
--keep-overlapping
--min-duration <min_duration>
-c
-d
CUTS
OUTPUT_CUTS
lhotse-cut-truncate command line option
--discard-overflowing-supervisions
--keep-overflowing-supervisions
--max-duration <max_duration>
--offset-type <offset_type>
--preserve-id
-d
-o
CUT_MANIFEST
OUTPUT_CUT_MANIFEST
lhotse-download-adept command line option
TARGET_DIR
lhotse-download-aidatatang-200zh command line option
TARGET_DIR
lhotse-download-aishell command line option
TARGET_DIR
lhotse-download-aishell4 command line option
TARGET_DIR
lhotse-download-ali-meeting command line option
--force-download
TARGET_DIR
lhotse-download-ami command line option
--annotations <annotations>
--force-download <force_download>
--mic <mic>
--url <url>
TARGET_DIR
lhotse-download-cmu-arctic command line option
TARGET_DIR
lhotse-download-cmu-indic command line option
TARGET_DIR
lhotse-download-daily-talk command line option
--force-download
TARGET_DIR
lhotse-download-earnings21 command line option
TARGET_DIR
lhotse-download-gigaspeech command line option
--host <host>
--subset <subset>
PASSWORD
TARGET_DIR
lhotse-download-heroico command line option
TARGET_DIR
lhotse-download-hifitts command line option
TARGET_DIR
lhotse-download-icsi command line option
--force-download <force_download>
--mic <mic>
--transcripts-dir <transcripts_dir>
--url <url>
AUDIO_DIR
lhotse-download-libricss command line option
--force-download
TARGET_DIR
lhotse-download-librimix command line option
TARGET_DIR
lhotse-download-librispeech command line option
--full
--mini
TARGET_DIR
lhotse-download-libritts command line option
TARGET_DIR
lhotse-download-ljspeech command line option
TARGET_DIR
lhotse-download-magicdata command line option
TARGET_DIR
lhotse-download-mtedx command line option
--lang <lang>
-l
TARGET_DIR
lhotse-download-musan command line option
TARGET_DIR
lhotse-download-primewords command line option
TARGET_DIR
lhotse-download-rir-noise command line option
TARGET_DIR
lhotse-download-spgispeech command line option
TARGET_DIR
lhotse-download-stcmds command line option
TARGET_DIR
lhotse-download-tedlium command line option
TARGET_DIR
lhotse-download-thchs-30 command line option
TARGET_DIR
lhotse-download-timit command line option
TARGET_DIR
lhotse-download-vctk command line option
TARGET_DIR
lhotse-download-voxceleb1 command line option
--force-download
TARGET_DIR
lhotse-download-voxceleb2 command line option
--force-download
TARGET_DIR
lhotse-download-yesno command line option
TARGET_DIR
lhotse-feat-extract command line option
--feature-manifest <feature_manifest>
--lilcom-tick-power <lilcom_tick_power>
--num-jobs <num_jobs>
--root-dir <root_dir>
--storage-type <storage_type>
-f
-j
-r
-t
OUTPUT_DIR
RECORDING_MANIFEST
lhotse-feat-extract-cuts command line option
--feature-manifest <feature_manifest>
--num-jobs <num_jobs>
--storage-type <storage_type>
-f
-j
CUTSET
OUTPUT_CUTSET
STORAGE_PATH
lhotse-feat-extract-cuts-batch command line option
--batch-duration <batch_duration>
--feature-manifest <feature_manifest>
--num-jobs <num_jobs>
--storage-type <storage_type>
-b
-f
-j
CUTSET
OUTPUT_CUTSET
STORAGE_PATH
lhotse-feat-upload command line option
--num-jobs <num_jobs>
-j
FEATURE_MANIFEST
OUTPUT_MANIFEST
URL
lhotse-feat-write-default-config command line option
--feature-type <feature_type>
-f
OUTPUT_CONFIG
lhotse-filter command line option
MANIFEST
OUTPUT_MANIFEST
PREDICATE
lhotse-fix command line option
OUTPUT_DIR
RECORDINGS
SUPERVISIONS
lhotse-install-sph2pipe command line option
--install-dir <install_dir>
--url <url>
lhotse-kaldi-export command line option
--map-underscores-to <map_underscores_to>
--prefix-spk-id
-p
-u
OUTPUT_DIR
RECORDINGS
SUPERVISIONS
lhotse-kaldi-import command line option
--compute-durations
--frame-shift <frame_shift>
--map-string-to-underscores <map_string_to_underscores>
--num-jobs <num_jobs>
-d
-f
-j
-u
DATA_DIR
MANIFEST_DIR
SAMPLING_RATE
lhotse-prepare-adept command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-aidatatang-200zh command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-aishell command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-aishell2 command line option
--num-jobs <num_jobs>
-j
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-aishell4 command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-ali-meeting command line option
--mic <mic>
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-ami command line option
--annotations <annotations>
--mic <mic>
--normalize-text <normalize_text>
--partition <partition>
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-aspire command line option
--mic <mic>
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-babel command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-broadcast-news command line option
AUDIO_DIR
OUTPUT_DIR
TRANSCRIPT_DIR
lhotse-prepare-bvcc command line option
--num_jobs <num_jobs>
-nj
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-callhome-egyptian command line option
--absolute-paths <absolute_paths>
AUDIO_DIR
OUTPUT_DIR
TRANSCRIPT_DIR
lhotse-prepare-callhome-english command line option
--absolute-paths <absolute_paths>
--rttm-dir <rttm_dir>
--transcript-dir <transcript_dir>
AUDIO_DIR
OUTPUT_DIR
lhotse-prepare-cmu-arctic command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-cmu-indic command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-cmu-kids command line option
--absolute-paths <absolute_paths>
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-commonvoice command line option
--language <language>
--num-jobs <num_jobs>
--split <split>
-j
-l
-s
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-csj command line option
--configs <configs>
--dataset-parts <dataset_parts>
--num-jobs <num_jobs>
-c
-j
-p
CORPUS_DIR
MANIFEST_DIR
TRANSCRIPT_DIR
lhotse-prepare-cslu-kids command line option
--absolute-paths <absolute_paths>
--normalize-text <normalize_text>
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-daily-talk command line option
--num-jobs <num_jobs>
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-dihard3 command line option
--dev <dev>
--eval <eval>
--no-uem
--num-jobs <num_jobs>
--uem
-j
OUTPUT_DIR
lhotse-prepare-earnings21 command line option
--no-normalize-text
--normalize-text
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-earnings22 command line option
--no-normalize-text
--normalize-text
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-eval2000 command line option
--absolute-paths <absolute_paths>
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-fisher-english command line option
--absolute-paths <absolute_paths>
--audio-dirs <audio_dirs>
--num-jobs <num_jobs>
--transcript-dirs <transcript_dirs>
-ad
-j
-td
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-fisher-spanish command line option
--absolute-paths <absolute_paths>
AUDIO_DIR
OUTPUT_DIR
TRANSCRIPT_DIR
lhotse-prepare-gale-arabic command line option
--absolute-paths <absolute_paths>
--audio <audio>
--transcript <transcript>
-s
-t
OUTPUT_DIR
lhotse-prepare-gale-mandarin command line option
--absolute-paths <absolute_paths>
--audio <audio>
--segment-words <segment_words>
--transcript <transcript>
-s
-t
OUTPUT_DIR
lhotse-prepare-gigaspeech command line option
--num-jobs <num_jobs>
--subset <subset>
-j
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-heroico command line option
OUTPUT_DIR
SPEECH_DIR
TRANSCRIPT_DIR
lhotse-prepare-hifitts command line option
--num-jobs <num_jobs>
-j
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-icsi command line option
--mic <mic>
--normalize-text
--transcripts-dir <transcripts_dir>
AUDIO_DIR
OUTPUT_DIR
lhotse-prepare-l2-arctic command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-libricss command line option
--type <type>
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-librimix command line option
--min-segment-seconds <min_segment_seconds>
--no-precomputed-mixtures
--sampling-rate <sampling_rate>
--with-precomputed-mixtures
LIBRIMIX_CSV
OUTPUT_DIR
lhotse-prepare-librispeech command line option
--dataset-parts <dataset_parts>
--num-jobs <num_jobs>
-j
-p
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-libritts command line option
--link-previous-utterance
--no-previous-utterance
--num-jobs <num_jobs>
-j
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-ljspeech command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-magicdata command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-mgb2 command line option
--buck-walter
--mer-thresh <mer_thresh>
--no-buck-walter
--no-text-cleaning
--num-jobs <num_jobs>
--text-cleaning
-j
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-mls command line option
--flac
--num-jobs <num_jobs>
--opus
-j
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-mtedx command line option
--lang <lang>
--num-jobs <num_jobs>
-j
-l
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-musan command line option
--no-vocals
--use-vocals
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-nsc command line option
--dataset-part <dataset_part>
-p
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-peoples-speech command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-primewords command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-rir-noise command line option
--parts <parts>
-p
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-spgispeech command line option
--no-normalize-text
--normalize-text
--num-jobs <num_jobs>
-j
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-stcmds command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-switchboard command line option
--absolute-paths <absolute_paths>
--omit-silence
--retain-silence
--sentiment-dir <sentiment_dir>
--transcript-dir <transcript_dir>
AUDIO_DIR
OUTPUT_DIR
lhotse-prepare-tal-asr command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-tal-csasr command line option
--num-jobs <num_jobs>
-j
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-tedlium command line option
OUTPUT_DIR
TEDLIUM_DIR
lhotse-prepare-thchs-30 command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-timit command line option
--num-jobs <num_jobs>
--num-phones <num_phones>
-j
-p
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-vctk command line option
--use-edinburgh-vctk-url <use_edinburgh_vctk_url>
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-voxceleb command line option
--num-jobs <num_jobs>
--voxceleb1 <voxceleb1>
--voxceleb2 <voxceleb2>
-j
-v1
-v2
OUTPUT_DIR
lhotse-prepare-wenet-speech command line option
--dataset-parts <dataset_parts>
--num-jobs <num_jobs>
-j
-p
CORPUS_DIR
OUTPUT_DIR
lhotse-prepare-yesno command line option
CORPUS_DIR
OUTPUT_DIR
lhotse-split command line option
--no-pad
--pad
--shuffle
-s
MANIFEST
NUM_SPLITS
OUTPUT_DIR
lhotse-split-lazy command line option
CHUNK_SIZE
MANIFEST
OUTPUT_DIR
lhotse-subset command line option
--cutids <cutids>
--first <first>
--last <last>
MANIFEST
OUTPUT_MANIFEST
lhotse-validate command line option
--dont-read-data
--read-data
MANIFEST
lhotse-validate-pair command line option
--dont-read-data
--read-data
RECORDINGS
SUPERVISIONS
lhotse-workflows-align-with-torchaudio command line option
--bundle-name <bundle_name>
--device <device>
--dont-normalize-text
--normalize-text
-d
-n
IN_CUTS
OUT_CUTS
lhotse-workflows-annotate-with-whisper command line option
--cuts-manifest <cuts_manifest>
--device <device>
--extension <extension>
--jobs <jobs>
--language <language>
--model-name <model_name>
--recordings-dir <recordings_dir>
--recordings-manifest <recordings_manifest>
-c
-d
-e
-j
-l
-m
-n
-r
OUT_CUTS
lhotse.audio
module
lhotse.augmentation
module
lhotse.cut
module
lhotse.dataset.collation
module
lhotse.dataset.cut_transforms
module
lhotse.dataset.diarization
module
lhotse.dataset.input_strategies
module
lhotse.dataset.sampling
module
lhotse.dataset.signal_transforms
module
lhotse.dataset.speech_recognition
module
lhotse.dataset.unsupervised
module
lhotse.dataset.vad
module
lhotse.features.base
module
lhotse.features.fbank
module
lhotse.features.io
module
lhotse.features.librosa_fbank
module
lhotse.features.mfcc
module
lhotse.features.mixer
module
lhotse.features.spectrogram
module
lhotse.kaldi
module
lhotse.manipulation
module
lhotse.recipes
module
lhotse.supervision
module
LIBRIMIX_CSV
lhotse-prepare-librimix command line option
LibrosaFbank (class in lhotse.features.librosa_fbank)
LibrosaFbankConfig (class in lhotse.features.librosa_fbank)
LibsndfileBackend (class in lhotse.audio)
LibsndfileCompatibleAudioInfo (class in lhotse.audio)
LilcomChunkyReader (class in lhotse.features.io)
LilcomChunkyWriter (class in lhotse.features.io)
LilcomFilesReader (class in lhotse.features.io)
LilcomFilesWriter (class in lhotse.features.io)
LilcomHdf5Reader (class in lhotse.features.io)
LilcomHdf5Writer (class in lhotse.features.io)
LilcomURLReader (class in lhotse.features.io)
LilcomURLWriter (class in lhotse.features.io)
lin2mel() (in module lhotse.features.kaldi.layers)
load() (lhotse.features.base.Features method)
(lhotse.features.base.FeatureSet method)
load_audio() (lhotse.audio.AudioSource method)
(lhotse.audio.Recording method)
(lhotse.audio.RecordingSet method)
load_kaldi_data_dir() (in module lhotse.kaldi)
load_kaldi_text_mapping() (in module lhotse.kaldi)
load_state_dict() (lhotse.dataset.signal_transforms.SpecAugment method)
(lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
logmelfilterbank() (in module lhotse.features.librosa_fbank)
lookup_cache_or_open() (in module lhotse.features.io)
lookup_chunk_size() (in module lhotse.features.io)
low_freq (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
M
make_dct_matrix() (lhotse.features.kaldi.layers.Wav2MFCC static method)
make_lifter() (lhotse.features.kaldi.layers.Wav2MFCC static method)
make_wavscp_channel_string_map() (in module lhotse.kaldi)
MANIFEST
lhotse-filter command line option
lhotse-split command line option
lhotse-split-lazy command line option
lhotse-subset command line option
lhotse-validate command line option
MANIFEST_DIR
lhotse-kaldi-import command line option
lhotse-prepare-csj command line option
MANIFESTS
lhotse-combine command line option
map() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSegment method)
(lhotse.supervision.SupervisionSet method)
maybe_pad() (in module lhotse.dataset.collation)
mel2lin() (in module lhotse.features.kaldi.layers)
MemoryLilcomReader (class in lhotse.features.io)
MemoryLilcomWriter (class in lhotse.features.io)
MemoryRawReader (class in lhotse.features.io)
MemoryRawWriter (class in lhotse.features.io)
Mfcc (class in lhotse.features.kaldi.extractors)
min_duration (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
mix() (lhotse.features.base.FeatureExtractor static method)
(lhotse.features.base.TorchaudioFeatureExtractor static method)
(lhotse.features.fbank.TorchaudioFbank static method)
(lhotse.features.kaldi.extractors.Fbank static method)
(lhotse.features.librosa_fbank.LibrosaFbank static method)
(lhotse.features.mfcc.TorchaudioMfcc static method)
(lhotse.features.spectrogram.Spectrogram static method)
mix_cuts() (in module lhotse.cut)
mixed_audio (lhotse.audio.AudioMixer property)
mixed_feats (lhotse.features.mixer.FeatureMixer property)
mixed_mono_audio (lhotse.audio.AudioMixer property)
module
lhotse.audio
lhotse.augmentation
lhotse.cut
lhotse.dataset.collation
lhotse.dataset.cut_transforms
lhotse.dataset.diarization
lhotse.dataset.input_strategies
lhotse.dataset.sampling
lhotse.dataset.signal_transforms
lhotse.dataset.speech_recognition
lhotse.dataset.unsupervised
lhotse.dataset.vad
lhotse.features.base
lhotse.features.fbank
lhotse.features.io
lhotse.features.librosa_fbank
lhotse.features.mfcc
lhotse.features.mixer
lhotse.features.spectrogram
lhotse.kaldi
lhotse.manipulation
lhotse.recipes
lhotse.supervision
modules() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
move_to_memory() (lhotse.audio.Recording method)
(lhotse.features.base.Features method)
mux() (lhotse.audio.RecordingSet class method)
(lhotse.features.base.FeatureSet class method)
(lhotse.supervision.SupervisionSet class method)
N
name (lhotse.features.base.FeatureExtractor attribute)
(lhotse.features.base.TorchaudioFeatureExtractor attribute)
(lhotse.features.fbank.TorchaudioFbank attribute)
(lhotse.features.io.ChunkedLilcomHdf5Reader attribute)
(lhotse.features.io.ChunkedLilcomHdf5Writer attribute)
(lhotse.features.io.FeaturesReader property)
(lhotse.features.io.FeaturesWriter property)
(lhotse.features.io.KaldiReader attribute)
(lhotse.features.io.KaldiWriter attribute)
(lhotse.features.io.LilcomChunkyReader attribute)
(lhotse.features.io.LilcomChunkyWriter attribute)
(lhotse.features.io.LilcomFilesReader attribute)
(lhotse.features.io.LilcomFilesWriter attribute)
(lhotse.features.io.LilcomHdf5Reader attribute)
(lhotse.features.io.LilcomHdf5Writer attribute)
(lhotse.features.io.LilcomURLReader attribute)
(lhotse.features.io.LilcomURLWriter attribute)
(lhotse.features.io.MemoryLilcomReader attribute)
(lhotse.features.io.MemoryLilcomWriter attribute)
(lhotse.features.io.MemoryRawReader attribute)
(lhotse.features.io.MemoryRawWriter attribute)
(lhotse.features.io.NumpyFilesReader attribute)
(lhotse.features.io.NumpyFilesWriter attribute)
(lhotse.features.io.NumpyHdf5Reader attribute)
(lhotse.features.io.NumpyHdf5Writer attribute)
(lhotse.features.kaldi.extractors.Fbank attribute)
(lhotse.features.kaldi.extractors.Mfcc attribute)
(lhotse.features.librosa_fbank.LibrosaFbank attribute)
(lhotse.features.mfcc.TorchaudioMfcc attribute)
(lhotse.features.spectrogram.Spectrogram attribute)
named_buffers() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
named_children() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
named_modules() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
named_parameters() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
next_power_of_2() (in module lhotse.features.kaldi.layers)
norm_means (lhotse.features.base.StatsAccumulator property)
norm_stds (lhotse.features.base.StatsAccumulator property)
null_result_on_audio_loading_error() (in module lhotse.audio)
num_ceps (lhotse.features.mfcc.TorchaudioMfccConfig attribute)
num_channels (lhotse.audio.Recording property)
num_channels() (lhotse.audio.RecordingSet method)
num_features (lhotse.features.base.Features attribute)
(lhotse.features.mixer.FeatureMixer property)
num_frames (lhotse.features.base.Features attribute)
num_mel_bins (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.librosa_fbank.LibrosaFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
num_samples (lhotse.audio.Recording attribute)
num_samples() (lhotse.audio.RecordingSet method)
num_samples_total (lhotse.audio.AudioMixer property)
NUM_SPLITS
lhotse-split command line option
NumpyFilesReader (class in lhotse.features.io)
NumpyFilesWriter (class in lhotse.features.io)
NumpyHdf5Reader (class in lhotse.features.io)
NumpyHdf5Writer (class in lhotse.features.io)
O
online_inference() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
OnTheFlyFeatures (class in lhotse.dataset.input_strategies)
open_writer() (lhotse.audio.RecordingSet class method)
(lhotse.features.base.FeatureSet class method)
(lhotse.supervision.SupervisionSet class method)
opus_info() (in module lhotse.audio)
OUT_CUTS
lhotse-workflows-align-with-torchaudio command line option
lhotse-workflows-annotate-with-whisper command line option
OUTPUT
lhotse-cut-decompose command line option
OUTPUT_CONFIG
lhotse-feat-write-default-config command line option
OUTPUT_CUT_MANIFEST
lhotse-cut-append command line option
lhotse-cut-mix-by-recording-id command line option
lhotse-cut-mix-sequential command line option
lhotse-cut-pad command line option
lhotse-cut-simple command line option
lhotse-cut-truncate command line option
OUTPUT_CUTS
lhotse-cut-trim-to-supervisions command line option
OUTPUT_CUTSET
lhotse-feat-extract-cuts command line option
lhotse-feat-extract-cuts-batch command line option
OUTPUT_DIR
lhotse-feat-extract command line option
lhotse-fix command line option
lhotse-kaldi-export command line option
lhotse-prepare-adept command line option
lhotse-prepare-aidatatang-200zh command line option
lhotse-prepare-aishell command line option
lhotse-prepare-aishell2 command line option
lhotse-prepare-aishell4 command line option
lhotse-prepare-ali-meeting command line option
lhotse-prepare-ami command line option
lhotse-prepare-aspire command line option
lhotse-prepare-babel command line option
lhotse-prepare-broadcast-news command line option
lhotse-prepare-bvcc command line option
lhotse-prepare-callhome-egyptian command line option
lhotse-prepare-callhome-english command line option
lhotse-prepare-cmu-arctic command line option
lhotse-prepare-cmu-indic command line option
lhotse-prepare-cmu-kids command line option
lhotse-prepare-commonvoice command line option
lhotse-prepare-cslu-kids command line option
lhotse-prepare-daily-talk command line option
lhotse-prepare-dihard3 command line option
lhotse-prepare-earnings21 command line option
lhotse-prepare-earnings22 command line option
lhotse-prepare-eval2000 command line option
lhotse-prepare-fisher-english command line option
lhotse-prepare-fisher-spanish command line option
lhotse-prepare-gale-arabic command line option
lhotse-prepare-gale-mandarin command line option
lhotse-prepare-gigaspeech command line option
lhotse-prepare-heroico command line option
lhotse-prepare-hifitts command line option
lhotse-prepare-icsi command line option
lhotse-prepare-l2-arctic command line option
lhotse-prepare-libricss command line option
lhotse-prepare-librimix command line option
lhotse-prepare-librispeech command line option
lhotse-prepare-libritts command line option
lhotse-prepare-ljspeech command line option
lhotse-prepare-magicdata command line option
lhotse-prepare-mgb2 command line option
lhotse-prepare-mls command line option
lhotse-prepare-mtedx command line option
lhotse-prepare-musan command line option
lhotse-prepare-nsc command line option
lhotse-prepare-peoples-speech command line option
lhotse-prepare-primewords command line option
lhotse-prepare-rir-noise command line option
lhotse-prepare-spgispeech command line option
lhotse-prepare-stcmds command line option
lhotse-prepare-switchboard command line option
lhotse-prepare-tal-asr command line option
lhotse-prepare-tal-csasr command line option
lhotse-prepare-tedlium command line option
lhotse-prepare-thchs-30 command line option
lhotse-prepare-timit command line option
lhotse-prepare-vctk command line option
lhotse-prepare-voxceleb command line option
lhotse-prepare-wenet-speech command line option
lhotse-prepare-yesno command line option
lhotse-split command line option
lhotse-split-lazy command line option
OUTPUT_MANIFEST
lhotse-combine command line option
lhotse-copy command line option
lhotse-copy-feats command line option
lhotse-feat-upload command line option
lhotse-filter command line option
lhotse-subset command line option
P
pad_or_truncate_features() (in module lhotse.features.librosa_fbank)
pairwise() (in module lhotse.features.io)
parameters() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
parse_channel_from_ffmpeg_output() (in module lhotse.audio)
PASSWORD
lhotse-download-gigaspeech command line option
perturb_speed() (lhotse.audio.Recording method)
(lhotse.audio.RecordingSet method)
(lhotse.supervision.AlignmentItem method)
(lhotse.supervision.SupervisionSegment method)
perturb_tempo() (lhotse.audio.Recording method)
(lhotse.audio.RecordingSet method)
(lhotse.supervision.SupervisionSegment method)
perturb_volume() (lhotse.audio.Recording method)
(lhotse.audio.RecordingSet method)
(lhotse.supervision.SupervisionSegment method)
PerturbSpeed (class in lhotse.dataset.cut_transforms)
PerturbTempo (class in lhotse.dataset.cut_transforms)
PerturbVolume (class in lhotse.dataset.cut_transforms)
PrecomputedFeatures (class in lhotse.dataset.input_strategies)
PREDICATE
lhotse-filter command line option
preemph_coeff (lhotse.features.kaldi.layers.Wav2FFT property)
(lhotse.features.kaldi.layers.Wav2LogFilterBank property)
(lhotse.features.kaldi.layers.Wav2LogSpec property)
(lhotse.features.kaldi.layers.Wav2MFCC property)
(lhotse.features.kaldi.layers.Wav2Spec property)
preemphasis_coefficient (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
PreMixedSourceSeparationDataset (class in lhotse.dataset.source_separation)
process_and_store_recordings() (lhotse.features.base.FeatureSetBuilder method)
R
RandomizedSmoothing (class in lhotse.dataset.signal_transforms)
raw_energy (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
read() (lhotse.features.io.ChunkedLilcomHdf5Reader method)
(lhotse.features.io.FeaturesReader method)
(lhotse.features.io.KaldiReader method)
(lhotse.features.io.LilcomChunkyReader method)
(lhotse.features.io.LilcomFilesReader method)
(lhotse.features.io.LilcomHdf5Reader method)
(lhotse.features.io.LilcomURLReader method)
(lhotse.features.io.MemoryLilcomReader method)
(lhotse.features.io.MemoryRawReader method)
(lhotse.features.io.NumpyFilesReader method)
(lhotse.features.io.NumpyHdf5Reader method)
read_audio() (in module lhotse.audio)
(lhotse.audio.AudioBackend method)
(lhotse.audio.AudioreadBackend method)
(lhotse.audio.CompositeAudioBackend method)
(lhotse.audio.FfmpegSubprocessOpusBackend method)
(lhotse.audio.FfmpegTorchaudioStreamerBackend method)
(lhotse.audio.LibsndfileBackend method)
(lhotse.audio.Sph2pipeSubprocessBackend method)
(lhotse.audio.TorchaudioDefaultBackend method)
read_audio_from_cuts() (in module lhotse.dataset.collation)
read_features_from_cuts() (in module lhotse.dataset.collation)
read_opus() (in module lhotse.audio)
read_opus_ffmpeg() (in module lhotse.audio)
read_opus_torchaudio() (in module lhotse.audio)
read_sph() (in module lhotse.audio)
Recording (class in lhotse.audio)
recording_id (lhotse.features.base.Features attribute)
(lhotse.supervision.SupervisionSegment attribute)
RECORDING_MANIFEST
lhotse-feat-extract command line option
RECORDINGS
lhotse-fix command line option
lhotse-kaldi-export command line option
lhotse-validate-pair command line option
RecordingSet (class in lhotse.audio)
register_backward_hook() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
register_buffer() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
register_extractor() (in module lhotse.features.base)
register_forward_hook() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
register_forward_pre_hook() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
register_full_backward_hook() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
register_load_state_dict_post_hook() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
register_module() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
register_parameter() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
register_reader() (in module lhotse.features.io)
register_writer() (in module lhotse.features.io)
remove_dc_offset (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.kaldi.layers.Wav2FFT property)
(lhotse.features.kaldi.layers.Wav2LogFilterBank property)
(lhotse.features.kaldi.layers.Wav2LogSpec property)
(lhotse.features.kaldi.layers.Wav2MFCC property)
(lhotse.features.kaldi.layers.Wav2Spec property)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
repeat() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
requires_grad_() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
resample() (lhotse.audio.Recording method)
(lhotse.audio.RecordingSet method)
reverb_rir() (lhotse.audio.Recording method)
(lhotse.audio.RecordingSet method)
(lhotse.supervision.SupervisionSegment method)
ReverbWithImpulseResponse (class in lhotse.dataset.cut_transforms)
round_to_power_of_two (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
S
samplerate (lhotse.audio.LibsndfileCompatibleAudioInfo property)
SAMPLING_RATE
lhotse-kaldi-import command line option
sampling_rate (lhotse.audio.Recording attribute)
(lhotse.features.base.Features attribute)
(lhotse.features.kaldi.layers.Wav2FFT property)
(lhotse.features.kaldi.layers.Wav2LogFilterBank property)
(lhotse.features.kaldi.layers.Wav2LogSpec property)
(lhotse.features.kaldi.layers.Wav2MFCC property)
(lhotse.features.kaldi.layers.Wav2Spec property)
(lhotse.features.librosa_fbank.LibrosaFbankConfig attribute)
sampling_rate() (lhotse.audio.RecordingSet method)
save_kaldi_text_mapping() (in module lhotse.kaldi)
score (lhotse.supervision.AlignmentItem property)
serialize() (lhotse.supervision.AlignmentItem method)
set_audio_duration_mismatch_tolerance() (in module lhotse.audio)
set_extra_state() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
share_memory() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
shuffle() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
soundfile_load() (in module lhotse.audio)
source (lhotse.audio.AudioSource attribute)
sources (lhotse.audio.Recording attribute)
speaker (lhotse.supervision.SupervisionSegment attribute)
SpecAugment (class in lhotse.dataset.signal_transforms)
Spectrogram (class in lhotse.features.spectrogram)
SpectrogramConfig (class in lhotse.features.spectrogram)
SPEECH_DIR
lhotse-prepare-heroico command line option
speech_synthesis (in module lhotse.dataset)
Sph2pipeSubprocessBackend (class in lhotse.audio)
sph_info() (in module lhotse.audio)
split() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
split_lazy() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
split_parallelize_combine() (in module lhotse.manipulation)
start (lhotse.features.base.Features attribute)
(lhotse.supervision.AlignmentItem property)
(lhotse.supervision.SupervisionSegment attribute)
state_dict() (lhotse.dataset.signal_transforms.SpecAugment method)
(lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
StatsAccumulator (class in lhotse.features.base)
storage_key (lhotse.features.base.Features attribute)
STORAGE_PATH
lhotse-copy-feats command line option
lhotse-feat-extract-cuts command line option
lhotse-feat-extract-cuts-batch command line option
storage_path (lhotse.features.base.Features attribute)
(lhotse.features.io.ChunkedLilcomHdf5Writer property)
(lhotse.features.io.FeaturesWriter property)
(lhotse.features.io.KaldiWriter property)
(lhotse.features.io.LilcomChunkyWriter property)
(lhotse.features.io.LilcomFilesWriter property)
(lhotse.features.io.LilcomHdf5Writer property)
(lhotse.features.io.LilcomURLWriter property)
(lhotse.features.io.MemoryLilcomWriter property)
(lhotse.features.io.MemoryRawWriter property)
(lhotse.features.io.NumpyFilesWriter property)
(lhotse.features.io.NumpyHdf5Writer property)
storage_type (lhotse.features.base.Features attribute)
store_array() (lhotse.features.io.ChunkedLilcomHdf5Writer method)
(lhotse.features.io.FeaturesWriter method)
(lhotse.features.io.KaldiWriter method)
(lhotse.features.io.LilcomChunkyWriter method)
(lhotse.features.io.LilcomFilesWriter method)
(lhotse.features.io.LilcomHdf5Writer method)
(lhotse.features.io.LilcomURLWriter method)
(lhotse.features.io.MemoryLilcomWriter method)
(lhotse.features.io.MemoryRawWriter method)
(lhotse.features.io.NumpyFilesWriter method)
(lhotse.features.io.NumpyHdf5Writer method)
store_feature_array() (in module lhotse.features.base)
subset() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
supervision_intervals() (lhotse.dataset.input_strategies.AudioSamples method)
(lhotse.dataset.input_strategies.BatchIO method)
(lhotse.dataset.input_strategies.OnTheFlyFeatures method)
(lhotse.dataset.input_strategies.PrecomputedFeatures method)
supervision_masks() (lhotse.dataset.input_strategies.AudioSamples method)
(lhotse.dataset.input_strategies.BatchIO method)
(lhotse.dataset.input_strategies.OnTheFlyFeatures method)
(lhotse.dataset.input_strategies.PrecomputedFeatures method)
SUPERVISIONS
lhotse-fix command line option
lhotse-kaldi-export command line option
lhotse-validate-pair command line option
SupervisionSegment (class in lhotse.supervision)
SupervisionSet (class in lhotse.supervision)
suppress_audio_loading_errors() (in module lhotse.audio)
symbol (lhotse.supervision.AlignmentItem property)
T
T_destination (lhotse.features.kaldi.layers.Wav2FFT attribute)
(lhotse.features.kaldi.layers.Wav2LogFilterBank attribute)
(lhotse.features.kaldi.layers.Wav2LogSpec attribute)
(lhotse.features.kaldi.layers.Wav2MFCC attribute)
(lhotse.features.kaldi.layers.Wav2Spec attribute)
(lhotse.features.kaldi.layers.Wav2Win attribute)
TARGET_DIR
lhotse-download-adept command line option
lhotse-download-aidatatang-200zh command line option
lhotse-download-aishell command line option
lhotse-download-aishell4 command line option
lhotse-download-ali-meeting command line option
lhotse-download-ami command line option
lhotse-download-cmu-arctic command line option
lhotse-download-cmu-indic command line option
lhotse-download-daily-talk command line option
lhotse-download-earnings21 command line option
lhotse-download-gigaspeech command line option
lhotse-download-heroico command line option
lhotse-download-hifitts command line option
lhotse-download-libricss command line option
lhotse-download-librimix command line option
lhotse-download-librispeech command line option
lhotse-download-libritts command line option
lhotse-download-ljspeech command line option
lhotse-download-magicdata command line option
lhotse-download-mtedx command line option
lhotse-download-musan command line option
lhotse-download-primewords command line option
lhotse-download-rir-noise command line option
lhotse-download-spgispeech command line option
lhotse-download-stcmds command line option
lhotse-download-tedlium command line option
lhotse-download-thchs-30 command line option
lhotse-download-timit command line option
lhotse-download-vctk command line option
lhotse-download-voxceleb1 command line option
lhotse-download-voxceleb2 command line option
lhotse-download-yesno command line option
TEDLIUM_DIR
lhotse-prepare-tedlium command line option
text (lhotse.supervision.SupervisionSegment attribute)
to() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
to_cut() (lhotse.audio.Recording method)
to_dict() (lhotse.audio.AudioSource method)
(lhotse.audio.Recording method)
(lhotse.features.base.FeatureExtractor method)
(lhotse.features.base.Features method)
(lhotse.features.base.TorchaudioFeatureExtractor method)
(lhotse.features.fbank.TorchaudioFbank method)
(lhotse.features.fbank.TorchaudioFbankConfig method)
(lhotse.features.librosa_fbank.LibrosaFbank method)
(lhotse.features.librosa_fbank.LibrosaFbankConfig method)
(lhotse.features.mfcc.TorchaudioMfcc method)
(lhotse.features.mfcc.TorchaudioMfccConfig method)
(lhotse.features.spectrogram.Spectrogram method)
(lhotse.features.spectrogram.SpectrogramConfig method)
(lhotse.supervision.SupervisionSegment method)
to_dicts() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
to_eager() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
to_empty() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
to_file() (lhotse.audio.RecordingSet method)
(lhotse.dataset.signal_transforms.GlobalMVN method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
to_json() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
to_jsonl() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureSet method)
(lhotse.supervision.SupervisionSet method)
to_manifest() (in module lhotse.manipulation)
to_yaml() (lhotse.audio.RecordingSet method)
(lhotse.features.base.FeatureExtractor method)
(lhotse.features.base.FeatureSet method)
(lhotse.features.base.TorchaudioFeatureExtractor method)
(lhotse.features.fbank.TorchaudioFbank method)
(lhotse.features.librosa_fbank.LibrosaFbank method)
(lhotse.features.mfcc.TorchaudioMfcc method)
(lhotse.features.spectrogram.Spectrogram method)
(lhotse.supervision.SupervisionSet method)
TokenCollater (class in lhotse.dataset.collation)
torchaudio_ffmpeg_load() (in module lhotse.audio)
torchaudio_info() (in module lhotse.audio)
torchaudio_load() (in module lhotse.audio)
torchaudio_soundfile_supports_format() (in module lhotse.audio)
torchaudio_supports_ffmpeg() (in module lhotse.audio)
TorchaudioDefaultBackend (class in lhotse.audio)
TorchaudioFbank (class in lhotse.features.fbank)
TorchaudioFbankConfig (class in lhotse.features.fbank)
TorchaudioFeatureExtractor (class in lhotse.features.base)
TorchaudioMfcc (class in lhotse.features.mfcc)
TorchaudioMfccConfig (class in lhotse.features.mfcc)
train() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
training (lhotse.dataset.signal_transforms.DereverbWPE attribute)
(lhotse.dataset.signal_transforms.GlobalMVN attribute)
(lhotse.dataset.signal_transforms.RandomizedSmoothing attribute)
(lhotse.dataset.signal_transforms.SpecAugment attribute)
(lhotse.features.kaldi.layers.Wav2FFT attribute)
(lhotse.features.kaldi.layers.Wav2LogFilterBank attribute)
(lhotse.features.kaldi.layers.Wav2LogSpec attribute)
(lhotse.features.kaldi.layers.Wav2MFCC attribute)
(lhotse.features.kaldi.layers.Wav2Spec attribute)
(lhotse.features.kaldi.layers.Wav2Win attribute)
TRANSCRIPT_DIR
lhotse-prepare-broadcast-news command line option
lhotse-prepare-callhome-egyptian command line option
lhotse-prepare-csj command line option
lhotse-prepare-fisher-spanish command line option
lhotse-prepare-heroico command line option
transform() (lhotse.supervision.AlignmentItem method)
transform_alignment() (lhotse.supervision.SupervisionSegment method)
(lhotse.supervision.SupervisionSet method)
transform_text() (lhotse.supervision.SupervisionSegment method)
(lhotse.supervision.SupervisionSet method)
transforms (lhotse.audio.Recording attribute)
trim() (lhotse.supervision.AlignmentItem method)
(lhotse.supervision.SupervisionSegment method)
type (lhotse.audio.AudioSource attribute)
(lhotse.features.base.Features attribute)
type() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
U
unmixed_audio (lhotse.audio.AudioMixer property)
unmixed_feats (lhotse.features.mixer.FeatureMixer property)
UnsupervisedDataset (class in lhotse.dataset.unsupervised)
UnsupervisedWaveformDataset (class in lhotse.dataset.unsupervised)
update() (lhotse.features.base.StatsAccumulator method)
URL
lhotse-feat-upload command line option
use_energy (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
V
VadDataset (class in lhotse.dataset.vad)
validate() (lhotse.dataset.source_separation.DynamicallyMixedSourceSeparationDataset method)
validate_for_asr() (in module lhotse.dataset.speech_recognition)
verbose_audio_loading_exceptions() (in module lhotse.audio)
vtln_high (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
vtln_low (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
vtln_warp (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
W
Wav2FFT (class in lhotse.features.kaldi.layers)
Wav2LogFilterBank (class in lhotse.features.kaldi.layers)
Wav2LogSpec (class in lhotse.features.kaldi.layers)
Wav2MFCC (class in lhotse.features.kaldi.layers)
Wav2Spec (class in lhotse.features.kaldi.layers)
Wav2Win (class in lhotse.features.kaldi.layers)
win_length (lhotse.features.librosa_fbank.LibrosaFbankConfig attribute)
window (lhotse.features.librosa_fbank.LibrosaFbankConfig attribute)
window_type (lhotse.features.fbank.TorchaudioFbankConfig attribute)
(lhotse.features.kaldi.layers.Wav2FFT property)
(lhotse.features.kaldi.layers.Wav2LogFilterBank property)
(lhotse.features.kaldi.layers.Wav2LogSpec property)
(lhotse.features.kaldi.layers.Wav2MFCC property)
(lhotse.features.kaldi.layers.Wav2Spec property)
(lhotse.features.mfcc.TorchaudioMfccConfig attribute)
(lhotse.features.spectrogram.SpectrogramConfig attribute)
with_alignment() (lhotse.supervision.SupervisionSegment method)
with_alignment_from_ctm() (lhotse.supervision.SupervisionSet method)
with_offset() (lhotse.supervision.AlignmentItem method)
(lhotse.supervision.SupervisionSegment method)
with_path_prefix() (lhotse.audio.AudioSource method)
(lhotse.audio.Recording method)
(lhotse.audio.RecordingSet method)
(lhotse.features.base.Features method)
(lhotse.features.base.FeatureSet method)
with_traceback() (lhotse.audio.AudioLoadingError method)
(lhotse.audio.DurationMismatchError method)
write() (lhotse.features.io.ChunkedLilcomHdf5Writer method)
(lhotse.features.io.FeaturesWriter method)
(lhotse.features.io.KaldiWriter method)
(lhotse.features.io.LilcomChunkyWriter method)
(lhotse.features.io.LilcomFilesWriter method)
(lhotse.features.io.LilcomHdf5Writer method)
(lhotse.features.io.LilcomURLWriter method)
(lhotse.features.io.MemoryLilcomWriter method)
(lhotse.features.io.MemoryRawWriter method)
(lhotse.features.io.NumpyFilesWriter method)
(lhotse.features.io.NumpyHdf5Writer method)
write_alignment_to_ctm() (lhotse.supervision.SupervisionSet method)
WSPECIFIER
lhotse-cut-export-to-webdataset command line option
X
xpu() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
Z
zero_grad() (lhotse.features.kaldi.layers.Wav2FFT method)
(lhotse.features.kaldi.layers.Wav2LogFilterBank method)
(lhotse.features.kaldi.layers.Wav2LogSpec method)
(lhotse.features.kaldi.layers.Wav2MFCC method)
(lhotse.features.kaldi.layers.Wav2Spec method)
(lhotse.features.kaldi.layers.Wav2Win method)
Read the Docs
v: v1.9
Versions
Downloads
On Read the Docs
Project Home
Builds
Free document hosting provided by Read the Docs.