mirror of
https://github.com/huggingface/transformers.git
synced 2025-08-01 18:51:14 +06:00
hertz is already per second (#21188)
This commit is contained in:
parent
4bc18e7a83
commit
9b42c68f7c
@ -34,7 +34,7 @@ class SequenceFeatureExtractor(FeatureExtractionMixin):
|
|||||||
feature_size (`int`):
|
feature_size (`int`):
|
||||||
The feature dimension of the extracted features.
|
The feature dimension of the extracted features.
|
||||||
sampling_rate (`int`):
|
sampling_rate (`int`):
|
||||||
The sampling rate at which the audio files should be digitalized expressed in Hertz per second (Hz).
|
The sampling rate at which the audio files should be digitalized expressed in hertz (Hz).
|
||||||
padding_value (`float`):
|
padding_value (`float`):
|
||||||
The value that is used to fill the padding values / vectors.
|
The value that is used to fill the padding values / vectors.
|
||||||
"""
|
"""
|
||||||
|
@ -44,7 +44,7 @@ class ASTFeatureExtractor(SequenceFeatureExtractor):
|
|||||||
feature_size (`int`, *optional*, defaults to 1):
|
feature_size (`int`, *optional*, defaults to 1):
|
||||||
The feature dimension of the extracted features.
|
The feature dimension of the extracted features.
|
||||||
sampling_rate (`int`, *optional*, defaults to 16000):
|
sampling_rate (`int`, *optional*, defaults to 16000):
|
||||||
The sampling rate at which the audio files should be digitalized expressed in Hertz per second (Hz).
|
The sampling rate at which the audio files should be digitalized expressed in hertz (Hz).
|
||||||
num_mel_bins (`int`, *optional*, defaults to 128):
|
num_mel_bins (`int`, *optional*, defaults to 128):
|
||||||
Number of Mel-frequency bins.
|
Number of Mel-frequency bins.
|
||||||
max_length (`int`, *optional*, defaults to 1024):
|
max_length (`int`, *optional*, defaults to 1024):
|
||||||
|
@ -53,7 +53,7 @@ class MCTCTFeatureExtractor(SequenceFeatureExtractor):
|
|||||||
feature_size (`int`, defaults to 80):
|
feature_size (`int`, defaults to 80):
|
||||||
The feature dimension of the extracted features. This is the number of mel_frequency
|
The feature dimension of the extracted features. This is the number of mel_frequency
|
||||||
sampling_rate (`int`, defaults to 16000):
|
sampling_rate (`int`, defaults to 16000):
|
||||||
The sampling rate at which the audio files should be digitalized expressed in Hertz per second (Hz).
|
The sampling rate at which the audio files should be digitalized expressed in hertz (Hz).
|
||||||
padding_value (`float`, defaults to 0.0):
|
padding_value (`float`, defaults to 0.0):
|
||||||
The value that is used to fill the padding values.
|
The value that is used to fill the padding values.
|
||||||
hop_length (`int`, defaults to 10):
|
hop_length (`int`, defaults to 10):
|
||||||
|
@ -44,7 +44,7 @@ class Speech2TextFeatureExtractor(SequenceFeatureExtractor):
|
|||||||
feature_size (`int`, defaults to 80):
|
feature_size (`int`, defaults to 80):
|
||||||
The feature dimension of the extracted features.
|
The feature dimension of the extracted features.
|
||||||
sampling_rate (`int`, defaults to 16000):
|
sampling_rate (`int`, defaults to 16000):
|
||||||
The sampling rate at which the audio files should be digitalized expressed in Hertz per second (Hz).
|
The sampling rate at which the audio files should be digitalized expressed in hertz (Hz).
|
||||||
num_mel_bins (`int`, defaults to 80):
|
num_mel_bins (`int`, defaults to 80):
|
||||||
Number of Mel-frequency bins.
|
Number of Mel-frequency bins.
|
||||||
padding_value (`float`, defaults to 0.0):
|
padding_value (`float`, defaults to 0.0):
|
||||||
|
@ -39,7 +39,7 @@ class Wav2Vec2FeatureExtractor(SequenceFeatureExtractor):
|
|||||||
feature_size (`int`, defaults to 1):
|
feature_size (`int`, defaults to 1):
|
||||||
The feature dimension of the extracted features.
|
The feature dimension of the extracted features.
|
||||||
sampling_rate (`int`, defaults to 16000):
|
sampling_rate (`int`, defaults to 16000):
|
||||||
The sampling rate at which the audio files should be digitalized expressed in Hertz per second (Hz).
|
The sampling rate at which the audio files should be digitalized expressed in hertz (Hz).
|
||||||
padding_value (`float`, defaults to 0.0):
|
padding_value (`float`, defaults to 0.0):
|
||||||
The value that is used to fill the padding values.
|
The value that is used to fill the padding values.
|
||||||
do_normalize (`bool`, *optional*, defaults to `True`):
|
do_normalize (`bool`, *optional*, defaults to `True`):
|
||||||
|
@ -43,7 +43,7 @@ class WhisperFeatureExtractor(SequenceFeatureExtractor):
|
|||||||
feature_size (`int`, defaults to 80):
|
feature_size (`int`, defaults to 80):
|
||||||
The feature dimension of the extracted features.
|
The feature dimension of the extracted features.
|
||||||
sampling_rate (`int`, defaults to 16000):
|
sampling_rate (`int`, defaults to 16000):
|
||||||
The sampling rate at which the audio files should be digitalized expressed in Hertz per second (Hz).
|
The sampling rate at which the audio files should be digitalized expressed in hertz (Hz).
|
||||||
hop_length (`int`, defaults to 160):
|
hop_length (`int`, defaults to 160):
|
||||||
Length of the overlapping windows for the STFT used to obtain the Mel Frequency coefficients.
|
Length of the overlapping windows for the STFT used to obtain the Mel Frequency coefficients.
|
||||||
chunk_length (`int`, defaults to 30):
|
chunk_length (`int`, defaults to 30):
|
||||||
|
Loading…
Reference in New Issue
Block a user