parakeet-rnnt-0.6b / processor_config.json
eustlb's picture
eustlb HF Staff
Fix RNN-T tokenizer: <blank> at id 1024 (aliased as pad), consistent with blank_token_id=1024
9ff46b0 verified
{
  "blank_token": "<blank>",
  "decoder_type": "rnnt",
  "feature_extractor": {
    "feature_extractor_type": "ParakeetFeatureExtractor",
    "feature_size": 80,
    "hop_length": 160,
    "n_fft": 512,
    "padding_side": "right",
    "padding_value": 0.0,
    "preemphasis": 0.97,
    "return_attention_mask": true,
    "sampling_rate": 16000,
    "win_length": 400
  },
  "processor_class": "ParakeetProcessor"
}