enactic
/

avista-base-plus

Automatic Speech Recognition

Model card | Files and versions

avista-base-plus / preprocessor_config.json

yubo0306's picture

Upload processor

a431f05 verified about 1 month ago

history blame contribute delete

1.05 kB

	{
		"auto_map": {
			"AutoFeatureExtractor": "feature_extraction_avhubert.AVHubertFeatureExtractor",
			"AutoProcessor": "processing_avhubert.AVHubertProcessor"
		},
		"feature_extractor_type": "AVHubertFeatureExtractor",
		"image_crop_size": 88,
		"landmark_indices": [5, 411, 199, 187],
		"max_sample_size": null,
		"min_detection_confidence": 0.5,
		"min_tracking_confidence": 0.5,
		"normalize": true,
		"processor_class": "AVHubertProcessor",
		"refine_landmarks": false,
		"sr": 16000,
		"stack_order_audio": 4,
		"static_image_mode": false,
		"transforms": [
			{
				"training": "True",
				"transforms_type": "ToImage"
			},
			{
				"size": "(88, 88)",
				"training": "True",
				"transforms_type": "CenterCrop"
			},
			{
				"dtype": "torch.float32",
				"scale": "True",
				"training": "True",
				"transforms_type": "ToDtype"
			},
			{
				"inplace": "False",
				"mean": "[0.421]",
				"std": "[0.165]",
				"training": "True",
				"transforms_type": "Normalize"
			}
		]
	}