46 lines
958 B
JSON
46 lines
958 B
JSON
{
  "im_end": "<|image_end|>",
  "im_end_token": "<|image_end|>",
  "im_id_end": "<|image_id_end|>",
  "im_id_start": "<|image_id_start|>",
  "im_start": "<|image_start|>",
  "im_start_token": "<|image_start|>",
  "image_feature_size": 64,
  "image_processor_type": "MegrezOImageProcessor",
  "audio_feature_extractor_type": "WhisperFeatureExtractor",
  "feature_size": 128,
  "max_slice_nums": 9,
  "mean": [
    0.5,
    0.5,
    0.5
  ],
  "norm_mean": [
    0.5,
    0.5,
    0.5
  ],
  "norm_std": [
    0.5,
    0.5,
    0.5
  ],
  "patch_size": 14,
  "processor_class": "MegrezOProcessor",
  "sampling_rate": 16000,
  "scale_resolution": 448,
  "slice_end": "<|slice_end|>",
  "slice_end_token": "<|slice_end|>",
  "slice_mode": true,
  "slice_start": "<|slice_start|>",
  "slice_start_token": "<|slice_start|>",
  "std": [
    0.5,
    0.5,
    0.5
  ],
  "unk": "<|unk|>",
  "unk_token": "<|unk|>",
  "pad_token": "<|pad|>",
  "use_image_id": true
}