-
Notifications
You must be signed in to change notification settings - Fork 58
Expand file tree
/
Copy pathpreprocessor_config.json
More file actions
58 lines (57 loc) · 1.48 KB
/
preprocessor_config.json
File metadata and controls
58 lines (57 loc) · 1.48 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
{
"auto_map": {
"AutoImageProcessor": "image_processing_bailingmm2.BailingMM2ImageProcessor",
"AutoFeatureExtractor": "audio_processing_bailingmm2.BailingMM2AudioProcessor",
"AutoProcessor": "processing_bailingmm2.BailingMM2Processor"
},
"min_pixels": 4096,
"max_pixels": 16777216,
"patch_size": 16,
"temporal_patch_size": 2,
"merge_size": 2,
"image_mean": [
0.48145466,
0.4578275,
0.40821073
],
"image_std": [
0.26862954,
0.26130258,
0.27577711
],
"image_token": "<image>",
"video_token": "<video>",
"use_interleaved_frame_timestamp": true,
"image_processor_type": "BailingMM2ImageProcessor",
"feature_extractor_type": "BailingMM2AudioProcessor",
"audio_token": "<audio>",
"chunk_length": 30,
"dither": 0.0,
"feature_size": 80,
"frame_length": 25,
"frame_shift": 10,
"inverse_norm": true,
"lfr_m": 7,
"lfr_n": 6,
"n_samples": 480000,
"num_audio_tokens": 256,
"sampling_rate": 16000,
"up_sample": true,
"return_attention_mask": true,
"padding_side": "right",
"padding_value": 0.0,
"processor_class": "BailingMM2Processor",
"wav_frontend_args": {
"cmvn_file": "am.mvn",
"fs": 16000,
"window": "hamming",
"n_mels": 80,
"frame_length": 25,
"frame_shift": 10,
"lfr_m": 7,
"lfr_n": 6
},
"whisper_frontend_args": {
"n_mels": 128
}
}