lkhl committed on
Commit
e4996c0
·
verified ·
1 Parent(s): 36a63f8

Upload processor

Browse files
chat_template.jinja CHANGED
@@ -17,15 +17,13 @@ You are VideoLLaMA3 created by Alibaba DAMO Academy, a helpful assistant to help
17
  {{- message['content'] -}}
18
  {% else %}
19
  {% for content in message['content'] %}
20
- {% if content is string %}
21
- {{- content -}}
22
- {% elif content['type'] == 'text' or 'text' in content %}
23
  {{- content['text'] -}}
24
- {% elif content['type'] == 'image' or 'image' in content %}
25
- {{- image_token + '
26
  ' -}}
27
- {% elif content['type'] == 'video' or 'video' in content %}
28
- {{- video_token + '
29
  ' -}}
30
  {% endif %}
31
  {% endfor %}
 
17
  {{- message['content'] -}}
18
  {% else %}
19
  {% for content in message['content'] %}
20
+ {% if content['type'] == 'text' %}
 
 
21
  {{- content['text'] -}}
22
+ {% elif content['type'] == 'image' %}
23
+ {{- '<|image_pad|>' + '
24
  ' -}}
25
+ {% elif content['type'] == 'video' %}
26
+ {{- '<|video_pad|>' + '
27
  ' -}}
28
  {% endif %}
29
  {% endfor %}
preprocessor_config.json CHANGED
@@ -8,18 +8,24 @@
8
  0.5,
9
  0.5
10
  ],
11
- "image_merge_size": 1,
12
  "image_processor_type": "Videollama3ImageProcessor",
13
  "image_std": [
14
  0.5,
15
  0.5,
16
  0.5
17
  ],
 
18
  "max_tokens": 16384,
 
 
19
  "min_tokens": 16,
20
  "patch_size": 14,
21
  "processor_class": "Videollama3Processor",
22
  "resample": 3,
23
  "rescale_factor": 0.00392156862745098,
24
- "video_merge_size": 1
 
 
 
 
25
  }
 
8
  0.5,
9
  0.5
10
  ],
 
11
  "image_processor_type": "Videollama3ImageProcessor",
12
  "image_std": [
13
  0.5,
14
  0.5,
15
  0.5
16
  ],
17
+ "max_pixels": 3211264,
18
  "max_tokens": 16384,
19
+ "merge_size": 1,
20
+ "min_pixels": 3136,
21
  "min_tokens": 16,
22
  "patch_size": 14,
23
  "processor_class": "Videollama3Processor",
24
  "resample": 3,
25
  "rescale_factor": 0.00392156862745098,
26
+ "size": {
27
+ "longest_edge": 1003520,
28
+ "shortest_edge": 3136
29
+ },
30
+ "temporal_patch_size": 1
31
  }
video_preprocessor_config.json CHANGED
@@ -9,14 +9,13 @@
9
  "do_pad": null,
10
  "do_rescale": true,
11
  "do_resize": true,
12
- "do_sample_frames": true,
13
  "fps": null,
14
  "image_mean": [
15
  0.5,
16
  0.5,
17
  0.5
18
  ],
19
- "image_merge_size": null,
20
  "image_std": [
21
  0.5,
22
  0.5,
@@ -24,16 +23,21 @@
24
  ],
25
  "input_data_format": null,
26
  "max_frames": 180,
27
- "max_tokens": 16384,
28
- "min_tokens": 16,
 
 
29
  "num_frames": null,
30
  "patch_size": 14,
31
  "processor_class": "Videollama3Processor",
32
  "resample": 3,
33
  "rescale_factor": 0.00392156862745098,
34
- "size": null,
 
 
 
35
  "size_divisor": null,
36
- "video_merge_size": 2,
37
  "video_metadata": null,
38
  "video_processor_type": "Videollama3VideoProcessor"
39
  }
 
9
  "do_pad": null,
10
  "do_rescale": true,
11
  "do_resize": true,
12
+ "do_sample_frames": false,
13
  "fps": null,
14
  "image_mean": [
15
  0.5,
16
  0.5,
17
  0.5
18
  ],
 
19
  "image_std": [
20
  0.5,
21
  0.5,
 
23
  ],
24
  "input_data_format": null,
25
  "max_frames": 180,
26
+ "max_pixels": 12845056,
27
+ "merge_size": 2,
28
+ "min_frames": 4,
29
+ "min_pixels": 12544,
30
  "num_frames": null,
31
  "patch_size": 14,
32
  "processor_class": "Videollama3Processor",
33
  "resample": 3,
34
  "rescale_factor": 0.00392156862745098,
35
+ "size": {
36
+ "longest_edge": 12845056,
37
+ "shortest_edge": 12544
38
+ },
39
  "size_divisor": null,
40
+ "temporal_patch_size": 1,
41
  "video_metadata": null,
42
  "video_processor_type": "Videollama3VideoProcessor"
43
  }