Spaces:
Running on Zero
fix: add do_sample_frames flag to processor_kwargs to prevent metadata errors
Browse files
app.py
CHANGED
|
@@ -115,13 +115,13 @@ def predict(message: str, file: FileData = None, downsample_mode: str = "16x") -
|
|
| 115 |
inputs = processor.apply_chat_template(
|
| 116 |
messages, tokenize=True, add_generation_prompt=True,
|
| 117 |
return_dict=True, return_tensors="pt",
|
| 118 |
-
# Wrap vision kwargs in processor_kwargs for newer transformers versions
|
| 119 |
processor_kwargs={
|
| 120 |
"downsample_mode": downsample_mode,
|
| 121 |
"max_num_frames": 64,
|
| 122 |
"stack_frames": 1,
|
| 123 |
"max_slice_nums": 1,
|
| 124 |
"use_image_id": False,
|
|
|
|
| 125 |
}
|
| 126 |
).to(model.device)
|
| 127 |
else:
|
|
@@ -138,7 +138,6 @@ def predict(message: str, file: FileData = None, downsample_mode: str = "16x") -
|
|
| 138 |
inputs = processor.apply_chat_template(
|
| 139 |
messages, tokenize=True, add_generation_prompt=True,
|
| 140 |
return_dict=True, return_tensors="pt",
|
| 141 |
-
# Wrap vision kwargs in processor_kwargs
|
| 142 |
processor_kwargs={
|
| 143 |
"downsample_mode": downsample_mode,
|
| 144 |
"max_slice_nums": 9,
|
|
|
|
| 115 |
inputs = processor.apply_chat_template(
|
| 116 |
messages, tokenize=True, add_generation_prompt=True,
|
| 117 |
return_dict=True, return_tensors="pt",
|
|
|
|
| 118 |
processor_kwargs={
|
| 119 |
"downsample_mode": downsample_mode,
|
| 120 |
"max_num_frames": 64,
|
| 121 |
"stack_frames": 1,
|
| 122 |
"max_slice_nums": 1,
|
| 123 |
"use_image_id": False,
|
| 124 |
+
"do_sample_frames": False, # Fix: Avoid requiring metadata since we already sampled
|
| 125 |
}
|
| 126 |
).to(model.device)
|
| 127 |
else:
|
|
|
|
| 138 |
inputs = processor.apply_chat_template(
|
| 139 |
messages, tokenize=True, add_generation_prompt=True,
|
| 140 |
return_dict=True, return_tensors="pt",
|
|
|
|
| 141 |
processor_kwargs={
|
| 142 |
"downsample_mode": downsample_mode,
|
| 143 |
"max_slice_nums": 9,
|