akhaliq HF Staff committed on
Commit
803abce
·
1 Parent(s): d5cf375

fix: add do_sample_frames flag to processor_kwargs to prevent metadata errors

Browse files
Files changed (1) hide show
  1. app.py +1 -2
app.py CHANGED
@@ -115,13 +115,13 @@ def predict(message: str, file: FileData = None, downsample_mode: str = "16x") -
115
  inputs = processor.apply_chat_template(
116
  messages, tokenize=True, add_generation_prompt=True,
117
  return_dict=True, return_tensors="pt",
118
- # Wrap vision kwargs in processor_kwargs for newer transformers versions
119
  processor_kwargs={
120
  "downsample_mode": downsample_mode,
121
  "max_num_frames": 64,
122
  "stack_frames": 1,
123
  "max_slice_nums": 1,
124
  "use_image_id": False,
 
125
  }
126
  ).to(model.device)
127
  else:
@@ -138,7 +138,6 @@ def predict(message: str, file: FileData = None, downsample_mode: str = "16x") -
138
  inputs = processor.apply_chat_template(
139
  messages, tokenize=True, add_generation_prompt=True,
140
  return_dict=True, return_tensors="pt",
141
- # Wrap vision kwargs in processor_kwargs
142
  processor_kwargs={
143
  "downsample_mode": downsample_mode,
144
  "max_slice_nums": 9,
 
115
  inputs = processor.apply_chat_template(
116
  messages, tokenize=True, add_generation_prompt=True,
117
  return_dict=True, return_tensors="pt",
 
118
  processor_kwargs={
119
  "downsample_mode": downsample_mode,
120
  "max_num_frames": 64,
121
  "stack_frames": 1,
122
  "max_slice_nums": 1,
123
  "use_image_id": False,
124
+ "do_sample_frames": False, # Fix: Avoid requiring metadata since we already sampled
125
  }
126
  ).to(model.device)
127
  else:
 
138
  inputs = processor.apply_chat_template(
139
  messages, tokenize=True, add_generation_prompt=True,
140
  return_dict=True, return_tensors="pt",
 
141
  processor_kwargs={
142
  "downsample_mode": downsample_mode,
143
  "max_slice_nums": 9,