hassansh committed on
Commit
e9b74a6
·
verified ·
1 Parent(s): 845e2f2

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +20 -6
README.md CHANGED
@@ -66,14 +66,28 @@ pip install "transformers[dev-torch] @ git+https://github.com/Zyphra/transformer
66
  TODO
67
 
68
  ```python
69
- from transformers import AutoTokenizer, AutoModelForCausalLM
70
  import torch
71
 
72
- tokenizer = AutoTokenizer.from_pretrained("Zyphra/ZAYA1-base")
73
- model = AutoModelForCausalLM.from_pretrained("Zyphra/ZAYA1-base", device_map="cuda", dtype=torch.bfloat16)
74
-
75
- input_text = "What factors contributed to the fall of the Roman Empire?"
76
- input_ids = tokenizer(input_text, return_tensors="pt").to("cuda")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
77
 
78
  outputs = model.generate(**input_ids, max_new_tokens=100)
79
  print(tokenizer.decode(outputs[0]))
 
66
  TODO
67
 
68
  ```python
69
+ from transformers import Zaya1VLForConditionalGeneration, Zaya1VLProcessor
70
  import torch
71
 
72
+ device = "cuda"
73
+ processor = Zaya1VLProcessor.from_pretrained("Zyphra/ZAYA1-VL", temporal_patch_size=1)
74
+ model = Zaya1VLForConditionalGeneration.from_pretrained("Zyphra/ZAYA1-VL", device_map=device, torch_dtype=torch.bfloat16, attn_implementation="flash_attention_2")
75
+
76
+ question = "What do you see in the image? Give us some detail."
77
+ add_special_tokens = True
78
+ num_img_tokens = 8000
79
+
80
+ conversation = [
81
+ {"role": "user", "content": [
82
+ {"type": "image", "image": image, "max_pixels" : num_img_tokens * 28 * 28, "min_pixels" : 10 * 28 * 28},
83
+ {"type": "text", "text": question},
84
+ ]
85
+ },
86
+ ]
87
+ prompt = processor.apply_chat_template(conversation, add_generation_prompt=True)
88
+ images, _ = process_vision_info(conversation)
89
+ inputs = processor(text=prompt, images=images, add_special_tokens=True, return_tensors="pt")
90
+ inputs = {key: value.to(device) for key, value in inputs.items()}
91
 
92
  outputs = model.generate(**input_ids, max_new_tokens=100)
93
  print(tokenizer.decode(outputs[0]))