Upload folder using huggingface_hub

Files changed (3) hide show

README.md CHANGED Viewed

@@ -53,7 +53,8 @@ model-index:
 [**📄 Technical Report**](https://arxiv.org/abs/2603.13398) |
 [**🖥️ Qianfan Platform**](https://cloud.baidu.com/product-s/qianfan_home) |
-[**💻 GitHub**](https://github.com/baidubce/Qianfan-VL)
 </div>
@@ -317,6 +318,24 @@ print(response)
 vllm serve baidu/Qianfan-OCR --trust-remote-code
 ```
 ## Citation
 ```bibtex

 [**📄 Technical Report**](https://arxiv.org/abs/2603.13398) |
 [**🖥️ Qianfan Platform**](https://cloud.baidu.com/product-s/qianfan_home) |
+[**💻 GitHub**](https://github.com/baidubce/Qianfan-VL) |
+[**🧩 Skill**](https://github.com/baidubce/skills/tree/develop/skills/qianfanocr-document-intelligence)
 </div>
 vllm serve baidu/Qianfan-OCR --trust-remote-code
 ```
+## Skill
+We provide a [Qianfan OCR Document Intelligence](https://github.com/baidubce/skills/tree/develop/skills/qianfanocr-document-intelligence) skill for image and PDF understanding workflows.
+It works with OpenClaw, Claude Code, Codex, and other assistants that support this skill format.
+This skill packages reusable instructions, scripts, and references so that an agent can automatically apply Qianfan-powered document intelligence to tasks such as:
+- document parsing to Markdown
+- layout analysis
+- element recognition
+- general OCR
+- key information extraction
+- chart understanding
+- document VQA
+The skill is designed for visual understanding tasks over images and PDFs, and includes the execution flow needed to prepare inputs, choose the right analysis mode, and call the bundled CLI tools.
 ## Citation
 ```bibtex

config.json CHANGED Viewed

@@ -51,7 +51,7 @@
   "pad_token_id": 151643,
   "ps_version": "v2",
   "select_layer": -1,
-  "template": "internvl2_5",
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": null,

   "pad_token_id": 151643,
   "ps_version": "v2",
   "select_layer": -1,
+  "template": "qianfanvl",
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
   "transformers_version": null,

conversation.py CHANGED Viewed

@@ -33,6 +33,7 @@ class SeparatorStyle(IntEnum):
     CHATGLM3 = auto()
     INTERNVL_ZH = auto()
     MPT = auto()
 @dataclasses.dataclass
@@ -247,6 +248,18 @@ class Conversation:
                 else:
                     ret += role
             return ret
         else:
             raise ValueError(f'Invalid style: {self.sep_style}')
@@ -389,3 +402,15 @@ register_conv_template(
         sep='<|im_end|>\n',
     )
 )

     CHATGLM3 = auto()
     INTERNVL_ZH = auto()
     MPT = auto()
+    QIANFANVL = auto()
 @dataclasses.dataclass
                 else:
                     ret += role
             return ret
+        elif self.sep_style == SeparatorStyle.QIANFANVL:
+            ret = ''
+            if self.system_message:
+                ret = system_prompt + self.sep
+            for role, message in self.messages:
+                if message:
+                    if type(message) is tuple:
+                        message, _, _ = message
+                    ret += role + message + self.sep
+                else:
+                    ret += role
+            return ret
         else:
             raise ValueError(f'Invalid style: {self.sep_style}')
         sep='<|im_end|>\n',
     )
 )
+register_conv_template(
+    Conversation(
+        name='qianfanvl',
+        system_template='<|im_start|>system\n{system_message}',
+        system_message='',
+        roles=('<|im_start|>user\n', '<|im_start|>assistant\n'),
+        sep_style=SeparatorStyle.QIANFANVL,
+        sep='<|im_end|>\n',
+    )
+)