Add configuration_flash_head_qwen3_vl.py for FlashHead support
Browse files
configuration_flash_head_qwen3_vl.py
ADDED
|
@@ -0,0 +1,18 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
"""Import-time guard for Embedl FlashHead support on Qwen3-VL.

Importing this module probes the running vLLM installation for the
FlashHead capability flag. If the flag is absent (plain upstream vLLM,
or no vLLM at all), the import fails fast with actionable setup
instructions instead of a cryptic downstream error.
"""

try:
    # Capability probe: this private flag exists only in the Embedl vLLM
    # fork shipped inside the Docker images below. The imported name is
    # deliberately unused — a successful import is the whole check.
    from vllm.model_executor.models.qwen3_vl import _SUPPORTS_EMBEDL_FLASHHEAD
except ImportError:
    # `from None` suppresses implicit exception chaining (PEP 409) so the
    # user sees only this formatted message, not the original ImportError
    # traceback followed by "During handling of the above exception...".
    raise ImportError(
        "\n\n"
        "===============================================================\n"
        " FlashHead requires the Embedl Docker container to run.\n"
        "\n"
        " Currently, FlashHead inference is supported only via vLLM.\n"
        " Hugging Face Transformers support will be added in a future release.\n"
        " Please use one of the following images:\n"
        "\n"
        " Jetson Orin: embedl/vllm:latest-jetson-orin-flashhead\n"
        " Jetson Thor: embedl/vllm:latest-jetson-thor-flashhead\n"
        "\n"
        " Do NOT install embedl-models via pip directly.\n"
        "===============================================================\n"
    ) from None