github-sync-test / smolagents /hellosmol.py
billyaungmyint's picture
Sync from GitHub via hub-sync
908d59b verified
raw
history blame contribute delete
639 Bytes
import os
from huggingface_hub import InferenceClient
# You need a token from https://hf.co/settings/tokens; make sure you select 'read' as the token type. If you run this on Google Colab, you can set it up in the "settings" tab under "secrets". Make sure to name it "HF_TOKEN".
# HF_TOKEN = os.environ.get("HF_TOKEN")
# One-shot chat completion demo: send a single user prompt to the hosted
# model and print the text of the first returned choice.
# No token is passed explicitly to the client here.
client = InferenceClient(model="moonshotai/Kimi-K2.5")

# Gather the request arguments in one place so the call itself stays short.
request_options = {
    "messages": [{"role": "user", "content": "The capital of France is"}],
    "stream": False,  # ask for the complete reply in a single response
    "max_tokens": 1024,
    # Extra payload forwarded with the request; presumably turns off the
    # model's "thinking" mode -- confirm against the provider's docs.
    "extra_body": {"thinking": {"type": "disabled"}},
}
output = client.chat.completions.create(**request_options)

# Only the first choice is of interest for this demo.
first_choice = output.choices[0]
print(first_choice.message.content)