import datetime as dt
import json
import os
import urllib.error
import urllib.request
from pathlib import Path

import gradio as gr
from huggingface_hub import InferenceClient


def _build_label() -> str:
    """Build the version/commit/load-time label shown in the UI."""
    version_file = Path("VERSION")
    version_from_file = ""
    if version_file.exists():
        version_from_file = version_file.read_text(encoding="utf-8").strip()
    commit = (
        os.getenv("GITHUB_SHA")
        or os.getenv("COMMIT_SHA")
        or os.getenv("SPACE_COMMIT_SHA")
        or version_from_file
        or "local"
    )
    short_commit = commit[:7] if commit != "local" else commit
    version = os.getenv("APP_VERSION") or short_commit
    # datetime.utcnow() is deprecated; use a timezone-aware timestamp instead.
    deployed_at = dt.datetime.now(dt.timezone.utc).strftime("%Y-%m-%d %H:%M:%S UTC")
    return f"Version: {version} | Commit: {short_commit} | Loaded: {deployed_at}"

def _env(name: str, default: str = "") -> str:
    """Read an environment variable with a default, stripping surrounding whitespace."""
    return (os.getenv(name) or default).strip()


HF_TOKEN = _env("HF_TOKEN")
HF_MODEL = _env("HF_MODEL", "zai-org/GLM-5.1")
AI_BACKEND = _env("AI_BACKEND", "hf").lower()
AI_MAX_TOKENS = int(_env("AI_MAX_TOKENS", "512"))
AI_FALLBACK_ORDER = [
    p.strip().lower()
    for p in _env("AI_FALLBACK_ORDER", "hf,github,openrouter,fireworks").split(",")
    if p.strip()
]
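# Example: AI_FALLBACK_ORDER=" HF, OpenRouter ,, " parses to ["hf", "openrouter"]:
# entries are lowercased, whitespace-stripped, and empty items dropped.
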
GITHUB_TOKEN = _env("GITHUB_TOKEN")
GITHUB_MODEL = _env("GITHUB_MODEL")
OPENROUTER_API_KEY = _env("OPENROUTER_API_KEY")
OPENROUTER_MODEL = _env("OPENROUTER_MODEL")
FIREWORKS_API_KEY = _env("FIREWORKS_API_KEY")
FIREWORKS_MODEL = _env("FIREWORKS_MODEL")

# Explicit token passing helps avoid auth ambiguity across local and Space runtimes.
hf_client = InferenceClient(token=HF_TOKEN) if HF_TOKEN else InferenceClient()


def _runtime_label() -> str:
    """Describe the active backend and model for display in the UI."""
    active_model = {
        "hf": HF_MODEL,
        "github": GITHUB_MODEL,
        "openrouter": OPENROUTER_MODEL,
        "fireworks": FIREWORKS_MODEL,
    }.get(AI_BACKEND, "")
    backend_name = AI_BACKEND.upper()
    model_text = active_model or "not-set"
    return f"Backend: {backend_name} | Model: {model_text}"


def _history_to_messages(history: list, user_message: str) -> list:
    """Convert Gradio history (role/content dicts or legacy (user, assistant)
    pairs) into an OpenAI-style message list, appending the new user message."""
    messages = []
    for item in history or []:
        if isinstance(item, dict):
            role = item.get("role")
            content = item.get("content")
            if role in {"user", "assistant", "system"} and content:
                messages.append({"role": role, "content": str(content)})
            continue
        if isinstance(item, (list, tuple)) and len(item) == 2:
            user_msg, assistant_msg = item
            if user_msg:
                messages.append({"role": "user", "content": str(user_msg)})
            if assistant_msg:
                messages.append({"role": "assistant", "content": str(assistant_msg)})
    messages.append({"role": "user", "content": user_message})
    return messages

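# Example (legacy pair-style history):
#   _history_to_messages([("hi", "hello!")], "how are you?")
#   -> [{"role": "user", "content": "hi"},
#       {"role": "assistant", "content": "hello!"},
#       {"role": "user", "content": "how are you?"}]

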
def _extract_content(choice_message: dict) -> str:
    """Return message text, handling both plain-string and parts-list content."""
    content = choice_message.get("content", "")
    if isinstance(content, str):
        return content
    if isinstance(content, list):
        chunks = []
        for part in content:
            if isinstance(part, dict) and part.get("type") == "text":
                chunks.append(str(part.get("text", "")))
        return "".join(chunks).strip()
    return str(content)

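# Example (parts-list content, as some providers return):
#   _extract_content({"content": [{"type": "text", "text": "Hi"}, {"type": "text", "text": "!"}]})
#   -> "Hi!"

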
def _chat_openai_compatible(
    endpoint: str,
    api_key: str,
    model: str,
    messages: list,
    extra_headers=None,
) -> str:
    """POST an OpenAI-compatible chat completion request and return the reply text."""
    if not api_key:
        raise ValueError("API key is missing.")
    if not model:
        raise ValueError("Model is not configured.")
    payload = {
        "model": model,
        "messages": messages,
        "max_tokens": AI_MAX_TOKENS,
    }
    headers = {
        "Authorization": f"Bearer {api_key}",
        "Content-Type": "application/json",
    }
    if extra_headers:
        headers.update(extra_headers)
    request = urllib.request.Request(
        endpoint,
        data=json.dumps(payload).encode("utf-8"),
        headers=headers,
        method="POST",
    )
    try:
        with urllib.request.urlopen(request, timeout=90) as response:
            body = json.loads(response.read().decode("utf-8"))
    except urllib.error.HTTPError as exc:
        details = exc.read().decode("utf-8", errors="ignore")
        raise RuntimeError(f"HTTP {exc.code}: {details[:300]}") from exc
    except urllib.error.URLError as exc:
        # DNS failures, refused connections, and timeouts surface here.
        raise RuntimeError(f"Network error: {exc.reason}") from exc
    choices = body.get("choices") or []
    if not choices:
        raise RuntimeError("No choices returned from provider.")
    message = choices[0].get("message") or {}
    return _extract_content(message) or "(empty response)"

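# All non-HF providers share the standard OpenAI-compatible wire format, e.g.:
#   {"model": "<model-id>", "messages": [{"role": "user", "content": "hi"}], "max_tokens": 512}

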
def _chat_hf(messages: list) -> str:
    """Chat via the Hugging Face InferenceClient."""
    response = hf_client.chat_completion(
        model=HF_MODEL,
        messages=messages,
        max_tokens=AI_MAX_TOKENS,
    )
    return response.choices[0].message.content or "(empty response)"


def _chat_github(messages: list) -> str:
    """Chat via GitHub Models."""
    return _chat_openai_compatible(
        endpoint="https://models.github.ai/inference/chat/completions",
        api_key=GITHUB_TOKEN,
        model=GITHUB_MODEL,
        messages=messages,
    )


def _chat_openrouter(messages: list) -> str:
    """Chat via OpenRouter."""
    return _chat_openai_compatible(
        endpoint="https://openrouter.ai/api/v1/chat/completions",
        api_key=OPENROUTER_API_KEY,
        model=OPENROUTER_MODEL,
        messages=messages,
        extra_headers={
            "HTTP-Referer": _env("OPENROUTER_REFERER", "https://huggingface.co"),
            "X-Title": _env("OPENROUTER_APP_NAME", "hf-multi-provider-chat"),
        },
    )

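# HTTP-Referer and X-Title are optional OpenRouter attribution headers; requests
# succeed without them, but they let OpenRouter credit the calling app.

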
def _chat_fireworks(messages: list) -> str:
    """Chat via Fireworks AI."""
    return _chat_openai_compatible(
        endpoint="https://api.fireworks.ai/inference/v1/chat/completions",
        api_key=FIREWORKS_API_KEY,
        model=FIREWORKS_MODEL,
        messages=messages,
    )


def _chat_once(backend: str, messages: list) -> str:
    """Dispatch a single chat request to the named backend."""
    if backend == "hf":
        return _chat_hf(messages)
    if backend == "github":
        return _chat_github(messages)
    if backend == "openrouter":
        return _chat_openrouter(messages)
    if backend == "fireworks":
        return _chat_fireworks(messages)
    raise ValueError(
        f"Unsupported AI_BACKEND='{backend}'. Use one of: hf, github, openrouter, fireworks, auto"
    )


def chat_response(message: str, history: list) -> str:
    """Send a user message using the configured backend and return the assistant text."""
    if not message or not message.strip():
        return "Please enter a message."
    messages = _history_to_messages(history, message.strip())
    try:
        if AI_BACKEND == "auto":
            errors = []
            for backend in AI_FALLBACK_ORDER:
                try:
                    return _chat_once(backend, messages)
                except Exception as exc:  # noqa: BLE001
                    errors.append(f"{backend}: {exc}")
            return "All providers failed. " + " | ".join(errors)
        return _chat_once(AI_BACKEND, messages)
    except Exception as exc:  # noqa: BLE001
        return f"Error: {exc}"


with gr.Blocks(title="GitHub + HuggingFace + AI Chat Demo") as demo:
    gr.Markdown("# GitHub → HuggingFace → AI Chat")
    gr.Markdown(f"**{_build_label()}**")
    gr.Markdown(
        "Multi-provider chat app for learning and testing across HF, GitHub Models, OpenRouter, and Fireworks."
    )
    gr.Markdown(f"**{_runtime_label()}**")
    gr.ChatInterface(
        chat_response,
        examples=[
            "What is the capital of France?",
            "Explain quantum computing in simple terms.",
            "Give me a low-cost model selection strategy for dev vs prod.",
        ],
        title=None,
        description="Ask me anything!",
    )

if __name__ == "__main__":
    # server_name="0.0.0.0" is required inside HF Space containers.
    # root_path ensures Gradio resolves JS/CSS assets correctly when running
    # behind a reverse proxy or custom domain.
    _root_path = os.getenv("GRADIO_ROOT_PATH", "").rstrip("/")
    demo.launch(server_name="0.0.0.0", root_path=_root_path)
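
# Local smoke test (assumes this file is the Space entrypoint, e.g. app.py, and a
# valid token for the chosen backend; values below are placeholders):
#   HF_TOKEN=... AI_BACKEND=hf python app.py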