Spaces:

ronitraj
/

vegarl

Running

App Files Files Community

vegarl / QUICK_FIX_SCRIPT.sh

ronitraj

Deploy Space without oversized raw dataset

4fbc241 about 1 month ago

raw

history blame contribute delete

7.57 kB

	#!/bin/bash
	#
	# Quick Fix Script for InferenceGym Submission
	#
	# Applies the most critical pre-submission fixes in sequence: rewrites the
	# log format in inference.py, replaces the Dockerfile, patches
	# server/grader.py, runs the agent benchmarks, smoke-tests the Docker image
	# and writes SUBMISSION_CHECKLIST.md.
	#
	# Usage: run from the repository root, because every path the script
	# touches is relative to the current directory.
	#
	# Strict mode: abort on an unhandled command failure (-e), on use of an
	# unset variable (-u), and when any stage of a pipeline fails (pipefail).
	set -euo pipefail

	echo "🔧 InferenceGym Quick Fix Script"
	echo "================================"
	echo ""

	# 1. Fix inference.py log format
	# One in-place sed pass applying three substitutions, in this order, to
	# every line of inference.py:
	#   - rewards_str loses its surrounding "[" / "]" and uses .2f, not .4f
	#   - the score field of the summary f-string uses .2f, not .4f
	#   - the per-step reward field uses .2f, not .4f
	echo "1️⃣ Fixing inference.py log format..."
	sed -i \
		-e 's/rewards_str = "\[" + ",".join(f"{r:.4f}" for r in rewards) + "\]"/rewards_str = ",".join(f"{r:.2f}" for r in rewards)/' \
		-e 's/f"score={score:.4f} rewards={rewards_str}"/f"score={score:.2f} rewards={rewards_str}"/' \
		-e 's/f"reward={reward:.4f}/f"reward={reward:.2f}/' \
		inference.py
	echo " ✅ Log format fixed"

	# 2. Fix Dockerfile
	# Write a two-stage Dockerfile (a builder stage that pip-installs the
	# project into /install, and a runtime stage that copies it to /usr/local
	# and serves server.app:app with uvicorn on port 7860), then swap it in for
	# the existing Dockerfile, keeping the old one as Dockerfile.backup.
	echo ""
	echo "2️⃣ Fixing Dockerfile..."
	# `<<-` strips leading tabs from the body and from the terminator, so the
	# tab-indented EOF line below is recognised. The quoted delimiter keeps the
	# text literal (no parameter expansion, backslashes preserved).
	cat > Dockerfile.new <<-'EOF'
	FROM python:3.11-slim AS builder

	ENV PYTHONDONTWRITEBYTECODE=1
	ENV PYTHONUNBUFFERED=1

	WORKDIR /app

	COPY pyproject.toml README.md openenv.yaml ./
	COPY llmserve_env ./llmserve_env
	COPY server ./server
	COPY agents ./agents
	COPY rl ./rl
	COPY weights ./weights
	COPY data ./data
	COPY inference.py train.py evaluate.py ./

	RUN pip install --no-cache-dir --upgrade pip && \
	    pip install --no-cache-dir --prefix=/install .

	FROM python:3.11-slim

	ENV PYTHONDONTWRITEBYTECODE=1
	ENV PYTHONUNBUFFERED=1
	ENV ENABLE_WEB_INTERFACE=true

	WORKDIR /app

	COPY --from=builder /install /usr/local
	COPY pyproject.toml README.md openenv.yaml ./
	COPY llmserve_env ./llmserve_env
	COPY server ./server
	COPY agents ./agents
	COPY rl ./rl
	COPY weights ./weights
	COPY data ./data
	COPY inference.py train.py evaluate.py ./

	EXPOSE 7860

	HEALTHCHECK --interval=30s --timeout=5s --start-period=15s --retries=3 \
	    CMD python -c "import urllib.request; urllib.request.urlopen('http://127.0.0.1:7860/health', timeout=5)" || exit 1

	CMD ["uvicorn", "server.app:app", "--host", "0.0.0.0", "--port", "7860", "--workers", "1"]
	EOF

	# Back up only when there is something to back up: an unconditional mv of
	# a missing Dockerfile would abort the script under `set -e` and leave
	# Dockerfile.new behind.
	if [[ -f Dockerfile ]]; then
		mv Dockerfile Dockerfile.backup
		mv Dockerfile.new Dockerfile
		echo " ✅ Dockerfile fixed (backup saved as Dockerfile.backup)"
	else
		mv Dockerfile.new Dockerfile
		echo " ✅ Dockerfile created (no previous Dockerfile to back up)"
	fi

	# 3. Add precomputed baselines to grader
	echo ""
	echo "3️⃣ Adding precomputed baselines to grader..."

	#######################################
	# Insert a class docstring and a PRECOMPUTED_BASELINES table directly after
	# every line containing "class GraderEngine:" in a Python source file.
	# The file is left untouched when it already mentions
	# PRECOMPUTED_BASELINES or when no such class line is found.
	# Arguments: $1 - file to patch (default: server/grader.py)
	# Outputs:   status message on stdout; warnings and errors on stderr
	# Returns:   0 on success or no-op; non-zero if the file is missing,
	#            mktemp fails, or the Python patcher fails
	#######################################
	patch_grader() {
		local grader_file=${1:-server/grader.py}
		local patch_script
		local rc=0

		if [[ ! -f "$grader_file" ]]; then
			echo " ❌ ${grader_file} not found" >&2
			return 1
		fi

		# Use an unpredictable temp file and always remove it, even when the
		# patcher fails.
		patch_script=$(mktemp) || return 1
		# `<<-` strips the leading tabs; Python's own indentation uses spaces.
		cat > "$patch_script" <<-'EOF'
		import sys

		path = sys.argv[1]
		marker = 'class GraderEngine:'

		# Read the file
		with open(path, 'r') as f:
		    content = f.read()

		if 'PRECOMPUTED_BASELINES' in content:
		    print(" ℹ️ Precomputed baselines already exist")
		    sys.exit(0)

		lines = content.split('\n')
		new_lines = []
		patched = False
		for i, line in enumerate(lines):
		    new_lines.append(line)
		    if marker not in line:
		        continue
		    # Reuse the indentation of the existing class body (taken from the
		    # next non-blank line) so the inserted statements line up with it;
		    # fall back to four spaces deeper than the class line.
		    class_indent = line[:len(line) - len(line.lstrip())]
		    body_indent = class_indent + '    '
		    for following in lines[i + 1:]:
		        if following.strip():
		            found = following[:len(following) - len(following.lstrip())]
		            if found.startswith(class_indent) and len(found) > len(class_indent):
		                body_indent = found
		            break
		    new_lines.extend([
		        body_indent + '"""Grader engine with precomputed baselines for fast evaluation."""',
		        '',
		        body_indent + 'PRECOMPUTED_BASELINES = {',
		        body_indent + '    "static_workload": 0.55,',
		        body_indent + '    "bursty_workload": 0.48,',
		        body_indent + '    "adversarial_multitenant": 0.38,',
		        body_indent + '}',
		    ])
		    patched = True

		if not patched:
		    # Best-effort step: warn instead of claiming success, and do not
		    # rewrite the file.
		    print(" ⚠️ 'class GraderEngine:' not found; grader left unchanged", file=sys.stderr)
		    sys.exit(0)

		# Write back
		with open(path, 'w') as f:
		    f.write('\n'.join(new_lines))

		print(" ✅ Precomputed baselines added to grader")
		EOF

		python3 "$patch_script" "$grader_file" || rc=$?
		rm -f -- "$patch_script"
		return "$rc"
	}

	patch_grader

	# 4. Run benchmarks
	echo ""
	echo "4️⃣ Running benchmarks (this may take 5-10 minutes)..."

	# Number of benchmark commands that exited non-zero.
	failed_benchmarks=0

	#######################################
	# Run one benchmark command, capturing its stdout and stderr in a file.
	# Best-effort: a failing command is reported and counted, never fatal.
	# Globals:   failed_benchmarks (incremented on failure)
	# Arguments: $1  - label used in the failure message
	#            $2  - output file
	#            $3+ - command to run, with its arguments
	# Outputs:   a warning on stdout when the command fails
	# Returns:   0 always
	#######################################
	run_benchmark() {
		local label=$1
		local outfile=$2
		shift 2
		# NOTE(review): stderr is merged into the .json file, so warnings or
		# tracebacks can end up mixed with the results - confirm this is wanted.
		if ! "$@" > "$outfile" 2>&1; then
			echo " ⚠️ ${label} agent failed"
			failed_benchmarks=$((failed_benchmarks + 1))
		fi
		return 0
	}

	echo " Running random agent..."
	run_benchmark "Random" benchmark_random.json \
		python3 agents/random_agent.py --episodes 10

	echo " Running heuristic agent..."
	run_benchmark "Heuristic" benchmark_heuristic.json \
		python3 agents/heuristic_agent.py --episodes 10

	echo " Running PPO agent..."
	run_benchmark "PPO" benchmark_ppo.json \
		python3 evaluate.py --agent ppo --task all --episodes 10

	# Only claim success when every benchmark actually succeeded.
	if ((failed_benchmarks == 0)); then
		echo " ✅ Benchmarks complete (results saved to benchmark_*.json)"
	else
		echo " ⚠️ Benchmarks finished with ${failed_benchmarks} failure(s) (output saved to benchmark_*.json)"
	fi

	# 5. Test Docker build
	echo ""
	echo "5️⃣ Testing Docker build..."

	#######################################
	# Build the image from the current directory, start a throwaway container
	# and probe its /health endpoint. Best-effort: every failure is reported
	# and the function still returns 0 so the remaining steps keep running.
	# Outputs: progress on stdout; build output goes to docker_build.log
	# Returns: 0 always
	#######################################
	test_docker_build() {
		local image=inferencegym-test
		local container=inferencegym-test
		local health_url=http://localhost:7860/health
		local max_attempts=15
		local attempt
		local healthy=0

		if ! command -v docker &> /dev/null; then
			echo " ⚠️ Docker not found, skipping Docker test"
			return 0
		fi

		echo " Building Docker image (this may take 5-10 minutes)..."
		# Test the command directly: with `set -e` active, a separate `$?`
		# check is never reached after a failed build.
		if ! docker build -t "$image" . > docker_build.log 2>&1; then
			echo " ❌ Docker build failed (see docker_build.log)"
			return 0
		fi
		echo " ✅ Docker build successful"

		echo " Testing Docker run..."
		# Remove any container left over from an earlier, interrupted run;
		# failure just means there was none.
		docker rm -f "$container" > /dev/null 2>&1 || true
		if ! docker run -d --name "$container" -p 7860:7860 "$image"; then
			echo " ⚠️ Docker container failed to start"
			return 0
		fi

		# Poll rather than sleep once: stop as soon as the server answers and
		# give slow starts up to max_attempts * 2 seconds. -f makes curl fail
		# on HTTP error responses instead of treating them as healthy.
		for ((attempt = 1; attempt <= max_attempts; attempt++)); do
			if curl -sf "$health_url" > /dev/null; then
				healthy=1
				break
			fi
			sleep 2
		done

		if ((healthy)); then
			echo " ✅ Docker container running and healthy"
		else
			echo " ⚠️ Docker container not responding to /health"
		fi

		# Cleanup is best-effort and must run whether or not the probe passed.
		docker stop "$container" > /dev/null 2>&1 || true
		docker rm "$container" > /dev/null 2>&1 || true
		return 0
	}

	test_docker_build

	# 6. Create submission checklist
	# Writes (overwriting any existing copy) SUBMISSION_CHECKLIST.md in the
	# current directory. The text is static: the quoted delimiter disables all
	# expansion, and `<<-` strips leading tabs so the tab-indented body and
	# terminator below are recognised.
	echo ""
	echo "6️⃣ Creating submission checklist..."
	cat > SUBMISSION_CHECKLIST.md <<-'EOF'
	# InferenceGym Submission Checklist

	## Pre-Submission Tests

	- [ ] `docker build -t inferencegym .` succeeds
	- [ ] `docker run -p 7860:7860 inferencegym` starts without errors
	- [ ] `curl http://localhost:7860/health` returns `{"status":"ok"}`
	- [ ] `curl -X POST http://localhost:7860/reset -d '{}'` returns valid observation
	- [ ] `curl -X POST http://localhost:7860/step -d '{"batch_cap":32,...}'` works
	- [ ] `curl http://localhost:7860/tasks` lists 3 tasks
	- [ ] `curl -X POST http://localhost:7860/grader` returns score in [0.0, 1.0]
	- [ ] `python inference.py` completes without errors
	- [ ] `python inference.py` emits [START], [STEP], [END] logs correctly
	- [ ] `python inference.py` completes in <20 minutes
	- [ ] All 3 PPO weight files exist in `weights/`
	- [ ] `openenv.yaml` is valid
	- [ ] README.md has real benchmark numbers (not placeholders)

	## HuggingFace Space Deployment

	- [ ] Create new HF Space with `sdk: docker`
	- [ ] Set `app_port: 7860`
	- [ ] Add tag `openenv` to Space metadata
	- [ ] Push repo to HF Space
	- [ ] Wait for build to complete
	- [ ] Test Space URL: `curl https://your-space.hf.space/health`
	- [ ] Run `openenv validate --url https://your-space.hf.space`
	- [ ] Fix any validation errors

	## Environment Variables (Optional)

	If testing with OpenAI API:
	- [ ] Set `API_BASE_URL`
	- [ ] Set `MODEL_NAME`
	- [ ] Set `HF_TOKEN`
	- [ ] Test: `python inference.py` uses LLM agent

	## Final Verification

	- [ ] All files committed to git
	- [ ] No sensitive data (API keys) in repo
	- [ ] README is clear and complete
	- [ ] Description.md has real benchmark results
	- [ ] No TODO or FIXME comments in critical files
	- [ ] All tests pass: `pytest -q`

	## Submission

	- [ ] Submit HF Space URL to competition portal
	- [ ] Verify submission received
	- [ ] Monitor Space logs for errors
	- [ ] Join Discord for updates

	---

	Estimated Time to Complete: 2-3 hours
	Deadline: April 8, 2026 11:59 PM
	Current Date: April 8, 2026

	⚠️ You have less than 12 hours remaining!
	EOF

	echo " ✅ Submission checklist created (SUBMISSION_CHECKLIST.md)"

	# Closing summary: one printf call emits each argument on its own line;
	# the empty arguments produce the blank separator lines.
	printf '%s\n' \
		"" \
		"✅ Quick fixes complete!" \
		"" \
		"📋 Next steps:" \
		" 1. Review CRITICAL_ISSUES_ANALYSIS.md for detailed issues" \
		" 2. Review SUBMISSION_CHECKLIST.md for final checks" \
		" 3. Update README.md with benchmark results from benchmark_*.json" \
		" 4. Test Docker build and run" \
		" 5. Deploy to HuggingFace Space" \
		" 6. Run openenv validate" \
		" 7. Submit!" \
		"" \
		"⏰ Time remaining: ~11 hours until deadline" \
		""