Commit ·
4e751f3
1
Parent(s): fbc77a0
Remove all auth to fix GPU connection
Browse files
- src/inference/qwen.rs +1 -6
src/inference/qwen.rs
CHANGED
|
@@ -6,15 +6,10 @@ use serde_json::Value;
|
|
| 6 |
pub async fn generate(redacted_prompt: &str) -> Result<(String, String, String)> {
|
| 7 |
let vllm_url = std::env::var("VLLM_URL")
|
| 8 |
.unwrap_or_else(|_| "http://localhost:8000/v1/completions".to_string());
|
| 9 |
-
let api_key = std::env::var("VLLM_API_KEY")
|
| 10 |
-
.unwrap_or_else(|_| "abc-123".to_string());
|
| 11 |
-
|
| 12 |
-
// Append API key as query parameter (ngrok-friendly)
|
| 13 |
-
let url_with_key = format!("{}?api_key={}", vllm_url, api_key);
|
| 14 |
|
| 15 |
let client = reqwest::Client::new();
|
| 16 |
let resp = client
|
| 17 |
-
.post(&url_with_key)
|
| 18 |
.header("ngrok-skip-browser-warning", "true")
|
| 19 |
.json(&serde_json::json!({
|
| 20 |
"model": "Qwen/Qwen2.5-7B-Instruct",
|
|
|
|
| 6 |
pub async fn generate(redacted_prompt: &str) -> Result<(String, String, String)> {
|
| 7 |
let vllm_url = std::env::var("VLLM_URL")
|
| 8 |
.unwrap_or_else(|_| "http://localhost:8000/v1/completions".to_string());
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 9 |
|
| 10 |
let client = reqwest::Client::new();
|
| 11 |
let resp = client
|
| 12 |
+
.post(&vllm_url)
|
| 13 |
.header("ngrok-skip-browser-warning", "true")
|
| 14 |
.json(&serde_json::json!({
|
| 15 |
"model": "Qwen/Qwen2.5-7B-Instruct",
|