brainworm2024 committed on
Commit
4e751f3
·
1 Parent(s): fbc77a0

Remove all auth to fix GPU connection

Browse files
Files changed (1) hide show
  1. src/inference/qwen.rs +1 -6
src/inference/qwen.rs CHANGED
@@ -6,15 +6,10 @@ use serde_json::Value;
6
  pub async fn generate(redacted_prompt: &str) -> Result<(String, String, String)> {
7
  let vllm_url = std::env::var("VLLM_URL")
8
  .unwrap_or_else(|_| "http://localhost:8000/v1/completions".to_string());
9
- let api_key = std::env::var("VLLM_API_KEY")
10
- .unwrap_or_else(|_| "abc-123".to_string());
11
-
12
- // Append API key as query parameter (ngrok-friendly)
13
- let url_with_key = format!("{}?api_key={}", vllm_url, api_key);
14
 
15
  let client = reqwest::Client::new();
16
  let resp = client
17
- .post(&url_with_key)
18
  .header("ngrok-skip-browser-warning", "true")
19
  .json(&serde_json::json!({
20
  "model": "Qwen/Qwen2.5-7B-Instruct",
 
6
  pub async fn generate(redacted_prompt: &str) -> Result<(String, String, String)> {
7
  let vllm_url = std::env::var("VLLM_URL")
8
  .unwrap_or_else(|_| "http://localhost:8000/v1/completions".to_string());
 
 
 
 
 
9
 
10
  let client = reqwest::Client::new();
11
  let resp = client
12
+ .post(&vllm_url)
13
  .header("ngrok-skip-browser-warning", "true")
14
  .json(&serde_json::json!({
15
  "model": "Qwen/Qwen2.5-7B-Instruct",