vllm-project
diff --git a/config/config-mcp-classifier-example.yaml b/config/config-mcp-classifier-example.yaml
Lines changed: 0 additions & 2 deletions
diff --git a/config/config.development.yaml b/config/config.development.yaml
Lines changed: 0 additions & 2 deletions
diff --git a/config/config.e2e.yaml b/config/config.e2e.yaml
Lines changed: 0 additions & 4 deletions
diff --git a/config/config.production.yaml b/config/config.production.yaml
Lines changed: 0 additions & 2 deletions
diff --git a/config/config.recipe-accuracy.yaml b/config/config.recipe-accuracy.yaml
Lines changed: 0 additions & 2 deletions
diff --git a/config/config.recipe-latency.yaml b/config/config.recipe-latency.yaml
Lines changed: 0 additions & 2 deletions
diff --git a/config/config.recipe-token-efficiency.yaml b/config/config.recipe-token-efficiency.yaml
Lines changed: 0 additions & 2 deletions
diff --git a/config/config.testing.yaml b/config/config.testing.yaml
Lines changed: 0 additions & 2 deletions
diff --git a/config/config.yaml b/config/config.yaml
Lines changed: 0 additions & 2 deletions
diff --git a/config/examples/system_prompt_example.yaml b/config/examples/system_prompt_example.yaml
Lines changed: 3 additions & 3 deletions
@@ -75,8 +75,6 @@ vllm_endpoints:
   - name: endpoint1
     address: 127.0.0.1
     port: 8000
-    models:
-      - openai/gpt-oss-20b
     weight: 1
     health_check_path: /health
 
 
@@ -29,8 +29,6 @@ vllm_endpoints:
   - name: "local-endpoint"
     address: "127.0.0.1"
     port: 8000
-    models:
-      - "test-model"
     weight: 1
 
 model_config:
 
@@ -42,15 +42,11 @@ vllm_endpoints:
   - name: "qwen-endpoint"
     address: "127.0.0.1"
     port: 8000
-    models:
-      - "Model-A"
     weight: 1
     health_check_path: "/health"
   - name: "tinyllama-endpoint"
     address: "127.0.0.1"
     port: 8001
-    models:
-      - "Model-B"
     weight: 1
     health_check_path: "/health"
 
 
@@ -34,8 +34,6 @@ vllm_endpoints:
   - name: "endpoint1"
     address: "127.0.0.1"
     port: 8000
-    models:
-      - "openai/gpt-oss-20b"
     weight: 1
 
 model_config:
 
@@ -44,8 +44,6 @@ vllm_endpoints:
   - name: "endpoint1"
     address: "127.0.0.1"
     port: 8000
-    models:
-      - "openai/gpt-oss-20b"
     weight: 1
 
 model_config:
 
@@ -39,8 +39,6 @@ vllm_endpoints:
   - name: "endpoint1"
     address: "127.0.0.1"
     port: 8000
-    models:
-      - "openai/gpt-oss-20b"
     weight: 1
 
 model_config:
 
@@ -44,8 +44,6 @@ vllm_endpoints:
   - name: "endpoint1"
     address: "127.0.0.1"
     port: 8000
-    models:
-      - "openai/gpt-oss-20b"
     weight: 1
 
 model_config:
 
@@ -30,8 +30,6 @@ vllm_endpoints:
   - name: "mock"
     address: "172.28.0.10"
     port: 8000
-    models:
-      - "openai/gpt-oss-20b"
     weight: 1
     health_check_path: "/health"
 
 
@@ -34,8 +34,6 @@ vllm_endpoints:
   - name: "endpoint1"
     address: "127.0.0.1"  # IPv4 address - REQUIRED format
     port: 8000
-    models:
-      - "openai/gpt-oss-20b"
     weight: 1
 
 model_config:
 
@@ -100,9 +100,9 @@ default_reasoning_effort: medium
 # vLLM endpoints configuration
 vllm_endpoints:
   - name: "mock"
-    address: "http://127.0.0.1:8000"
-    models:
-      - "openai/gpt-oss-20b"
+    address: "127.0.0.1"
+    port: 8000
+    weight: 1
 
 # Usage Notes:
 # 1. System prompts are automatically injected based on query classification