@@ -22,38 +22,20 @@ import (
2222)
2323
2424const (
25- kindNamespace = "default"
26- semanticNamespace = "vllm-semantic-router-system"
27- gatewayNamespace = "istio-system"
28- inferenceGatewayName = "inference-gateway"
29- istioVersion = "1.28.0"
30- gatewayCRDURL = "https://github.com/kubernetes-sigs/gateway-api/releases/download/v1.2.0/standard-install.yaml"
31- inferenceCRDURL = "https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.1.0/manifests.yaml"
25+ kindNamespace = "default"
26+ semanticNamespace = "vllm-semantic-router-system"
27+ gatewayNamespace = "istio-system"
28+ istioVersion = "1.28.0"
29+ gatewayCRDURL = "https://github.com/kubernetes-sigs/gateway-api/releases/download/v1.2.0/standard-install.yaml"
30+ inferenceCRDURL = "https://github.com/kubernetes-sigs/gateway-api-inference-extension/releases/download/v1.1.0/manifests.yaml"
3231)
3332
3433type Profile struct {
35- verbose bool
36- useExisting bool
37- skipSetup bool
38- versions struct {
39- istio string
40- gateway string
41- inference string
42- inferenceController string
43- }
34+ verbose bool
4435}
4536
4637func NewProfile () * Profile {
47- p := & Profile {}
48- p .versions .istio = istioVersion
49- p .versions .gateway = gatewayCRDURL
50- p .versions .inference = inferenceCRDURL
51- ctrlURL := os .Getenv ("GAIE_CONTROLLER_URL" )
52- if ctrlURL == "" {
53- ctrlURL = inferenceCRDURL
54- }
55- p .versions .inferenceController = ctrlURL
56- return p
38+ return & Profile {}
5739}
5840
5941func (p * Profile ) Name () string {
@@ -66,16 +48,9 @@ func (p *Profile) Description() string {
6648
6749func (p * Profile ) Setup (ctx context.Context , opts * framework.SetupOptions ) error {
6850 p .verbose = opts .Verbose
69- p .useExisting = strings .EqualFold (os .Getenv ("LLMD_USE_EXISTING" ), "true" ) || os .Getenv ("LLMD_USE_EXISTING" ) == "1"
70- p .skipSetup = strings .EqualFold (os .Getenv ("LLMD_SKIP_SETUP" ), "true" ) || os .Getenv ("LLMD_SKIP_SETUP" ) == "1"
71-
72- fmt .Printf ("[Profile] llm-d setup start (istio=%s, gatewayCRD=%s, inferenceCRD=%s, controller=%s, useExisting=%v, skipSetup=%v)\n " ,
73- p .versions .istio , p .versions .gateway , p .versions .inference , p .versions .inferenceController , p .useExisting , p .skipSetup )
7451
75- if p .skipSetup {
76- fmt .Println ("[Profile] LLMD_SKIP_SETUP set; skipping deploy steps, running verification only" )
77- return p .verifyEnvironment (ctx , opts )
78- }
52+ fmt .Printf ("[Profile] llm-d setup start (istio=%s, gatewayCRD=%s, inferenceCRD=%s)\\ n" ,
53+ istioVersion , gatewayCRDURL , inferenceCRDURL )
7954
8055 rollback := []func (){}
8156 rollbackAll := func () {
@@ -221,27 +196,17 @@ func (p *Profile) Teardown(ctx context.Context, opts *framework.TeardownOptions)
221196}
222197
223198func (p * Profile ) GetTestCases () []string {
224- tests := []string {
225- "llmd-health-check" ,
226- "llmd-distributed-inference" ,
227- "llmd-auto-routing" ,
228- "llmd-failover-recovery" ,
229- "llmd-performance-baseline" ,
230- }
231- if strings .EqualFold (os .Getenv ("LLMD_PERF_SKIP" ), "true" ) || os .Getenv ("LLMD_PERF_SKIP" ) == "1" {
232- var filtered []string
233- for _ , t := range tests {
234- if t == "llmd-performance-baseline" {
235- continue
236- }
237- filtered = append (filtered , t )
238- }
239- if p .verbose {
240- fmt .Println ("[Profile] LLMD_PERF_SKIP set; skipping llmd-performance-baseline test" )
241- }
242- return filtered
199+ // Shared router testcases that we also want to validate in the llm-d environment
200+ shared := []string {
201+ "chat-completions-request" ,
202+ "chat-completions-stress-request" ,
203+ "chat-completions-progressive-stress" ,
204+ "domain-classify" ,
243205 }
244- return tests
206+
207+ // For llm-d we currently only reuse shared router testcases.
208+ // llm-d-specific HA/traffic semantics are expected to be covered in LLM-D / infra tests.
209+ return shared
245210}
246211
247212func (p * Profile ) GetServiceConfig () framework.ServiceConfig {
0 commit comments