volcano-sh · anirudh240 · Apr 1, 2026 · Apr 1, 2026 · Apr 1, 2026 · Apr 1, 2026
diff --git a/.github/workflows/build-mock-images.yml b/.github/workflows/build-mock-images.yml
@@ -0,0 +1,77 @@
+# Builds the mock inference-engine images under hack/mock-images/ and pushes
+# them to GHCR under ghcr.io/volcano-sh/.
+#
+# Triggers: pushes to main that touch hack/mock-images/** or this workflow
+# file, plus manual runs via workflow_dispatch.
+name: Build and Push Mock Images
+
+on:
+  push:
+    branches:
+      - main
+    paths:
+      - hack/mock-images/**
+      # Rebuild when the build definition itself changes.
+      - .github/workflows/build-mock-images.yml
+  workflow_dispatch:
+
+jobs:
+  build-vllm-mock:
+    # The tags below target the volcano-sh namespace; skip the job on forks,
+    # where the push to that namespace would be rejected.
+    if: github.repository_owner == 'volcano-sh'
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+      packages: write  # needed to push to GHCR with GITHUB_TOKEN
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Log in to GHCR
+        uses: docker/login-action@v3
+        with:
+          registry: ghcr.io
+          username: ${{ github.actor }}
+          password: ${{ secrets.GITHUB_TOKEN }}
+
+      - name: Build and push vllm-mock
+        uses: docker/build-push-action@v5
+        with:
+          context: hack/mock-images/vllm-mock
+          push: true
+          # `latest` is the tag the example manifests reference; the commit
+          # SHA tag is an immutable reference to the same build.
+          tags: |
+            ghcr.io/volcano-sh/vllm-mock:latest
+            ghcr.io/volcano-sh/vllm-mock:${{ github.sha }}
+
+  build-sglang-mock:
+    # The tags below target the volcano-sh namespace; skip the job on forks,
+    # where the push to that namespace would be rejected.
+    if: github.repository_owner == 'volcano-sh'
+    runs-on: ubuntu-latest
+    permissions:
+      contents: read
+      packages: write  # needed to push to GHCR with GITHUB_TOKEN
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v4
+
+      - name: Log in to GHCR
+        uses: docker/login-action@v3
+        with:
+          registry: ghcr.io
+          username: ${{ github.actor }}
+          password: ${{ secrets.GITHUB_TOKEN }}
+
+      - name: Build and push sglang-mock
+        uses: docker/build-push-action@v5
+        with:
+          context: hack/mock-images/sglang-mock
+          push: true
+          # `latest` is the moving tag; the commit SHA tag is an immutable
+          # reference to the same build.
+          tags: |
+            ghcr.io/volcano-sh/sglang-mock:latest
+            ghcr.io/volcano-sh/sglang-mock:${{ github.sha }}
diff --git a/docs/kthena/docs/assets/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml b/docs/kthena/docs/assets/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock
@@ -49,7 +49,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/docs/assets/examples/kthena-router/LLM-Mock-ds1.5b.yaml b/docs/kthena/docs/assets/examples/kthena-router/LLM-Mock-ds1.5b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/docs/assets/examples/kthena-router/LLM-Mock-ds7b.yaml b/docs/kthena/docs/assets/examples/kthena-router/LLM-Mock-ds7b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/docs/assets/examples/kthena-router/LLM-Mock.yaml b/docs/kthena/docs/assets/examples/kthena-router/LLM-Mock.yaml
@@ -2,7 +2,7 @@
 # The mock server will return a fixed response for any input.
 # You can use this mock server to test the inference router without deploying a real LLM server.
 #
-# NOTE: `ghcr.io/yaozengzeng/vllm-mock:latest` is built based on `https://github.com/YaoZengzeng/aibrix/tree/vllm-mock`.
-# Move the image to kthena registry once it's public.
+# NOTE: `ghcr.io/volcano-sh/vllm-mock:latest` is built from
+# `https://github.com/volcano-sh/kthena/tree/main/hack/mock-images/vllm-mock`.
 
 apiVersion: apps/v1
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/...a/versioned_docs/version-v0.1.0/assets/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml b/...a/versioned_docs/version-v0.1.0/assets/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock
@@ -49,7 +49,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/versioned_docs/version-v0.1.0/assets/examples/kthena-router/LLM-Mock-ds1.5b.yaml b/docs/kthena/versioned_docs/version-v0.1.0/assets/examples/kthena-router/LLM-Mock-ds1.5b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/versioned_docs/version-v0.1.0/assets/examples/kthena-router/LLM-Mock-ds7b.yaml b/docs/kthena/versioned_docs/version-v0.1.0/assets/examples/kthena-router/LLM-Mock-ds7b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/versioned_docs/version-v0.1.0/assets/examples/kthena-router/LLM-Mock.yaml b/docs/kthena/versioned_docs/version-v0.1.0/assets/examples/kthena-router/LLM-Mock.yaml
@@ -2,7 +2,7 @@
 # The mock server will return a fixed response for any input.
 # You can use this mock server to test the inference router without deploying a real LLM server.
 #
-# NOTE: `ghcr.io/yaozengzeng/vllm-mock:latest` is built based on `https://github.com/YaoZengzeng/aibrix/tree/vllm-mock`.
-# Move the image to kthena registry once it's public.
+# NOTE: `ghcr.io/volcano-sh/vllm-mock:latest` is built based on `https://github.com/volcano-sh/kthena/tree/main/hack/mock-images/vllm-mock`.
+# The image is published in the `volcano-sh` GHCR namespace by the official kthena build/publish workflow.
 
 apiVersion: apps/v1
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/...a/versioned_docs/version-v0.2.0/assets/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml b/...a/versioned_docs/version-v0.2.0/assets/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock
@@ -49,7 +49,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/versioned_docs/version-v0.2.0/assets/examples/kthena-router/LLM-Mock-ds1.5b.yaml b/docs/kthena/versioned_docs/version-v0.2.0/assets/examples/kthena-router/LLM-Mock-ds1.5b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/versioned_docs/version-v0.2.0/assets/examples/kthena-router/LLM-Mock-ds7b.yaml b/docs/kthena/versioned_docs/version-v0.2.0/assets/examples/kthena-router/LLM-Mock-ds7b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/versioned_docs/version-v0.2.0/assets/examples/kthena-router/LLM-Mock.yaml b/docs/kthena/versioned_docs/version-v0.2.0/assets/examples/kthena-router/LLM-Mock.yaml
@@ -2,7 +2,7 @@
 # The mock server will return a fixed response for any input.
 # You can use this mock server to test the inference router without deploying a real LLM server.
 #
-# NOTE: `ghcr.io/yaozengzeng/vllm-mock:latest` is built based on `https://github.com/YaoZengzeng/aibrix/tree/vllm-mock`.
-# Move the image to kthena registry once it's public.
+# NOTE: `ghcr.io/volcano-sh/vllm-mock:latest` is built based on `https://github.com/volcano-sh/kthena/tree/main/hack/mock-images/vllm-mock`.
+# The image is published in the `volcano-sh` GHCR namespace by the official kthena build/publish workflow.
 
 apiVersion: apps/v1
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/...a/versioned_docs/version-v0.3.0/assets/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml b/...a/versioned_docs/version-v0.3.0/assets/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock
@@ -49,7 +49,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/versioned_docs/version-v0.3.0/assets/examples/kthena-router/LLM-Mock-ds1.5b.yaml b/docs/kthena/versioned_docs/version-v0.3.0/assets/examples/kthena-router/LLM-Mock-ds1.5b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/versioned_docs/version-v0.3.0/assets/examples/kthena-router/LLM-Mock-ds7b.yaml b/docs/kthena/versioned_docs/version-v0.3.0/assets/examples/kthena-router/LLM-Mock-ds7b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/docs/kthena/versioned_docs/version-v0.3.0/assets/examples/kthena-router/LLM-Mock.yaml b/docs/kthena/versioned_docs/version-v0.3.0/assets/examples/kthena-router/LLM-Mock.yaml
@@ -2,7 +2,7 @@
 # The mock server will return a fixed response for any input.
 # You can use this mock server to test the inference router without deploying a real LLM server.
 #
-# NOTE: `ghcr.io/yaozengzeng/vllm-mock:latest` is built based on `https://github.com/YaoZengzeng/aibrix/tree/vllm-mock`.
-# Move the image to kthena registry once it's public.
+# NOTE: `ghcr.io/volcano-sh/vllm-mock:latest` is built based on `https://github.com/volcano-sh/kthena/tree/main/hack/mock-images/vllm-mock`.
+# The image is published in the `volcano-sh` GHCR namespace by the official kthena build/publish workflow.
 
 apiVersion: apps/v1
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml b/examples/kthena-router/LLM-Mock-ds1.5b-Canary.yaml
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock
@@ -49,7 +49,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/examples/kthena-router/LLM-Mock-ds1.5b.yaml b/examples/kthena-router/LLM-Mock-ds1.5b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/examples/kthena-router/LLM-Mock-ds7b.yaml b/examples/kthena-router/LLM-Mock-ds7b.yaml
@@ -19,7 +19,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/examples/kthena-router/LLM-Mock.yaml b/examples/kthena-router/LLM-Mock.yaml
@@ -2,7 +2,7 @@
 # The mock server will return a fixed response for any input.
 # You can use this mock server to test the inference router without deploying a real LLM server.
 #
-# NOTE: `ghcr.io/yaozengzeng/vllm-mock:latest` is built based on `https://github.com/YaoZengzeng/aibrix/tree/vllm-mock`.
-# Move the image to kthena registry once it's public.
+# NOTE: `ghcr.io/volcano-sh/vllm-mock:latest` is built based on `https://github.com/volcano-sh/kthena/tree/main/hack/mock-images/vllm-mock`.
+# The image is published in the `volcano-sh` GHCR namespace by the official kthena build/publish workflow.
 
 apiVersion: apps/v1
@@ -21,7 +21,7 @@ spec:
     spec:
       containers:
         - name: llm-engine
-          image: ghcr.io/yaozengzeng/vllm-mock:latest
+          image: ghcr.io/volcano-sh/vllm-mock:latest
           imagePullPolicy: IfNotPresent
           env:
             # specify the model name to mock

diff --git a/examples/kthena-router/ModelServing-ds1.5b-pd-disaggregation.yaml b/examples/kthena-router/ModelServing-ds1.5b-pd-disaggregation.yaml
@@ -19,7 +19,7 @@ spec:
           spec:
             containers:
               - name: leader
-                image: ghcr.io/yaozengzeng/vllm-mock:latest
+                image: ghcr.io/volcano-sh/vllm-mock:latest
                 imagePullPolicy: IfNotPresent
                 env:
                   # specify the model name to mock
@@ -39,7 +39,7 @@ spec:
           spec:
             containers:
               - name: leader
-                image: ghcr.io/yaozengzeng/vllm-mock:latest
+                image: ghcr.io/volcano-sh/vllm-mock:latest
                 imagePullPolicy: IfNotPresent
                 env:
                   # specify the model name to mock

diff --git a/hack/mock-images/sglang-mock/Dockerfile b/hack/mock-images/sglang-mock/Dockerfile
@@ -0,0 +1,18 @@
+# Image for the sglang mock server: installs the packages listed in
+# requirements.txt and runs sglang_app.py.
+FROM python:3.11-slim
+
+# Flush stdout/stderr immediately so the server's output shows up in the
+# container logs without buffering delays.
+ENV PYTHONUNBUFFERED=1
+
+WORKDIR /app
+
+# Install dependencies before copying the sources so this layer stays cached
+# when only application code changes.
+COPY requirements.txt .
+RUN pip install --no-cache-dir -r requirements.txt
+
+COPY . .
+
+CMD ["python", "sglang_app.py"]
diff --git a/hack/mock-images/sglang-mock/requirements.txt b/hack/mock-images/sglang-mock/requirements.txt
@@ -0,0 +1 @@
+flask