wanglei19991004
diff --git a/‎.github/configs/ascend.yml‎
Lines changed: 74 additions & 0 deletions b/‎.github/configs/ascend.yml‎
Lines changed: 74 additions & 0 deletions
diff --git a/‎.github/configs/metax.yml‎
Lines changed: 42 additions & 0 deletions b/‎.github/configs/metax.yml‎
Lines changed: 42 additions & 0 deletions
diff --git a/‎.github/workflows/all_tests_ascend.yml‎
Lines changed: 30 additions & 0 deletions b/‎.github/workflows/all_tests_ascend.yml‎
Lines changed: 30 additions & 0 deletions
diff --git a/‎.github/workflows/all_tests_common.yml‎
Lines changed: 8 additions & 2 deletions b/‎.github/workflows/all_tests_common.yml‎
Lines changed: 8 additions & 2 deletions
diff --git a/‎.github/workflows/all_tests_metax.yml‎
Lines changed: 32 additions & 0 deletions b/‎.github/workflows/all_tests_metax.yml‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎.github/workflows/functional_tests_cli.yml‎
Lines changed: 72 additions & 3 deletions b/‎.github/workflows/functional_tests_cli.yml‎
Lines changed: 72 additions & 3 deletions
diff --git a/‎.github/workflows/functional_tests_inference.yml‎
Lines changed: 22 additions & 0 deletions b/‎.github/workflows/functional_tests_inference.yml‎
Lines changed: 22 additions & 0 deletions
diff --git a/‎.github/workflows/functional_tests_serve.yml‎
Lines changed: 22 additions & 0 deletions b/‎.github/workflows/functional_tests_serve.yml‎
Lines changed: 22 additions & 0 deletions
@@ -0,0 +1,74 @@
+# Ascend NPU Hardware Configuration
+# This file defines CI/CD settings for Huawei Ascend NPU-based testing
+# Test configurations are defined in tests/test_utils/config/platforms/ascend.yaml
+
+# Platform identifier and the human-readable name for this hardware
+hardware_name: ascend
+display_name: "Ascend NPU Tests"
+
+# Docker image for this hardware
+# All three entries currently point at the same image tag.
+ci_image: harbor.baai.ac.cn/flagscale/vllm-plugin-fl:v0.1.0-ascend-ci
+ci_train_image: harbor.baai.ac.cn/flagscale/vllm-plugin-fl:v0.1.0-ascend-ci
+ci_inference_image: harbor.baai.ac.cn/flagscale/vllm-plugin-fl:v0.1.0-ascend-ci
+
+# Runner labels for this hardware
+# NOTE(review): the label says npus-8 while container_options below passes
+# 16 davinci devices - confirm which count matches the runner host.
+runner_labels:
+  - self-hosted
+  - Linux
+  - ARM64
+  - ascend-72
+  - npus-8
+
+# Container volumes (hardware-specific paths)
+# Format is host_path:container_path[:ro]; the Ascend driver, add-ons and
+# npu-smi entries are mounted read-only (:ro).
+container_volumes:
+  - /home/flagscale_cicd/flask/static:/workspace/report
+  - /home/flagscale_cicd/flask/config:/workspace/config
+  - /home/flagscale_cicd/docker/docker_build/docker_data:/home/gitlab-runner/data
+  - /home/flagscale_cicd/docker/docker_build/docker_tokenizers:/home/gitlab-runner/tokenizers
+  - /usr/local/Ascend/driver:/usr/local/Ascend/driver:ro
+  - /usr/local/Ascend/add-ons:/usr/local/Ascend/add-ons:ro
+  - /usr/local/sbin/npu-smi:/usr/local/sbin/npu-smi:ro
+
+# Container options for Ascend NPU (no --gpus, use --device for NPU cards)
+# The folded scalar (>-) joins the lines below into one space-separated string.
+# Sixteen card devices (davinci0-davinci15) are listed, followed by the
+# davinci_manager, devmm_svm and hisi_hdc device nodes.
+# NOTE(review): --privileged is also set; presumably that already exposes host
+# devices, which would make the explicit --device list redundant - confirm.
+container_options: >-
+  --device /dev/davinci0
+  --device /dev/davinci1
+  --device /dev/davinci2
+  --device /dev/davinci3
+  --device /dev/davinci4
+  --device /dev/davinci5
+  --device /dev/davinci6
+  --device /dev/davinci7
+  --device /dev/davinci8
+  --device /dev/davinci9
+  --device /dev/davinci10
+  --device /dev/davinci11
+  --device /dev/davinci12
+  --device /dev/davinci13
+  --device /dev/davinci14
+  --device /dev/davinci15
+  --device /dev/davinci_manager
+  --device /dev/devmm_svm
+  --device /dev/hisi_hdc
+  --privileged
+  --ipc=host
+  --shm-size=500g
+  --hostname flagscale_cicd
+  --user root
+  --ulimit nofile=65535:65535
+
+# =============================================================================
+# Package Manager Configuration
+# =============================================================================
+# Ascend CI image has all dependencies pre-installed; use pip directly.
+pkg_mgr: "pip"
+
+# Environment path (not used for pip, kept for compatibility)
+env_path: ""
+
+# Conda environment name (not used for pip)
+# One entry per test type; all are left empty on this platform.
+env_names:
+  train: ""
+  hetero_train: ""
+  inference: ""
+  serve: ""
+  rl: ""
@@ -0,0 +1,42 @@
+# MetaX C500 Hardware Configuration
+# This file defines CI/CD settings for MetaX C500 GPU (MACA) testing
+# Test configurations are defined in tests/test_utils/config/platforms/metax.yaml
+
+# Platform identifier and the human-readable name for this hardware
+hardware_name: metax
+display_name: "MetaX C500 Tests"
+
+# Docker images for MetaX C500 (MACA-based)
+# All three entries point at the same image tag.
+# NOTE(review): localhost:5000 is presumably a registry local to the runner
+# host - confirm the image is published there on every metax-c500 runner.
+ci_image: localhost:5000/megatron-lm-with-te:202603231839
+ci_train_image: localhost:5000/megatron-lm-with-te:202603231839
+ci_inference_image: localhost:5000/megatron-lm-with-te:202603231839
+
+# Runner labels for MetaX C500 hardware
+runner_labels:
+  - self-hosted
+  - Linux
+  - X64
+  - metax-c500
+  - gpus-2
+
+# Container volumes (hardware-specific paths)
+# Format is host_path:container_path.
+container_volumes:
+  - /home/flagscale_cicd/docker/docker_build/docker_data:/home/gitlab-runner/data
+  - /home/flagscale_cicd/docker/docker_build/docker_tokenizers:/home/gitlab-runner/tokenizers
+
+# Container options for MetaX C500 (MACA runtime)
+container_options: "--hostname=flagscale-ci --ipc=host --privileged --group-add video --shm-size=100g --ulimit memlock=-1 --security-opt seccomp=unconfined --security-opt apparmor=unconfined --device=/dev/dri --device=/dev/mxcd --device=/dev/infiniband --user root --ulimit nofile=65535:65535"
+
+# =============================================================================
+# Package Manager Configuration
+# =============================================================================
+pkg_mgr: "conda"
+
+# Environment path (conda installation path)
+env_path: "/opt/conda"
+
+# Conda environment names
+# One entry per test type; an empty string means no environment name is
+# configured for that test type. The serve key is declared explicitly (empty)
+# so this file exposes the same key set as the Ascend platform config.
+env_names:
+  train: "base"
+  hetero_train: ""
+  inference: ""
+  serve: ""
+  rl: ""
@@ -0,0 +1,30 @@
+# Entry-point workflow for the Ascend platform: delegates to the shared
+# all_tests_common.yml workflow, then reports one pass/fail status.
+name: ascend_tests
+
+on:
+  push:
+    branches:
+      - main
+  pull_request:
+    branches:
+      - main
+
+# One active run per workflow + PR number (or ref) + actor; a newer run in the
+# same group cancels the one in progress.
+concurrency:
+  cancel-in-progress: true
+  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}-${{ github.actor }}
+
+jobs:
+  run_tests:
+    uses: ./.github/workflows/all_tests_common.yml
+    with:
+      platform: ascend
+
+  all_tests:
+    # always() keeps this job running when run_tests did not succeed, so the
+    # final status is still reported.
+    if: always()
+    needs: run_tests
+    runs-on: ubuntu-latest
+    steps:
+      - name: Verify workflow status
+        run: |
+          # Anything other than "success" from the reusable workflow is a failure.
+          [ "${{ needs.run_tests.result }}" = "success" ] || {
+            echo "❌ Tests workflow failed"
+            exit 1
+          }
+          echo "✅ All tests passed!"
@@ -111,11 +111,15 @@ jobs:
       container_volumes: ${{ needs.checkout_and_config.outputs.container_volumes }}
       container_options: ${{ needs.checkout_and_config.outputs.container_options }}
       source_artifact: flagscale-source-${{ github.sha }}
+      pkg_mgr: ${{ needs.checkout_and_config.outputs.pkg_mgr }}
+      env_name: ${{ needs.checkout_and_config.outputs.env_name_train }}
+      env_path: ${{ needs.checkout_and_config.outputs.env_path }}
 
   unit_tests:
     needs:
       - checkout_and_config
       - cli_validation
+    if: fromJson(needs.checkout_and_config.outputs.device_types)[0] != null
     strategy:
       fail-fast: false
       matrix:
@@ -266,12 +270,14 @@ jobs:
           # Check all test jobs (skip if not run)
           failed=false
 
-          if [ "${{ needs.unit_tests.result }}" != "success" ]; then
+          if [ "${{ needs.unit_tests.result }}" != "success" ] && \
+             [ "${{ needs.unit_tests.result }}" != "skipped" ]; then
             echo "❌ Unit tests failed"
             failed=true
           fi
 
-          if [ "${{ needs.cli_validation.result }}" != "success" ]; then
+          if [ "${{ needs.cli_validation.result }}" != "success" ] && \
+             [ "${{ needs.cli_validation.result }}" != "skipped" ]; then
             echo "❌ CLI validation failed"
             failed=true
           fi
 
@@ -0,0 +1,32 @@
+# Entry-point workflow for the MetaX C500 platform: delegates to the shared
+# all_tests_common.yml workflow, then reports one pass/fail status.
+name: metax_c500_tests
+
+on:
+  push:
+    branches:
+      - main
+  pull_request:
+    branches:
+      - main
+
+# One active run per workflow + PR number (or ref) + actor; a newer run in the
+# same group cancels the one in progress.
+concurrency:
+  cancel-in-progress: true
+  group: ${{ github.workflow }}-${{ github.event.pull_request.number || github.ref }}-${{ github.actor }}
+
+jobs:
+  run_tests:
+    # Hardware and environment settings are read from .github/configs/metax.yml
+    # Test selection is configured in tests/test_utils/config/platforms/metax.yaml
+    uses: ./.github/workflows/all_tests_common.yml
+    with:
+      platform: metax
+
+  all_tests:
+    # always() keeps this job running when run_tests did not succeed, so the
+    # final status is still reported.
+    if: always()
+    needs: run_tests
+    runs-on: ubuntu-latest
+    steps:
+      - name: Verify workflow status
+        run: |
+          # Anything other than "success" from the reusable workflow is a failure.
+          [ "${{ needs.run_tests.result }}" = "success" ] || {
+            echo "❌ Tests workflow failed"
+            exit 1
+          }
+          echo "✅ All MetaX C500 tests passed!"
@@ -23,6 +23,21 @@ on:
         required: true
         type: string
         description: Name of the artifact containing source code
+      # Optional Python environment selection; all three inputs have defaults,
+      # so callers that do not pass them get uv with /opt/venv.
+      pkg_mgr:
+        description: Package manager (pip, uv, conda). Default uv.
+        type: string
+        required: false
+        default: 'uv'
+      env_name:
+        description: Conda environment name (for conda only)
+        type: string
+        required: false
+        default: ''
+      env_path:
+        description: Environment path (venv path for uv, conda installation path for conda)
+        type: string
+        required: false
+        default: '/opt/venv'
 
 jobs:
   functional_test_cli:
@@ -93,11 +108,40 @@ jobs:
           set -euo pipefail
           cd $PROJECT_ROOT
 
-          echo "Installing FlagScale CLI (outside virtual environment)"
+          # Environment selection forwarded from the caller via workflow inputs.
+          PKG_MGR='${{ inputs.pkg_mgr }}'
+          ENV_NAME='${{ inputs.env_name }}'
+          ENV_PATH='${{ inputs.env_path }}'
+
+          echo "Installing FlagScale CLI"
+          echo "Package Manager: $PKG_MGR"
+          echo "Environment Name: $ENV_NAME"
+          echo "Environment Path: $ENV_PATH"
+
+          # Source environment utilities
+          # (presumably defines activate_conda and activate_uv_env used below)
+          source ./tools/install/utils/pyenv_utils.sh
+
+          # Activate environment based on package manager
+          case "$PKG_MGR" in
+            conda)
+              # Activation is skipped when the env name or the conda path is empty.
+              if [ -n "$ENV_NAME" ] && [ -n "$ENV_PATH" ]; then
+                activate_conda "$ENV_NAME" "$ENV_PATH" || { echo "❌ Conda activation failed"; exit 1; }
+              fi
+              ;;
+            uv)
+              # Activation is skipped when the venv path is empty or not a directory.
+              if [ -n "$ENV_PATH" ] && [ -d "$ENV_PATH" ]; then
+                activate_uv_env "$ENV_PATH" || { echo "❌ UV activation failed"; exit 1; }
+              fi
+              ;;
+            pip)
+              echo "Using system Python with pip"
+              ;;
+            *)
+              # Unrecognised values used to fall through silently; make it visible
+              # in the log while still continuing with the current interpreter.
+              echo "⚠️ Unknown package manager '$PKG_MGR'; using current Python environment" >&2
+              ;;
+          esac
+
+
           echo "Python location: $(which python)"
           echo "Python version: $(python --version)"
 
-          # Install FlagScale CLI using system pip
+          # Install FlagScale CLI
           pip install . --no-build-isolation --root-user-action=ignore || { echo "❌ FlagScale CLI install failed"; exit 1; }
 
           # Verify installation
@@ -111,7 +155,32 @@ jobs:
           set -euo pipefail
           cd $PROJECT_ROOT
 
-          echo "Validating CLI (outside virtual environment)"
+          # Environment selection forwarded from the caller via workflow inputs.
+          PKG_MGR='${{ inputs.pkg_mgr }}'
+          ENV_NAME='${{ inputs.env_name }}'
+          ENV_PATH='${{ inputs.env_path }}'
+
+          # Source environment utilities
+          # (presumably defines activate_conda and activate_uv_env used below)
+          source ./tools/install/utils/pyenv_utils.sh
+
+          # Activate environment based on package manager
+          case "$PKG_MGR" in
+            conda)
+              # Activation is skipped when the env name or the conda path is empty.
+              if [ -n "$ENV_NAME" ] && [ -n "$ENV_PATH" ]; then
+                activate_conda "$ENV_NAME" "$ENV_PATH" || { echo "❌ Conda activation failed"; exit 1; }
+              fi
+              ;;
+            uv)
+              # Activation is skipped when the venv path is empty or not a directory.
+              if [ -n "$ENV_PATH" ] && [ -d "$ENV_PATH" ]; then
+                activate_uv_env "$ENV_PATH" || { echo "❌ UV activation failed"; exit 1; }
+              fi
+              ;;
+            pip)
+              echo "Using system Python with pip"
+              ;;
+            *)
+              # Unrecognised values used to fall through silently; make it visible
+              # in the log while still continuing with the current interpreter.
+              echo "⚠️ Unknown package manager '$PKG_MGR'; using current Python environment" >&2
+              ;;
+          esac
+
+          echo "Validating CLI"
           echo "Python location: $(which python)"
           echo "Python version: $(python --version)"
 
 
@@ -115,6 +115,7 @@ jobs:
           git config --global --add safe.directory $PROJECT_ROOT
 
       - name: Setup environment for inference
+        if: inputs.platform == 'cuda'
         run: |
           set -euo pipefail
           cd $PROJECT_ROOT
@@ -164,6 +165,27 @@ jobs:
 
         timeout-minutes: 5
 
+      # Ascend-only setup: installs the pinned vllm-plugin-fl package, then
+      # FlagScale itself from $PROJECT_ROOT, and checks the CLI is on PATH.
+      - name: Install dependencies for inference ascend
+        if: inputs.platform == 'ascend'
+        timeout-minutes: 15
+        run: |
+          set -euo pipefail
+
+          # vllm-plugin-FL is resolved with the FlagOS package index as an extra index
+          if ! pip install vllm-plugin-fl==0.1.0+vllm0.13.0 \
+              --extra-index-url https://resource.flagos.net/repository/flagos-pypi-hosted/simple; then
+            echo "❌ vllm-plugin-FL install failed"
+            exit 1
+          fi
+          echo "✅ vllm-plugin-FL installed successfully"
+
+          # FlagScale is installed from the project root without build isolation
+          cd $PROJECT_ROOT
+          if ! pip install . --no-build-isolation --root-user-action=ignore; then
+            echo "❌ FlagScale CLI install failed"
+            exit 1
+          fi
+
+          # Fail early when the flagscale entry point is not on PATH
+          if ! command -v flagscale; then
+            echo "❌ FlagScale CLI not found in PATH"
+            exit 1
+          fi
+          echo "✅ FlagScale CLI installed successfully: $(flagscale --version 2>/dev/null || echo 'version unknown')"
+          echo "✅ Environment ready for inference tests"
+
       - name: Run functional tests
         id: functional_test
         run: |
 
@@ -115,6 +115,7 @@ jobs:
           git config --global --add safe.directory $PROJECT_ROOT
 
       - name: Install dependencies for serve
+        if: inputs.platform == 'cuda'
         run: |
           set -euo pipefail
           cd $PROJECT_ROOT
@@ -163,6 +164,27 @@ jobs:
           echo "Environment ready for serve tests"
         timeout-minutes: 5
 
+      # Ascend-only setup: installs the pinned vllm-plugin-fl package, then
+      # FlagScale itself from $PROJECT_ROOT, and checks the CLI is on PATH.
+      - name: Install dependencies for serve ascend
+        if: inputs.platform == 'ascend'
+        timeout-minutes: 15
+        run: |
+          set -euo pipefail
+
+          # vllm-plugin-FL is resolved with the FlagOS package index as an extra index
+          if ! pip install vllm-plugin-fl==0.1.0+vllm0.13.0 \
+              --extra-index-url https://resource.flagos.net/repository/flagos-pypi-hosted/simple; then
+            echo "❌ vllm-plugin-FL install failed"
+            exit 1
+          fi
+          echo "✅ vllm-plugin-FL installed successfully"
+
+          # FlagScale is installed from the project root without build isolation
+          cd $PROJECT_ROOT
+          if ! pip install . --no-build-isolation --root-user-action=ignore; then
+            echo "❌ FlagScale CLI install failed"
+            exit 1
+          fi
+
+          # Fail early when the flagscale entry point is not on PATH
+          if ! command -v flagscale; then
+            echo "❌ FlagScale CLI not found in PATH"
+            exit 1
+          fi
+          echo "✅ FlagScale CLI installed successfully: $(flagscale --version 2>/dev/null || echo 'version unknown')"
+          echo "✅ Environment ready for serve tests"
+
       - name: Run functional tests
         id: functional_test
         env: