diff --git a/.github/dependabot.yml b/.github/dependabot.yml
new file mode 100644
index 0000000..c7a6df3
--- /dev/null
+++ b/.github/dependabot.yml
@@ -0,0 +1,46 @@
+version: 2  # Dependabot configuration file format version
+updates:
+  - package-ecosystem: 'gomod'  # Go modules under /api-server
+    directory: '/api-server'
+    commit-message:
+      prefix: 'deps(go)'
+    schedule:
+      interval: 'weekly'
+    open-pull-requests-limit: 5
+
+  - package-ecosystem: 'npm'  # web-ui npm dependencies
+    directory: '/web-ui'
+    commit-message:
+      prefix: 'deps(web-ui)'
+    schedule:
+      interval: 'weekly'
+    open-pull-requests-limit: 5
+
+  - package-ecosystem: 'npm'  # website npm dependencies
+    directory: '/website'
+    commit-message:
+      prefix: 'deps(website)'
+    schedule:
+      interval: 'weekly'
+    open-pull-requests-limit: 5
+
+  - package-ecosystem: 'github-actions'  # action versions used by workflows
+    directory: '/'
+    commit-message:
+      prefix: 'ci'
+    schedule:
+      interval: 'weekly'
+
+  - package-ecosystem: 'docker'  # Docker images referenced under /api-server
+    directory: '/api-server'
+    commit-message:
+      prefix: 'deps(docker)'
+    schedule:
+      interval: 'weekly'
+
+  - package-ecosystem: 'docker'  # Docker images referenced under /web-ui
+    directory: '/web-ui'
+    commit-message:
+      prefix: 'deps(docker)'
+    schedule:
+      interval: 'weekly'
diff --git a/.github/workflows/build-test.yml b/.github/workflows/build-test.yml
index d1abc5c..db62134 100644
--- a/.github/workflows/build-test.yml
+++ b/.github/workflows/build-test.yml
@@ -27,7 +27,7 @@ jobs:
         uses: actions/checkout@v4
 
       - name: Set up Go
-        uses: actions/setup-go@v5
+        uses: actions/setup-go@v6
         with:
           go-version: '1.24'
           cache-dependency-path: api-server/go.sum
@@ -53,7 +53,7 @@ jobs:
         uses: actions/checkout@v4
 
       - name: Set up Go
-        uses: actions/setup-go@v5
+        uses: actions/setup-go@v6
         with:
           go-version: '1.24'
           cache-dependency-path: api-server/go.sum
diff --git a/.github/workflows/cleanup-docs-version.yml b/.github/workflows/cleanup-docs-version.yml
new file mode 100644
index 0000000..6c5473e
--- /dev/null
+++ b/.github/workflows/cleanup-docs-version.yml
@@ -0,0 +1,154 @@
+name: Cleanup Documentation Version
+
+# When a GitHub release is deleted, remove the matching documentation version:
+# its entry in website/versions.json, its versioned_docs directory and its
+# versioned sidebar file. The result is committed and pushed to main.
+on:
+  release:
+    types: [deleted]
+
+permissions:
+  contents: write
+
+# cancel-in-progress is false, so a run that is already editing the docs
+# version files is never cancelled by a newer run in this group.
+concurrency:
+  group: docs-versioning
+  cancel-in-progress: false
+
+jobs:
+  remove-version:
+    name: Remove Documentation Version
+    runs-on: ubuntu-latest
+
+    steps:
+      - name: Checkout repository
+        uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+          ref: main
+
+      - name: Extract version from tag
+        id: version
+        run: |
+          # Extract version from tag (v0.0.3 -> 0.0.3). The ref prefix and the
+          # optional leading "v" are stripped separately so a tag without "v"
+          # still yields a bare version rather than the whole ref.
+          TAG="${GITHUB_REF#refs/tags/}"
+          VERSION="${TAG#v}"
+          echo "version=${VERSION}" >> "$GITHUB_OUTPUT"
+          echo "Removing documentation version: ${VERSION}"
+
+      - name: Check if version exists
+        id: check
+        env:
+          # Passed through the environment so the tag text is never spliced
+          # into the script source.
+          VERSION: ${{ steps.version.outputs.version }}
+        run: |
+          # -F matches the quoted version literally (dots are not wildcards).
+          if grep -qF -- "\"${VERSION}\"" website/versions.json; then
+            echo "exists=true" >> "$GITHUB_OUTPUT"
+            echo "✅ Version ${VERSION} found in versions.json"
+          else
+            echo "exists=false" >> "$GITHUB_OUTPUT"
+            echo "⚠️  Version ${VERSION} not found, nothing to remove"
+          fi
+
+      - name: Install jq
+        if: steps.check.outputs.exists == 'true'
+        run: |
+          # Skip the apt round-trip when jq is already available.
+          if ! command -v jq >/dev/null 2>&1; then
+            sudo apt-get update
+            sudo apt-get install -y jq
+          fi
+
+      - name: Remove version from versions.json
+        if: steps.check.outputs.exists == 'true'
+        env:
+          VERSION: ${{ steps.version.outputs.version }}
+        run: |
+          echo "Current versions.json:"
+          cat website/versions.json
+
+          # Remove version from array using jq
+          jq --arg ver "${VERSION}" 'del(.[] | select(. == $ver))' website/versions.json > website/versions.json.tmp
+          mv website/versions.json.tmp website/versions.json
+
+          echo ""
+          echo "Updated versions.json:"
+          cat website/versions.json
+
+      - name: Remove versioned directories
+        if: steps.check.outputs.exists == 'true'
+        env:
+          VERSION: ${{ steps.version.outputs.version }}
+        run: |
+          # Remove versioned documentation directory
+          if [ -d "website/versioned_docs/version-${VERSION}" ]; then
+            rm -rf "website/versioned_docs/version-${VERSION}"
+            echo "✅ Removed versioned_docs/version-${VERSION}/"
+          fi
+
+          # Remove versioned sidebars file
+          if [ -f "website/versioned_sidebars/version-${VERSION}-sidebars.json" ]; then
+            rm -f "website/versioned_sidebars/version-${VERSION}-sidebars.json"
+            echo "✅ Removed versioned_sidebars/version-${VERSION}-sidebars.json"
+          fi
+
+          echo ""
+          echo "Files removed:"
+          git status --short
+
+      - name: Configure Git
+        if: steps.check.outputs.exists == 'true'
+        run: |
+          git config user.name "github-actions[bot]"
+          git config user.email "github-actions[bot]@users.noreply.github.com"
+
+      - name: Commit and push changes
+        if: steps.check.outputs.exists == 'true'
+        env:
+          VERSION: ${{ steps.version.outputs.version }}
+        run: |
+          git add website/versions.json
+          git add website/versioned_docs/
+          git add website/versioned_sidebars/
+
+          git commit -m "docs: remove version ${VERSION} [skip ci]
+
+          Auto-cleanup documentation version after release deletion ${GITHUB_REF}
+
+          - Removed version ${VERSION} from versions.json
+          - Deleted versioned_docs/version-${VERSION}/
+          - Deleted versioned_sidebars/version-${VERSION}-sidebars.json"
+
+          git push origin HEAD:main
+
+          echo "✅ Changes pushed to main branch"
+          echo "📚 Documentation version ${VERSION} has been removed"
+
+      - name: Summary
+        env:
+          VERSION: ${{ steps.version.outputs.version }}
+          EXISTS: ${{ steps.check.outputs.exists }}
+        run: |
+          {
+            echo "## Documentation Cleanup Summary"
+            echo ""
+            echo "**Version**: ${VERSION}"
+            echo "**Release**: ${GITHUB_REF}"
+            echo ""
+
+            if [ "$EXISTS" == "true" ]; then
+              echo "✅ **Status**: Documentation version removed successfully"
+              echo ""
+              echo "**Removed files**:"
+              echo "- \`versions.json\` (updated)"
+              echo "- \`versioned_docs/version-${VERSION}/\`"
+              echo "- \`versioned_sidebars/version-${VERSION}-sidebars.json\`"
+            else
+              echo "⚠️  **Status**: Version not found, nothing to remove"
+            fi
+          } >> "$GITHUB_STEP_SUMMARY"
diff --git a/.github/workflows/deploy-docs.yml b/.github/workflows/deploy-docs.yml
index 428461d..ef0f15c 100644
--- a/.github/workflows/deploy-docs.yml
+++ b/.github/workflows/deploy-docs.yml
@@ -19,13 +19,17 @@ concurrency:
   cancel-in-progress: false
 
 jobs:
-  build-docs:
-    name: Build Docusaurus
+  deploy-docs:
+    name: Build and Deploy Documentation
     runs-on: ubuntu-latest
+
     steps:
-      - name: Checkout code
+      - name: Checkout repository
         uses: actions/checkout@v4
 
+      - name: Setup Pages
+        uses: actions/configure-pages@v5
+
       - name: Setup Node.js
         uses: actions/setup-node@v4
         with:
@@ -43,75 +47,22 @@ jobs:
           cd website
           npm run build
 
-      - name: Upload build artifact
-        uses: actions/upload-artifact@v4
-        with:
-          name: docusaurus-build
-          path: website/build/
-
-  deploy-docs:
-    name: Deploy to GitHub Pages
-    needs: build-docs
-    runs-on: ubuntu-latest
-    steps:
-      - name: Checkout gh-pages branch (or create it)
-        uses: actions/checkout@v4
-        with:
-          ref: gh-pages
-          fetch-depth: 0
-        continue-on-error: true
-
-      - name: Initialize gh-pages if checkout failed
-        run: |
-          if [ ! -d ".git" ]; then
-            echo "gh-pages branch doesn't exist, creating it..."
-            git init
-            git checkout -b gh-pages
-            git remote add origin https://x-access-token:${{ secrets.GITHUB_TOKEN }}@github.com/${{ github.repository }}.git
-          fi
-
-      - name: Download docs build
-        uses: actions/download-artifact@v4
-        with:
-          name: docusaurus-build
-          path: docs-temp/
-
-      - name: Preserve Helm charts and deploy docs
+      - name: Prepare deployment
         run: |
-          # Backup existing charts/ directory if it exists
-          if [ -d "charts" ]; then
-            echo "Backing up existing charts/ directory"
-            mv charts charts-backup
-          fi
+          # Create deployment directory
+          mkdir -p _site
 
-          # Clear everything except charts-backup and .git
-          find . -maxdepth 1 ! -name charts-backup ! -name .git ! -name . ! -name .. -exec rm -rf {} +
+          # Copy Docusaurus build output
+          cp -r website/build/* _site/
 
-          # Move Docusaurus build to root
-          if [ -d "docs-temp" ] && [ "$(ls -A docs-temp)" ]; then
-            mv docs-temp/* docs-temp/.* . 2>/dev/null || mv docs-temp/* .
-            rm -rf docs-temp
-          else
-            echo "Warning: docs-temp directory is empty or doesn't exist"
-          fi
+          # Ensure .nojekyll exists (should already be in build)
+          touch _site/.nojekyll
 
-          # Restore charts/ directory
-          if [ -d "charts-backup" ]; then
-            echo "Restoring charts/ directory"
-            mv charts-backup charts
-          fi
-
-      - name: Configure Git
-        run: |
-          git config user.name "github-actions[bot]"
-          git config user.email "github-actions[bot]@users.noreply.github.com"
+      - name: Upload artifact
+        uses: actions/upload-pages-artifact@v3
+        with:
+          path: '_site'
 
-      - name: Commit and push
-        run: |
-          git add -A
-          if ! git diff --cached --quiet; then
-            git commit -m "Deploy documentation from commit ${{ github.sha }}"
-            git push origin gh-pages --force
-          else
-            echo "No changes to commit"
-          fi
+      - name: Deploy to GitHub Pages
+        id: deployment
+        uses: actions/deploy-pages@v4
diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
index 8fb8205..d9c407a 100644
--- a/.github/workflows/release.yml
+++ b/.github/workflows/release.yml
@@ -15,9 +15,74 @@ env:
   IMAGE_PREFIX: ghcr.io/${{ github.repository_owner }}/bison
 
 jobs:
+  gate:  # Go and web checks; the prepare job below lists this job under needs
+    name: Test & Lint Gate
+    runs-on: ubuntu-latest
+    steps:
+      - name: Checkout code
+        uses: actions/checkout@v4
+
+      - name: Set up Go
+        uses: actions/setup-go@v6
+        with:
+          go-version: '1.24'
+          cache-dependency-path: api-server/go.sum
+
+      - name: Go vet
+        working-directory: api-server
+        run: go vet ./...
+
+      - name: Go fmt check  # fails the job when gofmt -l lists any file
+        working-directory: api-server
+        run: |
+          if [ -n "$(gofmt -l .)" ]; then
+            echo "Go code is not formatted:"; gofmt -d .; exit 1
+          fi
+
+      - name: Go build
+        working-directory: api-server
+        run: go build ./...
+
+      - name: Go test (race + coverage)  # last line of the cover report goes to the job summary
+        working-directory: api-server
+        run: |
+          go test -race -coverprofile=coverage.out ./...
+          echo "### API coverage" >> "$GITHUB_STEP_SUMMARY"
+          go tool cover -func=coverage.out | tail -1 >> "$GITHUB_STEP_SUMMARY"
+
+      - name: Set up Node
+        uses: actions/setup-node@v4
+        with:
+          node-version: '20'
+          cache: npm
+          cache-dependency-path: web-ui/package-lock.json  # referenced here, before Web install deletes it
+
+      - name: Web install
+        working-directory: web-ui
+        # Remove the lockfile before install so platform-specific optional deps
+        # (e.g. @rollup/rollup-linux-x64-gnu) resolve on the Linux runner. A lock
+        # generated on another platform omits them and triggers npm bug #4828.
+        # This mirrors the web-ui Dockerfile.
+        run: |
+          rm -f package-lock.json
+          npm install --no-audit --no-fund
+
+      - name: Web lint
+        working-directory: web-ui
+        run: npm run lint
+
+      - name: Web test  # calls vitest through npx rather than an npm script
+        working-directory: web-ui
+        run: npx vitest run
+
+      - name: Web build
+        working-directory: web-ui
+        run: npm run build
+
   prepare:
     name: Prepare Release
     runs-on: ubuntu-latest
+    needs: gate
     outputs:
       version: ${{ steps.extract_version.outputs.version }}
     steps:
@@ -81,6 +146,12 @@ jobs:
       - name: Set up Docker Buildx
         uses: docker/setup-buildx-action@v3
 
+      - name: Set GHCR organization
+        id: ghcr
+        run: |
+          # Lowercase the repository owner for use in GHCR image names
+          echo "owner=${GITHUB_REPOSITORY_OWNER,,}" >> $GITHUB_OUTPUT
+
       - name: Log in to GitHub Container Registry
         uses: docker/login-action@v3
         with:
@@ -92,7 +163,7 @@ jobs:
         id: meta
         uses: docker/metadata-action@v5
         with:
-          images: ${{ env.IMAGE_PREFIX }}/${{ matrix.component }}
+          images: ghcr.io/${{ steps.ghcr.outputs.owner }}/bison/${{ matrix.component }}
           tags: |
             type=semver,pattern={{version}}
             type=semver,pattern={{major}}.{{minor}}
@@ -171,14 +242,19 @@ jobs:
 
           ### 🚀 Installation
 
-          #### Using Helm Repository (Recommended)
+          **Requirements:** Helm >= 3.8.0, Kubernetes >= 1.22
+
+          #### Method 1: From GHCR (Recommended)
           \`\`\`bash
-          helm repo add bison https://${{ github.repository_owner }}.github.io/Bison/
-          helm repo update
-          helm install my-bison bison/bison --version ${VERSION}
+          # Install directly from GitHub Container Registry
+          helm install my-bison oci://ghcr.io/supermarioyl/charts/bison --version ${VERSION}
+
+          # Or pull first, then install
+          helm pull oci://ghcr.io/supermarioyl/charts/bison --version ${VERSION}
+          helm install my-bison bison-${VERSION}.tgz
           \`\`\`
 
-          #### Using GitHub Release
+          #### Method 2: From GitHub Releases
           \`\`\`bash
           wget https://github.com/${{ github.repository }}/releases/download/v${VERSION}/bison-${VERSION}.tgz
           helm install my-bison bison-${VERSION}.tgz
@@ -187,14 +263,21 @@ jobs:
           ### 🐳 Docker Images
 
           \`\`\`bash
-          docker pull ghcr.io/${{ github.repository_owner }}/bison/api-server:${VERSION}
-          docker pull ghcr.io/${{ github.repository_owner }}/bison/web-ui:${VERSION}
+          docker pull ghcr.io/supermarioyl/bison/api-server:${VERSION}
+          docker pull ghcr.io/supermarioyl/bison/web-ui:${VERSION}
           \`\`\`
 
           ### 📦 What's Changed
 
           **Full Changelog**: https://github.com/${{ github.repository }}/compare/v${VERSION}...v${VERSION}
 
+          ### 📚 Documentation
+
+          Version-specific documentation will be available shortly at:
+          - 📖 [https://bison.lei6393.com/docs/${VERSION}/](https://bison.lei6393.com/docs/${VERSION}/)
+
+          > Note: Documentation versioning happens automatically after release. Allow a few minutes for the docs site to update.
+
           ---
           🤖 Generated with [GitHub Actions](https://github.com/features/actions)
           EOF
@@ -211,106 +294,99 @@ jobs:
           prerelease: false
           token: ${{ secrets.GITHUB_TOKEN }}
 
-  publish-helm-repo:
-    name: Publish to Helm Repository (GitHub Pages)
+  commit-versions:
+    name: Commit Version Updates to Main
     runs-on: ubuntu-latest
     needs: [prepare, create-release]
+    permissions:
+      contents: write
+
     steps:
-      - name: Checkout code
+      - name: Checkout repository
         uses: actions/checkout@v4
         with:
+          ref: main
           fetch-depth: 0
 
-      - name: Download Helm chart
+      - name: Download updated files
         uses: actions/download-artifact@v4
         with:
-          name: helm-chart
+          name: updated-files
           path: .
 
-      - name: Install Helm
-        uses: azure/setup-helm@v4
-        with:
-          version: 'latest'
-
       - name: Configure Git
         run: |
           git config user.name "github-actions[bot]"
           git config user.email "github-actions[bot]@users.noreply.github.com"
 
-      - name: Publish to GitHub Pages (charts/ subdirectory)
-        env:
-          VERSION: ${{ needs.prepare.outputs.version }}
-          GITHUB_TOKEN: ${{ secrets.GITHUB_TOKEN }}
+      - name: Commit and push version updates
         run: |
-          # Clone or create gh-pages branch
-          if git ls-remote --exit-code --heads origin gh-pages; then
-            echo "gh-pages branch exists, cloning..."
-            git clone --single-branch --branch gh-pages https://x-access-token:${GITHUB_TOKEN}@github.com/${{ github.repository }}.git gh-pages
-          else
-            echo "gh-pages branch does not exist, creating..."
-            mkdir gh-pages
-            cd gh-pages
-            git init
-            git checkout -b gh-pages
-            git remote add origin https://x-access-token:${GITHUB_TOKEN}@github.com/${{ github.repository }}.git
-            cd ..
-          fi
-
-          # Create charts/ directory if it doesn't exist
-          mkdir -p gh-pages/charts
-
-          # Copy Helm chart to gh-pages/charts/
-          cp bison-${VERSION}.tgz gh-pages/charts/
+          VERSION=${{ needs.prepare.outputs.version }}
 
-          # Generate or update index.yaml in charts/ directory
-          cd gh-pages/charts
-          helm repo index . --url https://${{ github.repository_owner }}.github.io/Bison/charts/
+          # Check if there are changes to commit
+          if git diff --quiet deploy/charts/bison/Chart.yaml web-ui/package.json; then
+            echo "⚠️  No changes to commit"
+            exit 0
+          fi
 
-          # Create README in charts/ directory if it doesn't exist
-          if [ ! -f README.md ]; then
-            cat <<EOF > README.md
-          # Bison Helm Chart Repository
+          git add deploy/charts/bison/Chart.yaml
+          git add web-ui/package.json
 
-          ## Usage
+          git commit -m "chore: bump version to ${VERSION} [skip ci]
 
-          Add the Helm repository:
+          Auto-updated version files from release ${GITHUB_REF}
 
-          \`\`\`bash
-          helm repo add bison https://${{ github.repository_owner }}.github.io/Bison/charts/
-          helm repo update
-          \`\`\`
+          - Updated Chart.yaml version to ${VERSION}
+          - Updated package.json version to ${VERSION}"
 
-          Search for available charts:
+          git push origin HEAD:main
 
-          \`\`\`bash
-          helm search repo bison
-          \`\`\`
+          echo "✅ Version updates committed to main branch"
 
-          Install the chart:
+      - name: Summary
+        run: |
+          VERSION=${{ needs.prepare.outputs.version }}
+          echo "## Version Update Summary" >> $GITHUB_STEP_SUMMARY
+          echo "" >> $GITHUB_STEP_SUMMARY
+          echo "**Version**: ${VERSION}" >> $GITHUB_STEP_SUMMARY
+          echo "**Release**: ${GITHUB_REF}" >> $GITHUB_STEP_SUMMARY
+          echo "" >> $GITHUB_STEP_SUMMARY
+          echo "✅ **Status**: Version files committed to main branch" >> $GITHUB_STEP_SUMMARY
+          echo "" >> $GITHUB_STEP_SUMMARY
+          echo "**Updated files**:" >> $GITHUB_STEP_SUMMARY
+          echo "- \`deploy/charts/bison/Chart.yaml\`" >> $GITHUB_STEP_SUMMARY
+          echo "- \`web-ui/package.json\`" >> $GITHUB_STEP_SUMMARY
 
-          \`\`\`bash
-          helm install my-bison bison/bison --version ${VERSION}
-          \`\`\`
+  publish-helm-repo:
+    name: Publish to Helm Repository (GHCR)
+    runs-on: ubuntu-latest
+    needs: [prepare, create-release]
+    permissions:
+      contents: read
+      packages: write
 
-          ## Available Versions
+    steps:
+      - name: Checkout repository
+        uses: actions/checkout@v4
 
-          See [index.yaml](./index.yaml) for all available versions.
-          EOF
-          fi
+      - name: Download Helm chart
+        uses: actions/download-artifact@v4
+        with:
+          name: helm-chart
+          path: .
 
-          # Return to gh-pages root
-          cd ..
+      - name: Install Helm
+        uses: azure/setup-helm@v4
+        with:
+          version: 'latest'
 
-          # Configure Git
-          git config user.name "github-actions[bot]"
-          git config user.email "github-actions[bot]@users.noreply.github.com"
+      - name: Log in to GitHub Container Registry
+        run: echo "${{ secrets.GITHUB_TOKEN }}" | helm registry login ghcr.io -u ${{ github.actor }} --password-stdin
 
-          # Commit and push
-          git add charts/
-          if git diff --cached --quiet; then
-            echo "No changes to commit"
-          else
-            git commit -m "Release Helm chart v${VERSION}"
-            git push origin gh-pages
-            echo "Successfully published Helm chart to GitHub Pages at /charts/"
-          fi
+      - name: Push Helm chart to GHCR
+        env:
+          VERSION: ${{ needs.prepare.outputs.version }}
+        run: |
+          # The owner segment of the OCI path is lowercased before pushing
+          OWNER_LC="${GITHUB_REPOSITORY_OWNER,,}"
+          helm push bison-${VERSION}.tgz oci://ghcr.io/${OWNER_LC}/charts
diff --git a/.github/workflows/version-docs.yml b/.github/workflows/version-docs.yml
new file mode 100644
index 0000000..1314da3
--- /dev/null
+++ b/.github/workflows/version-docs.yml
@@ -0,0 +1,136 @@
+name: Version Documentation
+
+# When a GitHub release is published, snapshot the docs as a new version with
+# `docusaurus docs:version` and commit the generated files to main.
+on:
+  release:
+    types: [published]
+
+permissions:
+  contents: write
+
+# cancel-in-progress is false, so a run that is already editing the docs
+# version files is never cancelled by a newer run in this group.
+concurrency:
+  group: docs-versioning
+  cancel-in-progress: false
+
+jobs:
+  create-version:
+    name: Create Documentation Version
+    runs-on: ubuntu-latest
+
+    steps:
+      - name: Checkout repository
+        uses: actions/checkout@v4
+        with:
+          fetch-depth: 0
+          ref: main
+
+      - name: Extract version from tag
+        id: version
+        run: |
+          # Extract version from tag (v0.0.3 -> 0.0.3). The ref prefix and the
+          # optional leading "v" are stripped separately so a tag without "v"
+          # still yields a bare version rather than the whole ref.
+          TAG="${GITHUB_REF#refs/tags/}"
+          VERSION="${TAG#v}"
+          echo "version=${VERSION}" >> "$GITHUB_OUTPUT"
+          echo "Creating documentation version: ${VERSION}"
+
+      - name: Check if version already exists
+        id: check
+        env:
+          # Passed through the environment so the tag text is never spliced
+          # into the script source.
+          VERSION: ${{ steps.version.outputs.version }}
+        run: |
+          # -F matches the quoted version literally (dots are not wildcards).
+          if grep -qF -- "\"${VERSION}\"" website/versions.json; then
+            echo "exists=true" >> "$GITHUB_OUTPUT"
+            echo "⚠️  Version ${VERSION} already exists in versions.json"
+          else
+            echo "exists=false" >> "$GITHUB_OUTPUT"
+            echo "✅ Version ${VERSION} not found, will create"
+          fi
+
+      - name: Setup Node.js
+        if: steps.check.outputs.exists == 'false'
+        uses: actions/setup-node@v4
+        with:
+          node-version: '20'
+          cache: 'npm'
+          cache-dependency-path: website/package-lock.json
+
+      - name: Install dependencies
+        if: steps.check.outputs.exists == 'false'
+        run: |
+          cd website
+          npm ci
+
+      - name: Create documentation version
+        if: steps.check.outputs.exists == 'false'
+        env:
+          VERSION: ${{ steps.version.outputs.version }}
+        run: |
+          cd website
+
+          echo "Running: npm run docusaurus docs:version ${VERSION}"
+          npm run docusaurus docs:version "${VERSION}"
+
+          echo "✅ Documentation version ${VERSION} created"
+          echo ""
+          echo "Files created/modified:"
+          git status --short
+
+      - name: Configure Git
+        if: steps.check.outputs.exists == 'false'
+        run: |
+          git config user.name "github-actions[bot]"
+          git config user.email "github-actions[bot]@users.noreply.github.com"
+
+      # NOTE(review): this push uses the default checkout credentials and the
+      # commit carries [skip ci]; confirm the docs site deploy is triggered by
+      # some other means, otherwise the new version will not be published.
+      - name: Commit and push changes
+        if: steps.check.outputs.exists == 'false'
+        env:
+          VERSION: ${{ steps.version.outputs.version }}
+        run: |
+          git add website/versions.json
+          git add website/versioned_docs/
+          git add website/versioned_sidebars/
+
+          git commit -m "docs: add version ${VERSION} [skip ci]
+
+          Auto-generated documentation version from release ${GITHUB_REF}
+
+          - Added version ${VERSION} to versions.json
+          - Created versioned_docs/version-${VERSION}/
+          - Created versioned_sidebars/version-${VERSION}-sidebars.json"
+
+          git push origin HEAD:main
+
+          echo "✅ Changes pushed to main branch"
+          echo "📚 Documentation will be available at: https://bison.lei6393.com/docs/${VERSION}/"
+
+      - name: Summary
+        env:
+          VERSION: ${{ steps.version.outputs.version }}
+          EXISTS: ${{ steps.check.outputs.exists }}
+        run: |
+          {
+            echo "## Documentation Versioning Summary"
+            echo ""
+            echo "**Version**: ${VERSION}"
+            echo "**Release**: ${GITHUB_REF}"
+            echo ""
+
+            if [ "$EXISTS" == "true" ]; then
+              echo "⚠️  **Status**: Version already exists, skipped"
+            else
+              echo "✅ **Status**: Documentation version created successfully"
+              echo ""
+              echo "📚 **View Documentation**: [https://bison.lei6393.com/docs/${VERSION}/](https://bison.lei6393.com/docs/${VERSION}/)"
+            fi
+          } >> "$GITHUB_STEP_SUMMARY"
diff --git a/CHANGELOG.md b/CHANGELOG.md
index 6a33766..799207f 100644
--- a/CHANGELOG.md
+++ b/CHANGELOG.md
@@ -5,6 +5,147 @@ All notable changes to the Bison project will be documented in this file.
 The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
 and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
 
+## [0.0.27] - 2026-06-19
+
+### Added — Supply-chain hygiene
+
+- Added `.github/dependabot.yml` to track updates weekly for Go modules, the web-ui and website npm trees, GitHub Actions, and the Docker base images.
+- Added `.dockerignore` for api-server and web-ui so build contexts exclude `.git`, `node_modules`, `dist`, coverage and editor files — smaller, more reproducible image builds.
+
+## [0.0.26] - 2026-06-19
+
+### Added — Availability & network hardening templates (opt-in)
+
+- Optional **PodDisruptionBudget** (`apiServer.podDisruptionBudget` / `webUI.podDisruptionBudget`) keeps a minimum replica available during voluntary disruptions (node drains).
+- Optional **HorizontalPodAutoscaler** (`apiServer.autoscaling` / `webUI.autoscaling`); when enabled, the Deployment no longer pins `replicas` so the HPA owns scaling.
+- Optional **NetworkPolicy** (`networkPolicy.enabled`) restricting api-server ingress to web-ui pods and the release namespace.
+- All three are disabled by default; `values.schema.json` extended to type-check the new keys.
+
+## [0.0.25] - 2026-06-19
+
+### Added — Chart validation
+
+- Added `values.schema.json` so Helm validates value types at install/upgrade time (e.g. a string `replicaCount` or non-boolean `enabled` now fails fast instead of being silently mis-applied). The schema type-checks known keys while remaining lenient about additions.
+- Added `kubeVersion: ">=1.22.0-0"` to `Chart.yaml` so unsupported clusters are rejected up front.
+
+## [0.0.24] - 2026-06-19
+
+### Changed — Frontend re-render reduction
+
+- `AuthProvider` and `ThemeProvider` now memoize their context value (`useMemo`) instead of allocating a fresh object every render, so consumers (and, for the theme, the whole Ant Design `ConfigProvider` subtree) no longer re-render on unrelated parent renders.
+
+## [0.0.23] - 2026-06-19
+
+### Changed — Centralized frontend error handling
+
+- Replaced the 13 duplicated `err.response?.data?.error || err.message` extraction sites (across ClusterNodes, TeamDetail, TeamCreate, Login, ResourceConfig) with the shared `getApiErrorMessage` helper. The backend error envelope shape now lives in one place, so future changes touch one file instead of thirteen.
+
+## [0.0.22] - 2026-06-19
+
+### Security — Refuse insecure defaults at startup
+
+- When `AUTH_ENABLED=true`, the server now refuses to start if `JWT_SECRET` is empty or still the built-in public default, or if `ADMIN_PASSWORD` is empty or `admin`. This prevents a production deployment from silently running with a forgeable token-signing key or the well-known default password. Auth-disabled and local development are unaffected; the Helm chart already injects randomly generated, persisted secrets. Added table-driven config validation tests.
+
+## [0.0.21] - 2026-06-19
+
+### Added — Release test/lint gate
+
+- The release workflow now runs a **Test & Lint Gate** before anything is built or published: `go vet`, `gofmt` check, `go build`, `go test -race` (with coverage in the job summary), plus web dependency install / lint / `vitest run` / build. `prepare` (and the whole publish chain) `needs` this gate, so broken code can no longer be published as a public release.
+
+### Fixed — Reproducible web build
+
+- Declared `tslib` as an explicit dependency: `echarts-for-react` imports it but doesn't declare it, so it was a phantom dependency previously satisfied only by the removed `@ant-design/pro-components`. Clean installs (`npm ci`) now build reliably.
+- Synced `package-lock.json` with `package.json` (removed stale `pro-components`, added `tslib`) so `npm ci` works.
+- Applied `gofmt` across the api-server (formatting only).
+
+## [0.0.20] - 2026-06-19
+
+### Changed — OpenCost query caching
+
+- The OpenCost client now wraps allocation queries in a 30s TTL cache that also **coalesces concurrent identical queries** (same window/aggregate/filter), so a burst of dashboard/billing requests hits OpenCost once instead of once per caller. Errors are not cached (next caller retries). Self-contained implementation — no new dependency; covered by race-tested unit tests.
+
+## [0.0.19] - 2026-06-19
+
+### Changed — Backend performance
+
+- `GET /teams` no longer issues one (discarded) OpenCost usage query per team; per-team usage is fetched on demand by the detail/dashboard endpoints. This removes an O(teams) OpenCost call storm from the team list.
+- Billing/report cost computation now resolves the resource price table **once per operation** (`loadPrices` + `costFromPrices`) instead of reading the resource-config ConfigMap for every allocation row, cutting ConfigMap reads from O(allocations) to O(1) in `ProcessBilling`, `GetTeamBill`, and `GetProjectBill`.
+
+## [0.0.18] - 2026-06-19
+
+### Fixed — Daily-consumption (burn-rate) estimate
+
+- `CalculateDailyConsumption` now divides total in-window deductions by the **actual span of deduction activity** (capped at 7 days, floored at 0.5 day) instead of a fixed 7-day denominator, which previously underestimated the burn rate and overestimated the time-to-overdue.
+- Fetches up to 400 history records (was 100) so a full week of hourly deductions isn't truncated and undercounted. Recharges and out-of-window records are correctly excluded. Added unit tests for span, floor, and exclusion behavior.
+
+## [0.0.17] - 2026-06-19
+
+### Fixed — Billing interval correctness & restart safety
+
+- Billing now gates on a persisted `lastBilledAt` timestamp (stored in the billing ConfigMap): a cycle runs only after roughly the configured interval has actually elapsed. This stops two failure modes — the hourly scheduler tick over-billing when `interval > 1h`, and a process restart re-billing a window that was already charged.
+- The first run on a fresh deployment establishes a baseline instead of billing an unknown historical window.
+- The timestamp write uses optimistic-concurrency retry; added a round-trip unit test.
+
+## [0.0.16] - 2026-06-19
+
+### Security — Configurable CORS
+
+- CORS is now configurable via `CORS_ALLOWED_ORIGINS` (comma-separated allowlist). When set, only listed origins are echoed back (with `Vary: Origin` and `Access-Control-Allow-Credentials`); other origins get no `Access-Control-Allow-Origin` and are blocked by the browser. Default (unset) preserves the previous `*` behavior, so existing deployments are unaffected until they opt in to tightening.
+
+## [0.0.15] - 2026-06-19
+
+### Security — Login hardening
+
+- **Per-IP login rate limiting**: after 5 failed attempts within 5 minutes an IP is locked out for 15 minutes (HTTP 429 + `Retry-After`), stopping unthrottled brute-force of the admin password.
+- **Constant-time credential comparison** (`crypto/subtle.ConstantTimeCompare`) for both username and password, removing the early-exit timing side channel; both comparisons always run so username validity isn't leaked.
+- Added unit tests for the limiter (block threshold, success reset, window reset).
+
+## [0.0.14] - 2026-06-19
+
+### Fixed — Helm secret persistence
+
+- The auth `Secret` now reuses the existing JWT signing key and admin password on `helm upgrade` via `lookup`, instead of regenerating them with `randAlphaNum` on every render. Previously each upgrade rotated the JWT key (invalidating all sessions) and silently changed the admin password. Fresh installs still auto-generate; explicit `auth.admin.password` / `auth.jwt.secret` and `existingSecret` continue to take precedence.
+
+## [0.0.13] - 2026-06-19
+
+### Added — Scheduler leader election
+
+- **Lease-based leader election** (`internal/leader`) guards the singleton billing/auto-recharge/alert scheduler so it runs on exactly one api-server replica at a time. This is the root fix for the duplicate-billing risk; `apiServer.replicaCount` is restored to `2` for HA.
+- The scheduler is now **re-startable** (clean `Start`/`Stop` on leadership changes), with new tests covering restart and stop-before-start safety.
+- Toggle via `LEADER_ELECTION_ENABLED` (default on); disable for single-replica / local dev.
+- Added `coordination.k8s.io/leases` (get/create/update) to the api-server RBAC.
+
+## [0.0.12] - 2026-06-19
+
+### Fixed — Billing correctness & concurrency
+
+- **Atomic balance updates**: `Recharge`, `Deduct`, auto-recharge, and overdue-marking now perform their ConfigMap read-modify-write under `retry.RetryOnConflict`, eliminating silent lost updates / balance corruption under concurrent operations.
+- **`Deduct` returns the post-write balance**, so `ProcessBilling` no longer makes a racy second read to decide suspension.
+- **Overdue marker preserved across deductions** — a deduction no longer wipes `OverdueAt`, so the grace-period clock is measured from when the balance first went negative (teams now actually suspend after the grace window instead of never).
+- **Scheduler hardening**: per-task `panic` recovery (one failing task can no longer crash the api-server) plus startup jitter to avoid multi-replica stampede.
+- **Stopgap against double-billing**: `apiServer.replicaCount` defaults to `1` until scheduler leader election lands (the scheduler runs in the api-server; 2 replicas billed tenants twice).
+
+### Changed — Performance
+
+- **K8s client** QPS/Burst raised to 50/100 (from the 5/10 default) so dashboard/billing list bursts are not client-side throttled.
+- **Web UI** route-level code splitting + Vite `manualChunks`: echarts (~1 MB) and per-page bundles now load on demand instead of shipping with every Login/Dashboard session.
+
+### Added
+
+- First backend unit tests (`calculateCost`, `Recharge`/`Deduct`, grace-period logic, concurrent-recharge race test) with a fake-clientset optimistic-concurrency harness.
+- Top-level React `ErrorBoundary` and a shared `getApiErrorMessage` utility.
+- `docs/optimization-roadmap.md` — prioritized continuous-optimization roadmap from a full-codebase audit.
+
+### Changed — Website & docs
+
+- Replaced emoji icons with inline Tabler-style SVG icons; added an interactive vector `ProductShowcase` (Dashboard / Cluster / Reports / Billing).
+- Fixed the displayed UI version (was hardcoded `v3.0.0`; now injected from `package.json`).
+- Corrected install docs: OCI path `charts/bison`, `/healthz` health check, OpenCost namespace/value keys, `replicaCount`, object names `bison-api`/`bison-web`.
+- New 1200×630 social/OG card and SEO metadata; reduced-motion + offscreen-pause for the particle background.
+- Removed the unused `@ant-design/pro-components` dependency and stray `console.log`s.
+
+> Note: versions 0.0.2–0.0.11 were release-automation version bumps without dedicated changelog entries.
+
 ## [0.0.1] - 2025-12-27
 
 ### 🎉 Initial Release
diff --git a/Makefile b/Makefile
index 9453481..62ef8b6 100644
--- a/Makefile
+++ b/Makefile
@@ -2,7 +2,7 @@
 # 基于 Capsule + OpenCost 架构
 
 # ==================== 配置 ====================
-REGISTRY ?= docker.io
+REGISTRY ?= ghcr.io/supermarioyl
 REPO ?= bison
 VERSION ?= latest
 HELM_RELEASE ?= bison
@@ -304,9 +304,8 @@ deploy: ## 部署 Bison
 	helm upgrade --install $(HELM_RELEASE) ./deploy/charts/bison \
 		--namespace $(NAMESPACE) \
 		--create-namespace \
-		--set apiServer.image.repository=$(REGISTRY)/$(REPO)/api-server \
+		--set global.imageRegistry=$(REGISTRY) \
 		--set apiServer.image.tag=$(VERSION) \
-		--set webUI.image.repository=$(REGISTRY)/$(REPO)/web-ui \
 		--set webUI.image.tag=$(VERSION)
 
 .PHONY: deploy-with-auth
@@ -316,9 +315,8 @@ deploy-with-auth: ## 部署 Bison (启用认证)
 		--create-namespace \
 		--set auth.enabled=true \
 		--set auth.admin.password=$$(openssl rand -base64 12) \
-		--set apiServer.image.repository=$(REGISTRY)/$(REPO)/api-server \
+		--set global.imageRegistry=$(REGISTRY) \
 		--set apiServer.image.tag=$(VERSION) \
-		--set webUI.image.repository=$(REGISTRY)/$(REPO)/web-ui \
 		--set webUI.image.tag=$(VERSION)
 
 .PHONY: undeploy
diff --git a/README.md b/README.md
index 17866cd..48d660a 100644
--- a/README.md
+++ b/README.md
@@ -237,29 +237,27 @@ helm install opencost opencost/opencost -n opencost --create-namespace \
 
 ### 2. Deploy Bison
 
-#### Option A: Using Helm Repository (Recommended)
+#### Option A: Using GHCR (Recommended - OCI Format)
 
 ```bash
-# Add Bison Helm repository
-helm repo add bison https://supermarioyl.github.io/Bison/charts/
-helm repo update
-
-# Install Bison
-helm install bison bison/bison \
+# Install directly from GitHub Container Registry
+helm install bison oci://ghcr.io/supermarioyl/charts/bison \
   --namespace bison-system \
   --create-namespace \
   --set auth.enabled=true \
-  --version 0.0.1
+  --version 0.0.12
 ```
 
+> **Note:** Requires Helm >= 3.8.0 for OCI support
+
 #### Option B: From GitHub Release
 
 ```bash
 # Download Helm chart from GitHub Release
-wget https://github.com/SuperMarioYL/Bison/releases/download/v0.0.1/bison-0.0.1.tgz
+wget https://github.com/SuperMarioYL/Bison/releases/download/v0.0.12/bison-0.0.12.tgz
 
 # Install from downloaded chart
-helm install bison bison-0.0.1.tgz \
+helm install bison bison-0.0.12.tgz \
   --namespace bison-system \
   --create-namespace \
   --set auth.enabled=true
@@ -288,7 +286,7 @@ kubectl get secret bison-auth -n bison-system -o jsonpath='{.data.password}' | b
 kubectl port-forward svc/bison-api 8080:8080 -n bison-system
 
 # Access API
-curl http://localhost:8080/api/v1/health
+curl http://localhost:8080/healthz
 ```
 
 ---
@@ -732,26 +730,53 @@ docker pull ghcr.io/supermarioyl/bison/web-ui:latest
 - `linux/amd64`
 - `linux/arm64`
 
-### Helm Repository
+### Helm Installation Methods
+
+Bison Helm charts are distributed via **GitHub Container Registry (GHCR)** using the OCI format, which is the modern standard for Helm 3.8+.
+
+**Requirements:**
+- Helm >= 3.8.0 (for OCI support)
+- Kubernetes >= 1.22
+
+#### Method 1: Install from GHCR (Recommended)
 
 ```bash
-# Add repository
-helm repo add bison https://supermarioyl.github.io/Bison/charts/
+# Install specific version directly from GHCR
+helm install my-bison oci://ghcr.io/supermarioyl/charts/bison --version 0.0.12
 
-# Search available versions
-helm search repo bison
+# Or pull the chart first, then install
+helm pull oci://ghcr.io/supermarioyl/charts/bison --version 0.0.12
+helm install my-bison bison-0.0.12.tgz
 
-# View chart information
-helm show chart bison/bison
-helm show values bison/bison
+# Customize installation
+helm install my-bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.12 \
+  --namespace bison-system \
+  --create-namespace \
+  --set dependencies.opencost.apiUrl=http://opencost.opencost.svc.cluster.local:9003 \
+  --set dependencies.opencost.enabled=true \
+  --set auth.enabled=true
+```
+
+#### Method 2: Install from GitHub Releases
 
-# Install specific version
-helm install my-bison bison/bison --version 0.0.1
+```bash
+# Download chart from GitHub Releases
+wget https://github.com/SuperMarioYL/Bison/releases/download/v0.0.12/bison-0.0.12.tgz
 
-# Upgrade to latest
-helm upgrade my-bison bison/bison
+# Install from downloaded file
+helm install my-bison bison-0.0.12.tgz \
+  --namespace bison-system \
+  --create-namespace
 ```
 
+**Why GHCR OCI Format?**
+- ✅ No need for separate Helm repository maintenance
+- ✅ Unified image and chart management in GHCR
+- ✅ Faster installation (direct pull from registry)
+- ✅ Better version control and immutability
+- ✅ Standard practice for Helm 3.8+
+
 ## Development
 
 ```bash
@@ -783,16 +808,16 @@ Bison uses automated GitHub Actions for releases:
    ```
 
 2. **GitHub Actions automatically**:
-   - Builds multi-platform Docker images
+   - Builds multi-platform Docker images (amd64, arm64)
    - Pushes images to GitHub Container Registry
    - Packages Helm chart
-   - Creates GitHub Release
-   - Updates Helm repository on GitHub Pages
+   - Publishes chart to GHCR (OCI format)
+   - Creates GitHub Release with chart attachment
 
 3. **Verify release**:
    - Check [GitHub Releases](https://github.com/SuperMarioYL/Bison/releases)
-   - Pull new images: `docker pull ghcr.io/supermarioyl/bison/api-server:3.1.0`
-   - Update Helm repo: `helm repo update && helm search repo bison`
+   - Pull new images: `docker pull ghcr.io/supermarioyl/bison/api-server:0.0.12`
+   - Install chart: `helm install test oci://ghcr.io/supermarioyl/charts/bison --version 0.0.12`
 
 ## Project Structure
 
diff --git a/api-server/.dockerignore b/api-server/.dockerignore
new file mode 100644
index 0000000..7106c2e
--- /dev/null
+++ b/api-server/.dockerignore
@@ -0,0 +1,11 @@
+# Keep the Docker build context small and reproducible.
+.git
+.gitignore
+.dockerignore
+Dockerfile
+dist
+bin
+*.out
+coverage.out
+.idea
+.vscode
diff --git a/api-server/cmd/main.go b/api-server/cmd/main.go
index 307caf1..8c8be80 100644
--- a/api-server/cmd/main.go
+++ b/api-server/cmd/main.go
@@ -14,6 +14,7 @@ import (
 	"github.com/bison/api-server/internal/config"
 	"github.com/bison/api-server/internal/handler"
 	"github.com/bison/api-server/internal/k8s"
+	"github.com/bison/api-server/internal/leader"
 	"github.com/bison/api-server/internal/middleware"
 	"github.com/bison/api-server/internal/opencost"
 	"github.com/bison/api-server/internal/scheduler"
@@ -71,6 +72,9 @@ func main() {
 	reportSvc := service.NewReportService(opencostClient, tenantSvc, projectSvc, billingSvc)
 	nodeSvc := service.NewNodeService(k8sClient)
 	workloadSvc := service.NewWorkloadService(k8sClient)
+	initScriptSvc := service.NewInitScriptService(k8sClient)
+	onboardingSvc := service.NewOnboardingService(k8sClient, nodeSvc, initScriptSvc)
+	configTransferSvc := service.NewConfigTransferService(billingSvc, alertSvc, resourceConfigSvc, initScriptSvc)
 
 	// Initialize scheduler
 	sched := scheduler.NewScheduler(billingSvc, balanceSvc, alertSvc)
@@ -106,6 +110,8 @@ func main() {
 	statusHandler := handler.NewStatusHandler(statusSvc)
 	nodeHandler := handler.NewNodeHandler(nodeSvc)
 	workloadHandler := handler.NewWorkloadHandler(workloadSvc, projectSvc)
+	onboardingHandler := handler.NewOnboardingHandler(onboardingSvc, initScriptSvc)
+	configTransferHandler := handler.NewConfigTransferHandler(configTransferSvc)
 
 	// Setup Gin router
 	if cfg.Mode == "release" {
@@ -115,7 +121,7 @@ func main() {
 	router := gin.New()
 	router.Use(middleware.Recovery())
 	router.Use(middleware.Logger())
-	router.Use(corsMiddleware())
+	router.Use(corsMiddleware(cfg.CORSAllowedOrigins))
 
 	// Health check endpoints
 	router.GET("/healthz", func(c *gin.Context) {
@@ -135,7 +141,9 @@ func main() {
 		// Feature flags (public)
 		api.GET("/features", func(c *gin.Context) {
 			c.JSON(http.StatusOK, gin.H{
-				"costEnabled": costSvc.IsEnabled(),
+				"costEnabled":       costSvc.IsEnabled(),
+				"capsuleEnabled":    cfg.CapsuleEnabled,
+				"prometheusEnabled": cfg.PrometheusURL != "",
 			})
 		})
 
@@ -235,6 +243,12 @@ func main() {
 			protected.POST("/nodes/:name/assign", nodeHandler.AssignNodeToTeam)
 			protected.POST("/nodes/:name/release", nodeHandler.ReleaseNode)
 
+			// Node onboarding
+			protected.POST("/nodes/onboard", onboardingHandler.StartOnboarding)
+			protected.GET("/nodes/onboard", onboardingHandler.ListOnboardingJobs)
+			protected.GET("/nodes/onboard/:jobId", onboardingHandler.GetOnboardingJob)
+			protected.DELETE("/nodes/onboard/:jobId", onboardingHandler.CancelOnboardingJob)
+
 			// System settings
 			protected.GET("/settings", settingsHandler.GetSettings)
 			protected.GET("/settings/billing", billingHandler.GetBillingConfig)
@@ -243,6 +257,25 @@ func main() {
 			protected.PUT("/settings/alerts", alertHandler.UpdateAlertConfig)
 			protected.POST("/settings/alerts/test", alertHandler.TestChannel)
 
+			// Control plane settings
+			protected.GET("/settings/control-plane", onboardingHandler.GetControlPlaneConfig)
+			protected.PUT("/settings/control-plane", onboardingHandler.UpdateControlPlaneConfig)
+			protected.POST("/settings/control-plane/test", onboardingHandler.TestControlPlaneConnection)
+
+			// Init scripts settings
+			protected.GET("/settings/init-scripts", onboardingHandler.ListInitScripts)
+			protected.POST("/settings/init-scripts", onboardingHandler.CreateInitScript)
+			protected.GET("/settings/init-scripts/:id", onboardingHandler.GetInitScript)
+			protected.PUT("/settings/init-scripts/:id", onboardingHandler.UpdateInitScript)
+			protected.DELETE("/settings/init-scripts/:id", onboardingHandler.DeleteInitScript)
+			protected.PUT("/settings/init-scripts/:id/toggle", onboardingHandler.ToggleInitScript)
+			protected.PUT("/settings/init-scripts/reorder", onboardingHandler.ReorderInitScripts)
+
+			// Configuration import/export
+			protected.GET("/settings/export", configTransferHandler.ExportConfig)
+			protected.POST("/settings/import/preview", configTransferHandler.PreviewImport)
+			protected.POST("/settings/import/apply", configTransferHandler.ApplyImport)
+
 			// Node metrics (from Prometheus)
 			protected.GET("/metrics/node/:name", settingsHandler.GetNodeMetrics)
 
@@ -268,9 +301,22 @@ func main() {
 		IdleTimeout:  60 * time.Second,
 	}
 
-	// Start scheduler
+	// Start scheduler. When leader election is enabled the singleton scheduler
+	// runs on exactly one replica at a time (guards against duplicate billing);
+	// otherwise it runs directly (single-replica / local dev).
 	ctx, cancel := context.WithCancel(context.Background())
-	sched.Start(ctx)
+	if cfg.LeaderElectionEnabled {
+		go leader.Run(ctx, k8sClient.Clientset(), service.BisonNamespace,
+			func(leaderCtx context.Context) {
+				sched.Start(leaderCtx)
+				<-leaderCtx.Done()
+				sched.Stop()
+			},
+			func() { sched.Stop() },
+		)
+	} else {
+		sched.Start(ctx)
+	}
 
 	// Start server in goroutine
 	go func() {
@@ -302,9 +348,31 @@ func main() {
 	logger.Info("Server stopped gracefully")
 }
 
-func corsMiddleware() gin.HandlerFunc {
+func corsMiddleware(allowedOrigins []string) gin.HandlerFunc {
+	// Build an O(1) lookup; "*" or an empty list means allow any origin.
+	allowAny := len(allowedOrigins) == 0
+	allowSet := make(map[string]struct{}, len(allowedOrigins))
+	for _, o := range allowedOrigins {
+		if o == "*" {
+			allowAny = true
+		}
+		allowSet[o] = struct{}{}
+	}
+
 	return func(c *gin.Context) {
-		c.Header("Access-Control-Allow-Origin", "*")
+		origin := c.GetHeader("Origin")
+
+		if allowAny {
+			c.Header("Access-Control-Allow-Origin", "*")
+		} else {
+			// Always vary on Origin so caches never replay a response across origins.
+			c.Header("Vary", "Origin")
+			if _, ok := allowSet[origin]; ok && origin != "" {
+				c.Header("Access-Control-Allow-Origin", origin)
+				c.Header("Access-Control-Allow-Credentials", "true")
+			} // otherwise no Allow-Origin is sent and the browser blocks the response
+		}
+
 		c.Header("Access-Control-Allow-Methods", "GET, POST, PUT, DELETE, OPTIONS")
 		c.Header("Access-Control-Allow-Headers", "Content-Type, Authorization")
 
diff --git a/api-server/go.mod b/api-server/go.mod
index 5e13945..a7e009b 100644
--- a/api-server/go.mod
+++ b/api-server/go.mod
@@ -6,6 +6,7 @@ require (
 	github.com/gin-gonic/gin v1.9.1
 	github.com/golang-jwt/jwt/v5 v5.2.0
 	go.uber.org/zap v1.27.0
+	golang.org/x/crypto v0.18.0
 	k8s.io/api v0.29.1
 	k8s.io/apimachinery v0.29.1
 	k8s.io/client-go v0.29.1
@@ -16,6 +17,7 @@ require (
 	github.com/chenzhuoyu/base64x v0.0.0-20221115062448-fe3a3abad311 // indirect
 	github.com/davecgh/go-spew v1.1.1 // indirect
 	github.com/emicklei/go-restful/v3 v3.11.0 // indirect
+	github.com/evanphx/json-patch v4.12.0+incompatible // indirect
 	github.com/gabriel-vasile/mimetype v1.4.2 // indirect
 	github.com/gin-contrib/sse v0.1.0 // indirect
 	github.com/go-logr/logr v1.4.1 // indirect
@@ -45,12 +47,12 @@ require (
 	github.com/onsi/ginkgo/v2 v2.15.0 // indirect
 	github.com/onsi/gomega v1.31.1 // indirect
 	github.com/pelletier/go-toml/v2 v2.0.8 // indirect
+	github.com/pkg/errors v0.9.1 // indirect
 	github.com/spf13/pflag v1.0.5 // indirect
 	github.com/twitchyliquid64/golang-asm v0.15.1 // indirect
 	github.com/ugorji/go/codec v1.2.11 // indirect
 	go.uber.org/multierr v1.11.0 // indirect
 	golang.org/x/arch v0.3.0 // indirect
-	golang.org/x/crypto v0.18.0 // indirect
 	golang.org/x/net v0.20.0 // indirect
 	golang.org/x/oauth2 v0.12.0 // indirect
 	golang.org/x/sys v0.16.0 // indirect
diff --git a/api-server/go.sum b/api-server/go.sum
index 11d916a..c59e0ea 100644
--- a/api-server/go.sum
+++ b/api-server/go.sum
@@ -10,6 +10,8 @@ github.com/davecgh/go-spew v1.1.1 h1:vj9j/u1bqnvCEfJOwUhtlOARqs3+rkHYY13jYWTU97c
 github.com/davecgh/go-spew v1.1.1/go.mod h1:J7Y8YcW2NihsgmVo/mv3lAwl/skON4iLHjSsI+c5H38=
 github.com/emicklei/go-restful/v3 v3.11.0 h1:rAQeMHw1c7zTmncogyy8VvRZwtkmkZ4FxERmMY4rD+g=
 github.com/emicklei/go-restful/v3 v3.11.0/go.mod h1:6n3XBCmQQb25CM2LCACGz8ukIrRry+4bhvbpWn3mrbc=
+github.com/evanphx/json-patch v4.12.0+incompatible h1:4onqiflcdA9EOZ4RxV643DvftH5pOlLGNtQ5lPWQu84=
+github.com/evanphx/json-patch v4.12.0+incompatible/go.mod h1:50XU6AFN0ol/bzJsmQLiYLvXMP4fmwYFNcr97nuDLSk=
 github.com/gabriel-vasile/mimetype v1.4.2 h1:w5qFW6JKBz9Y393Y4q372O9A7cUSequkh1Q7OhCmWKU=
 github.com/gabriel-vasile/mimetype v1.4.2/go.mod h1:zApsH/mKG4w07erKIaJPFiX0Tsq9BFQgN3qGY5GnNgA=
 github.com/gin-contrib/sse v0.1.0 h1:Y/yl/+YNO8GZSjAhjMsSuLt29uWRFHdHYUb5lYOV9qE=
@@ -97,6 +99,8 @@ github.com/onsi/gomega v1.31.1 h1:KYppCUK+bUgAZwHOu7EXVBKyQA6ILvOESHkn/tgoqvo=
 github.com/onsi/gomega v1.31.1/go.mod h1:y40C95dwAD1Nz36SsEnxvfFe8FFfNxzI5eJ0EYGyAy0=
 github.com/pelletier/go-toml/v2 v2.0.8 h1:0ctb6s9mE31h0/lhu+J6OPmVeDxJn+kYnJc2jZR9tGQ=
 github.com/pelletier/go-toml/v2 v2.0.8/go.mod h1:vuYfssBdrU2XDZ9bYydBu6t+6a6PYNcZljzZR9VXg+4=
+github.com/pkg/errors v0.9.1 h1:FEBLx1zS214owpjy7qsBeixbURkuhQAwrK5UwLGTwt4=
+github.com/pkg/errors v0.9.1/go.mod h1:bwawxfHBFNV+L2hUp1rHADufV3IMtnDRdf1r5NINEl0=
 github.com/pmezard/go-difflib v1.0.0 h1:4DBwDE0NGyQoBHbLQYPwSUPoCMWR5BEzIk/f1lZbAQM=
 github.com/pmezard/go-difflib v1.0.0/go.mod h1:iKH77koFhYxTK1pcRnkKkqfTogsbg7gZNVY4sRDYZ/4=
 github.com/rogpeppe/go-internal v1.10.0 h1:TMyTOH3F/DB16zRVcYyreMH6GnZZrwQVAoYjRBZyWFQ=
diff --git a/api-server/internal/config/config.go b/api-server/internal/config/config.go
index 437324d..266320d 100644
--- a/api-server/internal/config/config.go
+++ b/api-server/internal/config/config.go
@@ -4,6 +4,7 @@ import (
 	"fmt"
 	"os"
 	"strconv"
+	"strings"
 )
 
 // Config holds the API server configuration
@@ -21,19 +22,40 @@ type Config struct {
 	// External services
 	OpenCostURL   string
 	PrometheusURL string
+
+	// CORSAllowedOrigins restricts cross-origin requests. Empty means allow all
+	// origins ("*"); set a comma-separated allowlist to tighten in production.
+	CORSAllowedOrigins []string
+
+	// Feature toggles
+	CapsuleEnabled bool
+
+	// LeaderElectionEnabled gates the singleton scheduler behind a Kubernetes
+	// lease so it runs on exactly one replica. Disable for single-replica or
+	// out-of-cluster development.
+	LeaderElectionEnabled bool
 }
 
+// Built-in development defaults that MUST NOT be used in production once auth is
+// enabled — startup refuses to proceed if they are left unchanged.
+const (
+	defaultAdminPassword = "admin"
+	defaultJWTSecret     = "bison-secret-key-change-in-production"
+)
+
 // Load reads configuration from environment variables
 func Load() (*Config, error) {
 	cfg := &Config{
-		Port:          8080,
-		Mode:          "release",
-		AuthEnabled:   false,
-		AdminUsername: "admin",
-		AdminPassword: "admin",
-		JWTSecret:     "bison-secret-key-change-in-production",
-		OpenCostURL:   "",
-		PrometheusURL: "",
+		Port:                  8080,
+		Mode:                  "release",
+		AuthEnabled:           false,
+		AdminUsername:         "admin",
+		AdminPassword:         defaultAdminPassword,
+		JWTSecret:             defaultJWTSecret,
+		OpenCostURL:           "",
+		PrometheusURL:         "",
+		CapsuleEnabled:        true,
+		LeaderElectionEnabled: true,
 	}
 
 	if port := os.Getenv("PORT"); port != "" {
@@ -70,5 +92,42 @@ func Load() (*Config, error) {
 		cfg.PrometheusURL = prometheusURL
 	}
 
+	// Feature toggles
+	if capsuleEnabled := os.Getenv("CAPSULE_ENABLED"); capsuleEnabled == "false" {
+		cfg.CapsuleEnabled = false
+	}
+	if le := os.Getenv("LEADER_ELECTION_ENABLED"); le == "false" {
+		cfg.LeaderElectionEnabled = false
+	}
+
+	// CORS allowlist (comma-separated origins). Empty -> allow all.
+	if origins := os.Getenv("CORS_ALLOWED_ORIGINS"); origins != "" {
+		for _, o := range strings.Split(origins, ",") {
+			if o = strings.TrimSpace(o); o != "" {
+				cfg.CORSAllowedOrigins = append(cfg.CORSAllowedOrigins, o)
+			}
+		}
+	}
+
+	if err := cfg.validate(); err != nil {
+		return nil, err
+	}
+
 	return cfg, nil
 }
+
+// validate refuses to start with insecure defaults once authentication is enabled,
+// so a production deployment cannot accidentally run with the public default JWT
+// signing key or the well-known "admin" password.
+func (c *Config) validate() error {
+	if !c.AuthEnabled {
+		return nil
+	}
+	if c.JWTSecret == "" || c.JWTSecret == defaultJWTSecret {
+		return fmt.Errorf("refusing to start: JWT_SECRET must be set to a non-default value when AUTH_ENABLED=true")
+	}
+	if c.AdminPassword == "" || c.AdminPassword == defaultAdminPassword {
+		return fmt.Errorf("refusing to start: ADMIN_PASSWORD must be set to a non-default value when AUTH_ENABLED=true")
+	}
+	return nil
+}
diff --git a/api-server/internal/config/config_test.go b/api-server/internal/config/config_test.go
new file mode 100644
index 0000000..f55d0bf
--- /dev/null
+++ b/api-server/internal/config/config_test.go
@@ -0,0 +1,43 @@
+package config
+
+import "testing"
+
+func TestValidate(t *testing.T) {
+	cases := []struct {
+		name    string
+		cfg     Config
+		wantErr bool
+	}{
+		{
+			name: "auth disabled allows defaults",
+			cfg:  Config{AuthEnabled: false, JWTSecret: defaultJWTSecret, AdminPassword: defaultAdminPassword},
+		},
+		{
+			name:    "auth enabled rejects default jwt secret",
+			cfg:     Config{AuthEnabled: true, JWTSecret: defaultJWTSecret, AdminPassword: "strong-pass"},
+			wantErr: true,
+		},
+		{
+			name:    "auth enabled rejects empty jwt secret",
+			cfg:     Config{AuthEnabled: true, JWTSecret: "", AdminPassword: "strong-pass"},
+			wantErr: true,
+		},
+		{
+			name:    "auth enabled rejects default password",
+			cfg:     Config{AuthEnabled: true, JWTSecret: "a-real-secret", AdminPassword: defaultAdminPassword},
+			wantErr: true,
+		},
+		{
+			name: "auth enabled accepts strong values",
+			cfg:  Config{AuthEnabled: true, JWTSecret: "a-real-secret", AdminPassword: "strong-pass"},
+		},
+	}
+	for _, tc := range cases {
+		t.Run(tc.name, func(t *testing.T) {
+			err := tc.cfg.validate()
+			if (err != nil) != tc.wantErr {
+				t.Fatalf("validate() err=%v, wantErr=%v", err, tc.wantErr)
+			}
+		})
+	}
+}
diff --git a/api-server/internal/handler/auth.go b/api-server/internal/handler/auth.go
index 1705883..3841bd9 100644
--- a/api-server/internal/handler/auth.go
+++ b/api-server/internal/handler/auth.go
@@ -1,8 +1,11 @@
 package handler
 
 import (
+	"crypto/subtle"
 	"net/http"
+	"strconv"
 	"strings"
+	"sync"
 	"time"
 
 	"github.com/gin-gonic/gin"
@@ -11,12 +14,79 @@ import (
 	"github.com/bison/api-server/pkg/logger"
 )
 
+// Login brute-force protection: after maxLoginFails failed attempts from one IP
+// within loginWindow, that IP is locked out for loginBlock.
+const (
+	maxLoginFails = 5
+	loginWindow   = 5 * time.Minute
+	loginBlock    = 15 * time.Minute
+)
+
+type failRecord struct {
+	count        int
+	resetAt      time.Time
+	blockedUntil time.Time
+}
+
+// loginLimiter is a small in-memory per-IP failed-login limiter.
+type loginLimiter struct {
+	mu    sync.Mutex
+	fails map[string]*failRecord
+}
+
+func newLoginLimiter() *loginLimiter {
+	return &loginLimiter{fails: make(map[string]*failRecord)}
+}
+
+// allowed reports whether the IP may attempt a login now; if blocked it returns
+// the number of seconds to wait.
+func (l *loginLimiter) allowed(ip string, now time.Time) (bool, int) {
+	l.mu.Lock()
+	defer l.mu.Unlock()
+	rec := l.fails[ip]
+	if rec != nil && now.Before(rec.blockedUntil) {
+		return false, int(rec.blockedUntil.Sub(now).Seconds()) + 1
+	}
+	return true, 0
+}
+
+// recordFailure counts a failed login for ip, starting a fresh loginWindow when
+// none is active, and blocks the IP for loginBlock once maxLoginFails is reached.
+func (l *loginLimiter) recordFailure(ip string, now time.Time) {
+	l.mu.Lock()
+	defer l.mu.Unlock()
+	rec := l.fails[ip]
+	if rec == nil || now.After(rec.resetAt) {
+		rec = &failRecord{resetAt: now.Add(loginWindow)}
+		l.fails[ip] = rec
+	}
+	rec.count++
+	if rec.count >= maxLoginFails {
+		rec.blockedUntil = now.Add(loginBlock)
+	}
+	// Past 1024 tracked IPs, drop entries whose window and block have both expired.
+	if len(l.fails) > 1024 {
+		for k, v := range l.fails {
+			if now.After(v.resetAt) && now.After(v.blockedUntil) {
+				delete(l.fails, k)
+			}
+		}
+	}
+}
+
+func (l *loginLimiter) recordSuccess(ip string) {
+	l.mu.Lock()
+	defer l.mu.Unlock()
+	delete(l.fails, ip)
+}
+
 // AuthHandler handles authentication
 type AuthHandler struct {
 	username  string
 	password  string
 	jwtSecret []byte
 	enabled   bool
+	limiter   *loginLimiter
 }
 
 // NewAuthHandler creates a new AuthHandler
@@ -26,6 +96,7 @@ func NewAuthHandler(username, password, jwtSecret string, enabled bool) *AuthHan
 		password:  password,
 		jwtSecret: []byte(jwtSecret),
 		enabled:   enabled,
+		limiter:   newLoginLimiter(),
 	}
 }
 
@@ -44,6 +115,17 @@ type LoginResponse struct {
 
 // Login handles user login
 func (h *AuthHandler) Login(c *gin.Context) {
+	ip := c.ClientIP()
+	now := time.Now()
+
+	// Reject brute-force attempts before doing any credential work.
+	if ok, retryAfter := h.limiter.allowed(ip, now); !ok {
+		logger.Warn("Login blocked: too many failed attempts", "ip", ip, "retryAfterSec", retryAfter)
+		c.Header("Retry-After", strconv.Itoa(retryAfter))
+		c.JSON(http.StatusTooManyRequests, gin.H{"error": "登录尝试过于频繁，请稍后再试", "code": "TOO_MANY_ATTEMPTS"})
+		return
+	}
+
 	var req LoginRequest
 	if err := c.ShouldBindJSON(&req); err != nil {
 		logger.Warn("Login failed: invalid request", "error", err)
@@ -51,12 +133,17 @@ func (h *AuthHandler) Login(c *gin.Context) {
 		return
 	}
 
-	// Validate credentials
-	if req.Username != h.username || req.Password != h.password {
-		logger.Warn("Login failed: invalid credentials", "username", req.Username)
+	// Validate credentials using constant-time comparison to avoid leaking timing
+	// information. Both comparisons always run so username validity is not revealed.
+	userOK := subtle.ConstantTimeCompare([]byte(req.Username), []byte(h.username)) == 1
+	passOK := subtle.ConstantTimeCompare([]byte(req.Password), []byte(h.password)) == 1
+	if !userOK || !passOK {
+		h.limiter.recordFailure(ip, now)
+		logger.Warn("Login failed: invalid credentials", "username", req.Username, "ip", ip)
 		c.JSON(http.StatusUnauthorized, gin.H{"error": "用户名或密码错误", "code": "INVALID_CREDENTIALS"})
 		return
 	}
+	h.limiter.recordSuccess(ip)
 
 	// Generate JWT token
 	expiresAt := time.Now().Add(24 * time.Hour)
diff --git a/api-server/internal/handler/auth_test.go b/api-server/internal/handler/auth_test.go
new file mode 100644
index 0000000..3550864
--- /dev/null
+++ b/api-server/internal/handler/auth_test.go
@@ -0,0 +1,66 @@
+package handler
+
+import (
+	"testing"
+	"time"
+)
+
+func TestLoginLimiterBlocksAfterMaxFails(t *testing.T) {
+	l := newLoginLimiter()
+	now := time.Now()
+	ip := "1.2.3.4"
+
+	for i := 0; i < maxLoginFails-1; i++ {
+		l.recordFailure(ip, now)
+		if ok, _ := l.allowed(ip, now); !ok {
+			t.Fatalf("blocked too early after %d fails", i+1)
+		}
+	}
+	// The maxLoginFails-th failure triggers the block.
+	l.recordFailure(ip, now)
+	ok, retry := l.allowed(ip, now)
+	if ok {
+		t.Fatal("expected block after maxLoginFails failures")
+	}
+	if retry <= 0 {
+		t.Fatalf("expected positive Retry-After, got %d", retry)
+	}
+
+	// Block clears after loginBlock elapses.
+	if ok, _ := l.allowed(ip, now.Add(loginBlock+time.Second)); !ok {
+		t.Fatal("expected unblock after loginBlock elapsed")
+	}
+}
+
+func TestLoginLimiterSuccessResets(t *testing.T) {
+	l := newLoginLimiter()
+	now := time.Now()
+	ip := "5.6.7.8"
+
+	for i := 0; i < maxLoginFails; i++ {
+		l.recordFailure(ip, now)
+	}
+	if ok, _ := l.allowed(ip, now); ok {
+		t.Fatal("expected block")
+	}
+	// recordSuccess deletes the IP's record, which lifts even an active block.
+	l.recordSuccess(ip)
+	if ok, _ := l.allowed(ip, now); !ok {
+		t.Fatal("expected allowed after recordSuccess")
+	}
+}
+
+func TestLoginLimiterWindowResets(t *testing.T) {
+	l := newLoginLimiter()
+	now := time.Now()
+	ip := "9.9.9.9"
+
+	// A few failures, then let the window expire before reaching the threshold.
+	l.recordFailure(ip, now)
+	l.recordFailure(ip, now)
+	later := now.Add(loginWindow + time.Second)
+	l.recordFailure(ip, later) // counter resets, so this is failure #1 in a new window
+	if ok, _ := l.allowed(ip, later); !ok {
+		t.Fatal("expected allowed; window should have reset the counter")
+	}
+}
diff --git a/api-server/internal/handler/config_transfer.go b/api-server/internal/handler/config_transfer.go
new file mode 100644
index 0000000..c101a72
--- /dev/null
+++ b/api-server/internal/handler/config_transfer.go
@@ -0,0 +1,116 @@
+package handler
+
+import (
+	"encoding/json"
+	"fmt"
+	"net/http"
+	"strings"
+	"time"
+
+	"github.com/gin-gonic/gin"
+
+	"github.com/bison/api-server/internal/service"
+	"github.com/bison/api-server/pkg/logger"
+)
+
+// ConfigTransferHandler serves the configuration export, import-preview and import-apply endpoints.
+type ConfigTransferHandler struct {
+	configTransferSvc *service.ConfigTransferService // service every endpoint of this handler delegates to
+}
+
+// NewConfigTransferHandler returns a handler that serves requests through svc.
+func NewConfigTransferHandler(svc *service.ConfigTransferService) *ConfigTransferHandler {
+	handler := new(ConfigTransferHandler)
+	handler.configTransferSvc = svc
+	return handler
+}
+
+// ExportConfig streams the selected configuration sections as a JSON download.
+// Query: sections (comma-separated, default service.AllSections), includeSensitive ("true" to enable).
+func (h *ConfigTransferHandler) ExportConfig(c *gin.Context) {
+	sectionsParam := c.DefaultQuery("sections", strings.Join(service.AllSections, ","))
+	includeSensitive := c.DefaultQuery("includeSensitive", "false") == "true"
+	sections := strings.Split(sectionsParam, ",")
+	for i := range sections {
+		sections[i] = strings.TrimSpace(sections[i])
+	}
+	// Checked assertion: a non-string "username" value must not panic the request.
+	operator := "admin"
+	if username, exists := c.Get("username"); exists {
+		if name, ok := username.(string); ok {
+			operator = name
+		}
+	}
+
+	config, err := h.configTransferSvc.Export(c.Request.Context(), sections, includeSensitive, operator)
+	if err != nil {
+		logger.Error("Failed to export config", "error", err)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
+		return
+	}
+
+	data, err := json.MarshalIndent(config, "", "  ")
+	if err != nil {
+		logger.Error("Failed to marshal export config", "error", err)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": "序列化配置失败"})
+		return
+	}
+	c.Header("Content-Type", "application/json")
+	c.Header("Content-Disposition", fmt.Sprintf("attachment; filename=bison-config-%s.json", time.Now().Format("20060102-150405")))
+	c.Data(http.StatusOK, "application/json", data)
+}
+
+// PreviewImport binds an exported configuration from the JSON request body,
+// rejects it with 400 when version or sections are missing, and otherwise
+// responds with the service's preview result.
+func (h *ConfigTransferHandler) PreviewImport(c *gin.Context) {
+	var payload service.ExportConfig
+	bindErr := c.ShouldBindJSON(&payload)
+	switch {
+	case bindErr != nil:
+		c.JSON(http.StatusBadRequest, gin.H{"error": "无效的 JSON 格式: " + bindErr.Error()})
+		return
+	case payload.Version == "":
+		c.JSON(http.StatusBadRequest, gin.H{"error": "缺少 version 字段"})
+		return
+	case len(payload.Sections) == 0: // len of a nil value is 0, so this covers nil too
+		c.JSON(http.StatusBadRequest, gin.H{"error": "缺少 sections 字段"})
+		return
+	}
+
+	preview, err := h.configTransferSvc.Preview(c.Request.Context(), &payload)
+	if err != nil {
+		logger.Error("Failed to preview import", "error", err)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
+		return
+	}
+	c.JSON(http.StatusOK, preview)
+}
+
+// ApplyImport binds an import request from the JSON body and applies it through
+// the service. It answers 400 when the body cannot be bound, no section is
+// selected, or the embedded configuration lacks a version or sections.
+func (h *ConfigTransferHandler) ApplyImport(c *gin.Context) {
+	var importReq service.ImportRequest
+	bindErr := c.ShouldBindJSON(&importReq)
+	switch {
+	case bindErr != nil:
+		c.JSON(http.StatusBadRequest, gin.H{"error": "无效的请求格式: " + bindErr.Error()})
+		return
+	case len(importReq.Sections) == 0:
+		c.JSON(http.StatusBadRequest, gin.H{"error": "请选择至少一个配置模块"})
+		return
+	case importReq.Config.Version == "" || importReq.Config.Sections == nil:
+		c.JSON(http.StatusBadRequest, gin.H{"error": "无效的配置数据"})
+		return
+	}
+
+	outcome, err := h.configTransferSvc.Apply(c.Request.Context(), &importReq)
+	if err != nil {
+		logger.Error("Failed to apply import", "error", err)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
+		return
+	}
+
+	c.JSON(http.StatusOK, outcome)
+}
diff --git a/api-server/internal/handler/onboarding.go b/api-server/internal/handler/onboarding.go
new file mode 100644
index 0000000..d33b051
--- /dev/null
+++ b/api-server/internal/handler/onboarding.go
@@ -0,0 +1,276 @@
+package handler
+
+import (
+	"net/http"
+
+	"github.com/gin-gonic/gin"
+
+	"github.com/bison/api-server/internal/service"
+	"github.com/bison/api-server/pkg/logger"
+)
+
+// OnboardingHandler serves the node onboarding, control-plane settings and init-script endpoints.
+type OnboardingHandler struct {
+	onboardingSvc *service.OnboardingService // onboarding jobs and the control-plane connection test
+	initScriptSvc *service.InitScriptService // control-plane config and init script groups
+}
+
+// NewOnboardingHandler returns a handler backed by the two given services.
+func NewOnboardingHandler(onboardingSvc *service.OnboardingService, initScriptSvc *service.InitScriptService) *OnboardingHandler {
+	handler := new(OnboardingHandler)
+	handler.onboardingSvc = onboardingSvc
+	handler.initScriptSvc = initScriptSvc
+	return handler
+}
+
+// StartOnboarding starts a new node onboarding job
+// POST /api/v1/nodes/onboard
+func (h *OnboardingHandler) StartOnboarding(c *gin.Context) {
+	var req service.OnboardingRequest
+	if err := c.ShouldBindJSON(&req); err != nil {
+		c.JSON(http.StatusBadRequest, gin.H{"error": err.Error()})
+		return
+	}
+
+	job, err := h.onboardingSvc.StartOnboarding(c.Request.Context(), &req)
+	if err != nil {
+		logger.Error("Failed to start onboarding", "error", err)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
+		return
+	}
+
+	c.JSON(http.StatusAccepted, job)
+}
+
+// GetOnboardingJob looks up the onboarding job named by the :jobId path
+// parameter; any lookup error is reported as 404.
+// GET /api/v1/nodes/onboard/:jobId
+func (h *OnboardingHandler) GetOnboardingJob(c *gin.Context) {
+	id := c.Param("jobId")
+	found, lookupErr := h.onboardingSvc.GetJob(c.Request.Context(), id)
+	if lookupErr == nil {
+		c.JSON(http.StatusOK, found)
+		return
+	}
+
+	c.JSON(http.StatusNotFound, gin.H{"error": lookupErr.Error()})
+}
+
+// ListOnboardingJobs responds with every onboarding job under the "items" key.
+// GET /api/v1/nodes/onboard
+func (h *OnboardingHandler) ListOnboardingJobs(c *gin.Context) {
+	all, listErr := h.onboardingSvc.ListJobs(c.Request.Context())
+	if listErr == nil {
+		c.JSON(http.StatusOK, gin.H{"items": all})
+		return
+	}
+
+	logger.Error("Failed to list onboarding jobs", "error", listErr)
+	c.JSON(http.StatusInternalServerError, gin.H{"error": listErr.Error()})
+}
+
+// CancelOnboardingJob asks the service to cancel the job named by :jobId.
+// Any service error is reported as 500.
+// DELETE /api/v1/nodes/onboard/:jobId
+func (h *OnboardingHandler) CancelOnboardingJob(c *gin.Context) {
+	id := c.Param("jobId")
+
+	if cancelErr := h.onboardingSvc.CancelJob(c.Request.Context(), id); cancelErr != nil {
+		logger.Error("Failed to cancel onboarding job", "error", cancelErr)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": cancelErr.Error()})
+		return
+	}
+
+	c.JSON(http.StatusOK, gin.H{"message": "Job cancelled"})
+}
+
+// GetControlPlaneConfig returns the stored control plane settings. The password
+// and private key are never echoed; only has* flags reveal whether they are set.
+// GET /api/v1/settings/control-plane
+func (h *OnboardingHandler) GetControlPlaneConfig(c *gin.Context) {
+	stored, loadErr := h.initScriptSvc.GetControlPlaneConfig(c.Request.Context())
+	if loadErr != nil {
+		logger.Error("Failed to get control plane config", "error", loadErr)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": loadErr.Error()})
+		return
+	}
+
+	// Credentials are reduced to presence booleans before leaving the server.
+	hasPassword, hasPrivateKey := stored.Password != "", stored.PrivateKey != ""
+	c.JSON(http.StatusOK, gin.H{
+		"host":          stored.Host,
+		"sshPort":       stored.SSHPort,
+		"sshUser":       stored.SSHUser,
+		"authMethod":    stored.AuthMethod,
+		"hasPassword":   hasPassword,
+		"hasPrivateKey": hasPrivateKey,
+	})
+}
+
+// UpdateControlPlaneConfig saves the control plane settings from the JSON body.
+// A blank password or private key in the request keeps the stored value.
+// PUT /api/v1/settings/control-plane
+func (h *OnboardingHandler) UpdateControlPlaneConfig(c *gin.Context) {
+	var config service.ControlPlaneConfig
+	if err := c.ShouldBindJSON(&config); err != nil {
+		c.JSON(http.StatusBadRequest, gin.H{"error": err.Error()})
+		return
+	}
+	// A failed lookup is logged rather than ignored: the save then has no stored credentials to keep.
+	existing, err := h.initScriptSvc.GetControlPlaneConfig(c.Request.Context())
+	if err != nil {
+		logger.Warn("Failed to load existing control plane config", "error", err)
+	}
+	if existing != nil {
+		if config.Password == "" {
+			config.Password = existing.Password
+		}
+		if config.PrivateKey == "" {
+			config.PrivateKey = existing.PrivateKey
+		}
+	}
+	if err := h.initScriptSvc.SaveControlPlaneConfig(c.Request.Context(), &config); err != nil {
+		logger.Error("Failed to save control plane config", "error", err)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
+		return
+	}
+	c.JSON(http.StatusOK, gin.H{"message": "Control plane configuration saved"})
+}
+
+// TestControlPlaneConnection runs the service's control plane connection check
+// and reports a failure as 400 with the error text.
+// POST /api/v1/settings/control-plane/test
+func (h *OnboardingHandler) TestControlPlaneConnection(c *gin.Context) {
+	if connErr := h.onboardingSvc.TestControlPlaneConnection(c.Request.Context()); connErr != nil {
+		c.JSON(http.StatusBadRequest, gin.H{"error": connErr.Error()})
+		return
+	}
+
+	c.JSON(http.StatusOK, gin.H{"message": "Connection successful"})
+}
+
+// ListInitScripts responds with every init script group under the "items" key.
+// GET /api/v1/settings/init-scripts
+func (h *OnboardingHandler) ListInitScripts(c *gin.Context) {
+	scriptGroups, listErr := h.initScriptSvc.GetAllScriptGroups(c.Request.Context())
+	if listErr == nil {
+		c.JSON(http.StatusOK, gin.H{"items": scriptGroups})
+		return
+	}
+
+	logger.Error("Failed to list init scripts", "error", listErr)
+	c.JSON(http.StatusInternalServerError, gin.H{"error": listErr.Error()})
+}
+
+// GetInitScript looks up the init script group named by the :id path parameter;
+// any lookup error is reported as 404.
+// GET /api/v1/settings/init-scripts/:id
+func (h *OnboardingHandler) GetInitScript(c *gin.Context) {
+	groupID := c.Param("id")
+	found, lookupErr := h.initScriptSvc.GetScriptGroup(c.Request.Context(), groupID)
+	if lookupErr == nil {
+		c.JSON(http.StatusOK, found)
+		return
+	}
+
+	c.JSON(http.StatusNotFound, gin.H{"error": lookupErr.Error()})
+}
+
+// CreateInitScript binds a script group from the JSON body, creates it through
+// the service and echoes the group back with 201.
+// POST /api/v1/settings/init-scripts
+func (h *OnboardingHandler) CreateInitScript(c *gin.Context) {
+	var scriptGroup service.ScriptGroup
+	if bindErr := c.ShouldBindJSON(&scriptGroup); bindErr != nil {
+		c.JSON(http.StatusBadRequest, gin.H{"error": bindErr.Error()})
+		return
+	}
+
+	if createErr := h.initScriptSvc.CreateScriptGroup(c.Request.Context(), &scriptGroup); createErr != nil {
+		logger.Error("Failed to create init script", "error", createErr)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": createErr.Error()})
+		return
+	}
+
+	c.JSON(http.StatusCreated, scriptGroup)
+}
+
+// UpdateInitScript binds a script group from the JSON body and applies it to the
+// group named by :id, echoing the bound group back on success.
+// PUT /api/v1/settings/init-scripts/:id
+func (h *OnboardingHandler) UpdateInitScript(c *gin.Context) {
+	groupID := c.Param("id")
+	var scriptGroup service.ScriptGroup
+	if bindErr := c.ShouldBindJSON(&scriptGroup); bindErr != nil {
+		c.JSON(http.StatusBadRequest, gin.H{"error": bindErr.Error()})
+		return
+	}
+
+	updateErr := h.initScriptSvc.UpdateScriptGroup(c.Request.Context(), groupID, &scriptGroup)
+	if updateErr == nil {
+		c.JSON(http.StatusOK, scriptGroup)
+		return
+	}
+
+	logger.Error("Failed to update init script", "error", updateErr)
+	c.JSON(http.StatusInternalServerError, gin.H{"error": updateErr.Error()})
+}
+
+// DeleteInitScript asks the service to delete the script group named by :id.
+// Any service error is reported as 500.
+// DELETE /api/v1/settings/init-scripts/:id
+func (h *OnboardingHandler) DeleteInitScript(c *gin.Context) {
+	groupID := c.Param("id")
+
+	if deleteErr := h.initScriptSvc.DeleteScriptGroup(c.Request.Context(), groupID); deleteErr != nil {
+		logger.Error("Failed to delete init script", "error", deleteErr)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": deleteErr.Error()})
+		return
+	}
+
+	c.JSON(http.StatusOK, gin.H{"message": "Script group deleted"})
+}
+
+// ToggleInitScript sets the enabled flag of the script group named by :id to the
+// "enabled" value from the JSON body.
+// PUT /api/v1/settings/init-scripts/:id/toggle
+func (h *OnboardingHandler) ToggleInitScript(c *gin.Context) {
+	var body struct {
+		Enabled bool `json:"enabled"`
+	}
+	groupID := c.Param("id")
+	if bindErr := c.ShouldBindJSON(&body); bindErr != nil {
+		c.JSON(http.StatusBadRequest, gin.H{"error": bindErr.Error()})
+		return
+	}
+
+	ctx := c.Request.Context()
+	if toggleErr := h.initScriptSvc.ToggleScriptGroup(ctx, groupID, body.Enabled); toggleErr != nil {
+		logger.Error("Failed to toggle init script", "error", toggleErr)
+		c.JSON(http.StatusInternalServerError, gin.H{"error": toggleErr.Error()})
+		return
+	}
+
+	c.JSON(http.StatusOK, gin.H{"message": "Script group toggled"})
+}
+
+// ReorderInitScripts passes the "ids" list from the JSON body to the service as
+// the new ordering of init script groups.
+// PUT /api/v1/settings/init-scripts/reorder
+func (h *OnboardingHandler) ReorderInitScripts(c *gin.Context) {
+	var body struct {
+		IDs []string `json:"ids"`
+	}
+	if bindErr := c.ShouldBindJSON(&body); bindErr != nil {
+		c.JSON(http.StatusBadRequest, gin.H{"error": bindErr.Error()})
+		return
+	}
+
+	reorderErr := h.initScriptSvc.ReorderScriptGroups(c.Request.Context(), body.IDs)
+	if reorderErr == nil {
+		c.JSON(http.StatusOK, gin.H{"message": "Script groups reordered"})
+		return
+	}
+	logger.Error("Failed to reorder init scripts", "error", reorderErr)
+	c.JSON(http.StatusInternalServerError, gin.H{"error": reorderErr.Error()})
+}
diff --git a/api-server/internal/handler/settings.go b/api-server/internal/handler/settings.go
index ccdf5cb..7419710 100644
--- a/api-server/internal/handler/settings.go
+++ b/api-server/internal/handler/settings.go
@@ -32,8 +32,17 @@ func (h *SettingsHandler) GetSettings(c *gin.Context) {
 func (h *SettingsHandler) GetNodeMetrics(c *gin.Context) {
 	nodeName := c.Param("name")
 	hours, _ := strconv.Atoi(c.DefaultQuery("hours", "24"))
+	hasGpu := c.DefaultQuery("hasGpu", "false") == "true"
+	hasNpu := c.DefaultQuery("hasNpu", "false") == "true"
+
+	req := service.NodeMetricsRequest{
+		NodeName: nodeName,
+		Hours:    hours,
+		HasGpu:   hasGpu,
+		HasNpu:   hasNpu,
+	}
 
-	metrics, err := h.settingsSvc.GetNodeMetrics(c.Request.Context(), nodeName, hours)
+	metrics, err := h.settingsSvc.GetNodeMetrics(c.Request.Context(), req)
 	if err != nil {
 		logger.Error("Failed to get node metrics", "node", nodeName, "error", err)
 		c.JSON(http.StatusInternalServerError, gin.H{"error": err.Error()})
diff --git a/api-server/internal/handler/team.go b/api-server/internal/handler/team.go
index e24a457..8ca3594 100644
--- a/api-server/internal/handler/team.go
+++ b/api-server/internal/handler/team.go
@@ -34,17 +34,9 @@ func (h *TeamHandler) ListTeams(c *gin.Context) {
 		return
 	}
 
-	// Enrich with usage data if cost service is enabled
-	if h.costSvc.IsEnabled() {
-		window := c.DefaultQuery("window", "7d")
-		for _, team := range teams {
-			usage, _ := h.costSvc.GetTeamUsageByName(c.Request.Context(), team.Name, window)
-			if usage != nil {
-				// Add usage info (could extend Team struct or return separately)
-				_ = usage
-			}
-		}
-	}
+	// Per-team usage is fetched on demand by the team detail / dashboard endpoints,
+	// not here: the previous enrichment loop issued one OpenCost query per team and
+	// then discarded the result, scaling cost linearly with team count for nothing.
 
 	c.JSON(http.StatusOK, gin.H{"items": teams})
 }
diff --git a/api-server/internal/k8s/client.go b/api-server/internal/k8s/client.go
index 59fb7c8..07925fa 100644
--- a/api-server/internal/k8s/client.go
+++ b/api-server/internal/k8s/client.go
@@ -24,10 +24,24 @@ import (
 
 // Client wraps Kubernetes client operations
 type Client struct {
-	clientset     *kubernetes.Clientset
+	clientset     kubernetes.Interface
 	dynamicClient dynamic.Interface
 }
 
+// NewClientWithInterfaces wraps the given typed and dynamic clients in a Client
+// as-is, performing no configuration loading of its own.
+// It is primarily used to inject fake clients in unit tests.
+func NewClientWithInterfaces(clientset kubernetes.Interface, dynamicClient dynamic.Interface) *Client {
+	wrapped := new(Client)
+	wrapped.clientset, wrapped.dynamicClient = clientset, dynamicClient
+	return wrapped
+}
+
+// Clientset returns the typed Kubernetes client held by this Client, for callers that need it directly (e.g. leader election).
+func (c *Client) Clientset() kubernetes.Interface {
+	return c.clientset
+}
+
 // NewClient creates a new Kubernetes client
 func NewClient() (*Client, error) {
 	var config *rest.Config
@@ -52,6 +66,16 @@ func NewClient() (*Client, error) {
 		logger.Info("Using in-cluster config")
 	}
 
+	// Raise client-side rate limits well above the client-go default (5 QPS / 10 burst)
+	// so dashboard and billing list bursts are not serialized behind the throttler.
+	// Only override when the loaded config has not set explicit limits.
+	if config.QPS == 0 {
+		config.QPS = 50
+	}
+	if config.Burst == 0 {
+		config.Burst = 100
+	}
+
 	clientset, err := kubernetes.NewForConfig(config)
 	if err != nil {
 		logger.Error("Failed to create clientset", "error", err)
diff --git a/api-server/internal/leader/leader.go b/api-server/internal/leader/leader.go
new file mode 100644
index 0000000..35b9e21
--- /dev/null
+++ b/api-server/internal/leader/leader.go
@@ -0,0 +1,98 @@
+// Package leader provides Kubernetes lease-based leader election so that
+// singleton background work (the billing/auto-recharge/alert scheduler) runs on
+// exactly one api-server replica at a time, even when scaled horizontally.
+package leader
+
+import (
+	"context"
+	"os"
+	"time"
+
+	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
+	"k8s.io/client-go/kubernetes"
+	"k8s.io/client-go/tools/leaderelection"
+	"k8s.io/client-go/tools/leaderelection/resourcelock"
+
+	"github.com/bison/api-server/pkg/logger"
+)
+
+// LeaseName is the coordination.k8s.io Lease used to elect the scheduler leader.
+const LeaseName = "bison-scheduler"
+
+// identity returns POD_NAME if set, else a non-empty OS hostname, else "bison-api".
+func identity() string {
+	if podName := os.Getenv("POD_NAME"); podName != "" {
+		return podName
+	}
+	hostname, hostErr := os.Hostname()
+	if hostErr != nil || hostname == "" {
+		return "bison-api"
+	}
+	return hostname
+}
+
+func namespace(def string) string {
+	if override := os.Getenv("POD_NAMESPACE"); override != "" { // a non-empty env value wins over def
+		def = override
+	}
+	return def
+}
+
+// Run blocks running leader election on the LeaseName lease until ctx is
+// cancelled; the lease namespace is POD_NAMESPACE when set, otherwise ns.
+//
+// onStarted is invoked (in its own goroutine) with a context that is cancelled
+// when leadership is lost or ctx is cancelled; it should start the leader-only
+// work and return promptly when its context is done. onStopped is invoked when
+// leadership is lost. The scheduler must be re-startable, since leadership can be
+// re-acquired after a transient loss.
+func Run(ctx context.Context, clientset kubernetes.Interface, ns string, onStarted func(context.Context), onStopped func()) {
+	self := identity()
+	leaseNamespace := namespace(ns)
+
+	lease := &resourcelock.LeaseLock{
+		LeaseMeta:  metav1.ObjectMeta{Name: LeaseName, Namespace: leaseNamespace},
+		Client:     clientset.CoordinationV1(),
+		LockConfig: resourcelock.ResourceLockConfig{Identity: self},
+	}
+
+	logger.Info("Starting leader election", "identity", self, "namespace", leaseNamespace, "lease", LeaseName)
+
+	// The callbacks only add logging around the caller-supplied hooks.
+	callbacks := leaderelection.LeaderCallbacks{
+		OnStartedLeading: func(leaderCtx context.Context) {
+			logger.Info("Acquired scheduler leadership", "identity", self)
+			onStarted(leaderCtx)
+		},
+		OnStoppedLeading: func() {
+			logger.Warn("Lost scheduler leadership", "identity", self)
+			onStopped()
+		},
+		OnNewLeader: func(current string) {
+			if current == self {
+				return
+			}
+			logger.Info("Observed scheduler leader", "leader", current)
+		},
+	}
+
+	electionCfg := leaderelection.LeaderElectionConfig{
+		Lock:            lease,
+		ReleaseOnCancel: true,
+		LeaseDuration:   15 * time.Second,
+		RenewDeadline:   10 * time.Second,
+		RetryPeriod:     2 * time.Second,
+		Callbacks:       callbacks,
+	}
+
+	// Each RunOrDie call is one election round; when it returns with ctx still
+	// live, pause briefly and stand for election again instead of going idle.
+	for ctx.Err() == nil {
+		leaderelection.RunOrDie(ctx, electionCfg)
+		select {
+		case <-ctx.Done():
+			return
+		case <-time.After(2 * time.Second):
+		}
+	}
+}
diff --git a/api-server/internal/opencost/cache.go b/api-server/internal/opencost/cache.go
new file mode 100644
index 0000000..9bd6e8d
--- /dev/null
+++ b/api-server/internal/opencost/cache.go
@@ -0,0 +1,58 @@
+package opencost
+
+import (
+	"sync"
+	"time"
+)
+
+type allocCacheEntry struct { // one cached or in-flight allocation query result
+	ready  chan struct{} // closed when val/err are populated
+	val    []Allocation  // fetch result; waiters read it only after ready is closed
+	err    error         // fetch error; waiters read it only after ready is closed
+	expiry time.Time     // guarded by allocCache.mu; zero while in-flight
+}
+
+// allocCache is a small TTL cache that also coalesces concurrent identical
+// allocation queries, so a burst of dashboard/billing requests for the same
+// window/aggregate/filter hits OpenCost once instead of once per caller.
+type allocCache struct {
+	ttl     time.Duration               // how long a successful result stays fresh
+	mu      sync.Mutex                  // guards entries and each entry's expiry
+	entries map[string]*allocCacheEntry // keyed by the caller-supplied query key
+}
+
+func newAllocCache(ttl time.Duration) *allocCache { // starts empty; ttl bounds result freshness
+	return &allocCache{entries: map[string]*allocCacheEntry{}, ttl: ttl}
+}
+
+// do returns a cached result if fresh, joins an in-flight fetch for the same key,
+// or runs fetch once and caches the (successful) result for ttl. Errors are not
+// cached. A fetch that panics drops its entry and releases its waiters to retry.
+func (c *allocCache) do(key string, fetch func() ([]Allocation, error)) ([]Allocation, error) {
+	c.mu.Lock()
+	if e := c.entries[key]; e != nil && (e.expiry.IsZero() || time.Now().Before(e.expiry)) {
+		c.mu.Unlock() // in-flight (zero expiry) or still fresh: wait for it / reuse it
+		<-e.ready
+		if e.err == nil && e.expiry.IsZero() { // fetcher panicked (expiry is final once ready closes)
+			return c.do(key, fetch)
+		}
+		return e.val, e.err
+	}
+	e := &allocCacheEntry{ready: make(chan struct{})}
+	c.entries[key] = e
+	c.mu.Unlock()
+	fetched := false
+	defer func() { // deferred so a panicking fetch cannot leave waiters blocked forever
+		c.mu.Lock()
+		if fetched && e.err == nil {
+			e.expiry = time.Now().Add(c.ttl)
+		} else if c.entries[key] == e {
+			delete(c.entries, key) // failed or panicked: the next caller retries
+		}
+		c.mu.Unlock()
+		close(e.ready)
+	}()
+	e.val, e.err = fetch()
+	fetched = true
+	return e.val, e.err
+}
diff --git a/api-server/internal/opencost/cache_test.go b/api-server/internal/opencost/cache_test.go
new file mode 100644
index 0000000..d0fac3f
--- /dev/null
+++ b/api-server/internal/opencost/cache_test.go
@@ -0,0 +1,78 @@
+package opencost
+
+import (
+	"errors"
+	"sync"
+	"sync/atomic"
+	"testing"
+	"time"
+)
+
+// TestAllocCacheCoalescesConcurrentCalls fires concurrent do calls for one key
+// and expects the slow fetch to have run exactly once.
+func TestAllocCacheCoalescesConcurrentCalls(t *testing.T) {
+	const callers = 12
+	var fetches int32
+	var pending sync.WaitGroup
+	cache := newAllocCache(time.Minute)
+	slowFetch := func() ([]Allocation, error) {
+		atomic.AddInt32(&fetches, 1)
+		time.Sleep(40 * time.Millisecond) // hold the in-flight window open
+		return []Allocation{{Name: "ns"}}, nil
+	}
+	for started := 0; started < callers; started++ {
+		pending.Add(1)
+		go func() {
+			defer pending.Done()
+			allocs, err := cache.do("k", slowFetch)
+			if err != nil || len(allocs) != 1 {
+				t.Errorf("unexpected result: %v %v", allocs, err)
+			}
+		}()
+	}
+	pending.Wait()
+
+	if total := atomic.LoadInt32(&fetches); total != 1 {
+		t.Fatalf("expected 1 underlying fetch (coalesced), got %d", total)
+	}
+}
+
+// TestAllocCacheTTL checks reuse within the TTL and a fresh fetch after it has passed.
+func TestAllocCacheTTL(t *testing.T) {
+	var fetches int32
+	cache := newAllocCache(40 * time.Millisecond)
+	countingFetch := func() ([]Allocation, error) {
+		atomic.AddInt32(&fetches, 1)
+		return nil, nil
+	}
+	_, _ = cache.do("k", countingFetch)
+	_, _ = cache.do("k", countingFetch) // within TTL -> cached
+	if seen := atomic.LoadInt32(&fetches); seen != 1 {
+		t.Fatalf("expected 1 fetch within TTL, got %d", seen)
+	}
+
+	time.Sleep(60 * time.Millisecond) // let it expire
+	_, _ = cache.do("k", countingFetch)
+	if seen := atomic.LoadInt32(&fetches); seen != 2 {
+		t.Fatalf("expected re-fetch after TTL, got %d", seen)
+	}
+}
+
+// TestAllocCacheDoesNotCacheErrors checks that a failed fetch is retried by the next call.
+func TestAllocCacheDoesNotCacheErrors(t *testing.T) {
+	var fetches int32
+	cache := newAllocCache(time.Minute)
+	failingFetch := func() ([]Allocation, error) {
+		atomic.AddInt32(&fetches, 1)
+		return nil, errors.New("boom")
+	}
+
+	for _, failMsg := range []string{"expected error", "expected error on retry"} {
+		if _, err := cache.do("k", failingFetch); err == nil {
+			t.Fatal(failMsg)
+		}
+	}
+	if seen := atomic.LoadInt32(&fetches); seen != 2 {
+		t.Fatalf("errors must not be cached; expected 2 fetches, got %d", seen)
+	}
+}
diff --git a/api-server/internal/opencost/client.go b/api-server/internal/opencost/client.go
index 25698f7..5a057e7 100644
--- a/api-server/internal/opencost/client.go
+++ b/api-server/internal/opencost/client.go
@@ -16,6 +16,7 @@ import (
 type Client struct {
 	baseURL    string
 	httpClient *http.Client
+	cache      *allocCache
 }
 
 // NewClient creates a new OpenCost client
@@ -25,6 +26,9 @@ func NewClient(baseURL string) *Client {
 		httpClient: &http.Client{
 			Timeout: 30 * time.Second,
 		},
+		// Short TTL: dashboard/billing repeatedly query the same windows; 30s keeps
+		// data near-real-time while collapsing duplicate concurrent queries.
+		cache: newAllocCache(30 * time.Second),
 	}
 }
 
@@ -109,12 +113,20 @@ func (c *Client) GetAllocationForNamespace(ctx context.Context, window, namespac
 	return c.getAllocation(ctx, window, "namespace", fmt.Sprintf("namespace:\"%s\"", namespace))
 }
 
-// getAllocation is the internal method to query allocations
+// getAllocation queries allocations through a short-TTL coalescing cache so that
+// concurrent dashboard/billing requests for the same window hit OpenCost once.
 func (c *Client) getAllocation(ctx context.Context, window, aggregate, filter string) ([]Allocation, error) {
 	if !c.IsEnabled() {
 		return nil, fmt.Errorf("opencost not configured")
 	}
+	key := window + "|" + aggregate + "|" + filter
+	return c.cache.do(key, func() ([]Allocation, error) {
+		return c.fetchAllocation(ctx, window, aggregate, filter)
+	})
+}
 
+// fetchAllocation performs the actual OpenCost HTTP query (uncached).
+func (c *Client) fetchAllocation(ctx context.Context, window, aggregate, filter string) ([]Allocation, error) {
 	// Build URL
 	params := url.Values{}
 	params.Set("window", window)
diff --git a/api-server/internal/scheduler/scheduler.go b/api-server/internal/scheduler/scheduler.go
index f7ab8d4..7996386 100644
--- a/api-server/internal/scheduler/scheduler.go
+++ b/api-server/internal/scheduler/scheduler.go
@@ -2,6 +2,7 @@ package scheduler
 
 import (
 	"context"
+	"math/rand"
 	"sync"
 	"time"
 
@@ -18,8 +19,10 @@ type Scheduler struct {
 	executions   []service.TaskExecution
 	executionsMu sync.RWMutex
 
-	stopCh chan struct{}
-	wg     sync.WaitGroup
+	mu      sync.Mutex
+	started bool
+	stopCh  chan struct{}
+	wg      sync.WaitGroup
 }
 
 // NewScheduler creates a new Scheduler
@@ -33,31 +36,41 @@ func NewScheduler(
 		balanceSvc: balanceSvc,
 		alertSvc:   alertSvc,
 		executions: make([]service.TaskExecution, 0),
-		stopCh:     make(chan struct{}),
 	}
 }
 
-// Start starts all scheduled tasks
+// Start starts all scheduled tasks. It is idempotent and re-startable: calling
+// Start after a Stop (e.g. when leadership is re-acquired) spins up a fresh set
+// of tasks against a new stop channel.
 func (s *Scheduler) Start(ctx context.Context) {
+	s.mu.Lock()
+	defer s.mu.Unlock()
+	if s.started {
+		return
+	}
+	s.started = true
+	s.stopCh = make(chan struct{})
 	logger.Info("Starting scheduler")
 
-	// Start billing task (every hour)
-	s.wg.Add(1)
+	s.wg.Add(3)
 	go s.runBillingTask(ctx)
-
-	// Start auto-recharge task (every hour)
-	s.wg.Add(1)
 	go s.runAutoRechargeTask(ctx)
-
-	// Start alert check task (every 15 minutes)
-	s.wg.Add(1)
 	go s.runAlertTask(ctx)
 }
 
-// Stop stops all scheduled tasks
+// Stop stops all scheduled tasks and waits for them to exit. Safe to call when
+// not started.
 func (s *Scheduler) Stop() {
-	logger.Info("Stopping scheduler")
+	s.mu.Lock()
+	if !s.started {
+		s.mu.Unlock()
+		return
+	}
+	s.started = false
 	close(s.stopCh)
+	s.mu.Unlock()
+
+	logger.Info("Stopping scheduler")
 	s.wg.Wait()
 }
 
@@ -87,18 +100,50 @@ func (s *Scheduler) GetExecutions(limit int) []service.TaskExecution {
 	return result
 }
 
+// safeExecute runs fn; a panic from fn is recovered and logged under the task name.
+func (s *Scheduler) safeExecute(name string, fn func()) {
+	defer func() {
+		recovered := recover()
+		if recovered != nil {
+			logger.Error("Scheduled task panicked and was recovered", "task", name, "panic", recovered)
+		}
+	}()
+	fn()
+}
+
+// sleepWithJitter pauses for a random duration in [0, max) and reports whether
+// the pause ran to completion (true) or stopCh fired first (false). A
+// non-positive max returns true immediately.
+func (s *Scheduler) sleepWithJitter(stopCh <-chan struct{}, max time.Duration) bool {
+	if max > 0 {
+		wake := time.NewTimer(time.Duration(rand.Int63n(int64(max))))
+		defer wake.Stop()
+		select {
+		case <-stopCh:
+			return false
+		case <-wake.C:
+		}
+	}
+	return true
+}
+
 func (s *Scheduler) runBillingTask(ctx context.Context) {
 	defer s.wg.Done()
+	stopCh := s.stopCh
+
+	if !s.sleepWithJitter(stopCh, 60*time.Second) {
+		return
+	}
 
 	ticker := time.NewTicker(1 * time.Hour)
 	defer ticker.Stop()
 
 	for {
 		select {
-		case <-s.stopCh:
+		case <-stopCh:
 			return
 		case <-ticker.C:
-			s.executeBillingTask(ctx)
+			s.safeExecute("billing", func() { s.executeBillingTask(ctx) })
 		}
 	}
 }
@@ -129,16 +174,21 @@ func (s *Scheduler) executeBillingTask(ctx context.Context) {
 
 func (s *Scheduler) runAutoRechargeTask(ctx context.Context) {
 	defer s.wg.Done()
+	stopCh := s.stopCh
+
+	if !s.sleepWithJitter(stopCh, 60*time.Second) {
+		return
+	}
 
 	ticker := time.NewTicker(1 * time.Hour)
 	defer ticker.Stop()
 
 	for {
 		select {
-		case <-s.stopCh:
+		case <-stopCh:
 			return
 		case <-ticker.C:
-			s.executeAutoRechargeTask(ctx)
+			s.safeExecute("auto_recharge", func() { s.executeAutoRechargeTask(ctx) })
 		}
 	}
 }
@@ -169,16 +219,21 @@ func (s *Scheduler) executeAutoRechargeTask(ctx context.Context) {
 
 func (s *Scheduler) runAlertTask(ctx context.Context) {
 	defer s.wg.Done()
+	stopCh := s.stopCh
+
+	if !s.sleepWithJitter(stopCh, 30*time.Second) {
+		return
+	}
 
 	ticker := time.NewTicker(15 * time.Minute)
 	defer ticker.Stop()
 
 	for {
 		select {
-		case <-s.stopCh:
+		case <-stopCh:
 			return
 		case <-ticker.C:
-			s.executeAlertTask(ctx)
+			s.safeExecute("alert_check", func() { s.executeAlertTask(ctx) })
 		}
 	}
 }
diff --git a/api-server/internal/scheduler/scheduler_test.go b/api-server/internal/scheduler/scheduler_test.go
new file mode 100644
index 0000000..b5f2c44
--- /dev/null
+++ b/api-server/internal/scheduler/scheduler_test.go
@@ -0,0 +1,45 @@
+package scheduler
+
+import (
+	"context"
+	"os"
+	"testing"
+	"time"
+
+	"github.com/bison/api-server/pkg/logger"
+)
+
+func TestMain(m *testing.M) { // entry point for this package's tests
+	logger.Init(false) // initialize the logger before any test runs
+	os.Exit(m.Run())
+}
+
+// TestSchedulerRestartable drives Start/Stop through duplicate calls and a
+// restart (as leader-election re-acquisition requires) in a goroutine, and
+// fails if that sequence has not finished within five seconds.
+func TestSchedulerRestartable(t *testing.T) {
+	sched := NewScheduler(nil, nil, nil)
+	finished := make(chan struct{})
+	go func(ctx context.Context) {
+		sched.Start(ctx)
+		sched.Start(ctx) // idempotent: second Start is a no-op
+		sched.Stop()
+		sched.Stop()     // idempotent: second Stop is a no-op
+		sched.Start(ctx) // re-startable after Stop
+		sched.Stop()
+		close(finished)
+	}(context.Background())
+
+	deadline := time.NewTimer(5 * time.Second)
+	defer deadline.Stop()
+	select {
+	case <-finished:
+	case <-deadline.C:
+		t.Fatal("Start/Stop deadlocked")
+	}
+}
+
+func TestStopBeforeStartIsSafe(t *testing.T) {
+	// Stop on a scheduler that was never started must neither panic nor block.
+	NewScheduler(nil, nil, nil).Stop()
+}
diff --git a/api-server/internal/service/balance_service.go b/api-server/internal/service/balance_service.go
index c07b463..5aecd1b 100644
--- a/api-server/internal/service/balance_service.go
+++ b/api-server/internal/service/balance_service.go
@@ -10,6 +10,7 @@ import (
 	corev1 "k8s.io/api/core/v1"
 	"k8s.io/apimachinery/pkg/api/errors"
 	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
+	"k8s.io/client-go/util/retry"
 
 	"github.com/bison/api-server/internal/k8s"
 	"github.com/bison/api-server/pkg/logger"
@@ -120,7 +121,9 @@ func (s *BalanceService) GetAllBalances(ctx context.Context) ([]*Balance, error)
 	return balances, nil
 }
 
-// Recharge adds balance to a team
+// Recharge adds balance to a team. The read-modify-write is performed under
+// optimistic-concurrency retry so concurrent recharges/deductions on the shared
+// balances ConfigMap cannot silently lose updates.
 func (s *BalanceService) Recharge(ctx context.Context, teamName string, amount float64, operator, remark string) error {
 	logger.Info("Recharging team", "team", teamName, "amount", amount, "operator", operator)
 
@@ -128,18 +131,11 @@ func (s *BalanceService) Recharge(ctx context.Context, teamName string, amount f
 		return fmt.Errorf("recharge amount must be positive")
 	}
 
-	// Get current balance
-	balance, err := s.GetBalance(ctx, teamName)
+	newAmount, err := s.applyBalanceDelta(ctx, teamName, amount)
 	if err != nil {
 		return err
 	}
 
-	// Update balance
-	newAmount := balance.Amount + amount
-	if err := s.updateBalance(ctx, teamName, newAmount); err != nil {
-		return err
-	}
-
 	// Record history
 	record := &RechargeRecord{
 		ID:        fmt.Sprintf("%d", time.Now().UnixNano()),
@@ -154,24 +150,19 @@ func (s *BalanceService) Recharge(ctx context.Context, teamName string, amount f
 	return s.addRechargeRecord(ctx, teamName, record)
 }
 
-// Deduct deducts balance from a team
-func (s *BalanceService) Deduct(ctx context.Context, teamName string, amount float64, reason string) error {
+// Deduct deducts balance from a team (negative balances are allowed) and returns
+// the balance AFTER the write, so callers do not need a second racy read to decide
+// suspension. The update is conflict-retried for concurrency safety.
+func (s *BalanceService) Deduct(ctx context.Context, teamName string, amount float64, reason string) (float64, error) {
 	logger.Info("Deducting from team", "team", teamName, "amount", amount, "reason", reason)
 
 	if amount <= 0 {
-		return fmt.Errorf("deduction amount must be positive")
+		return 0, fmt.Errorf("deduction amount must be positive")
 	}
 
-	// Get current balance
-	balance, err := s.GetBalance(ctx, teamName)
+	newAmount, err := s.applyBalanceDelta(ctx, teamName, -amount)
 	if err != nil {
-		return err
-	}
-
-	// Update balance (allow negative balance)
-	newAmount := balance.Amount - amount
-	if err := s.updateBalance(ctx, teamName, newAmount); err != nil {
-		return err
+		return 0, err
 	}
 
 	// Record history
@@ -185,7 +176,10 @@ func (s *BalanceService) Deduct(ctx context.Context, teamName string, amount flo
 		Balance:   newAmount,
 	}
 
-	return s.addRechargeRecord(ctx, teamName, record)
+	if err := s.addRechargeRecord(ctx, teamName, record); err != nil {
+		return newAmount, err
+	}
+	return newAmount, nil
 }
 
 // GetRechargeHistory returns recharge/deduction history for a team
@@ -297,18 +291,16 @@ func (s *BalanceService) ProcessAutoRecharge(ctx context.Context) error {
 			continue
 		}
 
-		logger.Info("Executing auto-recharge", "team", teamName, "amount", config.Amount)
-
-		// Get current balance
-		balance, err := s.GetBalance(ctx, teamName)
-		if err != nil {
-			logger.Error("Failed to get balance for auto-recharge", "team", teamName, "error", err)
+		if config.Amount <= 0 {
+			logger.Warn("Skipping auto-recharge with non-positive amount", "team", teamName, "amount", config.Amount)
 			continue
 		}
 
-		// Update balance
-		newAmount := balance.Amount + config.Amount
-		if err := s.updateBalance(ctx, teamName, newAmount); err != nil {
+		logger.Info("Executing auto-recharge", "team", teamName, "amount", config.Amount)
+
+		// Atomically add the recharge amount to the current balance.
+		newAmount, err := s.applyBalanceDelta(ctx, teamName, config.Amount)
+		if err != nil {
 			logger.Error("Failed to update balance for auto-recharge", "team", teamName, "error", err)
 			continue
 		}
@@ -372,64 +364,78 @@ func (s *BalanceService) GetTotalBalance(ctx context.Context) (float64, error) {
 
 // Helper methods
 
-func (s *BalanceService) updateBalance(ctx context.Context, teamName string, amount float64) error {
-	balance := &Balance{
-		TeamName:    teamName,
-		Amount:      amount,
-		LastUpdated: time.Now(),
-	}
-
-	data, err := json.Marshal(balance)
-	if err != nil {
-		return fmt.Errorf("failed to marshal balance: %w", err)
-	}
-
-	cm, err := s.getOrCreateConfigMap(ctx, BalancesConfigMap)
-	if err != nil {
-		return err
-	}
+// mutateConfigMap performs an optimistic-concurrency read-modify-write on a Bison
+// ConfigMap so concurrent writers (recharge, billing deduction, auto-recharge, overdue
+// marking) cannot silently lose each other's updates. On every resourceVersion conflict
+// it re-reads the ConfigMap and calls mutate again, so mutate may run more than once.
+func (s *BalanceService) mutateConfigMap(ctx context.Context, name string, mutate func(cm *corev1.ConfigMap) error) error {
+	return retry.RetryOnConflict(retry.DefaultRetry, func() error {
+		cm, err := s.getOrCreateConfigMap(ctx, name) // fresh read on every attempt
+		if err != nil {
+			return err
+		}
+		if cm.Data == nil { // lets mutate assign keys without its own nil-map check
+			cm.Data = make(map[string]string)
+		}
+		if err := mutate(cm); err != nil {
+			return err
+		}
+		// Use the raw client so a conflict error is returned unwrapped for RetryOnConflict.
+		return s.k8sClient.UpdateConfigMap(ctx, BisonNamespace, cm)
+	})
+}
 
-	if cm.Data == nil {
-		cm.Data = make(map[string]string)
-	}
-	cm.Data[teamName] = string(data)
+// applyBalanceDelta atomically adds delta (negative to deduct) to a team's balance,
+// preserving other persisted fields such as OverdueAt, and returns the new amount.
+func (s *BalanceService) applyBalanceDelta(ctx context.Context, teamName string, delta float64) (float64, error) {
+	var newAmount float64
+	err := s.mutateConfigMap(ctx, BalancesConfigMap, func(cm *corev1.ConfigMap) error {
+		balance := Balance{TeamName: teamName}
+		if existing, ok := cm.Data[teamName]; ok {
+			if err := json.Unmarshal([]byte(existing), &balance); err != nil {
+				return fmt.Errorf("failed to parse balance: %w", err)
+			}
+		}
+		balance.TeamName = teamName
+		balance.Amount += delta
+		balance.LastUpdated = time.Now()
 
-	return s.updateConfigMap(ctx, cm)
+		data, err := json.Marshal(&balance)
+		if err != nil {
+			return fmt.Errorf("failed to marshal balance: %w", err)
+		}
+		cm.Data[teamName] = string(data)
+		newAmount = balance.Amount
+		return nil
+	})
+	return newAmount, err
 }
 
 func (s *BalanceService) addRechargeRecord(ctx context.Context, teamName string, record *RechargeRecord) error {
-	cm, err := s.getOrCreateConfigMap(ctx, RechargeHistoryConfigMap)
-	if err != nil {
-		return err
-	}
-
-	var records []*RechargeRecord
-	if data, ok := cm.Data[teamName]; ok {
-		if err := json.Unmarshal([]byte(data), &records); err != nil {
-			logger.Warn("Failed to unmarshal existing history, starting fresh", "team", teamName)
-			records = []*RechargeRecord{}
+	return s.mutateConfigMap(ctx, RechargeHistoryConfigMap, func(cm *corev1.ConfigMap) error {
+		var records []*RechargeRecord
+		if data, ok := cm.Data[teamName]; ok {
+			if err := json.Unmarshal([]byte(data), &records); err != nil {
+				logger.Warn("Failed to unmarshal existing history, starting fresh", "team", teamName)
+				records = []*RechargeRecord{}
+			}
 		}
-	}
-
-	// Add new record
-	records = append(records, record)
-
-	// Keep only last 1000 records
-	if len(records) > 1000 {
-		records = records[len(records)-1000:]
-	}
 
-	data, err := json.Marshal(records)
-	if err != nil {
-		return fmt.Errorf("failed to marshal history: %w", err)
-	}
+		// Add new record
+		records = append(records, record)
 
-	if cm.Data == nil {
-		cm.Data = make(map[string]string)
-	}
-	cm.Data[teamName] = string(data)
+		// Keep only last 1000 records
+		if len(records) > 1000 {
+			records = records[len(records)-1000:]
+		}
 
-	return s.updateConfigMap(ctx, cm)
+		data, err := json.Marshal(records)
+		if err != nil {
+			return fmt.Errorf("failed to marshal history: %w", err)
+		}
+		cm.Data[teamName] = string(data)
+		return nil
+	})
 }
 
 func (s *BalanceService) getOrCreateConfigMap(ctx context.Context, name string) (*corev1.ConfigMap, error) {
@@ -496,68 +502,82 @@ func (s *BalanceService) calculateNextExecution(config *AutoRechargeConfig) time
 	}
 }
 
-// CalculateDailyConsumption calculates the average daily consumption for a team based on recent history
+// CalculateDailyConsumption estimates the average daily spend for a team from its
+// recent deduction history.
+//
+// The denominator is the actual span of deduction activity within the last 7 days
+// (capped at 7 days, floored to avoid wildly overestimating from a single very
+// recent deduction) — NOT a fixed 7 days, which previously underestimated the burn
+// rate whenever the real activity window was shorter. We also fetch enough records
+// to cover a full week of hourly billing (168+), since the old 100-record cap
+// truncated the 7-day window and undercounted total deductions.
 func (s *BalanceService) CalculateDailyConsumption(ctx context.Context, teamName string) (float64, error) {
-	records, err := s.GetRechargeHistory(ctx, teamName, 100) // Get last 100 records
+	const (
+		lookbackDays = 7
+		maxSpanDays  = 7.0
+		minSpanDays  = 0.5
+		fetchRecords = 400
+	)
+
+	records, err := s.GetRechargeHistory(ctx, teamName, fetchRecords)
 	if err != nil {
 		return 0, err
 	}
 
-	// Calculate total deductions in last 7 days
 	now := time.Now()
-	sevenDaysAgo := now.AddDate(0, 0, -7)
+	windowStart := now.AddDate(0, 0, -lookbackDays)
 
 	var totalDeductions float64
-	var daysWithData float64 = 7 // Default to 7 days
+	var oldestDeduction time.Time
+	hasDeduction := false
 
 	for _, record := range records {
-		if record.Type == "deduction" && record.Timestamp.After(sevenDaysAgo) {
-			totalDeductions += -record.Amount // Amount is negative for deductions
+		if record.Type != "deduction" || !record.Timestamp.After(windowStart) {
+			continue
 		}
-	}
-
-	// If we have less than 7 days of data, calculate based on actual time span
-	if len(records) > 0 {
-		oldestRecord := records[len(records)-1]
-		if oldestRecord.Timestamp.After(sevenDaysAgo) {
-			actualDays := now.Sub(oldestRecord.Timestamp).Hours() / 24
-			if actualDays > 0 {
-				daysWithData = actualDays
-			}
+		totalDeductions += -record.Amount // Amount is negative for deductions
+		if !hasDeduction || record.Timestamp.Before(oldestDeduction) {
+			oldestDeduction = record.Timestamp
+			hasDeduction = true
 		}
 	}
 
-	if daysWithData == 0 {
+	if !hasDeduction || totalDeductions <= 0 {
 		return 0, nil
 	}
 
-	return totalDeductions / daysWithData, nil
-}
-
-// SetOverdueAt records when a team first went into negative balance
-func (s *BalanceService) SetOverdueAt(ctx context.Context, teamName string, overdueAt *time.Time) error {
-	balance, err := s.GetBalance(ctx, teamName)
-	if err != nil {
-		return err
+	spanDays := now.Sub(oldestDeduction).Hours() / 24
+	if spanDays > maxSpanDays {
+		spanDays = maxSpanDays
 	}
-
-	balance.OverdueAt = overdueAt
-	data, err := json.Marshal(balance)
-	if err != nil {
-		return fmt.Errorf("failed to marshal balance: %w", err)
+	if spanDays < minSpanDays {
+		spanDays = minSpanDays
 	}
 
-	cm, err := s.getOrCreateConfigMap(ctx, BalancesConfigMap)
-	if err != nil {
-		return err
-	}
+	return totalDeductions / spanDays, nil
+}
 
-	if cm.Data == nil {
-		cm.Data = make(map[string]string)
-	}
-	cm.Data[teamName] = string(data)
+// SetOverdueAt records (or clears) when a team first went into negative balance.
+// The update is conflict-retried and preserves the current amount, so it cannot
+// clobber a concurrent deduction/recharge.
+func (s *BalanceService) SetOverdueAt(ctx context.Context, teamName string, overdueAt *time.Time) error {
+	return s.mutateConfigMap(ctx, BalancesConfigMap, func(cm *corev1.ConfigMap) error {
+		balance := Balance{TeamName: teamName}
+		if existing, ok := cm.Data[teamName]; ok {
+			if err := json.Unmarshal([]byte(existing), &balance); err != nil {
+				return fmt.Errorf("failed to parse balance: %w", err)
+			}
+		}
+		balance.TeamName = teamName
+		balance.OverdueAt = overdueAt
 
-	return s.updateConfigMap(ctx, cm)
+		data, err := json.Marshal(&balance)
+		if err != nil {
+			return fmt.Errorf("failed to marshal balance: %w", err)
+		}
+		cm.Data[teamName] = string(data)
+		return nil
+	})
 }
 
 // GetBalanceWithEstimate returns the balance with consumption and estimated overdue time calculated
diff --git a/api-server/internal/service/balance_service_test.go b/api-server/internal/service/balance_service_test.go
new file mode 100644
index 0000000..5ded60b
--- /dev/null
+++ b/api-server/internal/service/balance_service_test.go
@@ -0,0 +1,265 @@
+package service
+
+import (
+	"context"
+	"fmt"
+	"strconv"
+	"sync"
+	"testing"
+	"time"
+
+	corev1 "k8s.io/api/core/v1"
+	apierrors "k8s.io/apimachinery/pkg/api/errors"
+	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
+	"k8s.io/apimachinery/pkg/runtime"
+	"k8s.io/apimachinery/pkg/runtime/schema"
+	k8sfake "k8s.io/client-go/kubernetes/fake"
+	k8stesting "k8s.io/client-go/testing"
+
+	"github.com/bison/api-server/internal/k8s"
+)
+
+// newTestBalanceService returns a BalanceService backed by an empty fake clientset.
+func newTestBalanceService() *BalanceService {
+	fakeClient := k8s.NewClientWithInterfaces(k8sfake.NewSimpleClientset(), nil)
+	return NewBalanceService(fakeClient)
+}
+
+// installOptimisticConcurrency prepends a ConfigMap "update" reactor that rejects a
+// write whose resourceVersion differs from the tracker's stored copy and bumps the
+// version on success, like etcd. Without this the default fake silently accepts stale
+// writes and the RetryOnConflict path is never exercised.
+func installOptimisticConcurrency(cs *k8sfake.Clientset) {
+	var updateMu sync.Mutex
+
+	cs.PrependReactor("update", "configmaps", func(action k8stesting.Action) (bool, runtime.Object, error) {
+		incoming := action.(k8stesting.UpdateAction).GetObject().(*corev1.ConfigMap).DeepCopy()
+		updateMu.Lock()
+		defer updateMu.Unlock()
+
+		obj, err := cs.Tracker().Get(action.GetResource(), action.GetNamespace(), incoming.Name)
+		if err != nil {
+			return true, nil, err
+		}
+		stored := obj.(*corev1.ConfigMap)
+		if incoming.ResourceVersion != stored.ResourceVersion {
+			return true, nil, apierrors.NewConflict(
+				schema.GroupResource{Resource: "configmaps"}, incoming.Name,
+				fmt.Errorf("resourceVersion conflict"))
+		}
+
+		rv, _ := strconv.Atoi(stored.ResourceVersion)
+		incoming.ResourceVersion = strconv.Itoa(rv + 1)
+		if err := cs.Tracker().Update(action.GetResource(), incoming, action.GetNamespace()); err != nil {
+			return true, nil, err
+		}
+		return true, incoming, nil
+	})
+}
+
+// seedConfigMap builds an empty ConfigMap in BisonNamespace at resourceVersion "1".
+func seedConfigMap(name string) *corev1.ConfigMap {
+	meta := metav1.ObjectMeta{Name: name, Namespace: BisonNamespace, ResourceVersion: "1"}
+	empty := map[string]string{}
+	return &corev1.ConfigMap{ObjectMeta: meta, Data: empty}
+}
+
+// TestRechargeThenDeduct checks the happy path: recharge 100, deduct 30, and expect
+// a returned and stored balance of 70 plus one history record per operation.
+func TestRechargeThenDeduct(t *testing.T) {
+	svc, ctx := newTestBalanceService(), context.Background()
+	if err := svc.Recharge(ctx, "team-a", 100, "admin", "init"); err != nil {
+		t.Fatalf("Recharge: %v", err)
+	}
+
+	bal, err := svc.GetBalance(ctx, "team-a")
+	if err != nil {
+		t.Fatalf("GetBalance: %v", err)
+	}
+	if bal.Amount != 100 {
+		t.Fatalf("after recharge: got %v, want 100", bal.Amount)
+	}
+
+	newBal, err := svc.Deduct(ctx, "team-a", 30, "usage")
+	if err != nil {
+		t.Fatalf("Deduct: %v", err)
+	}
+	if newBal != 70 {
+		t.Fatalf("Deduct returned %v, want 70", newBal)
+	}
+	if bal, err = svc.GetBalance(ctx, "team-a"); err != nil {
+		t.Fatalf("GetBalance after Deduct: %v", err) // report the error; never dereference bal
+	} else if bal.Amount != 70 {
+		t.Fatalf("stored balance %v, want 70", bal.Amount)
+	}
+
+	recs, err := svc.GetRechargeHistory(ctx, "team-a", 0)
+	if err != nil {
+		t.Fatalf("GetRechargeHistory: %v", err)
+	}
+	if len(recs) != 2 {
+		t.Fatalf("history records = %d, want 2", len(recs))
+	}
+}
+
+// TestDeductAllowsNegativeBalance deducts 25 from a balance of 10 and expects
+// Deduct to succeed and report -15 rather than rejecting the overdraft.
+func TestDeductAllowsNegativeBalance(t *testing.T) {
+	svc, ctx := newTestBalanceService(), context.Background()
+	if err := svc.Recharge(ctx, "team-a", 10, "admin", ""); err != nil {
+		t.Fatal(err)
+	}
+	got, err := svc.Deduct(ctx, "team-a", 25, "usage")
+	if err != nil {
+		t.Fatalf("Deduct: %v", err)
+	}
+	if got != -15 {
+		t.Fatalf("Deduct returned %v, want -15", got)
+	}
+}
+
+// TestRechargeRejectsNonPositive expects Recharge to refuse zero and negative
+// amounts and Deduct to refuse a zero amount.
+func TestRechargeRejectsNonPositive(t *testing.T) {
+	svc, ctx := newTestBalanceService(), context.Background()
+	if svc.Recharge(ctx, "team-a", 0, "admin", "") == nil {
+		t.Fatal("Recharge(0) should error")
+	}
+	if svc.Recharge(ctx, "team-a", -5, "admin", "") == nil {
+		t.Fatal("Recharge(-5) should error")
+	}
+	if _, err := svc.Deduct(ctx, "team-a", 0, "usage"); err == nil {
+		t.Fatal("Deduct(0) should error")
+	}
+}
+
+// TestDeductPreservesOverdueAt guards the regression where a deduction overwrote
+// the whole Balance object and silently wiped OverdueAt, which would reset the
+// grace-period clock on every billing cycle and prevent suspension.
+func TestDeductPreservesOverdueAt(t *testing.T) {
+	svc, ctx := newTestBalanceService(), context.Background()
+	if err := svc.Recharge(ctx, "team-a", 10, "admin", ""); err != nil {
+		t.Fatal(err)
+	}
+	overdue := time.Now().Add(-2 * time.Hour).Truncate(time.Second)
+	if err := svc.SetOverdueAt(ctx, "team-a", &overdue); err != nil {
+		t.Fatal(err)
+	}
+	if _, err := svc.Deduct(ctx, "team-a", 50, "usage"); err != nil {
+		t.Fatal(err)
+	}
+
+	bal, err := svc.GetBalance(ctx, "team-a")
+	if err != nil {
+		t.Fatalf("GetBalance: %v", err) // fail cleanly instead of dereferencing bal below
+	}
+	if bal.OverdueAt == nil {
+		t.Fatal("OverdueAt was wiped by Deduct")
+	}
+	if !bal.OverdueAt.Equal(overdue) {
+		t.Fatalf("OverdueAt = %v, want %v", bal.OverdueAt, overdue)
+	}
+	if bal.Amount != -40 {
+		t.Fatalf("amount = %v, want -40", bal.Amount)
+	}
+}
+
+// addDeduction appends a "deduction" history record of -amount stamped ts for team.
+func addDeduction(t *testing.T, svc *BalanceService, team string, amount float64, ts time.Time) {
+	t.Helper()
+	rec := &RechargeRecord{
+		ID: ts.Format(time.RFC3339Nano), Timestamp: ts,
+		Type: "deduction", Amount: -amount, Operator: "system",
+	}
+	err := svc.addRechargeRecord(context.Background(), team, rec)
+	if err != nil {
+		t.Fatalf("addRechargeRecord: %v", err)
+	}
+}
+
+// TestCalculateDailyConsumptionUsesDeductionSpan seeds two 100-unit deductions,
+// one 4 days old and one stamped now, and expects the rate to be computed over
+// that ~4-day span: 200 / 4 = ~50 per day.
+func TestCalculateDailyConsumptionUsesDeductionSpan(t *testing.T) {
+	const team = "team-a"
+	svc, now := newTestBalanceService(), time.Now()
+	addDeduction(t, svc, team, 100, now.Add(-4*24*time.Hour))
+	addDeduction(t, svc, team, 100, now)
+
+	rate, err := svc.CalculateDailyConsumption(context.Background(), team)
+	if err != nil {
+		t.Fatal(err)
+	}
+	if rate < 45 || rate > 55 {
+		t.Fatalf("expected ~50/day, got %.2f", rate)
+	}
+}
+
+// TestCalculateDailyConsumptionFloorsSpan seeds one just-now deduction of 10; with
+// the span floored to 0.5 day the expected rate is 10 / 0.5 = 20 per day.
+func TestCalculateDailyConsumptionFloorsSpan(t *testing.T) {
+	svc := newTestBalanceService()
+	addDeduction(t, svc, "team-a", 10, time.Now())
+
+	rate, err := svc.CalculateDailyConsumption(context.Background(), "team-a")
+	if err != nil {
+		t.Fatal(err)
+	}
+	if rate < 18 || rate > 22 {
+		t.Fatalf("expected ~20/day (floored span), got %.2f", rate)
+	}
+}
+
+// TestCalculateDailyConsumptionIgnoresOldAndNonDeductions seeds a 30-day-old
+// deduction and an in-window recharge and expects a consumption rate of exactly 0.
+func TestCalculateDailyConsumptionIgnoresOldAndNonDeductions(t *testing.T) {
+	svc, ctx, now := newTestBalanceService(), context.Background(), time.Now()
+	// Deduction older than the 7-day lookback window.
+	addDeduction(t, svc, "team-a", 1000, now.Add(-30*24*time.Hour))
+	// Recharge inside the window; it is not a deduction, so it must not count.
+	recharge := &RechargeRecord{ID: "r1", Timestamp: now, Type: "recharge", Amount: 500}
+	if err := svc.addRechargeRecord(ctx, "team-a", recharge); err != nil {
+		t.Fatal(err)
+	}
+
+	rate, err := svc.CalculateDailyConsumption(ctx, "team-a")
+	if err != nil {
+		t.Fatal(err)
+	}
+	if rate != 0 {
+		t.Fatalf("expected 0 (no in-window deductions), got %.2f", rate)
+	}
+}
+
+// TestConcurrentRecharge runs four concurrent Recharge calls against a fake that
+// enforces resourceVersion, so the retry.RetryOnConflict path is exercised. The
+// final balance must equal the sum of all recharges, i.e. no update was lost.
+// The writer count is kept small so contention stays within DefaultRetry's
+// budget (5 attempts).
+func TestConcurrentRecharge(t *testing.T) {
+	const writers, each = 4, 5
+	cs := k8sfake.NewSimpleClientset(seedConfigMap(BalancesConfigMap), seedConfigMap(RechargeHistoryConfigMap))
+	installOptimisticConcurrency(cs)
+	svc := NewBalanceService(k8s.NewClientWithInterfaces(cs, nil))
+	ctx := context.Background()
+
+	var wg sync.WaitGroup
+	for w := 0; w < writers; w++ {
+		wg.Add(1)
+		go func() {
+			defer wg.Done()
+			if err := svc.Recharge(ctx, "team-a", each, "admin", "concurrent"); err != nil {
+				t.Errorf("Recharge: %v", err)
+			}
+		}()
+	}
+	wg.Wait()
+
+	bal, err := svc.GetBalance(ctx, "team-a")
+	if err != nil {
+		t.Fatal(err)
+	}
+	if want := writers * each; bal.Amount != float64(want) {
+		t.Fatalf("concurrent recharge total = %v, want %v (lost update)", bal.Amount, want)
+	}
+}
diff --git a/api-server/internal/service/billing_service.go b/api-server/internal/service/billing_service.go
index 57924af..d9a480f 100644
--- a/api-server/internal/service/billing_service.go
+++ b/api-server/internal/service/billing_service.go
@@ -7,9 +7,10 @@ import (
 	"strconv"
 	"time"
 
-	appsv1 "k8s.io/api/apps/v1"
 	corev1 "k8s.io/api/core/v1"
+	"k8s.io/apimachinery/pkg/api/errors"
 	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
+	"k8s.io/client-go/util/retry"
 
 	"github.com/bison/api-server/internal/k8s"
 	"github.com/bison/api-server/internal/opencost"
@@ -18,6 +19,10 @@ import (
 
 const (
 	BillingConfigMap = "bison-billing-config"
+	// lastBilledKey stores (in the billing ConfigMap) the RFC3339 timestamp of the
+	// last successful billing run, so billing is not duplicated when the ticker
+	// fires more often than the configured interval or after a process restart.
+	lastBilledKey = "lastBilledAt"
 )
 
 // BillingConfig represents the billing configuration
@@ -150,6 +155,31 @@ func (s *BillingService) ProcessBilling(ctx context.Context) error {
 		return nil
 	}
 
+	// Enforce the configured billing interval regardless of how often the
+	// scheduler ticks, and survive restarts, by gating on a persisted timestamp.
+	interval := config.Interval
+	if interval <= 0 {
+		interval = 1
+	}
+	minGap := time.Duration(interval) * time.Hour
+	now := time.Now()
+	lastBilled, _ := s.getLastBilled(ctx)
+	if lastBilled.IsZero() {
+		// First run on a fresh deployment: establish a baseline instead of billing
+		// an unknown historical window.
+		if err := s.setLastBilled(ctx, now); err != nil {
+			logger.Warn("Failed to initialize billing baseline", "error", err)
+		}
+		logger.Info("Billing baseline initialized; skipping first cycle")
+		return nil
+	}
+	// Tolerate scheduler jitter: require ~95% of the interval to have elapsed.
+	if now.Sub(lastBilled) < time.Duration(float64(minGap)*0.95) {
+		logger.Debug("Skipping billing: interval not yet elapsed",
+			"sinceLastBilled", now.Sub(lastBilled).String(), "interval", minGap.String())
+		return nil
+	}
+
 	// Get usage from OpenCost
 	if s.opencostClient == nil || !s.opencostClient.IsEnabled() {
 		logger.Warn("OpenCost not available, skipping billing")
@@ -180,7 +210,8 @@ func (s *BillingService) ProcessBilling(ctx context.Context) error {
 		}
 	}
 
-	// Aggregate costs by team
+	// Aggregate costs by team. Prices are read once for the whole run.
+	prices := s.loadPrices(ctx)
 	teamCosts := make(map[string]float64)
 	for _, alloc := range allocations {
 		teamName, ok := nsToTeam[alloc.Name]
@@ -188,8 +219,7 @@ func (s *BillingService) ProcessBilling(ctx context.Context) error {
 			continue
 		}
 
-		// Calculate cost based on pricing config
-		cost := s.calculateCost(ctx, config, &alloc)
+		cost := costFromPrices(config, prices, &alloc)
 		teamCosts[teamName] += cost
 	}
 
@@ -200,46 +230,114 @@ func (s *BillingService) ProcessBilling(ctx context.Context) error {
 		}
 
 		reason := fmt.Sprintf("Usage billing for %s", window)
-		if err := s.balanceSvc.Deduct(ctx, teamName, cost, reason); err != nil {
+		// Deduct returns the authoritative post-write balance, so the suspension
+		// decision below is no longer based on a racy second read.
+		newBalance, err := s.balanceSvc.Deduct(ctx, teamName, cost, reason)
+		if err != nil {
 			logger.Error("Failed to deduct balance", "team", teamName, "cost", cost, "error", err)
 			continue
 		}
 
-		// Check if team is now in debt
-		balance, _ := s.balanceSvc.GetBalance(ctx, teamName)
-		if balance != nil && balance.Amount < 0 {
-			logger.Warn("Team is in debt", "team", teamName, "balance", balance.Amount)
+		if newBalance < 0 {
+			logger.Warn("Team is in debt", "team", teamName, "balance", newBalance)
 
-			// Record when balance first went negative
-			if balance.OverdueAt == nil {
+			// Determine the overdue start time, preserving any existing marker so the
+			// grace period is measured from when the balance first went negative.
+			cur, err := s.balanceSvc.GetBalance(ctx, teamName)
+			if err != nil {
+				logger.Error("Failed to read balance for overdue check", "team", teamName, "error", err)
+				continue
+			}
+			overdueAt := cur.OverdueAt
+			if overdueAt == nil {
 				now := time.Now()
-				if err := s.balanceSvc.SetOverdueAt(ctx, teamName, &now); err != nil {
+				overdueAt = &now
+				if err := s.balanceSvc.SetOverdueAt(ctx, teamName, overdueAt); err != nil {
 					logger.Error("Failed to set overdue time", "team", teamName, "error", err)
 				}
-				balance.OverdueAt = &now
 			}
 
 			// Check if grace period has passed
-			if s.isGracePeriodExpired(config, balance.OverdueAt) {
-				logger.Warn("Grace period expired, suspending team", "team", teamName, "overdueAt", balance.OverdueAt)
+			if s.isGracePeriodExpired(config, overdueAt) {
+				logger.Warn("Grace period expired, suspending team", "team", teamName, "overdueAt", overdueAt)
 				if err := s.SuspendTeam(ctx, teamName); err != nil {
 					logger.Error("Failed to suspend team", "team", teamName, "error", err)
 				}
 			} else {
-				remaining := s.balanceSvc.CalculateGraceRemaining(balance.OverdueAt, config.GracePeriodValue, config.GracePeriodUnit)
+				remaining := s.balanceSvc.CalculateGraceRemaining(overdueAt, config.GracePeriodValue, config.GracePeriodUnit)
 				logger.Info("Team in grace period", "team", teamName, "remaining", remaining)
 			}
-		} else if balance != nil && balance.Amount >= 0 && balance.OverdueAt != nil {
-			// Balance is positive again, clear overdue time
-			if err := s.balanceSvc.SetOverdueAt(ctx, teamName, nil); err != nil {
-				logger.Error("Failed to clear overdue time", "team", teamName, "error", err)
+		} else {
+			// Balance is non-negative again, clear any overdue marker.
+			if cur, err := s.balanceSvc.GetBalance(ctx, teamName); err == nil && cur.OverdueAt != nil {
+				if err := s.balanceSvc.SetOverdueAt(ctx, teamName, nil); err != nil {
+					logger.Error("Failed to clear overdue time", "team", teamName, "error", err)
+				}
 			}
 		}
 	}
 
+	// Record successful billing time so the next cycle bills the correct window.
+	if err := s.setLastBilled(ctx, now); err != nil {
+		logger.Error("Failed to update last-billed timestamp", "error", err)
+	}
+
 	return nil
 }
 
+// getLastBilled reads lastBilledKey from the billing ConfigMap. A missing ConfigMap or
+// key, or an empty or unparseable value, yields the zero time; other errors are returned.
+func (s *BillingService) getLastBilled(ctx context.Context) (time.Time, error) {
+	cm, err := s.k8sClient.GetConfigMap(ctx, BisonNamespace, BillingConfigMap)
+	switch {
+	case err == nil:
+	case errors.IsNotFound(err):
+		return time.Time{}, nil
+	default:
+		return time.Time{}, err
+	}
+	raw := cm.Data[lastBilledKey]
+	if raw == "" {
+		return time.Time{}, nil
+	}
+	if parsed, parseErr := time.Parse(time.RFC3339, raw); parseErr == nil {
+		return parsed, nil
+	}
+	logger.Warn("Invalid lastBilledAt timestamp, treating as unset", "value", raw)
+	return time.Time{}, nil
+}
+
+// setLastBilled stores t (UTC, RFC3339) under lastBilledKey in the billing ConfigMap,
+// creating it if absent; updates are conflict-retried so they cannot clobber a config edit.
+func (s *BillingService) setLastBilled(ctx context.Context, t time.Time) error {
+	stamp := t.UTC().Format(time.RFC3339)
+	return retry.RetryOnConflict(retry.DefaultRetry, func() error {
+		existing, err := s.k8sClient.GetConfigMap(ctx, BisonNamespace, BillingConfigMap)
+		if err == nil {
+			if existing.Data == nil {
+				existing.Data = make(map[string]string)
+			}
+			existing.Data[lastBilledKey] = stamp
+			return s.k8sClient.UpdateConfigMap(ctx, BisonNamespace, existing)
+		}
+		if !errors.IsNotFound(err) {
+			return err
+		}
+		fresh := &corev1.ConfigMap{
+			ObjectMeta: metav1.ObjectMeta{
+				Name:      BillingConfigMap,
+				Namespace: BisonNamespace,
+				Labels: map[string]string{
+					"app.kubernetes.io/name":      "bison",
+					"app.kubernetes.io/component": "billing",
+				},
+			},
+			Data: map[string]string{lastBilledKey: stamp},
+		}
+		return s.k8sClient.CreateConfigMap(ctx, BisonNamespace, fresh)
+	})
+}
+
 // isGracePeriodExpired checks if the grace period has expired for a team
 func (s *BillingService) isGracePeriodExpired(config *BillingConfig, overdueAt *time.Time) bool {
 	if overdueAt == nil {
@@ -274,6 +372,7 @@ func (s *BillingService) GetTeamBill(ctx context.Context, teamName, window strin
 	resourceCosts := make(map[string]float64)
 
 	config, _ := s.GetConfig(ctx)
+	prices := s.loadPrices(ctx)
 
 	if s.opencostClient != nil && s.opencostClient.IsEnabled() {
 		for _, project := range projects {
@@ -289,7 +388,7 @@ func (s *BillingService) GetTeamBill(ctx context.Context, teamName, window strin
 				totalUsage.GPUHours += alloc.GPUHours
 				totalUsage.Minutes += alloc.Minutes
 
-				cost := s.calculateCost(ctx, config, &alloc)
+				cost := costFromPrices(config, prices, &alloc)
 				totalCost += cost
 
 				resourceCosts["cpu"] += alloc.CPUCost
@@ -323,6 +422,7 @@ func (s *BillingService) GetProjectBill(ctx context.Context, projectName, window
 	resourceCosts := make(map[string]float64)
 
 	config, _ := s.GetConfig(ctx)
+	prices := s.loadPrices(ctx)
 
 	if s.opencostClient != nil && s.opencostClient.IsEnabled() {
 		allocations, err := s.opencostClient.GetAllocationForNamespace(ctx, window, projectName)
@@ -336,7 +436,7 @@ func (s *BillingService) GetProjectBill(ctx context.Context, projectName, window
 			usage.GPUHours += alloc.GPUHours
 			usage.Minutes += alloc.Minutes
 
-			cost := s.calculateCost(ctx, config, &alloc)
+			cost := costFromPrices(config, prices, &alloc)
 			totalCost += cost
 
 			resourceCosts["cpu"] += alloc.CPUCost
@@ -452,62 +552,72 @@ func (s *BillingService) getDefaultConfig() *BillingConfig {
 	}
 }
 
-func (s *BillingService) calculateCost(ctx context.Context, config *BillingConfig, alloc *opencost.Allocation) float64 {
-	if config == nil || !config.Enabled {
-		return alloc.TotalCost
-	}
-
-	var cost float64
+// resourcePrices holds the per-unit prices used for cost computation, resolved
+// once per billing/report operation instead of per allocation row.
+type resourcePrices struct {
+	cpu         float64 // multiplied by alloc.CPUCoreHours; when not > 0, alloc.CPUCost is used instead
+	memory      float64 // multiplied by alloc.RAMGBHours; when not > 0, alloc.RAMCost is used instead
+	accelerator float64 // multiplied by alloc.GPUHours; when not > 0, alloc.GPUCost is used instead
+}
 
-	// Get resource configs for pricing
+// loadPrices reads the enabled resource configs once and builds a price table.
+func (s *BillingService) loadPrices(ctx context.Context) resourcePrices {
 	resourceConfigs, _ := s.resourceConfigSvc.GetEnabledResourceConfigs(ctx)
-
-	// Build price map and find accelerator price
-	cpuPrice := float64(0)
-	memoryPrice := float64(0)
-	acceleratorPrice := float64(0)
-
+	var p resourcePrices
 	for _, rc := range resourceConfigs {
 		if rc.Price <= 0 {
 			continue
 		}
 		switch rc.Name {
 		case "cpu":
-			cpuPrice = rc.Price
+			p.cpu = rc.Price
 		case "memory":
-			memoryPrice = rc.Price
+			p.memory = rc.Price
 		default:
-			// For accelerators (any non-cpu/memory resource), use the first one with price
-			if rc.Category == CategoryAccelerator && acceleratorPrice == 0 {
-				acceleratorPrice = rc.Price
+			// For accelerators (any non-cpu/memory resource), use the first priced one.
+			if rc.Category == CategoryAccelerator && p.accelerator == 0 {
+				p.accelerator = rc.Price
 			}
 		}
 	}
+	return p
+}
 
-	// CPU cost
-	if cpuPrice > 0 {
-		cost += alloc.CPUCoreHours * cpuPrice
+// costFromPrices computes the cost of a single allocation from a precomputed price table.
+func costFromPrices(config *BillingConfig, p resourcePrices, alloc *opencost.Allocation) float64 {
+	if config == nil || !config.Enabled {
+		return alloc.TotalCost
+	}
+
+	var cost float64
+	if p.cpu > 0 {
+		cost += alloc.CPUCoreHours * p.cpu
 	} else {
 		cost += alloc.CPUCost
 	}
-
-	// Memory cost
-	if memoryPrice > 0 {
-		cost += alloc.RAMGBHours * memoryPrice
+	if p.memory > 0 {
+		cost += alloc.RAMGBHours * p.memory
 	} else {
 		cost += alloc.RAMCost
 	}
-
-	// GPU/Accelerator cost (OpenCost reports all accelerators as GPUHours)
-	if acceleratorPrice > 0 {
-		cost += alloc.GPUHours * acceleratorPrice
+	// OpenCost reports all accelerators as GPUHours.
+	if p.accelerator > 0 {
+		cost += alloc.GPUHours * p.accelerator
 	} else {
 		cost += alloc.GPUCost
 	}
-
 	return cost
 }
 
+// calculateCost prices a single allocation, calling loadPrices on every invocation.
+// In loops prefer one loadPrices call reused via costFromPrices.
+func (s *BillingService) calculateCost(ctx context.Context, config *BillingConfig, alloc *opencost.Allocation) float64 {
+	if billingActive := config != nil && config.Enabled; !billingActive {
+		return alloc.TotalCost // skip the price lookup entirely when billing is off
+	}
+	return costFromPrices(config, s.loadPrices(ctx), alloc)
+}
+
 func (s *BillingService) scaleDownNamespace(ctx context.Context, namespace string) error {
 	// Scale down deployments
 	deployments, err := s.k8sClient.ListDeployments(ctx, namespace)
@@ -639,6 +749,3 @@ func (s *BillingService) scaleUpNamespace(ctx context.Context, namespace string)
 
 	return nil
 }
-
-// Unused import fix
-var _ = appsv1.Deployment{}
diff --git a/api-server/internal/service/billing_service_test.go b/api-server/internal/service/billing_service_test.go
new file mode 100644
index 0000000..e6f6f59
--- /dev/null
+++ b/api-server/internal/service/billing_service_test.go
@@ -0,0 +1,143 @@
+package service
+
+import (
+	"context"
+	"encoding/json"
+	"testing"
+	"time"
+
+	corev1 "k8s.io/api/core/v1"
+	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
+	k8sfake "k8s.io/client-go/kubernetes/fake"
+
+	"github.com/bison/api-server/internal/k8s"
+	"github.com/bison/api-server/internal/opencost"
+)
+
+// newTestBillingService returns a BillingService wired to a fake clientset that is
+// pre-seeded with one ConfigMap holding the JSON encoding of resourceConfigs.
+// Every other constructor dependency is passed as nil.
+func newTestBillingService(resourceConfigs []ResourceDefinition) *BillingService {
+	encoded, _ := json.Marshal(resourceConfigs)
+
+	meta := metav1.ObjectMeta{Name: ResourceConfigName, Namespace: ResourceConfigNamespace}
+	seed := &corev1.ConfigMap{
+		ObjectMeta: meta,
+		Data:       map[string]string{ResourceConfigDataKey: string(encoded)},
+	}
+
+	fakeClient := k8s.NewClientWithInterfaces(k8sfake.NewSimpleClientset(seed), nil)
+	resourceSvc := NewResourceConfigService(fakeClient)
+	balanceSvc := NewBalanceService(fakeClient)
+	return NewBillingService(fakeClient, nil, balanceSvc, nil, nil, resourceSvc)
+}
+
+func TestCalculateCostWithConfiguredPrices(t *testing.T) {
+	svc := newTestBillingService([]ResourceDefinition{
+		{Name: "cpu", Enabled: true, Price: 0.1, Category: CategoryCompute},
+		{Name: "memory", Enabled: true, Price: 0.05, Category: CategoryMemory},
+		{Name: "nvidia.com/gpu", Enabled: true, Price: 8, Category: CategoryAccelerator},
+	})
+
+	config := &BillingConfig{Enabled: true}
+	alloc := &opencost.Allocation{
+		CPUCoreHours: 10,
+		RAMGBHours:   20,
+		GPUHours:     2,
+		// Fallback costs that must be ignored when a configured price exists.
+		CPUCost: 999,
+		RAMCost: 999,
+		GPUCost: 999,
+	}
+
+	got := svc.calculateCost(context.Background(), config, alloc)
+	want := 10*0.1 + 20*0.05 + 2*8.0 // 1 + 1 + 16 = 18
+	if got != want {
+		t.Fatalf("calculateCost = %v, want %v", got, want)
+	}
+}
+
+// TestCalculateCostFallsBackToAllocationCost verifies that, with billing enabled but
+// no resource definitions configured, the result is the sum of the CPU, RAM and GPU
+// costs already present on the allocation.
+func TestCalculateCostFallsBackToAllocationCost(t *testing.T) {
+	billing := newTestBillingService([]ResourceDefinition{})
+
+	enabled := &BillingConfig{Enabled: true}
+	allocation := &opencost.Allocation{CPUCost: 1.5, RAMCost: 2.5, GPUCost: 6.0}
+
+	want := 1.5 + 2.5 + 6.0
+	if got := billing.calculateCost(context.Background(), enabled, allocation); got != want {
+		t.Fatalf("calculateCost fallback = %v, want %v", got, want)
+	}
+}
+
+// TestCalculateCostDisabledReturnsTotalCost verifies that both a nil config and a
+// config with Enabled=false make calculateCost return the allocation's TotalCost.
+func TestCalculateCostDisabledReturnsTotalCost(t *testing.T) {
+	ctx := context.Background()
+	billing := newTestBillingService([]ResourceDefinition{})
+	allocation := &opencost.Allocation{TotalCost: 42}
+
+	withNil := billing.calculateCost(ctx, nil, allocation)
+	if withNil != 42 {
+		t.Fatalf("calculateCost(nil config) = %v, want 42", withNil)
+	}
+
+	off := &BillingConfig{Enabled: false}
+	withDisabled := billing.calculateCost(ctx, off, allocation)
+	if withDisabled != 42 {
+		t.Fatalf("calculateCost(disabled) = %v, want 42", withDisabled)
+	}
+}
+
+// TestLastBilledRoundTrip exercises getLastBilled/setLastBilled: the initial read
+// yields the zero time, a written timestamp reads back equal, and a second write
+// replaces the first.
+func TestLastBilledRoundTrip(t *testing.T) {
+	svc := newTestBillingService([]ResourceDefinition{})
+	ctx := context.Background()
+
+	// No timestamp yet -> zero time.
+	if ts, err := svc.getLastBilled(ctx); err != nil || !ts.IsZero() {
+		t.Fatalf("expected zero time initially, got %v err=%v", ts, err)
+	}
+
+	// Truncate to whole seconds so the comparison does not depend on sub-second
+	// precision surviving the round trip.
+	now := time.Now().UTC().Truncate(time.Second)
+	if err := svc.setLastBilled(ctx, now); err != nil {
+		t.Fatalf("setLastBilled: %v", err)
+	}
+	got, err := svc.getLastBilled(ctx)
+	if err != nil {
+		t.Fatalf("getLastBilled: %v", err)
+	}
+	if !got.Equal(now) {
+		t.Fatalf("round-trip mismatch: got %v want %v", got, now)
+	}
+
+	// Overwrite works.
+	later := now.Add(2 * time.Hour)
+	if err := svc.setLastBilled(ctx, later); err != nil {
+		t.Fatalf("setLastBilled (overwrite): %v", err)
+	}
+	// Check the read error explicitly so a failed read is not misreported as a
+	// value mismatch.
+	got, err = svc.getLastBilled(ctx)
+	if err != nil {
+		t.Fatalf("getLastBilled (overwrite): %v", err)
+	}
+	if !got.Equal(later) {
+		t.Fatalf("overwrite mismatch: got %v want %v", got, later)
+	}
+}
+
+// TestIsGracePeriodExpired table-tests isGracePeriodExpired for a missing overdue
+// timestamp and for hour- and day-based grace periods on both sides of expiry.
+func TestIsGracePeriodExpired(t *testing.T) {
+	s := &BillingService{}
+	// Keep every case well away from the expiry instant: an overdue time exactly one
+	// grace period in the past would make the outcome depend on clock resolution and
+	// on whether the implementation compares strictly.
+	recent := time.Now().Add(-2 * time.Hour)
+	old := time.Now().Add(-72 * time.Hour)
+
+	cases := []struct {
+		name      string
+		cfg       *BillingConfig
+		overdueAt *time.Time
+		want      bool
+	}{
+		{"nil overdue", &BillingConfig{GracePeriodValue: 1, GracePeriodUnit: "days"}, nil, false},
+		{"within hours", &BillingConfig{GracePeriodValue: 24, GracePeriodUnit: "hours"}, &recent, false},
+		{"expired hours", &BillingConfig{GracePeriodValue: 1, GracePeriodUnit: "hours"}, &recent, true},
+		{"within days", &BillingConfig{GracePeriodValue: 7, GracePeriodUnit: "days"}, &old, false},
+		{"expired days", &BillingConfig{GracePeriodValue: 1, GracePeriodUnit: "days"}, &old, true},
+	}
+	for _, tc := range cases {
+		t.Run(tc.name, func(t *testing.T) {
+			if got := s.isGracePeriodExpired(tc.cfg, tc.overdueAt); got != tc.want {
+				t.Fatalf("isGracePeriodExpired = %v, want %v", got, tc.want)
+			}
+		})
+	}
+}
diff --git a/api-server/internal/service/config_transfer_service.go b/api-server/internal/service/config_transfer_service.go
new file mode 100644
index 0000000..5366c49
--- /dev/null
+++ b/api-server/internal/service/config_transfer_service.go
@@ -0,0 +1,664 @@
+package service
+
+import (
+	"context"
+	"encoding/json"
+	"fmt"
+	"time"
+
+	"github.com/bison/api-server/pkg/logger"
+)
+
+// Constants describing the export file format.
+const (
+	// ExportVersion is written to ExportConfig.Version; Preview rejects any other value.
+	ExportVersion    = "1.0"
+	// RedactedValue is the placeholder substituted for secrets that are not exported.
+	RedactedValue    = "***REDACTED***"
+	// The Section* values are the keys used in ExportConfig.Sections.
+	SectionBilling   = "billing"
+	SectionAlerts    = "alerts"
+	SectionResources = "resources"
+	SectionCP        = "controlPlane"
+	SectionScripts   = "initScripts"
+)
+
+// AllSections lists every known section key; Apply walks sections in this order.
+var AllSections = []string{SectionBilling, SectionAlerts, SectionResources, SectionCP, SectionScripts}
+
+// ExportConfig is the top-level structure of an exported configuration file.
+type ExportConfig struct {
+	// Version is the file format version; Export sets it to ExportVersion.
+	Version    string                     `json:"version"`
+	// ExportedAt is the time at which Export built the file.
+	ExportedAt time.Time                  `json:"exportedAt"`
+	// ExportedBy is the operator name passed to Export.
+	ExportedBy string                     `json:"exportedBy"`
+	// Sections maps a section key (one of the Section* constants) to its JSON payload.
+	Sections   map[string]json.RawMessage `json:"sections"`
+}
+
+// SectionPreview holds the validation outcome and diff information for one
+// configuration section of an import file.
+type SectionPreview struct {
+	// Present is set to true by every preview helper for a section found in the file.
+	Present          bool                    `json:"present"`
+	// Valid is false when the payload could not be parsed or failed validation.
+	Valid            bool                    `json:"valid"`
+	// HasSensitiveData is true when the payload contains the RedactedValue placeholder.
+	HasSensitiveData bool                    `json:"hasSensitiveData"`
+	// Changes lists scalar fields whose imported value differs from the current one.
+	Changes          map[string]*FieldChange `json:"changes,omitempty"`
+	// Summary classifies entries of list-style sections (resources, init scripts).
+	Summary          *ResourceSummary        `json:"summary,omitempty"`
+	// Warnings are non-fatal notices; Errors are validation failures.
+	Warnings         []string                `json:"warnings,omitempty"`
+	Errors           []string                `json:"errors,omitempty"`
+}
+
+// FieldChange records one differing field: the value currently stored and the
+// value found in the import file.
+type FieldChange struct {
+	Current  interface{} `json:"current"`
+	Imported interface{} `json:"imported"`
+}
+
+// ResourceSummary classifies the entries of an array-based section by comparing the
+// imported list with the current one. Each slice holds entry names.
+type ResourceSummary struct {
+	// Added: present in the import only. Removed: present in the current config only.
+	Added     []string `json:"added,omitempty"`
+	Modified  []string `json:"modified,omitempty"`
+	Removed   []string `json:"removed,omitempty"`
+	Unchanged []string `json:"unchanged,omitempty"`
+}
+
+// ImportPreviewResult is the outcome of Preview: overall validity plus a
+// per-section preview of what an import would change.
+type ImportPreviewResult struct {
+	// Valid is false when the version is unsupported or any section preview is invalid.
+	Valid      bool                       `json:"valid"`
+	// Version echoes the version found in the import file.
+	Version    string                     `json:"version"`
+	// ExportedAt is the file's export time in RFC 3339 form; empty when the time is zero.
+	ExportedAt string                     `json:"exportedAt,omitempty"`
+	// Sections holds one preview per recognised section key.
+	Sections   map[string]*SectionPreview `json:"sections"`
+	// Errors and Warnings are file-level messages (e.g. unsupported version, unknown section).
+	Errors     []string                   `json:"errors"`
+	Warnings   []string                   `json:"warnings"`
+}
+
+// ImportRequest is the input to Apply.
+type ImportRequest struct {
+	// Config is the parsed import file.
+	Config            ExportConfig `json:"config"`
+	// Sections lists the section keys the caller wants applied.
+	Sections          []string     `json:"sections"`
+	// PreserveSensitive asks Apply to keep currently stored secrets wherever the
+	// import carries a redaction placeholder (alerts and control plane sections).
+	PreserveSensitive bool         `json:"preserveSensitive"`
+}
+
+// ImportResult is the outcome of Apply.
+type ImportResult struct {
+	// Message is a one-line summary of how many sections were imported.
+	Message  string   `json:"message"`
+	// Applied lists sections that were saved successfully.
+	Applied  []string `json:"applied"`
+	// Skipped lists requested sections that were missing from the file or failed to apply.
+	Skipped  []string `json:"skipped"`
+	// Warnings holds one message per section that failed to apply.
+	Warnings []string `json:"warnings"`
+}
+
+// ConfigTransferService handles configuration export and import by delegating each
+// section to the service that owns it.
+type ConfigTransferService struct {
+	billingSvc        *BillingService        // billing section
+	alertSvc          *AlertService          // alerts section
+	resourceConfigSvc *ResourceConfigService // resources section
+	initScriptSvc     *InitScriptService     // controlPlane and initScripts sections
+}
+
+// NewConfigTransferService wires a ConfigTransferService to the four services that
+// own the exportable configuration sections.
+func NewConfigTransferService(
+	billingSvc *BillingService,
+	alertSvc *AlertService,
+	resourceConfigSvc *ResourceConfigService,
+	initScriptSvc *InitScriptService,
+) *ConfigTransferService {
+	svc := new(ConfigTransferService)
+	svc.billingSvc = billingSvc
+	svc.alertSvc = alertSvc
+	svc.resourceConfigSvc = resourceConfigSvc
+	svc.initScriptSvc = initScriptSvc
+	return svc
+}
+
+// Export builds an ExportConfig containing the requested configuration sections.
+//
+// sections lists the section keys to include (see AllSections); unrecognised keys
+// are ignored. When includeSensitive is false, alert channel secrets are masked via
+// redactAlertChannels and non-empty control-plane Password/PrivateKey values are
+// replaced with RedactedValue. operator is recorded as ExportedBy.
+//
+// It returns an error when a selected section cannot be loaded or JSON-encoded.
+func (s *ConfigTransferService) Export(ctx context.Context, sections []string, includeSensitive bool, operator string) (*ExportConfig, error) {
+	logger.Info("Exporting configuration", "sections", sections, "includeSensitive", includeSensitive, "operator", operator)
+
+	sectionSet := make(map[string]bool, len(sections))
+	for _, sec := range sections {
+		sectionSet[sec] = true
+	}
+
+	result := &ExportConfig{
+		Version:    ExportVersion,
+		ExportedAt: time.Now(),
+		ExportedBy: operator,
+		Sections:   make(map[string]json.RawMessage),
+	}
+
+	// store encodes one section payload. An encoding failure is returned rather than
+	// dropped, because a nil RawMessage would be written to the file as "null".
+	store := func(section string, payload interface{}) error {
+		data, err := json.Marshal(payload)
+		if err != nil {
+			return fmt.Errorf("failed to encode %s section: %w", section, err)
+		}
+		result.Sections[section] = data
+		return nil
+	}
+
+	if sectionSet[SectionBilling] {
+		config, err := s.billingSvc.GetConfig(ctx)
+		if err != nil {
+			return nil, fmt.Errorf("failed to export billing config: %w", err)
+		}
+		if err := store(SectionBilling, config); err != nil {
+			return nil, err
+		}
+	}
+
+	if sectionSet[SectionAlerts] {
+		config, err := s.alertSvc.GetConfig(ctx)
+		if err != nil {
+			return nil, fmt.Errorf("failed to export alert config: %w", err)
+		}
+		if !includeSensitive {
+			// NOTE(review): redaction mutates the object returned by GetConfig in place;
+			// this assumes the service hands out a fresh copy — confirm.
+			s.redactAlertChannels(config)
+		}
+		if err := store(SectionAlerts, config); err != nil {
+			return nil, err
+		}
+	}
+
+	if sectionSet[SectionResources] {
+		configs, err := s.resourceConfigSvc.GetResourceConfigs(ctx)
+		if err != nil {
+			return nil, fmt.Errorf("failed to export resource configs: %w", err)
+		}
+		if err := store(SectionResources, configs); err != nil {
+			return nil, err
+		}
+	}
+
+	if sectionSet[SectionCP] {
+		config, err := s.initScriptSvc.GetControlPlaneConfig(ctx)
+		if err != nil {
+			return nil, fmt.Errorf("failed to export control plane config: %w", err)
+		}
+		if !includeSensitive {
+			// Empty credentials stay empty so an import can tell "unset" from "redacted".
+			if config.Password != "" {
+				config.Password = RedactedValue
+			}
+			if config.PrivateKey != "" {
+				config.PrivateKey = RedactedValue
+			}
+		}
+		if err := store(SectionCP, config); err != nil {
+			return nil, err
+		}
+	}
+
+	if sectionSet[SectionScripts] {
+		groups, err := s.initScriptSvc.GetAllScriptGroups(ctx)
+		if err != nil {
+			return nil, fmt.Errorf("failed to export init scripts: %w", err)
+		}
+		if err := store(SectionScripts, groups); err != nil {
+			return nil, err
+		}
+	}
+
+	return result, nil
+}
+
+// redactAlertChannels replaces, in place, every non-empty "url", "webhook" and
+// "smtp" entry of each channel's Config with RedactedValue.
+//
+// The whole value is replaced rather than partially masked: webhook URLs usually
+// carry their secret token at the end, so keeping leading or trailing characters
+// would leak part of it, and RedactedValue is the placeholder the preview and apply
+// steps compare against to detect redacted fields. A nil config is a no-op.
+func (s *ConfigTransferService) redactAlertChannels(config *AlertConfig) {
+	if config == nil {
+		return
+	}
+	sensitiveKeys := map[string]bool{
+		"url":     true,
+		"webhook": true,
+		"smtp":    true,
+	}
+	for i := range config.Channels {
+		settings := config.Channels[i].Config
+		for key, val := range settings {
+			// Empty values stay empty so "unset" remains distinguishable from "redacted".
+			if sensitiveKeys[key] && val != "" {
+				settings[key] = RedactedValue
+			}
+		}
+	}
+}
+
+// Preview checks an import file and reports, per section, whether it is valid and
+// how it differs from the current configuration. Nothing is modified.
+//
+// A file whose version is not ExportVersion is rejected immediately. Section keys
+// that are not recognised only produce a warning. The returned error is always nil.
+func (s *ConfigTransferService) Preview(ctx context.Context, config *ExportConfig) (*ImportPreviewResult, error) {
+	logger.Info("Previewing configuration import")
+
+	out := &ImportPreviewResult{
+		Valid:    true,
+		Version:  config.Version,
+		Sections: make(map[string]*SectionPreview),
+		Errors:   []string{},
+		Warnings: []string{},
+	}
+
+	if config.Version != ExportVersion {
+		out.Valid = false
+		out.Errors = append(out.Errors, fmt.Sprintf("不支持的版本: %s (期望 %s)", config.Version, ExportVersion))
+		return out, nil
+	}
+
+	if !config.ExportedAt.IsZero() {
+		out.ExportedAt = config.ExportedAt.Format(time.RFC3339)
+	}
+
+	// One previewer per known section key.
+	previewers := map[string]func(context.Context, json.RawMessage) *SectionPreview{
+		SectionBilling:   s.previewBilling,
+		SectionAlerts:    s.previewAlerts,
+		SectionResources: s.previewResources,
+		SectionCP:        s.previewControlPlane,
+		SectionScripts:   s.previewInitScripts,
+	}
+
+	for name, payload := range config.Sections {
+		run, known := previewers[name]
+		if !known {
+			out.Warnings = append(out.Warnings, fmt.Sprintf("未知的配置模块: %s (将被忽略)", name))
+			continue
+		}
+		sectionPreview := run(ctx, payload)
+		out.Sections[name] = sectionPreview
+		// A single invalid section invalidates the whole file.
+		out.Valid = out.Valid && sectionPreview.Valid
+	}
+
+	return out, nil
+}
+
+// previewBilling parses and validates an imported billing section, then diffs it
+// field by field against the current billing config. If the current config cannot
+// be read, the validation outcome is returned with a warning and no diff.
+func (s *ConfigTransferService) previewBilling(ctx context.Context, raw json.RawMessage) *SectionPreview {
+	out := &SectionPreview{Present: true, Valid: true}
+
+	var incoming BillingConfig
+	if err := json.Unmarshal(raw, &incoming); err != nil {
+		out.Valid = false
+		out.Errors = append(out.Errors, "计费配置格式无效: "+err.Error())
+		return out
+	}
+
+	// Validation: record every failure instead of stopping at the first.
+	if incoming.Interval <= 0 || incoming.Interval > 24 {
+		out.Valid = false
+		out.Errors = append(out.Errors, "计费间隔必须在 1-24 小时之间")
+	}
+	if incoming.Currency == "" {
+		out.Valid = false
+		out.Errors = append(out.Errors, "货币代码不能为空")
+	}
+
+	existing, err := s.billingSvc.GetConfig(ctx)
+	if err != nil {
+		out.Warnings = append(out.Warnings, "无法获取当前计费配置进行对比")
+		return out
+	}
+
+	// Both sides of each row come from the same struct field, so the interface
+	// comparison below is equivalent to comparing the typed values directly.
+	rows := []struct {
+		field    string
+		cur, imp interface{}
+	}{
+		{"enabled", existing.Enabled, incoming.Enabled},
+		{"interval", existing.Interval, incoming.Interval},
+		{"currency", existing.Currency, incoming.Currency},
+		{"currencySymbol", existing.CurrencySymbol, incoming.CurrencySymbol},
+		{"gracePeriodValue", existing.GracePeriodValue, incoming.GracePeriodValue},
+		{"gracePeriodUnit", existing.GracePeriodUnit, incoming.GracePeriodUnit},
+	}
+
+	out.Changes = make(map[string]*FieldChange)
+	for _, row := range rows {
+		if row.cur != row.imp {
+			out.Changes[row.field] = &FieldChange{Current: row.cur, Imported: row.imp}
+		}
+	}
+
+	return out
+}
+
+// previewAlerts parses and validates an imported alerts section and compares it
+// with the current alert config.
+//
+// Validation requires a non-negative balance threshold and an id, type and name on
+// every channel. If any channel setting equals RedactedValue, HasSensitiveData is
+// set and a single warning is added. The diff covers the balance threshold and the
+// number of channels only. If the current config cannot be read, the validation
+// outcome is returned with a warning and no diff.
+func (s *ConfigTransferService) previewAlerts(ctx context.Context, raw json.RawMessage) *SectionPreview {
+	preview := &SectionPreview{Present: true, Valid: true}
+
+	var imported AlertConfig
+	if err := json.Unmarshal(raw, &imported); err != nil {
+		preview.Valid = false
+		preview.Errors = append(preview.Errors, "告警配置格式无效: "+err.Error())
+		return preview
+	}
+
+	if imported.BalanceThreshold < 0 {
+		preview.Errors = append(preview.Errors, "告警阈值不能为负数")
+		preview.Valid = false
+	}
+
+	for _, ch := range imported.Channels {
+		if ch.ID == "" || ch.Type == "" || ch.Name == "" {
+			preview.Errors = append(preview.Errors, fmt.Sprintf("告警通道 '%s' 缺少必填字段 (id/type/name)", ch.Name))
+			preview.Valid = false
+		}
+		for _, val := range ch.Config {
+			if val == RedactedValue {
+				preview.HasSensitiveData = true
+				break
+			}
+		}
+	}
+	// Warn once for the whole section; warning inside the loop would repeat the same
+	// message for every channel that carries a redacted value.
+	if preview.HasSensitiveData {
+		preview.Warnings = append(preview.Warnings, "告警通道包含已脱敏的敏感数据，导入时将保留当前值")
+	}
+
+	current, err := s.alertSvc.GetConfig(ctx)
+	if err != nil {
+		preview.Warnings = append(preview.Warnings, "无法获取当前告警配置进行对比")
+		return preview
+	}
+
+	preview.Changes = make(map[string]*FieldChange)
+	if current.BalanceThreshold != imported.BalanceThreshold {
+		preview.Changes["balanceThreshold"] = &FieldChange{Current: current.BalanceThreshold, Imported: imported.BalanceThreshold}
+	}
+	if len(current.Channels) != len(imported.Channels) {
+		preview.Changes["channels"] = &FieldChange{
+			Current:  fmt.Sprintf("%d 个通道", len(current.Channels)),
+			Imported: fmt.Sprintf("%d 个通道", len(imported.Channels)),
+		}
+	}
+
+	return preview
+}
+
+// previewResources parses and validates an imported resource list, then classifies
+// each resource by name as added, modified, unchanged or removed relative to the
+// current list. A warning is added when the import would remove resources. If the
+// current list cannot be read, the validation outcome is returned with a warning
+// and no summary.
+func (s *ConfigTransferService) previewResources(ctx context.Context, raw json.RawMessage) *SectionPreview {
+	out := &SectionPreview{Present: true, Valid: true}
+
+	var incoming []ResourceDefinition
+	if err := json.Unmarshal(raw, &incoming); err != nil {
+		out.Valid = false
+		out.Errors = append(out.Errors, "资源配置格式无效: "+err.Error())
+		return out
+	}
+
+	for _, def := range incoming {
+		if def.Name == "" {
+			out.Valid = false
+			out.Errors = append(out.Errors, "资源名称不能为空")
+		}
+		if def.Divisor <= 0 {
+			out.Valid = false
+			out.Errors = append(out.Errors, fmt.Sprintf("资源 '%s' 的 divisor 必须大于 0", def.Name))
+		}
+	}
+
+	existing, err := s.resourceConfigSvc.GetResourceConfigs(ctx)
+	if err != nil {
+		out.Warnings = append(out.Warnings, "无法获取当前资源配置进行对比")
+		return out
+	}
+
+	byName := make(map[string]ResourceDefinition)
+	for _, def := range existing {
+		byName[def.Name] = def
+	}
+
+	summary := &ResourceSummary{}
+	importedNames := make(map[string]bool)
+	for _, def := range incoming {
+		importedNames[def.Name] = true
+
+		prev, known := byName[def.Name]
+		if !known {
+			summary.Added = append(summary.Added, def.Name)
+			continue
+		}
+
+		same := prev.DisplayName == def.DisplayName &&
+			prev.Unit == def.Unit &&
+			prev.Divisor == def.Divisor &&
+			prev.Category == def.Category &&
+			prev.Enabled == def.Enabled &&
+			prev.Price == def.Price &&
+			prev.SortOrder == def.SortOrder &&
+			prev.ShowInQuota == def.ShowInQuota
+		if same {
+			summary.Unchanged = append(summary.Unchanged, def.Name)
+		} else {
+			summary.Modified = append(summary.Modified, def.Name)
+		}
+	}
+
+	// Anything currently configured but missing from the import would be dropped.
+	for _, def := range existing {
+		if !importedNames[def.Name] {
+			summary.Removed = append(summary.Removed, def.Name)
+		}
+	}
+	if len(summary.Removed) > 0 {
+		out.Warnings = append(out.Warnings, fmt.Sprintf("以下资源将被移除: %v", summary.Removed))
+	}
+
+	out.Summary = summary
+	return out
+}
+
+// previewControlPlane parses and validates an imported control-plane section (SSH
+// port range, auth method), flags redacted credentials, and diffs host, port, user
+// and auth method against the current config. If the current config cannot be
+// read, the validation outcome is returned with a warning and no diff.
+func (s *ConfigTransferService) previewControlPlane(ctx context.Context, raw json.RawMessage) *SectionPreview {
+	out := &SectionPreview{Present: true, Valid: true}
+
+	var incoming ControlPlaneConfig
+	if err := json.Unmarshal(raw, &incoming); err != nil {
+		out.Valid = false
+		out.Errors = append(out.Errors, "控制面配置格式无效: "+err.Error())
+		return out
+	}
+
+	if port := incoming.SSHPort; port < 1 || port > 65535 {
+		out.Valid = false
+		out.Errors = append(out.Errors, "SSH 端口必须在 1-65535 之间")
+	}
+	switch incoming.AuthMethod {
+	case "", "password", "privateKey":
+		// accepted
+	default:
+		out.Valid = false
+		out.Errors = append(out.Errors, "认证方式必须为 password 或 privateKey")
+	}
+
+	redacted := incoming.Password == RedactedValue || incoming.PrivateKey == RedactedValue
+	if redacted {
+		out.HasSensitiveData = true
+		out.Warnings = append(out.Warnings, "敏感数据 (密码/私钥) 已被排除，导入时将保留当前值")
+	}
+
+	existing, err := s.initScriptSvc.GetControlPlaneConfig(ctx)
+	if err != nil {
+		out.Warnings = append(out.Warnings, "无法获取当前控制面配置进行对比")
+		return out
+	}
+
+	// Credentials are deliberately left out of the diff.
+	rows := []struct {
+		field    string
+		cur, imp interface{}
+	}{
+		{"host", existing.Host, incoming.Host},
+		{"sshPort", existing.SSHPort, incoming.SSHPort},
+		{"sshUser", existing.SSHUser, incoming.SSHUser},
+		{"authMethod", existing.AuthMethod, incoming.AuthMethod},
+	}
+
+	out.Changes = make(map[string]*FieldChange)
+	for _, row := range rows {
+		if row.cur != row.imp {
+			out.Changes[row.field] = &FieldChange{Current: row.cur, Imported: row.imp}
+		}
+	}
+
+	return out
+}
+
+// previewInitScripts parses and validates imported script groups and summarises,
+// by group ID, which would be added, overwritten or removed. Every imported group
+// whose ID already exists is reported as modified; contents are not compared. A
+// warning is added when existing built-in groups would be overwritten. If the
+// current groups cannot be read, the validation outcome is returned with a warning
+// and no summary.
+func (s *ConfigTransferService) previewInitScripts(ctx context.Context, raw json.RawMessage) *SectionPreview {
+	out := &SectionPreview{Present: true, Valid: true}
+
+	var incoming []ScriptGroup
+	if err := json.Unmarshal(raw, &incoming); err != nil {
+		out.Valid = false
+		out.Errors = append(out.Errors, "初始化脚本配置格式无效: "+err.Error())
+		return out
+	}
+
+	for _, grp := range incoming {
+		if grp.ID == "" || grp.Name == "" {
+			out.Valid = false
+			out.Errors = append(out.Errors, fmt.Sprintf("脚本组 '%s' 缺少必填字段 (id/name)", grp.Name))
+		}
+		if !(grp.Phase == PhasePreJoin || grp.Phase == PhasePostJoin) {
+			out.Valid = false
+			out.Errors = append(out.Errors, fmt.Sprintf("脚本组 '%s' 的 phase 必须为 pre-join 或 post-join", grp.Name))
+		}
+	}
+
+	existing, err := s.initScriptSvc.GetAllScriptGroups(ctx)
+	if err != nil {
+		out.Warnings = append(out.Warnings, "无法获取当前初始化脚本进行对比")
+		return out
+	}
+
+	byID := make(map[string]ScriptGroup)
+	for _, grp := range existing {
+		byID[grp.ID] = grp
+	}
+
+	// Single pass over the import: classify each group, remember its ID, and count
+	// how many existing built-in groups it would overwrite.
+	summary := &ResourceSummary{}
+	importedIDs := make(map[string]bool)
+	overwrittenBuiltins := 0
+	for _, grp := range incoming {
+		importedIDs[grp.ID] = true
+
+		prev, known := byID[grp.ID]
+		if !known {
+			summary.Added = append(summary.Added, grp.Name)
+			continue
+		}
+		summary.Modified = append(summary.Modified, grp.Name)
+		if prev.Builtin {
+			overwrittenBuiltins++
+		}
+	}
+
+	for _, grp := range existing {
+		if !importedIDs[grp.ID] {
+			summary.Removed = append(summary.Removed, grp.Name)
+		}
+	}
+
+	if overwrittenBuiltins > 0 {
+		out.Warnings = append(out.Warnings, fmt.Sprintf("将覆盖 %d 个内置脚本组", overwrittenBuiltins))
+	}
+
+	out.Summary = summary
+	return out
+}
+
+// Apply writes the requested sections of an import file to their owning services.
+//
+// Sections are processed in AllSections order. A requested section that is missing
+// from the file is reported as skipped. A section that fails to apply is reported
+// as skipped with a warning, and processing continues with the next one. The
+// returned error is always nil; per-section failures are reported in the result.
+func (s *ConfigTransferService) Apply(ctx context.Context, req *ImportRequest) (*ImportResult, error) {
+	logger.Info("Applying imported configuration", "sections", req.Sections)
+
+	out := &ImportResult{
+		Applied:  []string{},
+		Skipped:  []string{},
+		Warnings: []string{},
+	}
+
+	requested := make(map[string]bool)
+	for _, name := range req.Sections {
+		requested[name] = true
+	}
+
+	appliers := map[string]func(json.RawMessage) error{
+		SectionBilling:   func(raw json.RawMessage) error { return s.applyBilling(ctx, raw) },
+		SectionAlerts:    func(raw json.RawMessage) error { return s.applyAlerts(ctx, raw, req.PreserveSensitive) },
+		SectionResources: func(raw json.RawMessage) error { return s.applyResources(ctx, raw) },
+		SectionCP:        func(raw json.RawMessage) error { return s.applyControlPlane(ctx, raw, req.PreserveSensitive) },
+		SectionScripts:   func(raw json.RawMessage) error { return s.applyInitScripts(ctx, raw) },
+	}
+
+	for _, name := range AllSections {
+		if !requested[name] {
+			continue
+		}
+		payload, present := req.Config.Sections[name]
+		if !present {
+			out.Skipped = append(out.Skipped, name)
+			continue
+		}
+
+		var err error
+		if apply, ok := appliers[name]; ok {
+			err = apply(payload)
+		}
+
+		if err == nil {
+			out.Applied = append(out.Applied, name)
+			continue
+		}
+		out.Warnings = append(out.Warnings, fmt.Sprintf("%s 导入失败: %s", name, err.Error()))
+		out.Skipped = append(out.Skipped, name)
+	}
+
+	if n := len(out.Applied); n > 0 {
+		out.Message = fmt.Sprintf("成功导入 %d 个配置模块", n)
+	} else {
+		out.Message = "未成功导入任何配置模块"
+	}
+
+	return out, nil
+}
+
+func (s *ConfigTransferService) applyBilling(ctx context.Context, raw json.RawMessage) error {
+	var config BillingConfig
+	if err := json.Unmarshal(raw, &config); err != nil {
+		return fmt.Errorf("解析计费配置失败: %w", err)
+	}
+	return s.billingSvc.SetConfig(ctx, &config)
+}
+
+// applyAlerts decodes an alerts section and saves it through the alert service.
+//
+// When preserveSensitive is true, every channel setting that holds an export
+// placeholder instead of a real secret is replaced with the value currently stored
+// for the same channel ID and key. The restore is best-effort: if the current
+// config cannot be read, or there is no matching channel or key, the imported
+// value is kept as is.
+func (s *ConfigTransferService) applyAlerts(ctx context.Context, raw json.RawMessage, preserveSensitive bool) error {
+	var config AlertConfig
+	if err := json.Unmarshal(raw, &config); err != nil {
+		return fmt.Errorf("解析告警配置失败: %w", err)
+	}
+
+	// isPlaceholder reports whether val is an export mask rather than a real secret.
+	isPlaceholder := func(val string) bool {
+		switch {
+		case val == RedactedValue:
+			return true
+		case len(val) == 18 && val[10:13] == "***":
+			// Partial mask written by exports: first 10 bytes + "***" + last 5 bytes.
+			// Checking only for a "***" suffix misses it, and the masked text would
+			// then be saved as if it were the real value.
+			return true
+		case len(val) > 8 && val[len(val)-3:] == "***":
+			// Suffix-style mask; kept for compatibility with the previous check.
+			return true
+		}
+		return false
+	}
+
+	if preserveSensitive {
+		current, err := s.alertSvc.GetConfig(ctx)
+		if err == nil {
+			currentChannelMap := make(map[string]NotifyChannel)
+			for _, ch := range current.Channels {
+				currentChannelMap[ch.ID] = ch
+			}
+			for i, ch := range config.Channels {
+				curCh, exists := currentChannelMap[ch.ID]
+				if !exists {
+					continue
+				}
+				for key, val := range ch.Config {
+					if !isPlaceholder(val) {
+						continue
+					}
+					if curVal, ok := curCh.Config[key]; ok {
+						config.Channels[i].Config[key] = curVal
+					}
+				}
+			}
+		}
+	}
+
+	return s.alertSvc.SetConfig(ctx, &config)
+}
+
+// applyResources decodes a resource list and saves it through the resource config
+// service.
+func (s *ConfigTransferService) applyResources(ctx context.Context, raw json.RawMessage) error {
+	var defs []ResourceDefinition
+	err := json.Unmarshal(raw, &defs)
+	if err != nil {
+		return fmt.Errorf("解析资源配置失败: %w", err)
+	}
+	return s.resourceConfigSvc.SaveResourceConfigs(ctx, defs)
+}
+
+// applyControlPlane decodes a control-plane section and saves it through the init
+// script service. When preserveSensitive is true and the current config can be
+// read, a Password or PrivateKey equal to RedactedValue is replaced with the value
+// currently stored; if the current config cannot be read, the imported values are
+// saved unchanged.
+func (s *ConfigTransferService) applyControlPlane(ctx context.Context, raw json.RawMessage, preserveSensitive bool) error {
+	var cp ControlPlaneConfig
+	if err := json.Unmarshal(raw, &cp); err != nil {
+		return fmt.Errorf("解析控制面配置失败: %w", err)
+	}
+
+	if !preserveSensitive {
+		return s.initScriptSvc.SaveControlPlaneConfig(ctx, &cp)
+	}
+
+	// Best-effort restore of credentials that were masked on export.
+	if stored, err := s.initScriptSvc.GetControlPlaneConfig(ctx); err == nil {
+		if cp.Password == RedactedValue {
+			cp.Password = stored.Password
+		}
+		if cp.PrivateKey == RedactedValue {
+			cp.PrivateKey = stored.PrivateKey
+		}
+	}
+
+	return s.initScriptSvc.SaveControlPlaneConfig(ctx, &cp)
+}
+
+// applyInitScripts decodes a list of script groups and saves the whole list
+// through the init script service.
+func (s *ConfigTransferService) applyInitScripts(ctx context.Context, raw json.RawMessage) error {
+	var scriptGroups []ScriptGroup
+	err := json.Unmarshal(raw, &scriptGroups)
+	if err != nil {
+		return fmt.Errorf("解析初始化脚本配置失败: %w", err)
+	}
+	return s.initScriptSvc.SaveAllScriptGroups(ctx, scriptGroups)
+}
diff --git a/api-server/internal/service/init_script_service.go b/api-server/internal/service/init_script_service.go
new file mode 100644
index 0000000..1444b90
--- /dev/null
+++ b/api-server/internal/service/init_script_service.go
@@ -0,0 +1,924 @@
+package service
+
+import (
+	"context"
+	"encoding/json"
+	"fmt"
+	"sort"
+	"strings"
+	"time"
+
+	corev1 "k8s.io/api/core/v1"
+	"k8s.io/apimachinery/pkg/api/errors"
+	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
+
+	"github.com/bison/api-server/internal/k8s"
+	"github.com/bison/api-server/pkg/logger"
+)
+
+// Names of the ConfigMaps (looked up in BisonNamespace) that back this service.
+// Both keep their JSON payload under the "config" data key.
+const (
+	// InitScriptsConfigMap holds the serialized InitScriptsConfig.
+	InitScriptsConfigMap        = "bison-init-scripts"
+	// ControlPlaneConfigConfigMap holds the serialized ControlPlaneConfig.
+	ControlPlaneConfigConfigMap = "bison-control-plane-config"
+)
+
+// ScriptPhase represents when a script should be executed.
+// GetScriptsForPhase filters script groups by this value.
+type ScriptPhase string
+
+const (
+	// PhasePreJoin is the phase used by the builtin node-preparation groups
+	// (swap, kernel parameters, firewall, ...).
+	PhasePreJoin  ScriptPhase = "pre-join"
+	// PhasePostJoin is the phase used by the builtin node-label group.
+	PhasePostJoin ScriptPhase = "post-join"
+)
+
+// Script represents a platform-specific script implementation.
+// GetMatchingScript compares OS and Arch against a NodePlatform by exact string
+// equality, with "*" acting as a wildcard on either field.
+type Script struct {
+	// ID identifies the script inside its group.
+	ID      string `json:"id"`
+	OS      string `json:"os"`      // "ubuntu", "centos", "debian", "*" (wildcard)
+	Arch    string `json:"arch"`    // "amd64", "arm64", "*" (wildcard)
+	Content string `json:"content"` // Shell script content
+}
+
+// ScriptGroup represents a group of scripts for a specific functionality.
+// A group bundles per-platform variants of one task; GetMatchingScript picks
+// the variant to use for a given node platform.
+type ScriptGroup struct {
+	// ID is the lookup key; CreateScriptGroup generates "custom-<unix nanos>" when it is empty.
+	ID          string      `json:"id"`
+	Name        string      `json:"name"`
+	Description string      `json:"description"`
+	// Phase selects the stage the group belongs to (see ScriptPhase).
+	Phase       ScriptPhase `json:"phase"`
+	// Enabled controls whether GetScriptsForPhase returns the group.
+	Enabled     bool        `json:"enabled"`
+	// Order is the ascending sort key used by GetAllScriptGroups.
+	Order       int         `json:"order"`
+	// Builtin groups cannot be deleted; CreateScriptGroup always clears this
+	// flag and UpdateScriptGroup preserves the stored value.
+	Builtin     bool        `json:"builtin"`
+	Scripts     []Script    `json:"scripts"`
+}
+
+// InitScriptsConfig holds all script groups.
+// It is the document that is JSON-encoded into the "config" key of the
+// InitScriptsConfigMap ConfigMap.
+type InitScriptsConfig struct {
+	Groups []ScriptGroup `json:"groups"`
+}
+
+// NodePlatform represents the detected platform of a node.
+// OS and Arch are the values GetMatchingScript compares against Script.OS and
+// Script.Arch; Version is not consulted by the matching code in this file.
+type NodePlatform struct {
+	OS      string `json:"os"`
+	Version string `json:"version"`
+	Arch    string `json:"arch"`
+}
+
+// ControlPlaneConfig holds the control plane SSH configuration.
+// SaveControlPlaneConfig fills in SSHPort 22 and SSHUser "root" when they are
+// left at their zero values, and GetControlPlaneConfig returns the same
+// defaults when nothing has been stored yet.
+type ControlPlaneConfig struct {
+	Host       string `json:"host"`
+	SSHPort    int    `json:"sshPort"`
+	SSHUser    string `json:"sshUser"`
+	AuthMethod string `json:"authMethod"` // "password" or "privateKey"
+	// Password and PrivateKey are dropped from the JSON output when empty.
+	Password   string `json:"password,omitempty"`
+	PrivateKey string `json:"privateKey,omitempty"`
+}
+
+// InitScriptService handles initialization script operations.
+// It manages script groups and the control plane SSH configuration, both of
+// which it reads from and writes to ConfigMaps through k8sClient.
+type InitScriptService struct {
+	k8sClient *k8s.Client
+}
+
+// NewInitScriptService builds an InitScriptService that performs all of its
+// ConfigMap reads and writes through the given k8sClient.
+func NewInitScriptService(k8sClient *k8s.Client) *InitScriptService {
+	svc := new(InitScriptService)
+	svc.k8sClient = k8sClient
+	return svc
+}
+
+// GetAllScriptGroups returns every stored script group sorted by ascending
+// Order. Loading goes through getInitScriptsConfig, so the builtin defaults are
+// created on first use.
+//
+// The sort is stable: groups that share the same Order (possible because
+// CreateScriptGroup accepts a caller-supplied Order and ReorderScriptGroups
+// leaves unlisted groups untouched) keep their stored relative position, so
+// repeated calls return the same sequence.
+func (s *InitScriptService) GetAllScriptGroups(ctx context.Context) ([]ScriptGroup, error) {
+	logger.Debug("Getting all script groups")
+
+	config, err := s.getInitScriptsConfig(ctx)
+	if err != nil {
+		return nil, err
+	}
+
+	sort.SliceStable(config.Groups, func(i, j int) bool {
+		return config.Groups[i].Order < config.Groups[j].Order
+	})
+
+	return config.Groups, nil
+}
+
+// GetScriptGroup looks up the script group whose ID equals id and returns a
+// pointer to a copy of it. An error is returned when the configuration cannot
+// be loaded or no group has that ID.
+func (s *InitScriptService) GetScriptGroup(ctx context.Context, id string) (*ScriptGroup, error) {
+	logger.Debug("Getting script group", "id", id)
+
+	config, err := s.getInitScriptsConfig(ctx)
+	if err != nil {
+		return nil, err
+	}
+
+	for idx := range config.Groups {
+		if config.Groups[idx].ID != id {
+			continue
+		}
+		// Hand back a copy so the caller never aliases the loaded slice.
+		match := config.Groups[idx]
+		return &match, nil
+	}
+
+	return nil, fmt.Errorf("script group not found: %s", id)
+}
+
+// CreateScriptGroup appends group to the stored script groups.
+//
+// The passed group is modified in place: an empty ID becomes
+// "custom-<unix nanos>", an Order of 0 becomes one more than the highest
+// existing Order, and Builtin is always forced to false. An error is returned
+// when a group with the same ID already exists or the configuration cannot be
+// loaded or saved.
+func (s *InitScriptService) CreateScriptGroup(ctx context.Context, group *ScriptGroup) error {
+	logger.Info("Creating script group", "name", group.Name)
+
+	config, err := s.getInitScriptsConfig(ctx)
+	if err != nil {
+		return err
+	}
+
+	if group.ID == "" {
+		group.ID = fmt.Sprintf("custom-%d", time.Now().UnixNano())
+	}
+
+	// One pass: reject a duplicate ID and remember the highest Order seen.
+	highestOrder := 0
+	for idx := range config.Groups {
+		current := &config.Groups[idx]
+		if current.ID == group.ID {
+			return fmt.Errorf("script group with ID %s already exists", group.ID)
+		}
+		if current.Order > highestOrder {
+			highestOrder = current.Order
+		}
+	}
+
+	// An unset Order places the new group after every existing one.
+	if group.Order == 0 {
+		group.Order = highestOrder + 1
+	}
+
+	// Groups created through this path are never builtin.
+	group.Builtin = false
+	config.Groups = append(config.Groups, *group)
+
+	return s.saveInitScriptsConfig(ctx, config)
+}
+
+// UpdateScriptGroup replaces the stored group whose ID equals id with group.
+// The stored ID and Builtin flag win over whatever the caller supplied; both
+// are written back into group. An error is returned when no group has that ID.
+func (s *InitScriptService) UpdateScriptGroup(ctx context.Context, id string, group *ScriptGroup) error {
+	logger.Info("Updating script group", "id", id)
+
+	config, err := s.getInitScriptsConfig(ctx)
+	if err != nil {
+		return err
+	}
+
+	// Locate the first group carrying the requested ID.
+	target := -1
+	for idx := range config.Groups {
+		if config.Groups[idx].ID == id {
+			target = idx
+			break
+		}
+	}
+	if target < 0 {
+		return fmt.Errorf("script group not found: %s", id)
+	}
+
+	// Identity and builtin status are not editable.
+	group.ID = id
+	group.Builtin = config.Groups[target].Builtin
+	config.Groups[target] = *group
+
+	return s.saveInitScriptsConfig(ctx, config)
+}
+
+// DeleteScriptGroup removes the script group with the given id. Builtin groups
+// are protected: asking to delete one returns an error and changes nothing.
+// An error is also returned when no group has that ID.
+func (s *InitScriptService) DeleteScriptGroup(ctx context.Context, id string) error {
+	logger.Info("Deleting script group", "id", id)
+
+	config, err := s.getInitScriptsConfig(ctx)
+	if err != nil {
+		return err
+	}
+
+	remaining := make([]ScriptGroup, 0, len(config.Groups))
+	removed := 0
+	for idx := range config.Groups {
+		candidate := config.Groups[idx]
+		switch {
+		case candidate.ID != id:
+			remaining = append(remaining, candidate)
+		case candidate.Builtin:
+			return fmt.Errorf("cannot delete builtin script group: %s", id)
+		default:
+			removed++
+		}
+	}
+
+	if removed == 0 {
+		return fmt.Errorf("script group not found: %s", id)
+	}
+
+	config.Groups = remaining
+	return s.saveInitScriptsConfig(ctx, config)
+}
+
+// ToggleScriptGroup sets the Enabled flag of the script group with the given id
+// and saves the configuration. An error is returned when no group has that ID.
+func (s *InitScriptService) ToggleScriptGroup(ctx context.Context, id string, enabled bool) error {
+	logger.Info("Toggling script group", "id", id, "enabled", enabled)
+
+	config, err := s.getInitScriptsConfig(ctx)
+	if err != nil {
+		return err
+	}
+
+	// Locate the first group carrying the requested ID.
+	target := -1
+	for idx := range config.Groups {
+		if config.Groups[idx].ID == id {
+			target = idx
+			break
+		}
+	}
+	if target < 0 {
+		return fmt.Errorf("script group not found: %s", id)
+	}
+
+	config.Groups[target].Enabled = enabled
+	return s.saveInitScriptsConfig(ctx, config)
+}
+
+// ReorderScriptGroups assigns Order values from the position of each ID in ids
+// (first ID gets 1, second gets 2, ...) and saves the configuration. IDs that
+// match no stored group are ignored, and groups not mentioned in ids keep
+// their current Order.
+func (s *InitScriptService) ReorderScriptGroups(ctx context.Context, ids []string) error {
+	logger.Info("Reordering script groups", "ids", ids)
+
+	config, err := s.getInitScriptsConfig(ctx)
+	if err != nil {
+		return err
+	}
+
+	// Index the stored groups by ID so each requested ID is resolved directly.
+	indexByID := make(map[string]int, len(config.Groups))
+	for idx := range config.Groups {
+		indexByID[config.Groups[idx].ID] = idx
+	}
+
+	for position, id := range ids {
+		idx, known := indexByID[id]
+		if !known {
+			continue
+		}
+		config.Groups[idx].Order = position + 1
+	}
+
+	return s.saveInitScriptsConfig(ctx, config)
+}
+
+// GetMatchingScript picks the script in group that best fits platform, or nil
+// when none applies.
+//
+// Preference, from most to least specific:
+//  1. OS and Arch both equal the platform's values
+//  2. OS equal, Arch "*"
+//  3. OS "*", Arch equal
+//  4. OS "*", Arch "*"
+//
+// The first exact match wins immediately; within each of the other tiers the
+// last matching script in the slice is the one returned.
+func (s *InitScriptService) GetMatchingScript(group *ScriptGroup, platform NodePlatform) *Script {
+	// Fallback tiers, indexed from most to least specific.
+	const (
+		tierOSOnly = iota
+		tierArchOnly
+		tierWildcard
+		tierCount
+	)
+	var fallback [tierCount]*Script
+
+	for idx := range group.Scripts {
+		candidate := &group.Scripts[idx]
+		sameOS := candidate.OS == platform.OS
+		sameArch := candidate.Arch == platform.Arch
+		anyOS := candidate.OS == "*"
+		anyArch := candidate.Arch == "*"
+
+		switch {
+		case sameOS && sameArch:
+			// Nothing can beat an exact match, so stop looking.
+			return candidate
+		case sameOS && anyArch:
+			fallback[tierOSOnly] = candidate
+		case anyOS && sameArch:
+			fallback[tierArchOnly] = candidate
+		case anyOS && anyArch:
+			fallback[tierWildcard] = candidate
+		}
+	}
+
+	for _, candidate := range fallback {
+		if candidate != nil {
+			return candidate
+		}
+	}
+	return nil
+}
+
+// GetScriptsForPhase returns, in GetAllScriptGroups order, every enabled group
+// of the given phase paired with the script GetMatchingScript selects for
+// platform. Groups with no applicable script are left out.
+func (s *InitScriptService) GetScriptsForPhase(ctx context.Context, phase ScriptPhase, platform NodePlatform) ([]struct {
+	Group  ScriptGroup
+	Script Script
+}, error) {
+	// Local alias for the anonymous element type of the result slice.
+	type phaseScript = struct {
+		Group  ScriptGroup
+		Script Script
+	}
+
+	groups, err := s.GetAllScriptGroups(ctx)
+	if err != nil {
+		return nil, err
+	}
+
+	var selected []phaseScript
+	for idx := range groups {
+		candidate := groups[idx]
+		if !candidate.Enabled || candidate.Phase != phase {
+			continue
+		}
+
+		if picked := s.GetMatchingScript(&candidate, platform); picked != nil {
+			selected = append(selected, phaseScript{Group: candidate, Script: *picked})
+		}
+	}
+
+	return selected, nil
+}
+
+// GetControlPlaneConfig returns the control plane SSH configuration
+func (s *InitScriptService) GetControlPlaneConfig(ctx context.Context) (*ControlPlaneConfig, error) {
+	logger.Debug("Getting control plane config")
+
+	cm, err := s.k8sClient.GetConfigMap(ctx, BisonNamespace, ControlPlaneConfigConfigMap)
+	if err != nil {
+		if errors.IsNotFound(err) {
+			return &ControlPlaneConfig{
+				SSHPort: 22,
+				SSHUser: "root",
+			}, nil
+		}
+		return nil, fmt.Errorf("failed to get control plane config: %w", err)
+	}
+
+	data, ok := cm.Data["config"]
+	if !ok {
+		return &ControlPlaneConfig{
+			SSHPort: 22,
+			SSHUser: "root",
+		}, nil
+	}
+
+	var config ControlPlaneConfig
+	if err := json.Unmarshal([]byte(data), &config); err != nil {
+		return nil, fmt.Errorf("failed to parse control plane config: %w", err)
+	}
+
+	return &config, nil
+}
+
+// SaveControlPlaneConfig writes config as JSON into the "config" key of the
+// ControlPlaneConfigConfigMap ConfigMap, creating the ConfigMap when it does
+// not exist yet. A zero SSHPort becomes 22 and an empty SSHUser becomes "root";
+// these defaults are written back into the caller's config.
+//
+// NOTE(review): Password and PrivateKey are part of the marshalled payload, so
+// they end up in a ConfigMap rather than a Secret — confirm this is intended.
+func (s *InitScriptService) SaveControlPlaneConfig(ctx context.Context, config *ControlPlaneConfig) error {
+	logger.Info("Saving control plane config", "host", config.Host)
+
+	if config.SSHPort == 0 {
+		config.SSHPort = 22
+	}
+	if config.SSHUser == "" {
+		config.SSHUser = "root"
+	}
+
+	payload, err := json.Marshal(config)
+	if err != nil {
+		return fmt.Errorf("failed to marshal control plane config: %w", err)
+	}
+
+	existing, err := s.k8sClient.GetConfigMap(ctx, BisonNamespace, ControlPlaneConfigConfigMap)
+	if err == nil {
+		// ConfigMap already present: overwrite only the "config" key.
+		if existing.Data == nil {
+			existing.Data = make(map[string]string)
+		}
+		existing.Data["config"] = string(payload)
+		return s.k8sClient.UpdateConfigMap(ctx, BisonNamespace, existing)
+	}
+	if !errors.IsNotFound(err) {
+		return fmt.Errorf("failed to get control plane config: %w", err)
+	}
+
+	// First save: create the ConfigMap from scratch.
+	created := &corev1.ConfigMap{
+		ObjectMeta: metav1.ObjectMeta{
+			Name:      ControlPlaneConfigConfigMap,
+			Namespace: BisonNamespace,
+		},
+		Data: map[string]string{
+			"config": string(payload),
+		},
+	}
+	return s.k8sClient.CreateConfigMap(ctx, BisonNamespace, created)
+}
+
+// SaveAllScriptGroups overwrites the stored script groups with groups in a
+// single write (used by config import). The groups are stored as given; no
+// per-group validation or Builtin adjustment is applied here.
+func (s *InitScriptService) SaveAllScriptGroups(ctx context.Context, groups []ScriptGroup) error {
+	logger.Info("Saving all script groups", "count", len(groups))
+
+	replacement := InitScriptsConfig{Groups: groups}
+	return s.saveInitScriptsConfig(ctx, &replacement)
+}
+
+// getInitScriptsConfig returns the init scripts configuration, initializing with defaults if not found
+func (s *InitScriptService) getInitScriptsConfig(ctx context.Context) (*InitScriptsConfig, error) {
+	cm, err := s.k8sClient.GetConfigMap(ctx, BisonNamespace, InitScriptsConfigMap)
+	if err != nil {
+		if errors.IsNotFound(err) {
+			// Initialize with default builtin scripts
+			config := s.getDefaultInitScriptsConfig()
+			if err := s.saveInitScriptsConfig(ctx, config); err != nil {
+				return nil, err
+			}
+			return config, nil
+		}
+		return nil, fmt.Errorf("failed to get init scripts config: %w", err)
+	}
+
+	data, ok := cm.Data["config"]
+	if !ok {
+		config := s.getDefaultInitScriptsConfig()
+		if err := s.saveInitScriptsConfig(ctx, config); err != nil {
+			return nil, err
+		}
+		return config, nil
+	}
+
+	var config InitScriptsConfig
+	if err := json.Unmarshal([]byte(data), &config); err != nil {
+		return nil, fmt.Errorf("failed to parse init scripts config: %w", err)
+	}
+
+	return &config, nil
+}
+
+// saveInitScriptsConfig writes config as JSON into the "config" key of the
+// InitScriptsConfigMap ConfigMap, creating the ConfigMap when it does not
+// exist yet and updating it otherwise.
+func (s *InitScriptService) saveInitScriptsConfig(ctx context.Context, config *InitScriptsConfig) error {
+	payload, err := json.Marshal(config)
+	if err != nil {
+		return fmt.Errorf("failed to marshal init scripts config: %w", err)
+	}
+
+	existing, err := s.k8sClient.GetConfigMap(ctx, BisonNamespace, InitScriptsConfigMap)
+	if err == nil {
+		// ConfigMap already present: overwrite only the "config" key.
+		if existing.Data == nil {
+			existing.Data = make(map[string]string)
+		}
+		existing.Data["config"] = string(payload)
+		return s.k8sClient.UpdateConfigMap(ctx, BisonNamespace, existing)
+	}
+	if !errors.IsNotFound(err) {
+		return fmt.Errorf("failed to get init scripts config: %w", err)
+	}
+
+	// First save: create the ConfigMap from scratch.
+	created := &corev1.ConfigMap{
+		ObjectMeta: metav1.ObjectMeta{
+			Name:      InitScriptsConfigMap,
+			Namespace: BisonNamespace,
+		},
+		Data: map[string]string{
+			"config": string(payload),
+		},
+	}
+	return s.k8sClient.CreateConfigMap(ctx, BisonNamespace, created)
+}
+
+// getDefaultInitScriptsConfig returns the default builtin script groups
+func (s *InitScriptService) getDefaultInitScriptsConfig() *InitScriptsConfig {
+	return &InitScriptsConfig{
+		Groups: []ScriptGroup{
+			{
+				ID:          "disable-swap",
+				Name:        "禁用 Swap",
+				Description: "禁用 Swap 分区（Kubernetes 要求）",
+				Phase:       PhasePreJoin,
+				Enabled:     true,
+				Order:       1,
+				Builtin:     true,
+				Scripts: []Script{
+					{
+						ID:   "disable-swap-universal",
+						OS:   "*",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Disabling swap..."
+swapoff -a || true
+sed -i '/swap/d' /etc/fstab || true
+echo "Swap disabled successfully"
+`,
+					},
+				},
+			},
+			{
+				ID:          "configure-kernel",
+				Name:        "配置内核参数",
+				Description: "配置 Kubernetes 所需的内核参数",
+				Phase:       PhasePreJoin,
+				Enabled:     true,
+				Order:       2,
+				Builtin:     true,
+				Scripts: []Script{
+					{
+						ID:   "configure-kernel-universal",
+						OS:   "*",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Configuring kernel parameters..."
+
+# Load required modules
+modprobe br_netfilter || true
+modprobe overlay || true
+
+# Ensure modules load on boot
+cat > /etc/modules-load.d/k8s.conf << EOF
+br_netfilter
+overlay
+EOF
+
+# Configure sysctl
+cat > /etc/sysctl.d/k8s.conf << EOF
+net.bridge.bridge-nf-call-iptables = 1
+net.bridge.bridge-nf-call-ip6tables = 1
+net.ipv4.ip_forward = 1
+EOF
+
+sysctl --system
+echo "Kernel parameters configured successfully"
+`,
+					},
+				},
+			},
+			{
+				ID:          "disable-firewall",
+				Name:        "禁用防火墙",
+				Description: "禁用节点防火墙（firewalld/ufw）",
+				Phase:       PhasePreJoin,
+				Enabled:     false,
+				Order:       3,
+				Builtin:     true,
+				Scripts: []Script{
+					{
+						ID:   "disable-firewall-debian",
+						OS:   "ubuntu",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Disabling firewall..."
+if command -v ufw &> /dev/null; then
+    ufw disable || true
+fi
+echo "Firewall disabled successfully"
+`,
+					},
+					{
+						ID:   "disable-firewall-debian2",
+						OS:   "debian",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Disabling firewall..."
+if command -v ufw &> /dev/null; then
+    ufw disable || true
+fi
+echo "Firewall disabled successfully"
+`,
+					},
+					{
+						ID:   "disable-firewall-rhel",
+						OS:   "centos",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Disabling firewall..."
+if systemctl is-active --quiet firewalld 2>/dev/null; then
+    systemctl stop firewalld
+    systemctl disable firewalld
+fi
+echo "Firewall disabled successfully"
+`,
+					},
+					{
+						ID:   "disable-firewall-rhel2",
+						OS:   "rhel",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Disabling firewall..."
+if systemctl is-active --quiet firewalld 2>/dev/null; then
+    systemctl stop firewalld
+    systemctl disable firewalld
+fi
+echo "Firewall disabled successfully"
+`,
+					},
+					{
+						ID:   "disable-firewall-openeuler",
+						OS:   "openEuler",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Disabling firewall..."
+if systemctl is-active --quiet firewalld 2>/dev/null; then
+    systemctl stop firewalld
+    systemctl disable firewalld
+fi
+echo "Firewall disabled successfully"
+`,
+					},
+				},
+			},
+			{
+				ID:          "configure-selinux",
+				Name:        "配置 SELinux",
+				Description: "设置 SELinux 为 Permissive 模式（仅 RHEL/CentOS/openEuler）",
+				Phase:       PhasePreJoin,
+				Enabled:     false,
+				Order:       4,
+				Builtin:     true,
+				Scripts: []Script{
+					{
+						ID:   "configure-selinux-centos",
+						OS:   "centos",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Configuring SELinux to permissive mode..."
+if command -v setenforce &> /dev/null; then
+    setenforce 0 || true
+    if [ -f /etc/selinux/config ]; then
+        sed -i 's/^SELINUX=enforcing$/SELINUX=permissive/' /etc/selinux/config
+    fi
+fi
+echo "SELinux configured successfully"
+`,
+					},
+					{
+						ID:   "configure-selinux-rhel",
+						OS:   "rhel",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Configuring SELinux to permissive mode..."
+if command -v setenforce &> /dev/null; then
+    setenforce 0 || true
+    if [ -f /etc/selinux/config ]; then
+        sed -i 's/^SELINUX=enforcing$/SELINUX=permissive/' /etc/selinux/config
+    fi
+fi
+echo "SELinux configured successfully"
+`,
+					},
+					{
+						ID:   "configure-selinux-openeuler",
+						OS:   "openEuler",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Configuring SELinux to permissive mode..."
+if command -v setenforce &> /dev/null; then
+    setenforce 0 || true
+    if [ -f /etc/selinux/config ]; then
+        sed -i 's/^SELINUX=enforcing$/SELINUX=permissive/' /etc/selinux/config
+    fi
+fi
+echo "SELinux configured successfully"
+`,
+					},
+				},
+			},
+			{
+				ID:          "configure-timezone",
+				Name:        "配置时区和 NTP",
+				Description: "设置系统时区并启用 NTP 时间同步",
+				Phase:       PhasePreJoin,
+				Enabled:     false,
+				Order:       5,
+				Builtin:     true,
+				Scripts: []Script{
+					{
+						ID:   "configure-timezone-universal",
+						OS:   "*",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+TIMEZONE="${TIMEZONE:-Asia/Shanghai}"
+
+echo "Configuring timezone to $TIMEZONE..."
+timedatectl set-timezone $TIMEZONE || true
+
+echo "Enabling and starting NTP service..."
+if systemctl list-unit-files | grep -q chronyd; then
+    systemctl enable chronyd || true
+    systemctl start chronyd || true
+elif systemctl list-unit-files | grep -q ntpd; then
+    systemctl enable ntpd || true
+    systemctl start ntpd || true
+elif systemctl list-unit-files | grep -q systemd-timesyncd; then
+    systemctl enable systemd-timesyncd || true
+    systemctl start systemd-timesyncd || true
+fi
+
+echo "Timezone and NTP configured successfully"
+`,
+					},
+				},
+			},
+			{
+				ID:          "configure-registry",
+				Name:        "配置私有镜像仓库",
+				Description: "配置 containerd 使用私有镜像仓库（支持 HTTP）",
+				Phase:       PhasePreJoin,
+				Enabled:     false,
+				Order:       6,
+				Builtin:     true,
+				Scripts: []Script{
+					{
+						ID:   "configure-registry-ubuntu",
+						OS:   "ubuntu",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+REGISTRY_URL="${REGISTRY_URL:-registry.example.com:5000}"
+
+echo "Configuring private registry: $REGISTRY_URL"
+
+# Create registry config directory
+mkdir -p /etc/containerd/certs.d/${REGISTRY_URL}
+
+# Configure registry mirror
+cat > /etc/containerd/certs.d/${REGISTRY_URL}/hosts.toml << EOF
+server = "http://${REGISTRY_URL}"
+
+[host."http://${REGISTRY_URL}"]
+  capabilities = ["pull", "resolve", "push"]
+  skip_verify = true
+EOF
+
+# Restart containerd
+systemctl restart containerd
+echo "Private registry configured successfully"
+`,
+					},
+					{
+						ID:   "configure-registry-debian",
+						OS:   "debian",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+REGISTRY_URL="${REGISTRY_URL:-registry.example.com:5000}"
+
+echo "Configuring private registry: $REGISTRY_URL"
+
+# Create registry config directory
+mkdir -p /etc/containerd/certs.d/${REGISTRY_URL}
+
+# Configure registry mirror
+cat > /etc/containerd/certs.d/${REGISTRY_URL}/hosts.toml << EOF
+server = "http://${REGISTRY_URL}"
+
+[host."http://${REGISTRY_URL}"]
+  capabilities = ["pull", "resolve", "push"]
+  skip_verify = true
+EOF
+
+# Restart containerd
+systemctl restart containerd
+echo "Private registry configured successfully"
+`,
+					},
+					{
+						ID:   "configure-registry-centos",
+						OS:   "centos",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+REGISTRY_URL="${REGISTRY_URL:-registry.example.com:5000}"
+
+echo "Configuring private registry: $REGISTRY_URL"
+
+# Create registry config directory
+mkdir -p /etc/containerd/certs.d/${REGISTRY_URL}
+
+# Configure registry mirror
+cat > /etc/containerd/certs.d/${REGISTRY_URL}/hosts.toml << EOF
+server = "http://${REGISTRY_URL}"
+
+[host."http://${REGISTRY_URL}"]
+  capabilities = ["pull", "resolve", "push"]
+  skip_verify = true
+EOF
+
+# Restart containerd
+systemctl restart containerd
+echo "Private registry configured successfully"
+`,
+					},
+					{
+						ID:   "configure-registry-rhel",
+						OS:   "rhel",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+REGISTRY_URL="${REGISTRY_URL:-registry.example.com:5000}"
+
+echo "Configuring private registry: $REGISTRY_URL"
+
+# Create registry config directory
+mkdir -p /etc/containerd/certs.d/${REGISTRY_URL}
+
+# Configure registry mirror
+cat > /etc/containerd/certs.d/${REGISTRY_URL}/hosts.toml << EOF
+server = "http://${REGISTRY_URL}"
+
+[host."http://${REGISTRY_URL}"]
+  capabilities = ["pull", "resolve", "push"]
+  skip_verify = true
+EOF
+
+# Restart containerd
+systemctl restart containerd
+echo "Private registry configured successfully"
+`,
+					},
+					{
+						ID:   "configure-registry-openeuler",
+						OS:   "openEuler",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+REGISTRY_URL="${REGISTRY_URL:-registry.example.com:5000}"
+
+echo "Configuring private registry: $REGISTRY_URL"
+
+# Create registry config directory
+mkdir -p /etc/containerd/certs.d/${REGISTRY_URL}
+
+# Configure registry mirror
+cat > /etc/containerd/certs.d/${REGISTRY_URL}/hosts.toml << EOF
+server = "http://${REGISTRY_URL}"
+
+[host."http://${REGISTRY_URL}"]
+  capabilities = ["pull", "resolve", "push"]
+  skip_verify = true
+EOF
+
+# Restart containerd
+systemctl restart containerd
+echo "Private registry configured successfully"
+`,
+					},
+				},
+			},
+			{
+				ID:          "add-node-labels",
+				Name:        "添加节点标签",
+				Description: "为节点添加 Worker 角色标签",
+				Phase:       PhasePostJoin,
+				Enabled:     false,
+				Order:       7,
+				Builtin:     true,
+				Scripts: []Script{
+					{
+						ID:   "add-node-labels-universal",
+						OS:   "*",
+						Arch: "*",
+						Content: `#!/bin/bash
+set -e
+echo "Adding worker label to node ${NODE_NAME}..."
+
+# Wait for node to be registered
+sleep 5
+
+# Add worker role label
+kubectl label node ${NODE_NAME} node-role.kubernetes.io/worker= --overwrite || true
+
+echo "Node label added successfully"
+`,
+					},
+				},
+			},
+		},
+	}
+}
+
+// ReplaceVariables substitutes every "${KEY}" placeholder in content with
+// vars[KEY] and returns the result. Placeholders whose key is not in vars, and
+// shell forms such as "${KEY:-default}", are left untouched.
+//
+// All substitutions happen in a single pass over content, so text inserted for
+// one variable is never scanned again for other placeholders. The previous
+// sequential ReplaceAll loop ran in map-iteration order, which made the result
+// differ from run to run whenever a value itself contained "${OTHER}". Keys
+// are sorted before building the replacer so the outcome is fully
+// deterministic.
+func ReplaceVariables(content string, vars map[string]string) string {
+	if content == "" || len(vars) == 0 {
+		return content
+	}
+
+	keys := make([]string, 0, len(vars))
+	for key := range vars {
+		keys = append(keys, key)
+	}
+	sort.Strings(keys)
+
+	// strings.NewReplacer takes alternating old/new arguments.
+	pairs := make([]string, 0, 2*len(keys))
+	for _, key := range keys {
+		pairs = append(pairs, "${"+key+"}", vars[key])
+	}
+
+	return strings.NewReplacer(pairs...).Replace(content)
+}
diff --git a/api-server/internal/service/main_test.go b/api-server/internal/service/main_test.go
new file mode 100644
index 0000000..c0d86b0
--- /dev/null
+++ b/api-server/internal/service/main_test.go
@@ -0,0 +1,15 @@
+package service
+
+import (
+	"os"
+	"testing"
+
+	"github.com/bison/api-server/pkg/logger"
+)
+
+// TestMain runs before any test in the package. It calls logger.Init so that
+// service code which logs during tests does not hit a nil SugaredLogger, then
+// exits with the status code reported by the test run.
+func TestMain(m *testing.M) {
+	logger.Init(false)
+
+	exitCode := m.Run()
+	os.Exit(exitCode)
+}
diff --git a/api-server/internal/service/onboarding_service.go b/api-server/internal/service/onboarding_service.go
new file mode 100644
index 0000000..7efc8a1
--- /dev/null
+++ b/api-server/internal/service/onboarding_service.go
@@ -0,0 +1,760 @@
+package service
+
+import (
+	"context"
+	"encoding/json"
+	"fmt"
+	"sync"
+	"time"
+
+	corev1 "k8s.io/api/core/v1"
+	"k8s.io/apimachinery/pkg/api/errors"
+	metav1 "k8s.io/apimachinery/pkg/apis/meta/v1"
+
+	"github.com/bison/api-server/internal/k8s"
+	"github.com/bison/api-server/internal/ssh"
+	"github.com/bison/api-server/pkg/logger"
+)
+
+// Ensure metav1 is used: the blank assignment keeps the import referenced so
+// the file compiles even when no other code in it touches the package.
+var _ = metav1.Now
+
+const (
+	// OnboardingJobsConfigMap is the ConfigMap name reserved for onboarding job
+	// records (presumably the store behind getJobsMap/saveJob — confirm there).
+	OnboardingJobsConfigMap = "bison-onboarding-jobs"
+)
+
+// OnboardingJobStatus represents the status of an onboarding job.
+// Pending and Running are the states in which a job can still be cancelled and
+// in which it blocks a second job for the same node IP.
+type OnboardingJobStatus string
+
+const (
+	// JobStatusPending is the initial state set by StartOnboarding.
+	JobStatusPending   OnboardingJobStatus = "pending"
+	// JobStatusRunning is set when executeOnboarding begins working.
+	JobStatusRunning   OnboardingJobStatus = "running"
+	// JobStatusSuccess is set after all onboarding steps completed.
+	JobStatusSuccess   OnboardingJobStatus = "success"
+	JobStatusFailed    OnboardingJobStatus = "failed"
+	// JobStatusCancelled is set by CancelJob.
+	JobStatusCancelled OnboardingJobStatus = "cancelled"
+)
+
+// SubStepStatus represents the status of a sub-step.
+// It is the value type of SubStep.Status.
+type SubStepStatus string
+
+// Possible sub-step states.
+const (
+	SubStepPending SubStepStatus = "pending"
+	SubStepRunning SubStepStatus = "running"
+	SubStepSuccess SubStepStatus = "success"
+	SubStepFailed  SubStepStatus = "failed"
+	SubStepSkipped SubStepStatus = "skipped"
+)
+
+// SubStep represents a sub-step within a main step.
+// It is reported to clients as part of OnboardingJob.SubSteps.
+type SubStep struct {
+	Name   string        `json:"name"`
+	Status SubStepStatus `json:"status"`
+	// Error is omitted from the JSON output when empty.
+	Error  string        `json:"error,omitempty"`
+}
+
+// OnboardingJob represents a node onboarding job.
+// It is the record that is JSON-encoded for storage and returned to callers of
+// StartOnboarding, GetJob and ListJobs.
+type OnboardingJob struct {
+	// ID has the form "job-<unix nanos>" for jobs created by StartOnboarding.
+	ID           string              `json:"id"`
+	NodeIP       string              `json:"nodeIP"`
+	NodeName     string              `json:"nodeName,omitempty"`
+	Platform     NodePlatform        `json:"platform"`
+	Status       OnboardingJobStatus `json:"status"`
+	// CurrentStep starts at 0; TotalSteps is 9 for jobs created by StartOnboarding.
+	CurrentStep  int                 `json:"currentStep"`
+	TotalSteps   int                 `json:"totalSteps"`
+	// StepMessage is a human-readable description of what the job is doing.
+	StepMessage  string              `json:"stepMessage"`
+	SubSteps     []SubStep           `json:"subSteps,omitempty"`
+	ErrorMessage string              `json:"errorMessage,omitempty"`
+	CreatedAt    time.Time           `json:"createdAt"`
+	UpdatedAt    time.Time           `json:"updatedAt"`
+	// CompletedAt stays nil until the job is cancelled or finishes successfully.
+	CompletedAt  *time.Time          `json:"completedAt,omitempty"`
+}
+
+// OnboardingRequest represents a request to onboard a new node.
+// The `binding` tags are validation rules for the request decoder (presumably
+// gin's binding package — confirm at the handler).
+type OnboardingRequest struct {
+	NodeIP      string `json:"nodeIP" binding:"required"`
+	// SSHPort defaults to 22 in StartOnboarding when left at 0.
+	SSHPort     int    `json:"sshPort"`
+	SSHUsername string `json:"sshUsername" binding:"required"`
+	// AuthMethod selects which of Password / PrivateKey must be non-empty.
+	AuthMethod  string `json:"authMethod" binding:"required,oneof=password privateKey"`
+	Password    string `json:"password"`
+	PrivateKey  string `json:"privateKey"`
+}
+
+// OnboardingService handles node onboarding operations.
+// Each job runs in its own goroutine started by StartOnboarding.
+type OnboardingService struct {
+	k8sClient     *k8s.Client
+	nodeSvc       *NodeService
+	initScriptSvc *InitScriptService
+	// runningJobs maps a job ID to the cancel function of that job's context.
+	runningJobs   map[string]context.CancelFunc
+	// runningJobsMu guards runningJobs.
+	runningJobsMu sync.RWMutex
+}
+
+// NewOnboardingService wires an OnboardingService to its collaborators and
+// starts it with an empty registry of running jobs.
+func NewOnboardingService(k8sClient *k8s.Client, nodeSvc *NodeService, initScriptSvc *InitScriptService) *OnboardingService {
+	svc := new(OnboardingService)
+	svc.k8sClient = k8sClient
+	svc.nodeSvc = nodeSvc
+	svc.initScriptSvc = initScriptSvc
+	svc.runningJobs = map[string]context.CancelFunc{}
+	return svc
+}
+
+// StartOnboarding validates req, records a new pending job and launches the
+// onboarding work in a background goroutine.
+//
+// A zero req.SSHPort is replaced by 22 (written back into req). An error is
+// returned when the credential matching req.AuthMethod is empty, when a pending
+// or running job already exists for the same node IP, or when the job cannot
+// be listed or saved.
+//
+// The returned job is a snapshot taken before the goroutine starts. The
+// goroutine keeps mutating its own job record, so handing out that pointer
+// would let the caller read it concurrently with those writes. The goroutine
+// likewise gets its own copy of the request. Use GetJob to observe progress.
+func (s *OnboardingService) StartOnboarding(ctx context.Context, req *OnboardingRequest) (*OnboardingJob, error) {
+	logger.Info("Starting node onboarding", "nodeIP", req.NodeIP)
+
+	// Set defaults
+	if req.SSHPort == 0 {
+		req.SSHPort = 22
+	}
+
+	// Validate authentication
+	if req.AuthMethod == "password" && req.Password == "" {
+		return nil, fmt.Errorf("password is required for password authentication")
+	}
+	if req.AuthMethod == "privateKey" && req.PrivateKey == "" {
+		return nil, fmt.Errorf("private key is required for private key authentication")
+	}
+
+	// Check if there's already a running job for this IP
+	jobs, err := s.ListJobs(ctx)
+	if err != nil {
+		return nil, err
+	}
+	for _, job := range jobs {
+		if job.NodeIP == req.NodeIP && (job.Status == JobStatusPending || job.Status == JobStatusRunning) {
+			return nil, fmt.Errorf("there is already a running onboarding job for this IP: %s", job.ID)
+		}
+	}
+
+	// Create job; one timestamp serves as ID seed, CreatedAt and UpdatedAt.
+	now := time.Now()
+	job := &OnboardingJob{
+		ID:          fmt.Sprintf("job-%d", now.UnixNano()),
+		NodeIP:      req.NodeIP,
+		Status:      JobStatusPending,
+		CurrentStep: 0,
+		TotalSteps:  9,
+		StepMessage: "Job created, waiting to start",
+		CreatedAt:   now,
+		UpdatedAt:   now,
+	}
+
+	// Save job
+	if err := s.saveJob(ctx, job); err != nil {
+		return nil, err
+	}
+
+	// Detach what the caller sees from what the goroutine works on.
+	snapshot := *job
+	reqCopy := *req
+
+	// Start async execution. The job must outlive the request, hence a fresh
+	// background context instead of ctx.
+	jobCtx, cancel := context.WithCancel(context.Background())
+	s.runningJobsMu.Lock()
+	s.runningJobs[job.ID] = cancel
+	s.runningJobsMu.Unlock()
+
+	go s.executeOnboarding(jobCtx, job, &reqCopy)
+
+	return &snapshot, nil
+}
+
+// GetJob returns a specific job by ID
+func (s *OnboardingService) GetJob(ctx context.Context, jobID string) (*OnboardingJob, error) {
+	jobs, err := s.getJobsMap(ctx)
+	if err != nil {
+		return nil, err
+	}
+
+	jobData, ok := jobs[jobID]
+	if !ok {
+		return nil, fmt.Errorf("job not found: %s", jobID)
+	}
+
+	var job OnboardingJob
+	if err := json.Unmarshal([]byte(jobData), &job); err != nil {
+		return nil, fmt.Errorf("failed to parse job data: %w", err)
+	}
+
+	return &job, nil
+}
+
+// ListJobs returns all onboarding jobs
+func (s *OnboardingService) ListJobs(ctx context.Context) ([]*OnboardingJob, error) {
+	jobs, err := s.getJobsMap(ctx)
+	if err != nil {
+		return nil, err
+	}
+
+	result := make([]*OnboardingJob, 0, len(jobs))
+	for _, jobData := range jobs {
+		var job OnboardingJob
+		if err := json.Unmarshal([]byte(jobData), &job); err != nil {
+			continue
+		}
+		result = append(result, &job)
+	}
+
+	return result, nil
+}
+
+// CancelJob stops a pending or running job: it cancels the job's context if
+// the job is tracked in this process, then stores the job as cancelled with a
+// completion time. Jobs in any other state are rejected with an error.
+func (s *OnboardingService) CancelJob(ctx context.Context, jobID string) error {
+	logger.Info("Cancelling onboarding job", "jobID", jobID)
+
+	job, err := s.GetJob(ctx, jobID)
+	if err != nil {
+		return err
+	}
+
+	switch job.Status {
+	case JobStatusPending, JobStatusRunning:
+		// Still cancellable.
+	default:
+		return fmt.Errorf("job is not running: %s", job.Status)
+	}
+
+	// Signal the worker goroutine, if this process owns one for the job.
+	s.runningJobsMu.Lock()
+	cancel, tracked := s.runningJobs[jobID]
+	if tracked {
+		cancel()
+		delete(s.runningJobs, jobID)
+	}
+	s.runningJobsMu.Unlock()
+
+	// Record the cancellation.
+	job.Status = JobStatusCancelled
+	job.StepMessage = "Job cancelled by user"
+	job.UpdatedAt = time.Now()
+	finishedAt := time.Now()
+	job.CompletedAt = &finishedAt
+
+	return s.saveJob(ctx, job)
+}
+
+// executeOnboarding runs the nine onboarding steps for job in order, stopping
+// at the first failure. It is meant to run in its own goroutine (see
+// StartOnboarding) and reports its outcome only through the stored job record.
+//
+// On exit the job is removed from runningJobs and its cancel function is
+// called, so the context created for the job is always released — previously
+// it was only released when the user cancelled the job.
+//
+// When a step fails because ctx was cancelled, the failure is not passed to
+// failJob. ctx derives from context.Background, so it can only be cancelled
+// through CancelJob, which stores the "cancelled" state itself.
+// NOTE(review): failJob is defined outside this excerpt; this assumes it would
+// otherwise overwrite the cancelled status — confirm.
+func (s *OnboardingService) executeOnboarding(ctx context.Context, job *OnboardingJob, req *OnboardingRequest) {
+	defer func() {
+		s.runningJobsMu.Lock()
+		if cancel, ok := s.runningJobs[job.ID]; ok {
+			cancel() // release the job context; calling it more than once is safe
+			delete(s.runningJobs, job.ID)
+		}
+		s.runningJobsMu.Unlock()
+	}()
+
+	// persist stores the job record and logs, rather than drops, a failure.
+	persist := func() {
+		if err := s.saveJob(context.Background(), job); err != nil {
+			logger.Info("Failed to persist onboarding job", "jobID", job.ID, "error", err.Error())
+		}
+	}
+
+	// fail records a step failure unless the job was cancelled by the user.
+	fail := func(err error) {
+		if ctx.Err() != nil {
+			logger.Info("Onboarding job stopped after cancellation", "jobID", job.ID)
+			return
+		}
+		s.failJob(job, err)
+	}
+
+	// Update job status to running
+	job.Status = JobStatusRunning
+	job.UpdatedAt = time.Now()
+	persist()
+
+	// Create SSH executor for target node
+	sshConfig := &ssh.Config{
+		Host:       req.NodeIP,
+		Port:       req.SSHPort,
+		Username:   req.SSHUsername,
+		AuthMethod: ssh.AuthMethod(req.AuthMethod),
+		Password:   req.Password,
+		PrivateKey: req.PrivateKey,
+		Timeout:    30 * time.Second,
+	}
+	executor := ssh.NewExecutor(sshConfig)
+	defer executor.Close()
+
+	// Step 1: Connection test
+	if err := s.stepConnectionTest(ctx, job, executor); err != nil {
+		fail(err)
+		return
+	}
+
+	// Step 2: Platform detection
+	if err := s.stepPlatformDetection(ctx, job, executor); err != nil {
+		fail(err)
+		return
+	}
+
+	// Step 3: Environment check
+	if err := s.stepEnvironmentCheck(ctx, job, executor); err != nil {
+		fail(err)
+		return
+	}
+
+	// Step 4: Pre-join scripts
+	if err := s.stepPreJoinScripts(ctx, job, executor); err != nil {
+		fail(err)
+		return
+	}
+
+	// Step 5: Get join token
+	joinCommand, err := s.stepGetJoinToken(ctx, job)
+	if err != nil {
+		fail(err)
+		return
+	}
+
+	// Step 6: Execute kubeadm join
+	if err := s.stepKubeadmJoin(ctx, job, executor, joinCommand); err != nil {
+		fail(err)
+		return
+	}
+
+	// Step 7: Post-join scripts
+	if err := s.stepPostJoinScripts(ctx, job, executor); err != nil {
+		fail(err)
+		return
+	}
+
+	// Step 8: Wait for node ready
+	if err := s.stepWaitForNodeReady(ctx, job); err != nil {
+		fail(err)
+		return
+	}
+
+	// Step 9: Enable node
+	if err := s.stepEnableNode(ctx, job); err != nil {
+		fail(err)
+		return
+	}
+
+	// Mark job as successful
+	now := time.Now()
+	job.Status = JobStatusSuccess
+	job.StepMessage = "Node onboarding completed successfully"
+	job.UpdatedAt = now
+	job.CompletedAt = &now
+	persist()
+
+	logger.Info("Node onboarding completed successfully", "nodeIP", job.NodeIP, "nodeName", job.NodeName)
+}
+
+// stepConnectionTest is onboarding step 1: it persists the step marker and
+// then checks that the target node can be reached through the executor.
+func (s *OnboardingService) stepConnectionTest(ctx context.Context, job *OnboardingJob, executor *ssh.Executor) error {
+	job.CurrentStep, job.StepMessage = 1, "Testing SSH connection..."
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	connErr := executor.TestConnection(ctx)
+	if connErr == nil {
+		return nil
+	}
+	return fmt.Errorf("SSH connection test failed: %w", connErr)
+}
+
+// stepPlatformDetection is onboarding step 2: it queries the target node for
+// its OS, version and architecture and stores them on the job. A non-empty
+// hostname reported by the node replaces job.NodeName.
+func (s *OnboardingService) stepPlatformDetection(ctx context.Context, job *OnboardingJob, executor *ssh.Executor) error {
+	job.CurrentStep, job.StepMessage = 2, "Detecting node platform..."
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	hostInfo, err := executor.GetHostInfo(ctx)
+	if err != nil {
+		return fmt.Errorf("failed to detect platform: %w", err)
+	}
+
+	detected := NodePlatform{
+		OS:      hostInfo["os"],
+		Version: hostInfo["version"],
+		Arch:    hostInfo["arch"],
+	}
+	job.Platform = detected
+
+	if hostname := hostInfo["hostname"]; hostname != "" {
+		job.NodeName = hostname
+	}
+
+	// Persist a human-readable summary of what was found.
+	job.StepMessage = fmt.Sprintf("Detected: %s %s (%s)", job.Platform.OS, job.Platform.Version, job.Platform.Arch)
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	return nil
+}
+
+// stepEnvironmentCheck is onboarding step 3: it verifies that kubeadm and
+// kubelet are available on the target node, in that order.
+func (s *OnboardingService) stepEnvironmentCheck(ctx context.Context, job *OnboardingJob, executor *ssh.Executor) error {
+	job.CurrentStep, job.StepMessage = 3, "Checking environment..."
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	// Cases are evaluated top to bottom, so kubelet is only probed when
+	// kubeadm was found.
+	switch {
+	case !executor.CheckCommand(ctx, "kubeadm"):
+		return fmt.Errorf("kubeadm is not installed on the target node")
+	case !executor.CheckCommand(ctx, "kubelet"):
+		return fmt.Errorf("kubelet is not installed on the target node")
+	}
+
+	return nil
+}
+
+// stepPreJoinScripts is onboarding step 4: it runs every init script
+// registered for the pre-join phase on the target node, in the order returned
+// by GetScriptsForPhase, and stops at the first script that fails.
+//
+// Progress is tracked in job.SubSteps (one entry per script) and persisted
+// after every state change. A script counts as failed when the executor
+// reports an error or a non-zero exit code.
+func (s *OnboardingService) stepPreJoinScripts(ctx context.Context, job *OnboardingJob, executor *ssh.Executor) error {
+	job.CurrentStep = 4
+	job.StepMessage = "Executing pre-join scripts..."
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	// Get init scripts for pre-join phase
+	scripts, err := s.initScriptSvc.GetScriptsForPhase(ctx, PhasePreJoin, job.Platform)
+	if err != nil {
+		return fmt.Errorf("failed to get pre-join scripts: %w", err)
+	}
+
+	// Nothing to run is a successful outcome, not an error.
+	if len(scripts) == 0 {
+		job.StepMessage = "No pre-join scripts to execute"
+		job.UpdatedAt = time.Now()
+		s.saveJob(context.Background(), job)
+		return nil
+	}
+
+	// Initialize sub-steps
+	job.SubSteps = make([]SubStep, len(scripts))
+	for i, script := range scripts {
+		job.SubSteps[i] = SubStep{
+			Name:   script.Group.Name,
+			Status: SubStepPending,
+		}
+	}
+	s.saveJob(context.Background(), job)
+
+	// Get variables for script replacement
+	// The lookup error is deliberately ignored: without a control plane
+	// config, CONTROL_PLANE_IP is substituted with an empty string.
+	cpConfig, _ := s.initScriptSvc.GetControlPlaneConfig(ctx)
+	controlPlaneIP := ""
+	if cpConfig != nil {
+		controlPlaneIP = cpConfig.Host
+	}
+	vars := map[string]string{
+		"NODE_IP":          job.NodeIP,
+		"NODE_NAME":        job.NodeName,
+		"CONTROL_PLANE_IP": controlPlaneIP,
+	}
+
+	// Execute scripts
+	for stepIdx, script := range scripts {
+		job.SubSteps[stepIdx].Status = SubStepRunning
+		job.StepMessage = fmt.Sprintf("Executing: %s", script.Group.Name)
+		job.UpdatedAt = time.Now()
+		s.saveJob(context.Background(), job)
+
+		// Replace variables in script content
+		content := ReplaceVariables(script.Script.Content, vars)
+
+		// Execute script
+		result := executor.ExecuteScript(ctx, content)
+		if result.Error != nil || result.ExitCode != 0 {
+			job.SubSteps[stepIdx].Status = SubStepFailed
+			// Prefer the executor error; fall back to the script's stderr
+			// when the script itself exited non-zero.
+			errMsg := result.Stderr
+			if result.Error != nil {
+				errMsg = result.Error.Error()
+			}
+			job.SubSteps[stepIdx].Error = errMsg
+			s.saveJob(context.Background(), job)
+			return fmt.Errorf("pre-join script '%s' failed: %s", script.Group.Name, errMsg)
+		}
+
+		job.SubSteps[stepIdx].Status = SubStepSuccess
+		s.saveJob(context.Background(), job)
+	}
+
+	// The cleared list is not saved here; it is written by the next saveJob call.
+	job.SubSteps = nil // Clear sub-steps after completion
+	return nil
+}
+
+// stepGetJoinToken is onboarding step 5: it connects to the control plane over
+// SSH and asks kubeadm for a fresh join command.
+//
+// It returns the raw stdout of `kubeadm token create --print-join-command`.
+// An error is returned when the control plane config is missing or has no
+// host, when the SSH connection fails, when the command fails, or when it
+// prints nothing.
+func (s *OnboardingService) stepGetJoinToken(ctx context.Context, job *OnboardingJob) (string, error) {
+	job.CurrentStep = 5
+	job.StepMessage = "Getting join token from control plane..."
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	// Get control plane config
+	cpConfig, err := s.initScriptSvc.GetControlPlaneConfig(ctx)
+	if err != nil {
+		return "", fmt.Errorf("failed to get control plane config: %w", err)
+	}
+
+	// The script steps treat a nil config as possible, so guard against it
+	// here too instead of dereferencing a nil pointer.
+	if cpConfig == nil || cpConfig.Host == "" {
+		return "", fmt.Errorf("control plane host is not configured")
+	}
+
+	// Create SSH executor for control plane
+	cpSSHConfig := &ssh.Config{
+		Host:       cpConfig.Host,
+		Port:       cpConfig.SSHPort,
+		Username:   cpConfig.SSHUser,
+		AuthMethod: ssh.AuthMethod(cpConfig.AuthMethod),
+		Password:   cpConfig.Password,
+		PrivateKey: cpConfig.PrivateKey,
+		Timeout:    30 * time.Second,
+	}
+	cpExecutor := ssh.NewExecutor(cpSSHConfig)
+	defer cpExecutor.Close()
+
+	if err := cpExecutor.Connect(ctx); err != nil {
+		return "", fmt.Errorf("failed to connect to control plane: %w", err)
+	}
+
+	// Generate join command
+	result := cpExecutor.Execute(ctx, "kubeadm token create --print-join-command")
+	if result.Error != nil || result.ExitCode != 0 {
+		// Prefer the executor error; fall back to the command's stderr.
+		errMsg := result.Stderr
+		if result.Error != nil {
+			errMsg = result.Error.Error()
+		}
+		return "", fmt.Errorf("failed to generate join command: %s", errMsg)
+	}
+
+	joinCommand := result.Stdout
+	if joinCommand == "" {
+		return "", fmt.Errorf("empty join command returned")
+	}
+
+	return joinCommand, nil
+}
+
+// stepKubeadmJoin is onboarding step 6: it runs the join command on the target
+// node, bounded by a five-minute timeout derived from ctx.
+func (s *OnboardingService) stepKubeadmJoin(ctx context.Context, job *OnboardingJob, executor *ssh.Executor, joinCommand string) error {
+	job.CurrentStep, job.StepMessage = 6, "Executing kubeadm join..."
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	// Joining can take a while, so it gets its own deadline.
+	joinCtx, release := context.WithTimeout(ctx, 5*time.Minute)
+	defer release()
+
+	outcome := executor.Execute(joinCtx, joinCommand)
+	if outcome.Error == nil && outcome.ExitCode == 0 {
+		return nil
+	}
+
+	// Prefer the executor error; otherwise report the command's stderr.
+	reason := outcome.Stderr
+	if outcome.Error != nil {
+		reason = outcome.Error.Error()
+	}
+	return fmt.Errorf("kubeadm join failed: %s", reason)
+}
+
+// stepPostJoinScripts is onboarding step 7: it runs every init script
+// registered for the post-join phase on the target node, in the order returned
+// by GetScriptsForPhase, and stops at the first script that fails.
+//
+// Progress is tracked in job.SubSteps (one entry per script) and persisted
+// after every state change. A script counts as failed when the executor
+// reports an error or a non-zero exit code.
+func (s *OnboardingService) stepPostJoinScripts(ctx context.Context, job *OnboardingJob, executor *ssh.Executor) error {
+	job.CurrentStep = 7
+	job.StepMessage = "Executing post-join scripts..."
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	// Get init scripts for post-join phase
+	scripts, err := s.initScriptSvc.GetScriptsForPhase(ctx, PhasePostJoin, job.Platform)
+	if err != nil {
+		return fmt.Errorf("failed to get post-join scripts: %w", err)
+	}
+
+	// Nothing to run is a successful outcome, not an error.
+	if len(scripts) == 0 {
+		job.StepMessage = "No post-join scripts to execute"
+		job.UpdatedAt = time.Now()
+		s.saveJob(context.Background(), job)
+		return nil
+	}
+
+	// Initialize sub-steps
+	job.SubSteps = make([]SubStep, len(scripts))
+	for i, script := range scripts {
+		job.SubSteps[i] = SubStep{
+			Name:   script.Group.Name,
+			Status: SubStepPending,
+		}
+	}
+	s.saveJob(context.Background(), job)
+
+	// Get variables for script replacement
+	// The lookup error is deliberately ignored: without a control plane
+	// config, CONTROL_PLANE_IP is substituted with an empty string.
+	cpConfig, _ := s.initScriptSvc.GetControlPlaneConfig(ctx)
+	controlPlaneIP := ""
+	if cpConfig != nil {
+		controlPlaneIP = cpConfig.Host
+	}
+	vars := map[string]string{
+		"NODE_IP":          job.NodeIP,
+		"NODE_NAME":        job.NodeName,
+		"CONTROL_PLANE_IP": controlPlaneIP,
+	}
+
+	// Execute scripts
+	for stepIdx, script := range scripts {
+		job.SubSteps[stepIdx].Status = SubStepRunning
+		job.StepMessage = fmt.Sprintf("Executing: %s", script.Group.Name)
+		job.UpdatedAt = time.Now()
+		s.saveJob(context.Background(), job)
+
+		// Replace variables in script content
+		content := ReplaceVariables(script.Script.Content, vars)
+
+		// Execute script
+		result := executor.ExecuteScript(ctx, content)
+		if result.Error != nil || result.ExitCode != 0 {
+			job.SubSteps[stepIdx].Status = SubStepFailed
+			// Prefer the executor error; fall back to the script's stderr
+			// when the script itself exited non-zero.
+			errMsg := result.Stderr
+			if result.Error != nil {
+				errMsg = result.Error.Error()
+			}
+			job.SubSteps[stepIdx].Error = errMsg
+			s.saveJob(context.Background(), job)
+			return fmt.Errorf("post-join script '%s' failed: %s", script.Group.Name, errMsg)
+		}
+
+		job.SubSteps[stepIdx].Status = SubStepSuccess
+		s.saveJob(context.Background(), job)
+	}
+
+	// The cleared list is not saved here; it is written by the next saveJob call.
+	job.SubSteps = nil // Clear sub-steps after completion
+	return nil
+}
+
+// stepWaitForNodeReady is onboarding step 8: it polls the cluster's node list
+// every five seconds, for at most five minutes, until the onboarded node
+// reports a Ready condition with status True.
+//
+// A node matches when its first InternalIP address equals job.NodeIP or its
+// name equals job.NodeName; on a match job.NodeName is overwritten with the
+// cluster's node name. The function returns ctx.Err() if ctx ends first and a
+// timeout error if the five minutes elapse.
+func (s *OnboardingService) stepWaitForNodeReady(ctx context.Context, job *OnboardingJob) error {
+	job.CurrentStep = 8
+	job.StepMessage = "Waiting for node to be ready..."
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	// Wait for node to appear and become ready
+	timeout := time.After(5 * time.Minute)
+	ticker := time.NewTicker(5 * time.Second)
+	defer ticker.Stop()
+
+	for {
+		select {
+		case <-ctx.Done():
+			return ctx.Err()
+		case <-timeout:
+			return fmt.Errorf("timeout waiting for node to be ready")
+		case <-ticker.C:
+			// Try to find the node
+			nodes, err := s.k8sClient.ListNodes(ctx)
+			if err != nil {
+				// A failed listing is not fatal; try again on the next tick.
+				continue
+			}
+
+			for _, node := range nodes.Items {
+				// Match by IP or hostname
+				nodeIP := ""
+				for _, addr := range node.Status.Addresses {
+					if addr.Type == corev1.NodeInternalIP {
+						nodeIP = addr.Address
+						break
+					}
+				}
+
+				if nodeIP == job.NodeIP || node.Name == job.NodeName {
+					// Adopt the cluster's name for the node; later steps use job.NodeName.
+					job.NodeName = node.Name
+
+					// Check if node is ready
+					for _, cond := range node.Status.Conditions {
+						if cond.Type == corev1.NodeReady && cond.Status == corev1.ConditionTrue {
+							job.StepMessage = fmt.Sprintf("Node %s is ready", node.Name)
+							job.UpdatedAt = time.Now()
+							s.saveJob(context.Background(), job)
+							return nil
+						}
+					}
+				}
+			}
+		}
+	}
+}
+
+// stepEnableNode is onboarding step 9: it enables the joined node through the
+// node service. It fails when the job has no node name.
+func (s *OnboardingService) stepEnableNode(ctx context.Context, job *OnboardingJob) error {
+	job.CurrentStep, job.StepMessage = 9, "Enabling node in Bison..."
+	job.UpdatedAt = time.Now()
+	s.saveJob(context.Background(), job)
+
+	if job.NodeName == "" {
+		return fmt.Errorf("node name is not set")
+	}
+
+	// Enable node in Bison (add to shared pool)
+	enableErr := s.nodeSvc.EnableNode(ctx, job.NodeName)
+	if enableErr == nil {
+		return nil
+	}
+	return fmt.Errorf("failed to enable node: %w", enableErr)
+}
+
+// failJob marks the job as failed with err's message, stamps its completion
+// time, persists it with a background context and logs the failure.
+func (s *OnboardingService) failJob(job *OnboardingJob, err error) {
+	job.Status, job.ErrorMessage = JobStatusFailed, err.Error()
+	job.UpdatedAt = time.Now()
+
+	finishedAt := time.Now()
+	job.CompletedAt = &finishedAt
+
+	s.saveJob(context.Background(), job)
+
+	logger.Error("Node onboarding failed", "nodeIP", job.NodeIP, "error", err)
+}
+
+func (s *OnboardingService) saveJob(ctx context.Context, job *OnboardingJob) error {
+	data, err := json.Marshal(job)
+	if err != nil {
+		return fmt.Errorf("failed to marshal job: %w", err)
+	}
+
+	cm, err := s.k8sClient.GetConfigMap(ctx, BisonNamespace, OnboardingJobsConfigMap)
+	if err != nil {
+		if errors.IsNotFound(err) {
+			// Create new ConfigMap
+			cm = &corev1.ConfigMap{
+				ObjectMeta: metav1.ObjectMeta{
+					Name:      OnboardingJobsConfigMap,
+					Namespace: BisonNamespace,
+				},
+				Data: map[string]string{
+					job.ID: string(data),
+				},
+			}
+			return s.k8sClient.CreateConfigMap(ctx, BisonNamespace, cm)
+		}
+		return fmt.Errorf("failed to get jobs config: %w", err)
+	}
+
+	// Update existing ConfigMap
+	if cm.Data == nil {
+		cm.Data = make(map[string]string)
+	}
+	cm.Data[job.ID] = string(data)
+
+	return s.k8sClient.UpdateConfigMap(ctx, BisonNamespace, cm)
+}
+
+// getJobsMap returns the raw job-ID to JSON map held in the onboarding jobs
+// ConfigMap. A missing ConfigMap or one without data yields an empty map.
+func (s *OnboardingService) getJobsMap(ctx context.Context) (map[string]string, error) {
+	cm, err := s.k8sClient.GetConfigMap(ctx, BisonNamespace, OnboardingJobsConfigMap)
+
+	switch {
+	case err == nil:
+		if cm.Data != nil {
+			return cm.Data, nil
+		}
+		return make(map[string]string), nil
+	case errors.IsNotFound(err):
+		// No ConfigMap yet simply means no jobs have been saved.
+		return make(map[string]string), nil
+	default:
+		return nil, fmt.Errorf("failed to get jobs config: %w", err)
+	}
+}
+
+// TestControlPlaneConnection checks that the configured control plane can be
+// reached over SSH and that kubeadm is available on it.
+//
+// It returns an error when the control plane config cannot be loaded, is
+// missing or has no host, when the SSH connection test fails, or when kubeadm
+// is not found.
+func (s *OnboardingService) TestControlPlaneConnection(ctx context.Context) error {
+	cpConfig, err := s.initScriptSvc.GetControlPlaneConfig(ctx)
+	if err != nil {
+		return fmt.Errorf("failed to get control plane config: %w", err)
+	}
+
+	// The script steps treat a nil config as possible, so guard against it
+	// here too instead of dereferencing a nil pointer.
+	if cpConfig == nil || cpConfig.Host == "" {
+		return fmt.Errorf("control plane host is not configured")
+	}
+
+	sshConfig := &ssh.Config{
+		Host:       cpConfig.Host,
+		Port:       cpConfig.SSHPort,
+		Username:   cpConfig.SSHUser,
+		AuthMethod: ssh.AuthMethod(cpConfig.AuthMethod),
+		Password:   cpConfig.Password,
+		PrivateKey: cpConfig.PrivateKey,
+		Timeout:    30 * time.Second,
+	}
+
+	executor := ssh.NewExecutor(sshConfig)
+	defer executor.Close()
+
+	if err := executor.TestConnection(ctx); err != nil {
+		return fmt.Errorf("SSH connection test failed: %w", err)
+	}
+
+	// Also verify kubeadm is available
+	if !executor.CheckCommand(ctx, "kubeadm") {
+		return fmt.Errorf("kubeadm is not available on the control plane")
+	}
+
+	return nil
+}
diff --git a/api-server/internal/service/settings_service.go b/api-server/internal/service/settings_service.go
index 0a561f4..d9c506d 100644
--- a/api-server/internal/service/settings_service.go
+++ b/api-server/internal/service/settings_service.go
@@ -6,6 +6,7 @@ import (
 	"fmt"
 	"io"
 	"net/http"
+	"net/url"
 	"time"
 )
 
@@ -48,28 +49,66 @@ type PrometheusMetric struct {
 	Value     float64 `json:"value"`
 }
 
+// LabeledMetricSeries represents a Prometheus metric series with labels
+type LabeledMetricSeries struct {
+	// Labels is the label set Prometheus returned for this series.
+	Labels  map[string]string  `json:"labels"`
+	// Metrics holds the series' samples as timestamp/value pairs.
+	Metrics []PrometheusMetric `json:"metrics"`
+}
+
 // NodeMetrics represents metrics for a node
 type NodeMetrics struct {
 	CPUUsage    []PrometheusMetric `json:"cpuUsage"`
 	MemoryUsage []PrometheusMetric `json:"memoryUsage"`
+	// Network IO
+	NetworkReceive  []PrometheusMetric `json:"networkReceive,omitempty"`
+	NetworkTransmit []PrometheusMetric `json:"networkTransmit,omitempty"`
+	// RDMA IO
+	RdmaReceive  []PrometheusMetric `json:"rdmaReceive,omitempty"`
+	RdmaTransmit []PrometheusMetric `json:"rdmaTransmit,omitempty"`
+	// GPU (NVIDIA DCGM)
+	GpuUtilization []PrometheusMetric    `json:"gpuUtilization,omitempty"`
+	GpuMemoryUtil  []PrometheusMetric    `json:"gpuMemoryUtil,omitempty"`
+	GpuPerDevice   []LabeledMetricSeries `json:"gpuPerDevice,omitempty"`
+	// NPU (Huawei Ascend)
+	NpuUtilization []PrometheusMetric `json:"npuUtilization,omitempty"`
+	NpuMemoryUtil  []PrometheusMetric `json:"npuMemoryUtil,omitempty"`
+	NpuTemperature []PrometheusMetric `json:"npuTemperature,omitempty"`
 }
 
-// QueryPrometheus queries Prometheus API
-func (s *SettingsService) QueryPrometheus(ctx context.Context, query string, start, end time.Time, step time.Duration) ([]PrometheusMetric, error) {
+// NodeMetricsRequest holds parameters for querying node metrics
+type NodeMetricsRequest struct {
+	// NodeName is inserted into the label matchers of every query.
+	NodeName string
+	// Hours is the length of the look-back window, ending at the time of the call.
+	Hours    int
+	// HasGpu enables the DCGM GPU queries.
+	HasGpu   bool
+	// HasNpu enables the npu_chip_info NPU queries.
+	HasNpu   bool
+}
+
+// prometheusResponse is the JSON structure returned by Prometheus query_range API
+type prometheusResponse struct {
+	Status string `json:"status"`
+	Data   struct {
+		ResultType string `json:"resultType"`
+		// Result holds one entry per returned series.
+		Result     []struct {
+			// Metric is the label set of the series.
+			Metric map[string]string `json:"metric"`
+			// Values holds the samples; each entry is read as a
+			// [timestamp, value] pair by parseMetricValues.
+			Values [][]interface{}   `json:"values"`
+		} `json:"result"`
+	} `json:"data"`
+}
+
+// queryPrometheusRaw executes a Prometheus range query and returns the raw response
+func (s *SettingsService) queryPrometheusRaw(ctx context.Context, query string, start, end time.Time, step time.Duration) (*prometheusResponse, error) {
 	if s.prometheusURL == "" {
 		return nil, fmt.Errorf("prometheus URL not configured")
 	}
 
-	// Build query URL
-	url := fmt.Sprintf("%s/api/v1/query_range?query=%s&start=%d&end=%d&step=%d",
-		s.prometheusURL,
-		query,
-		start.Unix(),
-		end.Unix(),
-		int(step.Seconds()),
-	)
+	params := url.Values{}
+	params.Set("query", query)
+	params.Set("start", fmt.Sprintf("%d", start.Unix()))
+	params.Set("end", fmt.Sprintf("%d", end.Unix()))
+	params.Set("step", fmt.Sprintf("%d", int(step.Seconds())))
+	fullURL := fmt.Sprintf("%s/api/v1/query_range?%s", s.prometheusURL, params.Encode())
 
-	req, err := http.NewRequestWithContext(ctx, "GET", url, nil)
+	req, err := http.NewRequestWithContext(ctx, "GET", fullURL, nil)
 	if err != nil {
 		return nil, fmt.Errorf("failed to create request: %w", err)
 	}
@@ -86,17 +125,7 @@ func (s *SettingsService) QueryPrometheus(ctx context.Context, query string, sta
 		return nil, fmt.Errorf("prometheus returned status %d: %s", resp.StatusCode, string(body))
 	}
 
-	var result struct {
-		Status string `json:"status"`
-		Data   struct {
-			ResultType string `json:"resultType"`
-			Result     []struct {
-				Metric map[string]string `json:"metric"`
-				Values [][]interface{}   `json:"values"`
-			} `json:"result"`
-		} `json:"data"`
-	}
-
+	var result prometheusResponse
 	if err := json.NewDecoder(resp.Body).Decode(&result); err != nil {
 		return nil, fmt.Errorf("failed to decode response: %w", err)
 	}
@@ -105,51 +134,127 @@ func (s *SettingsService) QueryPrometheus(ctx context.Context, query string, sta
 		return nil, fmt.Errorf("prometheus query failed")
 	}
 
+	return &result, nil
+}
+
+// parseMetricValues extracts PrometheusMetric slice from raw Prometheus values
+func parseMetricValues(values [][]interface{}) []PrometheusMetric {
 	var metrics []PrometheusMetric
-	if len(result.Data.Result) > 0 {
-		for _, v := range result.Data.Result[0].Values {
-			if len(v) >= 2 {
-				ts, _ := v[0].(float64)
-				val := 0.0
-				switch vv := v[1].(type) {
-				case string:
-					fmt.Sscanf(vv, "%f", &val)
-				case float64:
-					val = vv
-				}
-				metrics = append(metrics, PrometheusMetric{
-					Timestamp: ts,
-					Value:     val,
-				})
+	for _, v := range values {
+		if len(v) >= 2 {
+			ts, _ := v[0].(float64)
+			val := 0.0
+			switch vv := v[1].(type) {
+			case string:
+				fmt.Sscanf(vv, "%f", &val)
+			case float64:
+				val = vv
 			}
+			metrics = append(metrics, PrometheusMetric{
+				Timestamp: ts,
+				Value:     val,
+			})
 		}
 	}
+	return metrics
+}
+
+// QueryPrometheus queries Prometheus API and returns the first result series
+func (s *SettingsService) QueryPrometheus(ctx context.Context, query string, start, end time.Time, step time.Duration) ([]PrometheusMetric, error) {
+	result, err := s.queryPrometheusRaw(ctx, query, start, end, step)
+	if err != nil {
+		return nil, err
+	}
 
-	return metrics, nil
+	if len(result.Data.Result) > 0 {
+		return parseMetricValues(result.Data.Result[0].Values), nil
+	}
+
+	return nil, nil
+}
+
+// QueryPrometheusMultiSeries runs a Prometheus range query and returns every
+// result series together with its label set.
+func (s *SettingsService) QueryPrometheusMultiSeries(ctx context.Context, query string, start, end time.Time, step time.Duration) ([]LabeledMetricSeries, error) {
+	raw, err := s.queryPrometheusRaw(ctx, query, start, end, step)
+	if err != nil {
+		return nil, err
+	}
+
+	// Stays nil (not an empty slice) when Prometheus returns no series.
+	var collected []LabeledMetricSeries
+	for idx := range raw.Data.Result {
+		entry := raw.Data.Result[idx]
+		collected = append(collected, LabeledMetricSeries{
+			Labels:  entry.Metric,
+			Metrics: parseMetricValues(entry.Values),
+		})
+	}
+
+	return collected, nil
 }
 
 // GetNodeMetrics returns metrics for a specific node
-func (s *SettingsService) GetNodeMetrics(ctx context.Context, nodeName string, hours int) (*NodeMetrics, error) {
+func (s *SettingsService) GetNodeMetrics(ctx context.Context, req NodeMetricsRequest) (*NodeMetrics, error) {
 	end := time.Now()
-	start := end.Add(-time.Duration(hours) * time.Hour)
+	start := end.Add(-time.Duration(req.Hours) * time.Hour)
 	step := time.Minute * 5
+	node := req.NodeName
 
-	// Query CPU usage
-	cpuQuery := fmt.Sprintf(`100 - (avg by(instance) (rate(node_cpu_seconds_total{mode="idle", instance=~"%s.*"}[5m])) * 100)`, nodeName)
-	cpuMetrics, err := s.QueryPrometheus(ctx, cpuQuery, start, end, step)
-	if err != nil {
-		cpuMetrics = nil // Non-fatal, continue
+	result := &NodeMetrics{}
+
+	// --- Always query: CPU, Memory, Network, RDMA ---
+
+	// CPU usage (%)
+	cpuQuery := fmt.Sprintf(`100 - (avg by(instance) (rate(node_cpu_seconds_total{mode="idle", instance=~"%s.*"}[5m])) * 100)`, node)
+	result.CPUUsage, _ = s.QueryPrometheus(ctx, cpuQuery, start, end, step)
+
+	// Memory usage (%)
+	memQuery := fmt.Sprintf(`(1 - (node_memory_MemAvailable_bytes{instance=~"%s.*"} / node_memory_MemTotal_bytes{instance=~"%s.*"})) * 100`, node, node)
+	result.MemoryUsage, _ = s.QueryPrometheus(ctx, memQuery, start, end, step)
+
+	// Network receive (bytes/sec, excluding virtual interfaces)
+	netRecvQuery := fmt.Sprintf(`sum(rate(node_network_receive_bytes_total{instance=~"%s.*",device!~"lo|docker.*|veth.*|br.*|cni.*|flannel.*|cali.*|tunl.*|kube.*|virbr.*"}[5m]))`, node)
+	result.NetworkReceive, _ = s.QueryPrometheus(ctx, netRecvQuery, start, end, step)
+
+	// Network transmit (bytes/sec)
+	netTransQuery := fmt.Sprintf(`sum(rate(node_network_transmit_bytes_total{instance=~"%s.*",device!~"lo|docker.*|veth.*|br.*|cni.*|flannel.*|cali.*|tunl.*|kube.*|virbr.*"}[5m]))`, node)
+	result.NetworkTransmit, _ = s.QueryPrometheus(ctx, netTransQuery, start, end, step)
+
+	// RDMA receive (bytes/sec, InfiniBand via node_exporter)
+	rdmaRecvQuery := fmt.Sprintf(`sum(rate(node_infiniband_port_data_received_bytes_total{instance=~"%s.*"}[5m]))`, node)
+	result.RdmaReceive, _ = s.QueryPrometheus(ctx, rdmaRecvQuery, start, end, step)
+
+	// RDMA transmit (bytes/sec)
+	rdmaTransQuery := fmt.Sprintf(`sum(rate(node_infiniband_port_data_transmitted_bytes_total{instance=~"%s.*"}[5m]))`, node)
+	result.RdmaTransmit, _ = s.QueryPrometheus(ctx, rdmaTransQuery, start, end, step)
+
+	// --- Conditional: GPU (DCGM) ---
+	if req.HasGpu {
+		// Average GPU SM utilization (%)
+		gpuUtilQuery := fmt.Sprintf(`avg(DCGM_FI_DEV_GPU_UTIL{Hostname="%s"} or DCGM_FI_DEV_GPU_UTIL{instance=~"%s.*"})`, node, node)
+		result.GpuUtilization, _ = s.QueryPrometheus(ctx, gpuUtilQuery, start, end, step)
+
+		// Average GPU memory utilization (%)
+		gpuMemQuery := fmt.Sprintf(`avg(DCGM_FI_DEV_MEM_COPY_UTIL{Hostname="%s"} or DCGM_FI_DEV_MEM_COPY_UTIL{instance=~"%s.*"})`, node, node)
+		result.GpuMemoryUtil, _ = s.QueryPrometheus(ctx, gpuMemQuery, start, end, step)
+
+		// Per-GPU SM utilization (multi-series)
+		gpuPerDeviceQuery := fmt.Sprintf(`DCGM_FI_DEV_GPU_UTIL{Hostname="%s"} or DCGM_FI_DEV_GPU_UTIL{instance=~"%s.*"}`, node, node)
+		result.GpuPerDevice, _ = s.QueryPrometheusMultiSeries(ctx, gpuPerDeviceQuery, start, end, step)
 	}
 
-	// Query memory usage
-	memQuery := fmt.Sprintf(`(1 - (node_memory_MemAvailable_bytes{instance=~"%s.*"} / node_memory_MemTotal_bytes{instance=~"%s.*"})) * 100`, nodeName, nodeName)
-	memMetrics, err := s.QueryPrometheus(ctx, memQuery, start, end, step)
-	if err != nil {
-		memMetrics = nil // Non-fatal, continue
+	// --- Conditional: NPU (Huawei Ascend) ---
+	if req.HasNpu {
+		// NPU utilization (%)
+		npuUtilQuery := fmt.Sprintf(`avg(npu_chip_info_utilization{id=~"%s.*"})`, node)
+		result.NpuUtilization, _ = s.QueryPrometheus(ctx, npuUtilQuery, start, end, step)
+
+		// NPU HBM usage (%)
+		npuMemQuery := fmt.Sprintf(`avg(npu_chip_info_hbm_usage{id=~"%s.*"})`, node)
+		result.NpuMemoryUtil, _ = s.QueryPrometheus(ctx, npuMemQuery, start, end, step)
+
+		// NPU temperature (°C)
+		npuTempQuery := fmt.Sprintf(`avg(npu_chip_info_temperature{id=~"%s.*"})`, node)
+		result.NpuTemperature, _ = s.QueryPrometheus(ctx, npuTempQuery, start, end, step)
 	}
 
-	return &NodeMetrics{
-		CPUUsage:    cpuMetrics,
-		MemoryUsage: memMetrics,
-	}, nil
+	return result, nil
 }
diff --git a/api-server/internal/ssh/executor.go b/api-server/internal/ssh/executor.go
new file mode 100644
index 0000000..e1feb9e
--- /dev/null
+++ b/api-server/internal/ssh/executor.go
@@ -0,0 +1,370 @@
+package ssh
+
+import (
+	"bytes"
+	"context"
+	"fmt"
+	"io"
+	"net"
+	"strings"
+	"sync"
+	"time"
+
+	"golang.org/x/crypto/ssh"
+)
+
+// AuthMethod represents the SSH authentication method
+type AuthMethod string
+
+const (
+	// AuthMethodPassword selects password authentication; Connect then
+	// requires a non-empty Config.Password.
+	AuthMethodPassword   AuthMethod = "password"
+	// AuthMethodPrivateKey selects public-key authentication; Connect then
+	// requires a parseable Config.PrivateKey.
+	AuthMethodPrivateKey AuthMethod = "privateKey"
+)
+
+// Config holds SSH connection configuration
+type Config struct {
+	Host       string
+	// Port is replaced with 22 by NewExecutor when left at zero.
+	Port       int
+	Username   string
+	// AuthMethod decides which of Password and PrivateKey is used.
+	AuthMethod AuthMethod
+	Password   string
+	PrivateKey string // PEM encoded private key content
+	// Timeout is replaced with 30 seconds by NewExecutor when left at zero.
+	Timeout    time.Duration
+}
+
+// CommandResult holds the result of a remote command execution
+type CommandResult struct {
+	Stdout   string
+	Stderr   string
+	// ExitCode is the remote exit status, or -1 when the command did not
+	// produce one (not connected, session failure, context ended).
+	ExitCode int
+	// Error is set for executor-level failures; a command that merely exits
+	// non-zero leaves it nil.
+	Error    error
+}
+
+// Executor handles SSH connections and remote command execution
+type Executor struct {
+	config *Config
+	// client is nil until Connect succeeds and again after Close.
+	client *ssh.Client
+	// mu guards client.
+	mu     sync.Mutex
+}
+
+// NewExecutor creates a new SSH executor with the given configuration
+func NewExecutor(config *Config) *Executor {
+	if config.Port == 0 {
+		config.Port = 22
+	}
+	if config.Timeout == 0 {
+		config.Timeout = 30 * time.Second
+	}
+	return &Executor{
+		config: config,
+	}
+}
+
+// Connect establishes an SSH connection to the remote host.
+//
+// It is a no-op when a connection already exists. Credentials are validated
+// according to the configured AuthMethod before dialing. The executor's mutex
+// is held for the whole call, including the dial.
+//
+// If ctx ends while the dial is still in progress, ctx.Err() is returned
+// straight away; should the dial succeed afterwards, the resulting connection
+// is closed in the background so it is not leaked.
+func (e *Executor) Connect(ctx context.Context) error {
+	e.mu.Lock()
+	defer e.mu.Unlock()
+
+	if e.client != nil {
+		return nil // Already connected
+	}
+
+	var authMethods []ssh.AuthMethod
+
+	switch e.config.AuthMethod {
+	case AuthMethodPassword:
+		if e.config.Password == "" {
+			return fmt.Errorf("password is required for password authentication")
+		}
+		authMethods = append(authMethods, ssh.Password(e.config.Password))
+
+	case AuthMethodPrivateKey:
+		if e.config.PrivateKey == "" {
+			return fmt.Errorf("private key is required for private key authentication")
+		}
+		signer, err := ssh.ParsePrivateKey([]byte(e.config.PrivateKey))
+		if err != nil {
+			return fmt.Errorf("failed to parse private key: %w", err)
+		}
+		authMethods = append(authMethods, ssh.PublicKeys(signer))
+
+	default:
+		return fmt.Errorf("unsupported authentication method: %s", e.config.AuthMethod)
+	}
+
+	sshConfig := &ssh.ClientConfig{
+		User:            e.config.Username,
+		Auth:            authMethods,
+		HostKeyCallback: ssh.InsecureIgnoreHostKey(), // TODO: Consider using known_hosts in production
+		Timeout:         e.config.Timeout,
+	}
+
+	addr := fmt.Sprintf("%s:%d", e.config.Host, e.config.Port)
+
+	// ssh.Dial is not context-aware, so it runs in a goroutine and hands its
+	// outcome back over a buffered channel (the send never blocks).
+	type dialResult struct {
+		client *ssh.Client
+		err    error
+	}
+	resultCh := make(chan dialResult, 1)
+	go func() {
+		c, dialErr := ssh.Dial("tcp", addr, sshConfig)
+		resultCh <- dialResult{client: c, err: dialErr}
+	}()
+
+	select {
+	case <-ctx.Done():
+		// Nobody will use a connection that completes after this point:
+		// wait for the dial to finish and close whatever it produced.
+		go func() {
+			if late := <-resultCh; late.client != nil {
+				late.client.Close()
+			}
+		}()
+		return ctx.Err()
+	case res := <-resultCh:
+		if res.err != nil {
+			return fmt.Errorf("failed to connect to %s: %w", addr, res.err)
+		}
+		e.client = res.client
+	}
+
+	return nil
+}
+
+// Execute runs a command on the remote host and returns the result.
+//
+// Each call opens its own session on the existing connection; Connect must
+// have succeeded beforehand. The returned CommandResult is never nil:
+//   - not connected or session creation failed: ExitCode -1 and Error set;
+//   - ctx ended before the command finished: ExitCode -1, Error is ctx.Err(),
+//     and Stdout/Stderr hold whatever was captured so far;
+//   - command exited non-zero: ExitCode is the remote status and Error is nil;
+//   - any other run error: ExitCode -1 and Error set.
+func (e *Executor) Execute(ctx context.Context, command string) *CommandResult {
+	// Take a snapshot of the client under the lock, then release it so a
+	// long-running command does not block other callers.
+	e.mu.Lock()
+	if e.client == nil {
+		e.mu.Unlock()
+		return &CommandResult{
+			ExitCode: -1,
+			Error:    fmt.Errorf("not connected"),
+		}
+	}
+	client := e.client
+	e.mu.Unlock()
+
+	session, err := client.NewSession()
+	if err != nil {
+		return &CommandResult{
+			ExitCode: -1,
+			Error:    fmt.Errorf("failed to create session: %w", err),
+		}
+	}
+	defer session.Close()
+
+	var stdout, stderr bytes.Buffer
+	session.Stdout = &stdout
+	session.Stderr = &stderr
+
+	// Run command with context cancellation support
+	// The channel is buffered so the goroutine can finish even when nobody
+	// receives its result after ctx has ended.
+	done := make(chan error, 1)
+	go func() {
+		done <- session.Run(command)
+	}()
+
+	select {
+	case <-ctx.Done():
+		// Try to close the session to stop the command
+		session.Close()
+		// NOTE(review): the buffers are read here without waiting for the Run
+		// goroutine to return — confirm that goroutine can no longer write to them.
+		return &CommandResult{
+			Stdout:   stdout.String(),
+			Stderr:   stderr.String(),
+			ExitCode: -1,
+			Error:    ctx.Err(),
+		}
+	case err := <-done:
+		result := &CommandResult{
+			Stdout:   stdout.String(),
+			Stderr:   stderr.String(),
+			ExitCode: 0,
+		}
+
+		if err != nil {
+			// A remote non-zero exit is reported through ExitCode only;
+			// every other failure is surfaced as Error.
+			if exitErr, ok := err.(*ssh.ExitError); ok {
+				result.ExitCode = exitErr.ExitStatus()
+			} else {
+				result.ExitCode = -1
+				result.Error = err
+			}
+		}
+
+		return result
+	}
+}
+
+// ExecuteWithTimeout is Execute with a fresh background context that expires
+// after timeout.
+func (e *Executor) ExecuteWithTimeout(command string, timeout time.Duration) *CommandResult {
+	deadlineCtx, release := context.WithTimeout(context.Background(), timeout)
+	defer release()
+
+	outcome := e.Execute(deadlineCtx, command)
+	return outcome
+}
+
+// ExecuteScript executes a shell script on the remote host
+// The script content is passed via stdin to avoid escaping issues
+//
+// The script is fed to `bash -s` in its own session; Connect must have
+// succeeded beforehand. The returned CommandResult is never nil and follows
+// the same conventions as Execute: ExitCode -1 with Error set for executor
+// failures or an ended ctx, and the remote status with a nil Error when the
+// script itself exits non-zero.
+func (e *Executor) ExecuteScript(ctx context.Context, script string) *CommandResult {
+	// Take a snapshot of the client under the lock, then release it so a
+	// long-running script does not block other callers.
+	e.mu.Lock()
+	if e.client == nil {
+		e.mu.Unlock()
+		return &CommandResult{
+			ExitCode: -1,
+			Error:    fmt.Errorf("not connected"),
+		}
+	}
+	client := e.client
+	e.mu.Unlock()
+
+	session, err := client.NewSession()
+	if err != nil {
+		return &CommandResult{
+			ExitCode: -1,
+			Error:    fmt.Errorf("failed to create session: %w", err),
+		}
+	}
+	defer session.Close()
+
+	var stdout, stderr bytes.Buffer
+	session.Stdout = &stdout
+	session.Stderr = &stderr
+
+	// Pass script via stdin
+	stdin, err := session.StdinPipe()
+	if err != nil {
+		return &CommandResult{
+			ExitCode: -1,
+			Error:    fmt.Errorf("failed to create stdin pipe: %w", err),
+		}
+	}
+
+	// The channel is buffered so the goroutine can finish even when nobody
+	// receives its result after ctx has ended.
+	done := make(chan error, 1)
+	go func() {
+		done <- session.Run("bash -s")
+	}()
+
+	// Write script to stdin
+	// Closing stdin afterwards signals end of input to the remote shell.
+	// A write error is not reported to the caller.
+	go func() {
+		defer stdin.Close()
+		io.WriteString(stdin, script)
+	}()
+
+	select {
+	case <-ctx.Done():
+		session.Close()
+		// NOTE(review): the buffers are read here without waiting for the Run
+		// goroutine to return — confirm that goroutine can no longer write to them.
+		return &CommandResult{
+			Stdout:   stdout.String(),
+			Stderr:   stderr.String(),
+			ExitCode: -1,
+			Error:    ctx.Err(),
+		}
+	case err := <-done:
+		result := &CommandResult{
+			Stdout:   stdout.String(),
+			Stderr:   stderr.String(),
+			ExitCode: 0,
+		}
+
+		if err != nil {
+			// A remote non-zero exit is reported through ExitCode only;
+			// every other failure is surfaced as Error.
+			if exitErr, ok := err.(*ssh.ExitError); ok {
+				result.ExitCode = exitErr.ExitStatus()
+			} else {
+				result.ExitCode = -1
+				result.Error = err
+			}
+		}
+
+		return result
+	}
+}
+
+// TestConnection connects (if necessary) and confirms the link works by
+// running `echo ok` and checking that the trimmed output is exactly "ok".
+func (e *Executor) TestConnection(ctx context.Context) error {
+	if err := e.Connect(ctx); err != nil {
+		return err
+	}
+
+	// Round-trip a trivial command through the connection.
+	probe := e.Execute(ctx, "echo ok")
+
+	switch {
+	case probe.Error != nil:
+		return probe.Error
+	case probe.ExitCode != 0:
+		return fmt.Errorf("connection test failed: %s", probe.Stderr)
+	case strings.TrimSpace(probe.Stdout) != "ok":
+		return fmt.Errorf("unexpected response: %s", probe.Stdout)
+	}
+
+	return nil
+}
+
+// Close shuts down the SSH connection, if any, and forgets the client so a
+// later Connect dials again. Calling it without a connection returns nil.
+func (e *Executor) Close() error {
+	e.mu.Lock()
+	defer e.mu.Unlock()
+
+	if e.client == nil {
+		return nil
+	}
+
+	closeErr := e.client.Close()
+	e.client = nil
+	return closeErr
+}
+
+// IsConnected reports whether the executor currently holds an SSH client.
+func (e *Executor) IsConnected() bool {
+	e.mu.Lock()
+	connected := e.client != nil
+	e.mu.Unlock()
+
+	return connected
+}
+
+// parseOSRelease extracts the ID and VERSION_ID values from the content of an
+// os-release file. Keys are matched by name, so the order of the lines does
+// not matter; surrounding quotes are removed from the values.
+func parseOSRelease(content string) (id, versionID string) {
+	for _, line := range strings.Split(content, "\n") {
+		key, value, found := strings.Cut(strings.TrimSpace(line), "=")
+		if !found {
+			continue
+		}
+		value = strings.Trim(strings.TrimSpace(value), `"'`)
+
+		switch key {
+		case "ID":
+			id = value
+		case "VERSION_ID":
+			versionID = value
+		}
+	}
+	return id, versionID
+}
+
+// GetHostInfo retrieves basic host information (OS, architecture, etc.)
+//
+// The returned map may contain the keys "os", "version", "arch" and
+// "hostname". Each lookup is best-effort: a command that fails simply leaves
+// its keys unset, and the returned error is always nil.
+//
+// "os" and "version" come from the ID and VERSION_ID entries of
+// /etc/os-release and are looked up by key, because the order of those
+// entries is not fixed and some distributions list VERSION_ID before ID.
+func (e *Executor) GetHostInfo(ctx context.Context) (map[string]string, error) {
+	info := make(map[string]string)
+
+	// Get OS information
+	osResult := e.Execute(ctx, "cat /etc/os-release 2>/dev/null")
+	if osResult.Error == nil && osResult.ExitCode == 0 {
+		info["os"], info["version"] = parseOSRelease(osResult.Stdout)
+	}
+
+	// Get architecture
+	archResult := e.Execute(ctx, "uname -m")
+	if archResult.Error == nil && archResult.ExitCode == 0 {
+		arch := strings.TrimSpace(archResult.Stdout)
+		// Normalize architecture names
+		switch arch {
+		case "x86_64":
+			arch = "amd64"
+		case "aarch64":
+			arch = "arm64"
+		}
+		info["arch"] = arch
+	}
+
+	// Get hostname
+	hostnameResult := e.Execute(ctx, "hostname")
+	if hostnameResult.Error == nil && hostnameResult.ExitCode == 0 {
+		info["hostname"] = strings.TrimSpace(hostnameResult.Stdout)
+	}
+
+	return info, nil
+}
+
+// CheckCommand reports whether `command -v <command>` succeeds on the remote
+// host, i.e. runs without an executor error and exits with status 0.
+func (e *Executor) CheckCommand(ctx context.Context, command string) bool {
+	probe := e.Execute(ctx, fmt.Sprintf("command -v %s", command))
+	if probe.Error != nil {
+		return false
+	}
+	return probe.ExitCode == 0
+}
+
+// DialFunc returns a dialer that opens connections through the executor's SSH
+// client. The client is looked up on every call, so the dialer fails with
+// "not connected" whenever no connection is open at that moment.
+func (e *Executor) DialFunc() func(network, addr string) (net.Conn, error) {
+	// currentClient reads the client under the lock.
+	currentClient := func() *ssh.Client {
+		e.mu.Lock()
+		defer e.mu.Unlock()
+		return e.client
+	}
+
+	return func(network, addr string) (net.Conn, error) {
+		if tunnel := currentClient(); tunnel != nil {
+			return tunnel.Dial(network, addr)
+		}
+		return nil, fmt.Errorf("not connected")
+	}
+}
diff --git a/deploy/charts/bison/Chart.yaml b/deploy/charts/bison/Chart.yaml
index 4a36d93..e8401c2 100644
--- a/deploy/charts/bison/Chart.yaml
+++ b/deploy/charts/bison/Chart.yaml
@@ -2,8 +2,9 @@ apiVersion: v2
 name: bison
 description: Bison - GPU 资源计费平台，基于 Capsule 多租户 + OpenCost 成本追踪
 type: application
-version: 0.0.1
-appVersion: "0.0.1"
+version: 0.0.27
+appVersion: "0.0.27"
+kubeVersion: ">=1.22.0-0"
 keywords:
   - gpu
   - billing
@@ -14,6 +15,11 @@ keywords:
   - cost-management
 maintainers:
   - name: Bison Team
+annotations:
+  org.opencontainers.image.source: https://github.com/SuperMarioYL/Bison
+  org.opencontainers.image.description: "Bison Helm Chart - GPU资源计费与多租户管理平台"
+  org.opencontainers.image.documentation: https://bison.lei6393.com
+  org.opencontainers.image.usage: "helm install my-bison oci://ghcr.io/supermarioyl/charts/bison --version VERSION"
 # Dependencies are installed separately:
 # - Capsule: helm install capsule projectcapsule/capsule -n capsule-system --create-namespace
 # - OpenCost: helm install opencost opencost/opencost -n opencost --create-namespace
diff --git a/deploy/charts/bison/README.md b/deploy/charts/bison/README.md
new file mode 100644
index 0000000..49c31f2
--- /dev/null
+++ b/deploy/charts/bison/README.md
@@ -0,0 +1,99 @@
+# Bison Helm Chart
+
+Kubernetes-based GPU Resource Billing and Scheduling Platform
+
+## ⚠️ 重要提示 / Important Notice
+
+**这是一个 Helm Chart，请使用 `helm` 命令安装，而不是 `docker pull`！**
+
+**This is a Helm Chart. Use `helm` command to install, NOT `docker pull`!**
+
+## Installation
+
+**Requirements:**
+- Helm >= 3.8.0 (for OCI support)
+- Kubernetes >= 1.22
+
+### Method 1: From GHCR (Recommended)
+
+Install directly from GitHub Container Registry using OCI format:
+
+```bash
+# Install specific version
+helm install my-bison oci://ghcr.io/supermarioyl/charts/bison --version 0.0.9
+
+# Or pull first, then install
+helm pull oci://ghcr.io/supermarioyl/charts/bison --version 0.0.9
+helm install my-bison bison-0.0.9.tgz
+
+# With custom configuration
+helm install my-bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.9 \
+  --namespace bison-system \
+  --create-namespace \
+  --set dependencies.opencost.enabled=true,dependencies.opencost.apiUrl=http://opencost.opencost.svc.cluster.local:9003 \
+  --set auth.enabled=true
+```
+
+**Why GHCR OCI Format?**
+- ✅ No separate Helm repository needed
+- ✅ Unified storage with Docker images in GHCR
+- ✅ Faster installation
+- ✅ Modern Helm 3.8+ standard
+
+### Method 2: From GitHub Releases
+
+Download the chart from [GitHub Releases](https://github.com/SuperMarioYL/Bison/releases) and install locally:
+
+```bash
+# Download from release page
+wget https://github.com/SuperMarioYL/Bison/releases/download/v0.0.9/bison-0.0.9.tgz
+
+# Install
+helm install my-bison bison-0.0.9.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+## Prerequisites
+
+Before installing Bison, ensure the following dependencies are installed:
+
+1. **Capsule** - Multi-tenant management
+   ```bash
+   helm install capsule projectcapsule/capsule -n capsule-system --create-namespace
+   ```
+
+2. **OpenCost** - Cost tracking
+   ```bash
+   helm install opencost opencost/opencost -n opencost --create-namespace
+   ```
+
+3. **Prometheus** - Metrics collection
+   ```bash
+   helm install prometheus prometheus-community/kube-prometheus-stack -n monitoring --create-namespace
+   ```
+
+## Configuration
+
+See [values.yaml](./values.yaml) for all configuration options.
+
+### Basic Configuration
+
+```bash
+helm install my-bison oci://ghcr.io/supermarioyl/charts/bison \
+  --set apiServer.replicaCount=2 \
+  --set webUI.replicaCount=2
+```
+
+## Uninstall
+
+```bash
+helm uninstall my-bison -n bison-system
+```
+
+## More Information
+
+- [Project Homepage](https://bison.lei6393.com)
+- [Documentation](https://bison.lei6393.com/docs/)
+- [GitHub Repository](https://github.com/SuperMarioYL/Bison)
diff --git a/deploy/charts/bison/README_CN.md b/deploy/charts/bison/README_CN.md
new file mode 100644
index 0000000..7cc5411
--- /dev/null
+++ b/deploy/charts/bison/README_CN.md
@@ -0,0 +1,86 @@
+# Bison Helm Chart
+
+基于 Kubernetes 的 GPU 资源计费与调度平台
+
+## 安装
+
+### 从 GHCR 安装（推荐）
+
+直接从 GitHub Container Registry 使用 OCI 格式安装：
+
+```bash
+# 安装指定版本
+helm install my-bison oci://ghcr.io/supermarioyl/charts/bison --version 0.0.2
+
+# 或者先拉取，再安装
+helm pull oci://ghcr.io/supermarioyl/charts/bison --version 0.0.2
+helm install my-bison bison-0.0.2.tgz
+```
+
+**要求：**
+- Helm >= 3.8.0（支持 OCI）
+
+### 从 GitHub Releases 安装
+
+从 [GitHub Releases](https://github.com/SuperMarioYL/Bison/releases) 下载 chart 并本地安装：
+
+```bash
+# 从 release 页面下载
+wget https://github.com/SuperMarioYL/Bison/releases/download/v0.0.2/bison-0.0.2.tgz
+
+# 安装
+helm install my-bison bison-0.0.2.tgz
+```
+
+## 前置条件
+
+安装 Bison 前，请确保已安装以下依赖：
+
+1. **Capsule** - 多租户管理
+   ```bash
+   helm install capsule projectcapsule/capsule -n capsule-system --create-namespace
+   ```
+
+2. **OpenCost** - 成本追踪
+   ```bash
+   helm install opencost opencost/opencost -n opencost --create-namespace
+   ```
+
+3. **Prometheus** - 指标收集
+   ```bash
+   helm install prometheus prometheus-community/kube-prometheus-stack -n monitoring --create-namespace
+   ```
+
+## 配置
+
+所有配置选项请查看 [values.yaml](./values.yaml)。
+
+### 基础配置
+
+```bash
+helm install my-bison oci://ghcr.io/supermarioyl/charts/bison \
+  --set apiServer.replicaCount=2 \
+  --set webUI.replicaCount=2
+```
+
+### 常用配置项
+
+| 参数 | 说明 | 默认值 |
+|------|------|--------|
+| `apiServer.replicaCount` | API 服务器副本数 | `2` |
+| `webUI.replicaCount` | Web UI 副本数 | `2` |
+| `auth.enabled` | 启用认证 | `false` |
+| `dependencies.opencost.apiUrl` | OpenCost API 地址 | `http://opencost.opencost.svc.cluster.local:9003` |
+
+## 卸载
+
+```bash
+helm uninstall my-bison
+```
+
+## 更多信息
+
+- [项目主页](https://supermarioyl.github.io/Bison/)
+- [文档](https://supermarioyl.github.io/Bison/docs/)
+- [GitHub 仓库](https://github.com/SuperMarioYL/Bison)
+- [English README](./README.md)
diff --git a/deploy/charts/bison/templates/NOTES.txt b/deploy/charts/bison/templates/NOTES.txt
index 7ad6d8b..7806fe9 100644
--- a/deploy/charts/bison/templates/NOTES.txt
+++ b/deploy/charts/bison/templates/NOTES.txt
@@ -9,27 +9,21 @@ Namespace: {{ .Release.Namespace }}
 数据存储在 Kubernetes ConfigMaps 中，无需外部数据库
 
 === 访问方式 ===
-{{- if .Values.apiServer.enabled }}
-{{- if .Values.apiServer.ingress.enabled }}
-
-API Server: http://{{ .Values.apiServer.ingress.host }}/api/v1
-{{- else }}
+{{- if and .Values.webUI.enabled .Values.ingress.enabled }}
 
-API Server:
-  kubectl port-forward svc/{{ include "bison.apiServer.fullname" . }} 8080:{{ .Values.apiServer.service.port }} -n {{ .Release.Namespace }}
-  访问: http://localhost:8080/api/v1
-{{- end }}
-{{- end }}
-{{- if .Values.webUI.enabled }}
-{{- if .Values.webUI.ingress.enabled }}
-
-Web UI: http://{{ .Values.webUI.ingress.host }}
-{{- else }}
+Bison: http://{{ .Values.ingress.host }}
+  Web UI nginx 会自动代理 /api 请求到 API Server
+{{- else if .Values.webUI.enabled }}
 
 Web UI:
   kubectl port-forward svc/{{ include "bison.webUI.fullname" . }} 3000:{{ .Values.webUI.service.port }} -n {{ .Release.Namespace }}
   访问: http://localhost:3000
 {{- end }}
+{{- if .Values.apiServer.enabled }}
+
+API Server (调试):
+  kubectl port-forward svc/{{ include "bison.apiServer.fullname" . }} 8080:{{ .Values.apiServer.service.port }} -n {{ .Release.Namespace }}
+  访问: http://localhost:8080/api/v1
 {{- end }}
 
 === 认证 ===
diff --git a/deploy/charts/bison/templates/_helpers.tpl b/deploy/charts/bison/templates/_helpers.tpl
index 1247b30..553da2d 100644
--- a/deploy/charts/bison/templates/_helpers.tpl
+++ b/deploy/charts/bison/templates/_helpers.tpl
@@ -76,14 +76,12 @@ Web UI full name
 {{- end }}
 
 {{/*
-Get image registry
+Build full image reference: [global.imageRegistry/]repository:tag (registry prefix is omitted when global.imageRegistry is empty; tag defaults to appVersion)
+Usage: include "bison.image" (dict "imageConfig" .Values.apiServer.image "global" .Values.global "appVersion" .Chart.AppVersion)
 */}}
-{{- define "bison.imageRegistry" -}}
-{{- if .Values.global.imageRegistry }}
-{{- printf "%s/" .Values.global.imageRegistry }}
-{{- else }}
-{{- "" }}
-{{- end }}
+{{- define "bison.image" -}}
+{{- $ref := printf "%s:%s" .imageConfig.repository (.imageConfig.tag | default .appVersion) -}}
+{{- if .global.imageRegistry }}{{ printf "%s/%s" .global.imageRegistry $ref }}{{ else }}{{ $ref }}{{ end -}}
 {{- end }}
 
 {{/*
diff --git a/deploy/charts/bison/templates/api-server/deployment.yaml b/deploy/charts/bison/templates/api-deployment.yaml
similarity index 90%
rename from deploy/charts/bison/templates/api-server/deployment.yaml
rename to deploy/charts/bison/templates/api-deployment.yaml
index b141063..ce17f7f 100644
--- a/deploy/charts/bison/templates/api-server/deployment.yaml
+++ b/deploy/charts/bison/templates/api-deployment.yaml
@@ -8,7 +8,9 @@ metadata:
     {{- include "bison.labels" . | nindent 4 }}
     app.kubernetes.io/component: api-server
 spec:
+  {{- if not .Values.apiServer.autoscaling.enabled }}
   replicas: {{ .Values.apiServer.replicaCount }}
+  {{- end }}
   selector:
     matchLabels:
       {{- include "bison.selectorLabels" . | nindent 6 }}
@@ -30,7 +32,7 @@ spec:
         - name: api
           securityContext:
             {{- toYaml .Values.securityContext | nindent 12 }}
-          image: "{{ include "bison.imageRegistry" . }}{{ .Values.apiServer.image.repository }}:{{ .Values.apiServer.image.tag }}"
+          image: "{{ include "bison.image" (dict "imageConfig" .Values.apiServer.image "global" .Values.global "appVersion" .Chart.AppVersion) }}"
           imagePullPolicy: {{ .Values.apiServer.image.pullPolicy }}
           ports:
             - name: http
@@ -56,6 +58,9 @@ spec:
                   name: {{ if .Values.auth.jwt.existingSecret }}{{ .Values.auth.jwt.existingSecret }}{{ else }}{{ include "bison.authSecretName" . }}{{ end }}
                   key: jwt-secret
             {{- end }}
+            # Capsule integration
+            - name: CAPSULE_ENABLED
+              value: {{ .Values.dependencies.capsule.enabled | quote }}
             # OpenCost integration
             {{- if .Values.dependencies.opencost.enabled }}
             - name: OPENCOST_URL
diff --git a/deploy/charts/bison/templates/api-server/auth-secret.yaml b/deploy/charts/bison/templates/api-server/auth-secret.yaml
deleted file mode 100644
index 3bf3300..0000000
--- a/deploy/charts/bison/templates/api-server/auth-secret.yaml
+++ /dev/null
@@ -1,24 +0,0 @@
-{{- if and .Values.apiServer.enabled .Values.auth.enabled }}
-{{- if not .Values.auth.admin.existingSecret }}
-apiVersion: v1
-kind: Secret
-metadata:
-  name: {{ include "bison.fullname" . }}-auth
-  namespace: {{ .Release.Namespace }}
-  labels:
-    {{- include "bison.labels" . | nindent 4 }}
-type: Opaque
-data:
-  {{- if .Values.auth.admin.password }}
-  password: {{ .Values.auth.admin.password | b64enc | quote }}
-  {{- else }}
-  password: {{ randAlphaNum 16 | b64enc | quote }}
-  {{- end }}
-  {{- if .Values.auth.jwt.secret }}
-  jwt-secret: {{ .Values.auth.jwt.secret | b64enc | quote }}
-  {{- else }}
-  jwt-secret: {{ randAlphaNum 32 | b64enc | quote }}
-  {{- end }}
-{{- end }}
-{{- end }}
-
diff --git a/deploy/charts/bison/templates/api-server/ingress.yaml b/deploy/charts/bison/templates/api-server/ingress.yaml
deleted file mode 100644
index e979851..0000000
--- a/deploy/charts/bison/templates/api-server/ingress.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-{{- if and .Values.apiServer.enabled .Values.apiServer.ingress.enabled }}
-apiVersion: networking.k8s.io/v1
-kind: Ingress
-metadata:
-  name: {{ include "bison.apiServer.fullname" . }}
-  namespace: {{ .Release.Namespace }}
-  labels:
-    {{- include "bison.labels" . | nindent 4 }}
-    app.kubernetes.io/component: api-server
-  {{- with .Values.apiServer.ingress.annotations }}
-  annotations:
-    {{- toYaml . | nindent 4 }}
-  {{- end }}
-spec:
-  {{- if .Values.apiServer.ingress.className }}
-  ingressClassName: {{ .Values.apiServer.ingress.className }}
-  {{- end }}
-  {{- if .Values.apiServer.ingress.tls }}
-  tls:
-    {{- range .Values.apiServer.ingress.tls }}
-    - hosts:
-        {{- range .hosts }}
-        - {{ . | quote }}
-        {{- end }}
-      secretName: {{ .secretName }}
-    {{- end }}
-  {{- end }}
-  rules:
-    - host: {{ .Values.apiServer.ingress.host | quote }}
-      http:
-        paths:
-          - path: /
-            pathType: Prefix
-            backend:
-              service:
-                name: {{ include "bison.apiServer.fullname" . }}
-                port:
-                  number: {{ .Values.apiServer.service.port }}
-{{- end }}
-
diff --git a/deploy/charts/bison/templates/hpa.yaml b/deploy/charts/bison/templates/hpa.yaml
new file mode 100644
index 0000000..ed9e011
--- /dev/null
+++ b/deploy/charts/bison/templates/hpa.yaml
@@ -0,0 +1,49 @@
+{{- if and .Values.apiServer.enabled .Values.apiServer.autoscaling.enabled }}
+apiVersion: autoscaling/v2
+kind: HorizontalPodAutoscaler
+metadata:
+  name: {{ include "bison.apiServer.fullname" . }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    {{- include "bison.labels" . | nindent 4 }}
+    app.kubernetes.io/component: api-server
+spec:
+  scaleTargetRef:
+    apiVersion: apps/v1
+    kind: Deployment
+    name: {{ include "bison.apiServer.fullname" . }}
+  minReplicas: {{ .Values.apiServer.autoscaling.minReplicas }}
+  maxReplicas: {{ .Values.apiServer.autoscaling.maxReplicas }}
+  metrics:
+    - type: Resource
+      resource:
+        name: cpu
+        target:
+          type: Utilization
+          averageUtilization: {{ .Values.apiServer.autoscaling.targetCPUUtilizationPercentage }}
+{{- end }}
+{{- if and .Values.webUI.enabled .Values.webUI.autoscaling.enabled }}
+---
+apiVersion: autoscaling/v2
+kind: HorizontalPodAutoscaler
+metadata:
+  name: {{ include "bison.webUI.fullname" . }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    {{- include "bison.labels" . | nindent 4 }}
+    app.kubernetes.io/component: web-ui
+spec:
+  scaleTargetRef:
+    apiVersion: apps/v1
+    kind: Deployment
+    name: {{ include "bison.webUI.fullname" . }}
+  minReplicas: {{ .Values.webUI.autoscaling.minReplicas }}
+  maxReplicas: {{ .Values.webUI.autoscaling.maxReplicas }}
+  metrics:
+    - type: Resource
+      resource:
+        name: cpu
+        target:
+          type: Utilization
+          averageUtilization: {{ .Values.webUI.autoscaling.targetCPUUtilizationPercentage }}
+{{- end }}
diff --git a/deploy/charts/bison/templates/ingress.yaml b/deploy/charts/bison/templates/ingress.yaml
new file mode 100644
index 0000000..9184908
--- /dev/null
+++ b/deploy/charts/bison/templates/ingress.yaml
@@ -0,0 +1,34 @@
+{{- if and .Values.webUI.enabled .Values.ingress.enabled }}
+apiVersion: networking.k8s.io/v1
+kind: Ingress
+metadata:
+  name: {{ include "bison.fullname" . }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    {{- include "bison.labels" . | nindent 4 }}
+  {{- with .Values.ingress.annotations }}
+  annotations:
+    {{- toYaml . | nindent 4 }}
+  {{- end }}
+spec:
+  {{- if .Values.ingress.className }}
+  ingressClassName: {{ .Values.ingress.className }}
+  {{- end }}
+  {{- if .Values.ingress.tls.enabled }}
+  tls:
+    - hosts:
+        - {{ .Values.ingress.host | quote }}
+      secretName: {{ .Values.ingress.tls.secretName | default (printf "%s-tls" (include "bison.fullname" .)) }}
+  {{- end }}
+  rules:
+    - host: {{ .Values.ingress.host | quote }}
+      http:
+        paths:
+          - path: /
+            pathType: Prefix
+            backend:
+              service:
+                name: {{ include "bison.webUI.fullname" . }}
+                port:
+                  number: {{ .Values.webUI.service.port }}
+{{- end }}
diff --git a/deploy/charts/bison/templates/networkpolicy.yaml b/deploy/charts/bison/templates/networkpolicy.yaml
new file mode 100644
index 0000000..2aa8694
--- /dev/null
+++ b/deploy/charts/bison/templates/networkpolicy.yaml
@@ -0,0 +1,32 @@
+{{- if and .Values.apiServer.enabled .Values.networkPolicy.enabled }}
+# Rendered only when the api-server itself is enabled. Restricts api-server
+# ingress on the API port to web-ui pods and pods in the release namespace;
+# egress (K8s API, OpenCost, Prometheus) is unaffected: only Ingress is policed.
+apiVersion: networking.k8s.io/v1
+kind: NetworkPolicy
+metadata:
+  name: {{ include "bison.apiServer.fullname" . }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    {{- include "bison.labels" . | nindent 4 }}
+    app.kubernetes.io/component: api-server
+spec:
+  podSelector:
+    matchLabels:
+      {{- include "bison.selectorLabels" . | nindent 6 }}
+      app.kubernetes.io/component: api-server
+  policyTypes:
+    - Ingress
+  ingress:
+    - from:
+        - podSelector:
+            matchLabels:
+              {{- include "bison.selectorLabels" . | nindent 14 }}
+              app.kubernetes.io/component: web-ui
+        - namespaceSelector:
+            matchLabels:
+              kubernetes.io/metadata.name: {{ .Release.Namespace }}
+      ports:
+        - protocol: TCP
+          port: {{ .Values.apiServer.service.port }}
+{{- end }}
diff --git a/deploy/charts/bison/templates/pdb.yaml b/deploy/charts/bison/templates/pdb.yaml
new file mode 100644
index 0000000..16f1347
--- /dev/null
+++ b/deploy/charts/bison/templates/pdb.yaml
@@ -0,0 +1,33 @@
+{{- if and .Values.apiServer.enabled .Values.apiServer.podDisruptionBudget.enabled }}
+apiVersion: policy/v1
+kind: PodDisruptionBudget
+metadata:
+  name: {{ include "bison.apiServer.fullname" . }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    {{- include "bison.labels" . | nindent 4 }}
+    app.kubernetes.io/component: api-server
+spec:
+  minAvailable: {{ .Values.apiServer.podDisruptionBudget.minAvailable }}
+  selector:
+    matchLabels:
+      {{- include "bison.selectorLabels" . | nindent 6 }}
+      app.kubernetes.io/component: api-server
+{{- end }}
+{{- if and .Values.webUI.enabled .Values.webUI.podDisruptionBudget.enabled }}
+---
+apiVersion: policy/v1
+kind: PodDisruptionBudget
+metadata:
+  name: {{ include "bison.webUI.fullname" . }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    {{- include "bison.labels" . | nindent 4 }}
+    app.kubernetes.io/component: web-ui
+spec:
+  minAvailable: {{ .Values.webUI.podDisruptionBudget.minAvailable }}
+  selector:
+    matchLabels:
+      {{- include "bison.selectorLabels" . | nindent 6 }}
+      app.kubernetes.io/component: web-ui
+{{- end }}
diff --git a/deploy/charts/bison/templates/api-server/rbac.yaml b/deploy/charts/bison/templates/rbac.yaml
similarity index 91%
rename from deploy/charts/bison/templates/api-server/rbac.yaml
rename to deploy/charts/bison/templates/rbac.yaml
index 4a70b0e..dfe0984 100644
--- a/deploy/charts/bison/templates/api-server/rbac.yaml
+++ b/deploy/charts/bison/templates/rbac.yaml
@@ -35,6 +35,10 @@ rules:
   - apiGroups: [""]
     resources: ["nodes"]
     verbs: ["get", "list", "watch", "update", "patch"]
+  # Leader election for the singleton scheduler (coordination.k8s.io Lease)
+  - apiGroups: ["coordination.k8s.io"]
+    resources: ["leases"]
+    verbs: ["get", "create", "update"]
 ---
 apiVersion: rbac.authorization.k8s.io/v1
 kind: ClusterRoleBinding
diff --git a/deploy/charts/bison/templates/secret.yaml b/deploy/charts/bison/templates/secret.yaml
new file mode 100644
index 0000000..8ab02a8
--- /dev/null
+++ b/deploy/charts/bison/templates/secret.yaml
@@ -0,0 +1,35 @@
+{{- if and .Values.apiServer.enabled .Values.auth.enabled }}
+{{- if not .Values.auth.admin.existingSecret }}
+{{- $secretName := printf "%s-auth" (include "bison.fullname" .) -}}
+{{- /* Reuse the already-generated secret on upgrade so the JWT signing key and
+       admin password stay stable across `helm upgrade`. Otherwise every upgrade
+       would re-run randAlphaNum, rotating the JWT key (invalidating all sessions)
+       and silently changing the admin password. */ -}}
+{{- $existing := (lookup "v1" "Secret" .Release.Namespace $secretName) -}}
+{{- $existingData := dict -}}
+{{- if $existing -}}{{- $existingData = $existing.data -}}{{- end -}}
+apiVersion: v1
+kind: Secret
+metadata:
+  name: {{ $secretName }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    {{- include "bison.labels" . | nindent 4 }}
+type: Opaque
+data:
+  {{- if .Values.auth.admin.password }}
+  password: {{ .Values.auth.admin.password | b64enc | quote }}
+  {{- else if hasKey $existingData "password" }}
+  password: {{ get $existingData "password" | quote }}
+  {{- else }}
+  password: {{ randAlphaNum 16 | b64enc | quote }}
+  {{- end }}
+  {{- if .Values.auth.jwt.secret }}
+  jwt-secret: {{ .Values.auth.jwt.secret | b64enc | quote }}
+  {{- else if hasKey $existingData "jwt-secret" }}
+  jwt-secret: {{ get $existingData "jwt-secret" | quote }}
+  {{- else }}
+  jwt-secret: {{ randAlphaNum 32 | b64enc | quote }}
+  {{- end }}
+{{- end }}
+{{- end }}
diff --git a/deploy/charts/bison/templates/api-server/service.yaml b/deploy/charts/bison/templates/service.yaml
similarity index 50%
rename from deploy/charts/bison/templates/api-server/service.yaml
rename to deploy/charts/bison/templates/service.yaml
index d0c9e18..ab2bcbc 100644
--- a/deploy/charts/bison/templates/api-server/service.yaml
+++ b/deploy/charts/bison/templates/service.yaml
@@ -18,4 +18,24 @@ spec:
     {{- include "bison.selectorLabels" . | nindent 4 }}
     app.kubernetes.io/component: api-server
 {{- end }}
-
+---
+{{- if .Values.webUI.enabled }}
+apiVersion: v1
+kind: Service
+metadata:
+  name: {{ include "bison.webUI.fullname" . }}
+  namespace: {{ .Release.Namespace }}
+  labels:
+    {{- include "bison.labels" . | nindent 4 }}
+    app.kubernetes.io/component: web-ui
+spec:
+  type: {{ .Values.webUI.service.type }}
+  ports:
+    - port: {{ .Values.webUI.service.port }}
+      targetPort: http
+      protocol: TCP
+      name: http
+  selector:
+    {{- include "bison.selectorLabels" . | nindent 4 }}
+    app.kubernetes.io/component: web-ui
+{{- end }}
diff --git a/deploy/charts/bison/templates/web-ui/deployment.yaml b/deploy/charts/bison/templates/web-deployment.yaml
similarity index 90%
rename from deploy/charts/bison/templates/web-ui/deployment.yaml
rename to deploy/charts/bison/templates/web-deployment.yaml
index a637f65..55829cb 100644
--- a/deploy/charts/bison/templates/web-ui/deployment.yaml
+++ b/deploy/charts/bison/templates/web-deployment.yaml
@@ -8,7 +8,9 @@ metadata:
     {{- include "bison.labels" . | nindent 4 }}
     app.kubernetes.io/component: web-ui
 spec:
+  {{- if not .Values.webUI.autoscaling.enabled }}
   replicas: {{ .Values.webUI.replicaCount }}
+  {{- end }}
   selector:
     matchLabels:
       {{- include "bison.selectorLabels" . | nindent 6 }}
@@ -29,7 +31,7 @@ spec:
         - name: web
           securityContext:
             {{- toYaml .Values.securityContext | nindent 12 }}
-          image: "{{ include "bison.imageRegistry" . }}{{ .Values.webUI.image.repository }}:{{ .Values.webUI.image.tag }}"
+          image: "{{ include "bison.image" (dict "imageConfig" .Values.webUI.image "global" .Values.global "appVersion" .Chart.AppVersion) }}"
           imagePullPolicy: {{ .Values.webUI.image.pullPolicy }}
           ports:
             - name: http
@@ -65,4 +67,3 @@ spec:
         {{- toYaml . | nindent 8 }}
       {{- end }}
 {{- end }}
-
diff --git a/deploy/charts/bison/templates/web-ui/ingress.yaml b/deploy/charts/bison/templates/web-ui/ingress.yaml
deleted file mode 100644
index 00c86e6..0000000
--- a/deploy/charts/bison/templates/web-ui/ingress.yaml
+++ /dev/null
@@ -1,40 +0,0 @@
-{{- if and .Values.webUI.enabled .Values.webUI.ingress.enabled }}
-apiVersion: networking.k8s.io/v1
-kind: Ingress
-metadata:
-  name: {{ include "bison.webUI.fullname" . }}
-  namespace: {{ .Release.Namespace }}
-  labels:
-    {{- include "bison.labels" . | nindent 4 }}
-    app.kubernetes.io/component: web-ui
-  {{- with .Values.webUI.ingress.annotations }}
-  annotations:
-    {{- toYaml . | nindent 4 }}
-  {{- end }}
-spec:
-  {{- if .Values.webUI.ingress.className }}
-  ingressClassName: {{ .Values.webUI.ingress.className }}
-  {{- end }}
-  {{- if .Values.webUI.ingress.tls }}
-  tls:
-    {{- range .Values.webUI.ingress.tls }}
-    - hosts:
-        {{- range .hosts }}
-        - {{ . | quote }}
-        {{- end }}
-      secretName: {{ .secretName }}
-    {{- end }}
-  {{- end }}
-  rules:
-    - host: {{ .Values.webUI.ingress.host | quote }}
-      http:
-        paths:
-          - path: /
-            pathType: Prefix
-            backend:
-              service:
-                name: {{ include "bison.webUI.fullname" . }}
-                port:
-                  number: {{ .Values.webUI.service.port }}
-{{- end }}
-
diff --git a/deploy/charts/bison/templates/web-ui/service.yaml b/deploy/charts/bison/templates/web-ui/service.yaml
deleted file mode 100644
index 905e3b6..0000000
--- a/deploy/charts/bison/templates/web-ui/service.yaml
+++ /dev/null
@@ -1,21 +0,0 @@
-{{- if .Values.webUI.enabled }}
-apiVersion: v1
-kind: Service
-metadata:
-  name: {{ include "bison.webUI.fullname" . }}
-  namespace: {{ .Release.Namespace }}
-  labels:
-    {{- include "bison.labels" . | nindent 4 }}
-    app.kubernetes.io/component: web-ui
-spec:
-  type: {{ .Values.webUI.service.type }}
-  ports:
-    - port: {{ .Values.webUI.service.port }}
-      targetPort: http
-      protocol: TCP
-      name: http
-  selector:
-    {{- include "bison.selectorLabels" . | nindent 4 }}
-    app.kubernetes.io/component: web-ui
-{{- end }}
-
diff --git a/deploy/charts/bison/values.schema.json b/deploy/charts/bison/values.schema.json
new file mode 100644
index 0000000..80420eb
--- /dev/null
+++ b/deploy/charts/bison/values.schema.json
@@ -0,0 +1,133 @@
+{
+  "$schema": "https://json-schema.org/draft-07/schema#",
+  "title": "Bison Helm values",
+  "type": "object",
+  "properties": {
+    "global": {
+      "type": "object",
+      "properties": {
+        "imageRegistry": { "type": "string" },
+        "imagePullSecrets": { "type": "array" }
+      }
+    },
+    "auth": {
+      "type": "object",
+      "properties": {
+        "enabled": { "type": "boolean" },
+        "admin": {
+          "type": "object",
+          "properties": {
+            "username": { "type": "string" },
+            "password": { "type": "string" },
+            "existingSecret": { "type": "string" }
+          }
+        },
+        "jwt": {
+          "type": "object",
+          "properties": {
+            "secret": { "type": "string" },
+            "existingSecret": { "type": "string" }
+          }
+        }
+      }
+    },
+    "dependencies": {
+      "type": "object",
+      "properties": {
+        "capsule": {
+          "type": "object",
+          "properties": { "enabled": { "type": "boolean" } }
+        },
+        "opencost": {
+          "type": "object",
+          "properties": {
+            "enabled": { "type": "boolean" },
+            "apiUrl": { "type": "string" }
+          }
+        },
+        "prometheus": {
+          "type": "object",
+          "properties": {
+            "enabled": { "type": "boolean" },
+            "url": { "type": "string" }
+          }
+        }
+      }
+    },
+    "apiServer": { "$ref": "#/$defs/component" },
+    "webUI": { "$ref": "#/$defs/component" },
+    "ingress": {
+      "type": "object",
+      "properties": {
+        "enabled": { "type": "boolean" },
+        "className": { "type": "string" },
+        "annotations": { "type": "object" },
+        "host": { "type": "string" },
+        "tls": {
+          "type": "object",
+          "properties": {
+            "enabled": { "type": "boolean" },
+            "secretName": { "type": "string" }
+          }
+        }
+      }
+    },
+    "serviceAccount": {
+      "type": "object",
+      "properties": {
+        "create": { "type": "boolean" },
+        "annotations": { "type": "object" },
+        "name": { "type": "string" }
+      }
+    },
+    "podSecurityContext": { "type": "object" },
+    "securityContext": { "type": "object" },
+    "networkPolicy": {
+      "type": "object",
+      "properties": { "enabled": { "type": "boolean" } }
+    }
+  },
+  "$defs": {
+    "component": {
+      "type": "object",
+      "properties": {
+        "enabled": { "type": "boolean" },
+        "replicaCount": { "type": "integer", "minimum": 0 },
+        "image": {
+          "type": "object",
+          "properties": {
+            "repository": { "type": "string" },
+            "tag": { "type": "string" },
+            "pullPolicy": { "type": "string" }
+          }
+        },
+        "service": {
+          "type": "object",
+          "properties": {
+            "type": { "type": "string" },
+            "port": { "type": "integer" }
+          }
+        },
+        "resources": { "type": "object" },
+        "nodeSelector": { "type": "object" },
+        "tolerations": { "type": "array" },
+        "affinity": { "type": "object" },
+        "autoscaling": {
+          "type": "object",
+          "properties": {
+            "enabled": { "type": "boolean" },
+            "minReplicas": { "type": "integer", "minimum": 1 },
+            "maxReplicas": { "type": "integer", "minimum": 1 },
+            "targetCPUUtilizationPercentage": { "type": "integer", "minimum": 1, "maximum": 100 }
+          }
+        },
+        "podDisruptionBudget": {
+          "type": "object",
+          "properties": {
+            "enabled": { "type": "boolean" }
+          }
+        }
+      }
+    }
+  }
+}
diff --git a/deploy/charts/bison/values.yaml b/deploy/charts/bison/values.yaml
index 1546f16..84f81ca 100644
--- a/deploy/charts/bison/values.yaml
+++ b/deploy/charts/bison/values.yaml
@@ -2,19 +2,19 @@
 
 # Global configuration
 global:
-  imageRegistry: ""
+  imageRegistry: "ghcr.io/supermarioyl"
   imagePullSecrets: []
 
 # Authentication configuration
 auth:
-  enabled: false                       # Enable login authentication
+  enabled: false # Enable login authentication
   admin:
-    username: admin                   # Admin username
-    password: ""                      # Admin password (not recommended, use existingSecret)
-    existingSecret: ""                # Secret containing 'password' key
+    username: admin # Admin username
+    password: "" # Admin password (not recommended, use existingSecret)
+    existingSecret: "" # Secret containing 'password' key
   jwt:
-    secret: ""                        # JWT signing secret (auto-generated if empty)
-    existingSecret: ""                # Secret containing 'jwt-secret' key
+    secret: "" # JWT signing secret (auto-generated if empty)
+    existingSecret: "" # Secret containing 'jwt-secret' key
 
 # External dependencies
 # Note: Capsule and OpenCost must be installed separately before deploying Bison
@@ -23,16 +23,16 @@ dependencies:
   capsule:
     # Capsule must be installed separately
     # helm install capsule projectcapsule/capsule -n capsule-system --create-namespace
-    enabled: true
-  
+    enabled: false
+
   # OpenCost configuration
   opencost:
     # OpenCost must be installed separately
     # helm install opencost opencost/opencost -n opencost --create-namespace
-    enabled: true
+    enabled: false
     # OpenCost API URL (internal service URL) - use port 9003 for API, NOT 9090 (UI)
     apiUrl: "http://opencost.opencost.svc.cluster.local:9003"
-  
+
   # Prometheus configuration (for node metrics, required by OpenCost)
   prometheus:
     enabled: true
@@ -42,20 +42,19 @@ dependencies:
 # API Server configuration
 apiServer:
   enabled: true
+  # The api-server runs the billing/auto-recharge/alert scheduler. Multiple
+  # replicas are safe: the scheduler is guarded by Kubernetes lease-based leader
+  # election (LEADER_ELECTION_ENABLED, on by default) so it runs on exactly one
+  # replica at a time. Set LEADER_ELECTION_ENABLED=false only for single-replica
+  # or local development.
   replicaCount: 2
   image:
-    repository: ghcr.io/supermarioyl/bison/api-server
-    tag: 0.0.1
+    repository: bison/api-server
+    tag: "" # Defaults to Chart.AppVersion if empty
     pullPolicy: IfNotPresent
   service:
     type: ClusterIP
     port: 8080
-  ingress:
-    enabled: true
-    className: ""
-    annotations: {}
-    host: bison-api.example.com
-    tls: []
   resources:
     limits:
       cpu: 1000m
@@ -66,24 +65,28 @@ apiServer:
   nodeSelector: {}
   tolerations: []
   affinity: {}
+  # Optional autoscaling. When enabled, replicaCount is ignored (HPA owns replicas).
+  autoscaling:
+    enabled: false
+    minReplicas: 2
+    maxReplicas: 5
+    targetCPUUtilizationPercentage: 80
+  # Optional PodDisruptionBudget to keep at least one replica during voluntary disruptions.
+  podDisruptionBudget:
+    enabled: false
+    minAvailable: 1
 
 # Web UI configuration
 webUI:
-  enabled: false
+  enabled: true
   replicaCount: 2
   image:
-    repository: ghcr.io/supermarioyl/bison/web-ui
-    tag: 0.0.1
+    repository: bison/web-ui
+    tag: "" # Defaults to Chart.AppVersion if empty
     pullPolicy: IfNotPresent
   service:
     type: ClusterIP
     port: 80
-  ingress:
-    enabled: true
-    className: ""
-    annotations: {}
-    host: bison.example.com
-    tls: []
   resources:
     limits:
       cpu: 500m
@@ -94,6 +97,30 @@ webUI:
   nodeSelector: {}
   tolerations: []
   affinity: {}
+  autoscaling:
+    enabled: false
+    minReplicas: 2
+    maxReplicas: 5
+    targetCPUUtilizationPercentage: 80
+  podDisruptionBudget:
+    enabled: false
+    minAvailable: 1
+
+# Optional NetworkPolicy restricting ingress to the api-server (off by default).
+# When enabled, the api-server only accepts traffic from web-ui pods and the
+# release namespace. Review before enabling to ensure it fits your CNI/topology.
+networkPolicy:
+  enabled: false
+
+# Ingress (unified entry point, web-ui nginx proxies /api to api-server)
+ingress:
+  enabled: true
+  className: ""
+  annotations: {}
+  host: bison.example.com
+  tls:
+    enabled: false
+    secretName: "" # If empty, auto-generated as <release>-tls
 
 # Service account
 serviceAccount:
diff --git a/docs/README_CN.md b/docs/README_CN.md
index 154539c..72a8013 100644
--- a/docs/README_CN.md
+++ b/docs/README_CN.md
@@ -237,10 +237,38 @@ helm install opencost opencost/opencost -n opencost --create-namespace \
 
 ### 2. 部署 Bison
 
+#### 方式 A: 使用 GHCR (推荐 - OCI 格式)
+
+```bash
+# 直接从 GitHub Container Registry 安装
+helm install bison oci://ghcr.io/supermarioyl/charts/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set auth.enabled=true \
+  --version 0.0.2
+```
+
+> **注意:** 需要 Helm >= 3.8.0 以支持 OCI
+
+#### 方式 B: 从 GitHub Release
+
+```bash
+# 从 GitHub Release 下载 Helm chart
+wget https://github.com/SuperMarioYL/Bison/releases/download/v0.0.2/bison-0.0.2.tgz
+
+# 从下载的 chart 安装
+helm install bison bison-0.0.2.tgz \
+  --namespace bison-system \
+  --create-namespace \
+  --set auth.enabled=true
+```
+
+#### 方式 C: 从源码
+
 ```bash
 # 克隆并部署
-git clone https://github.com/your-org/bison.git
-cd bison
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
 
 helm install bison ./deploy/charts/bison \
   --namespace bison-system \
diff --git a/docs/optimization-roadmap.md b/docs/optimization-roadmap.md
new file mode 100644
index 0000000..ae8c631
--- /dev/null
+++ b/docs/optimization-roadmap.md
@@ -0,0 +1,226 @@
+# Bison 持续优化路线图
+
+> 基于一次覆盖后端、前端、官网、文档、DevOps、测试的综合优化审计整理（多 agent 并行审计 + 对抗式验证，共 89 条发现）。
+> 生成时间：2026-06-19 · 审计基线版本 **0.0.11**（`deploy/charts/bison/Chart.yaml`、`web-ui/package.json`、`website/versions.json` 一致；唯一例外是 UI 页脚仍硬编码 `v3.0.0`，本次迭代已修复）。
+
+## 概览
+
+本路线图把 89 条已验证发现归并为 **9 个主题**，按「影响 / 工作量」排序为「快赢 → 战略」两档。整体判断：
+
+- **最危险的是一簇资金正确性 + 并发缺陷**：余额/计费状态存放在共享 ConfigMap 中，read-modify-write 无 ResourceVersion 冲突重试（`api-server/internal/k8s/client.go` 的 `UpdateConfigMap` 为裸 `Update`，全仓无 `RetryOnConflict`），而调度器在 `replicaCount: 2`（`deploy/charts/bison/values.yaml`）下**无 leader election**，每个副本独立跑小时计费/自动充值/告警 —— 客户被按副本数重复扣费、并发充值丢更新。这两条必须最先处理。
+- **一组纯文档错误以极低成本拦住所有新用户**：OCI chart 路径写成 `oci://ghcr.io/supermarioyl/bison/bison`，而 CI 实际推送到 `oci://ghcr.io/supermarioyl/charts/bison`；健康检查文档指向不存在的 `/api/v1/health`（实际 `/healthz`）；版本停留 0.0.2/0.0.1；OpenCost 命名空间在 chart 默认（`opencost`）与官网（`opencost-system`）间不一致。
+- **官网正在迭代**：emoji 图标、缺失能力展示、缺失截图、版本错印、homepage i18n、社交卡尺寸、SEO 收尾，已抽成独立的「本次迭代清单」。
+- **测试是 0**：后端 0 个 `*_test.go`，前端仅 `1+1==2`，CI 测试任务空跑报绿，所有金额逻辑无回归安全网。
+
+---
+
+## 已落地版本（v0.0.12 → v0.0.26，按「每个功能一个小版本」迭代）
+
+| 版本 | 主题 | 内容 |
+|---|---|---|
+| 0.0.12 | 资金/前端/官网/文档 | ConfigMap 余额 RMW 加 `RetryOnConflict`；`Deduct` 返回写后余额；前端路由 lazy + echarts 分包 + ErrorBoundary；官网去 emoji 换 SVG + ProductShowcase；安装文档纠错；本路线图 |
+| 0.0.13 | 资金/并发 | 调度器 **leader election**（Lease），恢复 `replicaCount: 2`，scheduler 可重启 + 测试 |
+| 0.0.14 | 安全 | Helm Secret `lookup` 持久化，升级不再轮换 JWT/密码 |
+| 0.0.15 | 安全 | 登录 per-IP 限流 + `crypto/subtle` 常量时间比较 + 测试 |
+| 0.0.16 | 安全 | `CORS_ALLOWED_ORIGINS` 可配置 allowlist |
+| 0.0.17 | 资金 | `lastBilledAt` 时间戳门控，修计费窗口/Interval 不一致 + 防重启重扣 + 测试 |
+| 0.0.18 | 资金 | `CalculateDailyConsumption` 分母改实际跨度，修 ~6x 烧钱速率低估 + 测试 |
+| 0.0.19 | 性能 | 删 `ListTeams` 丢弃用量循环；`loadPrices` 每次计费读一次配置 |
+| 0.0.20 | 性能 | OpenCost 查询 30s TTL + 并发合并缓存 + race 测试 |
+| 0.0.21 | DevOps | release 加 **Test & Lint Gate**（vet/fmt/build/test -race + web）；修 `tslib` 幽灵依赖 |
+| 0.0.22 | 安全 | auth 开启时启动拒绝默认 JWT/密码 + 测试 |
+| 0.0.23 | 前端质量 | 13 处错误提取统一为 `getApiErrorMessage` |
+| 0.0.24 | 前端性能 | Auth/Theme Context value `useMemo` |
+| 0.0.25 | DevOps | `values.schema.json` 类型校验 + `kubeVersion >=1.22` |
+| 0.0.26 | DevOps | 可选 PDB / HPA / NetworkPolicy 模板 |
+
+> 已覆盖 P0 资金正确性与并发、安全基线、开箱即用/CI 门禁、热点性能、chart 健壮性与可用性等全部近期项与多数中期项。
+
+### 仍待办（多需活集群验证或产品决策，建议后续单独排期）
+
+- **后端规模化**：SharedInformer/lister 缓存热点 List、列表分页、per-request 与调度器超时、报表单次聚合查询、`GetCostTrend` 按桶日期映射、suspend/resume 二次缩容修复。
+- **前端**：NodeDetail echarts option `useMemo`、逐行 N+1 query 分页门、硬编码色→主题 token、`formatCurrency`/`currencySymbol`、dayjs 统一 bootstrap、i18n 层。
+- **安全/供应链**：RBAC 去 `clusterrolebindings` 写、onboarding SSH 入参校验、镜像 Trivy 扫描/SBOM/cosign 签名、基础镜像 digest 固定、Dependabot。
+- **架构/平台化（远期）**：余额持久化模型升级（ConfigMap → per-key patch / CRD）、money 整数最小单位、能力补全或下线（OIDC/Email/Excel-PDF）。
+
+---
+
+## 优化主题
+
+### 主题 1 · 资金正确性与并发安全
+
+| 问题 | 影响 | 建议 | 优先级 | 工作量 |
+|---|---|---|---|---|
+| 调度器在每个副本无 leader election（`scheduler.go` 裸 ticker，`replicaCount:2`） | 按副本数重复扣费/重复自动充值/重复告警 —— 资金错误 | 立即将 `values.yaml` replicaCount 设 1 止血；用 `client-go` leaderelection Lease 根治，或拆成单副本 Deployment/CronJob | P0 | M（止血 S） |
+| 余额 ConfigMap read-modify-write 无冲突重试（`balance_service.go`、`k8s/client.go`） | 并发充值与计费扣费丢更新，余额静默腐蚀，无审计差额 | `Recharge/Deduct/addRechargeRecord/SetOverdueAt` 包入 `retry.RetryOnConflict`，循环内重读重算重写 | P0 | M |
+| ProcessBilling 扣费后独立再读余额做停机判断，且丢弃错误（`billing_service.go` `balance, _ := ...GetBalance`） | 基于陈旧/竞态值错误停机：deployment/statefulset 缩 0、删孤儿 pod | 让 `Deduct` 返回写后余额供判断；停止吞错；与上条乐观锁配合 | P0 | M |
+| 计费窗口由 `config.Interval` 决定但 ticker 硬编码 1h（`scheduler.go` vs `billing_service.go`） | Interval≠1 时每小时按 Interval 小时扣费，严重超收 | ticker 周期由 Interval 驱动，或固定查 1h 窗口；加校验；记录 last-billed 时间戳防重启重扣 | P1 | S |
+| `CalculateDailyConsumption` 分母取最近 100 条任意类型记录的最旧时间（`balance_service.go`） | 烧钱速率被低估约 6x，欠费预计时间高估 | 分母改为窗口内 deduction 记录的实际跨度（≤7 天 + 下限） | P1 | S |
+| suspend/resume 依赖 `original-replicas` 注解，二次缩容丢副本数（`billing_service.go`） | 恢复后工作负载回到 0 副本 | suspend 前查 `team.Suspended` 只缩一次；per-object Update 包 RetryOnConflict | P2 | M |
+| `GetCostTrend` 按位置索引映射 OpenCost 日桶（`opencost/client.go`） | 成本错位到错误日期或被静默置 0 | 按每桶 `Window.Start` 解析日期建趋势 | P2 | M |
+
+### 主题 2 · 安全加固
+
+| 问题 | 影响 | 建议 | 优先级 | 工作量 |
+|---|---|---|---|---|
+| 鉴权默认关闭 + admin/admin + 硬编码 JWT 密钥（`config.go`） | 财务+集群控制面开箱即用零鉴权；token 可伪造 | 默认开启鉴权；启动时拒绝内置默认密钥/密码；无密钥时随机生成 | P0 | S |
+| `helm upgrade` 每次 `randAlphaNum` 重生成密码与 JWT（`secret.yaml`） | 每次升级踢出所有用户、admin 密码静默改变 | 用 `lookup` 复用已存在 Secret，仅首装生成；可加 `resource-policy: keep` | P0 | S |
+| 登录无限流、明文非常量时间比较（`auth.go`） | admin 密码可全速暴力破解 | per-IP 限流 + 退避；`crypto/subtle.ConstantTimeCompare` | P1 | S |
+| CORS `Allow-Origin: *` 且允许 Authorization 头（`main.go`） | 任意站点可发起带凭证跨域请求 | 收紧为可配置 allowlist（Bison UI origin） | P2 | S |
+| Onboarding/控制面 SSH 配置零校验（`onboarding.go`） | 配合鉴权关闭可在节点/控制面跑攻击者命令 | 校验 host/user 非空、host allowlist/CIDR、端口范围、脚本约束；限管理员可达 | P1 | M |
+| API ClusterRole 过权：clusterrolebindings 写、node patch、namespace 增删（`rbac.yaml`） | api-server 被攻破≈集群管理员提权 | 去掉 clusterrolebindings 写（除非必需），node 写与最宽 verb 用 values 开关收口，拆 ClusterRole + per-ns Role | P2 | M |
+
+### 主题 3 · 后端性能与 K8s/OpenCost 访问模式
+
+| 问题 | 影响 | 建议 | 优先级 | 工作量 |
+|---|---|---|---|---|
+| client-go 默认 5 QPS 无 informer 缓存（`k8s/client.go`） | 请求在客户端限流后串行，延迟随集群规模线性增长 | 设 `config.QPS=50`/`Burst=100`；为 namespaces/pods/nodes/tenants 引入 SharedInformerFactory + lister | P1 | L |
+| OpenCost 查询无缓存，仪表盘多端点重复查同窗口（`opencost/client.go`、`stats.go`） | 并发用户成倍放大 OpenCost 负载，仪表盘慢 | 加 30-60s TTL 缓存（按 window+aggregate+filter）+ singleflight 合并并发 | P1 | M |
+| `TenantService.List` 每团队按 namespace 逐个列 pod（`tenant_service.go`） | `/teams`、`/stats/overview`、`/stats/quota-alerts` 每次 O(团队×ns×pod) | 单次集群级 ListPods 后内存分桶；或 `?usage=true` 让用量按需 | P1 | M |
+| `ListTeams` 逐团队算 OpenCost 用量后丢弃（`team.go` `_ = usage`） | 纯浪费的 N 次 OpenCost+tenant 扫描 | 删除该循环，或单次 `GetTeamUsage` 合并入响应 | P1 | S |
+| 计费 nsToTeam 逐团队 `ListByTeam` 且吞错（`billing_service.go`） | 列举失败的团队被静默不计费 | 单次 `ListTenants` 用 status.namespaces 构图；记录而非吞错 | P1 | S |
+| `calculateCost` 每行重读资源配置（`billing_service.go`） | 每个 allocation 一次 ConfigMap 读 | 每次计费操作读一次配置，预建价格表传入 | P1 | S |
+| Summary/团队账单每 namespace 一次 OpenCost 查询（`report_service.go`、`billing_service.go`） | T×P 次串行 HTTP，报表生成随项目数变慢 | 一次 `GetAllocationByNamespace(window)` 建 ns→allocation 映射后内存聚合 | P2 | M |
+| 列表无分页（`team.go`/`project.go`/`user.go`） | 大部署返回大而慢的载荷且无法分页 | 仿 `audit.go` 加 page/pageSize + total | P2 | M |
+| 无 per-request/调度器超时（`main.go`、`k8s/client.go`） | K8s/OpenCost 卡住时 goroutine 与连接泄漏 | 中间件包 `context.WithTimeout`(20-25s)；设 `rest.Config.Timeout`；调度每轮加超时 | P2 | M |
+| 调度器 goroutine 无 panic 恢复/无首跑/无 jitter（`scheduler.go`） | 一次 panic 拖垮整进程；多副本同刻齐发踩踏 | 每任务 defer/recover + 随机 jitter + 启动后首跑 | P1 | S |
+
+### 主题 4 · 前端性能与健壮性
+
+| 问题 | 影响 | 建议 | 优先级 | 工作量 |
+|---|---|---|---|---|
+| 无路由级代码分割，echarts 全量进主包（`App.tsx`、`NodeDetail.tsx`、`vite.config.ts`） | 所有会话首屏都下载只 NodeDetail 用的 ~1MB echarts | 路由 `React.lazy`+`Suspense`；`build.rollupOptions.output.manualChunks` 拆 react/antd/echarts | P1 | M |
+| 无 ErrorBoundary，query 读错误未处理 | 渲染异常白屏；读失败页面静默空白/无重试 | 顶层 ErrorBoundary 包 `<Routes>`；共享 `isError/error`→Alert/Result+refetch | P1 | M |
+| `@ant-design/pro-components` 声明却零引用（2.7MB） | 拖慢安装、有误入包风险 | 从 `package.json` 移除并更新 CLAUDE.md 表述 | P1 | S |
+| ProjectList/TeamList 逐行 N+1 query 无分页门（`ProjectList.tsx`、`TeamList.tsx`） | 50 项目=100 次后端调用/页 | 用分页切片驱动 useQueries，或批量后端端点，至少加 `enabled` | P2 | M |
+| Auth/Theme context value 每次渲染新对象（`AuthContext.tsx`、`ThemeContext.tsx`、`main.tsx`） | 所有消费者及整套 antd 主题级联重渲染 | provider value 用 useMemo；`main.tsx` theme token useMemo([isDark]) | P2 | S |
+| NodeDetail 每次渲染重建 8+ echarts option（`NodeDetail.tsx`，无 useMemo） | 隐藏 tab 也计算时序 map | 各 option useMemo 按 metric 切片；可 `destroyInactiveTabPane` | P2 | M |
+| Dashboard 6 路轮询冗余、全局 staleTime 30s 偏激进 | 后台稳定网络负载 | `refetchIntervalInBackground:false`；合并低频概览轮询；分级 staleTime | P3 | S |
+| Dashboard 列定义/渲染闭包每次（含轮询）重建（`Dashboard/index.tsx`） | 每次轮询全表重渲染 | 列数组 useMemo、helper useCallback | P3 | S |
+
+### 主题 5 · 前端质量、可访问性与一致性
+
+| 问题 | 影响 | 建议 | 优先级 | 工作量 |
+|---|---|---|---|---|
+| 错误提取串复制 13 处、无 utils 目录 | 后端错误信封一变需改 13 处 | 加 `src/utils/error.ts` 的 `getApiErrorMessage(err, fallback)` | P2 | S |
+| `error:any` 12 处破坏 strict 模式 | 在处理不可信响应的路径上失去类型安全 | 改 `unknown`/`AxiosError<{error?:string}>`；eslint 禁 explicit-any | P2 | S |
+| 硬编码十六进制色不随暗色主题（`Dashboard`、`ResourceQuotaInput`、`NodeDetail` echarts） | 暗色下 `#999` 文本/弱阴影/图表轴对比度差 | 用 `theme.useToken()` 或 `var(--*)`；echarts 读 `isDark` 派生轴/文本色 | P2 | M |
+| `<a onClick>` 无 href 共 10 处 | 非 tab 可达、无法 Enter/Space、不能新开 | 用 react-router `<Link>` 或 `Typography.Link` | P2 | S |
+| Dashboard 硬编码 `$` 而非 `currencySymbol` | CNY/¥ 部署仪表盘显示 $ | 取 billingConfig + 抽 `formatCurrency(value,symbol)` | P2 | S |
+| dayjs 插件/locale 每文件重复 bootstrap（3 文件） | 第四个页面易漏配 | 在 `main.tsx`/`lib/dayjs.ts` 统一一次 | P3 | S |
+| 残留 `console.log`（`ResourceConfig.tsx`） | 生产控制台泄漏内部数据形状 | 删除；加 eslint `no-console`（留 warn/error） | P3 | S |
+| 无 i18n 层，UI 文案全内联中文 | 无法本地化/集中措辞 | 若需多语引 react-i18next；否则至少集中重复标签/toast 前缀 | P3 | L |
+
+### 主题 6 · 文档与安装链路正确性
+
+| 问题 | 影响 | 建议 | 优先级 | 工作量 |
+|---|---|---|---|---|
+| OCI chart 路径错误 `bison/bison`（应 `charts/bison`） | 主推荐安装命令 not found 全失败 | 全量替换为 `oci://ghcr.io/supermarioyl/charts/bison`；加 CI grep 校验与 release.yml 一致 | P0 | S |
+| 健康检查文档 `/api/v1/health` 不存在（实际 `/healthz`/`/readyz`） | 首装验证步骤返回 404，误判安装失败 | 改 `curl .../healthz` | P1 | S |
+| 版本停留 0.0.2/镜像 0.0.1（实际 0.0.11） | 装到陈旧版本、示例内部不一致 | 改用 VERSION 变量/最新版；release 工作流模板化注入防漂移 | P1 | S |
+| intro.md Option A 用 github.io helm repo（CI 从不发布该 index） | 第一个安装方法即失败 | 重写为 OCI；清理别名命令 | P0 | S |
+| values 键名虚构：`opencost.url`/`apiServer.replicas`/`auth.oidc`/`clusterName` | `--set` 静默 no-op：OpenCost 错指、计费无数据 | 改正键名；移除/标 roadmap 的 oidc 与 clusterName；加 helm template 校验 CI | P0 | M |
+| OpenCost 命名空间不一致：chart 默认 `opencost` vs 官网 `opencost-system` | 默认 URL 触不到文档安装位置，计费显示 0 | 统一为 chart 默认 `opencost` | P1 | S |
+| features.md 夸大未实现能力（OIDC/Email/Excel-PDF/插件） | 卖点接触即失败、生支持工单 | 标 planned 或移除，对齐 README 真实清单 | P1 | M |
+| 配置默认虚构（`BILLING_INTERVAL=10m`、`auth.admin.password=admin`） | 运维误以为 10m 节奏与默认密码 | 删/实现该 env；密码默认改空/自动生成；逐列对照 values.yaml | P2 | S |
+| CHANGELOG 停在 0.0.1、installation.md 对象名错（`bison-api-server`/`bison-webui`，实际 `bison-api`/`bison-web`）、孤儿 `docs/architecture.html` | 误导与维护腐烂 | 回填 0.0.6-0.0.11；改正对象名；删 html 或入构建 | P2 | S-M |
+
+### 主题 7 · 官网本次迭代
+
+详见下方独立「网站本次迭代清单」章节。
+
+### 主题 8 · DevOps / 发布管线 / 部署可用性
+
+| 问题 | 影响 | 建议 | 优先级 | 工作量 |
+|---|---|---|---|---|
+| release 工作流无测试/lint 门（`release.yml`，仅 helm lint） | 破损代码可被打成正式 Release | 加 gating job 跑 `go test -race`/`vet`/`npm lint`/`npm test`（`workflow_call` 复用），build-and-push `needs:` 它 | P0 | S |
+| web-ui nginx envsubst 失效 + 只读根 FS 会 CrashLoop（`nginx.conf`、`values.yaml`、`web-deployment.yaml`） | 默认生产配置下 Web UI 无法启动/连后端 | 改 `nginx-unprivileged`/listen 8080 + `pid /tmp` + emptyDir 挂载；`${API_BASE_URL}` 走 templates | P0 | M |
+| helm upgrade 轮换密钥（见主题 2，列此联动） | 升级即登出全员 | `lookup` 复用 Secret | P0 | S |
+| Dockerfile/CI 删 package-lock 再 install（`web-ui/Dockerfile`、`build-test.yml`） | 构建不可复现、缓存失效 | 修根因后全用 `npm ci` | P2 | S |
+| 镜像无扫描/SBOM/签名（`release.yml` 已声明 id-token 却未接） | 漏洞基础层流向用户、无法验真 | build-push 加 `provenance/sbom`，cosign 无密钥签名，PR 跑非阻断 Trivy | P2 | M |
+| 缺 PDB/HPA/NetworkPolicy（replicaCount:2） | 同时驱逐两副本致停机 | 加可选 PDB(minAvailable:1)/HPA/NetworkPolicy，values 开关 | P2 | M |
+| 基础镜像未按 digest 固定，alpine:3.19 近 EOL | OS 层不可复现、积累 CVE | 按 `@sha256:` 固定并升 alpine；Renovate/Dependabot 维护；api-server 考虑 distroless | P2 | S |
+| GitHub Actions 用 `latest`/浮动 major | CI 行为非确定、供应链风险 | helm 固定具体版本、actions 钉 SHA；启 github-actions Dependabot | P3 | S |
+| Chart 无 kubeVersion 与 values.schema.json | 不支持集群晚失败、values 拼写静默忽略 | 加 `kubeVersion:'>=1.22.0-0'` 与 values.schema.json；`helm lint --strict` | P3 | S |
+| api-server Dockerfile `COPY . .` 无 .dockerignore | 构建上下文大、禁用 Go 缓存 | 加 .dockerignore；去 `-a -installsuffix cgo`；BuildKit cache mount | P3 | S |
+
+### 主题 9 · 测试覆盖
+
+| 问题 | 影响 | 建议 | 优先级 | 工作量 |
+|---|---|---|---|---|
+| 后端 0 个 `*_test.go`，所有金额逻辑无测试 | 符号/边界/重构错误可静默错账上线 | 表驱动单测 + fake clientset，优先 `calculateCost`/`Recharge`/`Deduct`/`isGracePeriodExpired`/`CalculateDailyConsumption` | P0 | L（首批 M） |
+| CI 测试任务 vacuous 通过报绿 0% 覆盖（`build-test.yml`） | 对评审制造虚假信心 | 加最低覆盖门；检测关键包零测试文件即失败 | P0 | S |
+| 并发扣费/充值无 `-race` 测试 | 丢更新竞态不可捕获 | N 并发 Recharge/Deduct 对 fake clientset 断言终值==操作和 | P1 | M |
+| 计费 deduct+复读 分支、grace/suspend 单位逻辑无测试 | 错阈值/单位错停付费租户工作负载 | 覆盖正余额/grace 内/过 grace(hours&days)/恢复 四分支 | P1 | M |
+| recharge 校验仅在 handler binding，`SetAutoRechargeConfig` 无正值检查 | 负自动充值额每 tick 静默扣费 | 加正值检查 + 边界/NaN 测试 | P1 | S |
+| 前端仅占位测试，BillingConfig/api.ts/recharge 0% | money-facing UI 无输入校验/格式/错误保护 | 删 example.test 换真测试 + vitest 覆盖门 | P2 | L |
+
+---
+
+## Top 优先级
+
+> 排序原则：先「低工作量、止血资金/安全/可用性」的快赢，再「打基础」的战略项。
+
+**快赢档（P0，可立即排期）**
+
+1. **调度器 leader election（先 replicaCount=1 止血）** —— 消除按副本数重复扣费。止血 S，根治 M。
+2. **ConfigMap 余额包 `RetryOnConflict` + 乐观并发** —— 杜绝余额丢更新/腐蚀，是金额准确性的地基。M。
+3. **修正安装文档致命错误**（OCI `charts/bison`、`/healthz`、版本 0.0.11、OpenCost 命名空间/键名）。S。
+4. **鉴权安全基线**（默认开启 + 拒绝默认密钥/密码 + helm `lookup` 持久化 Secret + 登录限流 + CORS 收紧）。S。
+5. **修复 web-ui 部署可用性**（nginx envsubst + 只读根 FS → unprivileged/8080 + emptyDir）。M。
+6. **release 工作流加测试/lint 门 + CI 覆盖门**。S。
+7. **官网本次迭代快赢三连**（修 `v3.0.0` 版本号 → emoji 改 Tabler SVG → 社交卡 1200x630）。S-M。
+
+**战略档（P1，打基础）**
+
+8. **首批后端单元测试**（`calculateCost` 最高价值，叠加 `Recharge`/`Deduct`/计费分支）。M。
+9. **前端 `React.lazy` + Vite `manualChunks` 拆 echarts，并加顶层 ErrorBoundary**。M。
+10. **K8s client QPS/Burst + 热点 List informer 缓存 + OpenCost 短 TTL+singleflight 缓存**。L。
+
+---
+
+## 网站本次迭代清单
+
+> 官网（Docusaurus，`website/`，线上 `bison.lei6393.com`）。第 1 项是第 7 项截图的前置条件。✅ = 本次迭代已落地。
+
+1. ✅ **修正版本号（前置项）**：`web-ui/src/layouts/BasicLayout.tsx` 硬编码的 `v3.0.0` 改为从 `package.json` 经 Vite `define`（`__APP_VERSION__`）注入。
+2. ✅ **emoji 图标改 Tabler 内联 SVG**：`HomepageFeatures` 的 🔐💰📊🚀⚡🎯 改为 `Icons/` 内联 SVG（shield-lock / currency-dollar / dashboard / rocket / bolt / shield-check），`stroke=currentColor` 适配暗色。
+3. ✅ **UseCases / hero emoji 替换**：🤖🏢💵 与 ❌/✅/→ 改内联 SVG；hero 按钮去 🚀/⭐。
+4. ✅ **Homepage i18n**：6 张 feature 卡 + showcase 标签包 `<Translate>` 并补 `i18n/zh-Hans/code.json` 中文。
+5. ✅ **补内联 SVG 图表/示意图**：新增 `ProductShowcase` 组件（资源总览/集群节点/报表中心/计费配置 四屏全矢量渲染），呼应「多用 SVG 图栏展示功能」。
+6. **刷新陈旧内容**：在 `features.md` 与 `HomepageFeatures` 增补已发布但缺失的能力——「集群与节点管理」「自动化节点 Onboarding」；校正 features.md 夸大项。
+7. **补缺失截图**：本次以矢量 `ProductShowcase` 替代（无可用集群拍摄真实截图）；待有环境后补 Reports/Audit/Cluster/Project/Settings/Login 真实截图。
+8. **修正官网安装文档**：`installation.md`/`intro.md` 的 OCI 路径、OpenCost 命名空间、values 键名、对象名、版本号。
+9. **社交 / OG 卡**：换 1200×630，`docusaurus.config.ts` 补 `twitter:card=summary_large_image` 与 `og:image:width/height`。
+10. **SEO 收尾**：确认 google/baidu 验证标签、robots.txt、sitemap 完整；清理默认脚手架（blog 样例、plushie banner、boilerplate README）。
+11. **ParticleBackground 可访问性**：加 `prefers-reduced-motion` 短路与离屏暂停 rAF。
+
+---
+
+## 后续持续优化方向
+
+### 近期（本季度，止血与开箱即用）
+
+- **资金正确性收口**：完成 leader election + ConfigMap 乐观并发 + `Deduct` 返回写后余额 + 计费窗口/Interval 校验 + `CalculateDailyConsumption` 分母修复，让一笔钱在任何并发与重启下都不丢、不重复、不基于陈旧值停机。
+- **安全基线**：鉴权默认开启 + 启动拒绝默认密钥 + helm Secret 持久化 + 登录限流 + CORS allowlist。
+- **开箱即用**：修复 web-ui nginx/只读根 FS CrashLoop；全量修正安装文档（OCI 路径、healthz、版本、values 键名、OpenCost 命名空间）。
+- **CI 门禁**：release 工作流接测试/lint 门 + 最低覆盖门，并补首批后端金额单测（`calculateCost`/`Recharge`/`Deduct`/计费分支 + `-race` 并发测试）。
+- **官网本次迭代**：执行上方 11 项清单。
+- **快赢清理**：删 `@ant-design/pro-components`、去 `ListTeams` 丢弃用量循环、计费 `calculateCost` 配置改读一次。
+
+### 中期（规模化与体验）
+
+- **后端规模化**：K8s client QPS/Burst + SharedInformer/lister 缓存热点 List；OpenCost 短 TTL + singleflight 缓存；计费/Summary 改单次 `GetAllocationByNamespace` 聚合；列表加分页；per-request 与调度器超时；调度器 panic 恢复 + jitter。
+- **前端体验**：路由 lazy + manualChunks；顶层 ErrorBoundary + 共享 query 错误 UI；逐行 N+1 query 分页门/批量端点；Context value 与 Dashboard 列/闭包 memo 化；NodeDetail echarts option useMemo；轮询节流。
+- **前端一致性**：`getApiErrorMessage` 工具 + `error: unknown` + eslint 禁 any；硬编码色改主题 token（含 echarts 暗色）；`<a onClick>` 改 `<Link>`；`formatCurrency` + 统一 `currencySymbol`；dayjs 统一 bootstrap；去 console.log。
+- **DevOps 供应链**：镜像扫描(Trivy)/SBOM/cosign 签名；npm ci 复现构建；基础镜像 digest 固定 + alpine 升级；PDB/HPA/NetworkPolicy；Chart kubeVersion + values.schema.json。
+- **文档治理**：CHANGELOG 回填并在 release 强制每 tag 有条目；features.md 与代码对齐；删孤儿 architecture.html；配置默认逐列对照 values.yaml。
+- **测试纵深**：补 `ProcessBilling` 分支、suspend/resume、grace 单位、自动充值正值校验测试；前端 api 拦截器/BillingConfig/recharge 表单测试 + vitest 覆盖门。
+
+### 远期（架构与平台化）
+
+- **持久化模型升级**：评估将余额/计费历史从单一共享 ConfigMap 迁移到 per-team key + patch 语义，或引入轻量嵌入式存储/CRD，从根上消除 read-modify-write 竞态与单对象写放大；money 字段考虑整数最小单位避免 float64 精度问题。
+- **RBAC 最小权限**：拆分 ClusterRole + per-namespace Role，去除 clusterrolebindings 写，node 写按 values 开关。
+- **可观测性与多副本水平扩展**：在 leader election + informer 缓存到位后，让 API 真正多副本水平扩展，配 HPA/PDB/NetworkPolicy 与请求级 metrics/trace。
+- **i18n 平台化**：若多语言成为目标，引入 react-i18next 与 zh-CN 目录，逐步替换内联文案。
+- **能力补全或下线**：对 features.md 中标为 planned 的 OIDC/SSO、Email/SMTP 告警、Excel/PDF 导出、插件化计费规则，按路线图实现或正式从对外材料移除，保持「文档=能力」。
diff --git a/scripts/make-ghcr-public.md b/scripts/make-ghcr-public.md
new file mode 100644
index 0000000..7b71804
--- /dev/null
+++ b/scripts/make-ghcr-public.md
@@ -0,0 +1,89 @@
+# 将 GHCR Package 设为公开
+
+如果你无法通过 OCI 路径拉取 Helm chart（报错 `Error: invalid_reference: invalid repository` 或 `403 Forbidden`），这通常是因为 GitHub Container Registry 的包默认是私有的。
+
+## 手动设置 Package 为 Public
+
+1. **访问 GitHub Packages**:
+   - 进入 https://github.com/SuperMarioYL?tab=packages
+   - 或者直接访问仓库首页，点击右侧的 "Packages"
+
+2. **找到 charts/bison package**:
+   - 如果存在，点击进入 `charts/bison` package
+
+3. **修改可见性**:
+   - 点击 **Package settings** (右上角齿轮图标)
+   - 滚动到底部找到 **Danger Zone**
+   - 点击 **Change visibility**
+   - 选择 **Public**
+   - 确认更改
+
+## 如果找不到 charts/bison Package
+
+说明 Helm chart 推送到 GHCR 失败了。检查步骤:
+
+1. **检查 GitHub Actions 运行日志**:
+   ```
+   https://github.com/SuperMarioYL/Bison/actions
+   ```
+   - 找到最近的 "Release" workflow run (v0.0.7)
+   - 查看 "Publish to Helm Repository (GHCR)" job 的日志
+   - 检查是否有错误信息
+
+2. **常见失败原因**:
+   - 权限不足 (GITHUB_TOKEN 没有 `packages: write` 权限)
+   - OCI 路径错误
+   - Helm 登录失败
+
+## 临时解决方案
+
+在 GHCR OCI 路径修复之前，使用 GitHub Releases:
+
+```bash
+# 列出所有可用版本
+curl -s https://api.github.com/repos/SuperMarioYL/Bison/releases | grep tag_name
+
+# 下载特定版本
+VERSION=0.0.7
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# 安装
+helm install my-bison bison-${VERSION}.tgz
+
+# 或者创建本地 Helm 仓库
+mkdir -p ~/helm-charts
+cp bison-*.tgz ~/helm-charts/
+helm repo index ~/helm-charts/
+helm repo add local-bison ~/helm-charts/
+helm install my-bison local-bison/bison --version ${VERSION}
+```
+
+## 验证 Package 是否存在于 GHCR
+
+```bash
+# 使用 GitHub API 检查
+curl -H "Authorization: token YOUR_GITHUB_TOKEN" \
+  https://api.github.com/users/SuperMarioYL/packages/container/charts%2Fbison/versions
+
+# 或者尝试拉取（如果是公开的）
+helm pull oci://ghcr.io/supermarioyl/charts/bison --version 0.0.7
+```
+
+## 检查是否需要认证
+
+即使设置为 public，某些情况下可能仍需要认证:
+
+```bash
+# 登录 GHCR
+echo YOUR_GITHUB_TOKEN | helm registry login ghcr.io -u SuperMarioYL --password-stdin
+
+# 然后拉取
+helm pull oci://ghcr.io/supermarioyl/charts/bison --version 0.0.7
+```
+
+## 下一步
+
+1. 先检查 v0.0.7 的 GitHub Actions workflow 日志
+2. 确认 Helm chart 推送步骤是否成功
+3. 如果推送成功，设置 package 为 public
+4. 如果推送失败，发布新版本 v0.0.8 来测试修复后的配置
diff --git a/web-ui/.dockerignore b/web-ui/.dockerignore
new file mode 100644
index 0000000..e619916
--- /dev/null
+++ b/web-ui/.dockerignore
@@ -0,0 +1,9 @@
+# Keep the Docker build context small and reproducible.
+node_modules
+dist
+coverage
+.git
+.gitignore
+.dockerignore
+Dockerfile
+npm-debug.log*
diff --git a/web-ui/Dockerfile b/web-ui/Dockerfile
index abbfa53..5c9668c 100644
--- a/web-ui/Dockerfile
+++ b/web-ui/Dockerfile
@@ -7,7 +7,8 @@ WORKDIR /app
 COPY package*.json ./
 
 # Install dependencies
-RUN npm ci
+# Remove package-lock.json and use npm install to ensure optional deps are installed correctly
+RUN rm -f package-lock.json && npm install
 
 # Copy source code
 COPY . .
diff --git a/web-ui/package-lock.json b/web-ui/package-lock.json
index 89696a0..4571970 100644
--- a/web-ui/package-lock.json
+++ b/web-ui/package-lock.json
@@ -1,15 +1,14 @@
 {
   "name": "bison-web-ui",
-  "version": "0.0.1",
+  "version": "0.0.20",
   "lockfileVersion": 3,
   "requires": true,
   "packages": {
     "": {
       "name": "bison-web-ui",
-      "version": "0.0.1",
+      "version": "0.0.20",
       "dependencies": {
         "@ant-design/icons": "^5.2.6",
-        "@ant-design/pro-components": "^2.6.43",
         "@tanstack/react-query": "^5.17.0",
         "antd": "^5.12.8",
         "axios": "^1.6.5",
@@ -18,7 +17,8 @@
         "echarts-for-react": "^3.0.2",
         "react": "^18.2.0",
         "react-dom": "^18.2.0",
-        "react-router-dom": "^6.21.1"
+        "react-router-dom": "^6.21.1",
+        "tslib": "^2.6.0"
       },
       "devDependencies": {
         "@testing-library/jest-dom": "^6.9.1",
@@ -143,267 +143,6 @@
       "version": "4.4.2",
       "license": "MIT"
     },
-    "node_modules/@ant-design/pro-card": {
-      "version": "2.10.0",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/cssinjs": "^1.21.1",
-        "@ant-design/icons": "^5.0.0",
-        "@ant-design/pro-provider": "2.16.2",
-        "@ant-design/pro-utils": "2.18.0",
-        "@babel/runtime": "^7.18.0",
-        "classnames": "^2.3.2",
-        "rc-resize-observer": "^1.0.0",
-        "rc-util": "^5.4.0"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "react": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-components": {
-      "version": "2.8.10",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/pro-card": "2.10.0",
-        "@ant-design/pro-descriptions": "2.6.10",
-        "@ant-design/pro-field": "3.1.0",
-        "@ant-design/pro-form": "2.32.0",
-        "@ant-design/pro-layout": "7.22.7",
-        "@ant-design/pro-list": "2.6.10",
-        "@ant-design/pro-provider": "2.16.2",
-        "@ant-design/pro-skeleton": "2.2.1",
-        "@ant-design/pro-table": "3.21.0",
-        "@ant-design/pro-utils": "2.18.0",
-        "@babel/runtime": "^7.16.3"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "react": ">=17.0.0",
-        "react-dom": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-descriptions": {
-      "version": "2.6.10",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/pro-field": "3.1.0",
-        "@ant-design/pro-form": "2.32.0",
-        "@ant-design/pro-provider": "2.16.2",
-        "@ant-design/pro-skeleton": "2.2.1",
-        "@ant-design/pro-utils": "2.18.0",
-        "@babel/runtime": "^7.18.0",
-        "rc-resize-observer": "^0.2.3",
-        "rc-util": "^5.0.6"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "react": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-descriptions/node_modules/rc-resize-observer": {
-      "version": "0.2.6",
-      "license": "MIT",
-      "dependencies": {
-        "@babel/runtime": "^7.10.1",
-        "classnames": "^2.2.1",
-        "rc-util": "^5.0.0",
-        "resize-observer-polyfill": "^1.5.1"
-      },
-      "peerDependencies": {
-        "react": ">=16.9.0",
-        "react-dom": ">=16.9.0"
-      }
-    },
-    "node_modules/@ant-design/pro-field": {
-      "version": "3.1.0",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/icons": "^5.0.0",
-        "@ant-design/pro-provider": "2.16.2",
-        "@ant-design/pro-utils": "2.18.0",
-        "@babel/runtime": "^7.18.0",
-        "@chenshuai2144/sketch-color": "^1.0.8",
-        "classnames": "^2.3.2",
-        "dayjs": "^1.11.10",
-        "lodash": "^4.17.21",
-        "lodash-es": "^4.17.21",
-        "rc-util": "^5.4.0",
-        "swr": "^2.0.0"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "react": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-form": {
-      "version": "2.32.0",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/icons": "^5.0.0",
-        "@ant-design/pro-field": "3.1.0",
-        "@ant-design/pro-provider": "2.16.2",
-        "@ant-design/pro-utils": "2.18.0",
-        "@babel/runtime": "^7.18.0",
-        "@chenshuai2144/sketch-color": "^1.0.7",
-        "@umijs/use-params": "^1.0.9",
-        "classnames": "^2.3.2",
-        "dayjs": "^1.11.10",
-        "lodash": "^4.17.21",
-        "lodash-es": "^4.17.21",
-        "rc-resize-observer": "^1.1.0",
-        "rc-util": "^5.0.6"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "rc-field-form": ">=1.22.0",
-        "react": ">=17.0.0",
-        "react-dom": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-layout": {
-      "version": "7.22.7",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/cssinjs": "^1.21.1",
-        "@ant-design/icons": "^5.0.0",
-        "@ant-design/pro-provider": "2.16.2",
-        "@ant-design/pro-utils": "2.18.0",
-        "@babel/runtime": "^7.18.0",
-        "@umijs/route-utils": "^4.0.0",
-        "@umijs/use-params": "^1.0.9",
-        "classnames": "^2.3.2",
-        "lodash": "^4.17.21",
-        "lodash-es": "^4.17.21",
-        "path-to-regexp": "8.2.0",
-        "rc-resize-observer": "^1.1.0",
-        "rc-util": "^5.0.6",
-        "swr": "^2.0.0",
-        "warning": "^4.0.3"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "react": ">=17.0.0",
-        "react-dom": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-list": {
-      "version": "2.6.10",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/cssinjs": "^1.21.1",
-        "@ant-design/icons": "^5.0.0",
-        "@ant-design/pro-card": "2.10.0",
-        "@ant-design/pro-field": "3.1.0",
-        "@ant-design/pro-table": "3.21.0",
-        "@ant-design/pro-utils": "2.18.0",
-        "@babel/runtime": "^7.18.0",
-        "classnames": "^2.3.2",
-        "dayjs": "^1.11.10",
-        "rc-resize-observer": "^1.0.0",
-        "rc-util": "^4.19.0"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "react": ">=17.0.0",
-        "react-dom": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-list/node_modules/rc-util": {
-      "version": "4.21.1",
-      "license": "MIT",
-      "dependencies": {
-        "add-dom-event-listener": "^1.1.0",
-        "prop-types": "^15.5.10",
-        "react-is": "^16.12.0",
-        "react-lifecycles-compat": "^3.0.4",
-        "shallowequal": "^1.1.0"
-      }
-    },
-    "node_modules/@ant-design/pro-list/node_modules/react-is": {
-      "version": "16.13.1",
-      "license": "MIT"
-    },
-    "node_modules/@ant-design/pro-provider": {
-      "version": "2.16.2",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/cssinjs": "^1.21.1",
-        "@babel/runtime": "^7.18.0",
-        "@ctrl/tinycolor": "^3.4.0",
-        "dayjs": "^1.11.10",
-        "rc-util": "^5.0.1",
-        "swr": "^2.0.0"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "react": ">=17.0.0",
-        "react-dom": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-skeleton": {
-      "version": "2.2.1",
-      "license": "MIT",
-      "dependencies": {
-        "@babel/runtime": "^7.18.0"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "react": ">=17.0.0",
-        "react-dom": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-table": {
-      "version": "3.21.0",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/cssinjs": "^1.21.1",
-        "@ant-design/icons": "^5.0.0",
-        "@ant-design/pro-card": "2.10.0",
-        "@ant-design/pro-field": "3.1.0",
-        "@ant-design/pro-form": "2.32.0",
-        "@ant-design/pro-provider": "2.16.2",
-        "@ant-design/pro-utils": "2.18.0",
-        "@babel/runtime": "^7.18.0",
-        "@dnd-kit/core": "^6.0.8",
-        "@dnd-kit/modifiers": "^6.0.1",
-        "@dnd-kit/sortable": "^7.0.2",
-        "@dnd-kit/utilities": "^3.2.1",
-        "classnames": "^2.3.2",
-        "dayjs": "^1.11.10",
-        "lodash": "^4.17.21",
-        "lodash-es": "^4.17.21",
-        "rc-resize-observer": "^1.0.0",
-        "rc-util": "^5.0.1"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "rc-field-form": ">=1.22.0",
-        "react": ">=17.0.0",
-        "react-dom": ">=17.0.0"
-      }
-    },
-    "node_modules/@ant-design/pro-utils": {
-      "version": "2.18.0",
-      "license": "MIT",
-      "dependencies": {
-        "@ant-design/icons": "^5.0.0",
-        "@ant-design/pro-provider": "2.16.2",
-        "@babel/runtime": "^7.18.0",
-        "classnames": "^2.3.2",
-        "dayjs": "^1.11.10",
-        "lodash": "^4.17.21",
-        "lodash-es": "^4.17.21",
-        "rc-util": "^5.0.6",
-        "safe-stable-stringify": "^2.4.3",
-        "swr": "^2.0.0"
-      },
-      "peerDependencies": {
-        "antd": "^4.24.15 || ^5.11.2",
-        "react": ">=17.0.0",
-        "react-dom": ">=17.0.0"
-      }
-    },
     "node_modules/@ant-design/react-slick": {
       "version": "1.1.2",
       "license": "MIT",
@@ -750,17 +489,6 @@
         "node": ">=18"
       }
     },
-    "node_modules/@chenshuai2144/sketch-color": {
-      "version": "1.0.9",
-      "license": "MIT",
-      "dependencies": {
-        "reactcss": "^1.2.3",
-        "tinycolor2": "^1.4.2"
-      },
-      "peerDependencies": {
-        "react": ">=16.12.0"
-      }
-    },
     "node_modules/@csstools/color-helpers": {
       "version": "5.1.0",
       "resolved": "https://registry.npmjs.org/@csstools/color-helpers/-/color-helpers-5.1.0.tgz",
@@ -896,70 +624,6 @@
         "node": ">=18"
       }
     },
-    "node_modules/@ctrl/tinycolor": {
-      "version": "3.6.1",
-      "license": "MIT",
-      "engines": {
-        "node": ">=10"
-      }
-    },
-    "node_modules/@dnd-kit/accessibility": {
-      "version": "3.1.1",
-      "license": "MIT",
-      "dependencies": {
-        "tslib": "^2.0.0"
-      },
-      "peerDependencies": {
-        "react": ">=16.8.0"
-      }
-    },
-    "node_modules/@dnd-kit/core": {
-      "version": "6.3.1",
-      "license": "MIT",
-      "dependencies": {
-        "@dnd-kit/accessibility": "^3.1.1",
-        "@dnd-kit/utilities": "^3.2.2",
-        "tslib": "^2.0.0"
-      },
-      "peerDependencies": {
-        "react": ">=16.8.0",
-        "react-dom": ">=16.8.0"
-      }
-    },
-    "node_modules/@dnd-kit/modifiers": {
-      "version": "6.0.1",
-      "license": "MIT",
-      "dependencies": {
-        "@dnd-kit/utilities": "^3.2.1",
-        "tslib": "^2.0.0"
-      },
-      "peerDependencies": {
-        "@dnd-kit/core": "^6.0.6",
-        "react": ">=16.8.0"
-      }
-    },
-    "node_modules/@dnd-kit/sortable": {
-      "version": "7.0.2",
-      "license": "MIT",
-      "dependencies": {
-        "@dnd-kit/utilities": "^3.2.0",
-        "tslib": "^2.0.0"
-      },
-      "peerDependencies": {
-        "@dnd-kit/core": "^6.0.7",
-        "react": ">=16.8.0"
-      }
-    },
-    "node_modules/@dnd-kit/utilities": {
-      "version": "3.2.2",
-      "license": "MIT",
-      "dependencies": {
-        "tslib": "^2.0.0"
-      },
-      "peerDependencies": {
-        "react": ">=16.8.0"
-      }
-    },
     "node_modules/@emotion/hash": {
       "version": "0.8.0",
       "license": "MIT"
@@ -1802,17 +1466,6 @@
         "url": "https://opencollective.com/typescript-eslint"
       }
     },
-    "node_modules/@umijs/route-utils": {
-      "version": "4.0.3",
-      "license": "MIT"
-    },
-    "node_modules/@umijs/use-params": {
-      "version": "1.0.9",
-      "license": "MIT",
-      "peerDependencies": {
-        "react": "*"
-      }
-    },
     "node_modules/@ungap/structured-clone": {
       "version": "1.3.0",
       "dev": true,
@@ -2027,13 +1680,6 @@
         "acorn": "^6.0.0 || ^7.0.0 || ^8.0.0"
       }
     },
-    "node_modules/add-dom-event-listener": {
-      "version": "1.1.0",
-      "license": "MIT",
-      "dependencies": {
-        "object-assign": "4.x"
-      }
-    },
     "node_modules/agent-base": {
       "version": "7.1.4",
       "resolved": "https://registry.npmjs.org/agent-base/-/agent-base-7.1.4.tgz",
@@ -2671,6 +2317,7 @@
     },
     "node_modules/dequal": {
       "version": "2.0.3",
+      "dev": true,
       "license": "MIT",
       "engines": {
         "node": ">=6"
@@ -3869,14 +3516,6 @@
         "url": "https://github.com/sponsors/sindresorhus"
       }
     },
-    "node_modules/lodash": {
-      "version": "4.17.21",
-      "license": "MIT"
-    },
-    "node_modules/lodash-es": {
-      "version": "4.17.22",
-      "license": "MIT"
-    },
     "node_modules/lodash.merge": {
       "version": "4.6.2",
       "dev": true,
@@ -4103,6 +3742,7 @@
     },
     "node_modules/object-assign": {
       "version": "4.1.1",
+      "dev": true,
       "license": "MIT",
       "engines": {
         "node": ">=0.10.0"
@@ -4252,13 +3892,6 @@
       "dev": true,
       "license": "ISC"
     },
-    "node_modules/path-to-regexp": {
-      "version": "8.2.0",
-      "license": "MIT",
-      "engines": {
-        "node": ">=16"
-      }
-    },
     "node_modules/path-type": {
       "version": "4.0.0",
       "dev": true,
@@ -4511,19 +4144,6 @@
       "license": "MIT",
       "peer": true
     },
-    "node_modules/prop-types": {
-      "version": "15.8.1",
-      "license": "MIT",
-      "dependencies": {
-        "loose-envify": "^1.4.0",
-        "object-assign": "^4.1.1",
-        "react-is": "^16.13.1"
-      }
-    },
-    "node_modules/prop-types/node_modules/react-is": {
-      "version": "16.13.1",
-      "license": "MIT"
-    },
     "node_modules/proxy-from-env": {
       "version": "1.1.0",
       "license": "MIT"
@@ -5118,10 +4738,6 @@
       "version": "18.3.1",
       "license": "MIT"
     },
-    "node_modules/react-lifecycles-compat": {
-      "version": "3.0.4",
-      "license": "MIT"
-    },
     "node_modules/react-refresh": {
       "version": "0.17.0",
       "dev": true,
@@ -5158,13 +4774,6 @@
         "react-dom": ">=16.8"
       }
     },
-    "node_modules/reactcss": {
-      "version": "1.2.3",
-      "license": "MIT",
-      "dependencies": {
-        "lodash": "^4.0.1"
-      }
-    },
     "node_modules/read-cache": {
       "version": "1.0.0",
       "dev": true,
@@ -5331,13 +4940,6 @@
         "queue-microtask": "^1.2.2"
       }
     },
-    "node_modules/safe-stable-stringify": {
-      "version": "2.5.0",
-      "license": "MIT",
-      "engines": {
-        "node": ">=10"
-      }
-    },
     "node_modules/safer-buffer": {
       "version": "2.1.2",
       "resolved": "https://registry.npmjs.org/safer-buffer/-/safer-buffer-2.1.2.tgz",
@@ -5383,10 +4985,6 @@
         "node": ">=10"
       }
     },
-    "node_modules/shallowequal": {
-      "version": "1.1.0",
-      "license": "MIT"
-    },
     "node_modules/shebang-command": {
       "version": "2.0.0",
       "dev": true,
@@ -5665,17 +5263,6 @@
         "url": "https://github.com/sponsors/ljharb"
       }
     },
-    "node_modules/swr": {
-      "version": "2.3.8",
-      "license": "MIT",
-      "dependencies": {
-        "dequal": "^2.0.3",
-        "use-sync-external-store": "^1.6.0"
-      },
-      "peerDependencies": {
-        "react": "^16.11.0 || ^17.0.0 || ^18.0.0 || ^19.0.0"
-      }
-    },
     "node_modules/symbol-tree": {
       "version": "3.2.4",
       "resolved": "https://registry.npmjs.org/symbol-tree/-/symbol-tree-3.2.4.tgz",
@@ -5809,10 +5396,6 @@
       "dev": true,
       "license": "MIT"
     },
-    "node_modules/tinycolor2": {
-      "version": "1.6.0",
-      "license": "MIT"
-    },
     "node_modules/tinyexec": {
       "version": "0.3.2",
       "resolved": "https://registry.npmjs.org/tinyexec/-/tinyexec-0.3.2.tgz",
@@ -5981,6 +5564,8 @@
     },
     "node_modules/tslib": {
       "version": "2.8.1",
+      "resolved": "https://registry.npmjs.org/tslib/-/tslib-2.8.1.tgz",
+      "integrity": "sha512-oJFu94HQb+KVduSUQL7wnpmqnfmLsOA/nAh6b6EH0wCEoK0/mPeXU6c3wKDV83MkOuHPRHtSXKKU99IBazS/2w==",
       "license": "0BSD"
     },
     "node_modules/type-check": {
@@ -6054,13 +5639,6 @@
         "punycode": "^2.1.0"
       }
     },
-    "node_modules/use-sync-external-store": {
-      "version": "1.6.0",
-      "license": "MIT",
-      "peerDependencies": {
-        "react": "^16.8.0 || ^17.0.0 || ^18.0.0 || ^19.0.0"
-      }
-    },
     "node_modules/util-deprecate": {
       "version": "1.0.2",
       "dev": true,
@@ -6246,13 +5824,6 @@
         "node": ">=18"
       }
     },
-    "node_modules/warning": {
-      "version": "4.0.3",
-      "license": "MIT",
-      "dependencies": {
-        "loose-envify": "^1.0.0"
-      }
-    },
     "node_modules/webidl-conversions": {
       "version": "8.0.0",
       "resolved": "https://registry.npmjs.org/webidl-conversions/-/webidl-conversions-8.0.0.tgz",
diff --git a/web-ui/package.json b/web-ui/package.json
index 1d4bdd1..54483e1 100644
--- a/web-ui/package.json
+++ b/web-ui/package.json
@@ -1,6 +1,6 @@
 {
   "name": "bison-web-ui",
-  "version": "0.0.1",
+  "version": "0.0.27",
   "private": true,
   "scripts": {
     "dev": "vite",
@@ -13,7 +13,6 @@
   },
   "dependencies": {
     "@ant-design/icons": "^5.2.6",
-    "@ant-design/pro-components": "^2.6.43",
     "@tanstack/react-query": "^5.17.0",
     "antd": "^5.12.8",
     "axios": "^1.6.5",
@@ -22,7 +21,8 @@
     "echarts-for-react": "^3.0.2",
     "react": "^18.2.0",
     "react-dom": "^18.2.0",
-    "react-router-dom": "^6.21.1"
+    "react-router-dom": "^6.21.1",
+    "tslib": "^2.6.0"
   },
   "devDependencies": {
     "@testing-library/jest-dom": "^6.9.1",
diff --git a/web-ui/src/App.tsx b/web-ui/src/App.tsx
index 1c4d22c..cead6fc 100644
--- a/web-ui/src/App.tsx
+++ b/web-ui/src/App.tsx
@@ -1,49 +1,70 @@
-import React from 'react';
+import React, { Suspense, lazy } from 'react';
 import { Routes, Route, Navigate } from 'react-router-dom';
+import { Spin } from 'antd';
 import BasicLayout from './layouts/BasicLayout';
-import Login from './pages/Login';
-import Dashboard from './pages/Dashboard';
-import ProjectList from './pages/Project/ProjectList';
-import ProjectCreate from './pages/Project/ProjectCreate';
-import ProjectDetail from './pages/Project/ProjectDetail';
-import ClusterNodes from './pages/Cluster/ClusterNodes';
-import NodeDetail from './pages/Cluster/NodeDetail';
-import TeamList from './pages/Team/TeamList';
-import TeamCreate from './pages/Team/TeamCreate';
-import TeamDetail from './pages/Team/TeamDetail';
-import UserList from './pages/User/UserList';
-import UserDetail from './pages/User/UserDetail';
-import AuditList from './pages/Audit/AuditList';
-import ReportCenter from './pages/Report/ReportCenter';
-import Settings from './pages/Settings';
 import ProtectedRoute from './components/ProtectedRoute';
+import { useFeatures } from './hooks/useFeatures';
+
+// Route-level code splitting: each page (and its heavy deps such as echarts on
+// the node-detail page) is only downloaded when first visited.
+const Login = lazy(() => import('./pages/Login'));
+const Dashboard = lazy(() => import('./pages/Dashboard'));
+const ProjectList = lazy(() => import('./pages/Project/ProjectList'));
+const ProjectCreate = lazy(() => import('./pages/Project/ProjectCreate'));
+const ProjectDetail = lazy(() => import('./pages/Project/ProjectDetail'));
+const ClusterNodes = lazy(() => import('./pages/Cluster/ClusterNodes'));
+const NodeDetail = lazy(() => import('./pages/Cluster/NodeDetail'));
+const TeamList = lazy(() => import('./pages/Team/TeamList'));
+const TeamCreate = lazy(() => import('./pages/Team/TeamCreate'));
+const TeamDetail = lazy(() => import('./pages/Team/TeamDetail'));
+const UserList = lazy(() => import('./pages/User/UserList'));
+const UserDetail = lazy(() => import('./pages/User/UserDetail'));
+const AuditList = lazy(() => import('./pages/Audit/AuditList'));
+const ReportCenter = lazy(() => import('./pages/Report/ReportCenter'));
+const Settings = lazy(() => import('./pages/Settings'));
+
+// Centered spinner rendered by <Suspense> while a lazily loaded page chunk is fetched.
+const PageFallback: React.FC = () => {
+  const box: React.CSSProperties = { display: 'flex', justifyContent: 'center', alignItems: 'center', minHeight: '40vh' };
+  return <div style={box}><Spin size="large" /></div>;
+};
 
 const App: React.FC = () => {
+  // While the flags are still loading (features undefined) every route stays registered.
+  const { data: features } = useFeatures();
   return (
-    <Routes>
-      <Route path="/login" element={<Login />} />
-      <Route path="/" element={
-        <ProtectedRoute>
-          <BasicLayout />
-        </ProtectedRoute>
-      }>
-        <Route index element={<Navigate to="/dashboard" replace />} />
-        <Route path="dashboard" element={<Dashboard />} />
-        <Route path="teams" element={<TeamList />} />
-        <Route path="teams/create" element={<TeamCreate />} />
-        <Route path="teams/:name" element={<TeamDetail />} />
-        <Route path="projects" element={<ProjectList />} />
-        <Route path="projects/create" element={<ProjectCreate />} />
-        <Route path="projects/:name" element={<ProjectDetail />} />
-        <Route path="users" element={<UserList />} />
-        <Route path="users/:email" element={<UserDetail />} />
-        <Route path="cluster/nodes" element={<ClusterNodes />} />
-        <Route path="cluster/nodes/:name" element={<NodeDetail />} />
-        <Route path="reports" element={<ReportCenter />} />
-        <Route path="audit" element={<AuditList />} />
-        <Route path="settings/*" element={<Settings />} />
-      </Route>
-    </Routes>
+    <Suspense fallback={<PageFallback />}>
+      <Routes>
+        <Route path="/login" element={<Login />} />
+        <Route path="/" element={
+          <ProtectedRoute>
+            <BasicLayout />
+          </ProtectedRoute>
+        }>
+          <Route index element={<Navigate to="/dashboard" replace />} />
+          <Route path="dashboard" element={<Dashboard />} />
+          {features?.capsuleEnabled !== false && (
+            <>
+              <Route path="teams" element={<TeamList />} />
+              <Route path="teams/create" element={<TeamCreate />} />
+              <Route path="teams/:name" element={<TeamDetail />} />
+              <Route path="projects" element={<ProjectList />} />
+              <Route path="projects/create" element={<ProjectCreate />} />
+              <Route path="projects/:name" element={<ProjectDetail />} />
+              <Route path="users" element={<UserList />} />
+              <Route path="users/:email" element={<UserDetail />} />
+            </>
+          )}
+          <Route path="cluster/nodes" element={<ClusterNodes />} />
+          <Route path="cluster/nodes/:name" element={<NodeDetail />} />
+          {features?.costEnabled !== false && <Route path="reports" element={<ReportCenter />} />}
+          <Route path="audit" element={<AuditList />} />
+          <Route path="settings/*" element={<Settings />} />
+          {/* Feature-gated or unknown paths fall back to the dashboard instead of a blank page. */}
+          <Route path="*" element={<Navigate to="/dashboard" replace />} />
+        </Route>
+      </Routes>
+    </Suspense>
   );
 };
 
diff --git a/web-ui/src/components/ErrorBoundary.tsx b/web-ui/src/components/ErrorBoundary.tsx
new file mode 100644
index 0000000..91504ef
--- /dev/null
+++ b/web-ui/src/components/ErrorBoundary.tsx
@@ -0,0 +1,58 @@
+import React from 'react';
+import { Button, Result } from 'antd';
+
+interface Props {
+  children: React.ReactNode;
+}
+
+interface State {
+  hasError: boolean;
+  error?: Error;
+}
+
+/**
+ * Application-wide error boundary: when any descendant throws while rendering,
+ * a fallback with retry/reload actions is shown in place of the broken tree.
+ */
+class ErrorBoundary extends React.Component<Props, State> {
+  // Class-field initialiser; equivalent to assigning this.state in a constructor.
+  state: State = { hasError: false };
+
+  /** Switches to the fallback UI and keeps the thrown error for display. */
+  static getDerivedStateFromError(error: Error): State {
+    return { hasError: true, error };
+  }
+
+  /** Logs the error together with the component stack for debugging. */
+  componentDidCatch(error: Error, info: React.ErrorInfo) {
+    // eslint-disable-next-line no-console
+    console.error('Unhandled UI error:', error, info.componentStack);
+  }
+
+  /** Clears the error so the children are rendered again. */
+  handleReset = () => {
+    this.setState({ hasError: false, error: undefined });
+  };
+
+  render() {
+    const { hasError, error } = this.state;
+    if (!hasError) {
+      return this.props.children;
+    }
+
+    const retryButton = (
+      <Button type="primary" key="retry" onClick={this.handleReset}>
+        重试
+      </Button>
+    );
+    const reloadButton = (
+      <Button key="reload" onClick={() => window.location.reload()}>
+        刷新页面
+      </Button>
+    );
+    const detail = error?.message || '渲染时发生未预期的错误，请重试或刷新页面。';
+    return <Result status="error" title="页面出错了" subTitle={detail} extra={[retryButton, reloadButton]} />;
+  }
+}
+
+export default ErrorBoundary;
diff --git a/web-ui/src/components/NodeOnboardingModal.tsx b/web-ui/src/components/NodeOnboardingModal.tsx
new file mode 100644
index 0000000..b7c1029
--- /dev/null
+++ b/web-ui/src/components/NodeOnboardingModal.tsx
@@ -0,0 +1,183 @@
+import React, { useState } from 'react';
+import {
+  Modal,
+  Form,
+  Input,
+  InputNumber,
+  Select,
+  Alert,
+  Typography,
+} from 'antd';
+import { useMutation } from '@tanstack/react-query';
+import { startNodeOnboarding, OnboardingRequest } from '../services/api';
+
+const { TextArea } = Input;
+const { Text } = Typography;
+
+interface NodeOnboardingModalProps {
+  open: boolean;
+  onClose: () => void;
+  onStarted: (jobId: string) => void;
+}
+
+/** Modal form that collects SSH connection details and starts a bare-metal node onboarding job. */
+const NodeOnboardingModal: React.FC<NodeOnboardingModalProps> = ({
+  open,
+  onClose,
+  onStarted,
+}) => {
+  const [form] = Form.useForm();
+  const [authMethod, setAuthMethod] = useState<'password' | 'privateKey'>('password');
+
+  // On success reset the form AND the auth-method state, which lives outside the form store.
+  const startMutation = useMutation({
+    mutationFn: startNodeOnboarding,
+    onSuccess: (response) => {
+      form.resetFields();
+      setAuthMethod('password');
+      onStarted(response.data.id);
+    },
+  });
+
+  const handleSubmit = () => {
+    form.validateFields().then(values => {
+      const request: OnboardingRequest = {
+        nodeIP: values.nodeIP,
+        sshPort: values.sshPort || 22,
+        sshUsername: values.sshUsername,
+        authMethod: values.authMethod,
+        password: values.authMethod === 'password' ? values.password : undefined,
+        privateKey: values.authMethod === 'privateKey' ? values.privateKey : undefined,
+      };
+      startMutation.mutate(request);
+    }, () => { /* validation failed: the form shows the field errors, nothing to submit */ });
+  };
+
+  // Cancelling also clears a previous submit error so a stale alert is not carried over.
+  const handleClose = () => {
+    form.resetFields();
+    setAuthMethod('password');
+    startMutation.reset();
+    onClose();
+  };
+
+  // Validates a dotted-quad IPv4 address: four 1-3 digit groups, each at most 255.
+  const validateIP = (_: unknown, value: string) => {
+    if (!value) {
+      return Promise.reject(new Error('请输入节点 IP'));
+    }
+    const ipRegex = /^(\d{1,3}\.){3}\d{1,3}$/;
+    if (!ipRegex.test(value) || value.split('.').map(Number).some(p => p > 255)) {
+      return Promise.reject(new Error('请输入有效的 IP 地址'));
+    }
+    return Promise.resolve();
+  };
+
+  return (
+    <Modal
+      title="添加裸金属节点"
+      open={open}
+      onOk={handleSubmit}
+      onCancel={handleClose}
+      okText="开始添加"
+      cancelText="取消"
+      confirmLoading={startMutation.isPending}
+      width={500}
+      destroyOnClose
+    >
+      <Alert
+        message="前置条件"
+        description={
+          <ul style={{ margin: 0, paddingLeft: 20 }}>
+            <li>目标节点已安装操作系统（Ubuntu/CentOS 等）</li>
+            <li>目标节点已安装 kubeadm、kubelet、kubectl</li>
+            <li>目标节点网络可达，支持 SSH 连接</li>
+          </ul>
+        }
+        type="info"
+        showIcon
+        style={{ marginBottom: 24 }}
+      />
+
+      {startMutation.isError && (
+        <Alert
+          message="启动失败"
+          description={(startMutation.error as Error).message}
+          type="error"
+          showIcon
+          style={{ marginBottom: 16 }}
+        />
+      )}
+
+      <Form
+        form={form}
+        layout="vertical"
+        initialValues={{
+          sshPort: 22,
+          sshUsername: 'root',
+          authMethod: 'password',
+        }}
+      >
+        <Form.Item
+          name="nodeIP"
+          label="节点 IP"
+          rules={[{ validator: validateIP }]}
+        >
+          <Input placeholder="如：192.168.1.100" />
+        </Form.Item>
+
+        <Form.Item
+          name="sshPort"
+          label="SSH 端口"
+          rules={[{ required: true, message: '请输入 SSH 端口' }]}
+        >
+          <InputNumber min={1} max={65535} style={{ width: 150 }} />
+        </Form.Item>
+
+        <Form.Item
+          name="sshUsername"
+          label="SSH 用户名"
+          rules={[{ required: true, message: '请输入 SSH 用户名' }]}
+        >
+          <Input placeholder="root" />
+        </Form.Item>
+
+        <Form.Item
+          name="authMethod"
+          label="认证方式"
+          rules={[{ required: true }]}
+        >
+          <Select onChange={(value) => setAuthMethod(value)}>
+            <Select.Option value="password">密码</Select.Option>
+            <Select.Option value="privateKey">私钥</Select.Option>
+          </Select>
+        </Form.Item>
+
+        {authMethod === 'password' ? (
+          <Form.Item
+            name="password"
+            label="密码"
+            rules={[{ required: true, message: '请输入密码' }]}
+          >
+            <Input.Password placeholder="SSH 登录密码" />
+          </Form.Item>
+        ) : (
+          <Form.Item
+            name="privateKey"
+            label="私钥内容"
+            rules={[{ required: true, message: '请输入私钥' }]}
+            extra={<Text type="secondary">将私钥内容粘贴到此处</Text>}
+          >
+            <TextArea
+              rows={6}
+              placeholder="-----BEGIN RSA PRIVATE KEY-----&#10;...&#10;-----END RSA PRIVATE KEY-----"
+              style={{ fontFamily: 'monospace', fontSize: 12 }}
+            />
+          </Form.Item>
+        )}
+      </Form>
+    </Modal>
+  );
+};
+
+export default NodeOnboardingModal;
diff --git a/web-ui/src/components/OnboardingProgressDrawer.tsx b/web-ui/src/components/OnboardingProgressDrawer.tsx
new file mode 100644
index 0000000..e3e405d
--- /dev/null
+++ b/web-ui/src/components/OnboardingProgressDrawer.tsx
@@ -0,0 +1,295 @@
+import React, { useEffect } from 'react';
+import {
+  Drawer,
+  Steps,
+  Typography,
+  Space,
+  Tag,
+  Alert,
+  Button,
+  Spin,
+  Descriptions,
+} from 'antd';
+import {
+  CheckCircleOutlined,
+  CloseCircleOutlined,
+  LoadingOutlined,
+  ClockCircleOutlined,
+  MinusCircleOutlined,
+} from '@ant-design/icons';
+import { useQuery, useMutation, useQueryClient } from '@tanstack/react-query';
+import {
+  getOnboardingJob,
+  cancelOnboardingJob,
+  OnboardingJobStatus,
+  SubStep,
+  SubStepStatus,
+} from '../services/api';
+
+const { Text, Paragraph } = Typography;
+
+interface OnboardingProgressDrawerProps {
+  jobId: string | null;
+  open: boolean;
+  onClose: () => void;
+}
+
+const stepTitles = [
+  '连接测试',
+  '平台检测',
+  '环境检查',
+  'Pre-join 脚本',
+  '获取 Join Token',
+  '执行 kubeadm join',
+  'Post-join 脚本',
+  '等待节点就绪',
+  '启用节点',
+];
+
+/** Maps the job's 1-based currentStep to the antd Steps status of the 0-based stepIndex. */
+const getStepStatus = (currentStep: number, stepIndex: number, jobStatus: OnboardingJobStatus) => {
+  const stepNumber = stepIndex + 1;
+  // A succeeded job has completed every step, including the one it stopped on.
+  if (jobStatus === 'success' || currentStep > stepNumber) {
+    return 'finish';
+  }
+  if (currentStep === stepNumber) {
+    return jobStatus === 'failed' ? 'error' : 'process';
+  }
+  return 'wait';
+};
+
+/** Picks the status glyph for a script sub-step; unknown statuses fall back to the clock icon. */
+const getSubStepIcon = (status: SubStepStatus) => {
+  if (status === 'success') {
+    return <CheckCircleOutlined style={{ color: '#52c41a' }} />;
+  }
+  if (status === 'failed') {
+    return <CloseCircleOutlined style={{ color: '#ff4d4f' }} />;
+  }
+  if (status === 'running') {
+    return <LoadingOutlined style={{ color: '#1890ff' }} />;
+  }
+  const Idle = status === 'skipped' ? MinusCircleOutlined : ClockCircleOutlined;
+  return <Idle style={{ color: '#d9d9d9' }} />;
+};
+
+/**
+ * Lists the sub-steps of a script step: status icon, name and, if present, the error text.
+ * Renders nothing when the list is missing or empty.
+ */
+const SubStepList: React.FC<{ subSteps: SubStep[] }> = ({ subSteps }) => {
+  if (!subSteps?.length) {
+    return null;
+  }
+
+  const rows = subSteps.map(({ status, name, error }, position) => (
+    <div key={position} style={{ marginBottom: 4 }}>
+      <Space>
+        {getSubStepIcon(status)}
+        <Text type={status === 'failed' ? 'danger' : undefined}>{name}</Text>
+      </Space>
+      {error && (
+        <div style={{ marginLeft: 22, marginTop: 4 }}>
+          <Text type="danger" style={{ fontSize: 12 }}>{error}</Text>
+        </div>
+      )}
+    </div>
+  ));
+
+  return <div style={{ marginTop: 8, marginLeft: 24 }}>{rows}</div>;
+};
+/** Drawer that polls one onboarding job and shows its step progress, outcome alerts and a cancel/close action. */
+const OnboardingProgressDrawer: React.FC<OnboardingProgressDrawerProps> = ({
+  jobId,
+  open,
+  onClose,
+}) => {
+  const queryClient = useQueryClient();
+
+  const { data: job, isLoading } = useQuery({
+    queryKey: ['onboardingJob', jobId],
+    queryFn: () => getOnboardingJob(jobId!).then(res => res.data),
+    enabled: !!jobId && open, // only fetch while the drawer is open and a job id is set
+    refetchInterval: (query) => {
+      // Stop polling once the job reaches a terminal status (success, failed or cancelled).
+      const data = query.state.data;
+      if (data && ['success', 'failed', 'cancelled'].includes(data.status)) {
+        return false;
+      }
+      return 2000; // Poll every 2 seconds
+    },
+  });
+
+  const cancelMutation = useMutation({
+    mutationFn: cancelOnboardingJob,
+    onSuccess: () => {
+      queryClient.invalidateQueries({ queryKey: ['onboardingJob', jobId] });
+    },
+  });
+
+  useEffect(() => {
+    if (!open) {
+      // Invalidate the managed-nodes query whenever the drawer is not open (this also runs on the first closed render).
+      queryClient.invalidateQueries({ queryKey: ['managedNodes'] });
+    }
+  }, [open, queryClient]);
+
+  const handleCancel = () => {
+    if (jobId) {
+      cancelMutation.mutate(jobId);
+    }
+  };
+
+  const isRunning = job?.status === 'pending' || job?.status === 'running';
+  const isSuccess = job?.status === 'success';
+  const isFailed = job?.status === 'failed';
+  const isCancelled = job?.status === 'cancelled';
+
+  const getStatusTag = () => {
+    if (!job) return null;
+    switch (job.status) {
+      case 'pending':
+        return <Tag color="default">等待中</Tag>;
+      case 'running':
+        return <Tag color="processing">执行中</Tag>;
+      case 'success':
+        return <Tag color="success">成功</Tag>;
+      case 'failed':
+        return <Tag color="error">失败</Tag>;
+      case 'cancelled':
+        return <Tag color="warning">已取消</Tag>;
+      default:
+        return null;
+    }
+  };
+
+  // Build the Steps items; before the job has loaded only the titles are returned.
+  const getStepItems = () => {
+    if (!job) return stepTitles.map(title => ({ title }));
+
+    return stepTitles.map((title, index) => {
+      const stepNumber = index + 1;
+      const status = getStepStatus(job.currentStep, index, job.status);
+
+      // Sub-steps are shown only for the script steps (4 and 7), and only while that step is the current one.
+      let description = null;
+      if ((stepNumber === 4 || stepNumber === 7) && job.currentStep === stepNumber && job.subSteps) {
+        description = <SubStepList subSteps={job.subSteps} />;
+      }
+
+      return {
+        title,
+        status,
+        description,
+      };
+    });
+  };
+
+  return (
+    <Drawer
+      title="节点添加进度"
+      placement="right"
+      width={450}
+      open={open}
+      onClose={onClose}
+      extra={getStatusTag()}
+    >
+      {isLoading ? (
+        <div style={{ textAlign: 'center', padding: 50 }}>
+          <Spin size="large" />
+        </div>
+      ) : job ? (
+        <div>
+          <Descriptions column={1} size="small" style={{ marginBottom: 24 }}>
+            <Descriptions.Item label="节点 IP">{job.nodeIP}</Descriptions.Item>
+            {job.nodeName && (
+              <Descriptions.Item label="节点名称">{job.nodeName}</Descriptions.Item>
+            )}
+            {job.platform.os && (
+              <Descriptions.Item label="平台">
+                <Space>
+                  <Tag color="blue">{job.platform.os} {job.platform.version}</Tag>
+                  <Tag color="green">{job.platform.arch}</Tag>
+                </Space>
+              </Descriptions.Item>
+            )}
+          </Descriptions>
+
+          <Steps
+            direction="vertical"
+            size="small"
+            current={job.currentStep - 1}
+            items={getStepItems()}
+          />
+
+          {job.stepMessage && (
+            <Alert
+              message="当前状态"
+              description={job.stepMessage}
+              type="info"
+              showIcon
+              style={{ marginTop: 24 }}
+            />
+          )}
+
+          {isFailed && job.errorMessage && (
+            <Alert
+              message="错误信息"
+              description={job.errorMessage}
+              type="error"
+              showIcon
+              style={{ marginTop: 16 }}
+            />
+          )}
+
+          {isSuccess && (
+            <Alert
+              message="节点添加成功"
+              description={
+                <Paragraph style={{ marginBottom: 0 }}>
+                  节点 <Text strong>{job.nodeName}</Text> 已成功加入集群并启用。
+                </Paragraph>
+              }
+              type="success"
+              showIcon
+              style={{ marginTop: 16 }}
+            />
+          )}
+
+          {isCancelled && (
+            <Alert
+              message="操作已取消"
+              type="warning"
+              showIcon
+              style={{ marginTop: 16 }}
+            />
+          )}
+
+          <div style={{ marginTop: 24 }}>
+            {isRunning && (
+              <Button
+                danger
+                onClick={handleCancel}
+                loading={cancelMutation.isPending}
+              >
+                取消操作
+              </Button>
+            )}
+            {!isRunning && (
+              <Button onClick={onClose}>
+                关闭
+              </Button>
+            )}
+          </div>
+        </div>
+      ) : (
+        <div style={{ textAlign: 'center', padding: 50 }}>
+          <Text type="secondary">无法加载任务信息</Text>
+        </div>
+      )}
+    </Drawer>
+  );
+};
+
+export default OnboardingProgressDrawer;
diff --git a/web-ui/src/contexts/AuthContext.tsx b/web-ui/src/contexts/AuthContext.tsx
index d55609e..a404eb3 100644
--- a/web-ui/src/contexts/AuthContext.tsx
+++ b/web-ui/src/contexts/AuthContext.tsx
@@ -1,4 +1,4 @@
-import React, { createContext, useContext, useState, useEffect, useCallback } from 'react';
+import React, { createContext, useContext, useState, useEffect, useCallback, useMemo } from 'react';
 import { getAuthStatus } from '../services/api';
 
 interface AuthContextType {
@@ -72,18 +72,12 @@ export const AuthProvider: React.FC<{ children: React.ReactNode }> = ({ children
     setUsername(null);
   }, []);
 
-  return (
-    <AuthContext.Provider value={{ 
-      isAuthenticated, 
-      authEnabled, 
-      username, 
-      loading, 
-      logout,
-      checkAuth 
-    }}>
-      {children}
-    </AuthContext.Provider>
+  const value = useMemo<AuthContextType>(
+    () => ({ isAuthenticated, authEnabled, username, loading, logout, checkAuth }),
+    [isAuthenticated, authEnabled, username, loading, logout, checkAuth],
   );
+
+  return <AuthContext.Provider value={value}>{children}</AuthContext.Provider>;
 };
 
 export const useAuth = () => {
diff --git a/web-ui/src/contexts/ThemeContext.tsx b/web-ui/src/contexts/ThemeContext.tsx
index 5b765ae..cec0ae7 100644
--- a/web-ui/src/contexts/ThemeContext.tsx
+++ b/web-ui/src/contexts/ThemeContext.tsx
@@ -1,4 +1,4 @@
-import React, { createContext, useContext, useState, useEffect, useCallback } from 'react';
+import React, { createContext, useContext, useState, useEffect, useCallback, useMemo } from 'react';
 
 type ThemeMode = 'light' | 'dark';
 
@@ -56,16 +56,12 @@ export const ThemeProvider: React.FC<{ children: React.ReactNode }> = ({ childre
     setThemeState(newTheme);
   }, []);
 
-  return (
-    <ThemeContext.Provider value={{ 
-      theme, 
-      toggleTheme, 
-      setTheme, 
-      isDark: theme === 'dark' 
-    }}>
-      {children}
-    </ThemeContext.Provider>
+  const value = useMemo<ThemeContextType>(
+    () => ({ theme, toggleTheme, setTheme, isDark: theme === 'dark' }),
+    [theme, toggleTheme, setTheme],
   );
+
+  return <ThemeContext.Provider value={value}>{children}</ThemeContext.Provider>;
 };
 
 export const useTheme = (): ThemeContextType => {
diff --git a/web-ui/src/layouts/BasicLayout.tsx b/web-ui/src/layouts/BasicLayout.tsx
index 7f75b28..daee1aa 100644
--- a/web-ui/src/layouts/BasicLayout.tsx
+++ b/web-ui/src/layouts/BasicLayout.tsx
@@ -16,6 +16,7 @@ import {
 } from '@ant-design/icons';
 import { useAuth } from '../contexts/AuthContext';
 import { useTheme } from '../contexts/ThemeContext';
+import { useFeatures } from '../hooks/useFeatures';
 import './BasicLayout.css';
 
 const { Header, Sider, Content } = Layout;
@@ -26,6 +27,7 @@ const BasicLayout: React.FC = () => {
   const location = useLocation();
   const { logout, username, authEnabled } = useAuth();
   const { theme, toggleTheme, isDark } = useTheme();
+  const { data: features } = useFeatures();
 
   const handleLogout = () => {
     logout();
@@ -52,26 +54,30 @@ const BasicLayout: React.FC = () => {
       icon: <ClusterOutlined />,
       label: '集群节点',
     },
-    {
-      key: '/teams',
-      icon: <ApartmentOutlined />,
-      label: '团队管理',
-    },
-    {
-      key: '/projects',
-      icon: <ProjectOutlined />,
-      label: '项目管理',
-    },
-    {
-      key: '/users',
-      icon: <UserOutlined />,
-      label: '用户管理',
-    },
-    {
-      key: '/reports',
-      icon: <BarChartOutlined />,
-      label: '报表中心',
-    },
+    ...(features?.capsuleEnabled !== false ? [
+      {
+        key: '/teams',
+        icon: <ApartmentOutlined />,
+        label: '团队管理',
+      },
+      {
+        key: '/projects',
+        icon: <ProjectOutlined />,
+        label: '项目管理',
+      },
+      {
+        key: '/users',
+        icon: <UserOutlined />,
+        label: '用户管理',
+      },
+    ] : []),
+    ...(features?.costEnabled !== false ? [
+      {
+        key: '/reports',
+        icon: <BarChartOutlined />,
+        label: '报表中心',
+      },
+    ] : []),
     {
       key: '/audit',
       icon: <AuditOutlined />,
@@ -116,7 +122,11 @@ const BasicLayout: React.FC = () => {
           className="app-menu"
         />
         <div className="sider-footer">
-          <Text className="version-text">v3.0.0 (Capsule + OpenCost)</Text>
+          <Text className="version-text">v{__APP_VERSION__}{features ? ` (${[
+            features.capsuleEnabled && 'Capsule',
+            features.costEnabled && 'OpenCost',
+            features.prometheusEnabled && 'Prometheus',
+          ].filter(Boolean).join(' + ') || '基础模式'})` : ''}</Text>
         </div>
       </Sider>
       <Layout className="main-layout">
diff --git a/web-ui/src/main.tsx b/web-ui/src/main.tsx
index 657d853..af7f309 100644
--- a/web-ui/src/main.tsx
+++ b/web-ui/src/main.tsx
@@ -5,6 +5,7 @@ import { QueryClient, QueryClientProvider } from '@tanstack/react-query';
 import { ConfigProvider, theme } from 'antd';
 import zhCN from 'antd/locale/zh_CN';
 import App from './App';
+import ErrorBoundary from './components/ErrorBoundary';
 import { AuthProvider } from './contexts/AuthContext';
 import { ThemeProvider, useTheme } from './contexts/ThemeContext';
 import './styles/theme.css';
@@ -87,7 +88,9 @@ const ThemedApp: React.FC = () => {
     >
       <BrowserRouter>
         <AuthProvider>
-          <App />
+          <ErrorBoundary>
+            <App />
+          </ErrorBoundary>
         </AuthProvider>
       </BrowserRouter>
     </ConfigProvider>
diff --git a/web-ui/src/pages/Cluster/ClusterNodes.tsx b/web-ui/src/pages/Cluster/ClusterNodes.tsx
index bdb2064..918328e 100644
--- a/web-ui/src/pages/Cluster/ClusterNodes.tsx
+++ b/web-ui/src/pages/Cluster/ClusterNodes.tsx
@@ -1,12 +1,14 @@
 import {
   CheckCircleOutlined,
   LockOutlined,
+  PlusOutlined,
   QuestionCircleOutlined,
   StopOutlined,
   TeamOutlined,
   UnlockOutlined
 } from '@ant-design/icons';
 import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query';
+import { getApiErrorMessage } from '../../utils/error';
 import {
   Badge,
   Button,
@@ -22,6 +24,8 @@ import {
 } from 'antd';
 import React, { useMemo, useState } from 'react';
 import { Link } from 'react-router-dom';
+import NodeOnboardingModal from '../../components/NodeOnboardingModal';
+import OnboardingProgressDrawer from '../../components/OnboardingProgressDrawer';
 import {
   NodeInfo, NodeStatus,
   ResourceDefinition,
@@ -60,6 +64,11 @@ const ClusterNodes: React.FC = () => {
   const [selectedNode, setSelectedNode] = useState<string | null>(null);
   const [selectedTeam, setSelectedTeam] = useState<string | null>(null);
 
+  // Node onboarding states
+  const [onboardingModalVisible, setOnboardingModalVisible] = useState(false);
+  const [onboardingDrawerVisible, setOnboardingDrawerVisible] = useState(false);
+  const [currentJobId, setCurrentJobId] = useState<string | null>(null);
+
   // Fetch nodes
   const { data: nodes, isLoading } = useQuery({
     queryKey: ['managedNodes'],
@@ -89,7 +98,7 @@ const ClusterNodes: React.FC = () => {
       queryClient.invalidateQueries({ queryKey: ['managedNodes'] });
     },
     onError: (err: any) => {
-      message.error(`启用失败: ${err.response?.data?.error || err.message}`);
+      message.error(`启用失败: ${getApiErrorMessage(err, '未知错误')}`);
     },
   });
 
@@ -100,7 +109,7 @@ const ClusterNodes: React.FC = () => {
       queryClient.invalidateQueries({ queryKey: ['managedNodes'] });
     },
     onError: (err: any) => {
-      message.error(`禁用失败: ${err.response?.data?.error || err.message}`);
+      message.error(`禁用失败: ${getApiErrorMessage(err, '未知错误')}`);
     },
   });
 
@@ -115,7 +124,7 @@ const ClusterNodes: React.FC = () => {
       setSelectedTeam(null);
     },
     onError: (err: any) => {
-      message.error(`分配失败: ${err.response?.data?.error || err.message}`);
+      message.error(`分配失败: ${getApiErrorMessage(err, '未知错误')}`);
     },
   });
 
@@ -126,7 +135,7 @@ const ClusterNodes: React.FC = () => {
       queryClient.invalidateQueries({ queryKey: ['managedNodes'] });
     },
     onError: (err: any) => {
-      message.error(`释放失败: ${err.response?.data?.error || err.message}`);
+      message.error(`释放失败: ${getApiErrorMessage(err, '未知错误')}`);
     },
   });
 
@@ -157,6 +166,13 @@ const ClusterNodes: React.FC = () => {
     setAssignModalVisible(true);
   };
 
+  // Passed to NodeOnboardingModal as onStarted: stores the job id, closes the modal, opens the progress drawer.
+  const handleOnboardingStarted = (jobId: string) => {
+    setCurrentJobId(jobId);
+    setOnboardingModalVisible(false);
+    setOnboardingDrawerVisible(true);
+  };
+
   const handleAssignConfirm = () => {
     if (selectedNode && selectedTeam) {
       assignMutation.mutate({ nodeName: selectedNode, teamName: selectedTeam });
@@ -455,8 +471,17 @@ const ClusterNodes: React.FC = () => {
   return (
     <div>
       <div style={{ marginBottom: 16 }}>
-        <h2 style={{ margin: 0, marginBottom: 16 }}>节点管理</h2>
-        
+        <div style={{ display: 'flex', justifyContent: 'space-between', alignItems: 'center', marginBottom: 16 }}>
+          <h2 style={{ margin: 0 }}>节点管理</h2>
+          <Button
+            type="primary"
+            icon={<PlusOutlined />}
+            onClick={() => setOnboardingModalVisible(true)}
+          >
+            添加节点
+          </Button>
+        </div>
+
         {/* Status summary */}
         <Space style={{ marginBottom: 16 }}>
           <Tag>共 {nodes?.length || 0} 个节点</Tag>
@@ -539,6 +564,20 @@ const ClusterNodes: React.FC = () => {
           <QuestionCircleOutlined /> 只有独占模式的团队可以被分配节点
         </Text>
       </Modal>
+
+      {/* Node Onboarding Modal */}
+      <NodeOnboardingModal
+        open={onboardingModalVisible}
+        onClose={() => setOnboardingModalVisible(false)}
+        onStarted={handleOnboardingStarted}
+      />
+
+      {/* Onboarding Progress Drawer */}
+      <OnboardingProgressDrawer
+        jobId={currentJobId}
+        open={onboardingDrawerVisible}
+        onClose={() => setOnboardingDrawerVisible(false)}
+      />
     </div>
   );
 };
diff --git a/web-ui/src/pages/Cluster/NodeDetail.tsx b/web-ui/src/pages/Cluster/NodeDetail.tsx
index c5145b5..1a1ae57 100644
--- a/web-ui/src/pages/Cluster/NodeDetail.tsx
+++ b/web-ui/src/pages/Cluster/NodeDetail.tsx
@@ -20,6 +20,8 @@ import {
   Popconfirm,
   Alert,
   Empty,
+  Divider,
+  Typography,
 } from 'antd';
 import {
   ArrowLeftOutlined,
@@ -40,12 +42,132 @@ import {
   getEnabledResourceConfigs,
   NodeTaint,
   ResourceDefinition,
+  PrometheusMetric,
 } from '../../services/api';
+import { useFeatures } from '../../hooks/useFeatures';
+
+// Render a bytes-per-second rate using decimal thresholds (1e3 / 1e6 / 1e9): B/s, KB/s, MB/s or GB/s.
+const formatBytesPerSec = (value: number): string => {
+  if (value >= 1e9) return `${(value / 1e9).toFixed(2)} GB/s`;
+  if (value >= 1e6) return `${(value / 1e6).toFixed(2)} MB/s`;
+  if (value >= 1e3) return `${(value / 1e3).toFixed(1)} KB/s`;
+  return `${value.toFixed(0)} B/s`;
+};
+
+// axisLabel config shared by all charts: formats a millisecond timestamp as H:MM in local time.
+const timeAxisLabel = {
+  formatter: (value: number) => {
+    const tick = new Date(value);
+    return [tick.getHours(), String(tick.getMinutes()).padStart(2, '0')].join(':');
+  },
+};
+
+// ECharts option for a percentage series: y-axis fixed to 0-100, timestamps x1000, values rounded to 2 decimals.
+const buildPercentChartOption = (data?: PrometheusMetric[], color = '#1890ff') => ({
+  tooltip: { trigger: 'axis' as const },
+  xAxis: { type: 'time' as const, axisLabel: timeAxisLabel },
+  yAxis: { type: 'value' as const, min: 0, max: 100, axisLabel: { formatter: '{value}%' } },
+  series: [{
+    data: (data ?? []).map((point) => [point.timestamp * 1000, Number(point.value.toFixed(2))]),
+    type: 'line' as const,
+    smooth: true,
+    areaStyle: { opacity: 0.3 },
+    itemStyle: { color },
+    showSymbol: false,
+  }],
+});
+
+// ECharts option for a bytes/sec series: y-axis starts at 0 with no fixed max; labels go through formatBytesPerSec.
+const buildBandwidthChartOption = (data?: PrometheusMetric[], color = '#722ed1') => ({
+  tooltip: {
+    trigger: 'axis' as const,
+    formatter: (params: { value: [number, number] }[]) => {
+      if (!params?.length) return '';
+      // Only the first entry is shown; its value is a [timestamp in ms, bytes/sec] pair.
+      const [timestampMs, bytesPerSec] = params[0].value;
+      const clock = timeAxisLabel.formatter(timestampMs);
+      return `${clock}<br/>${formatBytesPerSec(bytesPerSec)}`;
+    },
+  },
+  xAxis: { type: 'time' as const, axisLabel: timeAxisLabel },
+  yAxis: {
+    type: 'value' as const,
+    min: 0,
+    axisLabel: { formatter: (tick: number) => formatBytesPerSec(tick) },
+  },
+  series: [{
+    data: (data ?? []).map((point) => [point.timestamp * 1000, point.value]),
+    type: 'line' as const,
+    smooth: true,
+    areaStyle: { opacity: 0.3 },
+    itemStyle: { color },
+    showSymbol: false,
+  }],
+});
+
+// ECharts option for a series with no fixed max (e.g. temperature): y-axis from 0, values rounded to 1 decimal.
+const buildAutoScaleChartOption = (data?: PrometheusMetric[], color = '#fa8c16', yFormatter?: (v: number) => string) => ({
+  tooltip: { trigger: 'axis' as const },
+  xAxis: { type: 'time' as const, axisLabel: timeAxisLabel },
+  yAxis: {
+    type: 'value' as const,
+    min: 0,
+    axisLabel: yFormatter ? { formatter: (tick: number) => yFormatter(tick) } : undefined,
+  },
+  series: [{
+    data: (data ?? []).map((point) => [point.timestamp * 1000, Number(point.value.toFixed(1))]),
+    type: 'line' as const,
+    smooth: true,
+    areaStyle: { opacity: 0.3 },
+    itemStyle: { color },
+    showSymbol: false,
+  }],
+});
+
+// ECharts option for GPU utilization (0-100%): one solid average line plus one dashed line per device.
+const buildGpuChartOption = (
+  avgData?: PrometheusMetric[],
+  perDevice?: { labels: Record<string, string>; metrics: PrometheusMetric[] }[],
+  color = '#f5222d',
+) => {
+  const gpuColors = ['#f5222d', '#fa541c', '#fa8c16', '#fadb14', '#a0d911', '#52c41a', '#13c2c2', '#1890ff'];
+  const hasDevices = (perDevice?.length ?? 0) > 0;
+  const toPoints = (samples?: PrometheusMetric[]) => samples?.map((m) => [m.timestamp * 1000, Number(m.value.toFixed(2))]) || [];
+  const average = {
+    name: '平均值',
+    data: toPoints(avgData),
+    type: 'line',
+    smooth: true,
+    lineStyle: { width: 2 },
+    areaStyle: { opacity: 0.2 },
+    itemStyle: { color },
+    showSymbol: false,
+  };
+  const devices = (perDevice || []).map((device, index) => ({
+    name: `GPU ${device.labels?.gpu ?? device.labels?.GPU_I_ID ?? index}`,
+    data: toPoints(device.metrics),
+    type: 'line',
+    smooth: true,
+    lineStyle: { width: 1, type: 'dashed' },
+    itemStyle: { color: gpuColors[index % gpuColors.length] },
+    showSymbol: false,
+  }));
+  const series: object[] = [average, ...devices];
+  return {
+    tooltip: { trigger: 'axis' as const },
+    legend: { show: hasDevices, bottom: 0, type: 'scroll' as const },
+    xAxis: { type: 'time' as const, axisLabel: timeAxisLabel },
+    yAxis: { type: 'value' as const, min: 0, max: 100, axisLabel: { formatter: '{value}%' } },
+    grid: { bottom: hasDevices ? 40 : 10 },
+    series,
+  };
+};
 
 const NodeDetail: React.FC = () => {
   const { name } = useParams<{ name: string }>();
   const navigate = useNavigate();
   const queryClient = useQueryClient();
+  const { data: features } = useFeatures();
   const [labelsModalOpen, setLabelsModalOpen] = useState(false);
   const [taintsModalOpen, setTaintsModalOpen] = useState(false);
   const [labelsForm] = Form.useForm();
@@ -86,13 +208,17 @@ const NodeDetail: React.FC = () => {
     staleTime: 5 * 60 * 1000,
   });
 
+  // Detect node accelerator type from resources
+  const hasGpu = node?.resources?.some(r => r.name.includes('nvidia.com/gpu') && r.capacity > 0) ?? false;
+  const hasNpu = node?.resources?.some(r => r.name.includes('huawei.com/Ascend') && r.capacity > 0) ?? false;
+
   const { data: metrics, isLoading: metricsLoading } = useQuery({
-    queryKey: ['nodeMetrics', name],
+    queryKey: ['nodeMetrics', name, hasGpu, hasNpu],
     queryFn: async () => {
-      const { data } = await getNodeMetrics(name!, 24);
+      const { data } = await getNodeMetrics(name!, { hours: 24, hasGpu, hasNpu });
       return data;
     },
-    enabled: !!name && !!settings?.prometheusUrl,
+    enabled: !!name && !!settings?.prometheusUrl && features?.prometheusEnabled !== false,
   });
 
   const updateLabelsMutation = useMutation({
@@ -441,10 +567,10 @@ const NodeDetail: React.FC = () => {
       ),
       children: (
         <Card>
-          {!settings?.prometheusUrl ? (
+          {features?.prometheusEnabled === false || !settings?.prometheusUrl ? (
             <Alert
-              message="未配置 Prometheus"
-              description="请前往系统设置配置 Prometheus 地址以启用监控功能。"
+              message="Prometheus 未启用"
+              description={features?.prometheusEnabled === false ? "Prometheus 组件未启用，请在 Helm values 中启用 Prometheus 集成。" : "请前往系统设置配置 Prometheus 地址以启用监控功能。"}
               type="warning"
               showIcon
             />
@@ -456,63 +582,104 @@ const NodeDetail: React.FC = () => {
             <Empty description="暂无监控数据" />
           ) : (
             <Row gutter={[16, 16]}>
-              <Col span={24}>
+              {/* CPU & Memory */}
+              <Col xs={24} lg={12}>
                 <Card size="small" title="CPU 使用率 (%)">
-                  <ReactECharts
-                    option={{
-                      tooltip: { trigger: 'axis' },
-                      xAxis: {
-                        type: 'time',
-                        axisLabel: {
-                          formatter: (value: number) => {
-                            const date = new Date(value * 1000);
-                            return `${date.getHours()}:${String(date.getMinutes()).padStart(2, '0')}`;
-                          },
-                        },
-                      },
-                      yAxis: { type: 'value', min: 0, max: 100 },
-                      series: [
-                        {
-                          data: metrics?.cpuUsage?.map((m) => [m.timestamp * 1000, m.value.toFixed(2)]) || [],
-                          type: 'line',
-                          smooth: true,
-                          areaStyle: { opacity: 0.3 },
-                        },
-                      ],
-                    }}
-                    style={{ height: 250 }}
-                  />
+                  <ReactECharts option={buildPercentChartOption(metrics?.cpuUsage, '#1890ff')} style={{ height: 220 }} />
                 </Card>
               </Col>
-              <Col span={24}>
+              <Col xs={24} lg={12}>
                 <Card size="small" title="内存使用率 (%)">
-                  <ReactECharts
-                    option={{
-                      tooltip: { trigger: 'axis' },
-                      xAxis: {
-                        type: 'time',
-                        axisLabel: {
-                          formatter: (value: number) => {
-                            const date = new Date(value * 1000);
-                            return `${date.getHours()}:${String(date.getMinutes()).padStart(2, '0')}`;
-                          },
-                        },
-                      },
-                      yAxis: { type: 'value', min: 0, max: 100 },
-                      series: [
-                        {
-                          data: metrics?.memoryUsage?.map((m) => [m.timestamp * 1000, m.value.toFixed(2)]) || [],
-                          type: 'line',
-                          smooth: true,
-                          areaStyle: { opacity: 0.3 },
-                          itemStyle: { color: '#52c41a' },
-                        },
-                      ],
-                    }}
-                    style={{ height: 250 }}
-                  />
+                  <ReactECharts option={buildPercentChartOption(metrics?.memoryUsage, '#52c41a')} style={{ height: 220 }} />
+                </Card>
+              </Col>
+
+              {/* Network IO */}
+              <Col span={24}><Divider plain><Typography.Text type="secondary">网络 IO</Typography.Text></Divider></Col>
+              <Col xs={24} lg={12}>
+                <Card size="small" title="以太网接收带宽">
+                  {metrics?.networkReceive?.length ? (
+                    <ReactECharts option={buildBandwidthChartOption(metrics.networkReceive, '#722ed1')} style={{ height: 220 }} />
+                  ) : (
+                    <Empty description="暂无数据" image={Empty.PRESENTED_IMAGE_SIMPLE} />
+                  )}
+                </Card>
+              </Col>
+              <Col xs={24} lg={12}>
+                <Card size="small" title="以太网发送带宽">
+                  {metrics?.networkTransmit?.length ? (
+                    <ReactECharts option={buildBandwidthChartOption(metrics.networkTransmit, '#eb2f96')} style={{ height: 220 }} />
+                  ) : (
+                    <Empty description="暂无数据" image={Empty.PRESENTED_IMAGE_SIMPLE} />
+                  )}
                 </Card>
               </Col>
+
+              {/* RDMA IO - only show if data exists */}
+              {(metrics?.rdmaReceive?.length || metrics?.rdmaTransmit?.length) ? (
+                <>
+                  <Col span={24}><Divider plain><Typography.Text type="secondary">RDMA IO (InfiniBand)</Typography.Text></Divider></Col>
+                  <Col xs={24} lg={12}>
+                    <Card size="small" title="RDMA 接收带宽">
+                      {metrics?.rdmaReceive?.length ? (
+                        <ReactECharts option={buildBandwidthChartOption(metrics.rdmaReceive, '#13c2c2')} style={{ height: 220 }} />
+                      ) : (
+                        <Empty description="暂无数据" image={Empty.PRESENTED_IMAGE_SIMPLE} />
+                      )}
+                    </Card>
+                  </Col>
+                  <Col xs={24} lg={12}>
+                    <Card size="small" title="RDMA 发送带宽">
+                      {metrics?.rdmaTransmit?.length ? (
+                        <ReactECharts option={buildBandwidthChartOption(metrics.rdmaTransmit, '#faad14')} style={{ height: 220 }} />
+                      ) : (
+                        <Empty description="暂无数据" image={Empty.PRESENTED_IMAGE_SIMPLE} />
+                      )}
+                    </Card>
+                  </Col>
+                </>
+              ) : null}
+
+              {/* GPU Metrics (DCGM) - only for GPU nodes */}
+              {hasGpu && (metrics?.gpuUtilization?.length || metrics?.gpuMemoryUtil?.length) ? (
+                <>
+                  <Col span={24}><Divider plain><Typography.Text type="secondary">GPU 监控 (NVIDIA DCGM)</Typography.Text></Divider></Col>
+                  <Col xs={24} lg={12}>
+                    <Card size="small" title="GPU SM 利用率 (%)">
+                      <ReactECharts option={buildGpuChartOption(metrics?.gpuUtilization, metrics?.gpuPerDevice, '#f5222d')} style={{ height: 250 }} />
+                    </Card>
+                  </Col>
+                  <Col xs={24} lg={12}>
+                    <Card size="small" title="GPU 显存利用率 (%)">
+                      <ReactECharts option={buildPercentChartOption(metrics?.gpuMemoryUtil, '#fa541c')} style={{ height: 250 }} />
+                    </Card>
+                  </Col>
+                </>
+              ) : null}
+
+              {/* NPU Metrics (Ascend) - only for NPU nodes */}
+              {hasNpu && (metrics?.npuUtilization?.length || metrics?.npuMemoryUtil?.length) ? (
+                <>
+                  <Col span={24}><Divider plain><Typography.Text type="secondary">NPU 监控 (Huawei Ascend)</Typography.Text></Divider></Col>
+                  <Col xs={24} lg={12}>
+                    <Card size="small" title="NPU AI Core 利用率 (%)">
+                      <ReactECharts option={buildPercentChartOption(metrics?.npuUtilization, '#2f54eb')} style={{ height: 220 }} />
+                    </Card>
+                  </Col>
+                  <Col xs={24} lg={12}>
+                    <Card size="small" title="NPU HBM 使用率 (%)">
+                      <ReactECharts option={buildPercentChartOption(metrics?.npuMemoryUtil, '#a0d911')} style={{ height: 220 }} />
+                    </Card>
+                  </Col>
+                  {metrics?.npuTemperature?.length ? (
+                    <Col xs={24} lg={12}>
+                      <Card size="small" title={'NPU 温度 (\u00B0C)' /* JS string: JSX attribute literals do not decode \u escapes */}>
+                        <ReactECharts option={buildAutoScaleChartOption(metrics.npuTemperature, '#fa8c16', (v) => `${v.toFixed(0)}\u00B0C`)} style={{ height: 220 }} />
+                      </Card>
+                    </Col>
+                  ) : null}
+                </>
+              ) : null}
             </Row>
           )}
         </Card>
diff --git a/web-ui/src/pages/Dashboard/index.tsx b/web-ui/src/pages/Dashboard/index.tsx
index 1b1951a..4c3fbf2 100644
--- a/web-ui/src/pages/Dashboard/index.tsx
+++ b/web-ui/src/pages/Dashboard/index.tsx
@@ -25,6 +25,7 @@ import {
   CostTrendPoint,
   TopConsumer
 } from '../../services/api';
+import { useFeatures } from '../../hooks/useFeatures';
 
 const { Title, Text } = Typography;
 
@@ -127,6 +128,7 @@ const SimpleLineChart: React.FC<{ data: CostTrendPoint[]; height?: number }> = (
 
 const Dashboard: React.FC = () => {
   const navigate = useNavigate();
+  const { data: features } = useFeatures();
 
   const { data: overview, isLoading: overviewLoading } = useQuery({
     queryKey: ['overview'],
@@ -138,12 +140,14 @@ const Dashboard: React.FC = () => {
     queryKey: ['teamUsage', '7d'],
     queryFn: () => getTeamUsage('7d').then(res => res.data),
     refetchInterval: 60000,
+    enabled: features?.capsuleEnabled !== false && (overview?.costEnabled ?? false),
   });
 
   const { data: projectUsage, isLoading: projectUsageLoading } = useQuery({
     queryKey: ['projectUsage', '7d'],
     queryFn: () => getProjectsUsageReport('7d').then(res => res.data),
     refetchInterval: 60000,
+    enabled: features?.capsuleEnabled !== false && (overview?.costEnabled ?? false),
   });
 
   // Fetch resource configs for display names and units
@@ -158,6 +162,7 @@ const Dashboard: React.FC = () => {
     queryKey: ['quotaAlerts', 80],
     queryFn: () => getQuotaAlerts(80).then(res => res.data.items),
     refetchInterval: 60000,
+    enabled: features?.capsuleEnabled !== false,
   });
 
   // Fetch cost trend
@@ -318,8 +323,8 @@ const Dashboard: React.FC = () => {
       {/* Summary Cards */}
       <Row gutter={[16, 16]}>
         <Col xs={24} sm={12} lg={6}>
-          <Card 
-            hoverable 
+          <Card
+            hoverable
             onClick={() => navigate('/cluster/nodes')}
             className="glass-card"
           >
@@ -331,44 +336,50 @@ const Dashboard: React.FC = () => {
             />
           </Card>
         </Col>
-        <Col xs={24} sm={12} lg={6}>
-          <Card 
-            hoverable 
-            onClick={() => navigate('/teams')}
-            className="glass-card"
-          >
-            <Statistic
-              title="团队数量"
-              value={overview?.totalTeams || 0}
-              prefix={<TeamOutlined />}
-              suffix="个"
-            />
-          </Card>
-        </Col>
-        <Col xs={24} sm={12} lg={6}>
-          <Card 
-            hoverable 
-            onClick={() => navigate('/projects')}
-            className="glass-card"
-          >
-            <Statistic
-              title="项目数量"
-              value={overview?.totalProjects || 0}
-              prefix={<ProjectOutlined />}
-              suffix="个"
-            />
-          </Card>
-        </Col>
-        <Col xs={24} sm={12} lg={6}>
-          <Card className="glass-card">
-            <Statistic
-              title="费用统计"
-              value={overview?.costEnabled ? '已启用' : '未启用'}
-              prefix={<DollarOutlined />}
-              valueStyle={{ color: overview?.costEnabled ? '#52c41a' : '#999' }}
-            />
-          </Card>
-        </Col>
+        {features?.capsuleEnabled !== false && (
+          <>
+            <Col xs={24} sm={12} lg={6}>
+              <Card
+                hoverable
+                onClick={() => navigate('/teams')}
+                className="glass-card"
+              >
+                <Statistic
+                  title="团队数量"
+                  value={overview?.totalTeams || 0}
+                  prefix={<TeamOutlined />}
+                  suffix="个"
+                />
+              </Card>
+            </Col>
+            <Col xs={24} sm={12} lg={6}>
+              <Card
+                hoverable
+                onClick={() => navigate('/projects')}
+                className="glass-card"
+              >
+                <Statistic
+                  title="项目数量"
+                  value={overview?.totalProjects || 0}
+                  prefix={<ProjectOutlined />}
+                  suffix="个"
+                />
+              </Card>
+            </Col>
+          </>
+        )}
+        {features?.costEnabled !== false && (
+          <Col xs={24} sm={12} lg={6}>
+            <Card className="glass-card">
+              <Statistic
+                title="费用统计"
+                value={overview?.costEnabled ? '已启用' : '未启用'}
+                prefix={<DollarOutlined />}
+                valueStyle={{ color: overview?.costEnabled ? '#52c41a' : '#999' }}
+              />
+            </Card>
+          </Col>
+        )}
       </Row>
 
       {/* Node Status and Quota Alerts */}
@@ -522,8 +533,8 @@ const Dashboard: React.FC = () => {
         </Col>
       </Row>
 
-      {/* Team Usage (if cost enabled) */}
-      {overview?.costEnabled && (
+      {/* Team Usage (if cost and capsule enabled) */}
+      {overview?.costEnabled && features?.capsuleEnabled !== false && (
         <Row gutter={[16, 16]} style={{ marginTop: 16 }}>
           <Col xs={24} lg={12}>
             <Card 
diff --git a/web-ui/src/pages/Login/index.tsx b/web-ui/src/pages/Login/index.tsx
index 3480206..a823062 100644
--- a/web-ui/src/pages/Login/index.tsx
+++ b/web-ui/src/pages/Login/index.tsx
@@ -5,6 +5,7 @@ import { useNavigate } from 'react-router-dom';
 import { login, getAuthStatus } from '../../services/api';
 import { useAuth } from '../../contexts/AuthContext';
 import { useTheme } from '../../contexts/ThemeContext';
+import { getApiErrorMessage } from '../../utils/error';
 import './Login.css';
 
 const { Title, Text } = Typography;
@@ -52,7 +53,7 @@ const Login: React.FC = () => {
       navigate('/dashboard', { replace: true });
     } catch (error: unknown) {
       const err = error as { response?: { data?: { error?: string } } };
-      message.error(err.response?.data?.error || '登录失败，请检查用户名和密码');
+      message.error(getApiErrorMessage(err, '登录失败，请检查用户名和密码'));
     } finally {
       setLoading(false);
     }
diff --git a/web-ui/src/pages/Settings/ConfigTransfer.tsx b/web-ui/src/pages/Settings/ConfigTransfer.tsx
new file mode 100644
index 0000000..59ecbf9
--- /dev/null
+++ b/web-ui/src/pages/Settings/ConfigTransfer.tsx
@@ -0,0 +1,484 @@
+import React, { useState } from 'react';
+import {
+  Card,
+  Row,
+  Col,
+  Checkbox,
+  Switch,
+  Button,
+  Upload,
+  Alert,
+  Collapse,
+  Tag,
+  Table,
+  Modal,
+  message,
+  Typography,
+  Space,
+  Spin,
+  Descriptions,
+} from 'antd';
+import {
+  DownloadOutlined,
+  UploadOutlined,
+  InboxOutlined,
+  CheckCircleOutlined,
+  CloseCircleOutlined,
+  WarningOutlined,
+  ExclamationCircleOutlined,
+} from '@ant-design/icons';
+import { useQueryClient } from '@tanstack/react-query';
+import {
+  exportConfig,
+  previewImport,
+  applyImport,
+  ExportConfigData,
+  ImportPreviewResult,
+  SectionPreview,
+} from '../../services/api';
+
+const { Text, Paragraph } = Typography;
+const { Dragger } = Upload;
+
+const SECTION_LABELS: Record<string, string> = {
+  billing: '计费配置',
+  alerts: '告警配置',
+  resources: '资源配置',
+  controlPlane: '控制面配置',
+  initScripts: '节点初始化脚本',
+};
+
+const ALL_SECTIONS = Object.keys(SECTION_LABELS);
+
+const ConfigTransfer: React.FC = () => {
+  const queryClient = useQueryClient();
+
+  // Export state
+  const [exportSections, setExportSections] = useState<string[]>(ALL_SECTIONS);
+  const [includeSensitive, setIncludeSensitive] = useState(false);
+  const [exporting, setExporting] = useState(false);
+
+  // Import state
+  const [importedConfig, setImportedConfig] = useState<ExportConfigData | null>(null);
+  const [previewResult, setPreviewResult] = useState<ImportPreviewResult | null>(null);
+  const [importSections, setImportSections] = useState<string[]>([]);
+  const [previewing, setPreviewing] = useState(false);
+  const [applying, setApplying] = useState(false);
+  const [fileName, setFileName] = useState('');
+
+  // Export the ticked sections and hand the result to the browser as a JSON download.
+  // NOTE(review): assumes response.data is raw text or a Blob, not a parsed object — confirm.
+  const handleExport = async () => {
+    setExporting(true);
+    try {
+      const response = await exportConfig({ sections: exportSections.join(','), includeSensitive });
+      const blob = new Blob([response.data], { type: 'application/json' });
+      const url = URL.createObjectURL(blob);
+      const a = document.createElement('a');
+      a.href = url;
+      // toISOString() minus '-', ':' and 'T' starts with the 14 digits YYYYMMDDHHmmss (UTC).
+      // Slicing 15 chars also kept the '.' before the milliseconds, giving a "..json" suffix.
+      const ts = new Date().toISOString().replace(/[-:T]/g, '').slice(0, 14);
+      a.download = `bison-config-${ts}.json`;
+      a.click();
+      URL.revokeObjectURL(url);
+      message.success('配置导出成功');
+    } catch {
+      message.error('配置导出失败');
+    } finally {
+      setExporting(false);
+    }
+  };
+
+  // Read the selected file, sanity-check its shape, and fetch the server-side import preview.
+  const handleFileUpload = async (file: File) => {
+    // Start from a clean slate so nothing from a previously loaded file lingers.
+    setImportSections([]);
+    setImportedConfig(null);
+    setPreviewResult(null);
+    setFileName(file.name);
+    setPreviewing(true);
+
+    try {
+      const parsed: ExportConfigData = JSON.parse(await file.text());
+
+      if (!(parsed.version && parsed.sections)) {
+        // The `finally` clause below still clears the spinner on this early exit.
+        message.error('无效的配置文件：缺少 version 或 sections 字段');
+        return;
+      }
+
+      setImportedConfig(parsed);
+      const { data: preview } = await previewImport(parsed);
+      setPreviewResult(preview);
+
+      // Pre-tick every section that is both present in the file and valid.
+      const selectable: string[] = [];
+      for (const [name, section] of Object.entries(preview.sections)) {
+        if (section.present && section.valid) selectable.push(name);
+      }
+      setImportSections(selectable);
+    } catch {
+      message.error('文件解析失败，请确认是有效的 Bison 配置文件');
+    } finally {
+      setPreviewing(false);
+    }
+  };
+
+  // Ask for confirmation, listing the chosen sections, before the import is applied.
+  const handleApply = () => {
+    if (!(importedConfig && importSections.length > 0)) return;
+
+    const sectionItems = importSections.map((s) => <li key={s}>{SECTION_LABELS[s] || s}</li>);
+    const body = (
+      <div>
+        <p>即将导入以下配置模块：</p>
+        <ul>{sectionItems}</ul>
+        <p style={{ color: '#ff4d4f' }}>此操作将覆盖对应的当前配置，请确认已备份重要数据。</p>
+      </div>
+    );
+
+    Modal.confirm({
+      title: '确认导入配置',
+      icon: <ExclamationCircleOutlined />,
+      content: body,
+      okText: '确认导入',
+      okType: 'danger',
+      cancelText: '取消',
+      onOk: doApply,
+    });
+  };
+
+  // Send the chosen sections to the server and report the outcome through toast messages.
+  const doApply = async () => {
+    if (!importedConfig) return;
+    setApplying(true);
+    try {
+      const { data: outcome } = await applyImport({
+        config: importedConfig,
+        sections: importSections,
+        preserveSensitive: true,
+      });
+      const appliedAny = outcome.applied.length > 0;
+      if (appliedAny) {
+        message.success(outcome.message);
+        // Refresh every settings query the import may have touched.
+        const staleKeys = [
+          'billingConfig', 'alertConfig', 'resourceConfigs', 'controlPlaneConfig', 'initScripts',
+        ];
+        staleKeys.forEach((key) => queryClient.invalidateQueries({ queryKey: [key] }));
+      }
+      // One toast per warning; an empty list shows nothing.
+      outcome.warnings.forEach((warning) => message.warning(warning));
+      // Nothing was applied: surface the server's message as an error instead.
+      if (!appliedAny) {
+        message.error(outcome.message);
+      }
+    } catch {
+      message.error('配置导入失败');
+    } finally {
+      setApplying(false);
+    }
+  };
+
+  const resetImport = () => {
+    setImportedConfig(null);
+    setPreviewResult(null);
+    setImportSections([]);
+    setFileName('');
+  };
+
+  // Render a current-vs-imported table for a section whose preview reports per-field changes.
+  const renderFieldChanges = (preview: SectionPreview) => {
+    if (!preview.changes || Object.keys(preview.changes).length === 0) {
+      return <Text type="secondary">无变更</Text>;
+    }
+
+    // String() of an object is "[object Object]"; show objects/arrays as JSON, null/undefined as '-'.
+    const formatValue = (val: unknown): string => {
+      if (val === null || val === undefined) return '-';
+      return typeof val === 'object' ? JSON.stringify(val) : String(val);
+    };
+
+    const columns = [
+      { title: '字段', dataIndex: 'field', key: 'field', width: 180 },
+      {
+        title: '当前值',
+        dataIndex: 'current',
+        key: 'current',
+        render: (val: unknown) => <Text type="secondary">{formatValue(val)}</Text>,
+      },
+      {
+        title: '导入值',
+        dataIndex: 'imported',
+        key: 'imported',
+        render: (val: unknown) => <Text strong>{formatValue(val)}</Text>,
+      },
+    ];
+
+    const data = Object.entries(preview.changes)
+      .map(([field, { current, imported }]) => ({ key: field, field, current, imported }));
+    return <Table columns={columns} dataSource={data} pagination={false} size="small" />;
+  };
+
+  // Summarise a list-style section as tagged groups of names: added, modified, removed and
+  // unchanged. Groups that are missing or empty are left out.
+  const renderResourceSummary = (preview: SectionPreview) => {
+    const { summary } = preview;
+    if (!summary) return <Text type="secondary">无变更信息</Text>;
+
+    // One entry per group, in display order. Only the "unchanged" group has an uncoloured tag
+    // and secondary (muted) text for its names.
+    const groups = [
+      { id: 'added', label: '新增', color: 'green', names: summary.added, muted: false },
+      { id: 'modified', label: '修改', color: 'orange', names: summary.modified, muted: false },
+      { id: 'removed', label: '移除', color: 'red', names: summary.removed, muted: false },
+      { id: 'unchanged', label: '未变更', color: undefined, names: summary.unchanged, muted: true },
+    ];
+
+    const rows = groups.map(({ id, label, color, names, muted }) => {
+      if (!names || names.length === 0) return null;
+      return (
+        <div key={id}>
+          <Tag color={color}>
+            {label} ({names.length})
+          </Tag>
+          <Text type={muted ? 'secondary' : undefined}>{names.join(', ')}</Text>
+        </div>
+      );
+    });
+
+    return (
+      <Space direction="vertical" style={{ width: '100%' }}>
+        {rows}
+      </Space>
+    );
+  };
+
+  // Render one section's preview: validation errors and warnings (when present) followed by
+  // the change details.
+  const renderSectionPreview = (sectionKey: string, preview: SectionPreview) => {
+    const { errors, warnings } = preview;
+
+    // List-style sections get a summary of names; all others get a per-field comparison table.
+    const details = ['resources', 'initScripts'].includes(sectionKey)
+      ? renderResourceSummary(preview)
+      : renderFieldChanges(preview);
+
+    // Builds one banner joining the messages with '; '. Only called for non-empty lists.
+    const banner = (type: 'error' | 'warning', lines: string[]) => (
+      <Alert type={type} message={lines.join('; ')} style={{ marginBottom: 8 }} showIcon />
+    );
+
+    // Either list may be absent on the preview, hence the truthiness checks below.
+    return (
+      <div>
+        {errors && errors.length > 0 && banner('error', errors)}
+        {warnings && warnings.length > 0 && banner('warning', warnings)}
+        {/* Change details always come last. */}
+        {details}
+      </div>
+    );
+  };
+
+  return (
+    <Row gutter={[16, 16]}>
+      <Col span={24}>
+        <Card
+          title={
+            <Space>
+              <DownloadOutlined />
+              导出配置
+            </Space>
+          }
+        >
+          <Space direction="vertical" style={{ width: '100%' }} size="middle">
+            <div>
+              <Text strong style={{ display: 'block', marginBottom: 8 }}>
+                选择导出模块
+              </Text>
+              <Checkbox.Group
+                value={exportSections}
+                onChange={(values) => setExportSections(values as string[])}
+              >
+                <Row gutter={[16, 8]}>
+                  {ALL_SECTIONS.map((key) => (
+                    <Col key={key} xs={12} sm={8} md={6}>
+                      <Checkbox value={key}>{SECTION_LABELS[key]}</Checkbox>
+                    </Col>
+                  ))}
+                </Row>
+              </Checkbox.Group>
+            </div>
+
+            <div>
+              <Space>
+                <Switch
+                  checked={includeSensitive}
+                  onChange={setIncludeSensitive}
+                />
+                <Text>包含敏感数据（密码、私钥、Webhook 地址）</Text>
+              </Space>
+              {includeSensitive && (
+                <Alert
+                  type="warning"
+                  message="导出文件将包含明文密码和私钥等敏感信息，请妥善保管导出文件。"
+                  style={{ marginTop: 8 }}
+                  showIcon
+                />
+              )}
+            </div>
+
+            <Button
+              type="primary"
+              icon={<DownloadOutlined />}
+              onClick={handleExport}
+              loading={exporting}
+              disabled={exportSections.length === 0}
+            >
+              导出配置
+            </Button>
+          </Space>
+        </Card>
+      </Col>
+
+      <Col span={24}>
+        <Card
+          title={
+            <Space>
+              <UploadOutlined />
+              导入配置
+            </Space>
+          }
+          extra={
+            previewResult && (
+              <Button size="small" onClick={resetImport}>
+                重新选择文件
+              </Button>
+            )
+          }
+        >
+          {!previewResult && !previewing && (
+            <Dragger
+              accept=".json"
+              showUploadList={false}
+              beforeUpload={(file) => {
+                handleFileUpload(file);
+                return false;
+              }}
+            >
+              <p className="ant-upload-drag-icon">
+                <InboxOutlined />
+              </p>
+              <p className="ant-upload-text">点击或拖拽 JSON 配置文件到此处</p>
+              <p className="ant-upload-hint">支持 Bison 导出的 .json 配置文件</p>
+            </Dragger>
+          )}
+
+          {previewing && (
+            <div style={{ textAlign: 'center', padding: 40 }}>
+              <Spin tip="正在解析配置文件..." />
+            </div>
+          )}
+
+          {previewResult && (
+            <Space direction="vertical" style={{ width: '100%' }} size="middle">
+              {/* File info */}
+              <Descriptions size="small" column={3} bordered>
+                <Descriptions.Item label="文件名">{fileName}</Descriptions.Item>
+                <Descriptions.Item label="版本">{previewResult.version}</Descriptions.Item>
+                <Descriptions.Item label="导出时间">
+                  {previewResult.exportedAt || '-'}
+                </Descriptions.Item>
+              </Descriptions>
+
+              {/* Global validation status */}
+              {previewResult.valid ? (
+                <Alert
+                  type="success"
+                  message="配置文件校验通过"
+                  icon={<CheckCircleOutlined />}
+                  showIcon
+                />
+              ) : (
+                <Alert
+                  type="error"
+                  message="配置文件校验失败"
+                  description={previewResult.errors.join('; ')}
+                  icon={<CloseCircleOutlined />}
+                  showIcon
+                />
+              )}
+
+              {previewResult.warnings.length > 0 && (
+                <Alert
+                  type="warning"
+                  message={previewResult.warnings.join('; ')}
+                  icon={<WarningOutlined />}
+                  showIcon
+                />
+              )}
+
+              {/* Section previews */}
+              <div>
+                <Text strong style={{ display: 'block', marginBottom: 8 }}>
+                  配置模块预览
+                </Text>
+                <Checkbox.Group
+                  value={importSections}
+                  onChange={(values) => setImportSections(values as string[])}
+                  style={{ width: '100%' }}
+                >
+                  <Collapse>
+                    {Object.entries(previewResult.sections).map(([key, preview]) => (
+                      <Collapse.Panel
+                        key={key}
+                        header={
+                          <Space>
+                            <Checkbox
+                              value={key}
+                              disabled={!preview.valid}
+                              onClick={(e) => e.stopPropagation()}
+                            />
+                            <span>{SECTION_LABELS[key] || key}</span>
+                            {preview.valid ? (
+                              <Tag color="success">有效</Tag>
+                            ) : (
+                              <Tag color="error">无效</Tag>
+                            )}
+                            {preview.hasSensitiveData && (
+                              <Tag color="warning">含脱敏数据</Tag>
+                            )}
+                          </Space>
+                        }
+                      >
+                        {renderSectionPreview(key, preview)}
+                      </Collapse.Panel>
+                    ))}
+                  </Collapse>
+                </Checkbox.Group>
+              </div>
+
+              <Paragraph type="secondary">
+                脱敏的敏感数据（密码、私钥等）在导入时将自动保留当前集群中的值。
+              </Paragraph>
+
+              <Button
+                type="primary"
+                danger
+                icon={<UploadOutlined />}
+                onClick={handleApply}
+                loading={applying}
+                disabled={importSections.length === 0 || !previewResult.valid}
+              >
+                应用选中的配置 ({importSections.length} 个模块)
+              </Button>
+            </Space>
+          )}
+        </Card>
+      </Col>
+    </Row>
+  );
+};
+
+export default ConfigTransfer;
diff --git a/web-ui/src/pages/Settings/ControlPlaneConfig.tsx b/web-ui/src/pages/Settings/ControlPlaneConfig.tsx
new file mode 100644
index 0000000..fabdae3
--- /dev/null
+++ b/web-ui/src/pages/Settings/ControlPlaneConfig.tsx
@@ -0,0 +1,234 @@
+import React, { useEffect, useState } from 'react';
+import {
+  Card,
+  Form,
+  Input,
+  InputNumber,
+  Select,
+  Button,
+  Space,
+  message,
+  Alert,
+  Typography,
+  Tag,
+  Spin,
+} from 'antd';
+import {
+  CloudServerOutlined,
+  SafetyCertificateOutlined,
+  CheckCircleOutlined,
+  CloseCircleOutlined,
+} from '@ant-design/icons';
+import { useQuery, useMutation, useQueryClient } from '@tanstack/react-query';
+import {
+  getControlPlaneConfig,
+  updateControlPlaneConfig,
+  testControlPlaneConnection,
+} from '../../services/api';
+
+const { TextArea } = Input;
+const { Paragraph, Text } = Typography;
+
+const ControlPlaneConfig: React.FC = () => {
+  const [form] = Form.useForm();
+  const queryClient = useQueryClient();
+  const [authMethod, setAuthMethod] = useState<'password' | 'privateKey'>('password');
+  const [testResult, setTestResult] = useState<'success' | 'error' | null>(null);
+
+  const { data: config, isLoading } = useQuery({
+    queryKey: ['controlPlaneConfig'],
+    queryFn: () => getControlPlaneConfig().then(res => res.data),
+  });
+
+  useEffect(() => {
+    if (config) {
+      form.setFieldsValue({
+        host: config.host,
+        sshPort: config.sshPort || 22,
+        sshUser: config.sshUser || 'root',
+        authMethod: config.authMethod || 'password',
+      });
+      setAuthMethod(config.authMethod || 'password');
+    }
+  }, [config, form]);
+
+  const updateMutation = useMutation({
+    mutationFn: updateControlPlaneConfig,
+    onSuccess: () => {
+      message.success('控制面配置已保存');
+      queryClient.invalidateQueries({ queryKey: ['controlPlaneConfig'] });
+      setTestResult(null);
+    },
+    onError: (err: Error) => {
+      message.error(`保存失败: ${err.message}`);
+    },
+  });
+
+  const testMutation = useMutation({
+    mutationFn: testControlPlaneConnection,
+    onSuccess: () => {
+      setTestResult('success');
+      message.success('连接测试成功');
+    },
+    onError: (err: Error) => {
+      setTestResult('error');
+      message.error(`连接测试失败: ${err.message}`);
+    },
+  });
+
+  // Validate, then save. A failed validation rejects the promise; the form already shows the
+  // field errors, so the rejection is handled with a no-op instead of being left uncaught.
+  const handleSave = () => {
+    form.validateFields().then(values => updateMutation.mutate(values), () => undefined);
+  };
+
+  // Save the current form values first, then run the connection test once the save succeeds.
+  // A failed validation rejects validateFields(); the form already shows the field errors, so
+  // the rejection is handled with a no-op instead of surfacing as an unhandled rejection.
+  const handleTest = () => {
+    const runTest = () => testMutation.mutate();
+    form.validateFields().then(
+      values => updateMutation.mutate(values, { onSuccess: runTest }),
+      () => undefined,
+    );
+  };
+
+  if (isLoading) {
+    return (
+      <div style={{ textAlign: 'center', padding: 50 }}>
+        <Spin size="large" />
+      </div>
+    );
+  }
+
+  return (
+    <div>
+      <Alert
+        message="控制面 SSH 配置"
+        description={
+          <Paragraph style={{ marginBottom: 0 }}>
+            配置 Kubernetes 控制面节点的 SSH 访问信息，用于在添加节点时执行
+            <Text code>kubeadm token create</Text> 命令生成加入令牌。
+            请确保控制面节点上已安装 kubeadm。
+          </Paragraph>
+        }
+        type="info"
+        showIcon
+        style={{ marginBottom: 24 }}
+      />
+
+      <Card className="glass-card">
+        <Form
+          form={form}
+          layout="vertical"
+          initialValues={{
+            sshPort: 22,
+            sshUser: 'root',
+            authMethod: 'password',
+          }}
+        >
+          <Form.Item
+            name="host"
+            label={
+              <Space>
+                <CloudServerOutlined />
+                控制面节点 IP/主机名
+              </Space>
+            }
+            rules={[{ required: true, message: '请输入控制面节点地址' }]}
+          >
+            <Input placeholder="如：192.168.1.100 或 k8s-master" />
+          </Form.Item>
+
+          <Space size="large" style={{ width: '100%' }}>
+            <Form.Item
+              name="sshPort"
+              label="SSH 端口"
+              rules={[{ required: true }]}
+              style={{ width: 150 }}
+            >
+              <InputNumber min={1} max={65535} style={{ width: '100%' }} />
+            </Form.Item>
+
+            <Form.Item
+              name="sshUser"
+              label="SSH 用户名"
+              rules={[{ required: true }]}
+              style={{ width: 200 }}
+            >
+              <Input placeholder="root" />
+            </Form.Item>
+          </Space>
+
+          <Form.Item
+            name="authMethod"
+            label={
+              <Space>
+                <SafetyCertificateOutlined />
+                认证方式
+              </Space>
+            }
+            rules={[{ required: true }]}
+          >
+            <Select onChange={(value) => setAuthMethod(value)}>
+              <Select.Option value="password">密码</Select.Option>
+              <Select.Option value="privateKey">私钥</Select.Option>
+            </Select>
+          </Form.Item>
+
+          {authMethod === 'password' ? (
+            <Form.Item
+              name="password"
+              label="密码"
+              extra={config?.hasPassword ? <Tag color="green">已配置密码</Tag> : null}
+            >
+              <Input.Password placeholder="留空则保留原密码" />
+            </Form.Item>
+          ) : (
+            <Form.Item
+              name="privateKey"
+              label="私钥内容"
+              extra={config?.hasPrivateKey ? <Tag color="green">已配置私钥</Tag> : null}
+            >
+              <TextArea
+                rows={8}
+                placeholder="-----BEGIN RSA PRIVATE KEY-----&#10;...&#10;-----END RSA PRIVATE KEY-----"
+                style={{ fontFamily: 'monospace', fontSize: 12 }}
+              />
+            </Form.Item>
+          )}
+
+          {testResult && (
+            <Alert
+              message={testResult === 'success' ? '连接测试成功' : '连接测试失败'}
+              type={testResult === 'success' ? 'success' : 'error'}
+              showIcon
+              icon={testResult === 'success' ? <CheckCircleOutlined /> : <CloseCircleOutlined />}
+              style={{ marginBottom: 16 }}
+            />
+          )}
+
+          <Form.Item>
+            <Space>
+              <Button
+                type="primary"
+                onClick={handleSave}
+                loading={updateMutation.isPending}
+              >
+                保存配置
+              </Button>
+              <Button
+                onClick={handleTest}
+                loading={testMutation.isPending || updateMutation.isPending}
+              >
+                测试连接
+              </Button>
+            </Space>
+          </Form.Item>
+        </Form>
+      </Card>
+    </div>
+  );
+};
+
+export default ControlPlaneConfig;
diff --git a/web-ui/src/pages/Settings/GeneralSettings.tsx b/web-ui/src/pages/Settings/GeneralSettings.tsx
index 59cfe08..1d11b63 100644
--- a/web-ui/src/pages/Settings/GeneralSettings.tsx
+++ b/web-ui/src/pages/Settings/GeneralSettings.tsx
@@ -1,6 +1,6 @@
 import React from 'react';
 import { Card, Descriptions, Typography, Alert, Spin, Tag } from 'antd';
-import { CloudOutlined, LineChartOutlined, DollarOutlined } from '@ant-design/icons';
+import { CloudOutlined, LineChartOutlined, DollarOutlined, ApartmentOutlined } from '@ant-design/icons';
 import { useQuery } from '@tanstack/react-query';
 import { getSettings, getFeatures } from '../../services/api';
 
@@ -71,11 +71,26 @@ const GeneralSettings: React.FC = () => {
               )}
             </Descriptions.Item>
 
-            <Descriptions.Item 
+            <Descriptions.Item
+              label={
+                <span>
+                  <ApartmentOutlined style={{ marginRight: 8 }} />
+                  Capsule 多租户
+                </span>
+              }
+            >
+              {features?.capsuleEnabled ? (
+                <Tag color="success">已启用</Tag>
+              ) : (
+                <Tag color="default">未启用</Tag>
+              )}
+            </Descriptions.Item>
+
+            <Descriptions.Item
               label={
                 <span>
                   <CloudOutlined style={{ marginRight: 8 }} />
-                  费用统计
+                  费用统计 (OpenCost)
                 </span>
               }
             >
@@ -85,6 +100,21 @@ const GeneralSettings: React.FC = () => {
                 <Tag color="default">未启用</Tag>
               )}
             </Descriptions.Item>
+
+            <Descriptions.Item
+              label={
+                <span>
+                  <LineChartOutlined style={{ marginRight: 8 }} />
+                  Prometheus 监控
+                </span>
+              }
+            >
+              {features?.prometheusEnabled ? (
+                <Tag color="success">已启用</Tag>
+              ) : (
+                <Tag color="default">未启用</Tag>
+              )}
+            </Descriptions.Item>
           </Descriptions>
 
           <div style={{ marginTop: 24 }}>
diff --git a/web-ui/src/pages/Settings/NodeInitConfig.tsx b/web-ui/src/pages/Settings/NodeInitConfig.tsx
new file mode 100644
index 0000000..5fef97f
--- /dev/null
+++ b/web-ui/src/pages/Settings/NodeInitConfig.tsx
@@ -0,0 +1,504 @@
+import React, { useState } from 'react';
+import {
+  Card,
+  Form,
+  Input,
+  Select,
+  Button,
+  Space,
+  Switch,
+  message,
+  Alert,
+  Typography,
+  Spin,
+  Tag,
+  Table,
+  Modal,
+  Popconfirm,
+  Tooltip,
+  Collapse,
+  Empty,
+} from 'antd';
+import {
+  PlusOutlined,
+  EditOutlined,
+  DeleteOutlined,
+  CodeOutlined,
+} from '@ant-design/icons';
+import { useQuery, useMutation, useQueryClient } from '@tanstack/react-query';
+import {
+  getInitScripts,
+  createInitScript,
+  updateInitScript,
+  deleteInitScript,
+  toggleInitScript,
+  ScriptGroup,
+  Script,
+  ScriptPhase,
+} from '../../services/api';
+
+const { TextArea } = Input;
+const { Text, Paragraph } = Typography;
+const { Panel } = Collapse;
+
+const phaseLabels: Record<ScriptPhase, string> = {
+  'pre-join': 'Pre-join',
+  'post-join': 'Post-join',
+};
+
+const phaseColors: Record<ScriptPhase, string> = {
+  'pre-join': 'blue',
+  'post-join': 'green',
+};
+
+// Platform script editor component
+interface PlatformScriptEditorProps {
+  scripts: Script[];
+  onChange: (scripts: Script[]) => void;
+}
+
+const PlatformScriptEditor: React.FC<PlatformScriptEditorProps> = ({
+  scripts,
+  onChange,
+}) => {
+  const [editingScript, setEditingScript] = useState<Script | null>(null);
+  const [editModalVisible, setEditModalVisible] = useState(false);
+  const [form] = Form.useForm();
+
+  const osList = [
+    { value: '*', label: '通用 (所有系统)' },
+    { value: 'ubuntu', label: 'Ubuntu' },
+    { value: 'centos', label: 'CentOS' },
+    { value: 'debian', label: 'Debian' },
+    { value: 'rhel', label: 'RHEL' },
+    { value: 'openEuler', label: 'openEuler' },
+    { value: 'rocky', label: 'Rocky Linux' },
+    { value: 'almalinux', label: 'AlmaLinux' },
+    { value: 'kylin', label: 'Kylin' },
+    { value: 'uos', label: 'UOS (统信)' },
+  ];
+  const archList = [
+    { value: '*', label: '通用 (所有架构)' },
+    { value: 'amd64', label: 'amd64 (x86_64)' },
+    { value: 'arm64', label: 'arm64 (aarch64)' },
+  ];
+
+  const handleAdd = () => {
+    setEditingScript(null);
+    form.resetFields();
+    form.setFieldsValue({ os: '*', arch: '*', content: '#!/bin/bash\nset -e\n\n' });
+    setEditModalVisible(true);
+  };
+
+  const handleEdit = (script: Script) => {
+    setEditingScript(script);
+    form.setFieldsValue(script);
+    setEditModalVisible(true);
+  };
+
+  const handleDelete = (scriptId: string) => {
+    onChange(scripts.filter(s => s.id !== scriptId));
+  };
+
+  // Validate the modal form, then add a new script or merge the edits into the existing one.
+  const handleSave = () => {
+    form.validateFields().then(
+      values => {
+        const next = editingScript
+          ? scripts.map(s => (s.id === editingScript.id ? { ...s, ...values } : s))
+          : [...scripts, { id: `script-${Date.now()}`, ...values }];
+        onChange(next);
+        setEditModalVisible(false);
+      },
+      // Validation failed: errors are shown in the form; swallow the rejection, keep the modal open.
+      () => undefined,
+    );
+  };
+
+  // Human-readable "os × arch" label; a '*' wildcard is replaced by its descriptive text.
+  const getPlatformLabel = (os: string, arch: string) => {
+    const wildcard = (value: string, text: string) => (value === '*' ? text : value);
+    return `${wildcard(os, '通用')} × ${wildcard(arch, '所有架构')}`;
+  };
+
+  return (
+    <div>
+      <div style={{ marginBottom: 16 }}>
+        <Button type="dashed" icon={<PlusOutlined />} onClick={handleAdd}>
+          添加平台脚本
+        </Button>
+      </div>
+
+      {scripts.length === 0 ? (
+        <Empty description="暂无平台脚本" image={Empty.PRESENTED_IMAGE_SIMPLE} />
+      ) : (
+        <Collapse>
+          {scripts.map(script => (
+            <Panel
+              key={script.id}
+              header={
+                <Space>
+                  <Tag color={script.os === '*' && script.arch === '*' ? 'default' : 'blue'}>
+                    {getPlatformLabel(script.os, script.arch)}
+                  </Tag>
+                </Space>
+              }
+              extra={
+                <Space onClick={e => e.stopPropagation()}>
+                  <Button
+                    type="text"
+                    size="small"
+                    icon={<EditOutlined />}
+                    onClick={() => handleEdit(script)}
+                  />
+                  <Popconfirm
+                    title="确定删除此平台脚本？"
+                    onConfirm={() => handleDelete(script.id)}
+                  >
+                    <Button type="text" size="small" danger icon={<DeleteOutlined />} />
+                  </Popconfirm>
+                </Space>
+              }
+            >
+              <pre style={{
+                background: '#f5f5f5',
+                padding: 12,
+                borderRadius: 4,
+                maxHeight: 200,
+                overflow: 'auto',
+                fontSize: 12,
+              }}>
+                {script.content}
+              </pre>
+            </Panel>
+          ))}
+        </Collapse>
+      )}
+
+      <Modal
+        title={editingScript ? '编辑平台脚本' : '添加平台脚本'}
+        open={editModalVisible}
+        onOk={handleSave}
+        onCancel={() => setEditModalVisible(false)}
+        width={700}
+      >
+        <Form form={form} layout="vertical">
+          <Space style={{ width: '100%' }} size="large">
+            <Form.Item name="os" label="操作系统" rules={[{ required: true }]} style={{ width: 220 }}>
+              <Select
+                showSearch
+                optionFilterProp="label"
+                options={osList}
+                placeholder="选择或输入操作系统"
+              />
+            </Form.Item>
+            <Form.Item name="arch" label="CPU 架构" rules={[{ required: true }]} style={{ width: 200 }}>
+              <Select options={archList} />
+            </Form.Item>
+          </Space>
+          <Text type="secondary" style={{ display: 'block', marginBottom: 16 }}>
+            操作系统名称来自节点的 /etc/os-release 文件中的 ID 字段。如果列表中没有你需要的系统，可以先添加一个节点，查看检测到的系统名称后再配置脚本。
+          </Text>
+          <Form.Item
+            name="content"
+            label="脚本内容"
+            rules={[{ required: true, message: '请输入脚本内容' }]}
+          >
+            <TextArea
+              rows={15}
+              style={{ fontFamily: 'monospace', fontSize: 12 }}
+              placeholder="#!/bin/bash&#10;set -e&#10;&#10;# Your script here"
+            />
+          </Form.Item>
+        </Form>
+      </Modal>
+    </div>
+  );
+};
+
+// ==================== Main Component ====================
+
+const NodeInitConfig: React.FC = () => {
+  const queryClient = useQueryClient();
+
+  const [scriptModalVisible, setScriptModalVisible] = useState(false);
+  const [editingGroup, setEditingGroup] = useState<ScriptGroup | null>(null);
+  const [scriptForm] = Form.useForm();
+  const [scripts, setScripts] = useState<Script[]>([]);
+
+  const { data: scriptGroups, isLoading } = useQuery({
+    queryKey: ['initScripts'],
+    queryFn: () => getInitScripts().then(res => res.data.items),
+  });
+
+  const toggleMutation = useMutation({
+    mutationFn: ({ id, enabled }: { id: string; enabled: boolean }) =>
+      toggleInitScript(id, enabled),
+    onSuccess: () => {
+      queryClient.invalidateQueries({ queryKey: ['initScripts'] });
+    },
+    onError: (err: Error) => {
+      message.error(`操作失败: ${err.message}`);
+    },
+  });
+
+  const createMutation = useMutation({
+    mutationFn: createInitScript,
+    onSuccess: () => {
+      message.success('脚本分组创建成功');
+      queryClient.invalidateQueries({ queryKey: ['initScripts'] });
+      setScriptModalVisible(false);
+    },
+    onError: (err: Error) => {
+      message.error(`创建失败: ${err.message}`);
+    },
+  });
+
+  const updateScriptMutation = useMutation({ // updates an existing script group by id
+    mutationFn: ({ id, data }: { id: string; data: Partial<ScriptGroup> }) =>
+      updateInitScript(id, data),
+    onSuccess: () => {
+      message.success('脚本分组更新成功');
+      queryClient.invalidateQueries({ queryKey: ['initScripts'] }); // same key as the list query, so the table refetches
+      setScriptModalVisible(false); // the modal closes only after a successful save; on error it stays open
+    },
+    onError: (err: Error) => {
+      message.error(`更新失败: ${err.message}`); // NOTE(review): for axios errors this may be the generic status text, not the backend error body — confirm
+    },
+  });
+
+  const deleteMutation = useMutation({ // deletes a script group; the mutation variable is the group id
+    mutationFn: deleteInitScript,
+    onSuccess: () => {
+      message.success('脚本分组已删除');
+      queryClient.invalidateQueries({ queryKey: ['initScripts'] }); // same key as the list query, so the table refetches
+    },
+    onError: (err: Error) => {
+      message.error(`删除失败: ${err.message}`); // NOTE(review): for axios errors this may be the generic status text, not the backend error body — confirm
+    },
+  });
+
+  const handleAddScript = () => { // opens the modal in "create" mode
+    setEditingGroup(null); // null selects the create title and the create branch of the save handler
+    setScripts([]); // start with no platform scripts
+    scriptForm.resetFields(); // reset first, then apply the defaults below
+    scriptForm.setFieldsValue({ phase: 'pre-join', enabled: true }); // defaults for a new group
+    setScriptModalVisible(true);
+  };
+
+  // Open the modal in edit mode, seeding the form and the script list from `group`.
+  const handleEditScript = (group: ScriptGroup) => {
+    const { name, description, phase, enabled, scripts: groupScripts } = group;
+
+    setEditingGroup(group);
+    // Fall back to an empty list when the group carries no scripts.
+    setScripts(groupScripts || []);
+    scriptForm.setFieldsValue({ name, description, phase, enabled });
+
+    setScriptModalVisible(true);
+  };
+
+  // Validate the form, then create or update the group using the scripts held in state.
+  const handleSaveScript = async () => {
+    // A failed validation rejects the promise; the form already shows the rule messages
+    // on the fields, so turn the rejection into null rather than leaving it unhandled.
+    const values = await scriptForm.validateFields().catch(() => null);
+    if (!values) return;
+
+    const data = { ...values, scripts };
+    if (editingGroup) {
+      updateScriptMutation.mutate({ id: editingGroup.id, data });
+    } else {
+      createMutation.mutate(data);
+    }
+  };
+
+  // Build the text for the platforms column: one label per script in the group,
+  // comma-separated, or the "none" placeholder when the group has no scripts.
+  const getSupportedPlatforms = (group: ScriptGroup) => {
+    const entries = group.scripts;
+    if (!entries || entries.length === 0) return '无';
+
+    // A script that is wildcard on both OS and arch gets the generic label.
+    const describe = ({ os, arch }: Script) =>
+      os === '*' && arch === '*' ? '通用' : `${os}×${arch}`;
+
+    return entries.map(describe).join(', ');
+  };
+
+  const scriptColumns = [
+    {
+      title: '脚本名称',
+      dataIndex: 'name',
+      key: 'name',
+      render: (name: string, record: ScriptGroup) => (
+        <Space>
+          <CodeOutlined />
+          <span>{name}</span>
+          {record.builtin && <Tag>内置</Tag>}
+        </Space>
+      ),
+    },
+    {
+      title: '执行阶段',
+      dataIndex: 'phase',
+      key: 'phase',
+      width: 120,
+      render: (phase: ScriptPhase) => (
+        <Tag color={phaseColors[phase]}>{phaseLabels[phase]}</Tag>
+      ),
+    },
+    {
+      title: '支持平台',
+      key: 'platforms',
+      width: 250,
+      render: (_: unknown, record: ScriptGroup) => (
+        <Text type="secondary" style={{ fontSize: 12 }}>
+          {getSupportedPlatforms(record)}
+        </Text>
+      ),
+    },
+    {
+      title: '状态',
+      dataIndex: 'enabled',
+      key: 'enabled',
+      width: 100,
+      render: (enabled: boolean, record: ScriptGroup) => (
+        <Switch
+          checked={enabled}
+          onChange={(checked) => toggleMutation.mutate({ id: record.id, enabled: checked })}
+          checkedChildren="启用"
+          unCheckedChildren="禁用"
+        />
+      ),
+    },
+    {
+      title: '操作',
+      key: 'actions',
+      width: 120,
+      render: (_: unknown, record: ScriptGroup) => (
+        <Space>
+          <Tooltip title="编辑">
+            <Button
+              type="text"
+              icon={<EditOutlined />}
+              onClick={() => handleEditScript(record)}
+            />
+          </Tooltip>
+          {!record.builtin && (
+            <Popconfirm
+              title="确定删除此脚本分组？"
+              onConfirm={() => deleteMutation.mutate(record.id)}
+            >
+              <Tooltip title="删除">
+                <Button type="text" danger icon={<DeleteOutlined />} />
+              </Tooltip>
+            </Popconfirm>
+          )}
+        </Space>
+      ),
+    },
+  ];
+
+  if (isLoading) {
+    return (
+      <div style={{ textAlign: 'center', padding: 50 }}>
+        <Spin size="large" />
+      </div>
+    );
+  }
+
+  return (
+    <div>
+      <Alert
+        message="节点初始化配置"
+        description={
+          <div>
+            <Paragraph style={{ marginBottom: 8 }}>
+              初始化脚本在节点加入集群时自动执行。Pre-join 脚本在 kubeadm join 之前执行（如配置私有仓库、禁用防火墙），
+              Post-join 脚本在节点加入集群后执行（如安装驱动、添加标签）。
+            </Paragraph>
+            <Paragraph style={{ marginBottom: 8 }}>
+              <strong>平台匹配：</strong>系统会自动检测节点的操作系统和 CPU 架构，按优先级匹配脚本：
+              精确匹配 &gt; OS 通用 &gt; 架构通用 &gt; 全通用。
+            </Paragraph>
+            <Paragraph style={{ marginBottom: 0 }}>
+              <strong>支持的系统：</strong>Ubuntu、CentOS、Debian、RHEL、openEuler、Rocky Linux、AlmaLinux、Kylin、UOS 等。
+              系统名称来自 /etc/os-release 的 ID 字段。
+            </Paragraph>
+          </div>
+        }
+        type="info"
+        showIcon
+        style={{ marginBottom: 24 }}
+      />
+
+      <Card
+        className="glass-card"
+        title="脚本分组"
+        extra={
+          <Button type="primary" icon={<PlusOutlined />} onClick={handleAddScript}>
+            新建分组
+          </Button>
+        }
+      >
+        <Table
+          columns={scriptColumns}
+          dataSource={scriptGroups}
+          rowKey="id"
+          loading={isLoading}
+          pagination={false}
+        />
+      </Card>
+
+      <Modal
+        title={editingGroup ? '编辑脚本分组' : '新建脚本分组'}
+        open={scriptModalVisible}
+        onOk={handleSaveScript}
+        onCancel={() => setScriptModalVisible(false)}
+        width={800}
+        confirmLoading={createMutation.isPending || updateScriptMutation.isPending}
+      >
+        <Form form={scriptForm} layout="vertical">
+          <Form.Item
+            name="name"
+            label="分组名称"
+            rules={[{ required: true, message: '请输入分组名称' }]}
+          >
+            <Input placeholder="如：配置私有镜像仓库" />
+          </Form.Item>
+          <Form.Item name="description" label="描述">
+            <Input placeholder="简要描述此脚本的功能" />
+          </Form.Item>
+          <Form.Item
+            name="phase"
+            label="执行阶段"
+            rules={[{ required: true }]}
+          >
+            <Select>
+              <Select.Option value="pre-join">Pre-join（kubeadm join 之前）</Select.Option>
+              <Select.Option value="post-join">Post-join（kubeadm join 之后）</Select.Option>
+            </Select>
+          </Form.Item>
+
+          <Form.Item label="平台脚本">
+            <PlatformScriptEditor scripts={scripts} onChange={setScripts} />
+          </Form.Item>
+
+          <Alert
+            message="支持的变量"
+            description={
+              <Text code>
+                {'${NODE_IP}'}, {'${NODE_NAME}'}, {'${REGISTRY_URL}'}, {'${CONTROL_PLANE_IP}'}
+              </Text>
+            }
+            type="info"
+            style={{ marginTop: 16 }}
+          />
+        </Form>
+      </Modal>
+    </div>
+  );
+};
+
+export default NodeInitConfig;
diff --git a/web-ui/src/pages/Settings/ResourceConfig.tsx b/web-ui/src/pages/Settings/ResourceConfig.tsx
index abdaccc..118a0f3 100644
--- a/web-ui/src/pages/Settings/ResourceConfig.tsx
+++ b/web-ui/src/pages/Settings/ResourceConfig.tsx
@@ -1,4 +1,5 @@
 import React, { useState } from 'react';
+import { getApiErrorMessage } from '../../utils/error';
 import {
   Card,
   Table,
@@ -72,7 +73,6 @@ const ResourceConfig: React.FC = () => {
   // Sync fetched data to local state
   React.useEffect(() => {
     if (configsData) {
-      console.log('Loaded configs from API:', configsData);
       setConfigs(configsData);
       setHasChanges(false);
     }
@@ -95,7 +95,7 @@ const ResourceConfig: React.FC = () => {
       setHasChanges(false);
     },
     onError: (error: any) => {
-      const errorMsg = error?.response?.data?.error || error?.message || '未知错误';
+      const errorMsg = getApiErrorMessage(error, '未知错误');
       message.error(`保存失败: ${errorMsg}`);
       console.error('Save error:', error);
     },
@@ -169,7 +169,6 @@ const ResourceConfig: React.FC = () => {
       ...cfg,
       divisor: cfg.divisor && cfg.divisor > 0 ? cfg.divisor : 1,
     }));
-    console.log('Saving configs:', validConfigs);
     saveMutation.mutate(validConfigs);
   };
 
diff --git a/web-ui/src/pages/Settings/index.tsx b/web-ui/src/pages/Settings/index.tsx
index f43a674..b931a03 100644
--- a/web-ui/src/pages/Settings/index.tsx
+++ b/web-ui/src/pages/Settings/index.tsx
@@ -1,12 +1,15 @@
 import React from 'react';
 import { Tabs, Typography } from 'antd';
-import { 
-  SettingOutlined, 
-  DollarOutlined, 
-  BellOutlined, 
+import {
+  SettingOutlined,
+  DollarOutlined,
+  BellOutlined,
   DashboardOutlined,
   CloudOutlined,
   AppstoreOutlined,
+  CloudServerOutlined,
+  ToolOutlined,
+  SwapOutlined,
 } from '@ant-design/icons';
 import { Routes, Route, useNavigate, useLocation } from 'react-router-dom';
 import BillingConfig from './BillingConfig';
@@ -14,18 +17,26 @@ import AlertConfig from './AlertConfig';
 import SystemStatus from './SystemStatus';
 import GeneralSettings from './GeneralSettings';
 import ResourceConfig from './ResourceConfig';
+import ControlPlaneConfig from './ControlPlaneConfig';
+import NodeInitConfig from './NodeInitConfig';
+import ConfigTransfer from './ConfigTransfer';
+import { useFeatures } from '../../hooks/useFeatures';
 
 const { Title } = Typography;
 
 const Settings: React.FC = () => {
   const navigate = useNavigate();
   const location = useLocation();
+  const { data: features } = useFeatures();
 
   const getCurrentTab = () => {
     const path = location.pathname;
     if (path.includes('/settings/resources')) return 'resources';
     if (path.includes('/settings/billing')) return 'billing';
     if (path.includes('/settings/alerts')) return 'alerts';
+    if (path.includes('/settings/control-plane')) return 'control-plane';
+    if (path.includes('/settings/node-init')) return 'node-init';
+    if (path.includes('/settings/transfer')) return 'transfer';
     if (path.includes('/settings/status')) return 'status';
     return 'general';
   };
@@ -49,7 +60,7 @@ const Settings: React.FC = () => {
         </span>
       ),
     },
-    {
+    ...(features?.costEnabled !== false ? [{
       key: 'billing',
       label: (
         <span>
@@ -57,8 +68,8 @@ const Settings: React.FC = () => {
           计费配置
         </span>
       ),
-    },
-    {
+    }] : []),
+    ...(features?.capsuleEnabled !== false ? [{
       key: 'alerts',
       label: (
         <span>
@@ -66,6 +77,33 @@ const Settings: React.FC = () => {
           告警配置
         </span>
       ),
+    }] : []),
+    {
+      key: 'control-plane',
+      label: (
+        <span>
+          <CloudServerOutlined />
+          控制面配置
+        </span>
+      ),
+    },
+    {
+      key: 'node-init',
+      label: (
+        <span>
+          <ToolOutlined />
+          节点初始化配置
+        </span>
+      ),
+    },
+    {
+      key: 'transfer',
+      label: (
+        <span>
+          <SwapOutlined />
+          配置迁移
+        </span>
+      ),
     },
     {
       key: 'status',
@@ -105,6 +143,9 @@ const Settings: React.FC = () => {
           <Route path="resources" element={<ResourceConfig />} />
           <Route path="billing" element={<BillingConfig />} />
           <Route path="alerts" element={<AlertConfig />} />
+          <Route path="control-plane" element={<ControlPlaneConfig />} />
+          <Route path="node-init" element={<NodeInitConfig />} />
+          <Route path="transfer" element={<ConfigTransfer />} />
           <Route path="status" element={<SystemStatus />} />
         </Routes>
       </div>
diff --git a/web-ui/src/pages/Team/TeamCreate.tsx b/web-ui/src/pages/Team/TeamCreate.tsx
index 4b494f7..2cca73e 100644
--- a/web-ui/src/pages/Team/TeamCreate.tsx
+++ b/web-ui/src/pages/Team/TeamCreate.tsx
@@ -1,5 +1,6 @@
 import { CloudServerOutlined, DeleteOutlined, PlusOutlined, TeamOutlined, UserOutlined } from '@ant-design/icons';
 import { useMutation, useQuery, useQueryClient } from '@tanstack/react-query';
+import { getApiErrorMessage } from '../../utils/error';
 import {
   Alert,
   Button, Card,
@@ -80,7 +81,7 @@ const TeamCreate: React.FC = () => {
       navigate('/teams');
     },
     onError: (error: any) => {
-      message.error(`创建失败: ${error.response?.data?.error || error.message}`);
+      message.error(`创建失败: ${getApiErrorMessage(error, '未知错误')}`);
     },
   });
 
diff --git a/web-ui/src/pages/Team/TeamDetail.tsx b/web-ui/src/pages/Team/TeamDetail.tsx
index 5dcd1be..a0e0d38 100644
--- a/web-ui/src/pages/Team/TeamDetail.tsx
+++ b/web-ui/src/pages/Team/TeamDetail.tsx
@@ -1,4 +1,5 @@
 import React, { useState, useEffect, useMemo } from 'react';
+import { getApiErrorMessage } from '../../utils/error';
 import { 
   Card, Form, Input, Button, Typography, message, Space, Select, 
   Descriptions, Spin, Tag, Table, Statistic, Row, Col, Divider, Popconfirm,
@@ -144,7 +145,7 @@ const TeamDetail: React.FC = () => {
       queryClient.invalidateQueries({ queryKey: ['teamNodes', name] });
     },
     onError: (error: any) => {
-      message.error(`更新失败: ${error.response?.data?.error || error.message}`);
+      message.error(`更新失败: ${getApiErrorMessage(error, '未知错误')}`);
     },
   });
 
@@ -158,7 +159,7 @@ const TeamDetail: React.FC = () => {
       navigate('/teams');
     },
     onError: (error: any) => {
-      message.error(`删除失败: ${error.response?.data?.error || error.message}`);
+      message.error(`删除失败: ${getApiErrorMessage(error, '未知错误')}`);
     },
   });
 
@@ -174,7 +175,7 @@ const TeamDetail: React.FC = () => {
       rechargeForm.resetFields();
     },
     onError: (error: any) => {
-      message.error(`充值失败: ${error.response?.data?.error || error.message}`);
+      message.error(`充值失败: ${getApiErrorMessage(error, '未知错误')}`);
     },
   });
 
@@ -187,7 +188,7 @@ const TeamDetail: React.FC = () => {
       setAutoRechargeModalVisible(false);
     },
     onError: (error: any) => {
-      message.error(`配置失败: ${error.response?.data?.error || error.message}`);
+      message.error(`配置失败: ${getApiErrorMessage(error, '未知错误')}`);
     },
   });
 
@@ -200,7 +201,7 @@ const TeamDetail: React.FC = () => {
       queryClient.invalidateQueries({ queryKey: ['teams'] });
     },
     onError: (error: any) => {
-      message.error(`操作失败: ${error.response?.data?.error || error.message}`);
+      message.error(`操作失败: ${getApiErrorMessage(error, '未知错误')}`);
     },
   });
 
@@ -212,7 +213,7 @@ const TeamDetail: React.FC = () => {
       queryClient.invalidateQueries({ queryKey: ['teams'] });
     },
     onError: (error: any) => {
-      message.error(`操作失败: ${error.response?.data?.error || error.message}`);
+      message.error(`操作失败: ${getApiErrorMessage(error, '未知错误')}`);
     },
   });
 
diff --git a/web-ui/src/services/api.ts b/web-ui/src/services/api.ts
index a7b312b..3606291 100644
--- a/web-ui/src/services/api.ts
+++ b/web-ui/src/services/api.ts
@@ -54,6 +54,8 @@ export const login = (data: LoginRequest) => api.post<LoginResponse>('/auth/logi
 // Feature flags
 export interface Features {
   costEnabled: boolean;
+  capsuleEnabled: boolean;
+  prometheusEnabled: boolean;
 }
 
 export const getFeatures = () => api.get<Features>('/features');
@@ -693,13 +695,36 @@ export interface PrometheusMetric {
   value: number;
 }
 
+export interface LabeledMetricSeries {
+  labels: Record<string, string>;
+  metrics: PrometheusMetric[];
+}
+
 export interface NodeMetrics {
   cpuUsage: PrometheusMetric[];
   memoryUsage: PrometheusMetric[];
-}
-
-export const getNodeMetrics = (name: string, hours = 24) =>
-  api.get<NodeMetrics>(`/metrics/node/${name}`, { params: { hours } });
+  // Network IO
+  networkReceive?: PrometheusMetric[];
+  networkTransmit?: PrometheusMetric[];
+  // RDMA IO
+  rdmaReceive?: PrometheusMetric[];
+  rdmaTransmit?: PrometheusMetric[];
+  // GPU (NVIDIA DCGM)
+  gpuUtilization?: PrometheusMetric[];
+  gpuMemoryUtil?: PrometheusMetric[];
+  gpuPerDevice?: LabeledMetricSeries[];
+  // NPU (Huawei Ascend)
+  npuUtilization?: PrometheusMetric[];
+  npuMemoryUtil?: PrometheusMetric[];
+  npuTemperature?: PrometheusMetric[];
+}
+
+export const getNodeMetrics = (name: string, params?: {
+  hours?: number; hasGpu?: boolean; hasNpu?: boolean;
+}) =>
+  api.get<NodeMetrics>(`/metrics/node/${name}`, {
+    params: { hours: params?.hours ?? 24, hasGpu: params?.hasGpu, hasNpu: params?.hasNpu },
+  });
 
 // Resource Configuration APIs
 export type ResourceCategory = 'compute' | 'memory' | 'storage' | 'accelerator' | 'other';
@@ -738,4 +763,170 @@ export const updateResourceConfig = (name: string, config: ResourceDefinition) =
 export const addResourceConfig = (config: ResourceDefinition) =>
   api.post('/resource-configs', config);
 
+// Node Onboarding APIs
+export type OnboardingJobStatus = 'pending' | 'running' | 'success' | 'failed' | 'cancelled';
+export type SubStepStatus = 'pending' | 'running' | 'success' | 'failed' | 'skipped';
+
+export interface NodePlatform {
+  os: string;
+  version: string;
+  arch: string;
+}
+
+export interface SubStep {
+  name: string;
+  status: SubStepStatus;
+  error?: string;
+}
+
+export interface OnboardingJob {
+  id: string;
+  nodeIP: string;
+  nodeName?: string;
+  platform: NodePlatform;
+  status: OnboardingJobStatus;
+  currentStep: number;
+  totalSteps: number;
+  stepMessage: string;
+  subSteps?: SubStep[];
+  errorMessage?: string;
+  createdAt: string;
+  updatedAt: string;
+  completedAt?: string;
+}
+
+export interface OnboardingRequest {
+  nodeIP: string;
+  sshPort?: number;
+  sshUsername: string;
+  authMethod: 'password' | 'privateKey';
+  password?: string;
+  privateKey?: string;
+}
+
+export const startNodeOnboarding = (data: OnboardingRequest) =>
+  api.post<OnboardingJob>('/nodes/onboard', data);
+export const getOnboardingJob = (jobId: string) =>
+  api.get<OnboardingJob>(`/nodes/onboard/${jobId}`);
+export const getOnboardingJobs = () =>
+  api.get<{ items: OnboardingJob[] }>('/nodes/onboard');
+export const cancelOnboardingJob = (jobId: string) =>
+  api.delete(`/nodes/onboard/${jobId}`);
+
+// Control Plane Config APIs
+export interface ControlPlaneConfig {
+  host: string;
+  sshPort: number;
+  sshUser: string;
+  authMethod: 'password' | 'privateKey';
+  hasPassword?: boolean;
+  hasPrivateKey?: boolean;
+  password?: string;
+  privateKey?: string;
+}
+
+export const getControlPlaneConfig = () =>
+  api.get<ControlPlaneConfig>('/settings/control-plane');
+export const updateControlPlaneConfig = (config: ControlPlaneConfig) =>
+  api.put('/settings/control-plane', config);
+export const testControlPlaneConnection = () =>
+  api.post('/settings/control-plane/test');
+
+// Init Scripts APIs
+export type ScriptPhase = 'pre-join' | 'post-join';
+
+export interface Script {
+  id: string;
+  os: string;
+  arch: string;
+  content: string;
+}
+
+export interface ScriptGroup {
+  id: string;
+  name: string;
+  description: string;
+  phase: ScriptPhase;
+  enabled: boolean;
+  order: number;
+  builtin: boolean;
+  scripts: Script[];
+}
+
+export const getInitScripts = () =>
+  api.get<{ items: ScriptGroup[] }>('/settings/init-scripts');
+export const getInitScript = (id: string) =>
+  api.get<ScriptGroup>(`/settings/init-scripts/${id}`);
+export const createInitScript = (data: Omit<ScriptGroup, 'id' | 'builtin'>) =>
+  api.post<ScriptGroup>('/settings/init-scripts', data);
+export const updateInitScript = (id: string, data: Partial<ScriptGroup>) =>
+  api.put<ScriptGroup>(`/settings/init-scripts/${id}`, data);
+export const deleteInitScript = (id: string) =>
+  api.delete(`/settings/init-scripts/${id}`);
+export const toggleInitScript = (id: string, enabled: boolean) =>
+  api.put(`/settings/init-scripts/${id}/toggle`, { enabled });
+export const reorderInitScripts = (ids: string[]) =>
+  api.put('/settings/init-scripts/reorder', { ids });
+
+// Configuration Import/Export APIs
+export interface ExportConfigData {
+  version: string;
+  exportedAt: string;
+  exportedBy: string;
+  sections: Record<string, unknown>;
+}
+
+export interface FieldChange {
+  current: unknown;
+  imported: unknown;
+}
+
+export interface ResourceChangeSummary {
+  added?: string[];
+  modified?: string[];
+  removed?: string[];
+  unchanged?: string[];
+}
+
+export interface SectionPreview {
+  present: boolean;
+  valid: boolean;
+  hasSensitiveData: boolean;
+  changes?: Record<string, FieldChange>;
+  summary?: ResourceChangeSummary;
+  warnings?: string[];
+  errors?: string[];
+}
+
+export interface ImportPreviewResult {
+  valid: boolean;
+  version: string;
+  exportedAt?: string;
+  sections: Record<string, SectionPreview>;
+  errors: string[];
+  warnings: string[];
+}
+
+export interface ImportApplyRequest {
+  config: ExportConfigData;
+  sections: string[];
+  preserveSensitive: boolean;
+}
+
+export interface ImportApplyResult {
+  message: string;
+  applied: string[];
+  skipped: string[];
+  warnings: string[];
+}
+
+export const exportConfig = (params?: { sections?: string; includeSensitive?: boolean }) =>
+  api.get('/settings/export', { params, responseType: 'blob' });
+
+export const previewImport = (config: ExportConfigData) =>
+  api.post<ImportPreviewResult>('/settings/import/preview', config);
+
+export const applyImport = (data: ImportApplyRequest) =>
+  api.post<ImportApplyResult>('/settings/import/apply', data);
+
 export default api;
diff --git a/web-ui/src/utils/error.ts b/web-ui/src/utils/error.ts
new file mode 100644
index 0000000..0b325f5
--- /dev/null
+++ b/web-ui/src/utils/error.ts
@@ -0,0 +1,19 @@
+import { AxiosError } from 'axios';
+
+/**
+ * Extract a human-readable message from an API/network error.
+ *
+ * Prefers the backend's `{ "error": "..." }` (or `message`) body field when it is a
+ * non-empty string, then the Error's own message, then `fallback`. Non-string body
+ * fields are ignored so callers never interpolate "[object Object]".
+ */
+export function getApiErrorMessage(err: unknown, fallback = '操作失败'): string {
+  if (err instanceof AxiosError) {
+    const body = err.response?.data as { error?: unknown; message?: unknown } | undefined;
+    const fromBody = [body?.error, body?.message].find(
+      (v): v is string => typeof v === 'string' && v !== '',
+    );
+    return fromBody || err.message || fallback;
+  }
+  return err instanceof Error ? err.message || fallback : fallback;
+}
diff --git a/web-ui/src/vite-env.d.ts b/web-ui/src/vite-env.d.ts
new file mode 100644
index 0000000..af71465
--- /dev/null
+++ b/web-ui/src/vite-env.d.ts
@@ -0,0 +1,4 @@
+/// <reference types="vite/client" />
+
+// Injected by Vite `define` from package.json — see vite.config.ts.
+declare const __APP_VERSION__: string;
diff --git a/web-ui/vite.config.ts b/web-ui/vite.config.ts
index 95d2363..e0cee4c 100644
--- a/web-ui/vite.config.ts
+++ b/web-ui/vite.config.ts
@@ -1,8 +1,17 @@
 import { defineConfig } from 'vite';
 import react from '@vitejs/plugin-react';
+import { readFileSync } from 'node:fs';
+
+// Single source of truth for the displayed app version: package.json.
+const pkg = JSON.parse(
+  readFileSync(new URL('./package.json', import.meta.url), 'utf-8'),
+) as { version: string };
 
 export default defineConfig({
   plugins: [react()],
+  define: {
+    __APP_VERSION__: JSON.stringify(pkg.version),
+  },
   server: {
     port: 3000,
     proxy: {
@@ -15,6 +24,18 @@ export default defineConfig({
   build: {
     outDir: 'dist',
     sourcemap: false,
+    rollupOptions: {
+      output: {
+        // Split heavy vendors into their own chunks so the initial bundle does
+        // not ship echarts (~1MB, only used by the node-detail page) to every
+        // Login/Dashboard session.
+        manualChunks: {
+          react: ['react', 'react-dom', 'react-router-dom'],
+          antd: ['antd', '@ant-design/icons'],
+          echarts: ['echarts', 'echarts-for-react'],
+          query: ['@tanstack/react-query'],
+        },
+      },
+    },
   },
 });
-
diff --git a/website/DOMAIN_SETUP.md b/website/DOMAIN_SETUP.md
new file mode 100644
index 0000000..cd6fc19
--- /dev/null
+++ b/website/DOMAIN_SETUP.md
@@ -0,0 +1,119 @@
+# 自定义域名配置指南
+
+本文档说明如何为 Bison 文档站点配置自定义域名 `bison.lei6393.com`。
+
+## 1. DNS 配置
+
+在你的 DNS 服务商（lei6393.com 的域名注册商）添加以下 DNS 记录:
+
+### 方式一：使用 CNAME（推荐）
+
+```
+类型: CNAME
+主机记录: bison
+记录值: supermarioyl.github.io
+TTL: 600 (或默认值)
+```
+
+### 方式二：使用 A 记录
+
+如果 DNS 服务商不支持 CNAME，可以使用 A 记录指向 GitHub Pages 的 IP:
+
+```
+类型: A
+主机记录: bison
+记录值: 185.199.108.153
+TTL: 600
+
+再为同一主机记录 bison 分别添加三条 A 记录，记录值依次为:
+185.199.109.153
+185.199.110.153
+185.199.111.153
+```
+
+## 2. GitHub 仓库设置
+
+1. 进入 GitHub 仓库: https://github.com/SuperMarioYL/Bison
+2. 点击 **Settings** > **Pages**
+3. 在 **Custom domain** 输入框中填写: `bison.lei6393.com`
+4. 勾选 **Enforce HTTPS** (DNS 生效后)
+5. 点击 **Save**
+
+## 3. 验证配置
+
+### 检查 DNS 解析
+
+```bash
+# 检查 CNAME 记录
+dig bison.lei6393.com CNAME +short
+# 应该返回: supermarioyl.github.io.（dig 输出的域名带末尾的点）
+
+# 检查 A 记录
+dig bison.lei6393.com A +short
+# 应该返回 GitHub Pages 的 IP 地址
+```
+
+### 测试网站访问
+
+DNS 生效后（通常 5-30 分钟），访问:
+
+- 主域名: https://bison.lei6393.com
+- 中文版: https://bison.lei6393.com/zh-Hans/
+- 文档: https://bison.lei6393.com/docs/
+
+### 旧 GitHub Pages URL 重定向
+
+GitHub 会自动将以下 URL 重定向到新域名:
+- https://supermarioyl.github.io/Bison/ → https://bison.lei6393.com/
+
+## 4. 本地开发
+
+本地开发时仍然使用 `npm start`，会在 `http://localhost:3001/` 运行（注意不再有 `/Bison/` 路径）。
+
+## 5. 部署
+
+自定义域名配置已包含在代码中:
+
+- ✅ `website/static/CNAME` - 包含域名配置
+- ✅ `website/docusaurus.config.ts` - URL 和 baseUrl 已更新
+
+每次 `npm run build` 构建时，CNAME 文件会自动复制到 `build/` 目录。
+
+部署到 GitHub Pages:
+
+```bash
+cd website
+npm run deploy
+```
+
+## 常见问题
+
+### Q: DNS 配置后多久生效?
+A: 通常 5-30 分钟，最长可能需要 48 小时。
+
+### Q: HTTPS 证书如何配置?
+A: GitHub Pages 会在 DNS 生效后自动生成和配置 Let's Encrypt 证书，无需手动操作。
+
+### Q: 为什么选择 bison.lei6393.com 而不是 www.lei6393.com?
+A:
+- 语义清晰，专门用于 Bison 项目
+- 便于未来扩展其他子域名项目
+- 符合企业级开源项目的最佳实践
+
+### Q: 旧的 GitHub Pages 链接还能用吗?
+A: 可以，GitHub 会自动重定向到新域名。
+
+## 技术细节
+
+当前配置:
+
+```typescript
+// docusaurus.config.ts
+url: "https://bison.lei6393.com",
+baseUrl: "/",
+```
+
+这意味着:
+- 所有链接使用根路径 `/` 而不是 `/Bison/`
+- 中文版访问路径: `/zh-Hans/` (不再是 `/Bison/zh-Hans/`)
+- 文档路径: `/docs/` (不再是 `/Bison/docs/`)
diff --git a/website/docs/configuration.md b/website/docs/configuration.md
index 539aaa3..029b43a 100644
--- a/website/docs/configuration.md
+++ b/website/docs/configuration.md
@@ -19,11 +19,11 @@ Bison is configured primarily through Helm values. You can customize the install
 | `auth.admin.password` | Admin password | `admin` | `changeme` |
 | `apiServer.replicaCount` | API server replicas | `2` | `3` |
 | `apiServer.image.repository` | API server image | `ghcr.io/supermarioyl/bison/api-server` | - |
-| `apiServer.image.tag` | API server image tag | `0.0.1` | `latest` |
+| `apiServer.image.tag` | API server image tag | `0.0.12` | `latest` |
 | `webUI.replicaCount` | Web UI replicas | `2` | `3` |
 | `webUI.image.repository` | Web UI image | `ghcr.io/supermarioyl/bison/web-ui` | - |
-| `webUI.image.tag` | Web UI image tag | `0.0.1` | `latest` |
-| `opencost.url` | OpenCost API endpoint | `http://opencost.opencost-system.svc:9003` | Custom URL |
+| `webUI.image.tag` | Web UI image tag | `0.0.12` | `latest` |
+| `dependencies.opencost.apiUrl` | OpenCost API endpoint | `http://opencost.opencost.svc.cluster.local:9003` | Custom URL |
 
 ### Example Custom Values
 
@@ -41,7 +41,7 @@ auth:
 apiServer:
   replicaCount: 3
   image:
-    tag: 0.0.1
+    tag: 0.0.12
   resources:
     requests:
       cpu: 200m
@@ -54,7 +54,7 @@ apiServer:
 webUI:
   replicaCount: 3
   image:
-    tag: 0.0.1
+    tag: 0.0.12
   resources:
     requests:
       cpu: 100m
@@ -64,8 +64,10 @@ webUI:
       memory: 256Mi
 
 # OpenCost Integration
-opencost:
-  url: http://opencost.opencost-system.svc:9003
+dependencies:
+  opencost:
+    enabled: true
+    apiUrl: http://opencost.opencost.svc.cluster.local:9003
 
 # Node Selection (optional)
 nodeSelector:
@@ -81,7 +83,8 @@ tolerations:
 Install with custom values:
 
 ```bash
-helm install bison bison/bison \
+helm install bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.12 \
   --namespace bison-system \
   --create-namespace \
   --values custom-values.yaml
@@ -254,7 +257,7 @@ Configure OpenCost connection:
 
 ```bash
 # Test OpenCost API
-kubectl port-forward -n opencost-system svc/opencost 9003:9003
+kubectl port-forward -n opencost svc/opencost 9003:9003
 curl http://localhost:9003/healthz
 
 # Test allocation API
@@ -266,8 +269,10 @@ curl http://localhost:9003/allocation/compute?window=1d
 If OpenCost is deployed in a different namespace or with a different service name:
 
 ```bash
-helm upgrade bison bison/bison \
-  --set opencost.url=http://my-opencost.custom-namespace.svc:9003 \
+helm upgrade bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.12 \
+  --set dependencies.opencost.apiUrl=http://my-opencost.custom-namespace.svc:9003 \
+  --set dependencies.opencost.enabled=true \
   --namespace bison-system
 ```
 
@@ -305,7 +310,7 @@ Additional configuration can be provided via environment variables:
 | Variable | Description | Default |
 |----------|-------------|---------|
 | `KUBECONFIG` | Path to kubeconfig file | In-cluster config |
-| `OPENCOST_URL` | OpenCost API URL | `http://opencost.opencost-system.svc:9003` |
+| `OPENCOST_URL` | OpenCost API URL | `http://opencost.opencost.svc.cluster.local:9003` |
 | `AUTH_ENABLED` | Enable authentication | `false` |
 | `LOG_LEVEL` | Logging level | `info` |
 | `BILLING_INTERVAL` | Billing calculation interval | `10m` |
diff --git a/website/docs/features.md b/website/docs/features.md
index 8d0c438..6a1192c 100644
--- a/website/docs/features.md
+++ b/website/docs/features.md
@@ -8,7 +8,7 @@ Bison provides a comprehensive suite of features for GPU resource management, bi
 
 ## See Bison in Action
 
-### 🎯 Real-Time Resource Dashboard
+### Real-Time Resource Dashboard
 
 ![Bison Dashboard](/img/ui-dashboard.png)
 
@@ -26,15 +26,15 @@ Bison provides a comprehensive suite of features for GPU resource management, bi
 
 ---
 
-### 💼 Team Management & Budget Monitoring
+### Team Management & Budget Monitoring
 
 ![Team Management](/img/ui-team.png)
 
 **What you see:**
 - **Team List** with real-time status indicators:
-  - 🟢 Green balance = Healthy budget
-  - 🟡 Yellow balance = Approaching threshold
-  - 🔴 Red balance = Low balance or suspended
+  - **Green** balance = Healthy budget
+  - **Amber** balance = Approaching threshold
+  - **Red** balance = Low balance or suspended
 - **Resource Allocation** - CPU/Memory/GPU quotas per team (e.g., "cpu 0/10" means 0 used out of 10 allocated)
 - **Project Count** - Number of namespaces/projects under each team
 - **Quick Actions** - Edit quotas, recharge balance, or delete team with one click
@@ -46,7 +46,7 @@ Bison provides a comprehensive suite of features for GPU resource management, bi
 
 ---
 
-### 💰 Flexible Billing Configuration
+### Flexible Billing Configuration
 
 ![Billing Configuration](/img/ui-billing.png)
 
@@ -66,52 +66,62 @@ Bison provides a comprehensive suite of features for GPU resource management, bi
 
 ## Core Capabilities
 
+> **Legend** — items marked _Planned_ are on the [optimization roadmap](https://github.com/SuperMarioYL/Bison/blob/main/docs/optimization-roadmap.md) and not yet implemented. Everything else ships today.
+
 ### Multi-Tenant Management
-✅ **Capsule-Powered Isolation** - True multi-tenancy using Kubernetes-native Capsule operator
-✅ **OIDC Integration** - Enterprise SSO support for authentication
-✅ **Team-Based Access Control** - Manage users, roles, and permissions per team
-✅ **Shared & Exclusive Node Pools** - Flexible resource allocation strategies
+- **Capsule-Powered Isolation** — true multi-tenancy using the Kubernetes-native Capsule operator
+- **Team-Based Access Control** — manage users, roles, and permissions per team
+- **Shared & Exclusive Node Pools** — flexible resource allocation strategies
+- **Enterprise SSO / OIDC** — _Planned_
 
 ### Real-Time Billing
-✅ **Usage-Based Billing** - Accurate cost tracking based on actual resource consumption
-✅ **Configurable Pricing** - Set custom rates for CPU, Memory, GPU, and any Kubernetes resource
-✅ **Multi-Currency Support** - CNY, USD, EUR, and more
-✅ **Billing Rules Engine** - Define custom billing logic and aggregation periods
+- **Usage-Based Billing** — accurate cost tracking based on actual resource consumption (via OpenCost)
+- **Configurable Pricing** — set custom rates for CPU, Memory, GPU, and any Kubernetes resource
+- **Multi-Currency Support** — configurable currency and symbol (e.g. CNY ¥, USD $)
+- **Prepaid Balances with Real-Time Deduction** — hourly metering with optimistic-concurrency-safe balance writes
+
+### Cluster & Node Management
+- **Node Inventory** — live view of every node with architecture, status, and GPU device breakdown
+- **Node Pool Modes** — mark nodes as shared, exclusive, disabled, or unmanaged
+- **Per-Node Detail** — CPU / memory / GPU utilization time series and workload placement
+- **Resource Discovery** — auto-discover cluster resources (CPU, memory, GPU, storage, custom) and configure display units and pricing
+
+### Automated Node Onboarding
+- **Init Script Generation** — generate a per-node bootstrap script from the control-plane configuration
+- **SSH Onboarding Tasks** — run onboarding over SSH with live progress tracking
+- **Control-Plane Configuration** — manage how new nodes join the managed pool
 
 ### Dynamic Resource Quotas
-✅ **Per-Team Quotas** - CPU, Memory, GPU, Storage, and custom resources
-✅ **Namespace Quotas** - Project-level resource limits within teams
-✅ **Auto-Enforcement** - Kubernetes-native quota enforcement
-✅ **Quota Alerts** - Notifications when approaching limits
+- **Per-Team Quotas** — CPU, Memory, GPU, Storage, and custom resources
+- **Namespace Quotas** — project-level resource limits within teams
+- **Auto-Enforcement** — Kubernetes-native quota enforcement via Capsule
+- **Quota Alerts** — dashboard warnings when usage approaches limits (≥ 80%)
 
 ### Team Balance & Wallet System
-✅ **Prepaid Balances** - Team wallets with real-time deduction
-✅ **Auto-Deduction** - Automated billing based on resource usage
-✅ **Balance Thresholds** - Configurable warning and suspension levels
-✅ **Transaction History** - Complete audit trail of all balance changes
+- **Prepaid Balances** — team wallets with real-time deduction
+- **Transaction History** — complete audit trail of every recharge and deduction
+- **Grace Period & Auto-Suspension** — configurable grace window before suspending overdue teams
 
 ### Auto-Recharge
-✅ **Scheduled Top-Ups** - Weekly or monthly automatic recharges
-✅ **Custom Amounts** - Flexible recharge amounts per team
-✅ **Recharge Notifications** - Alert teams when balance is added
+- **Scheduled Top-Ups** — weekly or monthly automatic recharges
+- **Custom Amounts** — flexible recharge amounts per team
 
 ### Balance Alerts
-✅ **Multi-Channel Notifications** - Webhook, DingTalk, WeChat, Email
-✅ **Configurable Thresholds** - Set warning levels (e.g., 20%, 10%, 5%)
-✅ **Auto-Suspension** - Automatically suspend workloads when balance depleted
-✅ **Custom Templates** - Customize alert messages
+- **Multi-Channel Notifications** — Webhook, DingTalk, WeChat
+- **Configurable Thresholds** — set warning levels (e.g. 20%, 10%, 5%)
+- **Auto-Suspension** — automatically suspend workloads when the grace period expires
+- **Email / SMTP notifications** — _Planned_
 
 ### Usage Reports
-✅ **Team Analytics** - Per-team cost breakdowns and trends
-✅ **Project Analytics** - Namespace-level resource consumption
-✅ **Export Capabilities** - CSV, Excel, PDF reports
-✅ **Historical Data** - 30/60/90-day cost analysis
+- **Team & Project Analytics** — per-team and per-namespace cost breakdowns and trends
+- **CSV Export** — export summary reports for finance reconciliation
+- **Historical Windows** — 7 / 30 / 90-day cost analysis
+- **Excel & PDF export** — _Planned_
 
 ### Audit Logging
-✅ **Complete Operation History** - Track all administrative actions
-✅ **User Attribution** - Who did what and when
-✅ **Resource Changes** - Track quota, balance, and configuration changes
-✅ **Compliance Ready** - Meet internal audit requirements
+- **Complete Operation History** — track administrative actions with pagination
+- **User Attribution** — who did what and when
+- **Resource Changes** — track quota, balance, and configuration changes
 
 ---
 
@@ -158,7 +168,7 @@ graph TB
 - **Scalable** - Stateless API server that can scale horizontally
 - **Secure** - Kubernetes RBAC integration and optional authentication
 - **Observable** - Prometheus metrics and structured logging
-- **Extensible** - Plugin architecture for custom billing rules and alerts
+- **Configurable** - Custom per-resource pricing, alert thresholds, and grace policy
 
 ---
 
@@ -176,7 +186,6 @@ Bison uses [Capsule](https://capsule.clastix.io/) for multi-tenancy:
 - Team-based tenant isolation
 - Namespace quota enforcement
 - Network and security policies
-- OIDC/SSO integration
 
 ### Prometheus Integration
 Metrics collection and monitoring:
diff --git a/website/docs/installation.md b/website/docs/installation.md
index c9abf61..a8c4411 100644
--- a/website/docs/installation.md
+++ b/website/docs/installation.md
@@ -36,7 +36,7 @@ helm install capsule projectcapsule/capsule \
 # Using Helm
 helm repo add opencost https://opencost.github.io/opencost-helm-chart
 helm install opencost opencost/opencost \
-  --namespace opencost-system \
+  --namespace opencost \
   --create-namespace \
   --set prometheus.internal.serviceName=prometheus-server \
   --set prometheus.internal.namespaceName=prometheus-system
@@ -44,39 +44,54 @@ helm install opencost opencost/opencost \
 
 ## Installation Methods
 
-Choose one of the following methods to install Bison:
+Bison Helm charts are distributed via **GitHub Container Registry (GHCR)** using the modern OCI format.
 
-### Option A: Helm Repository (Recommended)
+**Requirements:**
+- Helm >= 3.8.0 (for OCI support)
+- Kubernetes >= 1.22
 
-The simplest way to install Bison is using the official Helm repository:
+### Option A: From GHCR (Recommended)
+
+The simplest way to install Bison is directly from GitHub Container Registry:
 
 ```bash
-# Add Bison Helm repository
-helm repo add bison https://supermarioyl.github.io/Bison/charts/
-helm repo update
+# Install specific version from GHCR
+helm install bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.12 \
+  --namespace bison-system \
+  --create-namespace
 
-# Install with default configuration
-helm install bison bison/bison \
+# Or pull the chart first, then install
+helm pull oci://ghcr.io/supermarioyl/charts/bison --version 0.0.12
+helm install bison bison-0.0.12.tgz \
   --namespace bison-system \
   --create-namespace
 
-# Or customize installation
-helm install bison bison/bison \
+# Customize installation
+helm install bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.12 \
   --namespace bison-system \
   --create-namespace \
-  --set opencost.url=http://opencost.opencost-system.svc:9003 \
-  --set auth.enabled=false \
-  --set apiServer.image.tag=0.0.1 \
-  --set webUI.image.tag=0.0.1
+  --set dependencies.opencost.apiUrl=http://opencost.opencost.svc.cluster.local:9003 \
+  --set dependencies.opencost.enabled=true \
+  --set auth.enabled=true \
+  --set apiServer.image.tag=0.0.12 \
+  --set webUI.image.tag=0.0.12
 ```
 
+**Why GHCR OCI Format?**
+- ✅ No separate Helm repository maintenance needed
+- ✅ Unified with Docker images in GHCR
+- ✅ Faster installation (direct registry pull)
+- ✅ Modern Helm 3.8+ standard practice
+
 ### Option B: From GitHub Release
 
 Download a specific version from GitHub Releases:
 
 ```bash
-# Download latest Helm chart
-VERSION=0.0.1
+# Download Helm chart
+VERSION=0.0.12
 wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
 
 # Install the chart
@@ -115,18 +130,20 @@ Bison can be configured using Helm values. Here are the key configuration option
 apiServer:
   image:
     repository: ghcr.io/supermarioyl/bison/api-server
-    tag: 0.0.1
-  replicas: 2
+    tag: 0.0.12
+  replicaCount: 2
 
 webUI:
   image:
     repository: ghcr.io/supermarioyl/bison/web-ui
-    tag: 0.0.1
-  replicas: 2
+    tag: 0.0.12
+  replicaCount: 2
 
 # OpenCost URL
-opencost:
-  url: http://opencost.opencost-system.svc:9003
+dependencies:
+  opencost:
+    enabled: true
+    apiUrl: http://opencost.opencost.svc.cluster.local:9003
 
 # Authentication
 auth:
@@ -136,12 +153,14 @@ auth:
 ### Custom Configuration Example
 
 ```bash
-helm install bison bison/bison \
+helm install bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.12 \
   --namespace bison-system \
   --create-namespace \
-  --set apiServer.replicas=3 \
-  --set webUI.replicas=3 \
-  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set apiServer.replicaCount=3 \
+  --set webUI.replicaCount=3 \
+  --set dependencies.opencost.apiUrl=http://opencost.opencost.svc.cluster.local:9003 \
+  --set dependencies.opencost.enabled=true \
   --set auth.enabled=true
 ```
 
@@ -154,16 +173,16 @@ After installation, verify that all components are running:
 kubectl get pods -n bison-system
 
 # Expected output:
-# NAME                              READY   STATUS    RESTARTS   AGE
-# bison-api-server-xxxxxxxxx-xxxxx  1/1     Running   0          2m
-# bison-webui-xxxxxxxxx-xxxxx       1/1     Running   0          2m
+# NAME                        READY   STATUS    RESTARTS   AGE
+# bison-api-xxxxxxxxx-xxxxx   1/1     Running   0          2m
+# bison-web-xxxxxxxxx-xxxxx   1/1     Running   0          2m
 
 # Check services
 kubectl get svc -n bison-system
 
 # Check logs
-kubectl logs -n bison-system deployment/bison-api-server
-kubectl logs -n bison-system deployment/bison-webui
+kubectl logs -n bison-system deployment/bison-api
+kubectl logs -n bison-system deployment/bison-web
 ```
 
 ## Access the Platform
@@ -172,7 +191,7 @@ kubectl logs -n bison-system deployment/bison-webui
 
 ```bash
 # Port-forward the Web UI
-kubectl port-forward -n bison-system svc/bison-webui 3000:80
+kubectl port-forward -n bison-system svc/bison-web 3000:80
 
 # Access at http://localhost:3000
 ```
@@ -199,14 +218,14 @@ spec:
         pathType: Prefix
         backend:
           service:
-            name: bison-webui
+            name: bison-web
             port:
               number: 80
       - path: /api
         pathType: Prefix
         backend:
           service:
-            name: bison-api-server
+            name: bison-api
             port:
               number: 8080
 ```
@@ -240,14 +259,10 @@ docker pull ghcr.io/supermarioyl/bison/web-ui:latest
 To upgrade Bison to a new version:
 
 ```bash
-# Update Helm repository
-helm repo update
-
-# Upgrade to latest version
-helm upgrade bison bison/bison --namespace bison-system
-
-# Or upgrade to specific version
-helm upgrade bison bison/bison --version 0.0.2 --namespace bison-system
+# Upgrade to a specific version directly from GHCR
+helm upgrade bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.12 \
+  --namespace bison-system
 ```
 
 ## Uninstalling
@@ -269,7 +284,7 @@ kubectl delete namespace bison-system
 Check pod logs for errors:
 
 ```bash
-kubectl logs -n bison-system deployment/bison-api-server
+kubectl logs -n bison-system deployment/bison-api
 kubectl describe pod -n bison-system <pod-name>
 ```
 
@@ -278,8 +293,8 @@ kubectl describe pod -n bison-system <pod-name>
 Verify OpenCost is running and accessible:
 
 ```bash
-kubectl get svc -n opencost-system
-kubectl port-forward -n opencost-system svc/opencost 9003:9003
+kubectl get svc -n opencost
+kubectl port-forward -n opencost svc/opencost 9003:9003
 
 # Test endpoint
 curl http://localhost:9003/healthz
diff --git a/website/docs/intro.md b/website/docs/intro.md
index b3dc3aa..0a5f717 100644
--- a/website/docs/intro.md
+++ b/website/docs/intro.md
@@ -96,21 +96,22 @@ graph TB
 
 Choose one of the following installation methods:
 
-#### Option A: Using Helm Repository (Recommended)
+#### Option A: Using GHCR (Recommended - OCI Format)
 
 ```bash
-# Add Bison Helm repository
-helm repo add bison https://supermarioyl.github.io/Bison/charts/
-helm repo update
-
-# Install with default configuration
-helm install bison bison/bison --namespace bison-system --create-namespace
+# Install with default configuration directly from GitHub Container Registry
+helm install bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.12 \
+  --namespace bison-system \
+  --create-namespace
 
 # Or customize installation
-helm install bison bison/bison \
+helm install bison oci://ghcr.io/supermarioyl/charts/bison \
+  --version 0.0.12 \
   --namespace bison-system \
   --create-namespace \
-  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set dependencies.opencost.apiUrl=http://opencost.opencost.svc.cluster.local:9003 \
+  --set dependencies.opencost.enabled=true \
   --set auth.enabled=false
 ```
 
@@ -118,7 +119,7 @@ helm install bison bison/bison \
 
 ```bash
 # Download latest Helm chart
-VERSION=0.0.1
+VERSION=0.0.12
 wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
 
 # Install
@@ -150,7 +151,7 @@ After installation, access Bison through:
 
 ```bash
 # Port-forward the Web UI
-kubectl port-forward -n bison-system svc/bison-webui 3000:80
+kubectl port-forward -n bison-system svc/bison-web 3000:80
 
 # Access at http://localhost:3000
 # Default credentials (if auth enabled):
diff --git a/website/docusaurus.config.ts b/website/docusaurus.config.ts
index 4b6b1d6..bb7cd6d 100644
--- a/website/docusaurus.config.ts
+++ b/website/docusaurus.config.ts
@@ -15,10 +15,10 @@ const config: Config = {
   },
 
   // Set the production url of your site here
-  url: "https://supermarioyl.github.io",
+  url: "https://bison.lei6393.com",
   // Set the /<baseUrl>/ pathname under which your site is served
   // For GitHub pages deployment, it is often '/<projectName>/'
-  baseUrl: "/Bison/",
+  baseUrl: "/",
 
   // GitHub pages deployment config.
   // If you aren't using GitHub pages, you don't need these.
@@ -64,6 +64,15 @@ const config: Config = {
   themeConfig: {
     // Replace with your project's social card
     image: "img/bison-social-card.png",
+    metadata: [
+      { name: 'google-site-verification', content: 'AKwgEpVubW0iVPeZN2RkopUMJbx4K-Yy8aWwCZq-T34' },
+      { name: 'baidu-site-verification', content: 'codeva-E3148CbKk3' },
+      { name: 'keywords', content: 'Kubernetes, GPU, billing, chargeback, multi-tenant, Capsule, OpenCost, GPU 计费, 多租户, 资源调度' },
+      { name: 'twitter:card', content: 'summary_large_image' },
+      { property: 'og:type', content: 'website' },
+      { property: 'og:image:width', content: '1200' },
+      { property: 'og:image:height', content: '630' },
+    ],
     colorMode: {
       respectPrefersColorScheme: true,
     },
diff --git a/website/i18n/zh-Hans/code.json b/website/i18n/zh-Hans/code.json
index e92fe8a..7b2b02c 100644
--- a/website/i18n/zh-Hans/code.json
+++ b/website/i18n/zh-Hans/code.json
@@ -325,5 +325,226 @@
   "theme.tags.tagsPageTitle": {
     "message": "标签",
     "description": "The title of the tag list page"
+  },
+  "component.statsSection.efficiency": {
+    "message": "GPU 资源效率",
+    "description": "Label for GPU resource efficiency statistic"
+  },
+  "component.statsSection.deployTime": {
+    "message": "平均部署时间",
+    "description": "Label for average deployment time statistic"
+  },
+  "component.statsSection.tenants": {
+    "message": "支持租户数",
+    "description": "Label for supported tenants statistic"
+  },
+  "component.statsSection.savings": {
+    "message": "成本节省",
+    "description": "Label for cost savings statistic"
+  },
+  "component.architectureDiagram.title": {
+    "message": "架构概览"
+  },
+  "component.architectureDiagram.subtitle": {
+    "message": "基于云原生技术构建，具备可扩展性和可靠性"
+  },
+  "component.architectureDiagram.node.bison": {
+    "message": "GPU 计费与调度平台",
+    "description": "Description for Bison node"
+  },
+  "component.architectureDiagram.node.capsule": {
+    "message": "多租户管理",
+    "description": "Description for Capsule node"
+  },
+  "component.architectureDiagram.node.opencost": {
+    "message": "成本追踪与分析",
+    "description": "Description for OpenCost node"
+  },
+  "component.architectureDiagram.node.k8s": {
+    "message": "容器编排",
+    "description": "Description for Kubernetes node"
+  },
+  "component.architectureDiagram.node.prometheus": {
+    "message": "指标收集",
+    "description": "Description for Prometheus node"
+  },
+  "component.useCases.title": {
+    "message": "真实应用场景"
+  },
+  "component.useCases.subtitle": {
+    "message": "了解 Bison 如何在不同场景下转变 GPU 资源管理"
+  },
+  "component.useCases.beforeBison": {
+    "message": "使用前"
+  },
+  "component.useCases.withBison": {
+    "message": "使用后"
+  },
+  "component.useCases.aiTraining.title": {
+    "message": "AI 训练平台",
+    "description": "Title for AI training use case"
+  },
+  "component.useCases.aiTraining.description": {
+    "message": "多团队机器学习工作负载的 GPU 资源共享",
+    "description": "Description for AI training use case"
+  },
+  "component.useCases.aiTraining.before.manual": {
+    "message": "手动分配 GPU",
+    "description": "AI training before: manual allocation"
+  },
+  "component.useCases.aiTraining.before.noCost": {
+    "message": "成本不可见",
+    "description": "AI training before: no cost visibility"
+  },
+  "component.useCases.aiTraining.before.conflicts": {
+    "message": "资源冲突",
+    "description": "AI training before: resource conflicts"
+  },
+  "component.useCases.aiTraining.after.automated": {
+    "message": "自动化调度",
+    "description": "AI training after: automated scheduling"
+  },
+  "component.useCases.aiTraining.after.realtime": {
+    "message": "实时成本追踪",
+    "description": "AI training after: real-time cost tracking"
+  },
+  "component.useCases.aiTraining.after.fair": {
+    "message": "公平资源共享",
+    "description": "AI training after: fair resource sharing"
+  },
+  "component.useCases.enterprise.title": {
+    "message": "企业云平台",
+    "description": "Title for enterprise cloud use case"
+  },
+  "component.useCases.enterprise.description": {
+    "message": "部门级资源隔离与计费",
+    "description": "Description for enterprise cloud use case"
+  },
+  "component.useCases.enterprise.before.chaos": {
+    "message": "共享集群混乱",
+    "description": "Enterprise before: shared cluster chaos"
+  },
+  "component.useCases.enterprise.before.noBudget": {
+    "message": "无预算控制",
+    "description": "Enterprise before: no budget control"
+  },
+  "component.useCases.enterprise.before.manual": {
+    "message": "手动报告",
+    "description": "Enterprise before: manual reporting"
+  },
+  "component.useCases.enterprise.after.isolated": {
+    "message": "租户隔离",
+    "description": "Enterprise after: isolated tenants"
+  },
+  "component.useCases.enterprise.after.prepaid": {
+    "message": "预付费余额",
+    "description": "Enterprise after: prepaid balances"
+  },
+  "component.useCases.enterprise.after.automated": {
+    "message": "自动化报表",
+    "description": "Enterprise after: automated reports"
+  },
+  "component.useCases.billing.title": {
+    "message": "成本中心计费",
+    "description": "Title for cost center billing use case"
+  },
+  "component.useCases.billing.description": {
+    "message": "内部 GPU 资源的分摊计费系统",
+    "description": "Description for cost center billing use case"
+  },
+  "component.useCases.billing.before.excel": {
+    "message": "基于 Excel 跟踪",
+    "description": "Billing before: Excel-based tracking"
+  },
+  "component.useCases.billing.before.monthly": {
+    "message": "月度对账",
+    "description": "Billing before: monthly reconciliation"
+  },
+  "component.useCases.billing.before.disputes": {
+    "message": "账单纠纷",
+    "description": "Billing before: billing disputes"
+  },
+  "component.useCases.billing.after.realtime": {
+    "message": "实时扣费",
+    "description": "Billing after: real-time deduction"
+  },
+  "component.useCases.billing.after.transparent": {
+    "message": "透明定价",
+    "description": "Billing after: transparent pricing"
+  },
+  "component.useCases.billing.after.automated": {
+    "message": "自动开票",
+    "description": "Billing after: automated invoicing"
+  },
+  "homepage.getStarted": {
+    "message": "快速开始"
+  },
+  "homepage.title": {
+    "message": "Bison - Kubernetes GPU 资源计费与多租户管理",
+    "description": "Homepage title"
+  },
+  "homepage.description": {
+    "message": "基于 Kubernetes、Capsule 和 OpenCost 的企业级 GPU 资源计费和多租户管理平台",
+    "description": "Homepage meta description"
+  },
+  "homepage.features.title": {
+    "message": "运行 GPU 集群所需的一切能力"
+  },
+  "homepage.features.subtitle": {
+    "message": "多租户、计量与计费 —— 统一在一个云原生平台中"
+  },
+  "homepage.feature.multitenant.title": {
+    "message": "多租户隔离"
+  },
+  "homepage.feature.multitenant.desc": {
+    "message": "基于 Capsule 实现真正的 Kubernetes 原生多租户。每个团队获得隔离的资源与共享/独占节点池，免去手动配额配置。"
+  },
+  "homepage.feature.billing.title": {
+    "message": "实时计费"
+  },
+  "homepage.feature.billing.desc": {
+    "message": "集成 OpenCost 自动追踪成本。按 Pod、按命名空间、按团队可视化，CPU、内存、GPU 价格均可自定义。"
+  },
+  "homepage.feature.dashboard.title": {
+    "message": "统一控制台"
+  },
+  "homepage.feature.dashboard.desc": {
+    "message": "为管理员、团队负责人与财务提供一站式视图：实时余额监控、告警、自动停用与完整用量报表。"
+  },
+  "homepage.feature.deploy.title": {
+    "message": "分钟级部署"
+  },
+  "homepage.feature.deploy.desc": {
+    "message": "零外部依赖 —— 所有数据存储于 Kubernetes ConfigMap。一条 Helm 命令安装，30 分钟内即可拥有完整的 GPU 资源管理能力。"
+  },
+  "homepage.feature.alerts.title": {
+    "message": "自动扣费与告警"
+  },
+  "homepage.feature.alerts.desc": {
+    "message": "预付费余额 + 实时扣费的自动计费。多渠道告警（Webhook、钉钉、企业微信），阈值可配置并支持自动停用。"
+  },
+  "homepage.feature.production.title": {
+    "message": "生产就绪"
+  },
+  "homepage.feature.production.desc": {
+    "message": "云原生架构，支持水平扩展、RBAC 集成与完整审计日志，提供多平台 Docker 镜像；企业 SSO 支持已在规划中。"
+  },
+  "showcase.title": {
+    "message": "一个控制台，管好 GPU 全生命周期"
+  },
+  "showcase.subtitle": {
+    "message": "从集群拓扑到团队级分摊计费 —— 每一个界面，皆由矢量渲染"
+  },
+  "showcase.tab.dashboard": {
+    "message": "资源总览"
+  },
+  "showcase.tab.cluster": {
+    "message": "集群节点"
+  },
+  "showcase.tab.report": {
+    "message": "报表中心"
+  },
+  "showcase.tab.billing": {
+    "message": "计费配置"
   }
 }
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/architecture.md b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/architecture.md
new file mode 100644
index 0000000..9b467ec
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/architecture.md
@@ -0,0 +1,418 @@
+---
+sidebar_position: 5
+---
+
+# 架构
+
+本文档提供 Bison 架构的技术概览，采用高内聚、低耦合的设计原则，以保证可维护性和可扩展性。
+
+## 系统概览
+
+### 高层架构
+
+```mermaid
+graph TB
+    subgraph PRESENT[展示层]
+        WEB[Web UI<br/>React 18 + Ant Design 5]
+        CLI[kubectl / API Client]
+    end
+
+    subgraph GATEWAY[API 网关层]
+        GW[API Server<br/>Go + Gin Framework]
+        AUTH[Auth Middleware<br/>JWT + OIDC]
+    end
+
+    subgraph BUSINESS[业务逻辑层]
+        TS[Tenant Service<br/>团队与项目 CRUD]
+        BS[Billing Service<br/>成本计算]
+        BLS[Balance Service<br/>钱包管理]
+        QS[Quota Service<br/>资源限制]
+        AS[Alert Service<br/>通知]
+        RS[Report Service<br/>分析]
+    end
+
+    subgraph INTEGRATION[集成层]
+        K8S[Kubernetes Client<br/>client-go]
+        OCC[OpenCost Client<br/>REST API]
+        PC[Prometheus Client<br/>PromQL]
+    end
+
+    subgraph EXTERNAL[外部系统]
+        KAPI[Kubernetes API]
+        CAP[Capsule Controller]
+        OC[OpenCost]
+        PROM[Prometheus]
+    end
+
+    subgraph DATA[数据层]
+        CM[ConfigMaps<br/>持久化存储]
+    end
+
+    WEB --> GW
+    CLI --> GW
+    GW --> AUTH
+    AUTH --> TS & BS & BLS & QS & AS & RS
+
+    TS --> K8S
+    BS --> OCC
+    BLS --> K8S
+    QS --> K8S
+    RS --> OCC & PC
+
+    K8S --> KAPI
+    K8S --> CAP
+    OCC --> OC
+    PC --> PROM
+
+    TS & BLS --> CM
+    KAPI --> CM
+```
+
+### 设计原则
+
+| 原则 | 实现方式 |
+|-----------|----------------|
+| **高内聚** | 每个服务处理单一领域（计费、配额、告警） |
+| **低耦合** | 服务之间通过明确定义的接口通信 |
+| **无状态 API** | 所有状态持久化到 Kubernetes ConfigMaps |
+| **云原生** | 利用 Kubernetes 原语实现高可用和扩展 |
+| **零数据库** | ConfigMaps 消除了外部数据库依赖 |
+
+## 架构层次
+
+Bison 遵循分层架构模式：
+
+### 1. 展示层
+- **Web UI**: React 18 + TypeScript + Ant Design 5
+- **API Client**: REST API 用于外部集成
+
+### 2. API 网关层
+- **API Server**: Go + Gin 框架
+- **认证**: JWT 支持（OIDC 规划中）
+- **中间件**: 日志、恢复、CORS 处理
+
+### 3. 业务逻辑层
+- **Tenant Service**: 团队和项目管理
+- **Billing Service**: 成本计算和聚合
+- **Balance Service**: 钱包管理和自动扣费
+- **Quota Service**: 资源限制执行
+- **Alert Service**: 多渠道通知
+- **Report Service**: 分析和导出
+
+### 4. 集成层
+- **Kubernetes Client**: client-go 用于 K8s API 交互
+- **OpenCost Client**: REST API 用于成本数据
+- **Prometheus Client**: PromQL 查询指标
+
+### 5. 数据层
+- **ConfigMaps**: 余额、计费配置和元数据的持久化存储
+- **etcd**: Kubernetes ConfigMaps 的底层后端存储
+
+## 核心组件
+
+### API Server
+
+API Server 是处理所有 HTTP 请求的核心组件：
+
+**技术栈：**
+- Go 1.24+
+- Gin web 框架
+- client-go 用于 Kubernetes API
+
+**关键职责：**
+- 提供 REST API 端点
+- 认证和授权
+- 请求路由和中间件
+- 后台任务调度
+
+**端点：**
+```
+/api/v1/teams          - 团队管理
+/api/v1/projects       - 项目管理
+/api/v1/billing        - 计费配置
+/api/v1/balance        - 余额操作
+/api/v1/stats          - 统计和报告
+```
+
+### Web UI
+
+基于 React 的单页应用：
+
+**技术栈：**
+- React 18
+- TypeScript
+- Vite（构建工具）
+- Ant Design 5
+- ECharts（可视化）
+- React Query（状态管理）
+
+**功能：**
+- 实时指标仪表板
+- 团队和项目管理
+- 计费配置
+- 余额监控
+- 使用报告和导出
+
+### Billing Service
+
+基于资源使用计算成本：
+
+**数据流：**
+```mermaid
+sequenceDiagram
+    participant S as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant K8S as Kubernetes
+
+    S->>BS: 触发计费（每 10 分钟）
+    BS->>OC: 查询团队成本
+    OC-->>BS: 返回使用数据
+    BS->>BS: 计算成本
+    BS->>BLS: 从余额扣除
+    BLS->>K8S: 更新 ConfigMap
+    BLS-->>BS: 确认
+    BS->>AS: 检查阈值
+    alt 余额不足
+        AS->>Webhook: 发送告警
+    end
+```
+
+**计费公式：**
+```
+总成本 = (CPU_核数 × CPU_价格 × 小时) +
+        (内存_GB × 内存_价格 × 小时) +
+        (GPU_数量 × GPU_价格 × 小时)
+```
+
+### Balance Service
+
+管理团队钱包和自动扣费：
+
+**功能：**
+- 实时余额追踪
+- 基于使用量自动扣费
+- 充值操作
+- 交易历史
+- 余额耗尽时自动暂停
+
+**存储：**
+```yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: bison-team-balances
+  namespace: bison-system
+data:
+  ml-team: "1523.45"
+  data-team: "890.12"
+  dev-team: "2100.00"
+```
+
+### Tenant Service
+
+管理团队（Capsule Tenants）和项目（Namespaces）：
+
+**功能：**
+- 创建/删除团队
+- 分配资源配额
+- 配置节点池（共享/独占）
+- 管理团队元数据
+
+**Capsule 集成：**
+```yaml
+apiVersion: capsule.clastix.io/v1beta1
+kind: Tenant
+metadata:
+  name: ml-team
+spec:
+  owners:
+  - name: team-leader
+    kind: User
+  resourceQuota:
+    items:
+    - hard:
+        cpu: "20"
+        memory: 64Gi
+        nvidia.com/gpu: "4"
+```
+
+## 数据流
+
+### 团队创建流程
+
+```mermaid
+sequenceDiagram
+    participant U as Admin
+    participant API as API Server
+    participant TS as Tenant Service
+    participant K8S as Kubernetes
+    participant CAP as Capsule
+
+    U->>API: POST /api/v1/teams
+    API->>TS: CreateTeam(name, quota, balance)
+    TS->>CAP: 创建 Tenant
+    CAP-->>TS: Tenant 已创建
+    TS->>K8S: 创建 ConfigMap（余额）
+    K8S-->>TS: ConfigMap 已创建
+    TS-->>API: 成功
+    API-->>U: 201 Created
+```
+
+### 计费周期流程
+
+```mermaid
+sequenceDiagram
+    participant SCH as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant AS as Alert Service
+
+    loop 每 10 分钟
+        SCH->>BS: 触发计费计算
+        BS->>OC: 查询成本（最近 10 分钟）
+        OC-->>BS: 返回使用指标
+        BS->>BS: 计算总成本
+        BS->>BLS: 从余额扣除成本
+        BLS->>BLS: 更新余额
+        BLS-->>BS: 余额已更新
+        BS->>AS: 检查余额阈值
+        alt 余额 < 20%
+            AS->>AS: 发送低余额告警
+        end
+        alt 余额 <= 0
+            AS->>BS: 暂停团队工作负载
+        end
+    end
+```
+
+## 集成点
+
+### Kubernetes 集成
+
+Bison 与 Kubernetes 深度集成：
+
+- **Capsule Tenants** 用于多租户
+- **ResourceQuotas** 用于限制执行
+- **Namespaces** 用于项目隔离
+- **ConfigMaps** 用于数据持久化
+- **RBAC** 用于访问控制
+
+### OpenCost 集成
+
+通过 OpenCost API 实现实时成本追踪：
+
+```bash
+# 查询团队成本
+GET /allocation/compute?window=10m&aggregate=namespace&filter=namespace:ml-team
+
+# 响应
+{
+  "ml-team": {
+    "cpuCost": 0.25,
+    "memCost": 0.10,
+    "gpuCost": 4.17,
+    "totalCost": 4.52
+  }
+}
+```
+
+### Prometheus 集成
+
+指标收集用于监控：
+
+- 资源利用率指标
+- 成本指标
+- 余额指标
+- 告警指标
+
+## 部署架构
+
+### 高可用设置
+
+```mermaid
+graph TB
+    subgraph K8S[Kubernetes 集群]
+        subgraph NS1[bison-system 命名空间]
+            API1[API Server Pod 1]
+            API2[API Server Pod 2]
+            WEB1[Web UI Pod 1]
+            WEB2[Web UI Pod 2]
+        end
+
+        subgraph NS2[opencost 命名空间]
+            OC[OpenCost]
+        end
+
+        subgraph NS3[prometheus-system 命名空间]
+            PROM[Prometheus]
+        end
+
+        LB[LoadBalancer]
+    end
+
+    LB --> API1 & API2
+    LB --> WEB1 & WEB2
+    API1 & API2 --> OC
+    OC --> PROM
+```
+
+### 资源要求
+
+**最低配置：**
+- API Server: 200m CPU，256Mi 内存
+- Web UI: 100m CPU，128Mi 内存
+
+**推荐配置（生产环境）：**
+- API Server: 1000m CPU，512Mi 内存（2 个副本）
+- Web UI: 500m CPU，256Mi 内存（2 个副本）
+
+## 安全模型
+
+### 认证
+- 基于 JWT token 的认证
+- OIDC/SSO 集成（规划中）
+- 管理员用户管理
+
+### 授权
+- Kubernetes RBAC 集成
+- 基于角色的访问控制
+- 团队范围的权限
+
+### 数据安全
+- 所有数据静态加密（etcd 加密）
+- API 通信使用 TLS
+- 通过 Kubernetes Secrets 管理密钥
+
+## 技术栈
+
+### 后端
+- **语言**: Go 1.24+
+- **框架**: Gin
+- **Kubernetes 客户端**: client-go
+- **配置**: Viper
+- **日志**: Logrus
+
+### 前端
+- **框架**: React 18
+- **语言**: TypeScript
+- **UI 库**: Ant Design 5
+- **构建工具**: Vite
+- **状态管理**: React Query
+- **图表**: ECharts
+
+### 基础设施
+- **平台**: Kubernetes 1.22+
+- **多租户**: Capsule
+- **成本追踪**: OpenCost
+- **指标**: Prometheus
+- **存储**: ConfigMaps（etcd）
+
+## 下一步
+
+- [安装指南](installation.md) - 部署 Bison
+- [配置](configuration.md) - 配置计费
+- [用户指南](user-guides/admin.md) - 学习使用 Bison
+- [功能特性](features.md) - 探索功能
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/configuration.md b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/configuration.md
new file mode 100644
index 0000000..e8d7e4f
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/configuration.md
@@ -0,0 +1,361 @@
+---
+sidebar_position: 6
+---
+
+# 配置
+
+本指南介绍如何根据您的特定环境和需求配置 Bison。
+
+## Helm Chart 配置
+
+Bison 主要通过 Helm values 进行配置。您可以通过提供 `values.yaml` 文件或使用 `--set` 参数来自定义安装。
+
+### 关键配置参数
+
+| 参数 | 描述 | 默认值 | 示例 |
+|-----------|-------------|---------|---------|
+| `auth.enabled` | 启用认证 | `false` | `true` |
+| `auth.admin.username` | 管理员用户名 | `admin` | `admin` |
+| `auth.admin.password` | 管理员密码 | `admin` | `changeme` |
+| `apiServer.replicaCount` | API Server 副本数 | `2` | `3` |
+| `apiServer.image.repository` | API Server 镜像 | `ghcr.io/supermarioyl/bison/api-server` | - |
+| `apiServer.image.tag` | API Server 镜像标签 | `0.0.1` | `latest` |
+| `webUI.replicaCount` | Web UI 副本数 | `2` | `3` |
+| `webUI.image.repository` | Web UI 镜像 | `ghcr.io/supermarioyl/bison/web-ui` | - |
+| `webUI.image.tag` | Web UI 镜像标签 | `0.0.1` | `latest` |
+| `opencost.url` | OpenCost API 端点 | `http://opencost.opencost-system.svc:9003` | 自定义 URL |
+
+### 自定义 Values 示例
+
+创建一个 `custom-values.yaml` 文件：
+
+```yaml
+# 认证
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: MySecurePassword123
+
+# API Server
+apiServer:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 200m
+      memory: 256Mi
+    limits:
+      cpu: 1000m
+      memory: 512Mi
+
+# Web UI
+webUI:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 100m
+      memory: 128Mi
+    limits:
+      cpu: 500m
+      memory: 256Mi
+
+# OpenCost 集成
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# 节点选择（可选）
+nodeSelector:
+  node-role.kubernetes.io/control-plane: ""
+
+# 容忍度（可选）
+tolerations:
+  - key: node-role.kubernetes.io/control-plane
+    operator: Exists
+    effect: NoSchedule
+```
+
+使用自定义 values 安装：
+
+```bash
+helm install bison bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --values custom-values.yaml
+```
+
+## 计费配置
+
+计费设置在安装后通过 Web UI 或 API 进行配置。
+
+### 访问计费配置
+
+1. **通过 Web UI：**
+   - 导航到 **设置** > **计费配置**
+   - 设置 CPU、内存、GPU 和其他资源的价格
+   - 配置货币和计费周期
+
+2. **通过 API：**
+   ```bash
+   curl -X POST http://localhost:8080/api/v1/billing/config \
+     -H "Content-Type: application/json" \
+     -d '{
+       "enabled": true,
+       "currency": "USD",
+       "pricing": {
+         "cpu": 0.05,
+         "memory": 0.01,
+         "nvidia.com/gpu": 2.50
+       },
+       "billingInterval": "hourly"
+     }'
+   ```
+
+### 计费参数
+
+| 参数 | 描述 | 示例 |
+|-----------|-------------|---------|
+| `enabled` | 启用/禁用计费 | `true` |
+| `currency` | 计费货币 | `USD`, `CNY`, `EUR` |
+| `pricing.cpu` | CPU 价格（每核心小时） | `0.05` |
+| `pricing.memory` | 内存价格（每 GB 小时） | `0.01` |
+| `pricing["nvidia.com/gpu"]` | GPU 价格（每 GPU 小时） | `2.50` |
+| `billingInterval` | 计费聚合周期 | `hourly`, `daily` |
+| `lowBalanceThreshold` | 警告阈值（%） | `20` |
+| `suspendThreshold` | 自动暂停阈值（%） | `5` |
+
+### 计费配置示例
+
+```json
+{
+  "enabled": true,
+  "currency": "USD",
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "nvidia.com/mig-1g.5gb": 0.50,
+    "nvidia.com/mig-2g.10gb": 1.00
+  },
+  "billingInterval": "hourly",
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## 团队配置
+
+### 创建团队
+
+团队可以通过 Web UI 或 API 创建：
+
+**通过 Web UI：**
+1. 导航到 **团队** 页面
+2. 点击 **创建团队**
+3. 设置团队名称、配额和初始余额
+
+**通过 API：**
+```bash
+curl -X POST http://localhost:8080/api/v1/teams \
+  -H "Content-Type: application/json" \
+  -d '{
+    "name": "ml-team",
+    "description": "Machine Learning Team",
+    "quota": {
+      "cpu": "20",
+      "memory": "64Gi",
+      "nvidia.com/gpu": "4"
+    },
+    "balance": 1000.00
+  }'
+```
+
+### 团队配额
+
+团队配额定义资源限制：
+
+```yaml
+quota:
+  cpu: "20"              # 20 个 CPU 核心
+  memory: "64Gi"         # 64 GB 内存
+  nvidia.com/gpu: "4"    # 4 个 GPU
+  storage: "500Gi"       # 500 GB 存储
+```
+
+### 团队余额管理
+
+设置初始余额并配置自动充值：
+
+```json
+{
+  "balance": 1000.00,
+  "autoRecharge": {
+    "enabled": true,
+    "amount": 500.00,
+    "schedule": "monthly",
+    "threshold": 100.00
+  }
+}
+```
+
+## 告警配置
+
+配置多渠道告警，用于低余额和配额警告。
+
+### Webhook 告警
+
+```json
+{
+  "type": "webhook",
+  "enabled": true,
+  "url": "https://your-webhook-endpoint.com/alerts",
+  "headers": {
+    "Authorization": "Bearer YOUR_TOKEN"
+  },
+  "template": {
+    "title": "Bison Alert",
+    "message": "Team {{.TeamName}} balance is {{.Balance}}"
+  }
+}
+```
+
+### 钉钉告警
+
+```json
+{
+  "type": "dingtalk",
+  "enabled": true,
+  "webhook": "https://oapi.dingtalk.com/robot/send?access_token=YOUR_TOKEN",
+  "secret": "YOUR_SECRET"
+}
+```
+
+### 企业微信告警
+
+```json
+{
+  "type": "wechat",
+  "enabled": true,
+  "corpid": "YOUR_CORP_ID",
+  "corpsecret": "YOUR_CORP_SECRET",
+  "agentid": 1000001
+}
+```
+
+## OpenCost 集成
+
+配置 OpenCost 连接：
+
+### 检查 OpenCost 连通性
+
+```bash
+# 测试 OpenCost API（port-forward 会占用当前终端，请在另一个终端中执行 curl）
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+curl http://localhost:9003/healthz
+
+# 测试 allocation API（URL 含 ?，需加引号以避免 shell 通配符展开）
+curl "http://localhost:9003/allocation/compute?window=1d"
+```
+
+### 更新 OpenCost URL
+
+如果 OpenCost 部署在不同的命名空间或使用不同的服务名称：
+
+```bash
+helm upgrade bison bison/bison \
+  --set opencost.url=http://my-opencost.custom-namespace.svc:9003 \
+  --namespace bison-system
+```
+
+## 认证与 OIDC
+
+启用认证并与您的 SSO 提供商集成：
+
+### 基本认证
+
+```yaml
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: SecurePassword123
+```
+
+### OIDC 集成
+
+```yaml
+auth:
+  enabled: true
+  oidc:
+    enabled: true
+    issuerURL: https://your-oidc-provider.com
+    clientID: bison-client-id
+    clientSecret: your-client-secret
+    redirectURL: https://bison.example.com/callback
+```
+
+## 环境变量
+
+可以通过环境变量提供其他配置：
+
+| 变量 | 描述 | 默认值 |
+|----------|-------------|---------|
+| `KUBECONFIG` | kubeconfig 文件路径 | 集群内配置 |
+| `OPENCOST_URL` | OpenCost API URL | `http://opencost.opencost-system.svc:9003` |
+| `AUTH_ENABLED` | 启用认证 | `false` |
+| `LOG_LEVEL` | 日志级别 | `info` |
+| `BILLING_INTERVAL` | 计费计算间隔 | `10m` |
+
+在 Helm values 中设置环境变量：
+
+```yaml
+apiServer:
+  env:
+    - name: LOG_LEVEL
+      value: debug
+    - name: BILLING_INTERVAL
+      value: 5m
+```
+
+## 高级配置
+
+### 自定义资源定价
+
+为任何 Kubernetes 资源定价：
+
+```json
+{
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "amd.com/gpu": 2.00,
+    "ephemeral-storage": 0.001,
+    "custom.io/fpga": 5.00
+  }
+}
+```
+
+### 多集群支持
+
+在每个集群中部署 Bison，共享计费：
+
+```yaml
+# 集群 A
+apiServer:
+  clusterName: prod-us-west
+
+# 集群 B
+apiServer:
+  clusterName: prod-us-east
+```
+
+## 下一步
+
+- [用户指南](user-guides/admin.md) - 学习如何使用 Bison
+- [架构](architecture.md) - 理解系统设计
+- [功能特性](features.md) - 探索所有功能
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/features.md b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/features.md
new file mode 100644
index 0000000..fd3be31
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/features.md
@@ -0,0 +1,195 @@
+---
+sidebar_position: 2
+---
+
+# 功能特性
+
+Bison 为 Kubernetes 环境中的 GPU 资源管理、计费和多租户隔离提供了全面的功能套件。
+
+## Bison 功能演示
+
+### 🎯 实时资源仪表板
+
+![Bison Dashboard](/img/ui-dashboard.png)
+
+**您可以看到：**
+- **集群概览** - 一目了然地查看总团队数、项目数、资源池和配额
+- **资源利用率** - 可视化展示哪些团队正在消耗资源
+- **7 天成本趋势** - 历史成本数据，用于识别支出模式
+- **Top 5 成本排名** - 快速识别 GPU 重度使用者
+- **团队预算状态** - 实时余额监控，带有颜色编码的告警
+
+**谁会受益：**
+- **平台管理员** 即时了解集群健康状况和使用模式
+- **财务团队** 可以实时跟踪成本，无需等待月度报告
+- **团队负责人** 可以将自己的使用情况与其他团队进行比较
+
+---
+
+### 💼 团队管理与预算监控
+
+![Team Management](/img/ui-team.png)
+
+**您可以看到：**
+- **团队列表** 带有实时状态指示器：
+  - 🟢 绿色余额 = 预算健康
+  - 🟡 黄色余额 = 接近阈值
+  - 🔴 红色余额 = 余额不足或已暂停
+- **资源分配** - 每个团队的 CPU/内存/GPU 配额（例如，"cpu 0/10" 表示已分配 10 个中使用了 0 个）
+- **项目计数** - 每个团队下的命名空间/项目数量
+- **快速操作** - 一键编辑配额、充值余额或删除团队
+
+**谁会受益：**
+- **团队负责人** 一目了然地监控他们的预算状态和资源使用情况
+- **管理员** 从单一统一视图管理多个团队
+- **财务团队** 查看哪些团队需要充值
+
+---
+
+### 💰 灵活的计费配置
+
+![Billing Configuration](/img/ui-billing.png)
+
+**您可以看到：**
+- **按资源定价** - 为 CPU（每核心小时）、内存（每 GB 小时）、GPU（每 GPU 小时）设置自定义价格
+- **货币选择** - 支持 CNY、USD、EUR 等货币
+- **启用/禁用开关** - 一键打开或关闭特定资源的计费
+- **计费规则** - 定义资源计量方式（每小时、每天等）
+- **告警阈值** - 配置何时发送低余额警告
+
+**谁会受益：**
+- **财务团队** 将云成本与内部成本分摊（chargeback）政策对齐
+- **管理员** 根据实际硬件成本调整定价
+- **预算管理者** 设置适当的警告阈值以防止超支
+
+---
+
+## 核心能力
+
+### 多租户管理
+✅ **Capsule 驱动的隔离** - 使用 Kubernetes 原生 Capsule operator 实现真正的多租户
+✅ **OIDC 集成** - 企业 SSO 支持认证
+✅ **基于团队的访问控制** - 管理每个团队的用户、角色和权限
+✅ **共享与独占节点池** - 灵活的资源分配策略
+
+### 实时计费
+✅ **基于使用量的计费** - 基于实际资源消耗的准确成本追踪
+✅ **可配置定价** - 为 CPU、内存、GPU 和任何 Kubernetes 资源设置自定义费率
+✅ **多货币支持** - CNY、USD、EUR 等
+✅ **计费规则引擎** - 定义自定义计费逻辑和聚合周期
+
+### 动态资源配额
+✅ **团队级配额** - CPU、内存、GPU、存储和自定义资源
+✅ **命名空间配额** - 团队内的项目级资源限制
+✅ **自动执行** - Kubernetes 原生配额执行
+✅ **配额告警** - 接近限制时的通知
+
+### 团队余额与钱包系统
+✅ **预付费余额** - 团队钱包实时扣费
+✅ **自动扣费** - 基于资源使用的自动计费
+✅ **余额阈值** - 可配置的警告和暂停级别
+✅ **交易历史** - 所有余额变更的完整审计跟踪
+
+### 自动充值
+✅ **定时充值** - 每周或每月自动充值
+✅ **自定义金额** - 每个团队的灵活充值金额
+✅ **充值通知** - 余额增加时通知团队
+
+### 余额告警
+✅ **多渠道通知** - Webhook、钉钉、企业微信、邮件
+✅ **可配置阈值** - 设置警告级别（例如 20%、10%、5%）
+✅ **自动暂停** - 余额耗尽时自动暂停工作负载
+✅ **自定义模板** - 自定义告警消息
+
+### 使用报告
+✅ **团队分析** - 团队级成本细分和趋势
+✅ **项目分析** - 命名空间级资源消耗
+✅ **导出功能** - CSV、Excel、PDF 报告
+✅ **历史数据** - 30/60/90 天成本分析
+
+### 审计日志
+✅ **完整操作历史** - 跟踪所有管理操作
+✅ **用户归属** - 谁在何时做了什么
+✅ **资源变更** - 跟踪配额、余额和配置变更
+✅ **合规就绪** - 满足内部审计要求
+
+---
+
+## 架构亮点
+
+Bison 的架构设计简单、可扩展，且无外部依赖。
+
+```mermaid
+graph TB
+    subgraph USER_LAYER[用户层]
+        UI[Web UI<br/>React + Ant Design]
+        API[REST API<br/>Go + Gin]
+    end
+
+    subgraph CORE[核心服务]
+        BS[Billing Service]
+        TS[Tenant Service]
+        QS[Quota Service]
+    end
+
+    subgraph K8S[Kubernetes 层]
+        CA[Capsule<br/>多租户]
+        OC[OpenCost<br/>成本追踪]
+        PR[Prometheus<br/>指标]
+    end
+
+    subgraph DATA[数据层]
+        CM[ConfigMaps<br/>零数据库]
+    end
+
+    UI --> API
+    API --> BS & TS & QS
+    BS --> OC
+    TS --> CA
+    QS --> CA
+    BS & TS --> CM
+    OC --> PR
+```
+
+### 关键架构优势
+
+- **零外部依赖** - 所有数据存储在 Kubernetes ConfigMaps（由 etcd 持久化）
+- **云原生** - 基于 Kubernetes 原语构建，实现最大可移植性
+- **可伸缩** - 无状态 API Server 可以水平扩展
+- **安全** - Kubernetes RBAC 集成和可选认证
+- **可观测** - Prometheus 指标和结构化日志
+- **可扩展** - 用于自定义计费规则和告警的插件架构
+
+---
+
+## 集成点
+
+### OpenCost 集成
+Bison 利用 [OpenCost](https://www.opencost.io/) 进行实时成本追踪：
+- 按 pod、按命名空间、按团队的成本可见性
+- GPU 利用率指标
+- 历史成本数据和趋势
+- 与 Prometheus 集成以收集指标
+
+### Capsule 集成
+Bison 使用 [Capsule](https://capsule.clastix.io/) 实现多租户：
+- 基于团队的租户隔离
+- 命名空间配额执行
+- 网络和安全策略
+- OIDC/SSO 集成
+
+### Prometheus 集成
+指标收集和监控：
+- 资源利用率追踪
+- 自定义计费指标
+- 告警规则评估
+- 历史数据保留
+
+---
+
+## 下一步
+
+- [安装指南](installation.md) - 在您的集群中部署 Bison
+- [用户指南](user-guides/admin.md) - 学习如何使用 Bison
+- [架构](architecture.md) - 深入了解系统设计
+- [配置](configuration.md) - 配置计费和设置
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/installation.md b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/installation.md
new file mode 100644
index 0000000..55dae7f
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/installation.md
@@ -0,0 +1,316 @@
+---
+sidebar_position: 3
+---
+
+# 安装指南
+
+本指南提供在 Kubernetes 集群中安装 Bison 的详细说明。
+
+## 前置要求
+
+在安装 Bison 之前，请确保您具备：
+
+- **Kubernetes 1.22+** - 正在运行的 Kubernetes 集群
+- **kubectl** - 已配置为访问您的集群
+- **Helm 3.8+** - Kubernetes 包管理器（从 GHCR 安装 OCI chart 需要 3.8.0 及以上版本）
+- **Capsule Operator v0.1.0+** - 用于多租户隔离
+- **OpenCost** - 已与 Prometheus 一起部署用于成本追踪
+
+### 安装前置组件
+
+如果您还没有安装所需的组件：
+
+#### 安装 Capsule
+
+```bash
+# 使用 Helm
+helm repo add projectcapsule https://projectcapsule.github.io/charts
+helm install capsule projectcapsule/capsule \
+  --namespace capsule-system \
+  --create-namespace
+```
+
+#### 安装 OpenCost
+
+```bash
+# 使用 Helm
+helm repo add opencost https://opencost.github.io/opencost-helm-chart
+helm install opencost opencost/opencost \
+  --namespace opencost-system \
+  --create-namespace \
+  --set prometheus.internal.serviceName=prometheus-server \
+  --set prometheus.internal.namespaceName=prometheus-system
+```
+
+## 安装方法
+
+Bison Helm charts 通过 **GitHub Container Registry (GHCR)** 使用现代 OCI 格式分发。
+
+**要求：**
+- Helm >= 3.8.0（用于 OCI 支持）
+- Kubernetes >= 1.22
+
+### 方式 A：从 GHCR 安装（推荐）
+
+从 GitHub Container Registry 直接安装 Bison 是最简单的方法：
+
+```bash
+# 从 GHCR 安装特定版本
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace
+
+# 或先拉取 chart，然后安装
+helm pull oci://ghcr.io/supermarioyl/bison/bison --version 0.0.2
+helm install bison bison-0.0.2.tgz \
+  --namespace bison-system \
+  --create-namespace
+
+# 自定义安装
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true \
+  --set apiServer.image.tag=0.0.2 \
+  --set webUI.image.tag=0.0.2
+```
+
+**为什么使用 GHCR OCI 格式？**
+- ✅ 无需维护单独的 Helm 仓库
+- ✅ 在 GHCR 中与 Docker 镜像统一
+- ✅ 更快的安装速度（直接从注册表拉取）
+- ✅ 现代 Helm 3.8+ 标准实践
+
+### 方式 B：从 GitHub Release 安装
+
+从 GitHub Releases 下载特定版本：
+
+```bash
+# 下载 Helm chart
+VERSION=0.0.2
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# 安装 chart
+helm install bison bison-${VERSION}.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+### 方式 C：从源码安装
+
+克隆并从源码构建：
+
+```bash
+# 克隆仓库
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
+
+# 安装依赖并构建
+make install-deps
+make build
+
+# 使用 Helm 部署
+helm install bison ./deploy/charts/bison \
+  --namespace bison-system \
+  --create-namespace
+```
+
+## 配置选项
+
+Bison 可以使用 Helm values 进行配置。以下是关键配置选项：
+
+### 基本配置
+
+```yaml
+# values.yaml
+apiServer:
+  image:
+    repository: ghcr.io/supermarioyl/bison/api-server
+    tag: 0.0.1
+  replicaCount: 2
+
+webUI:
+  image:
+    repository: ghcr.io/supermarioyl/bison/web-ui
+    tag: 0.0.1
+  replicaCount: 2
+
+# OpenCost URL
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# 认证
+auth:
+  enabled: false
+```
+
+### 自定义配置示例
+
+```bash
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set apiServer.replicaCount=3 \
+  --set webUI.replicaCount=3 \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true
+```
+
+## 验证安装
+
+安装后，验证所有组件是否正在运行：
+
+```bash
+# 检查 pod 状态
+kubectl get pods -n bison-system
+
+# 预期输出：
+# NAME                              READY   STATUS    RESTARTS   AGE
+# bison-api-server-xxxxxxxxx-xxxxx  1/1     Running   0          2m
+# bison-webui-xxxxxxxxx-xxxxx       1/1     Running   0          2m
+
+# 检查服务
+kubectl get svc -n bison-system
+
+# 检查日志
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl logs -n bison-system deployment/bison-webui
+```
+
+## 访问平台
+
+### 端口转发（开发环境）
+
+```bash
+# 端口转发 Web UI
+kubectl port-forward -n bison-system svc/bison-webui 3000:80
+
+# 访问 http://localhost:3000
+```
+
+### Ingress（生产环境）
+
+对于生产部署，配置 Ingress：
+
+```yaml
+# ingress.yaml
+apiVersion: networking.k8s.io/v1
+kind: Ingress
+metadata:
+  name: bison-ingress
+  namespace: bison-system
+spec:
+  # kubernetes.io/ingress.class 注解已弃用，改用 spec.ingressClassName
+  ingressClassName: nginx
+  rules:
+  - host: bison.example.com
+    http:
+      paths:
+      - path: /
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-webui
+            port:
+              number: 80
+      - path: /api
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-api-server
+            port:
+              number: 8080
+```
+
+应用 Ingress：
+
+```bash
+kubectl apply -f ingress.yaml
+```
+
+## Docker 镜像
+
+Bison 镜像可在 GitHub Container Registry 上获取：
+
+```bash
+# 拉取镜像
+docker pull ghcr.io/supermarioyl/bison/api-server:0.0.1
+docker pull ghcr.io/supermarioyl/bison/web-ui:0.0.1
+
+# 或使用 latest
+docker pull ghcr.io/supermarioyl/bison/api-server:latest
+docker pull ghcr.io/supermarioyl/bison/web-ui:latest
+```
+
+**支持的平台：**
+- `linux/amd64`
+- `linux/arm64`
+
+## 升级
+
+将 Bison 升级到新版本：
+
+```bash
+# 更新 Helm 仓库（需已执行 helm repo add bison https://supermarioyl.github.io/Bison/）
+helm repo update
+
+# 升级到最新版本
+helm upgrade bison bison/bison --namespace bison-system
+
+# 或升级到特定版本
+helm upgrade bison bison/bison --version 0.0.2 --namespace bison-system
+```
+
+## 卸载
+
+完全删除 Bison：
+
+```bash
+# 卸载 Helm release
+helm uninstall bison --namespace bison-system
+
+# 删除命名空间（可选）
+kubectl delete namespace bison-system
+```
+
+## 故障排查
+
+### Pod 无法启动
+
+检查 pod 日志以查找错误：
+
+```bash
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl describe pod -n bison-system <pod-name>
+```
+
+### 无法连接到 OpenCost
+
+验证 OpenCost 是否正在运行且可访问：
+
+```bash
+kubectl get svc -n opencost-system
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+
+# 测试端点（port-forward 会占用当前终端，请在另一个终端中执行）
+curl http://localhost:9003/healthz
+```
+
+### 认证问题
+
+如果启用了认证，请确保您有正确的凭据：
+
+```text
+# 默认凭据（生产环境请更改！）
+用户名: admin
+密码: admin
+```
+
+## 下一步
+
+- [配置指南](configuration.md) - 配置计费和设置
+- [用户指南](user-guides/admin.md) - 学习如何使用 Bison
+- [架构](architecture.md) - 理解系统设计
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/intro.md b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/intro.md
new file mode 100644
index 0000000..1a9216b
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/intro.md
@@ -0,0 +1,62 @@
+---
+sidebar_position: 1
+---
+
+# 简介
+
+让我们**在不到 5 分钟内**了解 **Bison**。
+
+## 开始使用
+
+通过**创建新集群**或**添加 Bison 到现有 Kubernetes 集群**开始使用。
+
+### 您需要什么
+
+- [Kubernetes](https://kubernetes.io/) 版本 1.22 或更高：
+  - 运行中的 Kubernetes 集群
+  - 已配置 kubectl 访问
+- [Helm](https://helm.sh/) 版本 3.x 或更高
+- [Capsule](https://capsule.clastix.io/) 用于多租户管理
+- [OpenCost](https://www.opencost.io/) 用于成本追踪
+- [Prometheus](https://prometheus.io/) 用于指标收集
+
+## 安装 Bison
+
+使用 Helm 在您的 Kubernetes 集群中安装 Bison：
+
+```bash
+# 添加 Bison Helm 仓库
+helm repo add bison https://supermarioyl.github.io/Bison/
+helm repo update
+
+# 安装 Bison
+helm install bison bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system:9003
+```
+
+## 配置您的第一个租户
+
+安装完成后，创建您的第一个租户（团队）：
+
+```bash
+kubectl apply -f - <<EOF
+apiVersion: capsule.clastix.io/v1beta2
+kind: Tenant
+metadata:
+  name: team-ai
+spec:
+  owners:
+  - name: admin@team-ai.com
+    kind: User
+EOF
+```
+
+恭喜！您已经在 Kubernetes 集群上成功安装并配置了 **Bison**！🎉
+
+## 下一步
+
+- 了解 Bison 的[核心功能](./features.md)
+- 探索[架构设计](./architecture.md)
+- 查看[用户指南](./category/user-guides)了解不同角色的使用方法
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/_category_.json b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/_category_.json
new file mode 100644
index 0000000..3fbcf22
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "用户指南",
+  "position": 4,
+  "link": {
+    "type": "generated-index",
+    "description": "基于角色的 Bison 使用指南。"
+  }
+}
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/admin.md b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/admin.md
new file mode 100644
index 0000000..28d259d
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/admin.md
@@ -0,0 +1,176 @@
+---
+sidebar_position: 1
+---
+
+# 管理员指南
+
+本指南面向部署、配置和管理 Bison 平台的平台管理员。
+
+## 职责
+
+作为平台管理员，您负责：
+
+- ✅ 部署和配置 Bison
+- ✅ 创建和管理团队
+- ✅ 设置全局计费配置
+- ✅ 监控集群范围的指标
+- ✅ 响应告警和充值请求
+
+## 入门
+
+### 1. 部署 Bison
+
+按照[安装指南](../installation.md)在您的 Kubernetes 集群中部署 Bison。
+
+### 2. 配置计费
+
+设置计费规则和定价：
+
+1. 访问 Web UI
+2. 导航到 **设置** > **计费配置**
+3. 配置：
+   - **货币**: USD、CNY、EUR 等
+   - **CPU 价格**: 每核心小时的成本
+   - **内存价格**: 每 GB 小时的成本
+   - **GPU 价格**: 每 GPU 小时的成本
+4. 点击 **保存**
+
+### 3. 创建第一个团队
+
+为您的用户创建团队：
+
+1. 导航到 **团队** 页面
+2. 点击 **创建团队**
+3. 填写：
+   - **团队名称**: 例如 "ml-team"
+   - **描述**: 团队用途
+   - **资源配额**:
+     - CPU: 例如 "20" 核心
+     - 内存: 例如 "64Gi"
+     - GPU: 例如 "4"
+   - **初始余额**: 例如 1000.00
+4. 点击 **创建**
+
+## 常见任务
+
+### 管理团队
+
+#### 查看所有团队
+
+```bash
+# 通过 kubectl
+kubectl get tenants
+
+# 通过 API
+curl http://localhost:8080/api/v1/teams
+```
+
+#### 更新团队配额
+
+1. 导航到 **团队** 页面
+2. 点击团队行上的 **编辑**
+3. 修改配额
+4. 点击 **保存**
+
+#### 充值团队余额
+
+1. 导航到 **团队** 页面
+2. 点击团队行上的 **充值**
+3. 输入金额
+4. 添加备注（可选）
+5. 点击 **确认**
+
+### 监控
+
+#### 查看仪表板
+
+访问实时集群指标：
+- 总团队数和项目数
+- 资源利用率
+- 成本趋势
+- 资源消耗最高的团队
+- 余额状态
+
+#### 检查告警
+
+监控低余额和配额告警：
+1. 导航到 **告警** 页面
+2. 查看活动告警
+3. 根据需要采取行动
+
+### 计费配置
+
+#### 更新定价
+
+```bash
+curl -X PUT http://localhost:8080/api/v1/billing/config \
+  -H "Content-Type: application/json" \
+  -d '{
+    "pricing": {
+      "cpu": 0.06,
+      "memory": 0.012,
+      "nvidia.com/gpu": 3.00
+    }
+  }'
+```
+
+#### 配置告警阈值
+
+```json
+{
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## 最佳实践
+
+### 团队命名
+- 使用小写字母、数字和连字符
+- 示例：`ml-team`、`data-science`、`dev-team`
+
+### 配额分配
+- 从保守的配额开始
+- 监控 1-2 周的使用情况
+- 根据实际需求调整
+
+### 余额管理
+- 为关键团队设置自动充值
+- 每周监控余额趋势
+- 及时响应低余额告警
+
+### 安全
+- 在生产环境中启用认证
+- 使用 OIDC/SSO 进行企业部署
+- 定期审计用户权限
+
+## 故障排查
+
+### 团队创建失败
+
+检查 Capsule operator 日志：
+```bash
+kubectl logs -n capsule-system deployment/capsule-controller-manager
+```
+
+### 计费无法工作
+
+验证 OpenCost 连通性（port-forward 会占用当前终端，请在另一个终端中执行 curl）：
+```bash
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+curl http://localhost:9003/healthz
+```
+
+### 高资源使用率
+
+检查资源消耗：
+```bash
+kubectl top pods -n bison-system
+```
+
+## 下一步
+
+- [团队负责人指南](team-leader.md) - 管理项目、监控预算并分配资源
+- [开发者指南](developer.md) - 部署工作负载并监控资源使用
+- [配置](../configuration.md) - 高级配置
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/developer.md b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/developer.md
new file mode 100644
index 0000000..17f9915
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/developer.md
@@ -0,0 +1,187 @@
+---
+sidebar_position: 3
+---
+
+# 开发者指南
+
+本指南面向在团队项目中部署工作负载和消耗资源的开发者。
+
+## 职责
+
+作为开发者，您负责：
+
+- ✅ 在您的项目中部署应用程序
+- ✅ 监控资源使用情况
+- ✅ 保持在配额限制内
+- ✅ 优化资源消耗
+
+## 入门
+
+### 1. 获取 Kubeconfig
+
+向您的团队负责人或管理员请求 kubeconfig。
+
+### 2. 设置上下文
+
+```bash
+# 将上下文设置为您的项目命名空间
+kubectl config set-context --current --namespace=your-project
+
+# 验证
+kubectl config view --minify | grep namespace
+```
+
+### 3. 检查配额
+
+查看您的可用资源：
+```bash
+kubectl describe quota
+```
+
+## 部署工作负载
+
+### 基本 Pod 部署
+
+```yaml
+apiVersion: v1
+kind: Pod
+metadata:
+  name: gpu-training-job
+  namespace: your-project
+spec:
+  containers:
+  - name: trainer
+    image: your-ml-image:latest
+    resources:
+      requests:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+      limits:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+```
+
+### 使用 Deployments
+
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: ml-inference
+  namespace: your-project
+spec:
+  replicas: 2
+  selector:
+    matchLabels:
+      app: ml-inference
+  template:
+    metadata:
+      labels:
+        app: ml-inference
+    spec:
+      containers:
+      - name: inference
+        image: your-inference-image:latest
+        resources:
+          requests:
+            cpu: "2"
+            memory: "8Gi"
+            nvidia.com/gpu: "1"
+```
+
+## 监控使用情况
+
+### 检查 Pod 资源使用情况
+
+```bash
+# 查看资源消耗
+kubectl top pods
+
+# 详细的 pod 信息
+kubectl describe pod <pod-name>
+```
+
+### 查看日志
+
+```bash
+# 流式查看日志
+kubectl logs -f <pod-name>
+
+# 查看之前的日志（如果 pod 重启了）
+kubectl logs --previous <pod-name>
+```
+
+## 最佳实践
+
+### 资源请求和限制
+
+始终指定请求和限制：
+```yaml
+resources:
+  requests:
+    cpu: "2"
+    memory: "8Gi"
+  limits:
+    cpu: "4"
+    memory: "16Gi"
+```
+
+### GPU 使用
+
+- 仅在需要时请求 GPU
+- 将 GPU 用于计算密集型任务
+- 监控 GPU 利用率
+
+### 清理
+
+不再需要时删除资源：
+```bash
+# 删除 pod
+kubectl delete pod <pod-name>
+
+# 删除 deployment
+kubectl delete deployment <deployment-name>
+
+# 清理已完成的 job
+kubectl delete job --field-selector status.successful=1
+```
+
+### 成本优化
+
+- 正确调整资源请求的大小
+- 使用水平 pod 自动扩展
+- 清理空闲资源
+- 在可能的情况下共享 GPU（如果支持）
+
+## 故障排查
+
+### Pod 处于 Pending 状态（配额不足）
+
+如果您的 pod 卡在 `Pending` 状态：
+
+```bash
+kubectl describe pod <pod-name>
+```
+
+查找与配额相关的错误，并减少资源请求或向团队负责人申请更多配额。
+
+### 内存不足 (OOM)
+
+如果 pod 因 OOM 被杀死：
+1. 检查内存使用模式
+2. 增加内存限制
+3. 优化应用程序内存使用
+
+### GPU 不可用
+
+检查各节点可分配的 GPU 数量：
+```bash
+kubectl get nodes -o custom-columns=NAME:.metadata.name,GPU:.status.allocatable."nvidia\.com/gpu"
+```
+
+## 下一步
+
+- [团队负责人指南](team-leader.md) - 了解团队管理
+- [架构](../architecture.md) - 了解平台
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/team-leader.md b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/team-leader.md
new file mode 100644
index 0000000..45fd901
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/current/user-guides/team-leader.md
@@ -0,0 +1,126 @@
+---
+sidebar_position: 2
+---
+
+# 团队负责人指南
+
+本指南面向管理项目、监控预算并在团队内分配资源的团队负责人。
+
+## 职责
+
+作为团队负责人，您负责：
+
+- ✅ 创建和管理项目（命名空间）
+- ✅ 为项目分配配额
+- ✅ 监控团队余额和消耗
+- ✅ 在需要时请求充值
+
+## 入门
+
+### 1. 访问 Bison
+
+使用您的凭据登录 Web UI。
+
+### 2. 查看团队仪表板
+
+您的仪表板显示：
+- 团队余额和状态
+- 资源利用率
+- 活动项目
+- 成本趋势
+
+## 管理项目
+
+### 创建项目
+
+1. 导航到 **项目** 页面
+2. 点击 **创建项目**
+3. 填写：
+   - **项目名称**: 例如 "training-ml-models"
+   - **描述**: 项目用途
+   - **配额**（可选）:
+     - CPU: 例如 "8" 核心
+     - 内存: 例如 "32Gi"
+     - GPU: 例如 "2"
+4. 点击 **创建**
+
+### 列出项目
+
+```bash
+# 通过 kubectl（如果您有访问权限）
+kubectl get namespaces -l capsule.clastix.io/tenant=your-team
+
+# 通过 API
+curl http://localhost:8080/api/v1/teams/your-team/projects
+```
+
+### 删除项目
+
+1. 导航到 **项目** 页面
+2. 点击项目行上的 **删除**
+3. 确认删除
+
+**警告**: 这将删除项目中的所有资源！
+
+## 监控预算
+
+### 检查余额
+
+查看您的当前余额：
+1. 导航到 **团队** 页面
+2. 在状态卡片中查看余额
+
+### 查看使用趋势
+
+分析支出模式：
+1. 导航到 **报告** 页面
+2. 选择时间范围（7 天、30 天、90 天）
+3. 查看：
+   - 按资源类型的成本细分
+   - 每日成本趋势
+   - 每个项目的消耗
+
+### 请求充值
+
+当余额不足时：
+1. 点击 **请求充值** 按钮
+2. 输入请求金额
+3. 添加理由说明
+4. 向管理员提交请求
+
+## 资源管理
+
+### 监控配额使用情况
+
+检查您的配额使用了多少：
+```bash
+kubectl describe quota -n your-project
+```
+
+### 优化成本
+
+减少支出的技巧：
+- **合理调整资源大小**: 不要过度配置 CPU/内存
+- **清理空闲 pod**: 删除未使用的工作负载
+- **使用 spot/可抢占实例**: 在适用的情况下
+- **监控 GPU 利用率**: 确保 GPU 被充分利用
+
+## 最佳实践
+
+### 项目组织
+- 为不同的工作负载创建单独的项目
+- 示例：`ml-training`、`ml-inference`、`data-processing`
+
+### 配额分配
+- 根据项目优先级分配配额
+- 为紧急任务保留缓冲
+
+### 成本意识
+- 每周审查成本
+- 识别并消除浪费
+- 设置成本告警
+
+## 下一步
+
+- [开发者指南](developer.md) - 您团队成员的指南
+- [功能特性](../features.md) - 探索所有 Bison 功能
diff --git a/website/i18n/zh-Hans/docusaurus-plugin-content-docs/version-0.0.1.json b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/version-0.0.1.json
new file mode 100644
index 0000000..7b17ccb
--- /dev/null
+++ b/website/i18n/zh-Hans/docusaurus-plugin-content-docs/version-0.0.1.json
@@ -0,0 +1,14 @@
+{
+  "version.label": {
+    "message": "0.0.1",
+    "description": "The label for version 0.0.1"
+  },
+  "sidebar.tutorialSidebar.category.User Guides": {
+    "message": "用户指南",
+    "description": "The label for category 'User Guides' in sidebar 'tutorialSidebar'"
+  },
+  "sidebar.tutorialSidebar.category.User Guides.link.generated-index.description": {
+    "message": "基于角色的 Bison 使用指南。",
+    "description": "The generated-index page description for category 'User Guides' in sidebar 'tutorialSidebar'"
+  }
+}
diff --git a/website/i18n/zh-Hans/docusaurus-theme-classic/footer.json b/website/i18n/zh-Hans/docusaurus-theme-classic/footer.json
index da63b28..923115b 100644
--- a/website/i18n/zh-Hans/docusaurus-theme-classic/footer.json
+++ b/website/i18n/zh-Hans/docusaurus-theme-classic/footer.json
@@ -1,22 +1,22 @@
 {
   "link.title.Docs": {
-    "message": "Docs",
+    "message": "文档",
     "description": "The title of the footer links column with title=Docs in the footer"
   },
   "link.title.Resources": {
-    "message": "Resources",
+    "message": "资源",
     "description": "The title of the footer links column with title=Resources in the footer"
   },
   "link.title.More": {
-    "message": "More",
+    "message": "更多",
     "description": "The title of the footer links column with title=More in the footer"
   },
   "link.item.label.Getting Started": {
-    "message": "Getting Started",
-    "description": "The label of footer link with label=Getting Started linking to /docs/intro"
+    "message": "快速开始",
+    "description": "The label of footer link with label=Getting Started linking to /docs"
   },
   "link.item.label.Architecture": {
-    "message": "Architecture",
+    "message": "架构",
     "description": "The label of footer link with label=Architecture linking to /docs/architecture"
   },
   "link.item.label.Helm Charts": {
@@ -32,11 +32,11 @@
     "description": "The label of footer link with label=GitHub linking to https://github.com/SuperMarioYL/Bison"
   },
   "link.item.label.Issues": {
-    "message": "Issues",
+    "message": "问题反馈",
     "description": "The label of footer link with label=Issues linking to https://github.com/SuperMarioYL/Bison/issues"
   },
   "copyright": {
-    "message": "Copyright © 2025 Bison Project. Built with Docusaurus.",
+    "message": "Copyright © 2025 Bison 项目。使用 Docusaurus 构建。",
     "description": "The footer copyright"
   }
 }
diff --git a/website/i18n/zh-Hans/docusaurus-theme-classic/navbar.json b/website/i18n/zh-Hans/docusaurus-theme-classic/navbar.json
index 5de3c8a..90c372f 100644
--- a/website/i18n/zh-Hans/docusaurus-theme-classic/navbar.json
+++ b/website/i18n/zh-Hans/docusaurus-theme-classic/navbar.json
@@ -8,7 +8,7 @@
     "description": "The alt text of navbar logo"
   },
   "item.label.Documentation": {
-    "message": "Documentation",
+    "message": "文档",
     "description": "Navbar item with label Documentation"
   },
   "item.label.GitHub": {
diff --git a/website/src/components/ArchitectureDiagram/index.tsx b/website/src/components/ArchitectureDiagram/index.tsx
new file mode 100644
index 0000000..a2aba96
--- /dev/null
+++ b/website/src/components/ArchitectureDiagram/index.tsx
@@ -0,0 +1,160 @@
+import type {ReactNode} from 'react';
+import {translate} from '@docusaurus/Translate';
+import Translate from '@docusaurus/Translate';
+import Heading from '@theme/Heading';
+import styles from './styles.module.css';
+
+interface ArchNode {
+  id: string;
+  label: string;
+  description: string;
+  color: string;
+}
+
+const nodes: ArchNode[] = [
+  {
+    id: 'bison',
+    label: 'Bison',
+    description: translate({
+      id: 'component.architectureDiagram.node.bison',
+      message: 'GPU Billing & Scheduling Platform',
+      description: 'Description for Bison node',
+    }),
+    color: '#0A84FF',
+  },
+  {
+    id: 'capsule',
+    label: 'Capsule',
+    description: translate({
+      id: 'component.architectureDiagram.node.capsule',
+      message: 'Multi-Tenant Management',
+      description: 'Description for Capsule node',
+    }),
+    color: '#5E5CE6',
+  },
+  {
+    id: 'opencost',
+    label: 'OpenCost',
+    description: translate({
+      id: 'component.architectureDiagram.node.opencost',
+      message: 'Cost Tracking & Analytics',
+      description: 'Description for OpenCost node',
+    }),
+    color: '#BF5AF2',
+  },
+  {
+    id: 'k8s',
+    label: 'Kubernetes',
+    description: translate({
+      id: 'component.architectureDiagram.node.k8s',
+      message: 'Container Orchestration',
+      description: 'Description for Kubernetes node',
+    }),
+    color: '#326CE5',
+  },
+  {
+    id: 'prometheus',
+    label: 'Prometheus',
+    description: translate({
+      id: 'component.architectureDiagram.node.prometheus',
+      message: 'Metrics Collection',
+      description: 'Description for Prometheus node',
+    }),
+    color: '#E6522C',
+  },
+];
+
+export default function ArchitectureDiagram(): ReactNode {
+  return (
+    <section className={styles.architectureSection}>
+      <div className="container">
+        <div className="text--center margin-bottom--lg">
+          <Heading as="h2" className={styles.sectionTitle}>
+            <Translate id="component.architectureDiagram.title">
+              Architecture Overview
+            </Translate>
+          </Heading>
+          <p className={styles.sectionSubtitle}>
+            <Translate id="component.architectureDiagram.subtitle">
+              Built on cloud-native technologies for scalability and reliability
+            </Translate>
+          </p>
+        </div>
+
+        <div className={styles.diagramContainer}>
+          <svg viewBox="0 0 800 400" className={styles.diagram}>
+            <defs>
+              <marker
+                id="arrowhead"
+                markerWidth="10"
+                markerHeight="10"
+                refX="9"
+                refY="3"
+                orient="auto">
+                <polygon points="0 0, 10 3, 0 6" fill="#999" />
+              </marker>
+
+              <filter id="glow">
+                <feGaussianBlur stdDeviation="3" result="coloredBlur" />
+                <feMerge>
+                  <feMergeNode in="coloredBlur" />
+                  <feMergeNode in="SourceGraphic" />
+                </feMerge>
+              </filter>
+            </defs>
+
+            {/* Connections */}
+            <g className={styles.connections}>
+              <line x1="400" y1="80" x2="400" y2="140" stroke="#999" strokeWidth="2" markerEnd="url(#arrowhead)" className={styles.connectionLine} />
+              <line x1="400" y1="200" x2="250" y2="260" stroke="#999" strokeWidth="2" markerEnd="url(#arrowhead)" className={styles.connectionLine} />
+              <line x1="400" y1="200" x2="550" y2="260" stroke="#999" strokeWidth="2" markerEnd="url(#arrowhead)" className={styles.connectionLine} />
+              <line x1="250" y1="320" x2="400" y2="320" stroke="#999" strokeWidth="2" markerEnd="url(#arrowhead)" className={styles.connectionLine} />
+              <line x1="550" y1="320" x2="650" y2="320" stroke="#999" strokeWidth="2" markerEnd="url(#arrowhead)" className={styles.connectionLine} />
+            </g>
+
+            {/* Bison */}
+            <g className={styles.node}>
+              <rect x="330" y="40" width="140" height="60" rx="8" fill="#0A84FF" filter="url(#glow)" />
+              <text x="400" y="75" textAnchor="middle" fill="white" fontSize="18" fontWeight="600">Bison</text>
+            </g>
+
+            {/* Capsule */}
+            <g className={styles.node}>
+              <rect x="330" y="160" width="140" height="60" rx="8" fill="#5E5CE6" filter="url(#glow)" />
+              <text x="400" y="195" textAnchor="middle" fill="white" fontSize="18" fontWeight="600">Capsule</text>
+            </g>
+
+            {/* OpenCost */}
+            <g className={styles.node}>
+              <rect x="480" y="280" width="140" height="60" rx="8" fill="#BF5AF2" filter="url(#glow)" />
+              <text x="550" y="315" textAnchor="middle" fill="white" fontSize="18" fontWeight="600">OpenCost</text>
+            </g>
+
+            {/* Kubernetes */}
+            <g className={styles.node}>
+              <rect x="180" y="280" width="140" height="60" rx="8" fill="#326CE5" filter="url(#glow)" />
+              <text x="250" y="315" textAnchor="middle" fill="white" fontSize="18" fontWeight="600">Kubernetes</text>
+            </g>
+
+            {/* Prometheus */}
+            <g className={styles.node}>
+              <rect x="630" y="280" width="140" height="60" rx="8" fill="#E6522C" filter="url(#glow)" />
+              <text x="700" y="315" textAnchor="middle" fill="white" fontSize="18" fontWeight="600">Prometheus</text>
+            </g>
+          </svg>
+
+          <div className={styles.nodeDescriptions}>
+            {nodes.map(node => (
+              <div key={node.id} className={styles.nodeCard} style={{borderColor: node.color}}>
+                <div className={styles.nodeCardTitle} style={{color: node.color}}>
+                  {node.label}
+                </div>
+                <div className={styles.nodeCardDescription}>{node.description}</div>
+              </div>
+            ))}
+          </div>
+        </div>
+      </div>
+    </section>
+  );
+}
diff --git a/website/src/components/ArchitectureDiagram/styles.module.css b/website/src/components/ArchitectureDiagram/styles.module.css
new file mode 100644
index 0000000..074c7ed
--- /dev/null
+++ b/website/src/components/ArchitectureDiagram/styles.module.css
@@ -0,0 +1,183 @@
+.architectureSection {
+  padding: 4rem 0;
+  background: #ffffff;
+}
+
+[data-theme='dark'] .architectureSection {
+  background: #0d0d0d;
+}
+
+.sectionTitle {
+  font-size: 2.5rem;
+  font-weight: 700;
+  margin-bottom: 1rem;
+}
+
+.sectionSubtitle {
+  font-size: 1.125rem;
+  color: #666;
+  max-width: 600px;
+  margin: 0 auto;
+}
+
+[data-theme='dark'] .sectionSubtitle {
+  color: #b3b3b3;
+}
+
+.diagramContainer {
+  margin-top: 3rem;
+}
+
+.diagram {
+  width: 100%;
+  max-width: 800px;
+  height: auto;
+  margin: 0 auto;
+  display: block;
+  margin-bottom: 3rem;
+}
+
+/* Scale each SVG node about its own centre rather than the viewBox origin. */
+.node {
+  cursor: pointer;
+  transform-box: fill-box;
+  transform-origin: center;
+  transition: transform 0.3s ease;
+  animation: nodeAppear 0.6s ease-out backwards;
+}
+
+/* Nodes are children 3-7 of the <svg>, after <defs> and the connections group. */
+.node:nth-child(3) {
+  animation-delay: 0.1s;
+}
+.node:nth-child(4) {
+  animation-delay: 0.2s;
+}
+.node:nth-child(5) {
+  animation-delay: 0.3s;
+}
+.node:nth-child(6) {
+  animation-delay: 0.4s;
+}
+.node:nth-child(7) {
+  animation-delay: 0.5s;
+}
+
+.node:hover {
+  transform: scale(1.05);
+}
+
+.node rect {
+  transition: all 0.3s ease;
+}
+
+.node:hover rect {
+  filter: url(#glow) brightness(1.1);
+}
+
+.connectionLine {
+  stroke-dasharray: 5, 5;
+  animation: dashMove 20s linear infinite;
+}
+
+@keyframes dashMove {
+  to {
+    stroke-dashoffset: -1000;
+  }
+}
+
+@keyframes nodeAppear {
+  from {
+    opacity: 0;
+    transform: scale(0.8);
+  }
+  to {
+    opacity: 1;
+    transform: scale(1);
+  }
+}
+
+.nodeDescriptions {
+  display: grid;
+  grid-template-columns: repeat(auto-fit, minmax(200px, 1fr));
+  gap: 1.5rem;
+  margin-top: 2rem;
+}
+
+.nodeCard {
+  padding: 1.5rem;
+  border-radius: 12px;
+  border-left: 4px solid;
+  background: rgba(0, 0, 0, 0.02);
+  transition: all 0.3s ease;
+  animation: cardSlideIn 0.6s ease-out backwards;
+}
+
+[data-theme='dark'] .nodeCard {
+  background: rgba(255, 255, 255, 0.05);
+}
+
+.nodeCard:nth-child(1) {
+  animation-delay: 0.6s;
+}
+
+.nodeCard:nth-child(2) {
+  animation-delay: 0.7s;
+}
+
+.nodeCard:nth-child(3) {
+  animation-delay: 0.8s;
+}
+
+.nodeCard:nth-child(4) {
+  animation-delay: 0.9s;
+}
+
+.nodeCard:nth-child(5) {
+  animation-delay: 1s;
+}
+
+.nodeCard:hover {
+  transform: translateX(4px);
+  box-shadow: 0 4px 12px rgba(0, 0, 0, 0.1);
+}
+
+.nodeCardTitle {
+  font-size: 1.125rem;
+  font-weight: 600;
+  margin-bottom: 0.5rem;
+}
+
+.nodeCardDescription {
+  font-size: 0.875rem;
+  color: #666;
+}
+
+[data-theme='dark'] .nodeCardDescription {
+  color: #b3b3b3;
+}
+
+@keyframes cardSlideIn {
+  from {
+    opacity: 0;
+    transform: translateX(-20px);
+  }
+  to {
+    opacity: 1;
+    transform: translateX(0);
+  }
+}
+
+@media screen and (max-width: 768px) {
+  .sectionTitle {
+    font-size: 2rem;
+  }
+
+  .diagram {
+    height: 300px;
+  }
+
+  .nodeDescriptions {
+    grid-template-columns: 1fr;
+  }
+}
diff --git a/website/src/components/HomepageFeatures/index.tsx b/website/src/components/HomepageFeatures/index.tsx
index 69b3dd0..06d46a4 100644
--- a/website/src/components/HomepageFeatures/index.tsx
+++ b/website/src/components/HomepageFeatures/index.tsx
@@ -1,90 +1,131 @@
-import type {ReactNode} from 'react';
+import type {ComponentType, ReactNode} from 'react';
 import clsx from 'clsx';
 import Heading from '@theme/Heading';
+import Translate from '@docusaurus/Translate';
+import {
+  ShieldLockIcon,
+  CurrencyDollarIcon,
+  DashboardIcon,
+  RocketIcon,
+  BoltIcon,
+  ShieldCheckIcon,
+  type IconProps,
+} from '../Icons';
 import styles from './styles.module.css';
 
 type FeatureItem = {
-  title: string;
-  Svg?: React.ComponentType<React.ComponentProps<'svg'>>;
-  icon?: string;
+  Icon: ComponentType<IconProps>;
+  color: string;
+  title: ReactNode;
   description: ReactNode;
 };
 
 const FeatureList: FeatureItem[] = [
   {
-    title: '🔐 Multi-Tenant Isolation',
-    icon: '🔐',
+    Icon: ShieldLockIcon,
+    color: '#5E5CE6',
+    title: (
+      <Translate id="homepage.feature.multitenant.title">
+        Multi-Tenant Isolation
+      </Translate>
+    ),
     description: (
-      <>
-        Built on Capsule for true Kubernetes-native multi-tenancy.
-        Each team gets isolated resources with shared or exclusive node pools,
-        eliminating manual quota configuration.
-      </>
+      <Translate id="homepage.feature.multitenant.desc">
+        Built on Capsule for true Kubernetes-native multi-tenancy. Each team gets
+        isolated resources with shared or exclusive node pools, eliminating manual
+        quota configuration.
+      </Translate>
     ),
   },
   {
-    title: '💰 Real-Time Billing',
-    icon: '💰',
+    Icon: CurrencyDollarIcon,
+    color: '#34C759',
+    title: (
+      <Translate id="homepage.feature.billing.title">Real-Time Billing</Translate>
+    ),
     description: (
-      <>
-        Integrated with OpenCost for automatic cost tracking.
-        Per-pod, per-namespace, per-team visibility with customizable pricing
-        for CPU, Memory, and GPU resources.
-      </>
+      <Translate id="homepage.feature.billing.desc">
+        Integrated with OpenCost for automatic cost tracking. Per-pod, per-namespace,
+        per-team visibility with customizable pricing for CPU, Memory, and GPU
+        resources.
+      </Translate>
     ),
   },
   {
-    title: '📊 Unified Dashboard',
-    icon: '📊',
+    Icon: DashboardIcon,
+    color: '#0A84FF',
+    title: (
+      <Translate id="homepage.feature.dashboard.title">Unified Dashboard</Translate>
+    ),
     description: (
-      <>
-        Single pane of glass for admins, team leaders, and finance teams.
-        Real-time balance monitoring, alerts, auto-suspension,
-        and comprehensive usage reports.
-      </>
+      <Translate id="homepage.feature.dashboard.desc">
+        Single pane of glass for admins, team leaders, and finance teams. Real-time
+        balance monitoring, alerts, auto-suspension, and comprehensive usage reports.
+      </Translate>
     ),
   },
   {
-    title: '🚀 Deploy in Minutes',
-    icon: '🚀',
+    Icon: RocketIcon,
+    color: '#BF5AF2',
+    title: (
+      <Translate id="homepage.feature.deploy.title">Deploy in Minutes</Translate>
+    ),
     description: (
-      <>
-        Zero external dependencies - all data stored in Kubernetes ConfigMaps.
-        Install with a single Helm command and get complete GPU resource
-        management in under 30 minutes.
-      </>
+      <Translate id="homepage.feature.deploy.desc">
+        Zero external dependencies — all data stored in Kubernetes ConfigMaps. Install
+        with a single Helm command and get complete GPU resource management in under 30
+        minutes.
+      </Translate>
     ),
   },
   {
-    title: '⚡ Auto-Deduction & Alerts',
-    icon: '⚡',
+    Icon: BoltIcon,
+    color: '#FF9F0A',
+    title: (
+      <Translate id="homepage.feature.alerts.title">
+        Auto-Deduction &amp; Alerts
+      </Translate>
+    ),
     description: (
-      <>
-        Automated billing with prepaid balances and real-time deduction.
-        Multi-channel alerts (Webhook, DingTalk, WeChat) with configurable
-        thresholds and auto-suspension.
-      </>
+      <Translate id="homepage.feature.alerts.desc">
+        Automated billing with prepaid balances and real-time deduction. Multi-channel
+        alerts (Webhook, DingTalk, WeChat) with configurable thresholds and
+        auto-suspension.
+      </Translate>
     ),
   },
   {
-    title: '🎯 Production Ready',
-    icon: '🎯',
+    Icon: ShieldCheckIcon,
+    color: '#0FB5BA',
+    title: (
+      <Translate id="homepage.feature.production.title">Production Ready</Translate>
+    ),
     description: (
-      <>
-        Cloud-native architecture with horizontal scaling, RBAC integration,
-        and comprehensive audit logging. Support for multi-platform
-        Docker images and enterprise SSO.
-      </>
+      <Translate id="homepage.feature.production.desc">
+        Cloud-native architecture with horizontal scaling, RBAC integration, and
+        comprehensive audit logging. Multi-platform Docker images and enterprise SSO
+        support.
+      </Translate>
     ),
   },
 ];
 
-function Feature({title, Svg, icon, description}: FeatureItem) {
+function Feature({Icon, color, title, description}: FeatureItem): ReactNode {
   return (
-    <div className={clsx('col col--4')}>
-      <div className="text--center padding-horiz--md">
-        <Heading as="h3">{title}</Heading>
-        <p>{description}</p>
+    <div className={clsx('col col--4')} style={{marginBottom: '2rem'}}>
+      <div className={styles.featureCard}>
+        <div
+          className={styles.featureIcon}
+          style={{
+            background: `linear-gradient(135deg, ${color}, ${color}cc)`,
+            boxShadow: `0 6px 16px ${color}40`,
+          }}>
+          <Icon size={28} stroke="#fff" />
+        </div>
+        <Heading as="h3" className={styles.featureTitle}>
+          {title}
+        </Heading>
+        <p className={styles.featureDescription}>{description}</p>
       </div>
     </div>
   );
@@ -94,6 +135,18 @@ export default function HomepageFeatures(): ReactNode {
   return (
     <section className={styles.features}>
       <div className="container">
+        <div className="text--center margin-bottom--lg">
+          <Heading as="h2" className={styles.sectionTitle}>
+            <Translate id="homepage.features.title">
+              Everything you need to run GPU clusters
+            </Translate>
+          </Heading>
+          <p className={styles.sectionSubtitle}>
+            <Translate id="homepage.features.subtitle">
+              Multi-tenancy, metering and billing — built into one cloud-native platform
+            </Translate>
+          </p>
+        </div>
         <div className="row">
           {FeatureList.map((props, idx) => (
             <Feature key={idx} {...props} />
diff --git a/website/src/components/HomepageFeatures/styles.module.css b/website/src/components/HomepageFeatures/styles.module.css
index b248eb2..86ff32b 100644
--- a/website/src/components/HomepageFeatures/styles.module.css
+++ b/website/src/components/HomepageFeatures/styles.module.css
@@ -1,11 +1,145 @@
 .features {
   display: flex;
   align-items: center;
-  padding: 2rem 0;
+  padding: 4rem 0;
   width: 100%;
+  background: linear-gradient(180deg, #f8f9fa 0%, #ffffff 100%);
 }
 
-.featureSvg {
-  height: 200px;
-  width: 200px;
+[data-theme='dark'] .features {
+  background: linear-gradient(180deg, #1a1a1a 0%, #0d0d0d 100%);
+}
+
+.sectionTitle {
+  font-size: 2.2rem;
+  font-weight: 700;
+  margin-bottom: 0.6rem;
+}
+
+.sectionSubtitle {
+  color: #86868b;
+  font-size: 1.1rem;
+  max-width: 640px;
+  margin: 0 auto;
+}
+
+[data-theme='dark'] .sectionSubtitle {
+  color: #98989d;
+}
+
+.featureCard {
+  padding: 2rem;
+  border-radius: 16px;
+  background: rgba(255, 255, 255, 0.9);
+  backdrop-filter: blur(10px);
+  box-shadow: 0 4px 6px rgba(0, 0, 0, 0.05);
+  transition: all 0.4s cubic-bezier(0.4, 0, 0.2, 1);
+  border: 1px solid rgba(0, 0, 0, 0.05);
+  height: 100%;
+  position: relative;
+  overflow: hidden;
+}
+
+[data-theme='dark'] .featureCard {
+  background: rgba(30, 30, 30, 0.8);
+  border: 1px solid rgba(255, 255, 255, 0.1);
+}
+
+.featureCard::before {
+  content: '';
+  position: absolute;
+  top: 0;
+  left: 0;
+  right: 0;
+  height: 3px;
+  background: linear-gradient(90deg, #0A84FF, #5E5CE6, #BF5AF2);
+  transform: scaleX(0);
+  transition: transform 0.4s ease;
+}
+
+.featureCard:hover::before {
+  transform: scaleX(1);
+}
+
+.featureCard:hover {
+  transform: translateY(-8px) scale(1.02);
+  box-shadow:
+    0 12px 24px rgba(10, 132, 255, 0.15),
+    0 0 0 1px rgba(10, 132, 255, 0.1);
+}
+
+.featureIcon {
+  width: 56px;
+  height: 56px;
+  border-radius: 14px;
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  transition: transform 0.4s cubic-bezier(0.4, 0, 0.2, 1);
+  margin-bottom: 1.25rem;
+}
+
+.featureCard:hover .featureIcon {
+  transform: scale(1.08) rotate(-3deg);
+}
+
+.featureTitle {
+  margin-bottom: 0.75rem;
+  font-weight: 600;
+  font-size: 1.2rem;
+  color: #1a1a1a;
+}
+
+[data-theme='dark'] .featureTitle {
+  color: #ffffff;
+}
+
+.featureDescription {
+  color: #666;
+  line-height: 1.6;
+}
+
+[data-theme='dark'] .featureDescription {
+  color: #b3b3b3;
+}
+
+/* Entrance animation. `backwards` shows the hidden start frame during the delay
+   but releases `transform` once finished, so the :hover lift is not overridden. */
+.featureCard {
+  animation: fadeInUp 0.6s ease-out backwards;
+}
+
+:global(.col):nth-child(1) > .featureCard {
+  animation-delay: 0.1s; /* keyed on the column: each card is an only child */
+}
+
+:global(.col):nth-child(2) > .featureCard {
+  animation-delay: 0.2s;
+}
+
+:global(.col):nth-child(3) > .featureCard {
+  animation-delay: 0.3s;
+}
+
+:global(.col):nth-child(4) > .featureCard {
+  animation-delay: 0.4s;
+}
+
+:global(.col):nth-child(5) > .featureCard {
+  animation-delay: 0.5s;
+}
+
+:global(.col):nth-child(6) > .featureCard {
+  animation-delay: 0.6s;
+}
+
+@keyframes fadeInUp {
+  from {
+    opacity: 0;
+    transform: translateY(30px);
+  }
+  to {
+    opacity: 1;
+    transform: translateY(0);
+  }
 }
diff --git a/website/src/components/Icons/index.tsx b/website/src/components/Icons/index.tsx
new file mode 100644
index 0000000..1e9ce3b
--- /dev/null
+++ b/website/src/components/Icons/index.tsx
@@ -0,0 +1,137 @@
+import type {ReactNode, SVGProps} from 'react';
+
+/**
+ * Tabler-style line icons (24x24, stroke = currentColor, no emoji).
+ * Project standard: use line icons instead of emoji for UI decoration.
+ * https://tabler.io/icons — geometry kept faithful to the Tabler aesthetic.
+ */
+
+export type IconProps = SVGProps<SVGSVGElement> & {size?: number};
+
+function Icon({
+  size = 24,
+  children,
+  ...props
+}: IconProps & {children: ReactNode}): ReactNode {
+  return (
+    <svg
+      xmlns="http://www.w3.org/2000/svg"
+      width={size}
+      height={size}
+      viewBox="0 0 24 24"
+      fill="none"
+      stroke="currentColor"
+      strokeWidth={1.75}
+      strokeLinecap="round"
+      strokeLinejoin="round"
+      aria-hidden="true"
+      focusable="false"
+      {...props}>
+      {children}
+    </svg>
+  );
+}
+
+/* ---------------- Feature icons ---------------- */
+
+export const ShieldLockIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <path d="M12 3l7 3v5c0 4 -3 7 -7 8c-4 -1 -7 -4 -7 -8v-5l7 -3z" />
+    <circle cx="12" cy="11" r="1.4" />
+    <path d="M12 12.4v2.6" />
+  </Icon>
+);
+
+export const CurrencyDollarIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <circle cx="12" cy="12" r="9" />
+    <path d="M14.8 9.3a3.2 2.8 0 0 0 -2.8 -1.3h-1a2.4 2.4 0 0 0 0 4.8h1a2.4 2.4 0 0 1 0 4.8h-1a3.2 2.8 0 0 1 -2.8 -1.3" />
+    <path d="M12 6v12" />
+  </Icon>
+);
+
+export const DashboardIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <rect x="4" y="4" width="6" height="8" rx="1.2" />
+    <rect x="4" y="15" width="6" height="5" rx="1.2" />
+    <rect x="14" y="12" width="6" height="8" rx="1.2" />
+    <rect x="14" y="4" width="6" height="5" rx="1.2" />
+  </Icon>
+);
+
+export const RocketIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <path d="M4 13a8 8 0 0 1 7 7a6 6 0 0 0 3 -5a9 9 0 0 0 6 -8a3 3 0 0 0 -3 -3a9 9 0 0 0 -8 6a6 6 0 0 0 -5 3z" />
+    <path d="M7 14a6 6 0 0 0 -3 6a6 6 0 0 0 6 -3" />
+    <circle cx="15" cy="9" r="1.2" />
+  </Icon>
+);
+
+export const BoltIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <path d="M13 3l0 7l6 0l-8 11l0 -7l-6 0l8 -11z" />
+  </Icon>
+);
+
+export const ShieldCheckIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <path d="M12 3l7 3v5c0 4 -3 7 -7 8c-4 -1 -7 -4 -7 -8v-5l7 -3z" />
+    <path d="M9 12l2 2l4 -4" />
+  </Icon>
+);
+
+/* ---------------- Use-case icons ---------------- */
+
+export const CpuIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <rect x="5" y="5" width="14" height="14" rx="2" />
+    <rect x="9" y="9" width="6" height="6" rx="1" />
+    <path d="M9 3v2M15 3v2M9 19v2M15 19v2M3 9h2M3 15h2M19 9h2M19 15h2" />
+  </Icon>
+);
+
+export const BuildingIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <path d="M3 21h18" />
+    <path d="M5 21v-15a1 1 0 0 1 1 -1h8a1 1 0 0 1 1 1v15" />
+    <path d="M15 21v-9a1 1 0 0 1 1 -1h2a1 1 0 0 1 1 1v9" />
+    <path d="M8 8h2M8 12h2M8 16h2" />
+  </Icon>
+);
+
+export const ReportMoneyIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <path d="M14 3v4a1 1 0 0 0 1 1h4" />
+    <path d="M17 21h-10a2 2 0 0 1 -2 -2v-14a2 2 0 0 1 2 -2h7l5 5v11a2 2 0 0 1 -2 2z" />
+    <path d="M14 14a2 1.6 0 0 0 -2 -1h-.5a1.4 1.4 0 0 0 0 2.6h1a1.4 1.4 0 0 1 0 2.6h-.5a2 1.6 0 0 1 -2 -1" />
+    <path d="M12 11.4v.6M12 18v.6" />
+  </Icon>
+);
+
+/* ---------------- Status / utility icons ---------------- */
+
+export const CheckCircleIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <circle cx="12" cy="12" r="9" />
+    <path d="M9 12l2 2l4 -4" />
+  </Icon>
+);
+
+export const XCircleIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <circle cx="12" cy="12" r="9" />
+    <path d="M10 10l4 4M14 10l-4 4" />
+  </Icon>
+);
+
+export const ArrowRightIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <path d="M5 12h14M13 18l6 -6l-6 -6" />
+  </Icon>
+);
+
+export const GithubIcon = (p: IconProps): ReactNode => (
+  <Icon {...p}>
+    <path d="M9 19c-4.3 1.4 -4.3 -2.5 -6 -3m12 5v-3.5c0 -1 .1 -1.4 -.5 -2c2.8 -.3 5.5 -1.4 5.5 -6a4.6 4.6 0 0 0 -1.3 -3.2a4.2 4.2 0 0 0 -.1 -3.2s-1.1 -.3 -3.5 1.3a12.3 12.3 0 0 0 -6.2 0c-2.4 -1.6 -3.5 -1.3 -3.5 -1.3a4.2 4.2 0 0 0 -.1 3.2a4.6 4.6 0 0 0 -1.3 3.2c0 4.6 2.7 5.7 5.5 6c-.6 .6 -.6 1.2 -.5 2v3.5" />
+  </Icon>
+);
diff --git a/website/src/components/ParticleBackground/index.tsx b/website/src/components/ParticleBackground/index.tsx
new file mode 100644
index 0000000..e582180
--- /dev/null
+++ b/website/src/components/ParticleBackground/index.tsx
@@ -0,0 +1,134 @@
+import {useEffect, useRef} from 'react';
+import type {ReactNode} from 'react';
+import styles from './styles.module.css';
+
+interface Particle {
+  x: number;
+  y: number;
+  vx: number;
+  vy: number;
+  size: number;
+  opacity: number;
+}
+
+export default function ParticleBackground(): ReactNode {
+  const canvasRef = useRef<HTMLCanvasElement>(null);
+
+  useEffect(() => {
+    const canvas = canvasRef.current;
+    if (!canvas) return;
+
+    const ctx = canvas.getContext('2d');
+    if (!ctx) return;
+
+    // Set canvas size
+    const resizeCanvas = () => {
+      canvas.width = window.innerWidth;
+      canvas.height = window.innerHeight;
+    };
+    resizeCanvas();
+    window.addEventListener('resize', resizeCanvas);
+
+    // Particle settings - fewer particles on mobile
+    const isMobile = window.innerWidth < 768;
+    const particleCount = isMobile ? 30 : 80;
+    const particles: Particle[] = [];
+
+    // Initialize particles
+    for (let i = 0; i < particleCount; i++) {
+      particles.push({
+        x: Math.random() * canvas.width,
+        y: Math.random() * canvas.height,
+        vx: (Math.random() - 0.5) * 0.5,
+        vy: (Math.random() - 0.5) * 0.5,
+        size: Math.random() * 2 + 1,
+        opacity: Math.random() * 0.5 + 0.2,
+      });
+    }
+
+    // Draw a single frame (positions are advanced by the caller when animating).
+    const draw = () => {
+      ctx.clearRect(0, 0, canvas.width, canvas.height);
+
+      particles.forEach((particle, i) => {
+        ctx.beginPath();
+        ctx.arc(particle.x, particle.y, particle.size, 0, Math.PI * 2);
+        ctx.fillStyle = `rgba(255, 255, 255, ${particle.opacity})`;
+        ctx.fill();
+
+        // Draw connections
+        particles.slice(i + 1).forEach(otherParticle => {
+          const dx = particle.x - otherParticle.x;
+          const dy = particle.y - otherParticle.y;
+          const distance = Math.sqrt(dx * dx + dy * dy);
+
+          if (distance < 120) {
+            ctx.beginPath();
+            ctx.moveTo(particle.x, particle.y);
+            ctx.lineTo(otherParticle.x, otherParticle.y);
+            const opacity = (1 - distance / 120) * 0.15;
+            ctx.strokeStyle = `rgba(255, 255, 255, ${opacity})`;
+            ctx.lineWidth = 0.5;
+            ctx.stroke();
+          }
+        });
+      });
+    };
+
+    // Reduced motion: one static frame, no loop. Resizing clears a canvas, so redraw on resize.
+    if (window.matchMedia('(prefers-reduced-motion: reduce)').matches) {
+      draw();
+      window.addEventListener('resize', draw);
+      return () => [resizeCanvas, draw].forEach(fn => window.removeEventListener('resize', fn));
+    }
+
+    // Animation loop
+    let animationFrameId = 0;
+    const animate = () => {
+      particles.forEach(particle => {
+        particle.x += particle.vx;
+        particle.y += particle.vy;
+        if (particle.x < 0) particle.x = canvas.width;
+        if (particle.x > canvas.width) particle.x = 0;
+        if (particle.y < 0) particle.y = canvas.height;
+        if (particle.y > canvas.height) particle.y = 0;
+      });
+      draw();
+      animationFrameId = requestAnimationFrame(animate);
+    };
+
+    // Pause the rAF loop while the hero is scrolled off-screen to save CPU/battery.
+    let running = false;
+    const start = () => {
+      if (!running) {
+        running = true;
+        animationFrameId = requestAnimationFrame(animate);
+      }
+    };
+    const stop = () => {
+      running = false;
+      cancelAnimationFrame(animationFrameId);
+    };
+
+    const observer = new IntersectionObserver(
+      entries => {
+        if (entries[0].isIntersecting) {
+          start();
+        } else {
+          stop();
+        }
+      },
+      {threshold: 0},
+    );
+    observer.observe(canvas);
+    start();
+
+    return () => {
+      window.removeEventListener('resize', resizeCanvas);
+      observer.disconnect();
+      stop();
+    };
+  }, []);
+
+  return <canvas ref={canvasRef} className={styles.particleCanvas} />;
+}
diff --git a/website/src/components/ParticleBackground/styles.module.css b/website/src/components/ParticleBackground/styles.module.css
new file mode 100644
index 0000000..13d4b89
--- /dev/null
+++ b/website/src/components/ParticleBackground/styles.module.css
@@ -0,0 +1,9 @@
+.particleCanvas {
+  position: absolute;
+  top: 0;
+  left: 0;
+  width: 100%;
+  height: 100%;
+  pointer-events: none;
+  z-index: 1;
+}
diff --git a/website/src/components/ProductShowcase/index.tsx b/website/src/components/ProductShowcase/index.tsx
new file mode 100644
index 0000000..8e05955
--- /dev/null
+++ b/website/src/components/ProductShowcase/index.tsx
@@ -0,0 +1,597 @@
+import {useState, type ReactNode} from 'react';
+import {translate} from '@docusaurus/Translate';
+import Translate from '@docusaurus/Translate';
+import Heading from '@theme/Heading';
+import {
+  DashboardIcon,
+  CpuIcon,
+  ReportMoneyIcon,
+  CurrencyDollarIcon,
+} from '../Icons';
+import styles from './styles.module.css';
+
+/* ------------------------------------------------------------------ */
+/*  Reusable SVG primitives — all panels share one "app chrome"        */
+/* ------------------------------------------------------------------ */
+
+const C = { // colour palette shared by every mock panel below
+  sidebar: '#f7f8fa',
+  sidebarActive: '#eaf2ff',
+  card: '#ffffff',
+  border: '#ececf0',
+  bg: '#f4f5f7',
+  ink: '#1d1d1f',
+  muted: '#86868b',
+  blue: '#0A84FF',
+  green: '#34C759',
+  indigo: '#5E5CE6',
+  purple: '#BF5AF2',
+  orange: '#FF9F0A',
+  gold: '#FFB300',
+  silver: '#B0B5BD',
+  bronze: '#CD7F32',
+};
+
+const NAV = [ // sidebar menu labels, drawn top to bottom by AppFrame
+  '资源总览',
+  '集群节点',
+  '团队管理',
+  '项目管理',
+  '用户管理',
+  '报表中心',
+  '审计日志',
+  '系统设置',
+];
+
+// Metric tile: a rounded card with a coloured accent bar on its left edge,
+// a small muted label and a bold value beneath it.
+function StatCard(props: {
+  x: number;
+  y: number;
+  w: number;
+  label: string;
+  value: string;
+  accent: string;
+}): ReactNode {
+  const {x, y, w, label, value, accent} = props;
+  const height = 68;
+  const textX = x + 18; // label and value share one left edge
+  return (
+    <g>
+      {/* card body */}
+      <rect x={x} y={y} width={w} height={height} rx={10} fill={C.card} stroke={C.border} />
+      {/* accent bar */}
+      <rect x={x} y={y} width={4} height={height} rx={2} fill={accent} />
+      <text x={textX} y={y + 26} fontSize={11} fill={C.muted}>
+        {label}
+      </text>
+      <text x={textX} y={y + 50} fontSize={20} fontWeight={700} fill={C.ink}>
+        {value}
+      </text>
+    </g>
+  );
+}
+
+function Donut({cx, cy, r}: {cx: number; cy: number; r: number}): ReactNode {
+  // Ring shares: shared pool 55%, exclusive 33%, unmanaged 12%.
+  const shares = [
+    {fraction: 0.55, stroke: C.blue},
+    {fraction: 0.33, stroke: C.green},
+    {fraction: 0.12, stroke: '#d9dde3'},
+  ];
+  const circumference = 2 * Math.PI * r;
+  // Arc length drawn so far. Each arc is one dash whose offset pushes it to
+  // start where the previous arc ended.
+  let drawn = 0;
+  const arcs = shares.map(({fraction, stroke}, index) => {
+    const arcLength = fraction * circumference;
+    const startOffset = -drawn;
+    drawn += arcLength;
+    return (
+      <circle
+        key={index}
+        cx={cx}
+        cy={cy}
+        r={r}
+        fill="none"
+        stroke={stroke}
+        strokeWidth={16}
+        strokeDasharray={`${arcLength} ${circumference - arcLength}`}
+        strokeDashoffset={startOffset}
+      />
+    );
+  });
+  // The whole ring is rotated -90 degrees about its centre.
+  return <g transform={`rotate(-90 ${cx} ${cy})`}>{arcs}</g>;
+}
+
+// Area-filled line chart of `pts`, scaled so the smallest value sits on the
+// bottom edge of the (x, y, w, h) box and the largest on the top edge.
+function Sparkline({
+  x,
+  y,
+  w,
+  h,
+  pts,
+  color,
+}: {
+  x: number;
+  y: number;
+  w: number;
+  h: number;
+  pts: number[];
+  color: string;
+}): ReactNode {
+  // Nothing to plot; Math.min/max of an empty list would yield ±Infinity.
+  if (pts.length === 0) return null;
+  const min = Math.min(...pts);
+  const span = Math.max(...pts) - min || 1; // flat series: avoid dividing by 0
+  const coords = pts.map((p, i) => [
+    x + (i / Math.max(pts.length - 1, 1)) * w, // a lone point sits at x, not NaN
+    y + h - ((p - min) / span) * h, // SVG y grows downward, so invert
+  ]);
+  const line = coords.map((c, i) => `${i === 0 ? 'M' : 'L'}${c[0]},${c[1]}`).join(' ');
+  const area = `${line} L${x + w},${y + h} L${x},${y + h} Z`;
+  return (
+    <g>
+      <path d={area} fill={`${color}22`} />
+      <path d={line} fill="none" stroke={color} strokeWidth={2} strokeLinecap="round" strokeLinejoin="round" />
+      {coords.map((c, i) => <circle key={i} cx={c[0]} cy={c[1]} r={2.6} fill={color} />)}
+    </g>
+  );
+}
+
+// Horizontal meter: a grey 6-unit-tall track of width `w` with a `color`
+// fill covering `pct` percent of it.
+function ProgressBar(props: {
+  x: number;
+  y: number;
+  w: number;
+  pct: number;
+  color: string;
+}): ReactNode {
+  const {x, y, w, pct, color} = props;
+  // Clamp so an out-of-range value can neither overflow the track nor
+  // produce a negative (invalid) rect width.
+  const filled = (w * Math.min(Math.max(pct, 0), 100)) / 100;
+  return (
+    <g>
+      <rect x={x} y={y} width={w} height={6} rx={3} fill="#eef0f3" />
+      <rect x={x} y={y} width={filled} height={6} rx={3} fill={color} />
+    </g>
+  );
+}
+
+// Rounded label chip: `label` in `color`, centred on a faint tint of the
+// same colour.
+function Tag(props: {
+  x: number;
+  y: number;
+  w: number;
+  label: string;
+  color: string;
+}): ReactNode {
+  const {x, y, w, label, color} = props;
+  // Appending "1f" acts as an alpha byte — assumes callers pass #rrggbb; TODO confirm.
+  const tint = `${color}1f`;
+  const centreX = x + w / 2;
+  return (
+    <g>
+      <rect x={x} y={y} width={w} height={18} rx={4} fill={tint} />
+      <text x={centreX} y={y + 13} fontSize={10} fill={color} textAnchor="middle" fontWeight={600}>
+        {label}
+      </text>
+    </g>
+  );
+}
+
+/* ------------------------------------------------------------------ */
+/*  Per-screen content (drawn inside the content viewport 196..940)    */
+/* ------------------------------------------------------------------ */
+
+function DashboardPanel(): ReactNode { // Resource-overview screen drawn from hard-coded sample values.
+  return (
+    <g>
+      <text x={214} y={84} fontSize={17} fontWeight={700} fill={C.ink}>
+        资源总览
+      </text>
+      <StatCard x={214} y={100} w={170} label="集群节点" value="8 个" accent={C.blue} />
+      <StatCard x={398} y={100} w={170} label="团队数量" value="5 个" accent={C.indigo} />
+      <StatCard x={582} y={100} w={170} label="项目数量" value="12 个" accent={C.purple} />
+      <StatCard x={766} y={100} w={158} label="费用统计" value="已启用" accent={C.green} />
+
+      {/* Node status card: donut plus a legend, one [label, colour, count] row each */}
+      <rect x={214} y={184} width={344} height={150} rx={10} fill={C.card} stroke={C.border} />
+      <text x={232} y={208} fontSize={12} fontWeight={600} fill={C.ink}>
+        节点状态分布
+      </text>
+      <Donut cx={282} cy={272} r={34} />
+      {[
+        ['共享池', C.blue, '4'],
+        ['独占', C.green, '3'],
+        ['未管理', '#d9dde3', '1'],
+      ].map((row, i) => (
+        <g key={i}>
+          <rect x={360} y={236 + i * 26} width={9} height={9} rx={2} fill={row[1]} />
+          <text x={378} y={245 + i * 26} fontSize={11} fill={C.ink}>
+            {row[0]}
+          </text>
+          <text x={528} y={245 + i * 26} fontSize={11} fill={C.muted} textAnchor="end">
+            {row[2]}
+          </text>
+        </g>
+      ))}
+
+      {/* Cost trend card: seven sample points drawn as a sparkline */}
+      <rect x={572} y={184} width={352} height={150} rx={10} fill={C.card} stroke={C.border} />
+      <text x={590} y={208} fontSize={12} fontWeight={600} fill={C.ink}>
+        费用趋势 (7 天)
+      </text>
+      <Sparkline x={590} y={224} w={316} h={86} pts={[12, 14, 11, 18, 16, 24, 30]} color={C.blue} />
+
+      {/* Cluster resource card: one [name, percent, colour] usage bar per row */}
+      <rect x={214} y={350} width={500} height={150} rx={10} fill={C.card} stroke={C.border} />
+      <text x={232} y={374} fontSize={12} fontWeight={600} fill={C.ink}>
+        集群资源
+      </text>
+      {[
+        ['CPU', 62, C.blue],
+        ['Memory', 48, C.green],
+        ['GPU (nvidia)', 81, C.purple],
+        ['Storage', 35, C.indigo],
+      ].map((row, i) => (
+        <g key={i}>
+          <text x={232} y={406 + i * 24} fontSize={11} fill={C.ink}>
+            {row[0] as string}
+          </text>
+          <ProgressBar x={360} y={398 + i * 24} w={260} pct={row[1] as number} color={row[2] as string} />
+          <text x={636} y={406 + i * 24} fontSize={11} fill={C.muted} textAnchor="end">
+            {row[1]}%
+          </text>
+        </g>
+      ))}
+
+      {/* Top consumers card: [name, cost, badge colour] rows; the badge shows rank i + 1 */}
+      <rect x={728} y={350} width={196} height={150} rx={10} fill={C.card} stroke={C.border} />
+      <text x={746} y={374} fontSize={12} fontWeight={600} fill={C.ink}>
+        资源消耗 Top 5
+      </text>
+      {[
+        ['vision-lab', '$42.10', C.gold],
+        ['nlp-team', '$31.80', C.silver],
+        ['rec-sys', '$22.40', C.bronze],
+        ['infra', '$9.10', '#d9dde3'],
+      ].map((row, i) => (
+        <g key={i}>
+          <circle cx={752} cy={398 + i * 24} r={7} fill={row[2] as string} />
+          <text x={752} y={401 + i * 24} fontSize={8} fill="#fff" textAnchor="middle" fontWeight={700}>
+            {i + 1}
+          </text>
+          <text x={768} y={402 + i * 24} fontSize={10.5} fill={C.ink}>
+            {row[0]}
+          </text>
+          <text x={908} y={402 + i * 24} fontSize={10.5} fill={C.blue} textAnchor="end" fontWeight={600}>
+            {row[1]}
+          </text>
+        </g>
+      ))}
+    </g>
+  );
+}
+
+function ClusterPanel(): ReactNode { // Cluster-nodes screen: three stat cards above a table of hard-coded rows.
+  const rows = [ // [node name, architecture, status label, status colour, GPU usage %, GPU devices]
+    ['gpu-node-01', 'amd64', '独占', C.green, 78, 'A100 × 8'],
+    ['gpu-node-02', 'amd64', '独占', C.green, 64, 'A100 × 8'],
+    ['gpu-node-03', 'amd64', '共享池', C.blue, 51, 'L40S × 4'],
+    ['cpu-node-01', 'arm64', '共享池', C.blue, 33, '—'],
+    ['cpu-node-02', 'amd64', '未管理', '#9aa0a6', 12, '—'],
+  ];
+  return (
+    <g>
+      <text x={214} y={84} fontSize={17} fontWeight={700} fill={C.ink}>
+        集群节点
+      </text>
+      <StatCard x={214} y={100} w={228} label="节点总数" value="8 个" accent={C.blue} />
+      <StatCard x={456} y={100} w={228} label="GPU 卡总数" value="28 张" accent={C.purple} />
+      <StatCard x={698} y={100} w={226} label="可分配 GPU" value="11 张" accent={C.green} />
+
+      <rect x={214} y={184} width={710} height={316} rx={10} fill={C.card} stroke={C.border} />
+      {/* column headers, each placed at its own x anchor */}
+      {['节点名称', '架构', '状态', 'GPU 使用率', 'GPU 设备'].map((h, i) => (
+        <text key={i} x={[232, 392, 470, 580, 800][i]} y={212} fontSize={11} fill={C.muted} fontWeight={600}>
+          {h}
+        </text>
+      ))}
+      <line x1={214} y1={224} x2={924} y2={224} stroke={C.border} />
+      {rows.map((r, i) => {
+        const y = 248 + i * 48; // text baseline of row i; rows are 48 units apart
+        return (
+          <g key={i}>
+            <circle cx={238} cy={y - 4} r={4} fill={C.green} />
+            <text x={252} y={y} fontSize={11.5} fill={C.ink} fontWeight={600}>
+              {r[0] as string}
+            </text>
+            <text x={392} y={y} fontSize={11} fill={C.muted}>
+              {r[1] as string}
+            </text>
+            <Tag x={470} y={y - 13} w={54} label={r[2] as string} color={r[3] as string} />
+            <ProgressBar x={580} y={y - 8} w={150} pct={r[4] as number} color={C.blue} />
+            <text x={740} y={y} fontSize={10.5} fill={C.muted}>
+              {r[4]}%
+            </text>
+            <text x={800} y={y} fontSize={11} fill={C.ink}>
+              {r[5] as string}
+            </text>
+            {i < rows.length - 1 && <line x1={232} y1={y + 22} x2={906} y2={y + 22} stroke="#f3f4f6" />}
+          </g>
+        );
+      })}
+    </g>
+  );
+}
+
+function ReportPanel(): ReactNode { // Report-centre screen: stat cards, a bar chart and a ranking table of sample data.
+  const bars = [ // [team, percent of the 320-unit track that is filled, colour]
+    ['vision-lab', 92, C.blue],
+    ['nlp-team', 70, C.indigo],
+    ['rec-sys', 54, C.purple],
+    ['infra', 28, C.green],
+    ['platform', 18, C.orange],
+  ];
+  const rank = [ // [team, amount, share, rank-marker colour]
+    ['vision-lab', '¥4210.00', '38.2%', C.gold],
+    ['nlp-team', '¥3180.50', '28.9%', C.silver],
+    ['rec-sys', '¥2240.10', '20.3%', C.bronze],
+  ];
+  return (
+    <g>
+      <text x={214} y={84} fontSize={17} fontWeight={700} fill={C.ink}>
+        报表中心
+      </text>
+      <StatCard x={214} y={100} w={228} label="总消费" value="¥11030" accent={C.blue} />
+      <StatCard x={456} y={100} w={228} label="团队数" value="5" accent={C.indigo} />
+      <StatCard x={698} y={100} w={226} label="统计周期" value="30d" accent={C.green} />
+
+      {/* Bar chart card: one labelled horizontal bar per entry of `bars` */}
+      <rect x={214} y={184} width={356} height={316} rx={10} fill={C.card} stroke={C.border} />
+      <text x={232} y={208} fontSize={12} fontWeight={600} fill={C.ink}>
+        团队消费分布
+      </text>
+      {bars.map((b, i) => {
+        const y = 234 + i * 50; // top of bar group i; groups are 50 units apart
+        return (
+          <g key={i}>
+            <text x={232} y={y + 4} fontSize={10.5} fill={C.ink}>
+              {b[0] as string}
+            </text>
+            <rect x={232} y={y + 14} width={320} height={10} rx={5} fill="#eef0f3" />
+            <rect x={232} y={y + 14} width={(320 * (b[1] as number)) / 100} height={10} rx={5} fill={b[2] as string} />
+          </g>
+        );
+      })}
+
+      {/* Ranking table card: header row, then one row per entry of `rank` */}
+      <rect x={584} y={184} width={340} height={316} rx={10} fill={C.card} stroke={C.border} />
+      <text x={602} y={208} fontSize={12} fontWeight={600} fill={C.ink}>
+        团队消费排行榜 Top 10
+      </text>
+      {['排名', '团队', '金额', '占比'].map((h, i) => (
+        <text key={i} x={[602, 648, 770, 890][i]} y={236} fontSize={10} fill={C.muted} fontWeight={600} textAnchor={i >= 2 ? 'end' : 'start'}>
+          {h}
+        </text>
+      ))}
+      <line x1={602} y1={246} x2={906} y2={246} stroke={C.border} />
+      {rank.map((r, i) => {
+        const y = 274 + i * 40; // text baseline of ranking row i; rows are 40 units apart
+        return (
+          <g key={i}>
+            <path
+              d={`M${608} ${y - 9} l3 6 l6 .8 l-4.5 4.3 l1 6 l-5.5 -3 l-5.5 3 l1 -6 l-4.5 -4.3 l6 -.8 z`}
+              fill={r[3] as string}
+            />
+            <text x={648} y={y} fontSize={11} fill={C.ink} fontWeight={600}>
+              {r[0] as string}
+            </text>
+            <text x={770} y={y} fontSize={11} fill={C.ink} textAnchor="end">
+              {r[1] as string}
+            </text>
+            <text x={890} y={y} fontSize={11} fill={C.muted} textAnchor="end">
+              {r[2] as string}
+            </text>
+            {i < rank.length - 1 && <line x1={602} y1={y + 18} x2={906} y2={y + 18} stroke="#f3f4f6" />}
+          </g>
+        );
+      })}
+    </g>
+  );
+}
+
+function BillingPanel(): ReactNode { // Billing-settings screen: tab strip, info banner and a price table of sample rows.
+  const rows = [ // [resource name, display name, unit, category, unit price, category tag colour]
+    ['cpu', 'CPU', '核', '其他', '0.10', C.blue],
+    ['memory', 'Memory', 'GiB', '其他', '0.05', C.green],
+    ['nvidia.com/gpu', 'GPU', '张', 'GPU', '8.00', C.purple],
+    ['ephemeral-storage', 'Storage', 'GiB', '存储', '0.01', C.indigo],
+  ];
+  return (
+    <g>
+      <text x={214} y={84} fontSize={17} fontWeight={700} fill={C.ink}>
+        系统设置 · 计费配置
+      </text>
+      {/* tab strip: the third entry (i === 2) is drawn as the selected tab */}
+      {['基本配置', '资源配置', '计费配置', '告警配置', '系统状态'].map((t, i) => (
+        <g key={i}>
+          <text
+            x={232 + i * 96}
+            y={114}
+            fontSize={11}
+            fontWeight={i === 2 ? 700 : 500}
+            fill={i === 2 ? C.blue : C.muted}>
+            {t}
+          </text>
+          {i === 2 && <rect x={228 + i * 96} y={122} width={62} height={2.5} rx={1} fill={C.blue} />}
+        </g>
+      ))}
+
+      <rect x={214} y={140} width={710} height={360} rx={10} fill={C.card} stroke={C.border} />
+      {/* info banner: tinted box with an icon and two lines of explanatory text */}
+      <rect x={232} y={158} width={674} height={40} rx={8} fill="#eaf2ff" />
+      <CurrencyDollarIcon x={244} y={168} size={18} stroke={C.blue} />
+      <text x={272} y={174} fontSize={10.5} fill={C.blue}>
+        单价用于计费：按（显示值 × 单价 × 使用时长）实时扣费，支持 CPU / 内存 / GPU 自定义价格
+      </text>
+      <text x={272} y={188} fontSize={10.5} fill={C.blue}>
+        换算除数用于将 K8s 原始值转为显示值（如 memory 1073741824 → 1 GiB）
+      </text>
+
+      {/* table header: six column titles, each placed at its own x anchor */}
+      {['资源名称', '显示名', '单位', '分类', '启用', '单价 (¥/单位·时)'].map((h, i) => (
+        <text key={i} x={[244, 380, 500, 580, 690, 770][i]} y={228} fontSize={10.5} fill={C.muted} fontWeight={600}>
+          {h}
+        </text>
+      ))}
+      <line x1={232} y1={240} x2={906} y2={240} stroke={C.border} />
+      {rows.map((r, i) => {
+        const y = 268 + i * 50; // text baseline of row i; rows are 50 units apart
+        return (
+          <g key={i}>
+            <rect x={244} y={y - 13} width={106} height={18} rx={4} fill="#f1f3f5" />
+            <text x={250} y={y} fontSize={9.5} fill={C.ink} fontFamily="monospace">
+              {r[0] as string}
+            </text>
+            <text x={380} y={y} fontSize={11} fill={C.ink}>
+              {r[1] as string}
+            </text>
+            <text x={500} y={y} fontSize={11} fill={C.muted}>
+              {r[2] as string}
+            </text>
+            <Tag x={580} y={y - 13} w={44} label={r[3] as string} color={r[5] as string} />
+            {/* toggle drawn in its "on" state: green track with the knob at the right end */}
+            <rect x={690} y={y - 11} width={30} height={16} rx={8} fill={C.green} />
+            <circle cx={712} cy={y - 3} r={6} fill="#fff" />
+            <text x={774} y={y} fontSize={12} fill={C.ink} fontWeight={600}>
+              ¥ {r[4] as string}
+            </text>
+            {i < rows.length - 1 && <line x1={244} y1={y + 22} x2={894} y2={y + 22} stroke="#f3f4f6" />}
+          </g>
+        );
+      })}
+    </g>
+  );
+}
+
+/* ------------------------------------------------------------------ */
+/*  Tabbed showcase                                                    */
+/* ------------------------------------------------------------------ */
+
+type TabKey = 'dashboard' | 'cluster' | 'report' | 'billing'; // one key per mock screen
+
+const TABS: {key: TabKey; label: string; Icon: typeof DashboardIcon}[] = [ // tab buttons in display order
+  {key: 'dashboard', label: translate({id: 'showcase.tab.dashboard', message: '资源总览'}), Icon: DashboardIcon},
+  {key: 'cluster', label: translate({id: 'showcase.tab.cluster', message: '集群节点'}), Icon: CpuIcon},
+  {key: 'report', label: translate({id: 'showcase.tab.report', message: '报表中心'}), Icon: ReportMoneyIcon},
+  {key: 'billing', label: translate({id: 'showcase.tab.billing', message: '计费配置'}), Icon: CurrencyDollarIcon},
+];
+
+const NAV_ACTIVE: Record<TabKey, number> = {dashboard: 0, cluster: 1, report: 5, billing: 7}; // index into NAV highlighted for each tab
+
+function AppFrame({tab}: {tab: TabKey}): ReactNode { // Mock app window: sidebar, top bar and the panel matching `tab`.
+  const activeNav = NAV_ACTIVE[tab]; // index of the sidebar entry to highlight
+  return (
+    <svg viewBox="0 0 940 520" className={styles.screen} role="img" aria-label="Bison UI">
+      {/* window background and outline */}
+      <rect x={0.5} y={0.5} width={939} height={519} rx={14} fill={C.bg} stroke={C.border} />
+      {/* sidebar: a rounded rect, then a plain strip that squares off its right-hand corners */}
+      <rect x={0} y={0} width={184} height={520} rx={14} fill={C.sidebar} />
+      <rect x={170} y={0} width={14} height={520} fill={C.sidebar} />
+      {/* brand: gradient dot (gradient defined in <defs> below) and product name */}
+      <circle cx={28} cy={32} r={11} fill="url(#bisonGrad)" />
+      <text x={48} y={37} fontSize={15} fontWeight={700} fill={C.ink}>
+        Bison
+      </text>
+      {/* nav: one row per NAV entry; the active row gets a tinted background and blue text */}
+      {NAV.map((item, i) => {
+        const y = 70 + i * 38;
+        const active = i === activeNav;
+        return (
+          <g key={i}>
+            {active && <rect x={12} y={y} width={160} height={30} rx={8} fill={C.sidebarActive} />}
+            <rect x={20} y={y + 9} width={13} height={13} rx={3} fill="none" stroke={active ? C.blue : C.muted} strokeWidth={1.6} />
+            <text x={44} y={y + 20} fontSize={11.5} fill={active ? C.blue : '#5b5f66'} fontWeight={active ? 600 : 400}>
+              {item}
+            </text>
+          </g>
+        );
+      })}
+      <text x={20} y={500} fontSize={9.5} fill={C.muted}>
+        v0.0.12 · Capsule + OpenCost
+      </text>
+
+      {/* top bar: white strip with a title on the left and a user badge on the right */}
+      <rect x={184} y={0} width={756} height={48} fill="#ffffff" />
+      <line x1={184} y1={48} x2={940} y2={48} stroke={C.border} />
+      <text x={206} y={30} fontSize={12.5} fill={C.muted}>
+        集群资源调度计费平台
+      </text>
+      <circle cx={886} cy={24} r={11} fill="#eef0f3" />
+      <text x={886} y={28} fontSize={10} fill={C.muted} textAnchor="middle">
+        A
+      </text>
+      <text x={870} y={28} fontSize={11} fill={C.ink} textAnchor="end">
+        admin
+      </text>
+
+      <defs>
+        <linearGradient id="bisonGrad" x1="0" y1="0" x2="1" y2="1">
+          <stop offset="0" stopColor={C.blue} />
+          <stop offset="1" stopColor={C.purple} />
+        </linearGradient>
+      </defs>
+
+      {tab === 'dashboard' && <DashboardPanel />}
+      {tab === 'cluster' && <ClusterPanel />}
+      {tab === 'report' && <ReportPanel />}
+      {tab === 'billing' && <BillingPanel />}
+    </svg>
+  );
+}
+
+export default function ProductShowcase(): ReactNode { // Heading, a row of tab buttons, and the mock screen they switch.
+  const [tab, setTab] = useState<TabKey>('dashboard'); // key of the screen currently shown
+  return (
+    <section className={styles.section}>
+      <div className="container">
+        <div className="text--center margin-bottom--lg">
+          <Heading as="h2" className={styles.title}>
+            <Translate id="showcase.title">One console for the whole GPU lifecycle</Translate>
+          </Heading>
+          <p className={styles.subtitle}>
+            <Translate id="showcase.subtitle">
+              From cluster topology to per-team chargeback — every screen, vector-rendered
+            </Translate>
+          </p>
+        </div>
+        <div className={styles.tabs} role="tablist">
+          {TABS.map(({key, label, Icon}) => (
+            <button
+              key={key}
+              id={`showcase-tab-${key}`}
+              type="button"
+              role="tab"
+              aria-selected={tab === key}
+              aria-controls="showcase-panel"
+              className={`${styles.tab} ${tab === key ? styles.tabActive : ''}`}
+              onClick={() => setTab(key)}>
+              <Icon size={18} />
+              <span>{label}</span>
+            </button>
+          ))}
+        </div>
+        <div id="showcase-panel" role="tabpanel" aria-labelledby={`showcase-tab-${tab}`} className={styles.frame}>
+          <AppFrame tab={tab} />
+        </div>
+      </div>
+    </section>
+  );
+}
diff --git a/website/src/components/ProductShowcase/styles.module.css b/website/src/components/ProductShowcase/styles.module.css
new file mode 100644
index 0000000..695d6ea
--- /dev/null
+++ b/website/src/components/ProductShowcase/styles.module.css
@@ -0,0 +1,108 @@
+.section {
+  padding: 4rem 0;
+  background: linear-gradient(180deg, #f8f9fa 0%, #ffffff 100%);
+}
+
+[data-theme='dark'] .section {
+  background: linear-gradient(180deg, #0d0d0d 0%, #1a1a1a 100%);
+}
+
+.title {
+  font-size: 2.2rem;
+  font-weight: 700;
+  margin-bottom: 0.6rem;
+}
+
+.subtitle {
+  color: #86868b;
+  font-size: 1.1rem;
+  max-width: 660px;
+  margin: 0 auto;
+}
+
+[data-theme='dark'] .subtitle {
+  color: #98989d;
+}
+
+.tabs {
+  display: flex;
+  flex-wrap: wrap;
+  justify-content: center;
+  gap: 0.5rem;
+  margin-bottom: 1.75rem;
+}
+
+.tab {
+  display: inline-flex;
+  align-items: center;
+  gap: 0.45rem;
+  padding: 0.5rem 1rem;
+  border-radius: 999px;
+  border: 1px solid rgba(0, 0, 0, 0.08);
+  background: rgba(255, 255, 255, 0.7);
+  color: #5b5f66;
+  font-size: 0.92rem;
+  font-weight: 600;
+  cursor: pointer;
+  transition: all 0.25s cubic-bezier(0.4, 0, 0.2, 1);
+}
+
+[data-theme='dark'] .tab {
+  background: rgba(40, 40, 40, 0.6);
+  border-color: rgba(255, 255, 255, 0.1);
+  color: #c7c7cc;
+}
+
+.tab:hover {
+  transform: translateY(-1px);
+  border-color: rgba(10, 132, 255, 0.4);
+  color: var(--ifm-color-primary);
+}
+
+.tab.tabActive { /* two classes: must outrank .tab:hover and [data-theme='dark'] .tab */
+  background: linear-gradient(135deg, #0A84FF, #5E5CE6);
+  border-color: transparent;
+  color: #fff;
+  box-shadow: 0 6px 16px rgba(10, 132, 255, 0.35);
+}
+
+[data-theme='dark'] .tabActive {
+  color: #fff;
+}
+
+.frame {
+  max-width: 1000px;
+  margin: 0 auto;
+  padding: 14px;
+  border-radius: 18px;
+  background: linear-gradient(135deg, rgba(10, 132, 255, 0.08), rgba(191, 90, 242, 0.08));
+  border: 1px solid rgba(0, 0, 0, 0.06);
+  box-shadow:
+    0 24px 60px rgba(10, 30, 80, 0.18),
+    0 2px 8px rgba(0, 0, 0, 0.06);
+}
+
+[data-theme='dark'] .frame {
+  border-color: rgba(255, 255, 255, 0.08);
+  box-shadow: 0 24px 60px rgba(0, 0, 0, 0.5);
+}
+
+.screen {
+  display: block;
+  width: 100%;
+  height: auto;
+  border-radius: 12px;
+  overflow: hidden;
+  animation: fadeIn 0.4s ease-out;
+}
+
+@keyframes fadeIn {
+  from {
+    opacity: 0;
+    transform: scale(0.99);
+  }
+  to {
+    opacity: 1;
+    transform: scale(1);
+  }
+}
diff --git a/website/src/components/StatsSection/index.tsx b/website/src/components/StatsSection/index.tsx
new file mode 100644
index 0000000..91349f7
--- /dev/null
+++ b/website/src/components/StatsSection/index.tsx
@@ -0,0 +1,124 @@
+import {useEffect, useState, useRef} from 'react';
+import type {ReactNode} from 'react';
+import {translate} from '@docusaurus/Translate';
+import styles from './styles.module.css';
+
+interface StatItem {
+  value: string; // numeric text; StatsSection passes it through parseFloat
+  label: string; // translated caption shown with the number
+  suffix?: string; // text handed to CountUpNumber to print after the number
+}
+
+const stats: StatItem[] = [
+  {
+    value: '99.9',
+    label: translate({
+      id: 'component.statsSection.efficiency',
+      message: 'GPU Resource Efficiency',
+      description: 'Label for GPU resource efficiency statistic',
+    }),
+    suffix: '%',
+  },
+  {
+    value: '30',
+    label: translate({
+      id: 'component.statsSection.deployTime',
+      message: 'Avg Deploy Time',
+      description: 'Label for average deployment time statistic',
+    }),
+    suffix: ' min',
+  },
+  {
+    value: '1000',
+    label: translate({
+      id: 'component.statsSection.tenants',
+      message: 'Supported Tenants',
+      description: 'Label for supported tenants statistic',
+    }),
+    suffix: '+',
+  },
+  {
+    value: '40',
+    label: translate({
+      id: 'component.statsSection.savings',
+      message: 'Cost Savings',
+      description: 'Label for cost savings statistic',
+    }),
+    suffix: '%+',
+  },
+];
+
+// Counts from 0 up to `end` on an ease-out curve the first time the number
+// scrolls at least 30% into view; `suffix` is appended verbatim.
+function CountUpNumber({end, suffix = '', duration = 2000}: {end: number; suffix?: string; duration?: number}): ReactNode {
+  const [count, setCount] = useState(0);
+  const ref = useRef<HTMLSpanElement>(null);
+
+  useEffect(() => {
+    // Effect-local flag: as state it would re-run this effect the moment it flips.
+    let started = false;
+    let frameId = 0;
+    const observer = new IntersectionObserver(
+      entries => {
+        if (started || !entries[0].isIntersecting) {
+          return;
+        }
+        started = true;
+        observer.disconnect(); // one-shot: nothing left to watch for
+        const startTime = Date.now();
+        const animate = () => {
+          const progress = Math.min((Date.now() - startTime) / duration, 1);
+          if (progress < 1) {
+            // Easing function (ease-out cubic)
+            setCount(end * (1 - Math.pow(1 - progress, 3)));
+            frameId = requestAnimationFrame(animate);
+          } else {
+            setCount(end);
+          }
+        };
+        animate();
+      },
+      {threshold: 0.3}
+    );
+
+    if (ref.current) {
+      observer.observe(ref.current);
+    }
+
+    return () => {
+      observer.disconnect();
+      // Stop a count-up still in flight so it cannot update an unmounted component.
+      cancelAnimationFrame(frameId);
+    };
+  }, [end, duration]);
+
+  return (
+    <span ref={ref}>
+      {end % 1 === 0 ? Math.floor(count) : count.toFixed(1)}
+      {suffix}
+    </span>
+  );
+}
+
+// Renders every entry of `stats` as a count-up number above its label.
+export default function StatsSection(): ReactNode {
+  const tiles = stats.map(({value, suffix, label}, position) => (
+    <div key={position} className={styles.statItem}>
+      <div className={styles.statValue}>
+        <CountUpNumber
+          end={parseFloat(value)}
+          suffix={suffix}
+          duration={2000}
+        />
+      </div>
+      <div className={styles.statLabel}>{label}</div>
+    </div>
+  ));
+  return (
+    <section className={styles.statsSection}>
+      <div className="container">
+        <div className={styles.statsGrid}>{tiles}</div>
+      </div>
+    </section>
+  );
+}
diff --git a/website/src/components/StatsSection/styles.module.css b/website/src/components/StatsSection/styles.module.css
new file mode 100644
index 0000000..b0ee418
--- /dev/null
+++ b/website/src/components/StatsSection/styles.module.css
@@ -0,0 +1,101 @@
+.statsSection {
+  padding: 4rem 0;
+  background: linear-gradient(135deg, #0A84FF 0%, #5E5CE6 100%);
+  position: relative;
+  overflow: hidden;
+}
+
+.statsSection::before {
+  content: '';
+  position: absolute;
+  top: 0;
+  left: 0;
+  right: 0;
+  bottom: 0;
+  background:
+    radial-gradient(circle at 10% 20%, rgba(255, 255, 255, 0.1) 0%, transparent 40%),
+    radial-gradient(circle at 90% 80%, rgba(255, 255, 255, 0.1) 0%, transparent 40%);
+  animation: shimmer 10s ease-in-out infinite;
+}
+
+@keyframes shimmer {
+  0%, 100% {
+    opacity: 0.5;
+  }
+  50% {
+    opacity: 1;
+  }
+}
+
+.statsGrid {
+  display: grid;
+  grid-template-columns: repeat(auto-fit, minmax(200px, 1fr));
+  gap: 3rem;
+  position: relative;
+  z-index: 1;
+}
+
+.statItem {
+  text-align: center;
+  color: white;
+  animation: fadeInScale 0.8s ease-out backwards;
+}
+
+.statItem:nth-child(1) {
+  animation-delay: 0.1s;
+}
+
+.statItem:nth-child(2) {
+  animation-delay: 0.2s;
+}
+
+.statItem:nth-child(3) {
+  animation-delay: 0.3s;
+}
+
+.statItem:nth-child(4) {
+  animation-delay: 0.4s;
+}
+
+.statValue {
+  font-size: 3.5rem;
+  font-weight: 700;
+  line-height: 1.2;
+  margin-bottom: 0.5rem;
+  text-shadow: 0 2px 10px rgba(0, 0, 0, 0.2);
+  font-variant-numeric: tabular-nums;
+}
+
+.statLabel {
+  font-size: 1rem;
+  font-weight: 500;
+  opacity: 0.95;
+  text-transform: uppercase;
+  letter-spacing: 1px;
+}
+
+@keyframes fadeInScale {
+  from {
+    opacity: 0;
+    transform: scale(0.8) translateY(20px);
+  }
+  to {
+    opacity: 1;
+    transform: scale(1) translateY(0);
+  }
+}
+
+@media screen and (max-width: 768px) {
+  .statsGrid {
+    grid-template-columns: repeat(2, 1fr);
+    gap: 2rem;
+  }
+
+  .statValue {
+    font-size: 2.5rem;
+  }
+
+  .statLabel {
+    font-size: 0.875rem;
+  }
+}
diff --git a/website/src/components/UseCases/index.tsx b/website/src/components/UseCases/index.tsx
new file mode 100644
index 0000000..be4ca19
--- /dev/null
+++ b/website/src/components/UseCases/index.tsx
@@ -0,0 +1,263 @@
+import type {ComponentType, ReactNode} from 'react';
+import {translate} from '@docusaurus/Translate';
+import Translate from '@docusaurus/Translate';
+import Heading from '@theme/Heading';
+import {
+  CpuIcon,
+  BuildingIcon,
+  ReportMoneyIcon,
+  CheckCircleIcon,
+  XCircleIcon,
+  ArrowRightIcon,
+  type IconProps,
+} from '../Icons';
+import styles from './styles.module.css';
+
+interface UseCase { // Data backing one card rendered by ComparisonCard.
+  Icon: ComponentType<IconProps>; // icon component drawn inside the coloured tile
+  color: string; // must be #RRGGBB: ComparisonCard appends 2-digit alpha suffixes (`cc`, `40`)
+  title: string; // card heading, already passed through translate()
+  description: string; // one-line summary shown under the heading
+  before: string[]; // bullet items for the "Before Bison" column
+  after: string[]; // bullet items for the "With Bison" column
+}
+
+const useCases: UseCase[] = [
+  {
+    Icon: CpuIcon,
+    color: '#5E5CE6',
+    title: translate({
+      id: 'component.useCases.aiTraining.title',
+      message: 'AI Training Platform',
+      description: 'Title for AI training use case',
+    }),
+    description: translate({
+      id: 'component.useCases.aiTraining.description',
+      message: 'Multi-team GPU resource sharing for machine learning workloads',
+      description: 'Description for AI training use case',
+    }),
+    before: [
+      translate({
+        id: 'component.useCases.aiTraining.before.manual',
+        message: 'Manual GPU allocation',
+        description: 'AI training before: manual allocation',
+      }),
+      translate({
+        id: 'component.useCases.aiTraining.before.noCost',
+        message: 'No cost visibility',
+        description: 'AI training before: no cost visibility',
+      }),
+      translate({
+        id: 'component.useCases.aiTraining.before.conflicts',
+        message: 'Resource conflicts',
+        description: 'AI training before: resource conflicts',
+      }),
+    ],
+    after: [
+      translate({
+        id: 'component.useCases.aiTraining.after.automated',
+        message: 'Automated scheduling',
+        description: 'AI training after: automated scheduling',
+      }),
+      translate({
+        id: 'component.useCases.aiTraining.after.realtime',
+        message: 'Real-time cost tracking',
+        description: 'AI training after: real-time cost tracking',
+      }),
+      translate({
+        id: 'component.useCases.aiTraining.after.fair',
+        message: 'Fair resource sharing',
+        description: 'AI training after: fair resource sharing',
+      }),
+    ],
+  },
+  {
+    Icon: BuildingIcon,
+    color: '#0A84FF',
+    title: translate({
+      id: 'component.useCases.enterprise.title',
+      message: 'Enterprise Cloud',
+      description: 'Title for enterprise cloud use case',
+    }),
+    description: translate({
+      id: 'component.useCases.enterprise.description',
+      message: 'Department-level resource isolation and billing',
+      description: 'Description for enterprise cloud use case',
+    }),
+    before: [
+      translate({
+        id: 'component.useCases.enterprise.before.chaos',
+        message: 'Shared cluster chaos',
+        description: 'Enterprise before: shared cluster chaos',
+      }),
+      translate({
+        id: 'component.useCases.enterprise.before.noBudget',
+        message: 'No budget control',
+        description: 'Enterprise before: no budget control',
+      }),
+      translate({
+        id: 'component.useCases.enterprise.before.manual',
+        message: 'Manual reporting',
+        description: 'Enterprise before: manual reporting',
+      }),
+    ],
+    after: [
+      translate({
+        id: 'component.useCases.enterprise.after.isolated',
+        message: 'Isolated tenants',
+        description: 'Enterprise after: isolated tenants',
+      }),
+      translate({
+        id: 'component.useCases.enterprise.after.prepaid',
+        message: 'Prepaid balances',
+        description: 'Enterprise after: prepaid balances',
+      }),
+      translate({
+        id: 'component.useCases.enterprise.after.automated',
+        message: 'Automated reports',
+        description: 'Enterprise after: automated reports',
+      }),
+    ],
+  },
+  {
+    Icon: ReportMoneyIcon,
+    color: '#34C759',
+    title: translate({
+      id: 'component.useCases.billing.title',
+      message: 'Cost Center Billing',
+      description: 'Title for cost center billing use case',
+    }),
+    description: translate({
+      id: 'component.useCases.billing.description',
+      message: 'Chargeback system for internal GPU resources',
+      description: 'Description for cost center billing use case',
+    }),
+    before: [
+      translate({
+        id: 'component.useCases.billing.before.excel',
+        message: 'Excel-based tracking',
+        description: 'Billing before: Excel-based tracking',
+      }),
+      translate({
+        id: 'component.useCases.billing.before.monthly',
+        message: 'Monthly reconciliation',
+        description: 'Billing before: monthly reconciliation',
+      }),
+      translate({
+        id: 'component.useCases.billing.before.disputes',
+        message: 'Billing disputes',
+        description: 'Billing before: billing disputes',
+      }),
+    ],
+    after: [
+      translate({
+        id: 'component.useCases.billing.after.realtime',
+        message: 'Real-time deduction',
+        description: 'Billing after: real-time deduction',
+      }),
+      translate({
+        id: 'component.useCases.billing.after.transparent',
+        message: 'Transparent pricing',
+        description: 'Billing after: transparent pricing',
+      }),
+      translate({
+        id: 'component.useCases.billing.after.automated',
+        message: 'Automated invoicing',
+        description: 'Billing after: automated invoicing',
+      }),
+    ],
+  },
+];
+
+function ComparisonCard({useCase}: {useCase: UseCase}): ReactNode { // One card: icon tile, title, description, then a before -> after comparison.
+  const {Icon} = useCase; // capitalised local so JSX treats it as a component
+  return (
+    <div className={styles.useCaseCard}>
+      <div
+        className={styles.useCaseIcon}
+        style={{
+          background: `linear-gradient(135deg, ${useCase.color}, ${useCase.color}cc)`, // `cc` = 8-digit hex alpha (~80%)
+          boxShadow: `0 6px 16px ${useCase.color}40`, // `40` = 8-digit hex alpha (~25%)
+        }}>
+        <Icon size={26} stroke="#fff" />
+      </div>
+      <Heading as="h3" className={styles.useCaseTitle}>
+        {useCase.title}
+      </Heading>
+      <p className={styles.useCaseDescription}>{useCase.description}</p>
+
+      <div className={styles.comparison}>
+        <div className={styles.comparisonColumn}>
+          <div className={styles.comparisonHeader}>
+            <span className={styles.crossIcon}>
+              <XCircleIcon size={18} />
+            </span>
+            <span>
+              <Translate id="component.useCases.beforeBison">
+                Before Bison
+              </Translate>
+            </span>
+          </div>
+          <ul className={styles.comparisonList}>
+            {useCase.before.map((item, i) => ( // index keys: the list is never reordered at runtime
+              <li key={i} className={styles.comparisonItemBefore}>
+                {item}
+              </li>
+            ))}
+          </ul>
+        </div>
+
+        <div className={styles.comparisonDivider}>
+          <ArrowRightIcon size={22} />
+        </div>
+
+        <div className={styles.comparisonColumn}>
+          <div className={styles.comparisonHeader}>
+            <span className={styles.checkIcon}>
+              <CheckCircleIcon size={18} />
+            </span>
+            <span>
+              <Translate id="component.useCases.withBison">
+                With Bison
+              </Translate>
+            </span>
+          </div>
+          <ul className={styles.comparisonList}>
+            {useCase.after.map((item, i) => ( // index keys: the list is never reordered at runtime
+              <li key={i} className={styles.comparisonItemAfter}>
+                {item}
+              </li>
+            ))}
+          </ul>
+        </div>
+      </div>
+    </div>
+  );
+}
+
+export default function UseCases(): ReactNode { // Homepage section: translated heading and subtitle, then one ComparisonCard per useCases entry.
+  return (
+    <section className={styles.useCasesSection}>
+      <div className="container">
+        <div className="text--center margin-bottom--lg">
+          <Heading as="h2" className={styles.sectionTitle}>
+            <Translate id="component.useCases.title">
+              Real-World Use Cases
+            </Translate>
+          </Heading>
+          <p className={styles.sectionSubtitle}>
+            <Translate id="component.useCases.subtitle">
+              See how Bison transforms GPU resource management across different scenarios
+            </Translate>
+          </p>
+        </div>
+
+        <div className={styles.useCasesGrid}>
+          {useCases.map((useCase, index) => ( // index key is safe: useCases is a static module-level array
+            <ComparisonCard key={index} useCase={useCase} />
+          ))}
+        </div>
+      </div>
+    </section>
+  );
+}
diff --git a/website/src/components/UseCases/styles.module.css b/website/src/components/UseCases/styles.module.css
new file mode 100644
index 0000000..4657fe2
--- /dev/null
+++ b/website/src/components/UseCases/styles.module.css
@@ -0,0 +1,208 @@
+.useCasesSection {
+  padding: 4rem 0;
+  background: linear-gradient(180deg, #ffffff 0%, #f8f9fa 100%);
+}
+
+[data-theme='dark'] .useCasesSection {
+  background: linear-gradient(180deg, #0d0d0d 0%, #1a1a1a 100%);
+}
+
+.sectionTitle {
+  font-size: 2.5rem;
+  font-weight: 700;
+  margin-bottom: 1rem;
+}
+
+.sectionSubtitle {
+  font-size: 1.125rem;
+  color: #666;
+  max-width: 700px;
+  margin: 0 auto;
+}
+
+[data-theme='dark'] .sectionSubtitle {
+  color: #b3b3b3;
+}
+
+.useCasesGrid {
+  display: grid;
+  grid-template-columns: repeat(auto-fit, minmax(320px, 1fr));
+  gap: 2rem;
+  margin-top: 3rem;
+}
+
+.useCaseCard {
+  padding: 2rem;
+  border-radius: 16px;
+  background: white;
+  box-shadow: 0 4px 6px rgba(0, 0, 0, 0.05);
+  transition: all 0.4s cubic-bezier(0.4, 0, 0.2, 1);
+  border: 1px solid rgba(0, 0, 0, 0.05);
+  animation: fadeInUp 0.6s ease-out backwards;
+}
+
+[data-theme='dark'] .useCaseCard {
+  background: rgba(30, 30, 30, 0.8);
+  border: 1px solid rgba(255, 255, 255, 0.1);
+}
+
+.useCaseCard:nth-child(1) {
+  animation-delay: 0.1s;
+}
+
+.useCaseCard:nth-child(2) {
+  animation-delay: 0.2s;
+}
+
+.useCaseCard:nth-child(3) {
+  animation-delay: 0.3s;
+}
+
+.useCaseCard:hover {
+  transform: translateY(-8px);
+  box-shadow: 0 12px 24px rgba(10, 132, 255, 0.1);
+}
+
+.useCaseIcon {
+  width: 54px;
+  height: 54px;
+  border-radius: 14px;
+  margin-bottom: 1.25rem;
+  display: flex;
+  align-items: center;
+  justify-content: center;
+  transition: transform 0.4s cubic-bezier(0.4, 0, 0.2, 1);
+}
+
+.useCaseCard:hover .useCaseIcon {
+  transform: scale(1.08) rotate(-3deg);
+}
+
+.useCaseTitle {
+  font-size: 1.5rem;
+  font-weight: 600;
+  margin-bottom: 0.75rem;
+}
+
+.useCaseDescription {
+  color: #666;
+  margin-bottom: 1.5rem;
+  line-height: 1.6;
+}
+
+[data-theme='dark'] .useCaseDescription {
+  color: #b3b3b3;
+}
+
+.comparison {
+  display: grid;
+  grid-template-columns: 1fr auto 1fr;
+  gap: 1rem;
+  align-items: start;
+}
+
+.comparisonColumn {
+  min-width: 0;
+}
+
+.comparisonHeader {
+  display: flex;
+  align-items: center;
+  gap: 0.5rem;
+  font-weight: 600;
+  margin-bottom: 0.75rem;
+  font-size: 0.875rem;
+}
+
+.crossIcon {
+  display: inline-flex;
+  color: #ff453a;
+}
+
+.checkIcon {
+  display: inline-flex;
+  color: #34c759;
+}
+
+.comparisonDivider {
+  display: flex;
+  align-items: center;
+  color: #0A84FF;
+  padding-top: 1.5rem;
+}
+
+.comparisonList {
+  list-style: none;
+  padding: 0;
+  margin: 0;
+}
+
+.comparisonList li {
+  padding: 0.5rem 0;
+  font-size: 0.875rem;
+  position: relative;
+  padding-left: 1.25rem;
+}
+
+.comparisonList li::before {
+  content: '';
+  position: absolute;
+  left: 0;
+  top: 0.875rem;
+  width: 6px;
+  height: 6px;
+  border-radius: 50%;
+}
+
+.comparisonItemBefore {
+  color: #999;
+}
+
+.comparisonItemBefore::before {
+  background: #ff4444;
+}
+
+.comparisonItemAfter {
+  color: #333;
+  font-weight: 500;
+}
+
+[data-theme='dark'] .comparisonItemAfter {
+  color: #ffffff;
+}
+
+.comparisonItemAfter::before {
+  background: #00c853;
+}
+
+@keyframes fadeInUp {
+  from {
+    opacity: 0;
+    transform: translateY(30px);
+  }
+  to {
+    opacity: 1;
+    transform: translateY(0);
+  }
+}
+
+@media screen and (max-width: 768px) {
+  .useCasesGrid {
+    grid-template-columns: 1fr;
+  }
+
+  .comparison {
+    grid-template-columns: 1fr; /* stack "before" / arrow / "after" vertically */
+    gap: 1.5rem;
+  }
+
+  .comparisonDivider {
+    justify-content: center; /* flex container: text-align does not move the icon, and an off-centre icon is swung away by the rotation below */
+    padding-top: 0;
+    transform: rotate(90deg); /* arrow now points down, from "before" to "after" */
+  }
+
+  .sectionTitle {
+    font-size: 2rem;
+  }
+}
diff --git a/website/src/css/custom.css b/website/src/css/custom.css
index 8df8ae0..a9ab623 100644
--- a/website/src/css/custom.css
+++ b/website/src/css/custom.css
@@ -127,3 +127,146 @@ button:focus,
   outline-offset: 2px;
   border-radius: 4px;
 }
+
+/* ==================== Additional Modern Effects ==================== */
+
+/* Smooth scrolling, only for users who have not asked for reduced motion */
+@media (prefers-reduced-motion: no-preference) {
+  html { scroll-behavior: smooth; }
+}
+
+/* Page transitions */
+main {
+  animation: pageEnter 0.5s ease-out;
+}
+
+@keyframes pageEnter {
+  from {
+    opacity: 0;
+    transform: translateY(20px);
+  }
+  to {
+    opacity: 1;
+    transform: translateY(0);
+  }
+}
+
+/* Enhanced button styles */
+.button--primary,
+.button--secondary {
+  font-weight: 600;
+  letter-spacing: 0.3px;
+  position: relative;
+  overflow: hidden;
+}
+
+.button--primary::before,
+.button--secondary::before {
+  content: '';
+  position: absolute;
+  top: 50%;
+  left: 50%;
+  width: 0;
+  height: 0;
+  border-radius: 50%;
+  background: rgba(255, 255, 255, 0.2);
+  transform: translate(-50%, -50%);
+  transition: width 0.6s, height 0.6s;
+}
+
+.button--primary:hover::before,
+.button--secondary:hover::before {
+  width: 300px;
+  height: 300px;
+}
+
+/* Card hover glow effect */
+.card:hover {
+  box-shadow:
+    0 4px 20px rgba(10, 132, 255, 0.15),
+    0 0 0 1px rgba(10, 132, 255, 0.1);
+}
+
+/* Improved text selection */
+::selection {
+  background: rgba(10, 132, 255, 0.3);
+  color: inherit;
+}
+
+/* Loading shimmer effect */
+@keyframes shimmer {
+  0% {
+    background-position: -1000px 0;
+  }
+  100% {
+    background-position: 1000px 0;
+  }
+}
+
+/* Pulse animation for important elements */
+@keyframes pulse {
+  0%, 100% {
+    opacity: 1;
+  }
+  50% {
+    opacity: 0.8;
+  }
+}
+
+/* Gradient text effect */
+.gradient-text {
+  background: linear-gradient(135deg, #0A84FF, #5E5CE6, #BF5AF2);
+  -webkit-background-clip: text;
+  -webkit-text-fill-color: transparent;
+  background-clip: text;
+}
+
+/* Scrollbar styling */
+::-webkit-scrollbar {
+  width: 10px;
+  height: 10px;
+}
+
+::-webkit-scrollbar-track {
+  background: rgba(0, 0, 0, 0.05);
+}
+
+::-webkit-scrollbar-thumb {
+  background: rgba(10, 132, 255, 0.3);
+  border-radius: 5px;
+}
+
+::-webkit-scrollbar-thumb:hover {
+  background: rgba(10, 132, 255, 0.5);
+}
+
+[data-theme='dark'] ::-webkit-scrollbar-track {
+  background: rgba(255, 255, 255, 0.05);
+}
+
+[data-theme='dark'] ::-webkit-scrollbar-thumb {
+  background: rgba(10, 132, 255, 0.4);
+}
+
+[data-theme='dark'] ::-webkit-scrollbar-thumb:hover {
+  background: rgba(10, 132, 255, 0.6);
+}
+
+/*
+ * No blanket `will-change` here: promoting every link, button and card to
+ * its own compositor layer wastes memory and gives each of them a new
+ * stacking context. Browsers already optimise hover transforms; add
+ * `will-change` only to a specific element that is measurably janky, and
+ * remove it again once its animation has finished.
+ */
+
+/* Reduce motion for accessibility */
+@media (prefers-reduced-motion: reduce) {
+  *,
+  *::before,
+  *::after {
+    animation-duration: 0.01ms !important;
+    animation-iteration-count: 1 !important;
+    transition-duration: 0.01ms !important;
+  }
+}
diff --git a/website/src/pages/index.module.css b/website/src/pages/index.module.css
index 9f71a5d..95cdd6c 100644
--- a/website/src/pages/index.module.css
+++ b/website/src/pages/index.module.css
@@ -8,11 +8,51 @@
   text-align: center;
   position: relative;
   overflow: hidden;
+  background: linear-gradient(135deg, #0A84FF 0%, #5E5CE6 50%, #BF5AF2 100%);
+  background-size: 400% 400%;
+  animation: gradientShift 15s ease infinite;
+  min-height: 500px;
+  display: flex;
+  align-items: center;
+}
+
+.heroBanner::before {
+  content: '';
+  position: absolute;
+  top: 0;
+  left: 0;
+  right: 0;
+  bottom: 0;
+  background: radial-gradient(circle at 20% 50%, rgba(255, 255, 255, 0.1) 0%, transparent 50%),
+              radial-gradient(circle at 80% 80%, rgba(255, 255, 255, 0.1) 0%, transparent 50%);
+  animation: pulse 8s ease-in-out infinite;
+}
+
+@keyframes gradientShift {
+  0% {
+    background-position: 0% 50%;
+  }
+  50% {
+    background-position: 100% 50%;
+  }
+  100% {
+    background-position: 0% 50%;
+  }
+}
+
+@keyframes pulse {
+  0%, 100% {
+    opacity: 0.5;
+  }
+  50% {
+    opacity: 1;
+  }
 }
 
 @media screen and (max-width: 996px) {
   .heroBanner {
     padding: 2rem;
+    min-height: 400px;
   }
 }
 
@@ -20,4 +60,32 @@
   display: flex;
   align-items: center;
   justify-content: center;
+  gap: 1rem;
+  margin-top: 2rem;
+  position: relative;
+  z-index: 10;
+}
+
+.buttons a {
+  animation: fadeInUp 0.8s ease-out;
+  animation-fill-mode: both;
+}
+
+.buttons a:nth-child(1) {
+  animation-delay: 0.2s;
+}
+
+.buttons a:nth-child(2) {
+  animation-delay: 0.4s;
+}
+
+@keyframes fadeInUp {
+  from {
+    opacity: 0;
+    transform: translateY(30px);
+  }
+  to {
+    opacity: 1;
+    transform: translateY(0);
+  }
 }
diff --git a/website/src/pages/index.tsx b/website/src/pages/index.tsx
index 6b7ad24..c4b40b9 100644
--- a/website/src/pages/index.tsx
+++ b/website/src/pages/index.tsx
@@ -5,7 +5,14 @@ import useDocusaurusContext from '@docusaurus/useDocusaurusContext';
 import useBaseUrl from '@docusaurus/useBaseUrl';
 import Layout from '@theme/Layout';
 import HomepageFeatures from '@site/src/components/HomepageFeatures';
+import ParticleBackground from '@site/src/components/ParticleBackground';
+import StatsSection from '@site/src/components/StatsSection';
+import ProductShowcase from '@site/src/components/ProductShowcase';
+import ArchitectureDiagram from '@site/src/components/ArchitectureDiagram';
+import UseCases from '@site/src/components/UseCases';
 import Heading from '@theme/Heading';
+import Translate, {translate} from '@docusaurus/Translate';
+import {ArrowRightIcon, GithubIcon} from '@site/src/components/Icons';
 
 import styles from './index.module.css';
 
@@ -13,27 +20,50 @@ function HomepageHeader() {
   const {siteConfig} = useDocusaurusContext();
   return (
     <header className={clsx('hero hero--primary', styles.heroBanner)}>
-      <div className="container">
+      <ParticleBackground />
+      <div className="container" style={{position: 'relative', zIndex: 10}}>
         <img
           src={useBaseUrl('/img/logo.svg')}
           alt="Bison Logo"
-          style={{width: '120px', height: '120px', marginBottom: '1rem'}}
+          style={{
+            width: '120px',
+            height: '120px',
+            marginBottom: '1rem',
+            animation: 'fadeInUp 0.8s ease-out',
+            filter: 'drop-shadow(0 4px 12px rgba(0,0,0,0.2))',
+          }}
         />
-        <Heading as="h1" className="hero__title">
+        <Heading
+          as="h1"
+          className="hero__title"
+          style={{
+            animation: 'fadeInUp 0.8s ease-out 0.1s both',
+            textShadow: '0 2px 10px rgba(0,0,0,0.2)',
+          }}>
           {siteConfig.title}
         </Heading>
-        <p className="hero__subtitle">{siteConfig.tagline}</p>
+        <p
+          className="hero__subtitle"
+          style={{
+            animation: 'fadeInUp 0.8s ease-out 0.2s both',
+            textShadow: '0 1px 5px rgba(0,0,0,0.2)',
+          }}>
+          {siteConfig.tagline}
+        </p>
         <div className={styles.buttons}>
           <Link
             className="button button--secondary button--lg"
-            to="/docs">
-            Get Started 🚀
+            to="/docs"
+            style={{display: 'inline-flex', alignItems: 'center', gap: '0.5rem'}}>
+            <Translate id="homepage.getStarted">Get Started</Translate>
+            <ArrowRightIcon size={20} />
           </Link>
           <Link
             className="button button--outline button--secondary button--lg"
             to="https://github.com/SuperMarioYL/Bison"
-            style={{marginLeft: '1rem'}}>
-            GitHub ⭐
+            style={{display: 'inline-flex', alignItems: 'center', gap: '0.5rem'}}>
+            <GithubIcon size={20} />
+            GitHub
           </Link>
         </div>
       </div>
@@ -45,11 +75,23 @@ export default function Home(): ReactNode {
   const {siteConfig} = useDocusaurusContext();
   return (
     <Layout
-      title={`${siteConfig.title} - Kubernetes GPU Resource Billing & Multi-Tenant Management`}
-      description="Enterprise GPU resource billing and multi-tenant management platform based on Kubernetes, Capsule, and OpenCost">
+      title={translate({
+        id: 'homepage.title',
+        message: 'Bison - Kubernetes GPU Resource Billing & Multi-Tenant Management',
+        description: 'Homepage title',
+      })}
+      description={translate({
+        id: 'homepage.description',
+        message: 'Enterprise GPU resource billing and multi-tenant management platform based on Kubernetes, Capsule, and OpenCost',
+        description: 'Homepage meta description',
+      })}>
       <HomepageHeader />
       <main>
+        <StatsSection />
+        <ProductShowcase />
         <HomepageFeatures />
+        <ArchitectureDiagram />
+        <UseCases />
       </main>
     </Layout>
   );
diff --git a/website/static/CNAME b/website/static/CNAME
new file mode 100644
index 0000000..ba638fd
--- /dev/null
+++ b/website/static/CNAME
@@ -0,0 +1 @@
+bison.lei6393.com
diff --git a/website/static/img/bison-social-card.png b/website/static/img/bison-social-card.png
index cbd1719..db32261 100644
Binary files a/website/static/img/bison-social-card.png and b/website/static/img/bison-social-card.png differ
diff --git a/website/static/img/bison-social-card.svg b/website/static/img/bison-social-card.svg
new file mode 100644
index 0000000..76d2a52
--- /dev/null
+++ b/website/static/img/bison-social-card.svg
@@ -0,0 +1,71 @@
+<svg xmlns="http://www.w3.org/2000/svg" width="1200" height="630" viewBox="0 0 1200 630">
+  <defs>
+    <linearGradient id="bg" x1="0" y1="0" x2="1" y2="1">
+      <stop offset="0" stop-color="#0a1430"/>
+      <stop offset="0.55" stop-color="#0b1f4d"/>
+      <stop offset="1" stop-color="#241047"/>
+    </linearGradient>
+    <linearGradient id="brand" x1="0" y1="0" x2="1" y2="1">
+      <stop offset="0" stop-color="#0A84FF"/>
+      <stop offset="1" stop-color="#BF5AF2"/>
+    </linearGradient>
+    <linearGradient id="accent" x1="0" y1="0" x2="1" y2="0">
+      <stop offset="0" stop-color="#0A84FF"/>
+      <stop offset="0.5" stop-color="#5E5CE6"/>
+      <stop offset="1" stop-color="#BF5AF2"/>
+    </linearGradient>
+    <style>
+      text { font-family: -apple-system, "Segoe UI", "Helvetica Neue", Arial, "PingFang SC", "Microsoft YaHei", sans-serif; }
+    </style>
+  </defs>
+
+  <rect width="1200" height="630" fill="url(#bg)"/>
+
+  <!-- subtle grid -->
+  <g stroke="#ffffff" stroke-opacity="0.04" stroke-width="1">
+    <path d="M0 158 H1200 M0 316 H1200 M0 474 H1200 M300 0 V630 M600 0 V630 M900 0 V630"/>
+  </g>
+
+  <!-- glow blobs -->
+  <circle cx="1010" cy="150" r="220" fill="#0A84FF" opacity="0.16"/>
+  <circle cx="1080" cy="470" r="200" fill="#BF5AF2" opacity="0.14"/>
+
+  <!-- logo mark -->
+  <g transform="translate(90,96)">
+    <rect width="84" height="84" rx="22" fill="url(#brand)"/>
+    <g fill="none" stroke="#ffffff" stroke-width="4.5" stroke-linecap="round" stroke-linejoin="round" transform="translate(20,20)">
+      <rect x="2" y="2" width="18" height="24" rx="3"/>
+      <rect x="24" y="2" width="18" height="14" rx="3"/>
+      <rect x="2" y="30" width="18" height="12" rx="3"/>
+      <rect x="24" y="20" width="18" height="22" rx="3"/>
+    </g>
+  </g>
+
+  <text x="196" y="138" fill="#ffffff" font-size="64" font-weight="800" letter-spacing="-1">Bison</text>
+  <text x="198" y="176" fill="#9db4e6" font-size="23" font-weight="600" letter-spacing="3">GPU BILLING &amp; SCHEDULING</text>
+
+  <!-- headline -->
+  <text x="90" y="320" fill="#ffffff" font-size="58" font-weight="800">Kubernetes GPU 资源</text>
+  <text x="90" y="392" fill="#ffffff" font-size="58" font-weight="800">计费与多租户管理平台</text>
+
+  <text x="90" y="452" fill="#aab8d6" font-size="27" font-weight="500">Capsule 多租户 · OpenCost 实时计费 · 一条 Helm 命令部署</text>
+
+  <!-- feature chips -->
+  <g font-size="22" font-weight="600">
+    <g transform="translate(90,500)">
+      <rect width="232" height="52" rx="26" fill="#ffffff" fill-opacity="0.08" stroke="#0A84FF" stroke-opacity="0.5"/>
+      <text x="116" y="33" fill="#cfe0ff" text-anchor="middle">多租户隔离</text>
+    </g>
+    <g transform="translate(338,500)">
+      <rect width="232" height="52" rx="26" fill="#ffffff" fill-opacity="0.08" stroke="#34C759" stroke-opacity="0.5"/>
+      <text x="116" y="33" fill="#c7f3d4" text-anchor="middle">实时扣费 / 告警</text>
+    </g>
+    <g transform="translate(586,500)">
+      <rect width="232" height="52" rx="26" fill="#ffffff" fill-opacity="0.08" stroke="#BF5AF2" stroke-opacity="0.5"/>
+      <text x="116" y="33" fill="#ecd4fb" text-anchor="middle">无外部数据库</text>
+    </g>
+  </g>
+
+  <!-- bottom accent bar -->
+  <rect x="0" y="618" width="1200" height="12" fill="url(#accent)"/>
+</svg>
diff --git a/website/static/robots.txt b/website/static/robots.txt
new file mode 100644
index 0000000..44699ff
--- /dev/null
+++ b/website/static/robots.txt
@@ -0,0 +1,6 @@
+User-agent: *
+Allow: /
+
+# Sitemap
+Sitemap: https://bison.lei6393.com/sitemap.xml
+Sitemap: https://bison.lei6393.com/zh-Hans/sitemap.xml
diff --git a/website/versioned_docs/version-0.0.11/architecture.md b/website/versioned_docs/version-0.0.11/architecture.md
new file mode 100644
index 0000000..dbbe50d
--- /dev/null
+++ b/website/versioned_docs/version-0.0.11/architecture.md
@@ -0,0 +1,418 @@
+---
+sidebar_position: 5
+---
+
+# Architecture
+
+This document provides a technical overview of Bison's architecture, designed with high cohesion and low coupling principles for maintainability and scalability.
+
+## System Overview
+
+### High-Level Architecture
+
+```mermaid
+graph TB
+    subgraph PRESENT[Presentation Layer]
+        WEB[Web UI<br/>React 18 + Ant Design 5]
+        CLI[kubectl / API Client]
+    end
+
+    subgraph GATEWAY[API Gateway Layer]
+        GW[API Server<br/>Go + Gin Framework]
+        AUTH[Auth Middleware<br/>JWT + OIDC]
+    end
+
+    subgraph BUSINESS[Business Logic Layer]
+        TS[Tenant Service<br/>Team & Project CRUD]
+        BS[Billing Service<br/>Cost Calculation]
+        BLS[Balance Service<br/>Wallet Management]
+        QS[Quota Service<br/>Resource Limits]
+        AS[Alert Service<br/>Notifications]
+        RS[Report Service<br/>Analytics]
+    end
+
+    subgraph INTEGRATION[Integration Layer]
+        K8S[Kubernetes Client<br/>client-go]
+        OCC[OpenCost Client<br/>REST API]
+        PC[Prometheus Client<br/>PromQL]
+    end
+
+    subgraph EXTERNAL[External Systems]
+        KAPI[Kubernetes API]
+        CAP[Capsule Controller]
+        OC[OpenCost]
+        PROM[Prometheus]
+    end
+
+    subgraph DATA[Data Layer]
+        CM[ConfigMaps<br/>Persistent Storage]
+    end
+
+    WEB --> GW
+    CLI --> GW
+    GW --> AUTH
+    AUTH --> TS & BS & BLS & QS & AS & RS
+
+    TS --> K8S
+    BS --> OCC
+    BLS --> K8S
+    QS --> K8S
+    RS --> OCC & PC
+
+    K8S --> KAPI
+    K8S --> CAP
+    OCC --> OC
+    PC --> PROM
+
+    TS & BLS --> CM
+    KAPI --> CM
+```
+
+### Design Principles
+
+| Principle | Implementation |
+|-----------|----------------|
+| **High Cohesion** | Each service handles a single domain (billing, quota, alerts) |
+| **Low Coupling** | Services communicate via well-defined interfaces |
+| **Stateless API** | All state persisted in Kubernetes ConfigMaps |
+| **Cloud Native** | Leverages Kubernetes primitives for HA and scaling |
+| **Zero Database** | ConfigMaps eliminate external database dependencies |
+
+## Architecture Layers
+
+Bison follows a layered architecture pattern:
+
+### 1. Presentation Layer
+- **Web UI**: React 18 + TypeScript + Ant Design 5
+- **API Client**: REST API for external integrations
+
+### 2. API Gateway Layer
+- **API Server**: Go + Gin framework
+- **Authentication**: JWT and OIDC support
+- **Middleware**: Logging, recovery, CORS handling
+
+### 3. Business Logic Layer
+- **Tenant Service**: Team and project management
+- **Billing Service**: Cost calculation and aggregation
+- **Balance Service**: Wallet management and auto-deduction
+- **Quota Service**: Resource limit enforcement
+- **Alert Service**: Multi-channel notifications
+- **Report Service**: Analytics and export
+
+### 4. Integration Layer
+- **Kubernetes Client**: client-go for K8s API interaction
+- **OpenCost Client**: REST API for cost data
+- **Prometheus Client**: PromQL queries for metrics
+
+### 5. Data Layer
+- **ConfigMaps**: Persistent storage for balances, billing config, and metadata
+- **etcd**: Underlying Kubernetes datastore in which the ConfigMaps are persisted
+
+## Core Components
+
+### API Server
+
+The API server is the central component that handles all HTTP requests:
+
+**Technology Stack:**
+- Go 1.24+
+- Gin web framework
+- client-go for Kubernetes API
+
+**Key Responsibilities:**
+- Serve REST API endpoints
+- Authentication and authorization
+- Request routing and middleware
+- Background task scheduling
+
+**Endpoints:**
+```
+/api/v1/teams          - Team management
+/api/v1/projects       - Project management
+/api/v1/billing        - Billing configuration
+/api/v1/balance        - Balance operations
+/api/v1/stats          - Statistics and reports
+```
+
+### Web UI
+
+React-based single-page application:
+
+**Technology Stack:**
+- React 18
+- TypeScript
+- Vite (build tool)
+- Ant Design 5
+- ECharts (visualization)
+- React Query (state management)
+
+**Features:**
+- Dashboard with real-time metrics
+- Team and project management
+- Billing configuration
+- Balance monitoring
+- Usage reports and export
+
+### Billing Service
+
+Calculates costs based on resource usage:
+
+**Data Flow:**
+```mermaid
+sequenceDiagram
+    participant S as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant K8S as Kubernetes
+
+    S->>BS: Trigger billing (every 10min)
+    BS->>OC: Query team costs
+    OC-->>BS: Return usage data
+    BS->>BS: Calculate cost
+    BS->>BLS: Deduct from balance
+    BLS->>K8S: Update ConfigMap
+    BLS-->>BS: Confirm
+    BS->>AS: Check threshold
+    alt Balance low
+        AS->>Webhook: Send alert
+    end
+```
+
+**Billing Formula:**
+```
+Total Cost = (CPU_cores × CPU_price × hours) +
+             (Memory_GB × Memory_price × hours) +
+             (GPU_count × GPU_price × hours)
+```
+
+### Balance Service
+
+Manages team wallets and auto-deduction:
+
+**Features:**
+- Real-time balance tracking
+- Auto-deduction based on usage
+- Recharge operations
+- Transaction history
+- Auto-suspension when balance depleted
+
+**Storage:**
+```yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: bison-team-balances
+  namespace: bison-system
+data:
+  ml-team: "1523.45"
+  data-team: "890.12"
+  dev-team: "2100.00"
+```
+
+### Tenant Service
+
+Manages teams (Capsule Tenants) and projects (Namespaces):
+
+**Features:**
+- Create/delete teams
+- Assign resource quotas
+- Configure node pools (shared/exclusive)
+- Manage team metadata
+
+**Capsule Integration:**
+```yaml
+apiVersion: capsule.clastix.io/v1beta1
+kind: Tenant
+metadata:
+  name: ml-team
+spec:
+  owners:
+  - name: team-leader
+    kind: User
+  resourceQuotas:  # plural: this is the field name in the Capsule Tenant spec
+    items:
+    - hard:
+        cpu: "20"
+        memory: 64Gi
+        requests.nvidia.com/gpu: "4"  # quotas accept extended resources only with the requests. prefix
+```
+
+## Data Flow
+
+### Team Creation Flow
+
+```mermaid
+sequenceDiagram
+    participant U as Admin
+    participant API as API Server
+    participant TS as Tenant Service
+    participant K8S as Kubernetes
+    participant CAP as Capsule
+
+    U->>API: POST /api/v1/teams
+    API->>TS: CreateTeam(name, quota, balance)
+    TS->>CAP: Create Tenant
+    CAP-->>TS: Tenant created
+    TS->>K8S: Create ConfigMap (balance)
+    K8S-->>TS: ConfigMap created
+    TS-->>API: Success
+    API-->>U: 201 Created
+```
+
+### Billing Cycle Flow
+
+```mermaid
+sequenceDiagram
+    participant SCH as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant AS as Alert Service
+
+    loop Every 10 minutes
+        SCH->>BS: Trigger billing calculation
+        BS->>OC: Query costs (last 10min)
+        OC-->>BS: Return usage metrics
+        BS->>BS: Calculate total cost
+        BS->>BLS: Deduct cost from balance
+        BLS->>BLS: Update balance
+        BLS-->>BS: Balance updated
+        BS->>AS: Check balance threshold
+        alt Balance < 20%
+            AS->>AS: Send low balance alert
+        end
+        alt Balance <= 0
+            AS->>BS: Suspend team workloads
+        end
+    end
+```
+
+## Integration Points
+
+### Kubernetes Integration
+
+Bison integrates deeply with Kubernetes:
+
+- **Capsule Tenants** for multi-tenancy
+- **ResourceQuotas** for limit enforcement
+- **Namespaces** for project isolation
+- **ConfigMaps** for data persistence
+- **RBAC** for access control
+
+### OpenCost Integration
+
+Real-time cost tracking via OpenCost API:
+
+```bash
+# Query team costs
+GET /allocation/compute?window=10m&aggregate=namespace&filter=namespace:ml-team
+
+# Response
+{
+  "ml-team": {
+    "cpuCost": 0.25,
+    "memCost": 0.10,
+    "gpuCost": 4.17,
+    "totalCost": 4.52
+  }
+}
+```
+
+### Prometheus Integration
+
+Metrics collection for monitoring:
+
+- Resource utilization metrics
+- Cost metrics
+- Balance metrics
+- Alert metrics
+
+## Deployment Architecture
+
+### High Availability Setup
+
+```mermaid
+graph TB
+    subgraph K8S[Kubernetes Cluster]
+        subgraph NS1[bison-system namespace]
+            API1[API Server Pod 1]
+            API2[API Server Pod 2]
+            WEB1[Web UI Pod 1]
+            WEB2[Web UI Pod 2]
+        end
+
+        subgraph NS2[opencost-system namespace]
+            OC[OpenCost]
+        end
+
+        subgraph NS3[prometheus-system namespace]
+            PROM[Prometheus]
+        end
+
+        LB[LoadBalancer]
+    end
+
+    LB --> API1 & API2
+    LB --> WEB1 & WEB2
+    API1 & API2 --> OC
+    OC --> PROM
+```
+
+### Resource Requirements
+
+**Minimum:**
+- API Server: 200m CPU, 256Mi Memory
+- Web UI: 100m CPU, 128Mi Memory
+
+**Recommended (Production):**
+- API Server: 1000m CPU, 512Mi Memory (2 replicas)
+- Web UI: 500m CPU, 256Mi Memory (2 replicas)
+
+## Security Model
+
+### Authentication
+- JWT token-based authentication
+- OIDC/SSO integration
+- Admin user management
+
+### Authorization
+- Kubernetes RBAC integration
+- Role-based access control
+- Team-scoped permissions
+
+### Data Security
+- Data encrypted at rest when Kubernetes etcd encryption is enabled for the cluster (not enabled by default)
+- TLS for API communication
+- Secret management via Kubernetes Secrets
+
+## Technology Stack
+
+### Backend
+- **Language**: Go 1.24+
+- **Framework**: Gin
+- **Kubernetes Client**: client-go
+- **Configuration**: Viper
+- **Logging**: Logrus
+
+### Frontend
+- **Framework**: React 18
+- **Language**: TypeScript
+- **UI Library**: Ant Design 5
+- **Build Tool**: Vite
+- **State Management**: React Query
+- **Charts**: ECharts
+
+### Infrastructure
+- **Platform**: Kubernetes 1.22+
+- **Multi-Tenancy**: Capsule
+- **Cost Tracking**: OpenCost
+- **Metrics**: Prometheus
+- **Storage**: ConfigMaps (etcd)
+
+## Next Steps
+
+- [Installation Guide](installation.md) - Deploy Bison
+- [Configuration](configuration.md) - Configure billing
+- [User Guides](user-guides/admin.md) - Learn to use Bison
+- [Features](features.md) - Explore capabilities
diff --git a/website/versioned_docs/version-0.0.11/configuration.md b/website/versioned_docs/version-0.0.11/configuration.md
new file mode 100644
index 0000000..539aaa3
--- /dev/null
+++ b/website/versioned_docs/version-0.0.11/configuration.md
@@ -0,0 +1,361 @@
+---
+sidebar_position: 6
+---
+
+# Configuration
+
+This guide covers how to configure Bison for your specific environment and requirements.
+
+## Helm Chart Configuration
+
+Bison is configured primarily through Helm values. You can customize the installation by providing a `values.yaml` file or using `--set` flags.
+
+### Key Configuration Parameters
+
+| Parameter | Description | Default | Example |
+|-----------|-------------|---------|---------|
+| `auth.enabled` | Enable authentication | `false` | `true` |
+| `auth.admin.username` | Admin username | `admin` | `admin` |
+| `auth.admin.password` | Admin password | `admin` | `changeme` |
+| `apiServer.replicaCount` | API server replicas | `2` | `3` |
+| `apiServer.image.repository` | API server image | `ghcr.io/supermarioyl/bison/api-server` | - |
+| `apiServer.image.tag` | API server image tag | `0.0.1` | `latest` |
+| `webUI.replicaCount` | Web UI replicas | `2` | `3` |
+| `webUI.image.repository` | Web UI image | `ghcr.io/supermarioyl/bison/web-ui` | - |
+| `webUI.image.tag` | Web UI image tag | `0.0.1` | `latest` |
+| `opencost.url` | OpenCost API endpoint | `http://opencost.opencost-system.svc:9003` | Custom URL |
+
+### Example Custom Values
+
+Create a `custom-values.yaml` file:
+
+```yaml
+# Authentication
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: MySecurePassword123
+
+# API Server
+apiServer:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 200m
+      memory: 256Mi
+    limits:
+      cpu: 1000m
+      memory: 512Mi
+
+# Web UI
+webUI:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 100m
+      memory: 128Mi
+    limits:
+      cpu: 500m
+      memory: 256Mi
+
+# OpenCost Integration
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# Node Selection (optional)
+nodeSelector:
+  node-role.kubernetes.io/control-plane: ""
+
+# Tolerations (optional)
+tolerations:
+  - key: node-role.kubernetes.io/control-plane
+    operator: Exists
+    effect: NoSchedule
+```
+
+Install with custom values:
+
+```bash
+helm install bison bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --values custom-values.yaml
+```
+
+## Billing Configuration
+
+Billing settings are configured through the Web UI or API after installation.
+
+### Access Billing Configuration
+
+1. **Via Web UI:**
+   - Navigate to **Settings** > **Billing Configuration**
+   - Set pricing for CPU, Memory, GPU, and other resources
+   - Configure currency and billing intervals
+
+2. **Via API:**
+   ```bash
+   curl -X POST http://localhost:8080/api/v1/billing/config \
+     -H "Content-Type: application/json" \
+     -d '{
+       "enabled": true,
+       "currency": "USD",
+       "pricing": {
+         "cpu": 0.05,
+         "memory": 0.01,
+         "nvidia.com/gpu": 2.50
+       },
+       "billingInterval": "hourly"
+     }'
+   ```
+
+### Billing Parameters
+
+| Parameter | Description | Example |
+|-----------|-------------|---------|
+| `enabled` | Enable/disable billing | `true` |
+| `currency` | Currency for billing | `USD`, `CNY`, `EUR` |
+| `pricing.cpu` | CPU price per core-hour | `0.05` |
+| `pricing.memory` | Memory price per GB-hour | `0.01` |
+| `pricing["nvidia.com/gpu"]` | GPU price per GPU-hour | `2.50` |
+| `billingInterval` | Billing aggregation period | `hourly`, `daily` |
+| `lowBalanceThreshold` | Warning threshold (%) | `20` |
+| `suspendThreshold` | Auto-suspend threshold (%) | `5` |
+
+### Example Billing Configuration
+
+```json
+{
+  "enabled": true,
+  "currency": "USD",
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "nvidia.com/mig-1g.5gb": 0.50,
+    "nvidia.com/mig-2g.10gb": 1.00
+  },
+  "billingInterval": "hourly",
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## Team Configuration
+
+### Creating Teams
+
+Teams can be created through the Web UI or API:
+
+**Via Web UI:**
+1. Navigate to **Teams** page
+2. Click **Create Team**
+3. Set team name, quota, and initial balance
+
+**Via API:**
+```bash
+curl -X POST http://localhost:8080/api/v1/teams \
+  -H "Content-Type: application/json" \
+  -d '{
+    "name": "ml-team",
+    "description": "Machine Learning Team",
+    "quota": {
+      "cpu": "20",
+      "memory": "64Gi",
+      "nvidia.com/gpu": "4"
+    },
+    "balance": 1000.00
+  }'
+```
+
+### Team Quotas
+
+Team quotas define resource limits:
+
+```yaml
+quota:
+  cpu: "20"              # 20 CPU cores
+  memory: "64Gi"         # 64 GB RAM
+  nvidia.com/gpu: "4"    # 4 GPUs
+  storage: "500Gi"       # 500 GB storage
+```
+
+### Team Balance Management
+
+Set initial balance and configure auto-recharge:
+
+```json
+{
+  "balance": 1000.00,
+  "autoRecharge": {
+    "enabled": true,
+    "amount": 500.00,
+    "schedule": "monthly",
+    "threshold": 100.00
+  }
+}
+```
+
+## Alert Configuration
+
+Configure multi-channel alerts for low balance and quota warnings.
+
+### Webhook Alerts
+
+```json
+{
+  "type": "webhook",
+  "enabled": true,
+  "url": "https://your-webhook-endpoint.com/alerts",
+  "headers": {
+    "Authorization": "Bearer YOUR_TOKEN"
+  },
+  "template": {
+    "title": "Bison Alert",
+    "message": "Team {{.TeamName}} balance is {{.Balance}}"
+  }
+}
+```
+
+### DingTalk Alerts
+
+```json
+{
+  "type": "dingtalk",
+  "enabled": true,
+  "webhook": "https://oapi.dingtalk.com/robot/send?access_token=YOUR_TOKEN",
+  "secret": "YOUR_SECRET"
+}
+```
+
+### WeChat Work Alerts
+
+```json
+{
+  "type": "wechat",
+  "enabled": true,
+  "corpid": "YOUR_CORP_ID",
+  "corpsecret": "YOUR_CORP_SECRET",
+  "agentid": 1000001
+}
+```
+
+## OpenCost Integration
+
+Configure OpenCost connection:
+
+### Check OpenCost Connectivity
+
+```bash
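+# Test OpenCost API (keep the port-forward running and run curl from a second terminal)
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+curl http://localhost:9003/healthz
+
+# Test allocation API (URL is quoted so the shell does not treat `?` as a glob)
+curl "http://localhost:9003/allocation/compute?window=1d"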
+```
+
+### Update OpenCost URL
+
+If OpenCost is deployed in a different namespace or with a different service name:
+
+```bash
+helm upgrade bison bison/bison \
+  --set opencost.url=http://my-opencost.custom-namespace.svc:9003 \
+  --namespace bison-system
+```
+
+## Authentication & OIDC
+
+Enable authentication and integrate with your SSO provider:
+
+### Basic Authentication
+
+```yaml
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: SecurePassword123
+```
+
+### OIDC Integration
+
+```yaml
+auth:
+  enabled: true
+  oidc:
+    enabled: true
+    issuerURL: https://your-oidc-provider.com
+    clientID: bison-client-id
+    clientSecret: your-client-secret
+    redirectURL: https://bison.example.com/callback
+```
+
+## Environment Variables
+
+Additional configuration can be provided via environment variables:
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `KUBECONFIG` | Path to kubeconfig file | In-cluster config |
+| `OPENCOST_URL` | OpenCost API URL | `http://opencost.opencost-system.svc:9003` |
+| `AUTH_ENABLED` | Enable authentication | `false` |
+| `LOG_LEVEL` | Logging level | `info` |
+| `BILLING_INTERVAL` | Billing calculation interval | `10m` |
+
+Set environment variables in Helm values:
+
+```yaml
+apiServer:
+  env:
+    - name: LOG_LEVEL
+      value: debug
+    - name: BILLING_INTERVAL
+      value: 5m
+```
+
+## Advanced Configuration
+
+### Custom Resource Pricing
+
+Price any Kubernetes resource:
+
+```json
+{
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "amd.com/gpu": 2.00,
+    "ephemeral-storage": 0.001,
+    "custom.io/fpga": 5.00
+  }
+}
+```
+
+### Multi-Cluster Support
+
+Deploy Bison in each cluster with shared billing:
+
+```yaml
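+# Cluster A (separate values file, e.g. values-prod-us-west.yaml)
+apiServer:
+  clusterName: prod-us-west
+---
+# Cluster B (separate values file, e.g. values-prod-us-east.yaml)
+apiServer:
+  clusterName: prod-us-east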
+```
+
+## Next Steps
+
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Understand the system design
+- [Features](features.md) - Explore all capabilities
diff --git a/website/versioned_docs/version-0.0.11/features.md b/website/versioned_docs/version-0.0.11/features.md
new file mode 100644
index 0000000..8d0c438
--- /dev/null
+++ b/website/versioned_docs/version-0.0.11/features.md
@@ -0,0 +1,195 @@
+---
+sidebar_position: 2
+---
+
+# Features
+
+Bison provides a comprehensive suite of features for GPU resource management, billing, and multi-tenant isolation in Kubernetes environments.
+
+## See Bison in Action
+
+### 🎯 Real-Time Resource Dashboard
+
+![Bison Dashboard](/img/ui-dashboard.png)
+
+**What you see:**
+- **Cluster Overview** - Total teams, projects, resource pools, and quotas at a glance
+- **Resource Utilization** - Visual breakdown showing which teams are consuming resources
+- **7-Day Cost Trends** - Historical cost data to identify spending patterns
+- **Top 5 Cost Rankings** - Quickly identify heavy GPU consumers
+- **Team Budget Status** - Real-time balance monitoring with color-coded alerts
+
+**Who benefits:**
+- **Platform Administrators** get instant visibility into cluster health and usage patterns
+- **Finance Teams** can track costs in real-time without waiting for monthly reports
+- **Team Leaders** can compare their usage against other teams
+
+---
+
+### 💼 Team Management & Budget Monitoring
+
+![Team Management](/img/ui-team.png)
+
+**What you see:**
+- **Team List** with real-time status indicators:
+  - 🟢 Green balance = Healthy budget
+  - 🟡 Yellow balance = Approaching threshold
+  - 🔴 Red balance = Low balance or suspended
+- **Resource Allocation** - CPU/Memory/GPU quotas per team (e.g., "cpu 0/10" means 0 used out of 10 allocated)
+- **Project Count** - Number of namespaces/projects under each team
+- **Quick Actions** - Edit quotas, recharge balance, or delete team with one click
+
+**Who benefits:**
+- **Team Leaders** monitor their budget status and resource usage at a glance
+- **Administrators** manage multiple teams from a single unified view
+- **Finance Teams** see which teams need recharging
+
+---
+
+### 💰 Flexible Billing Configuration
+
+![Billing Configuration](/img/ui-billing.png)
+
+**What you see:**
+- **Per-Resource Pricing** - Set custom prices for CPU (per core-hour), Memory (per GB-hour), GPU (per GPU-hour)
+- **Currency Selection** - Support for CNY, USD, EUR, and other currencies
+- **Enable/Disable Toggle** - Turn billing on/off for specific resources with one click
+- **Billing Rules** - Define how resources are metered (hourly, daily, etc.)
+- **Alert Thresholds** - Configure when to send low-balance warnings
+
+**Who benefits:**
+- **Finance Teams** align cloud costs with internal chargeback policies
+- **Administrators** adjust pricing based on actual hardware costs
+- **Budget Managers** set appropriate warning thresholds to prevent overruns
+
+---
+
+## Core Capabilities
+
+### Multi-Tenant Management
+- ✅ **Capsule-Powered Isolation** - True multi-tenancy using Kubernetes-native Capsule operator
+- ✅ **OIDC Integration** - Enterprise SSO support for authentication
+- ✅ **Team-Based Access Control** - Manage users, roles, and permissions per team
+- ✅ **Shared & Exclusive Node Pools** - Flexible resource allocation strategies
+
+### Real-Time Billing
+- ✅ **Usage-Based Billing** - Accurate cost tracking based on actual resource consumption
+- ✅ **Configurable Pricing** - Set custom rates for CPU, Memory, GPU, and any Kubernetes resource
+- ✅ **Multi-Currency Support** - CNY, USD, EUR, and more
+- ✅ **Billing Rules Engine** - Define custom billing logic and aggregation periods
+
+### Dynamic Resource Quotas
+- ✅ **Per-Team Quotas** - CPU, Memory, GPU, Storage, and custom resources
+- ✅ **Namespace Quotas** - Project-level resource limits within teams
+- ✅ **Auto-Enforcement** - Kubernetes-native quota enforcement
+- ✅ **Quota Alerts** - Notifications when approaching limits
+
+### Team Balance & Wallet System
+- ✅ **Prepaid Balances** - Team wallets with real-time deduction
+- ✅ **Auto-Deduction** - Automated billing based on resource usage
+- ✅ **Balance Thresholds** - Configurable warning and suspension levels
+- ✅ **Transaction History** - Complete audit trail of all balance changes
+
+### Auto-Recharge
+- ✅ **Scheduled Top-Ups** - Weekly or monthly automatic recharges
+- ✅ **Custom Amounts** - Flexible recharge amounts per team
+- ✅ **Recharge Notifications** - Alert teams when balance is added
+
+### Balance Alerts
+- ✅ **Multi-Channel Notifications** - Webhook, DingTalk, WeChat, Email
+- ✅ **Configurable Thresholds** - Set warning levels (e.g., 20%, 10%, 5%)
+- ✅ **Auto-Suspension** - Automatically suspend workloads when balance depleted
+- ✅ **Custom Templates** - Customize alert messages
+
+### Usage Reports
+- ✅ **Team Analytics** - Per-team cost breakdowns and trends
+- ✅ **Project Analytics** - Namespace-level resource consumption
+- ✅ **Export Capabilities** - CSV, Excel, PDF reports
+- ✅ **Historical Data** - 30/60/90-day cost analysis
+
+### Audit Logging
+- ✅ **Complete Operation History** - Track all administrative actions
+- ✅ **User Attribution** - Who did what and when
+- ✅ **Resource Changes** - Track quota, balance, and configuration changes
+- ✅ **Compliance Ready** - Meet internal audit requirements
+
+---
+
+## Architecture Highlights
+
+Bison's architecture is designed for simplicity and scalability, with no external database: all state is stored in Kubernetes itself.
+
+```mermaid
+graph TB
+    subgraph USER_LAYER[User Layer]
+        UI[Web UI<br/>React + Ant Design]
+        API[REST API<br/>Go + Gin]
+    end
+
+    subgraph CORE[Core Services]
+        BS[Billing Service]
+        TS[Tenant Service]
+        QS[Quota Service]
+    end
+
+    subgraph K8S[Kubernetes Layer]
+        CA[Capsule<br/>Multi-Tenancy]
+        OC[OpenCost<br/>Cost Tracking]
+        PR[Prometheus<br/>Metrics]
+    end
+
+    subgraph DATA[Data Layer]
+        CM[ConfigMaps<br/>Zero Database]
+    end
+
+    UI --> API
+    API --> BS & TS & QS
+    BS --> OC
+    TS --> CA
+    QS --> CA
+    BS & TS --> CM
+    OC --> PR
+```
+
+### Key Architectural Benefits
+
+- **Zero External Dependencies** - All data stored in Kubernetes ConfigMaps (etcd-backed)
+- **Cloud-Native** - Built on Kubernetes primitives for maximum portability
+- **Scalable** - Stateless API server that can scale horizontally
+- **Secure** - Kubernetes RBAC integration and optional authentication
+- **Observable** - Prometheus metrics and structured logging
+- **Extensible** - Plugin architecture for custom billing rules and alerts
+
+---
+
+## Integration Points
+
+### OpenCost Integration
+Bison leverages [OpenCost](https://www.opencost.io/) for real-time cost tracking:
+- Per-pod, per-namespace, per-team cost visibility
+- GPU utilization metrics
+- Historical cost data and trends
+- Integration with Prometheus for metric collection
+
+### Capsule Integration
+Bison uses [Capsule](https://capsule.clastix.io/) for multi-tenancy:
+- Team-based tenant isolation
+- Namespace quota enforcement
+- Network and security policies
+- OIDC/SSO integration
+
+### Prometheus Integration
+Metrics collection and monitoring:
+- Resource utilization tracking
+- Custom billing metrics
+- Alert rule evaluation
+- Historical data retention
+
+---
+
+## Next Steps
+
+- [Installation Guide](installation.md) - Deploy Bison in your cluster
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Deep dive into system design
+- [Configuration](configuration.md) - Configure billing and settings
diff --git a/website/versioned_docs/version-0.0.11/installation.md b/website/versioned_docs/version-0.0.11/installation.md
new file mode 100644
index 0000000..da89191
--- /dev/null
+++ b/website/versioned_docs/version-0.0.11/installation.md
@@ -0,0 +1,316 @@
+---
+sidebar_position: 3
+---
+
+# Installation Guide
+
+This guide provides detailed instructions for installing Bison in your Kubernetes cluster.
+
+## Prerequisites
+
+Before installing Bison, ensure you have:
+
+- **Kubernetes 1.22+** - A running Kubernetes cluster
+- **kubectl** - Configured to access your cluster
+- **Helm 3.8+** - Package manager for Kubernetes (3.8.0 or newer is required for OCI chart support)
+- **Capsule Operator v0.1.0+** - For multi-tenant isolation
+- **OpenCost** - Deployed with Prometheus for cost tracking
+
+### Install Prerequisites
+
+If you haven't installed the required components:
+
+#### Install Capsule
+
+```bash
+# Using Helm
+helm repo add projectcapsule https://projectcapsule.github.io/charts
+helm install capsule projectcapsule/capsule \
+  --namespace capsule-system \
+  --create-namespace
+```
+
+#### Install OpenCost
+
+```bash
+# Using Helm
+helm repo add opencost https://opencost.github.io/opencost-helm-chart
+helm install opencost opencost/opencost \
+  --namespace opencost-system \
+  --create-namespace \
+  --set prometheus.internal.serviceName=prometheus-server \
+  --set prometheus.internal.namespaceName=prometheus-system
+```
+
+## Installation Methods
+
+Bison Helm charts are distributed via **GitHub Container Registry (GHCR)** using the modern OCI format.
+
+**Requirements:**
+- Helm >= 3.8.0 (for OCI support)
+- Kubernetes >= 1.22
+
+### Option A: From GHCR (Recommended)
+
+The simplest way to install Bison is directly from GitHub Container Registry:
+
+```bash
+# Install specific version from GHCR
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace
+
+# Or pull the chart first, then install
+helm pull oci://ghcr.io/supermarioyl/bison/bison --version 0.0.2
+helm install bison bison-0.0.2.tgz \
+  --namespace bison-system \
+  --create-namespace
+
+# Customize installation
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true \
+  --set apiServer.image.tag=0.0.2 \
+  --set webUI.image.tag=0.0.2
+```
+
+**Why GHCR OCI Format?**
+- ✅ No separate Helm repository maintenance needed
+- ✅ Unified with Docker images in GHCR
+- ✅ Faster installation (direct registry pull)
+- ✅ Modern Helm 3.8+ standard practice
+
+### Option B: From GitHub Release
+
+Download a specific version from GitHub Releases:
+
+```bash
+# Download Helm chart
+VERSION=0.0.2
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# Install the chart
+helm install bison bison-${VERSION}.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+### Option C: From Source
+
+Clone and build from source:
+
+```bash
+# Clone repository
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
+
+# Install dependencies and build
+make install-deps
+make build
+
+# Deploy using Helm
+helm install bison ./deploy/charts/bison \
+  --namespace bison-system \
+  --create-namespace
+```
+
+## Configuration Options
+
+Bison can be configured using Helm values. Here are the key configuration options:
+
+### Basic Configuration
+
+```yaml
+# values.yaml
+apiServer:
+  image:
+    repository: ghcr.io/supermarioyl/bison/api-server
+    tag: 0.0.1
+  replicas: 2
+
+webUI:
+  image:
+    repository: ghcr.io/supermarioyl/bison/web-ui
+    tag: 0.0.1
+  replicas: 2
+
+# OpenCost URL
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# Authentication
+auth:
+  enabled: false
+```
+
+### Custom Configuration Example
+
+```bash
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set apiServer.replicas=3 \
+  --set webUI.replicas=3 \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true
+```
+
+## Verify Installation
+
+After installation, verify that all components are running:
+
+```bash
+# Check pod status
+kubectl get pods -n bison-system
+
+# Expected output:
+# NAME                              READY   STATUS    RESTARTS   AGE
+# bison-api-server-xxxxxxxxx-xxxxx  1/1     Running   0          2m
+# bison-webui-xxxxxxxxx-xxxxx       1/1     Running   0          2m
+
+# Check services
+kubectl get svc -n bison-system
+
+# Check logs
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl logs -n bison-system deployment/bison-webui
+```
+
+## Access the Platform
+
+### Port Forward (Development)
+
+```bash
+# Port-forward the Web UI
+kubectl port-forward -n bison-system svc/bison-webui 3000:80
+
+# Access at http://localhost:3000
+```
+
+### Ingress (Production)
+
+For production deployments, configure an Ingress:
+
+```yaml
+# ingress.yaml
+apiVersion: networking.k8s.io/v1
+kind: Ingress
+metadata:
+  name: bison-ingress
+  namespace: bison-system
+  annotations:
+    kubernetes.io/ingress.class: nginx
+spec:
+  rules:
+  - host: bison.example.com
+    http:
+      paths:
+      - path: /
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-webui
+            port:
+              number: 80
+      - path: /api
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-api-server
+            port:
+              number: 8080
+```
+
+Apply the Ingress:
+
+```bash
+kubectl apply -f ingress.yaml
+```
+
+## Docker Images
+
+Bison images are available on GitHub Container Registry:
+
+```bash
+# Pull images
+docker pull ghcr.io/supermarioyl/bison/api-server:0.0.1
+docker pull ghcr.io/supermarioyl/bison/web-ui:0.0.1
+
+# Or use latest
+docker pull ghcr.io/supermarioyl/bison/api-server:latest
+docker pull ghcr.io/supermarioyl/bison/web-ui:latest
+```
+
+**Supported Platforms:**
+- `linux/amd64`
+- `linux/arm64`
+
+## Upgrading
+
+To upgrade Bison to a new version:
+
+```bash
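+# Update Helm repositories (only needed if you use classic Helm repos; OCI charts are pulled directly)
+helm repo update
+
+# Upgrade to latest version
+helm upgrade bison oci://ghcr.io/supermarioyl/bison/bison --namespace bison-system
+
+# Or upgrade to specific version
+helm upgrade bison oci://ghcr.io/supermarioyl/bison/bison --version 0.0.2 --namespace bison-system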
+```
+
+## Uninstalling
+
+To completely remove Bison:
+
+```bash
+# Uninstall Helm release
+helm uninstall bison --namespace bison-system
+
+# Remove namespace (optional)
+kubectl delete namespace bison-system
+```
+
+## Troubleshooting
+
+### Pod Not Starting
+
+Check pod logs for errors:
+
+```bash
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl describe pod -n bison-system <pod-name>
+```
+
+### Cannot Connect to OpenCost
+
+Verify OpenCost is running and accessible:
+
+```bash
+kubectl get svc -n opencost-system
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+
+# Test endpoint (from a second terminal, while the port-forward above is still running)
+curl http://localhost:9003/healthz
+```
+
+### Authentication Issues
+
+If authentication is enabled, ensure you have the correct credentials:
+
+```bash
+# Default credentials (change in production!)
+Username: admin
+Password: admin
+```
+
+## Next Steps
+
+- [Configuration Guide](configuration.md) - Configure billing and settings
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Understand the system design
diff --git a/website/versioned_docs/version-0.0.11/intro.md b/website/versioned_docs/version-0.0.11/intro.md
new file mode 100644
index 0000000..b3dc3aa
--- /dev/null
+++ b/website/versioned_docs/version-0.0.11/intro.md
@@ -0,0 +1,167 @@
+---
+sidebar_position: 1
+slug: /
+---
+
+# Introduction to Bison
+
+![Bison Logo](/img/logo.png)
+
+**Enterprise GPU Resource Billing & Multi-Tenant Management Platform**
+
+Bison is a Kubernetes-based platform that provides comprehensive GPU resource management, billing, and multi-tenant isolation for organizations running shared GPU clusters.
+
+## The GPU Management Challenge
+
+Managing shared GPU clusters across multiple teams creates critical operational and financial challenges:
+
+**For Platform Administrators:**
+- How do you fairly allocate expensive GPU resources across competing teams?
+- How do you prevent resource hogging while ensuring everyone gets their fair share?
+- How do you track who's using what and implement accurate chargeback?
+- How do you maintain strict multi-tenant isolation without complex manual configuration?
+
+**For Finance & Budget Teams:**
+- How do you implement automated chargeback for GPU usage without manual accounting?
+- How do you prevent budget overruns before they happen?
+- How do you generate accurate cost reports for internal billing?
+
+**For Development Teams:**
+- How do you get predictable, isolated access to GPU resources?
+- How do you know when you're approaching your budget limits?
+- How do you avoid impacting other teams' workloads?
+
+**Traditional Approach:**
+- Manual quota configuration per namespace
+- Excel-based billing calculations
+- No real-time cost visibility
+- Complex multi-tool setup (quota management + cost tracking + billing system)
+- Frequent resource conflicts and budget surprises
+
+## Bison's Integrated Solution
+
+```mermaid
+graph TB
+    subgraph WITHOUT["Without Bison"]
+        P1[❌ Manual Quota Management<br/>Per-namespace configuration]
+        P2[❌ Spreadsheet Billing<br/>Manual calculations & reports]
+        P3[❌ No Resource Isolation<br/>Teams compete for resources]
+        P4[❌ Budget Overruns<br/>No proactive alerts]
+        P5[❌ Complex Tooling<br/>Multiple systems to manage]
+    end
+
+    subgraph WITH["With Bison"]
+        S1[✅ Automated Team Quotas<br/>Capsule-powered isolation]
+        S2[✅ Real-Time Billing<br/>OpenCost integration]
+        S3[✅ True Multi-Tenancy<br/>Shared/Exclusive modes]
+        S4[✅ Proactive Alerts<br/>Balance monitoring & auto-suspend]
+        S5[✅ Unified Platform<br/>Single pane of glass]
+    end
+
+    P1 -.Transform.-> S1
+    P2 -.Transform.-> S2
+    P3 -.Transform.-> S3
+    P4 -.Transform.-> S4
+    P5 -.Transform.-> S5
+
+    style WITHOUT fill:#ffebee
+    style WITH fill:#e8f5e9
+    style S1 fill:#4caf50,color:#fff
+    style S2 fill:#4caf50,color:#fff
+    style S3 fill:#4caf50,color:#fff
+    style S4 fill:#4caf50,color:#fff
+    style S5 fill:#4caf50,color:#fff
+```
+
+**Bison combines:**
+- 🔐 **Kubernetes-native multi-tenancy** (Capsule) - True team isolation with shared or exclusive node pools
+- 💰 **Real-time cost tracking** (OpenCost + Prometheus) - Per-pod, per-namespace, per-team cost visibility
+- 💳 **Automated billing & budgets** - Prepaid balances, auto-deduction, low-balance alerts, and auto-suspension
+- 📊 **Unified dashboard** - Single interface for admins, team leaders, and finance teams
+- 🔧 **Zero external dependencies** - All data stored in Kubernetes ConfigMaps (etcd-backed)
+
+**Result:** Deploy once, get complete GPU resource management with automated billing in under 30 minutes.
+
+## Quick Start
+
+### Prerequisites
+
+- Kubernetes 1.22+
+- kubectl configured
+- Helm 3.0+
+- Capsule operator (v0.1.0+) installed
+- OpenCost deployed with Prometheus
+
+### Installation
+
+Choose one of the following installation methods:
+
+#### Option A: Using Helm Repository (Recommended)
+
+```bash
+# Add Bison Helm repository
+helm repo add bison https://supermarioyl.github.io/Bison/charts/
+helm repo update
+
+# Install with default configuration
+helm install bison bison/bison --namespace bison-system --create-namespace
+
+# Or customize installation
+helm install bison bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=false
+```
+
+#### Option B: From GitHub Release
+
+```bash
+# Download latest Helm chart
+VERSION=0.0.1
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# Install
+helm install bison bison-${VERSION}.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+#### Option C: From Source
+
+```bash
+# Clone repository
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
+
+# Install dependencies and build
+make install-deps
+make build
+
+# Deploy using Helm
+helm install bison ./deploy/charts/bison \
+  --namespace bison-system \
+  --create-namespace
+```
+
+### Access the Platform
+
+After installation, access Bison through:
+
+```bash
+# Port-forward the Web UI
+kubectl port-forward -n bison-system svc/bison-webui 3000:80
+
+# Access at http://localhost:3000
+# Default credentials (if auth enabled):
+# Username: admin
+# Password: admin (change immediately in production!)
+```
+
+## Next Steps
+
+- [Explore Features](features.md) - Learn about all capabilities
+- [Installation Guide](installation.md) - Detailed installation instructions
+- [User Guides](user-guides/admin.md) - Role-based user guides
+- [Architecture](architecture.md) - Understand the system architecture
+- [Configuration](configuration.md) - Configure billing and settings
diff --git a/website/versioned_docs/version-0.0.11/user-guides/_category_.json b/website/versioned_docs/version-0.0.11/user-guides/_category_.json
new file mode 100644
index 0000000..fe79f61
--- /dev/null
+++ b/website/versioned_docs/version-0.0.11/user-guides/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "User Guides",
+  "position": 4,
+  "link": {
+    "type": "generated-index",
+    "description": "Role-based guides for using Bison effectively."
+  }
+}
diff --git a/website/versioned_docs/version-0.0.11/user-guides/admin.md b/website/versioned_docs/version-0.0.11/user-guides/admin.md
new file mode 100644
index 0000000..a466cbb
--- /dev/null
+++ b/website/versioned_docs/version-0.0.11/user-guides/admin.md
@@ -0,0 +1,176 @@
+---
+sidebar_position: 1
+---
+
+# Administrator Guide
+
+This guide is for platform administrators who deploy, configure, and manage the Bison platform.
+
+## Responsibilities
+
+As a platform administrator, you are responsible for:
+
+- ✅ Deploying and configuring Bison
+- ✅ Creating and managing teams
+- ✅ Setting global billing configuration
+- ✅ Monitoring cluster-wide metrics
+- ✅ Responding to alerts and recharge requests
+
+## Getting Started
+
+### 1. Deploy Bison
+
+Follow the [Installation Guide](../installation.md) to deploy Bison in your Kubernetes cluster.
+
+### 2. Configure Billing
+
+Set up billing rules and pricing:
+
+1. Access the Web UI
+2. Navigate to **Settings** > **Billing Configuration**
+3. Configure:
+   - **Currency**: USD, CNY, EUR, etc.
+   - **CPU Price**: Cost per core-hour
+   - **Memory Price**: Cost per GB-hour
+   - **GPU Price**: Cost per GPU-hour
+4. Click **Save**
+
+### 3. Create First Team
+
+Create a team for your users:
+
+1. Navigate to **Teams** page
+2. Click **Create Team**
+3. Fill in:
+   - **Team Name**: e.g., "ml-team"
+   - **Description**: Team purpose
+   - **Resource Quota**:
+     - CPU: e.g., "20" cores
+     - Memory: e.g., "64Gi"
+     - GPU: e.g., "4"
+   - **Initial Balance**: e.g., 1000.00
+4. Click **Create**
+
+## Common Tasks
+
+### Managing Teams
+
+#### View All Teams
+
+```bash
+# Via kubectl
+kubectl get tenants
+
+# Via API
+curl http://localhost:8080/api/v1/teams
+```
+
+#### Update Team Quota
+
+1. Navigate to **Teams** page
+2. Click **Edit** on the team row
+3. Modify quotas
+4. Click **Save**
+
+#### Recharge Team Balance
+
+1. Navigate to **Teams** page
+2. Click **Recharge** on the team row
+3. Enter amount
+4. Add notes (optional)
+5. Click **Confirm**
+
+### Monitoring
+
+#### View Dashboard
+
+Access real-time cluster metrics:
+- Total teams and projects
+- Resource utilization
+- Cost trends
+- Top consumers
+- Balance status
+
+#### Check Alerts
+
+Monitor low-balance and quota alerts:
+1. Navigate to **Alerts** page
+2. Review active alerts
+3. Take action as needed
+
+### Billing Configuration
+
+#### Update Pricing
+
+```bash
+curl -X PUT http://localhost:8080/api/v1/billing/config \
+  -H "Content-Type: application/json" \
+  -d '{
+    "pricing": {
+      "cpu": 0.06,
+      "memory": 0.012,
+      "nvidia.com/gpu": 3.00
+    }
+  }'
+```
+
+#### Configure Alert Thresholds
+
+```json
+{
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## Best Practices
+
+### Team Naming
+- Use lowercase, alphanumeric characters and hyphens
+- Example: `ml-team`, `data-science`, `dev-team`
+
+### Quota Allocation
+- Start with conservative quotas
+- Monitor usage for 1-2 weeks
+- Adjust based on actual needs
+
+### Balance Management
+- Set up auto-recharge for critical teams
+- Monitor balance trends weekly
+- Respond to low-balance alerts promptly
+
+### Security
+- Enable authentication in production
+- Use OIDC/SSO for enterprise deployments
+- Regularly audit user permissions
+
+## Troubleshooting
+
+### Team Creation Failed
+
+Check Capsule operator logs:
+```bash
+kubectl logs -n capsule-system deployment/capsule-controller-manager
+```
+
+### Billing Not Working
+
+Verify OpenCost connectivity (the port-forward runs in the foreground, so run `curl` from a second terminal):
+```bash
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+curl http://localhost:9003/healthz
+```
+
+### High Resource Usage
+
+Check resource consumption:
+```bash
+kubectl top pods -n bison-system
+```
+
+## Next Steps
+
+- [Team Leader Guide](team-leader.md) - Guide for team leaders
+- [Developer Guide](developer.md) - Guide for developers
+- [Configuration](../configuration.md) - Advanced configuration
diff --git a/website/versioned_docs/version-0.0.11/user-guides/developer.md b/website/versioned_docs/version-0.0.11/user-guides/developer.md
new file mode 100644
index 0000000..d14ab62
--- /dev/null
+++ b/website/versioned_docs/version-0.0.11/user-guides/developer.md
@@ -0,0 +1,187 @@
+---
+sidebar_position: 3
+---
+
+# Developer Guide
+
+This guide is for developers who deploy workloads and consume resources within team projects.
+
+## Responsibilities
+
+As a developer, you are responsible for:
+
+- ✅ Deploying applications within your project
+- ✅ Monitoring resource usage
+- ✅ Staying within quota limits
+- ✅ Optimizing resource consumption
+
+## Getting Started
+
+### 1. Get Kubeconfig
+
+Request kubeconfig from your team leader or administrator.
+
+### 2. Set Context
+
+```bash
+# Set context to your project namespace
+kubectl config set-context --current --namespace=your-project
+
+# Verify
+kubectl config view --minify | grep namespace
+```
+
+### 3. Check Quota
+
+See your available resources:
+```bash
+kubectl describe quota
+```
+
+## Deploying Workloads
+
+### Basic Pod Deployment
+
+```yaml
+apiVersion: v1
+kind: Pod
+metadata:
+  name: gpu-training-job
+  namespace: your-project
+spec:
+  containers:
+  - name: trainer
+    image: your-ml-image:latest
+    resources:
+      requests:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+      limits:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+```
+
+### Using Deployments
+
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: ml-inference
+  namespace: your-project
+spec:
+  replicas: 2
+  selector:
+    matchLabels:
+      app: ml-inference
+  template:
+    metadata:
+      labels:
+        app: ml-inference
+    spec:
+      containers:
+      - name: inference
+        image: your-inference-image:latest
+        resources:
+          limits:  # GPUs must be set under limits; requests default to the same values
+            cpu: "2"
+            memory: "8Gi"
+            nvidia.com/gpu: "1"
+```
+
+## Monitoring Usage
+
+### Check Pod Resource Usage
+
+```bash
+# View resource consumption
+kubectl top pods
+
+# Detailed pod information
+kubectl describe pod <pod-name>
+```
+
+### View Logs
+
+```bash
+# Stream logs
+kubectl logs -f <pod-name>
+
+# Previous logs (if pod restarted)
+kubectl logs --previous <pod-name>
+```
+
+## Best Practices
+
+### Resource Requests and Limits
+
+Always specify both requests and limits:
+```yaml
+resources:
+  requests:
+    cpu: "2"
+    memory: "8Gi"
+  limits:
+    cpu: "4"
+    memory: "16Gi"
+```
+
+### GPU Usage
+
+- Request GPUs only when needed
+- Use GPU for compute-intensive tasks
+- Monitor GPU utilization
+
+### Clean Up
+
+Delete resources when no longer needed:
+```bash
+# Delete pod
+kubectl delete pod <pod-name>
+
+# Delete deployment
+kubectl delete deployment <deployment-name>
+
+# Clean up completed jobs
+kubectl delete job --field-selector status.successful=1
+```
+
+### Cost Optimization
+
+- Right-size your resource requests
+- Use horizontal pod autoscaling
+- Clean up idle resources
+- Share GPUs when possible (if supported)
+
+## Troubleshooting
+
+### Pod Pending (Insufficient Quota)
+
+If your pod is stuck in `Pending` state:
+
+```bash
+kubectl describe pod <pod-name>
+```
+
+Look for quota-related errors and reduce resource requests or ask your team leader for more quota.
+
+### Out of Memory (OOM)
+
+If pods are killed due to OOM:
+1. Check memory usage patterns
+2. Increase memory limits
+3. Optimize application memory usage
+
+### GPU Not Available
+
+Check how many GPUs each node reports as allocatable:
+```bash
+kubectl get nodes -o custom-columns=NAME:.metadata.name,GPU:.status.allocatable."nvidia\.com/gpu"
+```
+
+## Next Steps
+
+- [Team Leader Guide](team-leader.md) - Understand team management
+- [Architecture](../architecture.md) - Learn about the platform
diff --git a/website/versioned_docs/version-0.0.11/user-guides/team-leader.md b/website/versioned_docs/version-0.0.11/user-guides/team-leader.md
new file mode 100644
index 0000000..7b6de96
--- /dev/null
+++ b/website/versioned_docs/version-0.0.11/user-guides/team-leader.md
@@ -0,0 +1,126 @@
+---
+sidebar_position: 2
+---
+
+# Team Leader Guide
+
+This guide is for team leaders who manage projects, monitor budgets, and allocate resources within their team.
+
+## Responsibilities
+
+As a team leader, you are responsible for:
+
+- ✅ Creating and managing projects (namespaces)
+- ✅ Allocating quotas to projects
+- ✅ Monitoring team balance and consumption
+- ✅ Requesting recharges when needed
+
+## Getting Started
+
+### 1. Access Bison
+
+Log in to the Web UI with your credentials.
+
+### 2. View Team Dashboard
+
+Your dashboard shows:
+- Team balance and status
+- Resource utilization
+- Active projects
+- Cost trends
+
+## Managing Projects
+
+### Create a Project
+
+1. Navigate to **Projects** page
+2. Click **Create Project**
+3. Fill in:
+   - **Project Name**: e.g., "training-ml-models"
+   - **Description**: Project purpose
+   - **Quota** (optional):
+     - CPU: e.g., "8" cores
+     - Memory: e.g., "32Gi"
+     - GPU: e.g., "2"
+4. Click **Create**
+
+### List Projects
+
+```bash
+# Via kubectl (if you have access)
+kubectl get namespaces -l capsule.clastix.io/tenant=your-team
+
+# Via API
+curl http://localhost:8080/api/v1/teams/your-team/projects
+```
+
+### Delete a Project
+
+1. Navigate to **Projects** page
+2. Click **Delete** on the project row
+3. Confirm deletion
+
+**Warning**: This will delete all resources in the project!
+
+## Monitoring Budget
+
+### Check Balance
+
+View your current balance:
+1. Navigate to **Team** page
+2. See balance in the status card
+
+### View Usage Trends
+
+Analyze spending patterns:
+1. Navigate to **Reports** page
+2. Select time range (7 days, 30 days, 90 days)
+3. View:
+   - Cost breakdown by resource type
+   - Daily cost trends
+   - Per-project consumption
+
+### Request Recharge
+
+When balance is low:
+1. Click **Request Recharge** button
+2. Enter requested amount
+3. Add justification
+4. Submit request to administrator
+
+## Resource Management
+
+### Monitor Quota Usage
+
+Check how much of your quota is being used:
+```bash
+kubectl describe quota -n your-project
+```
+
+### Optimize Costs
+
+Tips to reduce spending:
+- **Right-size resources**: Don't over-provision CPU/Memory
+- **Clean up idle pods**: Delete unused workloads
+- **Use spot/preemptible instances**: Where applicable
+- **Monitor GPU utilization**: Ensure GPUs are fully utilized
+
+## Best Practices
+
+### Project Organization
+- Create separate projects for different workloads
+- Example: `ml-training`, `ml-inference`, `data-processing`
+
+### Quota Allocation
+- Allocate quotas based on project priority
+- Reserve buffer for urgent tasks
+
+### Cost Awareness
+- Review costs weekly
+- Identify and eliminate waste
+- Set up cost alerts
+
+## Next Steps
+
+- [Developer Guide](developer.md) - Guide for your team members
+- [Features](../features.md) - Explore all Bison features
diff --git a/website/versioned_docs/version-0.0.6/architecture.md b/website/versioned_docs/version-0.0.6/architecture.md
new file mode 100644
index 0000000..dbbe50d
--- /dev/null
+++ b/website/versioned_docs/version-0.0.6/architecture.md
@@ -0,0 +1,418 @@
+---
+sidebar_position: 5
+---
+
+# Architecture
+
+This document provides a technical overview of Bison's architecture, designed with high cohesion and low coupling principles for maintainability and scalability.
+
+## System Overview
+
+### High-Level Architecture
+
+```mermaid
+graph TB
+    subgraph PRESENT[Presentation Layer]
+        WEB[Web UI<br/>React 18 + Ant Design 5]
+        CLI[kubectl / API Client]
+    end
+
+    subgraph GATEWAY[API Gateway Layer]
+        GW[API Server<br/>Go + Gin Framework]
+        AUTH[Auth Middleware<br/>JWT + OIDC]
+    end
+
+    subgraph BUSINESS[Business Logic Layer]
+        TS[Tenant Service<br/>Team & Project CRUD]
+        BS[Billing Service<br/>Cost Calculation]
+        BLS[Balance Service<br/>Wallet Management]
+        QS[Quota Service<br/>Resource Limits]
+        AS[Alert Service<br/>Notifications]
+        RS[Report Service<br/>Analytics]
+    end
+
+    subgraph INTEGRATION[Integration Layer]
+        K8S[Kubernetes Client<br/>client-go]
+        OCC[OpenCost Client<br/>REST API]
+        PC[Prometheus Client<br/>PromQL]
+    end
+
+    subgraph EXTERNAL[External Systems]
+        KAPI[Kubernetes API]
+        CAP[Capsule Controller]
+        OC[OpenCost]
+        PROM[Prometheus]
+    end
+
+    subgraph DATA[Data Layer]
+        CM[ConfigMaps<br/>Persistent Storage]
+    end
+
+    WEB --> GW
+    CLI --> GW
+    GW --> AUTH
+    AUTH --> TS & BS & BLS & QS & AS & RS
+
+    TS --> K8S
+    BS --> OCC
+    BLS --> K8S
+    QS --> K8S
+    RS --> OCC & PC
+
+    K8S --> KAPI
+    K8S --> CAP
+    OCC --> OC
+    PC --> PROM
+
+    TS & BLS --> CM
+    KAPI --> CM
+```
+
+### Design Principles
+
+| Principle | Implementation |
+|-----------|----------------|
+| **High Cohesion** | Each service handles a single domain (billing, quota, alerts) |
+| **Low Coupling** | Services communicate via well-defined interfaces |
+| **Stateless API** | All state persisted in Kubernetes ConfigMaps |
+| **Cloud Native** | Leverages Kubernetes primitives for HA and scaling |
+| **Zero Database** | ConfigMaps eliminate external database dependencies |
+
+## Architecture Layers
+
+Bison follows a layered architecture pattern:
+
+### 1. Presentation Layer
+- **Web UI**: React 18 + TypeScript + Ant Design 5
+- **API Client**: REST API for external integrations
+
+### 2. API Gateway Layer
+- **API Server**: Go + Gin framework
+- **Authentication**: JWT and OIDC support
+- **Middleware**: Logging, recovery, CORS handling
+
+### 3. Business Logic Layer
+- **Tenant Service**: Team and project management
+- **Billing Service**: Cost calculation and aggregation
+- **Balance Service**: Wallet management and auto-deduction
+- **Quota Service**: Resource limit enforcement
+- **Alert Service**: Multi-channel notifications
+- **Report Service**: Analytics and export
+
+### 4. Integration Layer
+- **Kubernetes Client**: client-go for K8s API interaction
+- **OpenCost Client**: REST API for cost data
+- **Prometheus Client**: PromQL queries for metrics
+
+### 5. Data Layer
+- **ConfigMaps**: Persistent storage for balances, billing config, and metadata
+- **etcd**: The cluster's backing store, where Kubernetes persists the ConfigMaps
+
+## Core Components
+
+### API Server
+
+The API server is the central component that handles all HTTP requests:
+
+**Technology Stack:**
+- Go 1.24+
+- Gin web framework
+- client-go for Kubernetes API
+
+**Key Responsibilities:**
+- Serve REST API endpoints
+- Authentication and authorization
+- Request routing and middleware
+- Background task scheduling
+
+**Endpoints:**
+```
+/api/v1/teams          - Team management
+/api/v1/projects       - Project management
+/api/v1/billing        - Billing configuration
+/api/v1/balance        - Balance operations
+/api/v1/stats          - Statistics and reports
+```
+
+### Web UI
+
+React-based single-page application:
+
+**Technology Stack:**
+- React 18
+- TypeScript
+- Vite (build tool)
+- Ant Design 5
+- ECharts (visualization)
+- React Query (state management)
+
+**Features:**
+- Dashboard with real-time metrics
+- Team and project management
+- Billing configuration
+- Balance monitoring
+- Usage reports and export
+
+### Billing Service
+
+Calculates costs based on resource usage:
+
+**Data Flow:**
+```mermaid
+sequenceDiagram
+    participant S as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant K8S as Kubernetes
+
+    S->>BS: Trigger billing (every 10min)
+    BS->>OC: Query team costs
+    OC-->>BS: Return usage data
+    BS->>BS: Calculate cost
+    BS->>BLS: Deduct from balance
+    BLS->>K8S: Update ConfigMap
+    BLS-->>BS: Confirm
+    BS->>AS: Check threshold
+    alt Balance low
+        AS->>Webhook: Send alert
+    end
+```
+
+**Billing Formula:**
+```
+Total Cost = (CPU_cores × CPU_price × hours) +
+             (Memory_GB × Memory_price × hours) +
+             (GPU_count × GPU_price × hours)
+```
+
+### Balance Service
+
+Manages team wallets and auto-deduction:
+
+**Features:**
+- Real-time balance tracking
+- Auto-deduction based on usage
+- Recharge operations
+- Transaction history
+- Auto-suspension when balance depleted
+
+**Storage:**
+```yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: bison-team-balances
+  namespace: bison-system
+data:
+  ml-team: "1523.45"
+  data-team: "890.12"
+  dev-team: "2100.00"
+```
+
+### Tenant Service
+
+Manages teams (Capsule Tenants) and projects (Namespaces):
+
+**Features:**
+- Create/delete teams
+- Assign resource quotas
+- Configure node pools (shared/exclusive)
+- Manage team metadata
+
+**Capsule Integration:**
+```yaml
+apiVersion: capsule.clastix.io/v1beta1
+kind: Tenant
+metadata:
+  name: ml-team
+spec:
+  owners:
+  - name: team-leader
+    kind: User
+  resourceQuota:
+    items:
+    - hard:
+        cpu: "20"
+        memory: 64Gi
+        nvidia.com/gpu: "4"
+```
+
+## Data Flow
+
+### Team Creation Flow
+
+```mermaid
+sequenceDiagram
+    participant U as Admin
+    participant API as API Server
+    participant TS as Tenant Service
+    participant K8S as Kubernetes
+    participant CAP as Capsule
+
+    U->>API: POST /api/v1/teams
+    API->>TS: CreateTeam(name, quota, balance)
+    TS->>CAP: Create Tenant
+    CAP-->>TS: Tenant created
+    TS->>K8S: Create ConfigMap (balance)
+    K8S-->>TS: ConfigMap created
+    TS-->>API: Success
+    API-->>U: 201 Created
+```
+
+### Billing Cycle Flow
+
+```mermaid
+sequenceDiagram
+    participant SCH as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant AS as Alert Service
+
+    loop Every 10 minutes
+        SCH->>BS: Trigger billing calculation
+        BS->>OC: Query costs (last 10min)
+        OC-->>BS: Return usage metrics
+        BS->>BS: Calculate total cost
+        BS->>BLS: Deduct cost from balance
+        BLS->>BLS: Update balance
+        BLS-->>BS: Balance updated
+        BS->>AS: Check balance threshold
+        alt Balance < 20%
+            AS->>AS: Send low balance alert
+        end
+        alt Balance <= 0
+            AS->>BS: Suspend team workloads
+        end
+    end
+```
+
+## Integration Points
+
+### Kubernetes Integration
+
+Bison integrates deeply with Kubernetes:
+
+- **Capsule Tenants** for multi-tenancy
+- **ResourceQuotas** for limit enforcement
+- **Namespaces** for project isolation
+- **ConfigMaps** for data persistence
+- **RBAC** for access control
+
+### OpenCost Integration
+
+Real-time cost tracking via OpenCost API:
+
+```bash
+# Query team costs
+GET /allocation/compute?window=10m&aggregate=namespace&filter=namespace:ml-team
+
+# Response
+{
+  "ml-team": {
+    "cpuCost": 0.25,
+    "memCost": 0.10,
+    "gpuCost": 4.17,
+    "totalCost": 4.52
+  }
+}
+```
+
+### Prometheus Integration
+
+Metrics collection for monitoring:
+
+- Resource utilization metrics
+- Cost metrics
+- Balance metrics
+- Alert metrics
+
+## Deployment Architecture
+
+### High Availability Setup
+
+```mermaid
+graph TB
+    subgraph K8S[Kubernetes Cluster]
+        subgraph NS1[bison-system namespace]
+            API1[API Server Pod 1]
+            API2[API Server Pod 2]
+            WEB1[Web UI Pod 1]
+            WEB2[Web UI Pod 2]
+        end
+
+        subgraph NS2[opencost-system namespace]
+            OC[OpenCost]
+        end
+
+        subgraph NS3[prometheus-system namespace]
+            PROM[Prometheus]
+        end
+
+        LB[LoadBalancer]
+    end
+
+    LB --> API1 & API2
+    LB --> WEB1 & WEB2
+    API1 & API2 --> OC
+    OC --> PROM
+```
+
+### Resource Requirements
+
+**Minimum:**
+- API Server: 200m CPU, 256Mi Memory
+- Web UI: 100m CPU, 128Mi Memory
+
+**Recommended (Production):**
+- API Server: 1000m CPU, 512Mi Memory (2 replicas)
+- Web UI: 500m CPU, 256Mi Memory (2 replicas)
+
+## Security Model
+
+### Authentication
+- JWT token-based authentication
+- OIDC/SSO integration
+- Admin user management
+
+### Authorization
+- Kubernetes RBAC integration
+- Role-based access control
+- Team-scoped permissions
+
+### Data Security
+- Data encrypted at rest when Kubernetes encryption at rest is configured for the cluster (etcd encryption)
+- TLS for API communication
+- Secret management via Kubernetes Secrets
+
+## Technology Stack
+
+### Backend
+- **Language**: Go 1.24+
+- **Framework**: Gin
+- **Kubernetes Client**: client-go
+- **Configuration**: Viper
+- **Logging**: Logrus
+
+### Frontend
+- **Framework**: React 18
+- **Language**: TypeScript
+- **UI Library**: Ant Design 5
+- **Build Tool**: Vite
+- **State Management**: React Query
+- **Charts**: ECharts
+
+### Infrastructure
+- **Platform**: Kubernetes 1.22+
+- **Multi-Tenancy**: Capsule
+- **Cost Tracking**: OpenCost
+- **Metrics**: Prometheus
+- **Storage**: ConfigMaps (etcd)
+
+## Next Steps
+
+- [Installation Guide](installation.md) - Deploy Bison
+- [Configuration](configuration.md) - Configure billing
+- [User Guides](user-guides/admin.md) - Learn to use Bison
+- [Features](features.md) - Explore capabilities
diff --git a/website/versioned_docs/version-0.0.6/configuration.md b/website/versioned_docs/version-0.0.6/configuration.md
new file mode 100644
index 0000000..539aaa3
--- /dev/null
+++ b/website/versioned_docs/version-0.0.6/configuration.md
@@ -0,0 +1,361 @@
+---
+sidebar_position: 6
+---
+
+# Configuration
+
+This guide covers how to configure Bison for your specific environment and requirements.
+
+## Helm Chart Configuration
+
+Bison is configured primarily through Helm values. You can customize the installation by providing a `values.yaml` file or using `--set` flags.
+
+### Key Configuration Parameters
+
+| Parameter | Description | Default | Example |
+|-----------|-------------|---------|---------|
+| `auth.enabled` | Enable authentication | `false` | `true` |
+| `auth.admin.username` | Admin username | `admin` | `admin` |
+| `auth.admin.password` | Admin password | `admin` | `changeme` |
+| `apiServer.replicaCount` | API server replicas | `2` | `3` |
+| `apiServer.image.repository` | API server image | `ghcr.io/supermarioyl/bison/api-server` | - |
+| `apiServer.image.tag` | API server image tag | `0.0.1` | `latest` |
+| `webUI.replicaCount` | Web UI replicas | `2` | `3` |
+| `webUI.image.repository` | Web UI image | `ghcr.io/supermarioyl/bison/web-ui` | - |
+| `webUI.image.tag` | Web UI image tag | `0.0.1` | `latest` |
+| `opencost.url` | OpenCost API endpoint | `http://opencost.opencost-system.svc:9003` | Custom URL |
+
+### Example Custom Values
+
+Create a `custom-values.yaml` file:
+
+```yaml
+# Authentication
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: MySecurePassword123
+
+# API Server
+apiServer:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 200m
+      memory: 256Mi
+    limits:
+      cpu: 1000m
+      memory: 512Mi
+
+# Web UI
+webUI:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 100m
+      memory: 128Mi
+    limits:
+      cpu: 500m
+      memory: 256Mi
+
+# OpenCost Integration
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# Node Selection (optional)
+nodeSelector:
+  node-role.kubernetes.io/control-plane: ""
+
+# Tolerations (optional)
+tolerations:
+  - key: node-role.kubernetes.io/control-plane
+    operator: Exists
+    effect: NoSchedule
+```
+
+Install with custom values:
+
+```bash
+helm install bison bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --values custom-values.yaml
+```
+
+## Billing Configuration
+
+Billing settings are configured through the Web UI or API after installation.
+
+### Access Billing Configuration
+
+1. **Via Web UI:**
+   - Navigate to **Settings** > **Billing Configuration**
+   - Set pricing for CPU, Memory, GPU, and other resources
+   - Configure currency and billing intervals
+
+2. **Via API:**
+   ```bash
+   curl -X POST http://localhost:8080/api/v1/billing/config \
+     -H "Content-Type: application/json" \
+     -d '{
+       "enabled": true,
+       "currency": "USD",
+       "pricing": {
+         "cpu": 0.05,
+         "memory": 0.01,
+         "nvidia.com/gpu": 2.50
+       },
+       "billingInterval": "hourly"
+     }'
+   ```
+
+### Billing Parameters
+
+| Parameter | Description | Example |
+|-----------|-------------|---------|
+| `enabled` | Enable/disable billing | `true` |
+| `currency` | Currency for billing | `USD`, `CNY`, `EUR` |
+| `pricing.cpu` | CPU price per core-hour | `0.05` |
+| `pricing.memory` | Memory price per GB-hour | `0.01` |
+| `pricing["nvidia.com/gpu"]` | GPU price per GPU-hour | `2.50` |
+| `billingInterval` | Billing aggregation period | `hourly`, `daily` |
+| `lowBalanceThreshold` | Warning threshold (%) | `20` |
+| `suspendThreshold` | Auto-suspend threshold (%) | `5` |
+
+### Example Billing Configuration
+
+```json
+{
+  "enabled": true,
+  "currency": "USD",
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "nvidia.com/mig-1g.5gb": 0.50,
+    "nvidia.com/mig-2g.10gb": 1.00
+  },
+  "billingInterval": "hourly",
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## Team Configuration
+
+### Creating Teams
+
+Teams can be created through the Web UI or API:
+
+**Via Web UI:**
+1. Navigate to **Teams** page
+2. Click **Create Team**
+3. Set team name, quota, and initial balance
+
+**Via API:**
+```bash
+curl -X POST http://localhost:8080/api/v1/teams \
+  -H "Content-Type: application/json" \
+  -d '{
+    "name": "ml-team",
+    "description": "Machine Learning Team",
+    "quota": {
+      "cpu": "20",
+      "memory": "64Gi",
+      "nvidia.com/gpu": "4"
+    },
+    "balance": 1000.00
+  }'
+```
+
+### Team Quotas
+
+Team quotas define resource limits:
+
+```yaml
+quota:
+  cpu: "20"              # 20 CPU cores
+  memory: "64Gi"         # 64 GB RAM
+  nvidia.com/gpu: "4"    # 4 GPUs
+  storage: "500Gi"       # 500 GB storage
+```
+
+### Team Balance Management
+
+Set initial balance and configure auto-recharge:
+
+```json
+{
+  "balance": 1000.00,
+  "autoRecharge": {
+    "enabled": true,
+    "amount": 500.00,
+    "schedule": "monthly",
+    "threshold": 100.00
+  }
+}
+```
+
+## Alert Configuration
+
+Configure multi-channel alerts for low balance and quota warnings.
+
+### Webhook Alerts
+
+```json
+{
+  "type": "webhook",
+  "enabled": true,
+  "url": "https://your-webhook-endpoint.com/alerts",
+  "headers": {
+    "Authorization": "Bearer YOUR_TOKEN"
+  },
+  "template": {
+    "title": "Bison Alert",
+    "message": "Team {{.TeamName}} balance is {{.Balance}}"
+  }
+}
+```
+
+### DingTalk Alerts
+
+```json
+{
+  "type": "dingtalk",
+  "enabled": true,
+  "webhook": "https://oapi.dingtalk.com/robot/send?access_token=YOUR_TOKEN",
+  "secret": "YOUR_SECRET"
+}
+```
+
+### WeChat Work Alerts
+
+```json
+{
+  "type": "wechat",
+  "enabled": true,
+  "corpid": "YOUR_CORP_ID",
+  "corpsecret": "YOUR_CORP_SECRET",
+  "agentid": 1000001
+}
+```
+
+## OpenCost Integration
+
+Configure OpenCost connection:
+
+### Check OpenCost Connectivity
+
+```bash
+# Test OpenCost API (port-forward blocks; run the curl commands in a second terminal)
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+curl http://localhost:9003/healthz
+
+# Test allocation API
+curl "http://localhost:9003/allocation/compute?window=1d"
+```
+
+### Update OpenCost URL
+
+If OpenCost is deployed in a different namespace or with a different service name:
+
+```bash
+helm upgrade bison bison/bison \
+  --set opencost.url=http://my-opencost.custom-namespace.svc:9003 \
+  --namespace bison-system
+```
+
+## Authentication & OIDC
+
+Enable authentication and integrate with your SSO provider:
+
+### Basic Authentication
+
+```yaml
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: SecurePassword123
+```
+
+### OIDC Integration
+
+```yaml
+auth:
+  enabled: true
+  oidc:
+    enabled: true
+    issuerURL: https://your-oidc-provider.com
+    clientID: bison-client-id
+    clientSecret: your-client-secret
+    redirectURL: https://bison.example.com/callback
+```
+
+## Environment Variables
+
+Additional configuration can be provided via environment variables:
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `KUBECONFIG` | Path to kubeconfig file | In-cluster config |
+| `OPENCOST_URL` | OpenCost API URL | `http://opencost.opencost-system.svc:9003` |
+| `AUTH_ENABLED` | Enable authentication | `false` |
+| `LOG_LEVEL` | Logging level | `info` |
+| `BILLING_INTERVAL` | Billing calculation interval | `10m` |
+
+Set environment variables in Helm values:
+
+```yaml
+apiServer:
+  env:
+    - name: LOG_LEVEL
+      value: debug
+    - name: BILLING_INTERVAL
+      value: 5m
+```
+
+## Advanced Configuration
+
+### Custom Resource Pricing
+
+Price any Kubernetes resource:
+
+```json
+{
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "amd.com/gpu": 2.00,
+    "ephemeral-storage": 0.001,
+    "custom.io/fpga": 5.00
+  }
+}
+```
+
+### Multi-Cluster Support
+
+Deploy Bison in each cluster with shared billing:
+
+```yaml
+# Cluster A (values file for the first cluster)
+apiServer:
+  clusterName: prod-us-west
+
+# Cluster B (separate values file for the second cluster)
+apiServer:
+  clusterName: prod-us-east
+```
+
+## Next Steps
+
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Understand the system design
+- [Features](features.md) - Explore all capabilities
diff --git a/website/versioned_docs/version-0.0.6/features.md b/website/versioned_docs/version-0.0.6/features.md
new file mode 100644
index 0000000..8d0c438
--- /dev/null
+++ b/website/versioned_docs/version-0.0.6/features.md
@@ -0,0 +1,195 @@
+---
+sidebar_position: 2
+---
+
+# Features
+
+Bison provides a comprehensive suite of features for GPU resource management, billing, and multi-tenant isolation in Kubernetes environments.
+
+## See Bison in Action
+
+### 🎯 Real-Time Resource Dashboard
+
+![Bison Dashboard](/img/ui-dashboard.png)
+
+**What you see:**
+- **Cluster Overview** - Total teams, projects, resource pools, and quotas at a glance
+- **Resource Utilization** - Visual breakdown showing which teams are consuming resources
+- **7-Day Cost Trends** - Historical cost data to identify spending patterns
+- **Top 5 Cost Rankings** - Quickly identify heavy GPU consumers
+- **Team Budget Status** - Real-time balance monitoring with color-coded alerts
+
+**Who benefits:**
+- **Platform Administrators** get instant visibility into cluster health and usage patterns
+- **Finance Teams** can track costs in real-time without waiting for monthly reports
+- **Team Leaders** can compare their usage against other teams
+
+---
+
+### 💼 Team Management & Budget Monitoring
+
+![Team Management](/img/ui-team.png)
+
+**What you see:**
+- **Team List** with real-time status indicators:
+  - 🟢 Green balance = Healthy budget
+  - 🟡 Yellow balance = Approaching threshold
+  - 🔴 Red balance = Low balance or suspended
+- **Resource Allocation** - CPU/Memory/GPU quotas per team (e.g., "cpu 0/10" means 0 used out of 10 allocated)
+- **Project Count** - Number of namespaces/projects under each team
+- **Quick Actions** - Edit quotas, recharge balance, or delete team with one click
+
+**Who benefits:**
+- **Team Leaders** monitor their budget status and resource usage at a glance
+- **Administrators** manage multiple teams from a single unified view
+- **Finance Teams** see which teams need recharging
+
+---
+
+### 💰 Flexible Billing Configuration
+
+![Billing Configuration](/img/ui-billing.png)
+
+**What you see:**
+- **Per-Resource Pricing** - Set custom prices for CPU (per core-hour), Memory (per GB-hour), GPU (per GPU-hour)
+- **Currency Selection** - Support for CNY, USD, EUR, and other currencies
+- **Enable/Disable Toggle** - Turn billing on/off for specific resources with one click
+- **Billing Rules** - Define how resources are metered (hourly, daily, etc.)
+- **Alert Thresholds** - Configure when to send low-balance warnings
+
+**Who benefits:**
+- **Finance Teams** align cloud costs with internal chargeback policies
+- **Administrators** adjust pricing based on actual hardware costs
+- **Budget Managers** set appropriate warning thresholds to prevent overruns
+
+---
+
+## Core Capabilities
+
+### Multi-Tenant Management
+✅ **Capsule-Powered Isolation** - True multi-tenancy using Kubernetes-native Capsule operator
+✅ **OIDC Integration** - Enterprise SSO support for authentication
+✅ **Team-Based Access Control** - Manage users, roles, and permissions per team
+✅ **Shared & Exclusive Node Pools** - Flexible resource allocation strategies
+
+### Real-Time Billing
+✅ **Usage-Based Billing** - Accurate cost tracking based on actual resource consumption
+✅ **Configurable Pricing** - Set custom rates for CPU, Memory, GPU, and any Kubernetes resource
+✅ **Multi-Currency Support** - CNY, USD, EUR, and more
+✅ **Billing Rules Engine** - Define custom billing logic and aggregation periods
+
+### Dynamic Resource Quotas
+✅ **Per-Team Quotas** - CPU, Memory, GPU, Storage, and custom resources
+✅ **Namespace Quotas** - Project-level resource limits within teams
+✅ **Auto-Enforcement** - Kubernetes-native quota enforcement
+✅ **Quota Alerts** - Notifications when approaching limits
+
+### Team Balance & Wallet System
+✅ **Prepaid Balances** - Team wallets with real-time deduction
+✅ **Auto-Deduction** - Automated billing based on resource usage
+✅ **Balance Thresholds** - Configurable warning and suspension levels
+✅ **Transaction History** - Complete audit trail of all balance changes
+
+### Auto-Recharge
+✅ **Scheduled Top-Ups** - Weekly or monthly automatic recharges
+✅ **Custom Amounts** - Flexible recharge amounts per team
+✅ **Recharge Notifications** - Alert teams when balance is added
+
+### Balance Alerts
+✅ **Multi-Channel Notifications** - Webhook, DingTalk, WeChat, Email
+✅ **Configurable Thresholds** - Set warning levels (e.g., 20%, 10%, 5%)
+✅ **Auto-Suspension** - Automatically suspend workloads when balance depleted
+✅ **Custom Templates** - Customize alert messages
+
+### Usage Reports
+✅ **Team Analytics** - Per-team cost breakdowns and trends
+✅ **Project Analytics** - Namespace-level resource consumption
+✅ **Export Capabilities** - CSV, Excel, PDF reports
+✅ **Historical Data** - 30/60/90-day cost analysis
+
+### Audit Logging
+✅ **Complete Operation History** - Track all administrative actions
+✅ **User Attribution** - Who did what and when
+✅ **Resource Changes** - Track quota, balance, and configuration changes
+✅ **Compliance Ready** - Meet internal audit requirements
+
+---
+
+## Architecture Highlights
+
+Bison's architecture is designed for simplicity and scalability, and it requires no external database.
+
+```mermaid
+graph TB
+    subgraph USER_LAYER[User Layer]
+        UI[Web UI<br/>React + Ant Design]
+        API[REST API<br/>Go + Gin]
+    end
+
+    subgraph CORE[Core Services]
+        BS[Billing Service]
+        TS[Tenant Service]
+        QS[Quota Service]
+    end
+
+    subgraph K8S[Kubernetes Layer]
+        CA[Capsule<br/>Multi-Tenancy]
+        OC[OpenCost<br/>Cost Tracking]
+        PR[Prometheus<br/>Metrics]
+    end
+
+    subgraph DATA[Data Layer]
+        CM[ConfigMaps<br/>Zero Database]
+    end
+
+    UI --> API
+    API --> BS & TS & QS
+    BS --> OC
+    TS --> CA
+    QS --> CA
+    BS & TS --> CM
+    OC --> PR
+```
+
+### Key Architectural Benefits
+
+- **No External Database** - All data stored in Kubernetes ConfigMaps (etcd-backed)
+- **Cloud-Native** - Built on Kubernetes primitives for maximum portability
+- **Scalable** - Stateless API server that can scale horizontally
+- **Secure** - Kubernetes RBAC integration and optional authentication
+- **Observable** - Prometheus metrics and structured logging
+- **Extensible** - Plugin architecture for custom billing rules and alerts
+
+---
+
+## Integration Points
+
+### OpenCost Integration
+Bison leverages [OpenCost](https://www.opencost.io/) for real-time cost tracking:
+- Per-pod, per-namespace, per-team cost visibility
+- GPU utilization metrics
+- Historical cost data and trends
+- Integration with Prometheus for metric collection
+
+### Capsule Integration
+Bison uses [Capsule](https://capsule.clastix.io/) for multi-tenancy:
+- Team-based tenant isolation
+- Namespace quota enforcement
+- Network and security policies
+- OIDC/SSO integration
+
+### Prometheus Integration
+Metrics collection and monitoring:
+- Resource utilization tracking
+- Custom billing metrics
+- Alert rule evaluation
+- Historical data retention
+
+---
+
+## Next Steps
+
+- [Installation Guide](installation.md) - Deploy Bison in your cluster
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Deep dive into system design
+- [Configuration](configuration.md) - Configure billing and settings
diff --git a/website/versioned_docs/version-0.0.6/installation.md b/website/versioned_docs/version-0.0.6/installation.md
new file mode 100644
index 0000000..da89191
--- /dev/null
+++ b/website/versioned_docs/version-0.0.6/installation.md
@@ -0,0 +1,316 @@
+---
+sidebar_position: 3
+---
+
+# Installation Guide
+
+This guide provides detailed instructions for installing Bison in your Kubernetes cluster.
+
+## Prerequisites
+
+Before installing Bison, ensure you have:
+
+- **Kubernetes 1.22+** - A running Kubernetes cluster
+- **kubectl** - Configured to access your cluster
+- **Helm 3.8+** - Package manager for Kubernetes (3.8 or newer is required for OCI chart support)
+- **Capsule Operator v0.1.0+** - For multi-tenant isolation
+- **OpenCost** - Deployed with Prometheus for cost tracking
+
+### Install Prerequisites
+
+If you haven't installed the required components:
+
+#### Install Capsule
+
+```bash
+# Using Helm
+helm repo add projectcapsule https://projectcapsule.github.io/charts
+helm install capsule projectcapsule/capsule \
+  --namespace capsule-system \
+  --create-namespace
+```
+
+#### Install OpenCost
+
+```bash
+# Using Helm
+helm repo add opencost https://opencost.github.io/opencost-helm-chart
+helm install opencost opencost/opencost \
+  --namespace opencost-system \
+  --create-namespace \
+  --set prometheus.internal.serviceName=prometheus-server \
+  --set prometheus.internal.namespaceName=prometheus-system
+```
+
+## Installation Methods
+
+Bison Helm charts are distributed via **GitHub Container Registry (GHCR)** using the modern OCI format.
+
+**Requirements:**
+- Helm >= 3.8.0 (for OCI support)
+- Kubernetes >= 1.22
+
+### Option A: From GHCR (Recommended)
+
+The simplest way to install Bison is directly from GitHub Container Registry:
+
+```bash
+# Install specific version from GHCR
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace
+
+# Or pull the chart first, then install
+helm pull oci://ghcr.io/supermarioyl/bison/bison --version 0.0.2
+helm install bison bison-0.0.2.tgz \
+  --namespace bison-system \
+  --create-namespace
+
+# Customize installation
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true \
+  --set apiServer.image.tag=0.0.2 \
+  --set webUI.image.tag=0.0.2
+```
+
+**Why GHCR OCI Format?**
+- ✅ No separate Helm repository maintenance needed
+- ✅ Unified with Docker images in GHCR
+- ✅ Faster installation (direct registry pull)
+- ✅ Modern Helm 3.8+ standard practice
+
+### Option B: From GitHub Release
+
+Download a specific version from GitHub Releases:
+
+```bash
+# Download Helm chart
+VERSION=0.0.2
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# Install the chart
+helm install bison bison-${VERSION}.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+### Option C: From Source
+
+Clone and build from source:
+
+```bash
+# Clone repository
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
+
+# Install dependencies and build
+make install-deps
+make build
+
+# Deploy using Helm
+helm install bison ./deploy/charts/bison \
+  --namespace bison-system \
+  --create-namespace
+```
+
+## Configuration Options
+
+Bison can be configured using Helm values. Here are the key configuration options:
+
+### Basic Configuration
+
+```yaml
+# values.yaml
+apiServer:
+  image:
+    repository: ghcr.io/supermarioyl/bison/api-server
+    tag: 0.0.1
+  replicas: 2
+
+webUI:
+  image:
+    repository: ghcr.io/supermarioyl/bison/web-ui
+    tag: 0.0.1
+  replicas: 2
+
+# OpenCost URL
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# Authentication
+auth:
+  enabled: false
+```
+
+### Custom Configuration Example
+
+```bash
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set apiServer.replicas=3 \
+  --set webUI.replicas=3 \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true
+```
+
+## Verify Installation
+
+After installation, verify that all components are running:
+
+```bash
+# Check pod status
+kubectl get pods -n bison-system
+
+# Expected output:
+# NAME                              READY   STATUS    RESTARTS   AGE
+# bison-api-server-xxxxxxxxx-xxxxx  1/1     Running   0          2m
+# bison-webui-xxxxxxxxx-xxxxx       1/1     Running   0          2m
+
+# Check services
+kubectl get svc -n bison-system
+
+# Check logs
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl logs -n bison-system deployment/bison-webui
+```
+
+## Access the Platform
+
+### Port Forward (Development)
+
+```bash
+# Port-forward the Web UI
+kubectl port-forward -n bison-system svc/bison-webui 3000:80
+
+# Access at http://localhost:3000
+```
+
+### Ingress (Production)
+
+For production deployments, configure an Ingress:
+
+```yaml
+# ingress.yaml
+apiVersion: networking.k8s.io/v1
+kind: Ingress
+metadata:
+  name: bison-ingress
+  namespace: bison-system
+spec:
+  ingressClassName: nginx
+  rules:
+  - host: bison.example.com
+    http:
+      paths:
+      - path: /
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-webui
+            port:
+              number: 80
+      - path: /api
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-api-server
+            port:
+              number: 8080
+```
+
+Apply the Ingress:
+
+```bash
+kubectl apply -f ingress.yaml
+```
+
+## Docker Images
+
+Bison images are available on GitHub Container Registry:
+
+```bash
+# Pull images
+docker pull ghcr.io/supermarioyl/bison/api-server:0.0.1
+docker pull ghcr.io/supermarioyl/bison/web-ui:0.0.1
+
+# Or use latest
+docker pull ghcr.io/supermarioyl/bison/api-server:latest
+docker pull ghcr.io/supermarioyl/bison/web-ui:latest
+```
+
+**Supported Platforms:**
+- `linux/amd64`
+- `linux/arm64`
+
+## Upgrading
+
+To upgrade Bison to a new version:
+
+```bash
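+# If you installed from GHCR (OCI), upgrade directly from the registry
+helm upgrade bison oci://ghcr.io/supermarioyl/bison/bison --version 0.0.2 --namespace bison-system
+
+# If you installed from a Helm repository added as "bison", refresh it first
+helm repo update
+
+# Upgrade to latest version
+helm upgrade bison bison/bison --namespace bison-system
+
+# Or upgrade to specific version
+helm upgrade bison bison/bison --version 0.0.2 --namespace bison-system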
+```
+
+## Uninstalling
+
+To completely remove Bison:
+
+```bash
+# Uninstall Helm release
+helm uninstall bison --namespace bison-system
+
+# Remove namespace (optional)
+kubectl delete namespace bison-system
+```
+
+## Troubleshooting
+
+### Pod Not Starting
+
+Check pod logs for errors:
+
+```bash
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl describe pod -n bison-system <pod-name>
+```
+
+### Cannot Connect to OpenCost
+
+Verify OpenCost is running and accessible:
+
+```bash
+kubectl get svc -n opencost-system
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+
+# Test endpoint (run in a second terminal; the port-forward above stays in the foreground)
+curl http://localhost:9003/healthz
+```
+
+### Authentication Issues
+
+If authentication is enabled, ensure you have the correct credentials:
+
+```text
+# Default credentials (change in production!)
+Username: admin
+Password: admin
+```
+
+## Next Steps
+
+- [Configuration Guide](configuration.md) - Configure billing and settings
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Understand the system design
diff --git a/website/versioned_docs/version-0.0.6/intro.md b/website/versioned_docs/version-0.0.6/intro.md
new file mode 100644
index 0000000..b3dc3aa
--- /dev/null
+++ b/website/versioned_docs/version-0.0.6/intro.md
@@ -0,0 +1,167 @@
+---
+sidebar_position: 1
+slug: /
+---
+
+# Introduction to Bison
+
+![Bison Logo](/img/logo.png)
+
+**Enterprise GPU Resource Billing & Multi-Tenant Management Platform**
+
+Bison is a Kubernetes-based platform that provides comprehensive GPU resource management, billing, and multi-tenant isolation for organizations running shared GPU clusters.
+
+## The GPU Management Challenge
+
+Managing shared GPU clusters across multiple teams creates critical operational and financial challenges:
+
+**For Platform Administrators:**
+- How do you fairly allocate expensive GPU resources across competing teams?
+- How do you prevent resource hogging while ensuring everyone gets their fair share?
+- How do you track who's using what and implement accurate chargeback?
+- How do you maintain strict multi-tenant isolation without complex manual configuration?
+
+**For Finance & Budget Teams:**
+- How do you implement automated chargeback for GPU usage without manual accounting?
+- How do you prevent budget overruns before they happen?
+- How do you generate accurate cost reports for internal billing?
+
+**For Development Teams:**
+- How do you get predictable, isolated access to GPU resources?
+- How do you know when you're approaching your budget limits?
+- How do you avoid impacting other teams' workloads?
+
+**Traditional Approach:**
+- Manual quota configuration per namespace
+- Excel-based billing calculations
+- No real-time cost visibility
+- Complex multi-tool setup (quota management + cost tracking + billing system)
+- Frequent resource conflicts and budget surprises
+
+## Bison's Integrated Solution
+
+```mermaid
+graph TB
+    subgraph WITHOUT["Without Bison"]
+        P1[❌ Manual Quota Management<br/>Per-namespace configuration]
+        P2[❌ Spreadsheet Billing<br/>Manual calculations & reports]
+        P3[❌ No Resource Isolation<br/>Teams compete for resources]
+        P4[❌ Budget Overruns<br/>No proactive alerts]
+        P5[❌ Complex Tooling<br/>Multiple systems to manage]
+    end
+
+    subgraph WITH["With Bison"]
+        S1[✅ Automated Team Quotas<br/>Capsule-powered isolation]
+        S2[✅ Real-Time Billing<br/>OpenCost integration]
+        S3[✅ True Multi-Tenancy<br/>Shared/Exclusive modes]
+        S4[✅ Proactive Alerts<br/>Balance monitoring & auto-suspend]
+        S5[✅ Unified Platform<br/>Single pane of glass]
+    end
+
+    P1 -.Transform.-> S1
+    P2 -.Transform.-> S2
+    P3 -.Transform.-> S3
+    P4 -.Transform.-> S4
+    P5 -.Transform.-> S5
+
+    style WITHOUT fill:#ffebee
+    style WITH fill:#e8f5e9
+    style S1 fill:#4caf50,color:#fff
+    style S2 fill:#4caf50,color:#fff
+    style S3 fill:#4caf50,color:#fff
+    style S4 fill:#4caf50,color:#fff
+    style S5 fill:#4caf50,color:#fff
+```
+
+**Bison combines:**
+- 🔐 **Kubernetes-native multi-tenancy** (Capsule) - True team isolation with shared or exclusive node pools
+- 💰 **Real-time cost tracking** (OpenCost + Prometheus) - Per-pod, per-namespace, per-team cost visibility
+- 💳 **Automated billing & budgets** - Prepaid balances, auto-deduction, low-balance alerts, and auto-suspension
+- 📊 **Unified dashboard** - Single interface for admins, team leaders, and finance teams
+- 🔧 **No external database** - All data stored in Kubernetes ConfigMaps (etcd-backed)
+
+**Result:** Deploy once, get complete GPU resource management with automated billing in under 30 minutes.
+
+## Quick Start
+
+### Prerequisites
+
+- Kubernetes 1.22+
+- kubectl configured
+- Helm 3.0+
+- Capsule operator (v0.1.0+) installed
+- OpenCost deployed with Prometheus
+
+### Installation
+
+Choose one of the following installation methods:
+
+#### Option A: Using Helm Repository (Recommended)
+
+```bash
+# Add Bison Helm repository
+helm repo add bison https://supermarioyl.github.io/Bison/charts/
+helm repo update
+
+# Install with default configuration
+helm install bison bison/bison --namespace bison-system --create-namespace
+
+# Or customize installation
+helm install bison bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=false
+```
+
+#### Option B: From GitHub Release
+
+```bash
+# Download latest Helm chart
+VERSION=0.0.1
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# Install
+helm install bison bison-${VERSION}.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+#### Option C: From Source
+
+```bash
+# Clone repository
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
+
+# Install dependencies and build
+make install-deps
+make build
+
+# Deploy using Helm
+helm install bison ./deploy/charts/bison \
+  --namespace bison-system \
+  --create-namespace
+```
+
+### Access the Platform
+
+After installation, access Bison through:
+
+```bash
+# Port-forward the Web UI
+kubectl port-forward -n bison-system svc/bison-webui 3000:80
+
+# Access at http://localhost:3000
+# Default credentials (if auth enabled):
+# Username: admin
+# Password: admin (change immediately in production!)
+```
+
+## Next Steps
+
+- [Explore Features](features.md) - Learn about all capabilities
+- [Installation Guide](installation.md) - Detailed installation instructions
+- [User Guides](user-guides/admin.md) - Role-based user guides
+- [Architecture](architecture.md) - Understand the system architecture
+- [Configuration](configuration.md) - Configure billing and settings
diff --git a/website/versioned_docs/version-0.0.6/user-guides/_category_.json b/website/versioned_docs/version-0.0.6/user-guides/_category_.json
new file mode 100644
index 0000000..fe79f61
--- /dev/null
+++ b/website/versioned_docs/version-0.0.6/user-guides/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "User Guides",
+  "position": 4,
+  "link": {
+    "type": "generated-index",
+    "description": "Role-based guides for using Bison effectively."
+  }
+}
diff --git a/website/versioned_docs/version-0.0.6/user-guides/admin.md b/website/versioned_docs/version-0.0.6/user-guides/admin.md
new file mode 100644
index 0000000..a466cbb
--- /dev/null
+++ b/website/versioned_docs/version-0.0.6/user-guides/admin.md
@@ -0,0 +1,176 @@
+---
+sidebar_position: 1
+---
+
+# Administrator Guide
+
+This guide is for platform administrators who deploy, configure, and manage the Bison platform.
+
+## Responsibilities
+
+As a platform administrator, you are responsible for:
+
+- ✅ Deploying and configuring Bison
+- ✅ Creating and managing teams
+- ✅ Setting global billing configuration
+- ✅ Monitoring cluster-wide metrics
+- ✅ Responding to alerts and recharge requests
+
+## Getting Started
+
+### 1. Deploy Bison
+
+Follow the [Installation Guide](../installation.md) to deploy Bison in your Kubernetes cluster.
+
+### 2. Configure Billing
+
+Set up billing rules and pricing:
+
+1. Access the Web UI
+2. Navigate to **Settings** > **Billing Configuration**
+3. Configure:
+   - **Currency**: USD, CNY, EUR, etc.
+   - **CPU Price**: Cost per core-hour
+   - **Memory Price**: Cost per GB-hour
+   - **GPU Price**: Cost per GPU-hour
+4. Click **Save**
+
+### 3. Create First Team
+
+Create a team for your users:
+
+1. Navigate to **Teams** page
+2. Click **Create Team**
+3. Fill in:
+   - **Team Name**: e.g., "ml-team"
+   - **Description**: Team purpose
+   - **Resource Quota**:
+     - CPU: e.g., "20" cores
+     - Memory: e.g., "64Gi"
+     - GPU: e.g., "4"
+   - **Initial Balance**: e.g., 1000.00
+4. Click **Create**
+
+## Common Tasks
+
+### Managing Teams
+
+#### View All Teams
+
+```bash
+# Via kubectl
+kubectl get tenants
+
+# Via API
+curl http://localhost:8080/api/v1/teams
+```
+
+#### Update Team Quota
+
+1. Navigate to **Teams** page
+2. Click **Edit** on the team row
+3. Modify quotas
+4. Click **Save**
+
+#### Recharge Team Balance
+
+1. Navigate to **Teams** page
+2. Click **Recharge** on the team row
+3. Enter amount
+4. Add notes (optional)
+5. Click **Confirm**
+
+### Monitoring
+
+#### View Dashboard
+
+Access real-time cluster metrics:
+- Total teams and projects
+- Resource utilization
+- Cost trends
+- Top consumers
+- Balance status
+
+#### Check Alerts
+
+Monitor low-balance and quota alerts:
+1. Navigate to **Alerts** page
+2. Review active alerts
+3. Take action as needed
+
+### Billing Configuration
+
+#### Update Pricing
+
+```bash
+curl -X PUT http://localhost:8080/api/v1/billing/config \
+  -H "Content-Type: application/json" \
+  -d '{
+    "pricing": {
+      "cpu": 0.06,
+      "memory": 0.012,
+      "nvidia.com/gpu": 3.00
+    }
+  }'
+```
+
+#### Configure Alert Thresholds
+
+```json
+{
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## Best Practices
+
+### Team Naming
+- Use lowercase, alphanumeric characters and hyphens
+- Example: `ml-team`, `data-science`, `dev-team`
+
+### Quota Allocation
+- Start with conservative quotas
+- Monitor usage for 1-2 weeks
+- Adjust based on actual needs
+
+### Balance Management
+- Set up auto-recharge for critical teams
+- Monitor balance trends weekly
+- Respond to low-balance alerts promptly
+
+### Security
+- Enable authentication in production
+- Use OIDC/SSO for enterprise deployments
+- Regularly audit user permissions
+
+## Troubleshooting
+
+### Team Creation Failed
+
+Check Capsule operator logs:
+```bash
+kubectl logs -n capsule-system deployment/capsule-controller-manager
+```
+
+### Billing Not Working
+
+Verify OpenCost connectivity:
+```bash
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+
+# In a second terminal, while the port-forward is running:
+curl http://localhost:9003/healthz
+```
+
+### High Resource Usage
+
+Check resource consumption:
+```bash
+kubectl top pods -n bison-system
+```
+
+## Next Steps
+
+- [Team Leader Guide](team-leader.md) - Guide for team leaders
+- [Developer Guide](developer.md) - Guide for developers
+- [Configuration](../configuration.md) - Advanced configuration
diff --git a/website/versioned_docs/version-0.0.6/user-guides/developer.md b/website/versioned_docs/version-0.0.6/user-guides/developer.md
new file mode 100644
index 0000000..d14ab62
--- /dev/null
+++ b/website/versioned_docs/version-0.0.6/user-guides/developer.md
@@ -0,0 +1,187 @@
+---
+sidebar_position: 3
+---
+
+# Developer Guide
+
+This guide is for developers who deploy workloads and consume resources within team projects.
+
+## Responsibilities
+
+As a developer, you are responsible for:
+
+- ✅ Deploying applications within your project
+- ✅ Monitoring resource usage
+- ✅ Staying within quota limits
+- ✅ Optimizing resource consumption
+
+## Getting Started
+
+### 1. Get Kubeconfig
+
+Request kubeconfig from your team leader or administrator.
+
+### 2. Set Context
+
+```bash
+# Set context to your project namespace
+kubectl config set-context --current --namespace=your-project
+
+# Verify
+kubectl config view --minify | grep namespace
+```
+
+### 3. Check Quota
+
+See your available resources:
+```bash
+kubectl describe quota
+```
+
+## Deploying Workloads
+
+### Basic Pod Deployment
+
+```yaml
+apiVersion: v1
+kind: Pod
+metadata:
+  name: gpu-training-job
+  namespace: your-project
+spec:
+  containers:
+  - name: trainer
+    image: your-ml-image:latest
+    resources:
+      requests:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+      limits:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+```
+
+### Using Deployments
+
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: ml-inference
+  namespace: your-project
+spec:
+  replicas: 2
+  selector:
+    matchLabels:
+      app: ml-inference
+  template:
+    metadata:
+      labels:
+        app: ml-inference
+    spec:
+      containers:
+      - name: inference
+        image: your-inference-image:latest
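+        resources:
+          requests:
+            cpu: "2"
+            memory: "8Gi"
+            nvidia.com/gpu: "1"
+          limits:
+            cpu: "2"
+            memory: "8Gi"
+            # GPU requests must be accompanied by an equal limit
+            nvidia.com/gpu: "1"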
+```
+
+## Monitoring Usage
+
+### Check Pod Resource Usage
+
+```bash
+# View resource consumption
+kubectl top pods
+
+# Detailed pod information
+kubectl describe pod <pod-name>
+```
+
+### View Logs
+
+```bash
+# Stream logs
+kubectl logs -f <pod-name>
+
+# Previous logs (if pod restarted)
+kubectl logs --previous <pod-name>
+```
+
+## Best Practices
+
+### Resource Requests and Limits
+
+Always specify both requests and limits:
+```yaml
+resources:
+  requests:
+    cpu: "2"
+    memory: "8Gi"
+  limits:
+    cpu: "4"
+    memory: "16Gi"
+```
+
+### GPU Usage
+
+- Request GPUs only when needed
+- Use GPU for compute-intensive tasks
+- Monitor GPU utilization
+
+### Clean Up
+
+Delete resources when no longer needed:
+```bash
+# Delete pod
+kubectl delete pod <pod-name>
+
+# Delete deployment
+kubectl delete deployment <deployment-name>
+
+# Clean up completed jobs
+kubectl delete job --field-selector status.successful=1
+```
+
+### Cost Optimization
+
+- Right-size your resource requests
+- Use horizontal pod autoscaling
+- Clean up idle resources
+- Share GPUs when possible (if supported)
+
+## Troubleshooting
+
+### Pod Pending (Insufficient Quota)
+
+If your pod is stuck in `Pending` state:
+
+```bash
+kubectl describe pod <pod-name>
+```
+
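+Look for quota-related errors and reduce resource requests or ask your team leader for more quota. If the pod was never created at all (for example, a Deployment reports fewer replicas than requested), run `kubectl get events` and look for `exceeded quota` messages: requests that exceed a ResourceQuota are rejected at admission rather than left in `Pending`.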
+
+### Out of Memory (OOM)
+
+If pods are killed due to OOM:
+1. Check memory usage patterns
+2. Increase memory limits
+3. Optimize application memory usage
+
+### GPU Not Available
+
+Check which nodes expose allocatable GPUs:
+```bash
+kubectl get nodes -o custom-columns=NAME:.metadata.name,GPU:.status.allocatable."nvidia\.com/gpu"
+```
+
+## Next Steps
+
+- [Team Leader Guide](team-leader.md) - Understand team management
+- [Architecture](../architecture.md) - Learn about the platform
diff --git a/website/versioned_docs/version-0.0.6/user-guides/team-leader.md b/website/versioned_docs/version-0.0.6/user-guides/team-leader.md
new file mode 100644
index 0000000..7b6de96
--- /dev/null
+++ b/website/versioned_docs/version-0.0.6/user-guides/team-leader.md
@@ -0,0 +1,126 @@
+---
+sidebar_position: 2
+---
+
+# Team Leader Guide
+
+This guide is for team leaders who manage projects, monitor budgets, and allocate resources within their team.
+
+## Responsibilities
+
+As a team leader, you are responsible for:
+
+- ✅ Creating and managing projects (namespaces)
+- ✅ Allocating quotas to projects
+- ✅ Monitoring team balance and consumption
+- ✅ Requesting recharges when needed
+
+## Getting Started
+
+### 1. Access Bison
+
+Log in to the Web UI with your credentials.
+
+### 2. View Team Dashboard
+
+Your dashboard shows:
+- Team balance and status
+- Resource utilization
+- Active projects
+- Cost trends
+
+## Managing Projects
+
+### Create a Project
+
+1. Navigate to **Projects** page
+2. Click **Create Project**
+3. Fill in:
+   - **Project Name**: e.g., "training-ml-models"
+   - **Description**: Project purpose
+   - **Quota** (optional):
+     - CPU: e.g., "8" cores
+     - Memory: e.g., "32Gi"
+     - GPU: e.g., "2"
+4. Click **Create**
+
+### List Projects
+
+```bash
+# Via kubectl (if you have access)
+kubectl get namespaces -l capsule.clastix.io/tenant=your-team
+
+# Via API
+curl http://localhost:8080/api/v1/teams/your-team/projects
+```
+
+### Delete a Project
+
+1. Navigate to **Projects** page
+2. Click **Delete** on the project row
+3. Confirm deletion
+
+**Warning**: This will delete all resources in the project!
+
+## Monitoring Budget
+
+### Check Balance
+
+View your current balance:
+1. Navigate to **Team** page
+2. See balance in the status card
+
+### View Usage Trends
+
+Analyze spending patterns:
+1. Navigate to **Reports** page
+2. Select time range (7 days, 30 days, 90 days)
+3. View:
+   - Cost breakdown by resource type
+   - Daily cost trends
+   - Per-project consumption
+
+### Request Recharge
+
+When balance is low:
+1. Click **Request Recharge** button
+2. Enter requested amount
+3. Add justification
+4. Submit request to administrator
+
+## Resource Management
+
+### Monitor Quota Usage
+
+Check how much of your quota is being used:
+```bash
+kubectl describe quota -n your-project
+```
+
+### Optimize Costs
+
+Tips to reduce spending:
+- **Right-size resources**: Don't over-provision CPU/Memory
+- **Clean up idle pods**: Delete unused workloads
+- **Use spot/preemptible instances**: Where applicable
+- **Monitor GPU utilization**: Ensure GPUs are fully utilized
+
+## Best Practices
+
+### Project Organization
+- Create separate projects for different workloads
+- Example: `ml-training`, `ml-inference`, `data-processing`
+
+### Quota Allocation
+- Allocate quotas based on project priority
+- Reserve buffer for urgent tasks
+
+### Cost Awareness
+- Review costs weekly
+- Identify and eliminate waste
+- Set up cost alerts
+
+## Next Steps
+
+- [Developer Guide](developer.md) - Guide for your team members
+- [Features](../features.md) - Explore all Bison features
diff --git a/website/versioned_docs/version-0.0.7/architecture.md b/website/versioned_docs/version-0.0.7/architecture.md
new file mode 100644
index 0000000..dbbe50d
--- /dev/null
+++ b/website/versioned_docs/version-0.0.7/architecture.md
@@ -0,0 +1,418 @@
+---
+sidebar_position: 5
+---
+
+# Architecture
+
+This document provides a technical overview of Bison's architecture, designed with high cohesion and low coupling principles for maintainability and scalability.
+
+## System Overview
+
+### High-Level Architecture
+
+```mermaid
+graph TB
+    subgraph PRESENT[Presentation Layer]
+        WEB[Web UI<br/>React 18 + Ant Design 5]
+        CLI[kubectl / API Client]
+    end
+
+    subgraph GATEWAY[API Gateway Layer]
+        GW[API Server<br/>Go + Gin Framework]
+        AUTH[Auth Middleware<br/>JWT + OIDC]
+    end
+
+    subgraph BUSINESS[Business Logic Layer]
+        TS[Tenant Service<br/>Team & Project CRUD]
+        BS[Billing Service<br/>Cost Calculation]
+        BLS[Balance Service<br/>Wallet Management]
+        QS[Quota Service<br/>Resource Limits]
+        AS[Alert Service<br/>Notifications]
+        RS[Report Service<br/>Analytics]
+    end
+
+    subgraph INTEGRATION[Integration Layer]
+        K8S[Kubernetes Client<br/>client-go]
+        OCC[OpenCost Client<br/>REST API]
+        PC[Prometheus Client<br/>PromQL]
+    end
+
+    subgraph EXTERNAL[External Systems]
+        KAPI[Kubernetes API]
+        CAP[Capsule Controller]
+        OC[OpenCost]
+        PROM[Prometheus]
+    end
+
+    subgraph DATA[Data Layer]
+        CM[ConfigMaps<br/>Persistent Storage]
+    end
+
+    WEB --> GW
+    CLI --> GW
+    GW --> AUTH
+    AUTH --> TS & BS & BLS & QS & AS & RS
+
+    TS --> K8S
+    BS --> OCC
+    BLS --> K8S
+    QS --> K8S
+    RS --> OCC & PC
+
+    K8S --> KAPI
+    K8S --> CAP
+    OCC --> OC
+    PC --> PROM
+
+    TS & BLS --> CM
+    KAPI --> CM
+```
+
+### Design Principles
+
+| Principle | Implementation |
+|-----------|----------------|
+| **High Cohesion** | Each service handles a single domain (billing, quota, alerts) |
+| **Low Coupling** | Services communicate via well-defined interfaces |
+| **Stateless API** | All state persisted in Kubernetes ConfigMaps |
+| **Cloud Native** | Leverages Kubernetes primitives for HA and scaling |
+| **Zero Database** | ConfigMaps eliminate external database dependencies |
+
+## Architecture Layers
+
+Bison follows a layered architecture pattern:
+
+### 1. Presentation Layer
+- **Web UI**: React 18 + TypeScript + Ant Design 5
+- **API Client**: REST API for external integrations
+
+### 2. API Gateway Layer
+- **API Server**: Go + Gin framework
+- **Authentication**: JWT and OIDC support
+- **Middleware**: Logging, recovery, CORS handling
+
+### 3. Business Logic Layer
+- **Tenant Service**: Team and project management
+- **Billing Service**: Cost calculation and aggregation
+- **Balance Service**: Wallet management and auto-deduction
+- **Quota Service**: Resource limit enforcement
+- **Alert Service**: Multi-channel notifications
+- **Report Service**: Analytics and export
+
+### 4. Integration Layer
+- **Kubernetes Client**: client-go for K8s API interaction
+- **OpenCost Client**: REST API for cost data
+- **Prometheus Client**: PromQL queries for metrics
+
+### 5. Data Layer
+- **ConfigMaps**: Persistent storage for balances, billing config, and metadata
+- **etcd**: Backing store for the Kubernetes ConfigMaps (accessed only through the Kubernetes API)
+
+## Core Components
+
+### API Server
+
+The API server is the central component that handles all HTTP requests:
+
+**Technology Stack:**
+- Go 1.24+
+- Gin web framework
+- client-go for Kubernetes API
+
+**Key Responsibilities:**
+- Serve REST API endpoints
+- Authentication and authorization
+- Request routing and middleware
+- Background task scheduling
+
+**Endpoints:**
+```
+/api/v1/teams          - Team management
+/api/v1/projects       - Project management
+/api/v1/billing        - Billing configuration
+/api/v1/balance        - Balance operations
+/api/v1/stats          - Statistics and reports
+```
+
+### Web UI
+
+React-based single-page application:
+
+**Technology Stack:**
+- React 18
+- TypeScript
+- Vite (build tool)
+- Ant Design 5
+- ECharts (visualization)
+- React Query (state management)
+
+**Features:**
+- Dashboard with real-time metrics
+- Team and project management
+- Billing configuration
+- Balance monitoring
+- Usage reports and export
+
+### Billing Service
+
+Calculates costs based on resource usage:
+
+**Data Flow:**
+```mermaid
+sequenceDiagram
+    participant S as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant K8S as Kubernetes
+    participant AS as Alert Service
+
+    S->>BS: Trigger billing (every 10min)
+    BS->>OC: Query team costs
+    OC-->>BS: Return usage data
+    BS->>BS: Calculate cost
+    BS->>BLS: Deduct from balance
+    BLS->>K8S: Update ConfigMap
+    BLS-->>BS: Confirm
+    BS->>AS: Check threshold
+    alt Balance low
+        AS->>Webhook: Send alert
+    end
+```
+
+**Billing Formula:**
+```
+Total Cost = (CPU_cores × CPU_price × hours) +
+             (Memory_GB × Memory_price × hours) +
+             (GPU_count × GPU_price × hours)
+```
+
+### Balance Service
+
+Manages team wallets and auto-deduction:
+
+**Features:**
+- Real-time balance tracking
+- Auto-deduction based on usage
+- Recharge operations
+- Transaction history
+- Auto-suspension when balance depleted
+
+**Storage:**
+```yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: bison-team-balances
+  namespace: bison-system
+data:
+  ml-team: "1523.45"
+  data-team: "890.12"
+  dev-team: "2100.00"
+```
+
+### Tenant Service
+
+Manages teams (Capsule Tenants) and projects (Namespaces):
+
+**Features:**
+- Create/delete teams
+- Assign resource quotas
+- Configure node pools (shared/exclusive)
+- Manage team metadata
+
+**Capsule Integration:**
+```yaml
+apiVersion: capsule.clastix.io/v1beta1
+kind: Tenant
+metadata:
+  name: ml-team
+spec:
+  owners:
+  - name: team-leader
+    kind: User
+  resourceQuota:
+    items:
+    - hard:
+        cpu: "20"
+        memory: 64Gi
+        nvidia.com/gpu: "4"
+```
+
+## Data Flow
+
+### Team Creation Flow
+
+```mermaid
+sequenceDiagram
+    participant U as Admin
+    participant API as API Server
+    participant TS as Tenant Service
+    participant K8S as Kubernetes
+    participant CAP as Capsule
+
+    U->>API: POST /api/v1/teams
+    API->>TS: CreateTeam(name, quota, balance)
+    TS->>CAP: Create Tenant
+    CAP-->>TS: Tenant created
+    TS->>K8S: Create ConfigMap (balance)
+    K8S-->>TS: ConfigMap created
+    TS-->>API: Success
+    API-->>U: 201 Created
+```
+
+### Billing Cycle Flow
+
+```mermaid
+sequenceDiagram
+    participant SCH as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant AS as Alert Service
+
+    loop Every 10 minutes
+        SCH->>BS: Trigger billing calculation
+        BS->>OC: Query costs (last 10min)
+        OC-->>BS: Return usage metrics
+        BS->>BS: Calculate total cost
+        BS->>BLS: Deduct cost from balance
+        BLS->>BLS: Update balance
+        BLS-->>BS: Balance updated
+        BS->>AS: Check balance threshold
+        alt Balance < 20%
+            AS->>AS: Send low balance alert
+        end
+        alt Balance <= 0
+            AS->>BS: Suspend team workloads
+        end
+    end
+```
+
+## Integration Points
+
+### Kubernetes Integration
+
+Bison integrates deeply with Kubernetes:
+
+- **Capsule Tenants** for multi-tenancy
+- **ResourceQuotas** for limit enforcement
+- **Namespaces** for project isolation
+- **ConfigMaps** for data persistence
+- **RBAC** for access control
+
+### OpenCost Integration
+
+Real-time cost tracking via OpenCost API:
+
+```bash
+# Query team costs
+GET /allocation/compute?window=10m&aggregate=namespace&filter=namespace:ml-team
+
+# Response
+{
+  "ml-team": {
+    "cpuCost": 0.25,
+    "memCost": 0.10,
+    "gpuCost": 4.17,
+    "totalCost": 4.52
+  }
+}
+```
+
+### Prometheus Integration
+
+Metrics collection for monitoring:
+
+- Resource utilization metrics
+- Cost metrics
+- Balance metrics
+- Alert metrics
+
+## Deployment Architecture
+
+### High Availability Setup
+
+```mermaid
+graph TB
+    subgraph K8S[Kubernetes Cluster]
+        subgraph NS1[bison-system namespace]
+            API1[API Server Pod 1]
+            API2[API Server Pod 2]
+            WEB1[Web UI Pod 1]
+            WEB2[Web UI Pod 2]
+        end
+
+        subgraph NS2[opencost-system namespace]
+            OC[OpenCost]
+        end
+
+        subgraph NS3[prometheus-system namespace]
+            PROM[Prometheus]
+        end
+
+        LB[LoadBalancer]
+    end
+
+    LB --> API1 & API2
+    LB --> WEB1 & WEB2
+    API1 & API2 --> OC
+    OC --> PROM
+```
+
+### Resource Requirements
+
+**Minimum:**
+- API Server: 200m CPU, 256Mi Memory
+- Web UI: 100m CPU, 128Mi Memory
+
+**Recommended (Production):**
+- API Server: 1000m CPU, 512Mi Memory (2 replicas)
+- Web UI: 500m CPU, 256Mi Memory (2 replicas)
+
+## Security Model
+
+### Authentication
+- JWT token-based authentication
+- OIDC/SSO integration
+- Admin user management
+
+### Authorization
+- Kubernetes RBAC integration
+- Role-based access control
+- Team-scoped permissions
+
+### Data Security
+- Data encrypted at rest when etcd encryption is enabled on the cluster
+- TLS for API communication
+- Secret management via Kubernetes Secrets
+
+## Technology Stack
+
+### Backend
+- **Language**: Go 1.24+
+- **Framework**: Gin
+- **Kubernetes Client**: client-go
+- **Configuration**: Viper
+- **Logging**: Logrus
+
+### Frontend
+- **Framework**: React 18
+- **Language**: TypeScript
+- **UI Library**: Ant Design 5
+- **Build Tool**: Vite
+- **State Management**: React Query
+- **Charts**: ECharts
+
+### Infrastructure
+- **Platform**: Kubernetes 1.22+
+- **Multi-Tenancy**: Capsule
+- **Cost Tracking**: OpenCost
+- **Metrics**: Prometheus
+- **Storage**: ConfigMaps (etcd)
+
+## Next Steps
+
+- [Installation Guide](installation.md) - Deploy Bison
+- [Configuration](configuration.md) - Configure billing
+- [User Guides](user-guides/admin.md) - Learn to use Bison
+- [Features](features.md) - Explore capabilities
diff --git a/website/versioned_docs/version-0.0.7/configuration.md b/website/versioned_docs/version-0.0.7/configuration.md
new file mode 100644
index 0000000..539aaa3
--- /dev/null
+++ b/website/versioned_docs/version-0.0.7/configuration.md
@@ -0,0 +1,361 @@
+---
+sidebar_position: 6
+---
+
+# Configuration
+
+This guide covers how to configure Bison for your specific environment and requirements.
+
+## Helm Chart Configuration
+
+Bison is configured primarily through Helm values. You can customize the installation by providing a `values.yaml` file or using `--set` flags.
+
+### Key Configuration Parameters
+
+| Parameter | Description | Default | Example |
+|-----------|-------------|---------|---------|
+| `auth.enabled` | Enable authentication | `false` | `true` |
+| `auth.admin.username` | Admin username | `admin` | `admin` |
+| `auth.admin.password` | Admin password | `admin` | `changeme` |
+| `apiServer.replicaCount` | API server replicas | `2` | `3` |
+| `apiServer.image.repository` | API server image | `ghcr.io/supermarioyl/bison/api-server` | - |
+| `apiServer.image.tag` | API server image tag | `0.0.1` | `latest` |
+| `webUI.replicaCount` | Web UI replicas | `2` | `3` |
+| `webUI.image.repository` | Web UI image | `ghcr.io/supermarioyl/bison/web-ui` | - |
+| `webUI.image.tag` | Web UI image tag | `0.0.1` | `latest` |
+| `opencost.url` | OpenCost API endpoint | `http://opencost.opencost-system.svc:9003` | Custom URL |
+
+### Example Custom Values
+
+Create a `custom-values.yaml` file:
+
+```yaml
+# Authentication
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: MySecurePassword123
+
+# API Server
+apiServer:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 200m
+      memory: 256Mi
+    limits:
+      cpu: 1000m
+      memory: 512Mi
+
+# Web UI
+webUI:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 100m
+      memory: 128Mi
+    limits:
+      cpu: 500m
+      memory: 256Mi
+
+# OpenCost Integration
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# Node Selection (optional)
+nodeSelector:
+  node-role.kubernetes.io/control-plane: ""
+
+# Tolerations (optional)
+tolerations:
+  - key: node-role.kubernetes.io/control-plane
+    operator: Exists
+    effect: NoSchedule
+```
+
+Install with custom values:
+
+```bash
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --values custom-values.yaml
+```
+
+## Billing Configuration
+
+Billing settings are configured through the Web UI or API after installation.
+
+### Access Billing Configuration
+
+1. **Via Web UI:**
+   - Navigate to **Settings** > **Billing Configuration**
+   - Set pricing for CPU, Memory, GPU, and other resources
+   - Configure currency and billing intervals
+
+2. **Via API:**
+   ```bash
+   curl -X POST http://localhost:8080/api/v1/billing/config \
+     -H "Content-Type: application/json" \
+     -d '{
+       "enabled": true,
+       "currency": "USD",
+       "pricing": {
+         "cpu": 0.05,
+         "memory": 0.01,
+         "nvidia.com/gpu": 2.50
+       },
+       "billingInterval": "hourly"
+     }'
+   ```
+
+### Billing Parameters
+
+| Parameter | Description | Example |
+|-----------|-------------|---------|
+| `enabled` | Enable/disable billing | `true` |
+| `currency` | Currency for billing | `USD`, `CNY`, `EUR` |
+| `pricing.cpu` | CPU price per core-hour | `0.05` |
+| `pricing.memory` | Memory price per GB-hour | `0.01` |
+| `pricing["nvidia.com/gpu"]` | GPU price per GPU-hour | `2.50` |
+| `billingInterval` | Billing aggregation period | `hourly`, `daily` |
+| `lowBalanceThreshold` | Warning threshold (%) | `20` |
+| `suspendThreshold` | Auto-suspend threshold (%) | `5` |
+
+### Example Billing Configuration
+
+```json
+{
+  "enabled": true,
+  "currency": "USD",
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "nvidia.com/mig-1g.5gb": 0.50,
+    "nvidia.com/mig-2g.10gb": 1.00
+  },
+  "billingInterval": "hourly",
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## Team Configuration
+
+### Creating Teams
+
+Teams can be created through the Web UI or API:
+
+**Via Web UI:**
+1. Navigate to the **Teams** page
+2. Click **Create Team**
+3. Set team name, quota, and initial balance
+
+**Via API:**
+```bash
+curl -X POST http://localhost:8080/api/v1/teams \
+  -H "Content-Type: application/json" \
+  -d '{
+    "name": "ml-team",
+    "description": "Machine Learning Team",
+    "quota": {
+      "cpu": "20",
+      "memory": "64Gi",
+      "nvidia.com/gpu": "4"
+    },
+    "balance": 1000.00
+  }'
+```
+
+### Team Quotas
+
+Team quotas define resource limits:
+
+```yaml
+quota:
+  cpu: "20"              # 20 CPU cores
+  memory: "64Gi"         # 64 GB RAM
+  nvidia.com/gpu: "4"    # 4 GPUs
+  storage: "500Gi"       # 500 GB storage
+```
+
+### Team Balance Management
+
+Set initial balance and configure auto-recharge:
+
+```json
+{
+  "balance": 1000.00,
+  "autoRecharge": {
+    "enabled": true,
+    "amount": 500.00,
+    "schedule": "monthly",
+    "threshold": 100.00
+  }
+}
+```
+
+## Alert Configuration
+
+Configure multi-channel alerts for low balance and quota warnings.
+
+### Webhook Alerts
+
+```json
+{
+  "type": "webhook",
+  "enabled": true,
+  "url": "https://your-webhook-endpoint.com/alerts",
+  "headers": {
+    "Authorization": "Bearer YOUR_TOKEN"
+  },
+  "template": {
+    "title": "Bison Alert",
+    "message": "Team {{.TeamName}} balance is {{.Balance}}"
+  }
+}
+```
+
+### DingTalk Alerts
+
+```json
+{
+  "type": "dingtalk",
+  "enabled": true,
+  "webhook": "https://oapi.dingtalk.com/robot/send?access_token=YOUR_TOKEN",
+  "secret": "YOUR_SECRET"
+}
+```
+
+### WeChat Work Alerts
+
+```json
+{
+  "type": "wechat",
+  "enabled": true,
+  "corpid": "YOUR_CORP_ID",
+  "corpsecret": "YOUR_CORP_SECRET",
+  "agentid": 1000001
+}
+```
+
+## OpenCost Integration
+
+Configure OpenCost connection:
+
+### Check OpenCost Connectivity
+
+```bash
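+# Test OpenCost API (port-forward blocks; run it in a separate terminal)
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+curl http://localhost:9003/healthz
+
+# Test allocation API (quote the URL so the shell does not interpret "?")
+curl "http://localhost:9003/allocation/compute?window=1d"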
+```
+
+### Update OpenCost URL
+
+If OpenCost is deployed in a different namespace or with a different service name:
+
+```bash
+helm upgrade bison oci://ghcr.io/supermarioyl/bison/bison \
+  --set opencost.url=http://my-opencost.custom-namespace.svc:9003 \
+  --namespace bison-system
+```
+
+## Authentication & OIDC
+
+Enable authentication and integrate with your SSO provider:
+
+### Basic Authentication
+
+```yaml
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: SecurePassword123
+```
+
+### OIDC Integration
+
+```yaml
+auth:
+  enabled: true
+  oidc:
+    enabled: true
+    issuerURL: https://your-oidc-provider.com
+    clientID: bison-client-id
+    clientSecret: your-client-secret
+    redirectURL: https://bison.example.com/callback
+```
+
+## Environment Variables
+
+Additional configuration can be provided via environment variables:
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `KUBECONFIG` | Path to kubeconfig file | In-cluster config |
+| `OPENCOST_URL` | OpenCost API URL | `http://opencost.opencost-system.svc:9003` |
+| `AUTH_ENABLED` | Enable authentication | `false` |
+| `LOG_LEVEL` | Logging level | `info` |
+| `BILLING_INTERVAL` | Billing calculation interval | `10m` |
+
+Set environment variables in Helm values:
+
+```yaml
+apiServer:
+  env:
+    - name: LOG_LEVEL
+      value: debug
+    - name: BILLING_INTERVAL
+      value: 5m
+```
+
+## Advanced Configuration
+
+### Custom Resource Pricing
+
+Price any Kubernetes resource:
+
+```json
+{
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "amd.com/gpu": 2.00,
+    "ephemeral-storage": 0.001,
+    "custom.io/fpga": 5.00
+  }
+}
+```
+
+### Multi-Cluster Support
+
+Deploy Bison in each cluster with shared billing:
+
+```yaml
+# Cluster A
+apiServer:
+  clusterName: prod-us-west
+
+# Cluster B
+apiServer:
+  clusterName: prod-us-east
+```
+
+## Next Steps
+
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Understand the system design
+- [Features](features.md) - Explore all capabilities
diff --git a/website/versioned_docs/version-0.0.7/features.md b/website/versioned_docs/version-0.0.7/features.md
new file mode 100644
index 0000000..8d0c438
--- /dev/null
+++ b/website/versioned_docs/version-0.0.7/features.md
@@ -0,0 +1,195 @@
+---
+sidebar_position: 2
+---
+
+# Features
+
+Bison provides a comprehensive suite of features for GPU resource management, billing, and multi-tenant isolation in Kubernetes environments.
+
+## See Bison in Action
+
+### 🎯 Real-Time Resource Dashboard
+
+![Bison Dashboard](/img/ui-dashboard.png)
+
+**What you see:**
+- **Cluster Overview** - Total teams, projects, resource pools, and quotas at a glance
+- **Resource Utilization** - Visual breakdown showing which teams are consuming resources
+- **7-Day Cost Trends** - Historical cost data to identify spending patterns
+- **Top 5 Cost Rankings** - Quickly identify heavy GPU consumers
+- **Team Budget Status** - Real-time balance monitoring with color-coded alerts
+
+**Who benefits:**
+- **Platform Administrators** get instant visibility into cluster health and usage patterns
+- **Finance Teams** can track costs in real-time without waiting for monthly reports
+- **Team Leaders** can compare their usage against other teams
+
+---
+
+### 💼 Team Management & Budget Monitoring
+
+![Team Management](/img/ui-team.png)
+
+**What you see:**
+- **Team List** with real-time status indicators:
+  - 🟢 Green balance = Healthy budget
+  - 🟡 Yellow balance = Approaching threshold
+  - 🔴 Red balance = Low balance or suspended
+- **Resource Allocation** - CPU/Memory/GPU quotas per team (e.g., "cpu 0/10" means 0 used out of 10 allocated)
+- **Project Count** - Number of namespaces/projects under each team
+- **Quick Actions** - Edit quotas, recharge balance, or delete team with one click
+
+**Who benefits:**
+- **Team Leaders** monitor their budget status and resource usage at a glance
+- **Administrators** manage multiple teams from a single unified view
+- **Finance Teams** see which teams need recharging
+
+---
+
+### 💰 Flexible Billing Configuration
+
+![Billing Configuration](/img/ui-billing.png)
+
+**What you see:**
+- **Per-Resource Pricing** - Set custom prices for CPU (per core-hour), Memory (per GB-hour), GPU (per GPU-hour)
+- **Currency Selection** - Support for CNY, USD, EUR, and other currencies
+- **Enable/Disable Toggle** - Turn billing on/off for specific resources with one click
+- **Billing Rules** - Define how resources are metered (hourly, daily, etc.)
+- **Alert Thresholds** - Configure when to send low-balance warnings
+
+**Who benefits:**
+- **Finance Teams** align cloud costs with internal chargeback policies
+- **Administrators** adjust pricing based on actual hardware costs
+- **Budget Managers** set appropriate warning thresholds to prevent overruns
+
+---
+
+## Core Capabilities
+
+### Multi-Tenant Management
+- ✅ **Capsule-Powered Isolation** - True multi-tenancy using Kubernetes-native Capsule operator
+- ✅ **OIDC Integration** - Enterprise SSO support for authentication
+- ✅ **Team-Based Access Control** - Manage users, roles, and permissions per team
+- ✅ **Shared & Exclusive Node Pools** - Flexible resource allocation strategies
+
+### Real-Time Billing
+- ✅ **Usage-Based Billing** - Accurate cost tracking based on actual resource consumption
+- ✅ **Configurable Pricing** - Set custom rates for CPU, Memory, GPU, and any Kubernetes resource
+- ✅ **Multi-Currency Support** - CNY, USD, EUR, and more
+- ✅ **Billing Rules Engine** - Define custom billing logic and aggregation periods
+
+### Dynamic Resource Quotas
+- ✅ **Per-Team Quotas** - CPU, Memory, GPU, Storage, and custom resources
+- ✅ **Namespace Quotas** - Project-level resource limits within teams
+- ✅ **Auto-Enforcement** - Kubernetes-native quota enforcement
+- ✅ **Quota Alerts** - Notifications when approaching limits
+
+### Team Balance & Wallet System
+- ✅ **Prepaid Balances** - Team wallets with real-time deduction
+- ✅ **Auto-Deduction** - Automated billing based on resource usage
+- ✅ **Balance Thresholds** - Configurable warning and suspension levels
+- ✅ **Transaction History** - Complete audit trail of all balance changes
+
+### Auto-Recharge
+- ✅ **Scheduled Top-Ups** - Weekly or monthly automatic recharges
+- ✅ **Custom Amounts** - Flexible recharge amounts per team
+- ✅ **Recharge Notifications** - Alert teams when balance is added
+
+### Balance Alerts
+- ✅ **Multi-Channel Notifications** - Webhook, DingTalk, WeChat, Email
+- ✅ **Configurable Thresholds** - Set warning levels (e.g., 20%, 10%, 5%)
+- ✅ **Auto-Suspension** - Automatically suspend workloads when balance depleted
+- ✅ **Custom Templates** - Customize alert messages
+
+### Usage Reports
+- ✅ **Team Analytics** - Per-team cost breakdowns and trends
+- ✅ **Project Analytics** - Namespace-level resource consumption
+- ✅ **Export Capabilities** - CSV, Excel, PDF reports
+- ✅ **Historical Data** - 30/60/90-day cost analysis
+
+### Audit Logging
+- ✅ **Complete Operation History** - Track all administrative actions
+- ✅ **User Attribution** - Who did what and when
+- ✅ **Resource Changes** - Track quota, balance, and configuration changes
+- ✅ **Compliance Ready** - Meet internal audit requirements
+
+---
+
+## Architecture Highlights
+
+Bison's architecture is designed for simplicity, scalability, and zero external database dependencies.
+
+```mermaid
+graph TB
+    subgraph USER_LAYER[User Layer]
+        UI[Web UI<br/>React + Ant Design]
+        API[REST API<br/>Go + Gin]
+    end
+
+    subgraph CORE[Core Services]
+        BS[Billing Service]
+        TS[Tenant Service]
+        QS[Quota Service]
+    end
+
+    subgraph K8S[Kubernetes Layer]
+        CA[Capsule<br/>Multi-Tenancy]
+        OC[OpenCost<br/>Cost Tracking]
+        PR[Prometheus<br/>Metrics]
+    end
+
+    subgraph DATA[Data Layer]
+        CM[ConfigMaps<br/>Zero Database]
+    end
+
+    UI --> API
+    API --> BS & TS & QS
+    BS --> OC
+    TS --> CA
+    QS --> CA
+    BS & TS --> CM
+    OC --> PR
+```
+
+### Key Architectural Benefits
+
+- **No External Database** - All data stored in Kubernetes ConfigMaps (etcd-backed)
+- **Cloud-Native** - Built on Kubernetes primitives for maximum portability
+- **Scalable** - Stateless API server that can scale horizontally
+- **Secure** - Kubernetes RBAC integration and optional authentication
+- **Observable** - Prometheus metrics and structured logging
+- **Extensible** - Plugin architecture for custom billing rules and alerts
+
+---
+
+## Integration Points
+
+### OpenCost Integration
+Bison leverages [OpenCost](https://www.opencost.io/) for real-time cost tracking:
+- Per-pod, per-namespace, per-team cost visibility
+- GPU utilization metrics
+- Historical cost data and trends
+- Integration with Prometheus for metric collection
+
+### Capsule Integration
+Bison uses [Capsule](https://capsule.clastix.io/) for multi-tenancy:
+- Team-based tenant isolation
+- Namespace quota enforcement
+- Network and security policies
+- OIDC/SSO integration
+
+### Prometheus Integration
+Metrics collection and monitoring:
+- Resource utilization tracking
+- Custom billing metrics
+- Alert rule evaluation
+- Historical data retention
+
+---
+
+## Next Steps
+
+- [Installation Guide](installation.md) - Deploy Bison in your cluster
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Deep dive into system design
+- [Configuration](configuration.md) - Configure billing and settings
diff --git a/website/versioned_docs/version-0.0.7/installation.md b/website/versioned_docs/version-0.0.7/installation.md
new file mode 100644
index 0000000..da89191
--- /dev/null
+++ b/website/versioned_docs/version-0.0.7/installation.md
@@ -0,0 +1,316 @@
+---
+sidebar_position: 3
+---
+
+# Installation Guide
+
+This guide provides detailed instructions for installing Bison in your Kubernetes cluster.
+
+## Prerequisites
+
+Before installing Bison, ensure you have:
+
+- **Kubernetes 1.22+** - A running Kubernetes cluster
+- **kubectl** - Configured to access your cluster
+- **Helm 3.8+** - Package manager for Kubernetes (3.8.0 or newer is required for OCI chart support)
+- **Capsule Operator v0.1.0+** - For multi-tenant isolation
+- **OpenCost** - Deployed with Prometheus for cost tracking
+
+### Install Prerequisites
+
+If you haven't installed the required components:
+
+#### Install Capsule
+
+```bash
+# Using Helm
+helm repo add projectcapsule https://projectcapsule.github.io/charts
+helm install capsule projectcapsule/capsule \
+  --namespace capsule-system \
+  --create-namespace
+```
+
+#### Install OpenCost
+
+```bash
+# Using Helm
+helm repo add opencost https://opencost.github.io/opencost-helm-chart
+helm install opencost opencost/opencost \
+  --namespace opencost-system \
+  --create-namespace \
+  --set prometheus.internal.serviceName=prometheus-server \
+  --set prometheus.internal.namespaceName=prometheus-system
+```
+
+## Installation Methods
+
+Bison Helm charts are distributed via **GitHub Container Registry (GHCR)** using the modern OCI format.
+
+**Requirements:**
+- Helm >= 3.8.0 (for OCI support)
+- Kubernetes >= 1.22
+
+### Option A: From GHCR (Recommended)
+
+The simplest way to install Bison is directly from GitHub Container Registry:
+
+```bash
+# Install specific version from GHCR
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace
+
+# Or pull the chart first, then install
+helm pull oci://ghcr.io/supermarioyl/bison/bison --version 0.0.2
+helm install bison bison-0.0.2.tgz \
+  --namespace bison-system \
+  --create-namespace
+
+# Customize installation
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true \
+  --set apiServer.image.tag=0.0.2 \
+  --set webUI.image.tag=0.0.2
+```
+
+**Why GHCR OCI Format?**
+- ✅ No separate Helm repository maintenance needed
+- ✅ Unified with Docker images in GHCR
+- ✅ Faster installation (direct registry pull)
+- ✅ Modern Helm 3.8+ standard practice
+
+### Option B: From GitHub Release
+
+Download a specific version from GitHub Releases:
+
+```bash
+# Download Helm chart
+VERSION=0.0.2
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# Install the chart
+helm install bison bison-${VERSION}.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+### Option C: From Source
+
+Clone and build from source:
+
+```bash
+# Clone repository
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
+
+# Install dependencies and build
+make install-deps
+make build
+
+# Deploy using Helm
+helm install bison ./deploy/charts/bison \
+  --namespace bison-system \
+  --create-namespace
+```
+
+## Configuration Options
+
+Bison can be configured using Helm values. Here are the key configuration options:
+
+### Basic Configuration
+
+```yaml
+# values.yaml
+apiServer:
+  image:
+    repository: ghcr.io/supermarioyl/bison/api-server
+    tag: 0.0.1
+  replicas: 2
+
+webUI:
+  image:
+    repository: ghcr.io/supermarioyl/bison/web-ui
+    tag: 0.0.1
+  replicas: 2
+
+# OpenCost URL
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# Authentication
+auth:
+  enabled: false
+```
+
+### Custom Configuration Example
+
+```bash
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set apiServer.replicas=3 \
+  --set webUI.replicas=3 \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true
+```
+
+## Verify Installation
+
+After installation, verify that all components are running:
+
+```bash
+# Check pod status
+kubectl get pods -n bison-system
+
+# Expected output:
+# NAME                              READY   STATUS    RESTARTS   AGE
+# bison-api-server-xxxxxxxxx-xxxxx  1/1     Running   0          2m
+# bison-webui-xxxxxxxxx-xxxxx       1/1     Running   0          2m
+
+# Check services
+kubectl get svc -n bison-system
+
+# Check logs
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl logs -n bison-system deployment/bison-webui
+```
+
+## Access the Platform
+
+### Port Forward (Development)
+
+```bash
+# Port-forward the Web UI
+kubectl port-forward -n bison-system svc/bison-webui 3000:80
+
+# Access at http://localhost:3000
+```
+
+### Ingress (Production)
+
+For production deployments, configure an Ingress:
+
+```yaml
+# ingress.yaml
+apiVersion: networking.k8s.io/v1
+kind: Ingress
+metadata:
+  name: bison-ingress
+  namespace: bison-system
+  annotations:
+    kubernetes.io/ingress.class: nginx
+spec:
+  rules:
+  - host: bison.example.com
+    http:
+      paths:
+      - path: /
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-webui
+            port:
+              number: 80
+      - path: /api
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-api-server
+            port:
+              number: 8080
+```
+
+Apply the Ingress:
+
+```bash
+kubectl apply -f ingress.yaml
+```
+
+## Docker Images
+
+Bison images are available on GitHub Container Registry:
+
+```bash
+# Pull images
+docker pull ghcr.io/supermarioyl/bison/api-server:0.0.1
+docker pull ghcr.io/supermarioyl/bison/web-ui:0.0.1
+
+# Or use latest
+docker pull ghcr.io/supermarioyl/bison/api-server:latest
+docker pull ghcr.io/supermarioyl/bison/web-ui:latest
+```
+
+**Supported Platforms:**
+- `linux/amd64`
+- `linux/arm64`
+
+## Upgrading
+
+To upgrade Bison to a new version:
+
+```bash
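+# Charts are pulled directly from the OCI registry, so no `helm repo update` is needed
+
+# Upgrade to the latest published chart version
+helm upgrade bison oci://ghcr.io/supermarioyl/bison/bison --namespace bison-system
+
+# Or upgrade to a specific version
+helm upgrade bison oci://ghcr.io/supermarioyl/bison/bison --version 0.0.2 --namespace bison-system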
+```
+
+## Uninstalling
+
+To completely remove Bison:
+
+```bash
+# Uninstall Helm release
+helm uninstall bison --namespace bison-system
+
+# Remove namespace (optional)
+kubectl delete namespace bison-system
+```
+
+## Troubleshooting
+
+### Pod Not Starting
+
+Check pod logs for errors:
+
+```bash
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl describe pod -n bison-system <pod-name>
+```
+
+### Cannot Connect to OpenCost
+
+Verify OpenCost is running and accessible:
+
+```bash
+kubectl get svc -n opencost-system
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+
+# Test endpoint (from a second terminal while the port-forward is running)
+curl http://localhost:9003/healthz
+```
+
+### Authentication Issues
+
+If authentication is enabled, ensure you have the correct credentials:
+
+```bash
+# Default credentials (change in production!)
+Username: admin
+Password: admin
+```
+
+## Next Steps
+
+- [Configuration Guide](configuration.md) - Configure billing and settings
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Understand the system design
diff --git a/website/versioned_docs/version-0.0.7/intro.md b/website/versioned_docs/version-0.0.7/intro.md
new file mode 100644
index 0000000..b3dc3aa
--- /dev/null
+++ b/website/versioned_docs/version-0.0.7/intro.md
@@ -0,0 +1,167 @@
+---
+sidebar_position: 1
+slug: /
+---
+
+# Introduction to Bison
+
+![Bison Logo](/img/logo.png)
+
+**Enterprise GPU Resource Billing & Multi-Tenant Management Platform**
+
+Bison is a Kubernetes-based platform that provides comprehensive GPU resource management, billing, and multi-tenant isolation for organizations running shared GPU clusters.
+
+## The GPU Management Challenge
+
+Managing shared GPU clusters across multiple teams creates critical operational and financial challenges:
+
+**For Platform Administrators:**
+- How do you fairly allocate expensive GPU resources across competing teams?
+- How do you prevent resource hogging while ensuring everyone gets their fair share?
+- How do you track who's using what and implement accurate chargeback?
+- How do you maintain strict multi-tenant isolation without complex manual configuration?
+
+**For Finance & Budget Teams:**
+- How do you implement automated chargeback for GPU usage without manual accounting?
+- How do you prevent budget overruns before they happen?
+- How do you generate accurate cost reports for internal billing?
+
+**For Development Teams:**
+- How do you get predictable, isolated access to GPU resources?
+- How do you know when you're approaching your budget limits?
+- How do you avoid impacting other teams' workloads?
+
+**Traditional Approach:**
+- Manual quota configuration per namespace
+- Excel-based billing calculations
+- No real-time cost visibility
+- Complex multi-tool setup (quota management + cost tracking + billing system)
+- Frequent resource conflicts and budget surprises
+
+## Bison's Integrated Solution
+
+```mermaid
+graph TB
+    subgraph WITHOUT["Without Bison"]
+        P1[❌ Manual Quota Management<br/>Per-namespace configuration]
+        P2[❌ Spreadsheet Billing<br/>Manual calculations & reports]
+        P3[❌ No Resource Isolation<br/>Teams compete for resources]
+        P4[❌ Budget Overruns<br/>No proactive alerts]
+        P5[❌ Complex Tooling<br/>Multiple systems to manage]
+    end
+
+    subgraph WITH["With Bison"]
+        S1[✅ Automated Team Quotas<br/>Capsule-powered isolation]
+        S2[✅ Real-Time Billing<br/>OpenCost integration]
+        S3[✅ True Multi-Tenancy<br/>Shared/Exclusive modes]
+        S4[✅ Proactive Alerts<br/>Balance monitoring & auto-suspend]
+        S5[✅ Unified Platform<br/>Single pane of glass]
+    end
+
+    P1 -.Transform.-> S1
+    P2 -.Transform.-> S2
+    P3 -.Transform.-> S3
+    P4 -.Transform.-> S4
+    P5 -.Transform.-> S5
+
+    style WITHOUT fill:#ffebee
+    style WITH fill:#e8f5e9
+    style S1 fill:#4caf50,color:#fff
+    style S2 fill:#4caf50,color:#fff
+    style S3 fill:#4caf50,color:#fff
+    style S4 fill:#4caf50,color:#fff
+    style S5 fill:#4caf50,color:#fff
+```
+
+**Bison combines:**
+- 🔐 **Kubernetes-native multi-tenancy** (Capsule) - True team isolation with shared or exclusive node pools
+- 💰 **Real-time cost tracking** (OpenCost + Prometheus) - Per-pod, per-namespace, per-team cost visibility
+- 💳 **Automated billing & budgets** - Prepaid balances, auto-deduction, low-balance alerts, and auto-suspension
+- 📊 **Unified dashboard** - Single interface for admins, team leaders, and finance teams
+- 🔧 **No external database** - All state is stored in Kubernetes ConfigMaps (etcd-backed), so there is no separate database to deploy or operate
+
+**Result:** Deploy once, get complete GPU resource management with automated billing in under 30 minutes.
+
+## Quick Start
+
+### Prerequisites
+
+- Kubernetes 1.22+
+- kubectl configured
+- Helm 3.0+
+- Capsule operator (v0.1.0+) installed
+- OpenCost deployed with Prometheus
+
+### Installation
+
+Choose one of the following installation methods:
+
+#### Option A: Using Helm Repository (Recommended)
+
+```bash
+# Add Bison Helm repository
+helm repo add bison https://supermarioyl.github.io/Bison/charts/
+helm repo update
+
+# Install with default configuration
+helm install bison bison/bison --namespace bison-system --create-namespace
+
+# Or customize installation
+helm install bison bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=false
+```
+
+#### Option B: From GitHub Release
+
+```bash
+# Download latest Helm chart
+VERSION=0.0.1
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# Install
+helm install bison bison-${VERSION}.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+#### Option C: From Source
+
+```bash
+# Clone repository
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
+
+# Install dependencies and build
+make install-deps
+make build
+
+# Deploy using Helm
+helm install bison ./deploy/charts/bison \
+  --namespace bison-system \
+  --create-namespace
+```
+
+### Access the Platform
+
+After installation, access Bison through:
+
+```bash
+# Port-forward the Web UI
+kubectl port-forward -n bison-system svc/bison-webui 3000:80
+
+# Access at http://localhost:3000
+# Default credentials (if auth enabled):
+# Username: admin
+# Password: admin (change immediately in production!)
+```
+
+## Next Steps
+
+- [Explore Features](features.md) - Learn about all capabilities
+- [Installation Guide](installation.md) - Detailed installation instructions
+- [User Guides](user-guides/admin.md) - Role-based user guides
+- [Architecture](architecture.md) - Understand the system architecture
+- [Configuration](configuration.md) - Configure billing and settings
diff --git a/website/versioned_docs/version-0.0.7/user-guides/_category_.json b/website/versioned_docs/version-0.0.7/user-guides/_category_.json
new file mode 100644
index 0000000..fe79f61
--- /dev/null
+++ b/website/versioned_docs/version-0.0.7/user-guides/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "User Guides",
+  "position": 4,
+  "link": {
+    "type": "generated-index",
+    "description": "Role-based guides for using Bison effectively."
+  }
+}
diff --git a/website/versioned_docs/version-0.0.7/user-guides/admin.md b/website/versioned_docs/version-0.0.7/user-guides/admin.md
new file mode 100644
index 0000000..a466cbb
--- /dev/null
+++ b/website/versioned_docs/version-0.0.7/user-guides/admin.md
@@ -0,0 +1,176 @@
+---
+sidebar_position: 1
+---
+
+# Administrator Guide
+
+This guide is for platform administrators who deploy, configure, and manage the Bison platform.
+
+## Responsibilities
+
+As a platform administrator, you are responsible for:
+
+- ✅ Deploying and configuring Bison
+- ✅ Creating and managing teams
+- ✅ Setting global billing configuration
+- ✅ Monitoring cluster-wide metrics
+- ✅ Responding to alerts and recharge requests
+
+## Getting Started
+
+### 1. Deploy Bison
+
+Follow the [Installation Guide](../installation.md) to deploy Bison in your Kubernetes cluster.
+
+### 2. Configure Billing
+
+Set up billing rules and pricing:
+
+1. Access the Web UI
+2. Navigate to **Settings** > **Billing Configuration**
+3. Configure:
+   - **Currency**: USD, CNY, EUR, etc.
+   - **CPU Price**: Cost per core-hour
+   - **Memory Price**: Cost per GB-hour
+   - **GPU Price**: Cost per GPU-hour
+4. Click **Save**
+
+### 3. Create First Team
+
+Create a team for your users:
+
+1. Navigate to **Teams** page
+2. Click **Create Team**
+3. Fill in:
+   - **Team Name**: e.g., "ml-team"
+   - **Description**: Team purpose
+   - **Resource Quota**:
+     - CPU: e.g., "20" cores
+     - Memory: e.g., "64Gi"
+     - GPU: e.g., "4"
+   - **Initial Balance**: e.g., 1000.00
+4. Click **Create**
+
+## Common Tasks
+
+### Managing Teams
+
+#### View All Teams
+
+```bash
+# Via kubectl
+kubectl get tenants
+
+# Via API
+curl http://localhost:8080/api/v1/teams
+```
+
+#### Update Team Quota
+
+1. Navigate to **Teams** page
+2. Click **Edit** on the team row
+3. Modify quotas
+4. Click **Save**
+
+#### Recharge Team Balance
+
+1. Navigate to **Teams** page
+2. Click **Recharge** on the team row
+3. Enter amount
+4. Add notes (optional)
+5. Click **Confirm**
+
+### Monitoring
+
+#### View Dashboard
+
+Access real-time cluster metrics:
+- Total teams and projects
+- Resource utilization
+- Cost trends
+- Top consumers
+- Balance status
+
+#### Check Alerts
+
+Monitor low-balance and quota alerts:
+1. Navigate to **Alerts** page
+2. Review active alerts
+3. Take action as needed
+
+### Billing Configuration
+
+#### Update Pricing
+
+```bash
+curl -X PUT http://localhost:8080/api/v1/billing/config \
+  -H "Content-Type: application/json" \
+  -d '{
+    "pricing": {
+      "cpu": 0.06,
+      "memory": 0.012,
+      "nvidia.com/gpu": 3.00
+    }
+  }'
+```
+
+#### Configure Alert Thresholds
+
+```json
+{
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## Best Practices
+
+### Team Naming
+- Use lowercase, alphanumeric characters and hyphens
+- Example: `ml-team`, `data-science`, `dev-team`
+
+### Quota Allocation
+- Start with conservative quotas
+- Monitor usage for 1-2 weeks
+- Adjust based on actual needs
+
+### Balance Management
+- Set up auto-recharge for critical teams
+- Monitor balance trends weekly
+- Respond to low-balance alerts promptly
+
+### Security
+- Enable authentication in production
+- Use OIDC/SSO for enterprise deployments
+- Regularly audit user permissions
+
+## Troubleshooting
+
+### Team Creation Failed
+
+Check Capsule operator logs:
+```bash
+kubectl logs -n capsule-system deployment/capsule-controller-manager
+```
+
+### Billing Not Working
+
+Verify OpenCost connectivity (run the `curl` command in a second terminal while the port-forward is active):
+```bash
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+curl http://localhost:9003/healthz
+```
+
+### High Resource Usage
+
+Check resource consumption:
+```bash
+kubectl top pods -n bison-system
+```
+
+## Next Steps
+
+- [Team Leader Guide](team-leader.md) - Guide for team leaders
+- [Developer Guide](developer.md) - Guide for developers
+- [Configuration](../configuration.md) - Advanced configuration
diff --git a/website/versioned_docs/version-0.0.7/user-guides/developer.md b/website/versioned_docs/version-0.0.7/user-guides/developer.md
new file mode 100644
index 0000000..d14ab62
--- /dev/null
+++ b/website/versioned_docs/version-0.0.7/user-guides/developer.md
@@ -0,0 +1,187 @@
+---
+sidebar_position: 3
+---
+
+# Developer Guide
+
+This guide is for developers who deploy workloads and consume resources within team projects.
+
+## Responsibilities
+
+As a developer, you are responsible for:
+
+- ✅ Deploying applications within your project
+- ✅ Monitoring resource usage
+- ✅ Staying within quota limits
+- ✅ Optimizing resource consumption
+
+## Getting Started
+
+### 1. Get Kubeconfig
+
+Request kubeconfig from your team leader or administrator.
+
+### 2. Set Context
+
+```bash
+# Set context to your project namespace
+kubectl config set-context --current --namespace=your-project
+
+# Verify
+kubectl config view --minify | grep namespace
+```
+
+### 3. Check Quota
+
+See your available resources:
+```bash
+kubectl describe quota
+```
+
+## Deploying Workloads
+
+### Basic Pod Deployment
+
+```yaml
+apiVersion: v1
+kind: Pod
+metadata:
+  name: gpu-training-job
+  namespace: your-project
+spec:
+  containers:
+  - name: trainer
+    image: your-ml-image:latest
+    resources:
+      requests:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+      limits:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+```
+
+### Using Deployments
+
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: ml-inference
+  namespace: your-project
+spec:
+  replicas: 2
+  selector:
+    matchLabels:
+      app: ml-inference
+  template:
+    metadata:
+      labels:
+        app: ml-inference
+    spec:
+      containers:
+      - name: inference
+        image: your-inference-image:latest
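+        resources:
+          requests:
+            cpu: "2"
+            memory: "8Gi"
+            nvidia.com/gpu: "1"
+          # GPUs must appear in limits; a GPU request without a matching limit is rejected
+          limits:
+            cpu: "2"
+            memory: "8Gi"
+            nvidia.com/gpu: "1"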
+```
+
+## Monitoring Usage
+
+### Check Pod Resource Usage
+
+```bash
+# View resource consumption
+kubectl top pods
+
+# Detailed pod information
+kubectl describe pod <pod-name>
+```
+
+### View Logs
+
+```bash
+# Stream logs
+kubectl logs -f <pod-name>
+
+# Previous logs (if pod restarted)
+kubectl logs --previous <pod-name>
+```
+
+## Best Practices
+
+### Resource Requests and Limits
+
+Always specify both requests and limits:
+```yaml
+resources:
+  requests:
+    cpu: "2"
+    memory: "8Gi"
+  limits:
+    cpu: "4"
+    memory: "16Gi"
+```
+
+### GPU Usage
+
+- Request GPUs only when needed
+- Use GPUs for compute-intensive tasks
+- Monitor GPU utilization
+
+### Clean Up
+
+Delete resources when no longer needed:
+```bash
+# Delete pod
+kubectl delete pod <pod-name>
+
+# Delete deployment
+kubectl delete deployment <deployment-name>
+
+# Clean up completed jobs
+kubectl delete job --field-selector status.successful=1
+```
+
+### Cost Optimization
+
+- Right-size your resource requests
+- Use horizontal pod autoscaling
+- Clean up idle resources
+- Share GPUs when possible (if supported)
+
+## Troubleshooting
+
+### Pod Pending (Insufficient Quota)
+
+If your pod is stuck in `Pending` state:
+
+```bash
+kubectl describe pod <pod-name>
+```
+
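+Check the **Events** section. Scheduling errors such as `Insufficient nvidia.com/gpu` mean no node can currently fit the pod, so reduce its resource requests. If the pod was never created at all, look for `exceeded quota` errors with `kubectl get events`, then reduce resource requests or ask your team leader for more quota.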
+
+### Out of Memory (OOM)
+
+If pods are killed due to OOM:
+1. Check memory usage patterns
+2. Increase memory limits
+3. Optimize application memory usage
+
+### GPU Not Available
+
+Verify that the cluster nodes have allocatable GPUs:
+```bash
+kubectl get nodes -o custom-columns=NAME:.metadata.name,GPU:.status.allocatable."nvidia\.com/gpu"
+```
+
+## Next Steps
+
+- [Team Leader Guide](team-leader.md) - Understand team management
+- [Architecture](../architecture.md) - Learn about the platform
diff --git a/website/versioned_docs/version-0.0.7/user-guides/team-leader.md b/website/versioned_docs/version-0.0.7/user-guides/team-leader.md
new file mode 100644
index 0000000..7b6de96
--- /dev/null
+++ b/website/versioned_docs/version-0.0.7/user-guides/team-leader.md
@@ -0,0 +1,126 @@
+---
+sidebar_position: 2
+---
+
+# Team Leader Guide
+
+This guide is for team leaders who manage projects, monitor budgets, and allocate resources within their team.
+
+## Responsibilities
+
+As a team leader, you are responsible for:
+
+- ✅ Creating and managing projects (namespaces)
+- ✅ Allocating quotas to projects
+- ✅ Monitoring team balance and consumption
+- ✅ Requesting recharges when needed
+
+## Getting Started
+
+### 1. Access Bison
+
+Log in to the Web UI with your credentials.
+
+### 2. View Team Dashboard
+
+Your dashboard shows:
+- Team balance and status
+- Resource utilization
+- Active projects
+- Cost trends
+
+## Managing Projects
+
+### Create a Project
+
+1. Navigate to **Projects** page
+2. Click **Create Project**
+3. Fill in:
+   - **Project Name**: e.g., "training-ml-models"
+   - **Description**: Project purpose
+   - **Quota** (optional):
+     - CPU: e.g., "8" cores
+     - Memory: e.g., "32Gi"
+     - GPU: e.g., "2"
+4. Click **Create**
+
+### List Projects
+
+```bash
+# Via kubectl (if you have access)
+kubectl get namespaces -l capsule.clastix.io/tenant=your-team
+
+# Via API
+curl http://localhost:8080/api/v1/teams/your-team/projects
+```
+
+### Delete a Project
+
+1. Navigate to **Projects** page
+2. Click **Delete** on the project row
+3. Confirm deletion
+
+**Warning**: This will delete all resources in the project!
+
+## Monitoring Budget
+
+### Check Balance
+
+View your current balance:
+1. Navigate to **Team** page
+2. See balance in the status card
+
+### View Usage Trends
+
+Analyze spending patterns:
+1. Navigate to **Reports** page
+2. Select time range (7 days, 30 days, 90 days)
+3. View:
+   - Cost breakdown by resource type
+   - Daily cost trends
+   - Per-project consumption
+
+### Request Recharge
+
+When balance is low:
+1. Click **Request Recharge** button
+2. Enter requested amount
+3. Add justification
+4. Submit request to administrator
+
+## Resource Management
+
+### Monitor Quota Usage
+
+Check how much of your quota is being used:
+```bash
+kubectl describe quota -n your-project
+```
+
+### Optimize Costs
+
+Tips to reduce spending:
+- **Right-size resources**: Don't over-provision CPU/Memory
+- **Clean up idle pods**: Delete unused workloads
+- **Use spot/preemptible instances**: Where applicable
+- **Monitor GPU utilization**: Ensure GPUs are fully utilized
+
+## Best Practices
+
+### Project Organization
+- Create separate projects for different workloads
+- Example: `ml-training`, `ml-inference`, `data-processing`
+
+### Quota Allocation
+- Allocate quotas based on project priority
+- Reserve buffer for urgent tasks
+
+### Cost Awareness
+- Review costs weekly
+- Identify and eliminate waste
+- Set up cost alerts
+
+## Next Steps
+
+- [Developer Guide](developer.md) - Guide for your team members
+- [Features](../features.md) - Explore all Bison features
diff --git a/website/versioned_docs/version-0.0.8/architecture.md b/website/versioned_docs/version-0.0.8/architecture.md
new file mode 100644
index 0000000..dbbe50d
--- /dev/null
+++ b/website/versioned_docs/version-0.0.8/architecture.md
@@ -0,0 +1,418 @@
+---
+sidebar_position: 5
+---
+
+# Architecture
+
+This document provides a technical overview of Bison's architecture, designed with high cohesion and low coupling principles for maintainability and scalability.
+
+## System Overview
+
+### High-Level Architecture
+
+```mermaid
+graph TB
+    subgraph PRESENT[Presentation Layer]
+        WEB[Web UI<br/>React 18 + Ant Design 5]
+        CLI[kubectl / API Client]
+    end
+
+    subgraph GATEWAY[API Gateway Layer]
+        GW[API Server<br/>Go + Gin Framework]
+        AUTH[Auth Middleware<br/>JWT + OIDC]
+    end
+
+    subgraph BUSINESS[Business Logic Layer]
+        TS[Tenant Service<br/>Team & Project CRUD]
+        BS[Billing Service<br/>Cost Calculation]
+        BLS[Balance Service<br/>Wallet Management]
+        QS[Quota Service<br/>Resource Limits]
+        AS[Alert Service<br/>Notifications]
+        RS[Report Service<br/>Analytics]
+    end
+
+    subgraph INTEGRATION[Integration Layer]
+        K8S[Kubernetes Client<br/>client-go]
+        OCC[OpenCost Client<br/>REST API]
+        PC[Prometheus Client<br/>PromQL]
+    end
+
+    subgraph EXTERNAL[External Systems]
+        KAPI[Kubernetes API]
+        CAP[Capsule Controller]
+        OC[OpenCost]
+        PROM[Prometheus]
+    end
+
+    subgraph DATA[Data Layer]
+        CM[ConfigMaps<br/>Persistent Storage]
+    end
+
+    WEB --> GW
+    CLI --> GW
+    GW --> AUTH
+    AUTH --> TS & BS & BLS & QS & AS & RS
+
+    TS --> K8S
+    BS --> OCC
+    BLS --> K8S
+    QS --> K8S
+    RS --> OCC & PC
+
+    K8S --> KAPI
+    K8S --> CAP
+    OCC --> OC
+    PC --> PROM
+
+    TS & BLS --> CM
+    KAPI --> CM
+```
+
+### Design Principles
+
+| Principle | Implementation |
+|-----------|----------------|
+| **High Cohesion** | Each service handles a single domain (billing, quota, alerts) |
+| **Low Coupling** | Services communicate via well-defined interfaces |
+| **Stateless API** | All state persisted in Kubernetes ConfigMaps |
+| **Cloud Native** | Leverages Kubernetes primitives for HA and scaling |
+| **Zero Database** | ConfigMaps eliminate external database dependencies |
+
+## Architecture Layers
+
+Bison follows a layered architecture pattern:
+
+### 1. Presentation Layer
+- **Web UI**: React 18 + TypeScript + Ant Design 5
+- **API Client**: REST API for external integrations
+
+### 2. API Gateway Layer
+- **API Server**: Go + Gin framework
+- **Authentication**: JWT and OIDC support
+- **Middleware**: Logging, recovery, CORS handling
+
+### 3. Business Logic Layer
+- **Tenant Service**: Team and project management
+- **Billing Service**: Cost calculation and aggregation
+- **Balance Service**: Wallet management and auto-deduction
+- **Quota Service**: Resource limit enforcement
+- **Alert Service**: Multi-channel notifications
+- **Report Service**: Analytics and export
+
+### 4. Integration Layer
+- **Kubernetes Client**: client-go for K8s API interaction
+- **OpenCost Client**: REST API for cost data
+- **Prometheus Client**: PromQL queries for metrics
+
+### 5. Data Layer
+- **ConfigMaps**: Persistent storage for balances, billing config, and metadata
+- **etcd**: Backing store for the Kubernetes ConfigMaps
+
+## Core Components
+
+### API Server
+
+The API server is the central component that handles all HTTP requests:
+
+**Technology Stack:**
+- Go 1.24+
+- Gin web framework
+- client-go for Kubernetes API
+
+**Key Responsibilities:**
+- Serve REST API endpoints
+- Authentication and authorization
+- Request routing and middleware
+- Background task scheduling
+
+**Endpoints:**
+```
+/api/v1/teams          - Team management
+/api/v1/projects       - Project management
+/api/v1/billing        - Billing configuration
+/api/v1/balance        - Balance operations
+/api/v1/stats          - Statistics and reports
+```
+
+### Web UI
+
+React-based single-page application:
+
+**Technology Stack:**
+- React 18
+- TypeScript
+- Vite (build tool)
+- Ant Design 5
+- ECharts (visualization)
+- React Query (state management)
+
+**Features:**
+- Dashboard with real-time metrics
+- Team and project management
+- Billing configuration
+- Balance monitoring
+- Usage reports and export
+
+### Billing Service
+
+Calculates costs based on resource usage:
+
+**Data Flow:**
+```mermaid
+sequenceDiagram
+    participant S as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant K8S as Kubernetes
+
+    S->>BS: Trigger billing (every 10min)
+    BS->>OC: Query team costs
+    OC-->>BS: Return usage data
+    BS->>BS: Calculate cost
+    BS->>BLS: Deduct from balance
+    BLS->>K8S: Update ConfigMap
+    BLS-->>BS: Confirm
+    BS->>AS: Check threshold
+    alt Balance low
+        AS->>Webhook: Send alert
+    end
+```
+
+**Billing Formula:**
+```
+Total Cost = (CPU_cores × CPU_price × hours) +
+             (Memory_GB × Memory_price × hours) +
+             (GPU_count × GPU_price × hours)
+```
+
+### Balance Service
+
+Manages team wallets and auto-deduction:
+
+**Features:**
+- Real-time balance tracking
+- Auto-deduction based on usage
+- Recharge operations
+- Transaction history
+- Auto-suspension when balance depleted
+
+**Storage:**
+```yaml
+apiVersion: v1
+kind: ConfigMap
+metadata:
+  name: bison-team-balances
+  namespace: bison-system
+data:
+  ml-team: "1523.45"
+  data-team: "890.12"
+  dev-team: "2100.00"
+```
+
+### Tenant Service
+
+Manages teams (Capsule Tenants) and projects (Namespaces):
+
+**Features:**
+- Create/delete teams
+- Assign resource quotas
+- Configure node pools (shared/exclusive)
+- Manage team metadata
+
+**Capsule Integration:**
+```yaml
+apiVersion: capsule.clastix.io/v1beta1
+kind: Tenant
+metadata:
+  name: ml-team
+spec:
+  owners:
+  - name: team-leader
+    kind: User
+  resourceQuota:
+    items:
+    - hard:
+        cpu: "20"
+        memory: 64Gi
+        requests.nvidia.com/gpu: "4"
+```
+
+## Data Flow
+
+### Team Creation Flow
+
+```mermaid
+sequenceDiagram
+    participant U as Admin
+    participant API as API Server
+    participant TS as Tenant Service
+    participant K8S as Kubernetes
+    participant CAP as Capsule
+
+    U->>API: POST /api/v1/teams
+    API->>TS: CreateTeam(name, quota, balance)
+    TS->>CAP: Create Tenant
+    CAP-->>TS: Tenant created
+    TS->>K8S: Create ConfigMap (balance)
+    K8S-->>TS: ConfigMap created
+    TS-->>API: Success
+    API-->>U: 201 Created
+```
+
+### Billing Cycle Flow
+
+```mermaid
+sequenceDiagram
+    participant SCH as Scheduler
+    participant BS as Billing Service
+    participant OC as OpenCost
+    participant BLS as Balance Service
+    participant AS as Alert Service
+
+    loop Every 10 minutes
+        SCH->>BS: Trigger billing calculation
+        BS->>OC: Query costs (last 10min)
+        OC-->>BS: Return usage metrics
+        BS->>BS: Calculate total cost
+        BS->>BLS: Deduct cost from balance
+        BLS->>BLS: Update balance
+        BLS-->>BS: Balance updated
+        BS->>AS: Check balance threshold
+        alt Balance < 20%
+            AS->>AS: Send low balance alert
+        end
+        alt Balance <= 0
+            AS->>BS: Suspend team workloads
+        end
+    end
+```
+
+## Integration Points
+
+### Kubernetes Integration
+
+Bison integrates deeply with Kubernetes:
+
+- **Capsule Tenants** for multi-tenancy
+- **ResourceQuotas** for limit enforcement
+- **Namespaces** for project isolation
+- **ConfigMaps** for data persistence
+- **RBAC** for access control
+
+### OpenCost Integration
+
+Real-time cost tracking via OpenCost API:
+
+```text
+# Query team costs
+GET /allocation/compute?window=10m&aggregate=namespace&filter=namespace:ml-team
+
+# Response
+{
+  "ml-team": {
+    "cpuCost": 0.25,
+    "memCost": 0.10,
+    "gpuCost": 4.17,
+    "totalCost": 4.52
+  }
+}
+```
+
+### Prometheus Integration
+
+Metrics collection for monitoring:
+
+- Resource utilization metrics
+- Cost metrics
+- Balance metrics
+- Alert metrics
+
+## Deployment Architecture
+
+### High Availability Setup
+
+```mermaid
+graph TB
+    subgraph K8S[Kubernetes Cluster]
+        subgraph NS1[bison-system namespace]
+            API1[API Server Pod 1]
+            API2[API Server Pod 2]
+            WEB1[Web UI Pod 1]
+            WEB2[Web UI Pod 2]
+        end
+
+        subgraph NS2[opencost-system namespace]
+            OC[OpenCost]
+        end
+
+        subgraph NS3[prometheus-system namespace]
+            PROM[Prometheus]
+        end
+
+        LB[LoadBalancer]
+    end
+
+    LB --> API1 & API2
+    LB --> WEB1 & WEB2
+    API1 & API2 --> OC
+    OC --> PROM
+```
+
+### Resource Requirements
+
+**Minimum:**
+- API Server: 200m CPU, 256Mi Memory
+- Web UI: 100m CPU, 128Mi Memory
+
+**Recommended (Production):**
+- API Server: 1000m CPU, 512Mi Memory (2 replicas)
+- Web UI: 500m CPU, 256Mi Memory (2 replicas)
+
+## Security Model
+
+### Authentication
+- JWT token-based authentication
+- OIDC/SSO integration
+- Admin user management
+
+### Authorization
+- Kubernetes RBAC integration
+- Role-based access control
+- Team-scoped permissions
+
+### Data Security
+- Data encrypted at rest when etcd encryption is enabled for ConfigMaps in the cluster (not enabled by default)
+- TLS for API communication
+- Secret management via Kubernetes Secrets
+
+## Technology Stack
+
+### Backend
+- **Language**: Go 1.24+
+- **Framework**: Gin
+- **Kubernetes Client**: client-go
+- **Configuration**: Viper
+- **Logging**: Logrus
+
+### Frontend
+- **Framework**: React 18
+- **Language**: TypeScript
+- **UI Library**: Ant Design 5
+- **Build Tool**: Vite
+- **State Management**: React Query
+- **Charts**: ECharts
+
+### Infrastructure
+- **Platform**: Kubernetes 1.22+
+- **Multi-Tenancy**: Capsule
+- **Cost Tracking**: OpenCost
+- **Metrics**: Prometheus
+- **Storage**: ConfigMaps (etcd)
+
+## Next Steps
+
+- [Installation Guide](installation.md) - Deploy Bison
+- [Configuration](configuration.md) - Configure billing
+- [User Guides](user-guides/admin.md) - Learn to use Bison
+- [Features](features.md) - Explore capabilities
diff --git a/website/versioned_docs/version-0.0.8/configuration.md b/website/versioned_docs/version-0.0.8/configuration.md
new file mode 100644
index 0000000..539aaa3
--- /dev/null
+++ b/website/versioned_docs/version-0.0.8/configuration.md
@@ -0,0 +1,361 @@
+---
+sidebar_position: 6
+---
+
+# Configuration
+
+This guide covers how to configure Bison for your specific environment and requirements.
+
+## Helm Chart Configuration
+
+Bison is configured primarily through Helm values. You can customize the installation by providing a `values.yaml` file or using `--set` flags.
+
+### Key Configuration Parameters
+
+| Parameter | Description | Default | Example |
+|-----------|-------------|---------|---------|
+| `auth.enabled` | Enable authentication | `false` | `true` |
+| `auth.admin.username` | Admin username | `admin` | `admin` |
+| `auth.admin.password` | Admin password | `admin` | `changeme` |
+| `apiServer.replicaCount` | API server replicas | `2` | `3` |
+| `apiServer.image.repository` | API server image | `ghcr.io/supermarioyl/bison/api-server` | - |
+| `apiServer.image.tag` | API server image tag | `0.0.1` | `latest` |
+| `webUI.replicaCount` | Web UI replicas | `2` | `3` |
+| `webUI.image.repository` | Web UI image | `ghcr.io/supermarioyl/bison/web-ui` | - |
+| `webUI.image.tag` | Web UI image tag | `0.0.1` | `latest` |
+| `opencost.url` | OpenCost API endpoint | `http://opencost.opencost-system.svc:9003` | Custom URL |
+
+### Example Custom Values
+
+Create a `custom-values.yaml` file:
+
+```yaml
+# Authentication
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: MySecurePassword123
+
+# API Server
+apiServer:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 200m
+      memory: 256Mi
+    limits:
+      cpu: 1000m
+      memory: 512Mi
+
+# Web UI
+webUI:
+  replicaCount: 3
+  image:
+    tag: 0.0.1
+  resources:
+    requests:
+      cpu: 100m
+      memory: 128Mi
+    limits:
+      cpu: 500m
+      memory: 256Mi
+
+# OpenCost Integration
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# Node Selection (optional)
+nodeSelector:
+  node-role.kubernetes.io/control-plane: ""
+
+# Tolerations (optional)
+tolerations:
+  - key: node-role.kubernetes.io/control-plane
+    operator: Exists
+    effect: NoSchedule
+```
+
+Install with custom values:
+
+```bash
+helm install bison bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --values custom-values.yaml
+```
+
+## Billing Configuration
+
+Billing settings are configured through the Web UI or API after installation.
+
+### Access Billing Configuration
+
+1. **Via Web UI:**
+   - Navigate to **Settings** > **Billing Configuration**
+   - Set pricing for CPU, Memory, GPU, and other resources
+   - Configure currency and billing intervals
+
+2. **Via API:**
+   ```bash
+   curl -X POST http://localhost:8080/api/v1/billing/config \
+     -H "Content-Type: application/json" \
+     -d '{
+       "enabled": true,
+       "currency": "USD",
+       "pricing": {
+         "cpu": 0.05,
+         "memory": 0.01,
+         "nvidia.com/gpu": 2.50
+       },
+       "billingInterval": "hourly"
+     }'
+   ```
+
+### Billing Parameters
+
+| Parameter | Description | Example |
+|-----------|-------------|---------|
+| `enabled` | Enable/disable billing | `true` |
+| `currency` | Currency for billing | `USD`, `CNY`, `EUR` |
+| `pricing.cpu` | CPU price per core-hour | `0.05` |
+| `pricing.memory` | Memory price per GB-hour | `0.01` |
+| `pricing["nvidia.com/gpu"]` | GPU price per GPU-hour | `2.50` |
+| `billingInterval` | Billing aggregation period | `hourly`, `daily` |
+| `lowBalanceThreshold` | Warning threshold (%) | `20` |
+| `suspendThreshold` | Auto-suspend threshold (%) | `5` |
+
+### Example Billing Configuration
+
+```json
+{
+  "enabled": true,
+  "currency": "USD",
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "nvidia.com/mig-1g.5gb": 0.50,
+    "nvidia.com/mig-2g.10gb": 1.00
+  },
+  "billingInterval": "hourly",
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## Team Configuration
+
+### Creating Teams
+
+Teams can be created through the Web UI or API:
+
+**Via Web UI:**
+1. Navigate to **Teams** page
+2. Click **Create Team**
+3. Set team name, quota, and initial balance
+
+**Via API:**
+```bash
+curl -X POST http://localhost:8080/api/v1/teams \
+  -H "Content-Type: application/json" \
+  -d '{
+    "name": "ml-team",
+    "description": "Machine Learning Team",
+    "quota": {
+      "cpu": "20",
+      "memory": "64Gi",
+      "nvidia.com/gpu": "4"
+    },
+    "balance": 1000.00
+  }'
+```
+
+### Team Quotas
+
+Team quotas define resource limits:
+
+```yaml
+quota:
+  cpu: "20"              # 20 CPU cores
+  memory: "64Gi"         # 64 GB RAM
+  nvidia.com/gpu: "4"    # 4 GPUs
+  storage: "500Gi"       # 500 GB storage
+```
+
+### Team Balance Management
+
+Set initial balance and configure auto-recharge:
+
+```json
+{
+  "balance": 1000.00,
+  "autoRecharge": {
+    "enabled": true,
+    "amount": 500.00,
+    "schedule": "monthly",
+    "threshold": 100.00
+  }
+}
+```
+
+## Alert Configuration
+
+Configure multi-channel alerts for low balance and quota warnings.
+
+### Webhook Alerts
+
+```json
+{
+  "type": "webhook",
+  "enabled": true,
+  "url": "https://your-webhook-endpoint.com/alerts",
+  "headers": {
+    "Authorization": "Bearer YOUR_TOKEN"
+  },
+  "template": {
+    "title": "Bison Alert",
+    "message": "Team {{.TeamName}} balance is {{.Balance}}"
+  }
+}
+```
+
+### DingTalk Alerts
+
+```json
+{
+  "type": "dingtalk",
+  "enabled": true,
+  "webhook": "https://oapi.dingtalk.com/robot/send?access_token=YOUR_TOKEN",
+  "secret": "YOUR_SECRET"
+}
+```
+
+### WeChat Work Alerts
+
+```json
+{
+  "type": "wechat",
+  "enabled": true,
+  "corpid": "YOUR_CORP_ID",
+  "corpsecret": "YOUR_CORP_SECRET",
+  "agentid": 1000001
+}
+```
+
+## OpenCost Integration
+
+Configure OpenCost connection:
+
+### Check OpenCost Connectivity
+
+```bash
+# Test OpenCost API (port-forward blocks; run it in a separate terminal)
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+curl http://localhost:9003/healthz
+
+# Test allocation API
+curl "http://localhost:9003/allocation/compute?window=1d"
+```
+
+### Update OpenCost URL
+
+If OpenCost is deployed in a different namespace or with a different service name:
+
+```bash
+helm upgrade bison bison/bison \
+  --set opencost.url=http://my-opencost.custom-namespace.svc:9003 \
+  --namespace bison-system
+```
+
+## Authentication & OIDC
+
+Enable authentication and integrate with your SSO provider:
+
+### Basic Authentication
+
+```yaml
+auth:
+  enabled: true
+  admin:
+    username: admin
+    password: SecurePassword123
+```
+
+### OIDC Integration
+
+```yaml
+auth:
+  enabled: true
+  oidc:
+    enabled: true
+    issuerURL: https://your-oidc-provider.com
+    clientID: bison-client-id
+    clientSecret: your-client-secret
+    redirectURL: https://bison.example.com/callback
+```
+
+## Environment Variables
+
+Additional configuration can be provided via environment variables:
+
+| Variable | Description | Default |
+|----------|-------------|---------|
+| `KUBECONFIG` | Path to kubeconfig file | In-cluster config |
+| `OPENCOST_URL` | OpenCost API URL | `http://opencost.opencost-system.svc:9003` |
+| `AUTH_ENABLED` | Enable authentication | `false` |
+| `LOG_LEVEL` | Logging level | `info` |
+| `BILLING_INTERVAL` | Billing calculation interval | `10m` |
+
+Set environment variables in Helm values:
+
+```yaml
+apiServer:
+  env:
+    - name: LOG_LEVEL
+      value: debug
+    - name: BILLING_INTERVAL
+      value: 5m
+```
+
+## Advanced Configuration
+
+### Custom Resource Pricing
+
+Price any Kubernetes resource:
+
+```json
+{
+  "pricing": {
+    "cpu": 0.05,
+    "memory": 0.01,
+    "nvidia.com/gpu": 2.50,
+    "amd.com/gpu": 2.00,
+    "ephemeral-storage": 0.001,
+    "custom.io/fpga": 5.00
+  }
+}
+```
+
+### Multi-Cluster Support
+
+Deploy Bison in each cluster with shared billing:
+
+```yaml
+# Cluster A
+apiServer:
+  clusterName: prod-us-west
+
+# Cluster B
+apiServer:
+  clusterName: prod-us-east
+```
+
+## Next Steps
+
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Understand the system design
+- [Features](features.md) - Explore all capabilities
diff --git a/website/versioned_docs/version-0.0.8/features.md b/website/versioned_docs/version-0.0.8/features.md
new file mode 100644
index 0000000..8d0c438
--- /dev/null
+++ b/website/versioned_docs/version-0.0.8/features.md
@@ -0,0 +1,195 @@
+---
+sidebar_position: 2
+---
+
+# Features
+
+Bison provides a comprehensive suite of features for GPU resource management, billing, and multi-tenant isolation in Kubernetes environments.
+
+## See Bison in Action
+
+### 🎯 Real-Time Resource Dashboard
+
+![Bison Dashboard](/img/ui-dashboard.png)
+
+**What you see:**
+- **Cluster Overview** - Total teams, projects, resource pools, and quotas at a glance
+- **Resource Utilization** - Visual breakdown showing which teams are consuming resources
+- **7-Day Cost Trends** - Historical cost data to identify spending patterns
+- **Top 5 Cost Rankings** - Quickly identify heavy GPU consumers
+- **Team Budget Status** - Real-time balance monitoring with color-coded alerts
+
+**Who benefits:**
+- **Platform Administrators** get instant visibility into cluster health and usage patterns
+- **Finance Teams** can track costs in real-time without waiting for monthly reports
+- **Team Leaders** can compare their usage against other teams
+
+---
+
+### 💼 Team Management & Budget Monitoring
+
+![Team Management](/img/ui-team.png)
+
+**What you see:**
+- **Team List** with real-time status indicators:
+  - 🟢 Green balance = Healthy budget
+  - 🟡 Yellow balance = Approaching threshold
+  - 🔴 Red balance = Low balance or suspended
+- **Resource Allocation** - CPU/Memory/GPU quotas per team (e.g., "cpu 0/10" means 0 used out of 10 allocated)
+- **Project Count** - Number of namespaces/projects under each team
+- **Quick Actions** - Edit quotas, recharge balance, or delete team with one click
+
+**Who benefits:**
+- **Team Leaders** monitor their budget status and resource usage at a glance
+- **Administrators** manage multiple teams from a single unified view
+- **Finance Teams** see which teams need recharging
+
+---
+
+### 💰 Flexible Billing Configuration
+
+![Billing Configuration](/img/ui-billing.png)
+
+**What you see:**
+- **Per-Resource Pricing** - Set custom prices for CPU (per core-hour), Memory (per GB-hour), GPU (per GPU-hour)
+- **Currency Selection** - Support for CNY, USD, EUR, and other currencies
+- **Enable/Disable Toggle** - Turn billing on/off for specific resources with one click
+- **Billing Rules** - Define how resources are metered (hourly, daily, etc.)
+- **Alert Thresholds** - Configure when to send low-balance warnings
+
+**Who benefits:**
+- **Finance Teams** align cloud costs with internal chargeback policies
+- **Administrators** adjust pricing based on actual hardware costs
+- **Budget Managers** set appropriate warning thresholds to prevent overruns
+
+---
+
+## Core Capabilities
+
+### Multi-Tenant Management
+✅ **Capsule-Powered Isolation** - True multi-tenancy using Kubernetes-native Capsule operator
+✅ **OIDC Integration** - Enterprise SSO support for authentication
+✅ **Team-Based Access Control** - Manage users, roles, and permissions per team
+✅ **Shared & Exclusive Node Pools** - Flexible resource allocation strategies
+
+### Real-Time Billing
+✅ **Usage-Based Billing** - Accurate cost tracking based on actual resource consumption
+✅ **Configurable Pricing** - Set custom rates for CPU, Memory, GPU, and any Kubernetes resource
+✅ **Multi-Currency Support** - CNY, USD, EUR, and more
+✅ **Billing Rules Engine** - Define custom billing logic and aggregation periods
+
+### Dynamic Resource Quotas
+✅ **Per-Team Quotas** - CPU, Memory, GPU, Storage, and custom resources
+✅ **Namespace Quotas** - Project-level resource limits within teams
+✅ **Auto-Enforcement** - Kubernetes-native quota enforcement
+✅ **Quota Alerts** - Notifications when approaching limits
+
+### Team Balance & Wallet System
+✅ **Prepaid Balances** - Team wallets with real-time deduction
+✅ **Auto-Deduction** - Automated billing based on resource usage
+✅ **Balance Thresholds** - Configurable warning and suspension levels
+✅ **Transaction History** - Complete audit trail of all balance changes
+
+### Auto-Recharge
+✅ **Scheduled Top-Ups** - Weekly or monthly automatic recharges
+✅ **Custom Amounts** - Flexible recharge amounts per team
+✅ **Recharge Notifications** - Alert teams when balance is added
+
+### Balance Alerts
+✅ **Multi-Channel Notifications** - Webhook, DingTalk, WeChat, Email
+✅ **Configurable Thresholds** - Set warning levels (e.g., 20%, 10%, 5%)
+✅ **Auto-Suspension** - Automatically suspend workloads when balance depleted
+✅ **Custom Templates** - Customize alert messages
+
+### Usage Reports
+✅ **Team Analytics** - Per-team cost breakdowns and trends
+✅ **Project Analytics** - Namespace-level resource consumption
+✅ **Export Capabilities** - CSV, Excel, PDF reports
+✅ **Historical Data** - 30/60/90-day cost analysis
+
+### Audit Logging
+✅ **Complete Operation History** - Track all administrative actions
+✅ **User Attribution** - Who did what and when
+✅ **Resource Changes** - Track quota, balance, and configuration changes
+✅ **Compliance Ready** - Meet internal audit requirements
+
+---
+
+## Architecture Highlights
+
+Bison's architecture is designed for simplicity, scalability, and zero external dependencies.
+
+```mermaid
+graph TB
+    subgraph USER_LAYER[User Layer]
+        UI[Web UI<br/>React + Ant Design]
+        API[REST API<br/>Go + Gin]
+    end
+
+    subgraph CORE[Core Services]
+        BS[Billing Service]
+        TS[Tenant Service]
+        QS[Quota Service]
+    end
+
+    subgraph K8S[Kubernetes Layer]
+        CA[Capsule<br/>Multi-Tenancy]
+        OC[OpenCost<br/>Cost Tracking]
+        PR[Prometheus<br/>Metrics]
+    end
+
+    subgraph DATA[Data Layer]
+        CM[ConfigMaps<br/>Zero Database]
+    end
+
+    UI --> API
+    API --> BS & TS & QS
+    BS --> OC
+    TS --> CA
+    QS --> CA
+    BS & TS --> CM
+    OC --> PR
+```
+
+### Key Architectural Benefits
+
+- **Zero External Dependencies** - All data stored in Kubernetes ConfigMaps (etcd-backed)
+- **Cloud-Native** - Built on Kubernetes primitives for maximum portability
+- **Scalable** - Stateless API server that can scale horizontally
+- **Secure** - Kubernetes RBAC integration and optional authentication
+- **Observable** - Prometheus metrics and structured logging
+- **Extensible** - Plugin architecture for custom billing rules and alerts
+
+---
+
+## Integration Points
+
+### OpenCost Integration
+Bison leverages [OpenCost](https://www.opencost.io/) for real-time cost tracking:
+- Per-pod, per-namespace, per-team cost visibility
+- GPU utilization metrics
+- Historical cost data and trends
+- Integration with Prometheus for metric collection
+
+### Capsule Integration
+Bison uses [Capsule](https://capsule.clastix.io/) for multi-tenancy:
+- Team-based tenant isolation
+- Namespace quota enforcement
+- Network and security policies
+- OIDC/SSO integration
+
+### Prometheus Integration
+Metrics collection and monitoring:
+- Resource utilization tracking
+- Custom billing metrics
+- Alert rule evaluation
+- Historical data retention
+
+---
+
+## Next Steps
+
+- [Installation Guide](installation.md) - Deploy Bison in your cluster
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Deep dive into system design
+- [Configuration](configuration.md) - Configure billing and settings
diff --git a/website/versioned_docs/version-0.0.8/installation.md b/website/versioned_docs/version-0.0.8/installation.md
new file mode 100644
index 0000000..da89191
--- /dev/null
+++ b/website/versioned_docs/version-0.0.8/installation.md
@@ -0,0 +1,316 @@
+---
+sidebar_position: 3
+---
+
+# Installation Guide
+
+This guide provides detailed instructions for installing Bison in your Kubernetes cluster.
+
+## Prerequisites
+
+Before installing Bison, ensure you have:
+
+- **Kubernetes 1.22+** - A running Kubernetes cluster
+- **kubectl** - Configured to access your cluster
+- **Helm 3.8+** - Package manager for Kubernetes (3.8.0 or later is required for OCI chart support)
+- **Capsule Operator v0.1.0+** - For multi-tenant isolation
+- **OpenCost** - Deployed with Prometheus for cost tracking
+
+### Install Prerequisites
+
+If you haven't installed the required components:
+
+#### Install Capsule
+
+```bash
+# Using Helm
+helm repo add projectcapsule https://projectcapsule.github.io/charts
+helm install capsule projectcapsule/capsule \
+  --namespace capsule-system \
+  --create-namespace
+```
+
+#### Install OpenCost
+
+```bash
+# Using Helm
+helm repo add opencost https://opencost.github.io/opencost-helm-chart
+helm install opencost opencost/opencost \
+  --namespace opencost-system \
+  --create-namespace \
+  --set prometheus.internal.serviceName=prometheus-server \
+  --set prometheus.internal.namespaceName=prometheus-system
+```
+
+## Installation Methods
+
+Bison Helm charts are distributed via **GitHub Container Registry (GHCR)** using the modern OCI format.
+
+**Requirements:**
+- Helm >= 3.8.0 (for OCI support)
+- Kubernetes >= 1.22
+
+### Option A: From GHCR (Recommended)
+
+The simplest way to install Bison is directly from GitHub Container Registry:
+
+```bash
+# Install specific version from GHCR
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace
+
+# Or pull the chart first, then install
+helm pull oci://ghcr.io/supermarioyl/bison/bison --version 0.0.2
+helm install bison bison-0.0.2.tgz \
+  --namespace bison-system \
+  --create-namespace
+
+# Customize installation
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true \
+  --set apiServer.image.tag=0.0.2 \
+  --set webUI.image.tag=0.0.2
+```
+
+**Why GHCR OCI Format?**
+- ✅ No separate Helm repository maintenance needed
+- ✅ Unified with Docker images in GHCR
+- ✅ Faster installation (direct registry pull)
+- ✅ Modern Helm 3.8+ standard practice
+
+### Option B: From GitHub Release
+
+Download a specific version from GitHub Releases:
+
+```bash
+# Download Helm chart
+VERSION=0.0.2
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# Install the chart
+helm install bison bison-${VERSION}.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+### Option C: From Source
+
+Clone and build from source:
+
+```bash
+# Clone repository
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
+
+# Install dependencies and build
+make install-deps
+make build
+
+# Deploy using Helm
+helm install bison ./deploy/charts/bison \
+  --namespace bison-system \
+  --create-namespace
+```
+
+## Configuration Options
+
+Bison can be configured using Helm values. Here are the key configuration options:
+
+### Basic Configuration
+
+```yaml
+# values.yaml
+apiServer:
+  image:
+    repository: ghcr.io/supermarioyl/bison/api-server
+    tag: 0.0.1
+  replicas: 2
+
+webUI:
+  image:
+    repository: ghcr.io/supermarioyl/bison/web-ui
+    tag: 0.0.1
+  replicas: 2
+
+# OpenCost URL
+opencost:
+  url: http://opencost.opencost-system.svc:9003
+
+# Authentication
+auth:
+  enabled: false
+```
+
+### Custom Configuration Example
+
+```bash
+helm install bison oci://ghcr.io/supermarioyl/bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set apiServer.replicas=3 \
+  --set webUI.replicas=3 \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=true
+```
+
+## Verify Installation
+
+After installation, verify that all components are running:
+
+```bash
+# Check pod status
+kubectl get pods -n bison-system
+
+# Expected output:
+# NAME                              READY   STATUS    RESTARTS   AGE
+# bison-api-server-xxxxxxxxx-xxxxx  1/1     Running   0          2m
+# bison-webui-xxxxxxxxx-xxxxx       1/1     Running   0          2m
+
+# Check services
+kubectl get svc -n bison-system
+
+# Check logs
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl logs -n bison-system deployment/bison-webui
+```
+
+## Access the Platform
+
+### Port Forward (Development)
+
+```bash
+# Port-forward the Web UI
+kubectl port-forward -n bison-system svc/bison-webui 3000:80
+
+# Access at http://localhost:3000
+```
+
+### Ingress (Production)
+
+For production deployments, configure an Ingress:
+
+```yaml
+# ingress.yaml
+apiVersion: networking.k8s.io/v1
+kind: Ingress
+metadata:
+  name: bison-ingress
+  namespace: bison-system
+spec:
+  # ingressClassName replaces the deprecated kubernetes.io/ingress.class annotation
+  ingressClassName: nginx
+  rules:
+  - host: bison.example.com
+    http:
+      paths:
+      - path: /
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-webui
+            port:
+              number: 80
+      - path: /api
+        pathType: Prefix
+        backend:
+          service:
+            name: bison-api-server
+            port:
+              number: 8080
+```
+
+Apply the Ingress:
+
+```bash
+kubectl apply -f ingress.yaml
+```
+
+## Docker Images
+
+Bison images are available on GitHub Container Registry:
+
+```bash
+# Pull images
+docker pull ghcr.io/supermarioyl/bison/api-server:0.0.1
+docker pull ghcr.io/supermarioyl/bison/web-ui:0.0.1
+
+# Or use latest
+docker pull ghcr.io/supermarioyl/bison/api-server:latest
+docker pull ghcr.io/supermarioyl/bison/web-ui:latest
+```
+
+**Supported Platforms:**
+- `linux/amd64`
+- `linux/arm64`
+
+## Upgrading
+
+To upgrade Bison to a new version:
+
+```bash
+# Upgrade to the latest chart version (pulled directly from GHCR; no `helm repo update` needed)
+helm upgrade bison oci://ghcr.io/supermarioyl/bison/bison --namespace bison-system
+
+# Or upgrade to a specific version
+helm upgrade bison oci://ghcr.io/supermarioyl/bison/bison \
+  --version 0.0.2 \
+  --namespace bison-system
+```
+
+## Uninstalling
+
+To completely remove Bison:
+
+```bash
+# Uninstall Helm release
+helm uninstall bison --namespace bison-system
+
+# Remove namespace (optional)
+kubectl delete namespace bison-system
+```
+
+## Troubleshooting
+
+### Pod Not Starting
+
+Check pod logs for errors:
+
+```bash
+kubectl logs -n bison-system deployment/bison-api-server
+kubectl describe pod -n bison-system <pod-name>
+```
+
+### Cannot Connect to OpenCost
+
+Verify OpenCost is running and accessible:
+
+```bash
+kubectl get svc -n opencost-system
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+
+# Test endpoint (from a second terminal; port-forward blocks while running)
+curl http://localhost:9003/healthz
+```
+
+### Authentication Issues
+
+If authentication is enabled, ensure you have the correct credentials:
+
+```text
+# Default credentials (change in production!)
+Username: admin
+Password: admin
+```
+
+## Next Steps
+
+- [Configuration Guide](configuration.md) - Configure billing and settings
+- [User Guides](user-guides/admin.md) - Learn how to use Bison
+- [Architecture](architecture.md) - Understand the system design
diff --git a/website/versioned_docs/version-0.0.8/intro.md b/website/versioned_docs/version-0.0.8/intro.md
new file mode 100644
index 0000000..b3dc3aa
--- /dev/null
+++ b/website/versioned_docs/version-0.0.8/intro.md
@@ -0,0 +1,167 @@
+---
+sidebar_position: 1
+slug: /
+---
+
+# Introduction to Bison
+
+![Bison Logo](/img/logo.png)
+
+**Enterprise GPU Resource Billing & Multi-Tenant Management Platform**
+
+Bison is a Kubernetes-based platform that provides comprehensive GPU resource management, billing, and multi-tenant isolation for organizations running shared GPU clusters.
+
+## The GPU Management Challenge
+
+Managing shared GPU clusters across multiple teams creates critical operational and financial challenges:
+
+**For Platform Administrators:**
+- How do you fairly allocate expensive GPU resources across competing teams?
+- How do you prevent resource hogging while ensuring everyone gets their fair share?
+- How do you track who's using what and implement accurate chargeback?
+- How do you maintain strict multi-tenant isolation without complex manual configuration?
+
+**For Finance & Budget Teams:**
+- How do you implement automated chargeback for GPU usage without manual accounting?
+- How do you prevent budget overruns before they happen?
+- How do you generate accurate cost reports for internal billing?
+
+**For Development Teams:**
+- How do you get predictable, isolated access to GPU resources?
+- How do you know when you're approaching your budget limits?
+- How do you avoid impacting other teams' workloads?
+
+**Traditional Approach:**
+- Manual quota configuration per namespace
+- Excel-based billing calculations
+- No real-time cost visibility
+- Complex multi-tool setup (quota management + cost tracking + billing system)
+- Frequent resource conflicts and budget surprises
+
+## Bison's Integrated Solution
+
+```mermaid
+graph TB
+    subgraph WITHOUT["Without Bison"]
+        P1[❌ Manual Quota Management<br/>Per-namespace configuration]
+        P2[❌ Spreadsheet Billing<br/>Manual calculations & reports]
+        P3[❌ No Resource Isolation<br/>Teams compete for resources]
+        P4[❌ Budget Overruns<br/>No proactive alerts]
+        P5[❌ Complex Tooling<br/>Multiple systems to manage]
+    end
+
+    subgraph WITH["With Bison"]
+        S1[✅ Automated Team Quotas<br/>Capsule-powered isolation]
+        S2[✅ Real-Time Billing<br/>OpenCost integration]
+        S3[✅ True Multi-Tenancy<br/>Shared/Exclusive modes]
+        S4[✅ Proactive Alerts<br/>Balance monitoring & auto-suspend]
+        S5[✅ Unified Platform<br/>Single pane of glass]
+    end
+
+    P1 -.Transform.-> S1
+    P2 -.Transform.-> S2
+    P3 -.Transform.-> S3
+    P4 -.Transform.-> S4
+    P5 -.Transform.-> S5
+
+    style WITHOUT fill:#ffebee
+    style WITH fill:#e8f5e9
+    style S1 fill:#4caf50,color:#fff
+    style S2 fill:#4caf50,color:#fff
+    style S3 fill:#4caf50,color:#fff
+    style S4 fill:#4caf50,color:#fff
+    style S5 fill:#4caf50,color:#fff
+```
+
+**Bison combines:**
+- 🔐 **Kubernetes-native multi-tenancy** (Capsule) - True team isolation with shared or exclusive node pools
+- 💰 **Real-time cost tracking** (OpenCost + Prometheus) - Per-pod, per-namespace, per-team cost visibility
+- 💳 **Automated billing & budgets** - Prepaid balances, auto-deduction, low-balance alerts, and auto-suspension
+- 📊 **Unified dashboard** - Single interface for admins, team leaders, and finance teams
+- 🔧 **Zero external dependencies** - All data stored in Kubernetes ConfigMaps (etcd-backed)
+
+**Result:** Deploy once, get complete GPU resource management with automated billing in under 30 minutes.
+
+## Quick Start
+
+### Prerequisites
+
+- Kubernetes 1.22+
+- kubectl configured
+- Helm 3.0+
+- Capsule operator (v0.1.0+) installed
+- OpenCost deployed with Prometheus
+
+### Installation
+
+Choose one of the following installation methods:
+
+#### Option A: Using Helm Repository (Recommended)
+
+```bash
+# Add Bison Helm repository
+helm repo add bison https://supermarioyl.github.io/Bison/charts/
+helm repo update
+
+# Install with default configuration
+helm install bison bison/bison --namespace bison-system --create-namespace
+
+# Or customize installation
+helm install bison bison/bison \
+  --namespace bison-system \
+  --create-namespace \
+  --set opencost.url=http://opencost.opencost-system.svc:9003 \
+  --set auth.enabled=false
+```
+
+#### Option B: From GitHub Release
+
+```bash
+# Download latest Helm chart
+VERSION=0.0.1
+wget https://github.com/SuperMarioYL/Bison/releases/download/v${VERSION}/bison-${VERSION}.tgz
+
+# Install
+helm install bison bison-${VERSION}.tgz \
+  --namespace bison-system \
+  --create-namespace
+```
+
+#### Option C: From Source
+
+```bash
+# Clone repository
+git clone https://github.com/SuperMarioYL/Bison.git
+cd Bison
+
+# Install dependencies and build
+make install-deps
+make build
+
+# Deploy using Helm
+helm install bison ./deploy/charts/bison \
+  --namespace bison-system \
+  --create-namespace
+```
+
+### Access the Platform
+
+After installation, access Bison through:
+
+```bash
+# Port-forward the Web UI
+kubectl port-forward -n bison-system svc/bison-webui 3000:80
+
+# Access at http://localhost:3000
+# Default credentials (if auth enabled):
+# Username: admin
+# Password: admin (change immediately in production!)
+```
+
+## Next Steps
+
+- [Explore Features](features.md) - Learn about all capabilities
+- [Installation Guide](installation.md) - Detailed installation instructions
+- [User Guides](user-guides/admin.md) - Role-based user guides
+- [Architecture](architecture.md) - Understand the system architecture
+- [Configuration](configuration.md) - Configure billing and settings
diff --git a/website/versioned_docs/version-0.0.8/user-guides/_category_.json b/website/versioned_docs/version-0.0.8/user-guides/_category_.json
new file mode 100644
index 0000000..fe79f61
--- /dev/null
+++ b/website/versioned_docs/version-0.0.8/user-guides/_category_.json
@@ -0,0 +1,8 @@
+{
+  "label": "User Guides",
+  "position": 4,
+  "link": {
+    "type": "generated-index",
+    "description": "Role-based guides for using Bison effectively."
+  }
+}
diff --git a/website/versioned_docs/version-0.0.8/user-guides/admin.md b/website/versioned_docs/version-0.0.8/user-guides/admin.md
new file mode 100644
index 0000000..a466cbb
--- /dev/null
+++ b/website/versioned_docs/version-0.0.8/user-guides/admin.md
@@ -0,0 +1,176 @@
+---
+sidebar_position: 1
+---
+
+# Administrator Guide
+
+This guide is for platform administrators who deploy, configure, and manage the Bison platform.
+
+## Responsibilities
+
+As a platform administrator, you are responsible for:
+
+- ✅ Deploying and configuring Bison
+- ✅ Creating and managing teams
+- ✅ Setting global billing configuration
+- ✅ Monitoring cluster-wide metrics
+- ✅ Responding to alerts and recharge requests
+
+## Getting Started
+
+### 1. Deploy Bison
+
+Follow the [Installation Guide](../installation.md) to deploy Bison in your Kubernetes cluster.
+
+### 2. Configure Billing
+
+Set up billing rules and pricing:
+
+1. Access the Web UI
+2. Navigate to **Settings** > **Billing Configuration**
+3. Configure:
+   - **Currency**: USD, CNY, EUR, etc.
+   - **CPU Price**: Cost per core-hour
+   - **Memory Price**: Cost per GB-hour
+   - **GPU Price**: Cost per GPU-hour
+4. Click **Save**
+
+### 3. Create First Team
+
+Create a team for your users:
+
+1. Navigate to **Teams** page
+2. Click **Create Team**
+3. Fill in:
+   - **Team Name**: e.g., "ml-team"
+   - **Description**: Team purpose
+   - **Resource Quota**:
+     - CPU: e.g., "20" cores
+     - Memory: e.g., "64Gi"
+     - GPU: e.g., "4"
+   - **Initial Balance**: e.g., 1000.00
+4. Click **Create**
+
+## Common Tasks
+
+### Managing Teams
+
+#### View All Teams
+
+```bash
+# Via kubectl
+kubectl get tenants
+
+# Via API
+curl http://localhost:8080/api/v1/teams
+```
+
+#### Update Team Quota
+
+1. Navigate to **Teams** page
+2. Click **Edit** on the team row
+3. Modify quotas
+4. Click **Save**
+
+#### Recharge Team Balance
+
+1. Navigate to **Teams** page
+2. Click **Recharge** on the team row
+3. Enter amount
+4. Add notes (optional)
+5. Click **Confirm**
+
+### Monitoring
+
+#### View Dashboard
+
+Access real-time cluster metrics:
+- Total teams and projects
+- Resource utilization
+- Cost trends
+- Top consumers
+- Balance status
+
+#### Check Alerts
+
+Monitor low-balance and quota alerts:
+1. Navigate to **Alerts** page
+2. Review active alerts
+3. Take action as needed
+
+### Billing Configuration
+
+#### Update Pricing
+
+```bash
+curl -X PUT http://localhost:8080/api/v1/billing/config \
+  -H "Content-Type: application/json" \
+  -d '{
+    "pricing": {
+      "cpu": 0.06,
+      "memory": 0.012,
+      "nvidia.com/gpu": 3.00
+    }
+  }'
+```
+
+#### Configure Alert Thresholds
+
+```json
+{
+  "lowBalanceThreshold": 20,
+  "suspendThreshold": 5,
+  "alertChannels": ["webhook", "dingtalk"]
+}
+```
+
+## Best Practices
+
+### Team Naming
+- Use lowercase, alphanumeric characters and hyphens
+- Example: `ml-team`, `data-science`, `dev-team`
+
+### Quota Allocation
+- Start with conservative quotas
+- Monitor usage for 1-2 weeks
+- Adjust based on actual needs
+
+### Balance Management
+- Set up auto-recharge for critical teams
+- Monitor balance trends weekly
+- Respond to low-balance alerts promptly
+
+### Security
+- Enable authentication in production
+- Use OIDC/SSO for enterprise deployments
+- Regularly audit user permissions
+
+## Troubleshooting
+
+### Team Creation Failed
+
+Check Capsule operator logs:
+```bash
+kubectl logs -n capsule-system deployment/capsule-controller-manager
+```
+
+### Billing Not Working
+
+Verify OpenCost connectivity:
+```bash
+kubectl port-forward -n opencost-system svc/opencost 9003:9003
+curl http://localhost:9003/healthz
+```
+
+### High Resource Usage
+
+Check resource consumption:
+```bash
+kubectl top pods -n bison-system
+```
+
+## Next Steps
+
+- [Team Leader Guide](team-leader.md) - Guide for team leaders
+- [Developer Guide](developer.md) - Guide for developers
+- [Configuration](../configuration.md) - Advanced configuration
diff --git a/website/versioned_docs/version-0.0.8/user-guides/developer.md b/website/versioned_docs/version-0.0.8/user-guides/developer.md
new file mode 100644
index 0000000..d14ab62
--- /dev/null
+++ b/website/versioned_docs/version-0.0.8/user-guides/developer.md
@@ -0,0 +1,187 @@
+---
+sidebar_position: 3
+---
+
+# Developer Guide
+
+This guide is for developers who deploy workloads and consume resources within team projects.
+
+## Responsibilities
+
+As a developer, you are responsible for:
+
+- ✅ Deploying applications within your project
+- ✅ Monitoring resource usage
+- ✅ Staying within quota limits
+- ✅ Optimizing resource consumption
+
+## Getting Started
+
+### 1. Get Kubeconfig
+
+Request kubeconfig from your team leader or administrator.
+
+### 2. Set Context
+
+```bash
+# Set context to your project namespace
+kubectl config set-context --current --namespace=your-project
+
+# Verify
+kubectl config view --minify | grep namespace
+```
+
+### 3. Check Quota
+
+See your available resources:
+```bash
+kubectl describe quota
+```
+
+## Deploying Workloads
+
+### Basic Pod Deployment
+
+```yaml
+apiVersion: v1
+kind: Pod
+metadata:
+  name: gpu-training-job
+  namespace: your-project
+spec:
+  containers:
+  - name: trainer
+    image: your-ml-image:latest
+    resources:
+      requests:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+      limits:
+        cpu: "4"
+        memory: "16Gi"
+        nvidia.com/gpu: "1"
+```
+
+### Using Deployments
+
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: ml-inference
+  namespace: your-project
+spec:
+  replicas: 2
+  selector:
+    matchLabels:
+      app: ml-inference
+  template:
+    metadata:
+      labels:
+        app: ml-inference
+    spec:
+      containers:
+      - name: inference
+        image: your-inference-image:latest
+        resources:
+          limits:  # GPUs must be set under limits; requests default to the same values
+            cpu: "2"
+            memory: "8Gi"
+            nvidia.com/gpu: "1"
+```
+
+## Monitoring Usage
+
+### Check Pod Resource Usage
+
+```bash
+# View resource consumption
+kubectl top pods
+
+# Detailed pod information
+kubectl describe pod <pod-name>
+```
+
+### View Logs
+
+```bash
+# Stream logs
+kubectl logs -f <pod-name>
+
+# Previous logs (if pod restarted)
+kubectl logs --previous <pod-name>
+```
+
+## Best Practices
+
+### Resource Requests and Limits
+
+Always specify both requests and limits:
+```yaml
+resources:
+  requests:
+    cpu: "2"
+    memory: "8Gi"
+  limits:
+    cpu: "4"
+    memory: "16Gi"
+```
+
+### GPU Usage
+
+- Request GPUs only when needed
+- Use GPU for compute-intensive tasks
+- Monitor GPU utilization
+
+### Clean Up
+
+Delete resources when no longer needed:
+```bash
+# Delete pod
+kubectl delete pod <pod-name>
+
+# Delete deployment
+kubectl delete deployment <deployment-name>
+
+# Clean up completed jobs
+kubectl delete job --field-selector status.successful=1
+```
+
+### Cost Optimization
+
+- Right-size your resource requests
+- Use horizontal pod autoscaling
+- Clean up idle resources
+- Share GPUs when possible (if supported)
+
+## Troubleshooting
+
+### Pod Pending (Insufficient Quota)
+
+If your pod is stuck in `Pending` state:
+
+```bash
+kubectl describe pod <pod-name>
+```
+
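+Look for scheduling or quota-related errors in the events. If the pod was never created, run `kubectl get events` as well, because workloads that exceed the quota are rejected at creation time. Then reduce resource requests or ask your team leader for more quota.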
+
+### Out of Memory (OOM)
+
+If pods are killed due to OOM:
+1. Check memory usage patterns
+2. Increase memory limits
+3. Optimize application memory usage
+
+### GPU Not Available
+
+Check how many GPUs each node can allocate:
+```bash
+kubectl get nodes -o custom-columns=NAME:.metadata.name,GPU:.status.allocatable."nvidia\.com/gpu"
+```
+
+## Next Steps
+
+- [Team Leader Guide](team-leader.md) - Understand team management
+- [Architecture](../architecture.md) - Learn about the platform
diff --git a/website/versioned_docs/version-0.0.8/user-guides/team-leader.md b/website/versioned_docs/version-0.0.8/user-guides/team-leader.md
new file mode 100644
index 0000000..7b6de96
--- /dev/null
+++ b/website/versioned_docs/version-0.0.8/user-guides/team-leader.md
@@ -0,0 +1,126 @@
+---
+sidebar_position: 2
+---
+
+# Team Leader Guide
+
+This guide is for team leaders who manage projects, monitor budgets, and allocate resources within their team.
+
+## Responsibilities
+
+As a team leader, you are responsible for:
+
+- ✅ Creating and managing projects (namespaces)
+- ✅ Allocating quotas to projects
+- ✅ Monitoring team balance and consumption
+- ✅ Requesting recharges when needed
+
+## Getting Started
+
+### 1. Access Bison
+
+Log in to the Web UI with your credentials.
+
+### 2. View Team Dashboard
+
+Your dashboard shows:
+- Team balance and status
+- Resource utilization
+- Active projects
+- Cost trends
+
+## Managing Projects
+
+### Create a Project
+
+1. Navigate to **Projects** page
+2. Click **Create Project**
+3. Fill in:
+   - **Project Name**: e.g., "training-ml-models"
+   - **Description**: Project purpose
+   - **Quota** (optional):
+     - CPU: e.g., "8" cores
+     - Memory: e.g., "32Gi"
+     - GPU: e.g., "2"
+4. Click **Create**
+
+### List Projects
+
+```bash
+# Via kubectl (if you have access)
+kubectl get namespaces -l capsule.clastix.io/tenant=your-team
+
+# Via API
+curl http://localhost:8080/api/v1/teams/your-team/projects
+```
+
+### Delete a Project
+
+1. Navigate to **Projects** page
+2. Click **Delete** on the project row
+3. Confirm deletion
+
+**Warning**: This will delete all resources in the project!
+
+## Monitoring Budget
+
+### Check Balance
+
+View your current balance:
+1. Navigate to **Team** page
+2. See balance in the status card
+
+### View Usage Trends
+
+Analyze spending patterns:
+1. Navigate to **Reports** page
+2. Select time range (7 days, 30 days, 90 days)
+3. View:
+   - Cost breakdown by resource type
+   - Daily cost trends
+   - Per-project consumption
+
+### Request Recharge
+
+When balance is low:
+1. Click **Request Recharge** button
+2. Enter requested amount
+3. Add justification
+4. Submit request to administrator
+
+## Resource Management
+
+### Monitor Quota Usage
+
+Check how much of your quota is being used:
+```bash
+kubectl describe quota -n your-project
+```
+
+### Optimize Costs
+
+Tips to reduce spending:
+- **Right-size resources**: Don't over-provision CPU/Memory
+- **Clean up idle pods**: Delete unused workloads
+- **Use spot/preemptible instances**: Where applicable
+- **Monitor GPU utilization**: Ensure GPUs are fully utilized
+
+## Best Practices
+
+### Project Organization
+- Create separate projects for different workloads
+- Example: `ml-training`, `ml-inference`, `data-processing`
+
+### Quota Allocation
+- Allocate quotas based on project priority
+- Reserve buffer for urgent tasks
+
+### Cost Awareness
+- Review costs weekly
+- Identify and eliminate waste
+- Set up cost alerts
+
+## Next Steps
+
+- [Developer Guide](developer.md) - Guide for your team members
+- [Features](../features.md) - Explore all Bison features
diff --git a/website/versioned_sidebars/version-0.0.11-sidebars.json b/website/versioned_sidebars/version-0.0.11-sidebars.json
new file mode 100644
index 0000000..caea0c0
--- /dev/null
+++ b/website/versioned_sidebars/version-0.0.11-sidebars.json
@@ -0,0 +1,8 @@
+{
+  "tutorialSidebar": [
+    {
+      "type": "autogenerated",
+      "dirName": "."
+    }
+  ]
+}
diff --git a/website/versioned_sidebars/version-0.0.6-sidebars.json b/website/versioned_sidebars/version-0.0.6-sidebars.json
new file mode 100644
index 0000000..caea0c0
--- /dev/null
+++ b/website/versioned_sidebars/version-0.0.6-sidebars.json
@@ -0,0 +1,8 @@
+{
+  "tutorialSidebar": [
+    {
+      "type": "autogenerated",
+      "dirName": "."
+    }
+  ]
+}
diff --git a/website/versioned_sidebars/version-0.0.7-sidebars.json b/website/versioned_sidebars/version-0.0.7-sidebars.json
new file mode 100644
index 0000000..caea0c0
--- /dev/null
+++ b/website/versioned_sidebars/version-0.0.7-sidebars.json
@@ -0,0 +1,8 @@
+{
+  "tutorialSidebar": [
+    {
+      "type": "autogenerated",
+      "dirName": "."
+    }
+  ]
+}
diff --git a/website/versioned_sidebars/version-0.0.8-sidebars.json b/website/versioned_sidebars/version-0.0.8-sidebars.json
new file mode 100644
index 0000000..caea0c0
--- /dev/null
+++ b/website/versioned_sidebars/version-0.0.8-sidebars.json
@@ -0,0 +1,8 @@
+{
+  "tutorialSidebar": [
+    {
+      "type": "autogenerated",
+      "dirName": "."
+    }
+  ]
+}
diff --git a/website/versions.json b/website/versions.json
index daa9a70..7f5dfc1 100644
--- a/website/versions.json
+++ b/website/versions.json
@@ -1,3 +1,7 @@
 [
+  "0.0.11",
+  "0.0.8",
+  "0.0.7",
+  "0.0.6",
   "0.0.1"
 ]