aitbc/.github/workflows/gpu-benchmark.yml
dependabot[bot] fa1f16555c ci(deps): bump actions/setup-python from 4 to 6
Bumps [actions/setup-python](https://github.com/actions/setup-python) from 4 to 6.
- [Release notes](https://github.com/actions/setup-python/releases)
- [Commits](https://github.com/actions/setup-python/compare/v4...v6)

---
updated-dependencies:
- dependency-name: actions/setup-python
  dependency-version: '6'
  dependency-type: direct:production
  update-type: version-update:semver-major
...

Signed-off-by: dependabot[bot] <support@github.com>
2026-03-26 07:53:45 +00:00

name: GPU Benchmark CI

on:
  push:
    branches: [ main, develop ]
  pull_request:
    branches: [ main ]
  schedule:
    # Run benchmarks daily at 2 AM UTC
    - cron: '0 2 * * *'

jobs:
  gpu-benchmark:
    runs-on: ubuntu-latest
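    # NOTE: standard GitHub-hosted ubuntu-latest runners do not expose a GPU.
    # This job presumably targets a CUDA-capable (self-hosted or GPU-enabled)
    # runner; on a CPU-only machine the verification step below will simply
    # report CUDA as unavailable rather than fail.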
    strategy:
      matrix:
        python-version: [ "3.13.5" ]
    steps:
      - uses: actions/checkout@v4

      - name: Set up Python ${{ matrix.python-version }}
        uses: actions/setup-python@v6
        with:
          python-version: ${{ matrix.python-version }}

      - name: Install system dependencies
        run: |
          sudo apt-get update
          sudo apt-get install -y \
            build-essential \
            python3-dev \
            pkg-config \
            libnvidia-compute-515 \
            cuda-toolkit-12-2 \
            nvidia-driver-515
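      # The pinned NVIDIA packages are only installable if the runner image's
      # apt sources carry them, so treat these versions as an assumption tied
      # to the current base image. Note also that the 515 driver series
      # predates CUDA 12.x (12.2 generally wants >= 535), so this
      # driver/toolkit pairing may need revisiting.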

      - name: Cache pip dependencies
        uses: actions/cache@v5
        with:
          path: ~/.cache/pip
          key: ${{ runner.os }}-pip-${{ hashFiles('**/pyproject.toml') }}
          restore-keys: |
            ${{ runner.os }}-pip-
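      # The cache key changes whenever any pyproject.toml changes; the
      # restore-keys prefix lets a run fall back to the most recent cache
      # for this OS when there is no exact key match.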

      - name: Install Python dependencies
        run: |
          python -m pip install --upgrade pip
          pip install -e .
          pip install pytest pytest-benchmark torch torchvision torchaudio
          pip install cupy-cuda12x
          pip install nvidia-ml-py3
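      # cupy-cuda12x is the CuPy wheel built against CUDA 12.x, matching the
      # toolkit installed above; nvidia-ml-py3 provides NVML bindings,
      # presumably used by the benchmark scripts for GPU telemetry.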

      - name: Verify GPU availability
        run: |
          python -c "
          import torch
          print(f'PyTorch version: {torch.__version__}')
          print(f'CUDA available: {torch.cuda.is_available()}')
          if torch.cuda.is_available():
              print(f'CUDA version: {torch.version.cuda}')
              print(f'GPU count: {torch.cuda.device_count()}')
              print(f'GPU name: {torch.cuda.get_device_name(0)}')
          "

      - name: Run GPU benchmarks
        run: |
          python -m pytest dev/gpu/test_gpu_performance.py \
            --benchmark-only \
            --benchmark-json=benchmark_results.json \
            --benchmark-sort=mean \
            -v
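      # --benchmark-only skips regular (non-benchmark) tests, and the JSON
      # output is what the report, comparison, and gating steps below consume.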

      - name: Generate benchmark report
        run: |
          python dev/gpu/generate_benchmark_report.py \
            --input benchmark_results.json \
            --output benchmark_report.html \
            --history-file benchmark_history.json

      - name: Upload benchmark results
        uses: actions/upload-artifact@v4
        with:
          name: benchmark-results-${{ matrix.python-version }}
          path: |
            benchmark_results.json
            benchmark_report.html
            benchmark_history.json
          retention-days: 30
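      # upload-artifact v4 artifacts are immutable and names must be unique
      # per run; suffixing with the matrix Python version keeps matrix
      # entries from colliding.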

      - name: Compare with baseline
        run: |
          python dev/gpu/compare_benchmarks.py \
            --current benchmark_results.json \
            --baseline .github/baselines/gpu_baseline.json \
            --threshold 5.0 \
            --output comparison_report.json
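      # The 5.0 here is presumably a percent tolerance for flagging changes
      # in the report; the hard gate at the end of the job uses a looser 10.0.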

      - name: Comment PR with results
        if: github.event_name == 'pull_request'
        uses: actions/github-script@v7
        with:
          script: |
            const fs = require('fs');
            try {
              const results = JSON.parse(fs.readFileSync('comparison_report.json', 'utf8'));
              const comment = `
            ## 🚀 GPU Benchmark Results

            **Performance Summary:**
            - **Mean Performance**: ${results.mean_performance.toFixed(2)} ops/sec
            - **Performance Change**: ${results.performance_change > 0 ? '+' : ''}${results.performance_change.toFixed(2)}%
            - **Status**: ${results.status}

            **Key Metrics:**
            ${results.metrics.map(m => `- **${m.name}**: ${m.value.toFixed(2)} ops/sec (${m.change > 0 ? '+' : ''}${m.change.toFixed(2)}%)`).join('\n')}

            ${results.regressions.length > 0 ? '⚠️ **Performance Regressions Detected**' : '✅ **No Performance Regressions**'}

            [View detailed report](${process.env.GITHUB_SERVER_URL}/${process.env.GITHUB_REPOSITORY}/actions/runs/${process.env.GITHUB_RUN_ID})
            `;
              await github.rest.issues.createComment({
                issue_number: context.issue.number,
                owner: context.repo.owner,
                repo: context.repo.repo,
                body: comment
              });
            } catch (error) {
              console.log('Could not generate benchmark comment:', error.message);
            }

      - name: Update benchmark history
        run: |
          python dev/gpu/update_benchmark_history.py \
            --results benchmark_results.json \
            --history-file .github/baselines/benchmark_history.json \
            --max-entries 100
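      # Note: this writes into the checked-out workspace, which is discarded
      # when the job ends; the history only persists if the script commits it
      # back or a later step uploads/pushes it.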

      - name: Fail on performance regression
        run: |
          python dev/gpu/check_performance_regression.py \
            --results benchmark_results.json \
            --baseline .github/baselines/gpu_baseline.json \
            --threshold 10.0
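
---

For context, the gating step's contract is fully visible in its flags (--results, --baseline, --threshold): a non-zero exit from the script fails the step and hence the job. Below is a minimal sketch of what such a gate might look like, assuming pytest-benchmark's JSON layout and a percent-slowdown threshold; the repository's actual dev/gpu/check_performance_regression.py is not shown on this page and may differ.

#!/usr/bin/env python3
"""Hypothetical sketch of a regression gate matching the CLI above.

Everything here (JSON handling, aggregation, exit codes) is an
assumption, not the repository's actual implementation.
"""
import argparse
import json
import sys


def mean_ops_per_sec(benchmarks):
    # pytest-benchmark JSON stores per-test stats under "stats";
    # "mean" is seconds per operation, so invert it for ops/sec.
    rates = [1.0 / b["stats"]["mean"] for b in benchmarks]
    return sum(rates) / len(rates)


def main():
    parser = argparse.ArgumentParser()
    parser.add_argument("--results", required=True)
    parser.add_argument("--baseline", required=True)
    parser.add_argument("--threshold", type=float, default=10.0,
                        help="maximum tolerated slowdown, in percent")
    args = parser.parse_args()

    with open(args.results) as f:
        current = mean_ops_per_sec(json.load(f)["benchmarks"])
    with open(args.baseline) as f:
        baseline = mean_ops_per_sec(json.load(f)["benchmarks"])

    change_pct = (current - baseline) / baseline * 100.0
    print(f"baseline={baseline:.2f} ops/s  current={current:.2f} ops/s  "
          f"change={change_pct:+.2f}%")

    # A non-zero exit fails the workflow step, which fails the job.
    if change_pct < -args.threshold:
        print(f"FAIL: slowdown exceeds {args.threshold}% threshold")
        sys.exit(1)


if __name__ == "__main__":
    main()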