# scisharp/LLamaSharp
#
# Benchmark workflow: builds the solution and runs the LLama.Benchmark project.
name: Benchmark Test

# Triggered by pushes to master and by pull requests targeting master.
on:
  push:
    branches: [master]
  pull_request:
    branches: [master]

# One active run per workflow + ref: a newer run for the same ref cancels the
# one still in progress.
concurrency:
  group: ${{ github.workflow }}-${{ github.ref }}-benchmark
  cancel-in-progress: true

jobs:
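  # Disabled: Linux CUDA benchmark job, kept commented out for reference.
  # NOTE(review): it pins actions/upload-artifact@v3, which GitHub has retired;
  # bump it to v4 before re-enabling.
  # linux-benchmark-cuda: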
  #   if: contains(github.event.pull_request.labels.*.name, 'benchmark')
  #   runs-on: [self-hosted, linux, gpu]

  #   strategy:
  #     fail-fast: false
  #     matrix:
  #       build: [cuda11]
  #       include:
  #         - build: cuda11
  #           image: nvidia/cuda:11.7.1-devel-ubuntu22.04
  #           modeldir: /llamasharp_ci/models_benchmark
  #         # - build: cuda12
  #         #   image: nvidia/cuda:12.1.1-runtime-ubuntu22.04

  #   container:
  #     image: ${{ matrix.image }}
  #     env:
  #       BENCHMARK_MODEL_DIR: ${{ matrix.modeldir }}
  #     ports:
  #       - 80
  #     volumes:
  #       - /llamasharp_ci:/llamasharp_ci
  #     options: --gpus=all --ipc=host --runtime=nvidia

  #   steps:
  #   - uses: actions/checkout@v4
    
  #   - name: Install libraries
  #     run: |
  #       apt update
  #       apt install -y curl libicu-dev
  #       apt-get install wget
  #       wget https://packages.microsoft.com/config/ubuntu/22.04/packages-microsoft-prod.deb -O packages-microsoft-prod.deb
  #       dpkg -i packages-microsoft-prod.deb
  #       rm packages-microsoft-prod.deb
  #       apt-get update  && apt-get install -y dotnet-sdk-8.0

  #   - name: Prepare models
  #     run: | 
  #       apt-get update
  #       apt-get install -y python3.10 python3-pip
  #       python3 --version
  #       pip install huggingface_hub
  #       python3 .github/download_models.py --model-dir ${{ matrix.modeldir }} --model-list LLama.Benchmark/Assets/models.txt --endpoint https://hf-mirror.com

  #   - name: Clear package cache
  #     run: dotnet clean LLamaSharp.sln && dotnet nuget locals all --clear
  #   - name: Restore packages
  #     run: dotnet restore LLamaSharp.sln
  #   - name: Build
  #     run: | 
  #       dotnet clean
  #       dotnet build LLama/LLamaSharp.csproj -c Release --no-restore
  #       dotnet build LLama.Benchmark/LLama.Benchmark.csproj -c Release --no-restore
  #   - name: Run benchmark test
  #     run: dotnet run --project LLama.Benchmark/LLama.Benchmark.csproj -c Release --anyCategories LLama
  #   - name: Upload artifacts
  #     if: always()
  #     uses: actions/upload-artifact@v3
  #     with:
  #       name: Benchmark_Results
  #       path: BenchmarkDotNet.Artifacts/results/*

  # Runs the benchmark suite on a runner labelled self-hosted/windows/gpu.
  # The job is gated on the pull request carrying the 'benchmark' label; on
  # push events there is no pull_request payload, so the condition is false
  # and the job is skipped.
  windows-benchmark-cuda:
    if: contains(github.event.pull_request.labels.*.name, 'benchmark')
    runs-on: [self-hosted, windows, gpu]

    strategy:
      # Let remaining matrix entries finish even if one of them fails.
      fail-fast: false
      matrix:
        build: [cuda11]
        include:
          # modeldir is passed to download_models.py as --model-dir.
          - build: cuda11
            modeldir: F:\Models

    steps:
    - uses: actions/checkout@v4

    # Quoted so YAML keeps the version as the string '3.10', not the float 3.1.
    - uses: actions/setup-python@v5
      with:
        python-version: '3.10'

    # Fetch the models listed in models.txt into the matrix model directory.
    - name: Prepare models
      run: |
        python --version
        pip install huggingface_hub
        python .github/download_models.py --model-dir ${{ matrix.modeldir }} --model-list LLama.Benchmark/Assets/models.txt --endpoint https://hf-mirror.com

    # Start from a clean solution and empty NuGet caches so results from a
    # previous run on this runner are not reused.
    - name: Clear package cache
      run: dotnet clean LLamaSharp.sln && dotnet nuget locals all --clear
    - name: Restore packages
      run: dotnet restore LLamaSharp.sln
    # --no-restore: packages were already restored by the previous step.
    - name: Build
      run: |
        dotnet clean
        dotnet build LLama/LLamaSharp.csproj -c Release --no-restore
        dotnet build LLama.Benchmark/LLama.Benchmark.csproj -c Release --no-restore
    - name: Run benchmark test
      run: dotnet run --project LLama.Benchmark/LLama.Benchmark.csproj -c Release --anyCategories LLama
    # always(): publish whatever results exist even when an earlier step failed.
    # upload-artifact v3 has been retired by GitHub and fails the run; v4 is
    # the supported major version. v4 requires artifact names to be unique
    # within a run, so give each matrix entry its own name if more builds are
    # added to the matrix.
    - name: Upload artifacts
      if: always()
      uses: actions/upload-artifact@v4
      with:
        name: Benchmark_Results
        path: BenchmarkDotNet.Artifacts/results/*