| @@ -20,7 +20,7 @@ jobs: | |||||
| include: | include: | ||||
| - build: cuda11 | - build: cuda11 | ||||
| image: nvidia/cuda:11.7.1-devel-ubuntu22.04 | image: nvidia/cuda:11.7.1-devel-ubuntu22.04 | ||||
| model_dir: /llamasharp_ci/models_benchmark | |||||
| modeldir: /llamasharp_ci/models_benchmark | |||||
| # - build: cuda12 | # - build: cuda12 | ||||
| # image: nvidia/cuda:12.1.1-runtime-ubuntu22.04 | # image: nvidia/cuda:12.1.1-runtime-ubuntu22.04 | ||||
| @@ -58,7 +58,7 @@ jobs: | |||||
| python-version: '3.10' | python-version: '3.10' | ||||
| run: | | run: | | ||||
| pip install huggingface_hub | pip install huggingface_hub | ||||
| python3 LLama.Benchmark/prepare_models.py --model-dir ${{ matrix.model_dir }} --model-list LLama.Benchmark/Assets/models.txt --endpoint https://hf-mirror.com | |||||
| python3 LLama.Benchmark/prepare_models.py --model-dir ${{ matrix.modeldir }} --model-list LLama.Benchmark/Assets/models.txt --endpoint https://hf-mirror.com | |||||
| - name: Clear package cache | - name: Clear package cache | ||||
| run: dotnet clean LLamaSharp.sln && dotnet nuget locals all --clear | run: dotnet clean LLamaSharp.sln && dotnet nuget locals all --clear | ||||
| @@ -69,7 +69,7 @@ jobs: | |||||
| dotnet build LLama/LLamaSharp.csproj -c release --no-restore | dotnet build LLama/LLamaSharp.csproj -c release --no-restore | ||||
| dotnet build LLama.Benchmark/LLama.Benchmark.csproj -c release --no-restore | dotnet build LLama.Benchmark/LLama.Benchmark.csproj -c release --no-restore | ||||
| - name: Run benchmark test | - name: Run benchmark test | ||||
| run: dotnet run --project LLama.Benchmark/LLama.Benchmark.csproj -c release ${{ matrix.model_dir }} | |||||
| run: dotnet run --project LLama.Benchmark/LLama.Benchmark.csproj -c release ${{ matrix.modeldir }} | |||||
| - name: Upload artifacts | - name: Upload artifacts | ||||
| if: always() | if: always() | ||||
| uses: actions/upload-artifact@v3 | uses: actions/upload-artifact@v3 | ||||