bench-server-baseline (phi-2, q4_0)
Details
Push Docker image to Docker Hub (light, .devops/main.Dockerfile, linux/amd64,linux/arm64)
Details
bench-server-baseline (phi-2, q8_0)
Details
Push Docker image to Docker Hub (full, .devops/full.Dockerfile, linux/amd64,linux/arm64)
Details
bench-server-baseline (phi-2, f16)
Details
Push Docker image to Docker Hub (server, .devops/server.Dockerfile, linux/amd64,linux/arm64)
Details
Push Docker image to Docker Hub (light-cuda, .devops/main-cuda.Dockerfile, linux/amd64)
Details
Push Docker image to Docker Hub (full-cuda, .devops/full-cuda.Dockerfile, linux/amd64)
Details
Push Docker image to Docker Hub (server-cuda, .devops/server-cuda.Dockerfile, linux/amd64)
Details
Push Docker image to Docker Hub (light-rocm, .devops/main-rocm.Dockerfile, linux/amd64,linux/arm64)
Details
Push Docker image to Docker Hub (full-rocm, .devops/full-rocm.Dockerfile, linux/amd64,linux/arm64)
Details
Push Docker image to Docker Hub (server-rocm, .devops/server-rocm.Dockerfile, linux/amd64,linux/a...
Details
Push Docker image to Docker Hub (light-intel, .devops/main-intel.Dockerfile, linux/amd64)
Details
Push Docker image to Docker Hub (server-intel, .devops/server-intel.Dockerfile, linux/amd64)
Details
ubuntu-latest-cmake-mpi (mpich)
Details
ubuntu-latest-cmake-mpi (libopenmpi-dev)
Details
macOS-latest-swift (generic/platform=macOS)
Details
macOS-latest-swift (generic/platform=iOS)
Details
macOS-latest-swift (generic/platform=tvOS)
Details
windows-msys2 (UCRT64, ucrt-x86_64, Release)
Details
windows-msys2 (CLANG64, clang-x86_64, Release)
Details
windows-latest-cmake (noavx, -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_AVX=OFF -DLLAMA_A...
Details
windows-latest-cmake (avx2, -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DBUILD_SHARED_LIBS=ON)
Details
windows-latest-cmake (avx, -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_AVX2=OFF -DBUILD_SH...
Details
windows-latest-cmake (avx512, -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_AVX512=ON -DBUIL...
Details
windows-latest-cmake (clblast, -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_CLBLAST=ON -DBU...
Details
windows-latest-cmake (openblas, -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_BLAS=ON -DBUIL...
Details
windows-latest-cmake (kompute, -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_KOMPUTE=ON -DKO...
Details
windows-latest-cmake (vulkan, -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DLLAMA_VULKAN=ON -DBUIL...
Details
windows-latest-cmake (arm64, -A ARM64 -DLLAMA_NATIVE=OFF -DLLAMA_BUILD_SERVER=ON -DBUILD_SHARED_L...
Details
windows-latest-cmake-cuda (12.2.0, cuda)
Details
windows-latest-cmake-cuda (11.7.1, cuda)
Details
bench-server-bench-server-baseline-Standard_NC4as_T4_v3-phi-2-f16
{"i":471,"req":{"p95":24996.71,"avg":10016.94},"pp":{"p95":578.91,"avg":127.91,"0":1203.82},"tg":{"p95":28.18,"avg":25.55,"0":22.68}}
Details
bench-server-bench-server-baseline-Standard_NC4as_T4_v3-phi-2-q4_0
{"i":519,"req":{"p95":22221.76,"avg":9024.52},"pp":{"p95":466.16,"avg":106.05,"0":760.85},"tg":{"p95":47.97,"avg":30.9,"0":28.3}}
Details
bench-server-bench-server-baseline-Standard_NC4as_T4_v3-phi-2-q8_0
{"i":480,"req":{"p95":22983.79,"avg":9835.62},"pp":{"p95":611.29,"avg":128.61,"0":858.65},"tg":{"p95":37.47,"avg":28.04,"0":27.32}}
Details