feat: replace cuda13 flavour with per-GPU-generation packages
All checks were successful
deploy-ui / build-and-deploy (push) Successful in 44s

Build separate packages for each GPU generation instead of a single
cuda13 package:
- mistralrs-ampere (sm_86, e.g. RTX 3060)
- mistralrs-ada (sm_89, e.g. RTX 4090)
- mistralrs-blackwell (sm_120, e.g. RTX 5090)

All three packages are built with the same CUDA 13.0 toolkit and Cargo features
(cuda, cudnn, flash-attn, nccl); only the compute capability target differs.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
This commit is contained in:
2026-05-11 14:45:28 +03:00
parent 661cf574f2
commit ace6037a2d
5 changed files with 53 additions and 10 deletions

View File

@@ -30,7 +30,23 @@ jobs:
fail-fast: false
matrix:
include:
- name: cuda13
- name: ampere
fedora_version: "43"
runner: cuda-13.0
cuda_home: /usr/local/cuda-13.0
cargo_features: "cuda cudnn flash-attn nccl"
compute_caps: "86"
build_jobs: 12
nvcc_threads: 4
- name: ada
fedora_version: "43"
runner: cuda-13.0
cuda_home: /usr/local/cuda-13.0
cargo_features: "cuda cudnn flash-attn nccl"
compute_caps: "89"
build_jobs: 12
nvcc_threads: 4
- name: blackwell
fedora_version: "43"
runner: cuda-13.0
cuda_home: /usr/local/cuda-13.0
@@ -89,7 +105,11 @@ jobs:
fail-fast: false
matrix:
include:
- name: cuda13
- name: ampere
fedora_version: "43"
- name: ada
fedora_version: "43"
- name: blackwell
fedora_version: "43"
steps:
- uses: actions/checkout@v4

View File

@@ -18,7 +18,23 @@ jobs:
fail-fast: false
matrix:
include:
- name: cuda13
- name: ampere
fedora_version: "43"
runner: cuda-13.0
cuda_home: /usr/local/cuda-13.0
cargo_features: "cuda cudnn flash-attn nccl"
compute_caps: "86"
build_jobs: 12
nvcc_threads: 4
- name: ada
fedora_version: "43"
runner: cuda-13.0
cuda_home: /usr/local/cuda-13.0
cargo_features: "cuda cudnn flash-attn nccl"
compute_caps: "89"
build_jobs: 12
nvcc_threads: 4
- name: blackwell
fedora_version: "43"
runner: cuda-13.0
cuda_home: /usr/local/cuda-13.0
@@ -76,7 +92,11 @@ jobs:
fail-fast: false
matrix:
include:
- name: cuda13
- name: ampere
fedora_version: "43"
- name: ada
fedora_version: "43"
- name: blackwell
fedora_version: "43"
steps:
- uses: actions/checkout@v4

View File

@@ -28,7 +28,7 @@ jobs:
run: |
version="${UPSTREAM_TAG#v}"
needs_build=false
for target in "43:cuda13"; do
for target in "43:ampere" "43:ada" "43:blackwell"; do
fedora_version="${target%%:*}"
flavour="${target##*:}"
base_url="https://rpm.lair.cafe/fedora/${fedora_version}/x86_64"
@@ -116,7 +116,7 @@ jobs:
run: |
prerelease="0.1.${UPSTREAM_DATE}git${UPSTREAM_SHORT_SHA}"
needs_build=false
for target in "43:cuda13"; do
for target in "43:ampere" "43:ada" "43:blackwell"; do
fedora_version="${target%%:*}"
flavour="${target##*:}"
base_url="https://rpm.lair.cafe/fedora/${fedora_version}/x86_64/unstable"

View File

@@ -4,7 +4,7 @@
# Passed in via --define at rpmbuild time
%{!?mistralrs_version: %global mistralrs_version 0.7.0}
%{!?mistralrs_flavour: %global mistralrs_flavour cuda13}
%{!?mistralrs_flavour: %global mistralrs_flavour blackwell}
# For prerelease builds, pass --define "mistralrs_prerelease 0.1.YYYYMMDDgitSHORTSHA"
%if 0%{?mistralrs_prerelease:1}

View File

@@ -44,8 +44,11 @@ export function Home() {
</CodeBlock>
<h6 className="mt-4">3. Install a package</h6>
<p className="text-body-secondary">
Choose the package matching your GPU generation:
</p>
<CodeBlock language="bash">
{`sudo dnf install mistralrs-cuda13`}
{`# RTX 3000 series (Ampere)\nsudo dnf install mistralrs-ampere\n\n# RTX 4000 series (Ada Lovelace)\nsudo dnf install mistralrs-ada\n\n# RTX 5000 series (Blackwell)\nsudo dnf install mistralrs-blackwell`}
</CodeBlock>
</Card.Body>
</Card>
@@ -78,7 +81,7 @@ export function Home() {
Install or update from unstable
</h6>
<CodeBlock language="bash">
{`sudo dnf --enablerepo=lair-cafe-unstable install mistralrs-cuda13`}
{`sudo dnf --enablerepo=lair-cafe-unstable install mistralrs-ada`}
</CodeBlock>
<h6 className="mt-4">
@@ -89,7 +92,7 @@ export function Home() {
stable releases, exclude prerelease versions:
</p>
<CodeBlock language="bash">
{`sudo dnf --disablerepo=lair-cafe-unstable update mistralrs-cuda13`}
{`sudo dnf --disablerepo=lair-cafe-unstable update mistralrs-ada`}
</CodeBlock>
</Card.Body>
</Card>