feat: replace cuda13 flavour with per-GPU-generation packages
All checks were successful
deploy-ui / build-and-deploy (push) Successful in 44s
All checks were successful
deploy-ui / build-and-deploy (push) Successful in 44s
Build separate packages for each GPU generation instead of a single cuda13 package:

- mistralrs-ampere (sm_86, RTX 3060)
- mistralrs-ada (sm_89, RTX 4090)
- mistralrs-blackwell (sm_120, RTX 5090)

All use the same CUDA 13.0 toolkit and features (cuda, cudnn, flash-attn, nccl), varying only the compute capability target.

Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
This commit is contained in:
@@ -30,7 +30,23 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
include:
|
include:
|
||||||
- name: cuda13
|
- name: ampere
|
||||||
|
fedora_version: "43"
|
||||||
|
runner: cuda-13.0
|
||||||
|
cuda_home: /usr/local/cuda-13.0
|
||||||
|
cargo_features: "cuda cudnn flash-attn nccl"
|
||||||
|
compute_caps: "86"
|
||||||
|
build_jobs: 12
|
||||||
|
nvcc_threads: 4
|
||||||
|
- name: ada
|
||||||
|
fedora_version: "43"
|
||||||
|
runner: cuda-13.0
|
||||||
|
cuda_home: /usr/local/cuda-13.0
|
||||||
|
cargo_features: "cuda cudnn flash-attn nccl"
|
||||||
|
compute_caps: "89"
|
||||||
|
build_jobs: 12
|
||||||
|
nvcc_threads: 4
|
||||||
|
- name: blackwell
|
||||||
fedora_version: "43"
|
fedora_version: "43"
|
||||||
runner: cuda-13.0
|
runner: cuda-13.0
|
||||||
cuda_home: /usr/local/cuda-13.0
|
cuda_home: /usr/local/cuda-13.0
|
||||||
@@ -89,7 +105,11 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
include:
|
include:
|
||||||
- name: cuda13
|
- name: ampere
|
||||||
|
fedora_version: "43"
|
||||||
|
- name: ada
|
||||||
|
fedora_version: "43"
|
||||||
|
- name: blackwell
|
||||||
fedora_version: "43"
|
fedora_version: "43"
|
||||||
steps:
|
steps:
|
||||||
- uses: actions/checkout@v4
|
- uses: actions/checkout@v4
|
||||||
|
|||||||
@@ -18,7 +18,23 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
include:
|
include:
|
||||||
- name: cuda13
|
- name: ampere
|
||||||
|
fedora_version: "43"
|
||||||
|
runner: cuda-13.0
|
||||||
|
cuda_home: /usr/local/cuda-13.0
|
||||||
|
cargo_features: "cuda cudnn flash-attn nccl"
|
||||||
|
compute_caps: "86"
|
||||||
|
build_jobs: 12
|
||||||
|
nvcc_threads: 4
|
||||||
|
- name: ada
|
||||||
|
fedora_version: "43"
|
||||||
|
runner: cuda-13.0
|
||||||
|
cuda_home: /usr/local/cuda-13.0
|
||||||
|
cargo_features: "cuda cudnn flash-attn nccl"
|
||||||
|
compute_caps: "89"
|
||||||
|
build_jobs: 12
|
||||||
|
nvcc_threads: 4
|
||||||
|
- name: blackwell
|
||||||
fedora_version: "43"
|
fedora_version: "43"
|
||||||
runner: cuda-13.0
|
runner: cuda-13.0
|
||||||
cuda_home: /usr/local/cuda-13.0
|
cuda_home: /usr/local/cuda-13.0
|
||||||
@@ -76,7 +92,11 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
include:
|
include:
|
||||||
- name: cuda13
|
- name: ampere
|
||||||
|
fedora_version: "43"
|
||||||
|
- name: ada
|
||||||
|
fedora_version: "43"
|
||||||
|
- name: blackwell
|
||||||
fedora_version: "43"
|
fedora_version: "43"
|
||||||
steps:
|
steps:
|
||||||
- uses: actions/checkout@v4
|
- uses: actions/checkout@v4
|
||||||
|
|||||||
@@ -28,7 +28,7 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
version="${UPSTREAM_TAG#v}"
|
version="${UPSTREAM_TAG#v}"
|
||||||
needs_build=false
|
needs_build=false
|
||||||
for target in "43:cuda13"; do
|
for target in "43:ampere" "43:ada" "43:blackwell"; do
|
||||||
fedora_version="${target%%:*}"
|
fedora_version="${target%%:*}"
|
||||||
flavour="${target##*:}"
|
flavour="${target##*:}"
|
||||||
base_url="https://rpm.lair.cafe/fedora/${fedora_version}/x86_64"
|
base_url="https://rpm.lair.cafe/fedora/${fedora_version}/x86_64"
|
||||||
@@ -116,7 +116,7 @@ jobs:
|
|||||||
run: |
|
run: |
|
||||||
prerelease="0.1.${UPSTREAM_DATE}git${UPSTREAM_SHORT_SHA}"
|
prerelease="0.1.${UPSTREAM_DATE}git${UPSTREAM_SHORT_SHA}"
|
||||||
needs_build=false
|
needs_build=false
|
||||||
for target in "43:cuda13"; do
|
for target in "43:ampere" "43:ada" "43:blackwell"; do
|
||||||
fedora_version="${target%%:*}"
|
fedora_version="${target%%:*}"
|
||||||
flavour="${target##*:}"
|
flavour="${target##*:}"
|
||||||
base_url="https://rpm.lair.cafe/fedora/${fedora_version}/x86_64/unstable"
|
base_url="https://rpm.lair.cafe/fedora/${fedora_version}/x86_64/unstable"
|
||||||
|
|||||||
@@ -4,7 +4,7 @@
|
|||||||
|
|
||||||
# Passed in via --define at rpmbuild time
|
# Passed in via --define at rpmbuild time
|
||||||
%{!?mistralrs_version: %global mistralrs_version 0.7.0}
|
%{!?mistralrs_version: %global mistralrs_version 0.7.0}
|
||||||
%{!?mistralrs_flavour: %global mistralrs_flavour cuda13}
|
%{!?mistralrs_flavour: %global mistralrs_flavour blackwell}
|
||||||
|
|
||||||
# For prerelease builds, pass --define "mistralrs_prerelease 0.1.YYYYMMDDgitSHORTSHA"
|
# For prerelease builds, pass --define "mistralrs_prerelease 0.1.YYYYMMDDgitSHORTSHA"
|
||||||
%if 0%{?mistralrs_prerelease:1}
|
%if 0%{?mistralrs_prerelease:1}
|
||||||
|
|||||||
@@ -44,8 +44,11 @@ export function Home() {
|
|||||||
</CodeBlock>
|
</CodeBlock>
|
||||||
|
|
||||||
<h6 className="mt-4">3. Install a package</h6>
|
<h6 className="mt-4">3. Install a package</h6>
|
||||||
|
<p className="text-body-secondary">
|
||||||
|
Choose the package matching your GPU generation:
|
||||||
|
</p>
|
||||||
<CodeBlock language="bash">
|
<CodeBlock language="bash">
|
||||||
{`sudo dnf install mistralrs-cuda13`}
|
{`# RTX 3000 series (Ampere)\nsudo dnf install mistralrs-ampere\n\n# RTX 4000 series (Ada Lovelace)\nsudo dnf install mistralrs-ada\n\n# RTX 5000 series (Blackwell)\nsudo dnf install mistralrs-blackwell`}
|
||||||
</CodeBlock>
|
</CodeBlock>
|
||||||
</Card.Body>
|
</Card.Body>
|
||||||
</Card>
|
</Card>
|
||||||
@@ -78,7 +81,7 @@ export function Home() {
|
|||||||
Install or update from unstable
|
Install or update from unstable
|
||||||
</h6>
|
</h6>
|
||||||
<CodeBlock language="bash">
|
<CodeBlock language="bash">
|
||||||
{`sudo dnf --enablerepo=lair-cafe-unstable install mistralrs-cuda13`}
|
{`sudo dnf --enablerepo=lair-cafe-unstable install mistralrs-ada`}
|
||||||
</CodeBlock>
|
</CodeBlock>
|
||||||
|
|
||||||
<h6 className="mt-4">
|
<h6 className="mt-4">
|
||||||
@@ -89,7 +92,7 @@ export function Home() {
|
|||||||
stable releases, exclude prerelease versions:
|
stable releases, exclude prerelease versions:
|
||||||
</p>
|
</p>
|
||||||
<CodeBlock language="bash">
|
<CodeBlock language="bash">
|
||||||
{`sudo dnf --disablerepo=lair-cafe-unstable update mistralrs-cuda13`}
|
{`sudo dnf --disablerepo=lair-cafe-unstable update mistralrs-ada`}
|
||||||
</CodeBlock>
|
</CodeBlock>
|
||||||
</Card.Body>
|
</Card.Body>
|
||||||
</Card>
|
</Card>
|
||||||
|
|||||||
Reference in New Issue
Block a user