Compare commits
3 Commits
b713dbe669
...
03bed93fee
| Author | SHA1 | Date | |
|---|---|---|---|
|
03bed93fee
|
|||
|
4a5211d830
|
|||
|
6d2dc5ff1a
|
@@ -94,6 +94,13 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
include:
|
include:
|
||||||
|
- flavour: ampere
|
||||||
|
compute_cap: "86"
|
||||||
|
runner: cuda-13.0
|
||||||
|
cuda_home: /usr/local/cuda-13.0
|
||||||
|
build_jobs: 8
|
||||||
|
nvcc_threads: 4
|
||||||
|
cargo_features: "cuda cudnn flash-attn"
|
||||||
- flavour: ada
|
- flavour: ada
|
||||||
compute_cap: "89"
|
compute_cap: "89"
|
||||||
runner: cuda-13.0
|
runner: cuda-13.0
|
||||||
@@ -193,6 +200,7 @@ jobs:
|
|||||||
fail-fast: false
|
fail-fast: false
|
||||||
matrix:
|
matrix:
|
||||||
include:
|
include:
|
||||||
|
- flavour: ampere
|
||||||
- flavour: ada
|
- flavour: ada
|
||||||
- flavour: blackwell
|
- flavour: blackwell
|
||||||
steps:
|
steps:
|
||||||
|
|||||||
@@ -16,6 +16,13 @@ env:
|
|||||||
SCCACHE_S3_USE_SSL: "false"
|
SCCACHE_S3_USE_SSL: "false"
|
||||||
AWS_ACCESS_KEY_ID: ${{ secrets.SCCACHE_S3_ACCESS_KEY }}
|
AWS_ACCESS_KEY_ID: ${{ secrets.SCCACHE_S3_ACCESS_KEY }}
|
||||||
AWS_SECRET_ACCESS_KEY: ${{ secrets.SCCACHE_S3_SECRET_KEY }}
|
AWS_SECRET_ACCESS_KEY: ${{ secrets.SCCACHE_S3_SECRET_KEY }}
|
||||||
|
# fmt, clippy, and test all run in parallel on the same `rust` runner
|
||||||
|
# and would otherwise share /root/.cache/act/<hash>/hostexecutor/target/,
|
||||||
|
# racing each other's cargo temp files (.tmpXXXXXX) and failing builds
|
||||||
|
# mid-compile. Give each job its own target directory so the invocations
|
||||||
|
# don't collide. sccache still backs the actual rustc cache, so the
|
||||||
|
# rebuild penalty is small.
|
||||||
|
CARGO_TARGET_DIR: target-${{ github.job }}
|
||||||
|
|
||||||
jobs:
|
jobs:
|
||||||
fmt:
|
fmt:
|
||||||
|
|||||||
30
asset/manifest.yml
Normal file
30
asset/manifest.yml
Normal file
@@ -0,0 +1,30 @@
|
|||||||
|
# Helexa fleet manifest.
|
||||||
|
#
|
||||||
|
# Drives rolling deploys via script/deploy.sh and serves as the source
|
||||||
|
# of truth for which hosts run cortex vs neuron, and which CUDA
|
||||||
|
# compute-capability flavour each neuron host needs.
|
||||||
|
#
|
||||||
|
# Flavour ↔ NVIDIA generation ↔ compute cap:
|
||||||
|
# ampere sm_86 (RTX 30 series — e.g. 3060)
|
||||||
|
# ada sm_89 (RTX 40 series — e.g. 4090)
|
||||||
|
# blackwell sm_120 (RTX 50 series — e.g. 5090)
|
||||||
|
#
|
||||||
|
# The flavour determines which RPM is installed on a given neuron host:
|
||||||
|
# helexa-neuron-<flavour>. Only one flavour may be installed at a time
|
||||||
|
# (the packages Conflict: with each other).
|
||||||
|
|
||||||
|
cortex:
|
||||||
|
host: hanzalova.internal
|
||||||
|
|
||||||
|
neurons:
|
||||||
|
- host: beast.hanzalova.internal
|
||||||
|
flavour: blackwell
|
||||||
|
gpu: "2x RTX 5090"
|
||||||
|
|
||||||
|
- host: benjy.hanzalova.internal
|
||||||
|
flavour: ada
|
||||||
|
gpu: "RTX 4090"
|
||||||
|
|
||||||
|
- host: quadbrat.hanzalova.internal
|
||||||
|
flavour: ampere
|
||||||
|
gpu: "RTX 3060"
|
||||||
Reference in New Issue
Block a user