Compare commits
8 Commits
v0.1.15
...
7f797b0265
| Author | SHA1 | Date | |
|---|---|---|---|
|
7f797b0265
|
|||
|
5a0360c1d5
|
|||
|
472c0e8737
|
|||
|
|
b9d8e30058 | ||
|
25f75fe552
|
|||
|
3f94c50817
|
|||
|
3e1fb60076
|
|||
|
|
9bf987888c |
@@ -18,51 +18,33 @@ env:
|
|||||||
AWS_SECRET_ACCESS_KEY: ${{ secrets.SCCACHE_S3_SECRET_KEY }}
|
AWS_SECRET_ACCESS_KEY: ${{ secrets.SCCACHE_S3_SECRET_KEY }}
|
||||||
|
|
||||||
jobs:
|
jobs:
|
||||||
check:
|
fmt:
|
||||||
name: Format, lint, build, test
|
name: Format
|
||||||
runs-on: fedora
|
runs-on: rust
|
||||||
steps:
|
steps:
|
||||||
- uses: actions/checkout@v4
|
- uses: actions/checkout@v4
|
||||||
|
- run: cargo fmt --check --all
|
||||||
|
|
||||||
- name: Cache cargo registry and target
|
clippy:
|
||||||
uses: actions/cache@v4
|
name: Clippy
|
||||||
with:
|
runs-on: rust
|
||||||
path: |
|
steps:
|
||||||
~/.cargo/bin
|
- uses: actions/checkout@v4
|
||||||
~/.cargo/registry/index
|
- run: cargo clippy --workspace -- -D warnings
|
||||||
~/.cargo/registry/cache
|
- run: sccache --show-stats
|
||||||
~/.cargo/git/db
|
|
||||||
target
|
|
||||||
key: ${{ runner.os }}-cargo-${{ hashFiles('**/Cargo.lock') }}
|
|
||||||
restore-keys: |
|
|
||||||
${{ runner.os }}-cargo-
|
|
||||||
|
|
||||||
- name: Ensure sccache with S3 support
|
test:
|
||||||
env:
|
name: Test
|
||||||
RUSTC_WRAPPER: ""
|
runs-on: rust
|
||||||
run: |
|
steps:
|
||||||
if sccache --version 2>/dev/null && sccache --show-stats 2>/dev/null; then
|
- uses: actions/checkout@v4
|
||||||
echo "sccache with S3 support already installed"
|
- run: cargo test --workspace
|
||||||
else
|
- run: sccache --show-stats
|
||||||
cargo install sccache --features s3 --locked
|
|
||||||
fi
|
|
||||||
|
|
||||||
- name: Check formatting
|
|
||||||
run: cargo fmt --check --all
|
|
||||||
|
|
||||||
- name: Clippy
|
|
||||||
run: cargo clippy --workspace -- -D warnings
|
|
||||||
|
|
||||||
- name: Test
|
|
||||||
run: cargo test --workspace
|
|
||||||
|
|
||||||
- name: Show sccache stats
|
|
||||||
run: sccache --show-stats
|
|
||||||
|
|
||||||
srpm-cortex:
|
srpm-cortex:
|
||||||
name: Build cortex SRPM
|
name: Build cortex SRPM
|
||||||
runs-on: fedora
|
runs-on: rpm
|
||||||
needs: check
|
needs: [fmt, clippy, test]
|
||||||
if: startsWith(github.ref, 'refs/tags/v')
|
if: startsWith(github.ref, 'refs/tags/v')
|
||||||
steps:
|
steps:
|
||||||
- uses: actions/checkout@v4
|
- uses: actions/checkout@v4
|
||||||
@@ -121,8 +103,8 @@ jobs:
|
|||||||
|
|
||||||
srpm-neuron:
|
srpm-neuron:
|
||||||
name: Build neuron SRPM
|
name: Build neuron SRPM
|
||||||
runs-on: fedora
|
runs-on: rpm
|
||||||
needs: check
|
needs: [fmt, clippy, test]
|
||||||
if: startsWith(github.ref, 'refs/tags/v')
|
if: startsWith(github.ref, 'refs/tags/v')
|
||||||
steps:
|
steps:
|
||||||
- uses: actions/checkout@v4
|
- uses: actions/checkout@v4
|
||||||
@@ -181,7 +163,7 @@ jobs:
|
|||||||
|
|
||||||
copr-cortex:
|
copr-cortex:
|
||||||
name: Publish cortex to COPR
|
name: Publish cortex to COPR
|
||||||
runs-on: fedora
|
runs-on: fedora-43
|
||||||
needs: srpm-cortex
|
needs: srpm-cortex
|
||||||
steps:
|
steps:
|
||||||
- name: Download SRPM
|
- name: Download SRPM
|
||||||
@@ -198,7 +180,7 @@ jobs:
|
|||||||
|
|
||||||
copr-neuron:
|
copr-neuron:
|
||||||
name: Publish neuron to COPR
|
name: Publish neuron to COPR
|
||||||
runs-on: fedora
|
runs-on: fedora-43
|
||||||
needs: srpm-neuron
|
needs: srpm-neuron
|
||||||
steps:
|
steps:
|
||||||
- name: Download SRPM
|
- name: Download SRPM
|
||||||
@@ -215,7 +197,7 @@ jobs:
|
|||||||
|
|
||||||
bump-version:
|
bump-version:
|
||||||
name: Bump version in source
|
name: Bump version in source
|
||||||
runs-on: fedora
|
runs-on: rust
|
||||||
needs: [copr-cortex, copr-neuron]
|
needs: [copr-cortex, copr-neuron]
|
||||||
steps:
|
steps:
|
||||||
- uses: actions/checkout@v4
|
- uses: actions/checkout@v4
|
||||||
|
|||||||
1
.gitignore
vendored
1
.gitignore
vendored
@@ -5,3 +5,4 @@
|
|||||||
.vscode/
|
.vscode/
|
||||||
cortex.toml
|
cortex.toml
|
||||||
doc/plan/*
|
doc/plan/*
|
||||||
|
script/deploy.sh
|
||||||
|
|||||||
17
CLAUDE.md
17
CLAUDE.md
@@ -125,7 +125,8 @@ automatically. Clippy warnings must be resolved, not suppressed with
|
|||||||
- One or more GPU nodes running mistral.rs on port 8080
|
- One or more GPU nodes running mistral.rs on port 8080
|
||||||
- Optionally a metrics-only node (no GPU) for Prometheus/Grafana
|
- Optionally a metrics-only node (no GPU) for Prometheus/Grafana
|
||||||
- Each node runs `mistralrs serve` on port 8080
|
- Each node runs `mistralrs serve` on port 8080
|
||||||
- Gateway listens on port 8000 (API) and 9100 (metrics)
|
- Gateway listens on port 31313 (API) and 31314 (metrics)
|
||||||
|
- neuron listens on port 13131 on each GPU host
|
||||||
- TLS terminated at gateway or via nginx; internal traffic is plaintext over WireGuard
|
- TLS terminated at gateway or via nginx; internal traffic is plaintext over WireGuard
|
||||||
|
|
||||||
## Conventions
|
## Conventions
|
||||||
@@ -380,7 +381,7 @@ processes (one process per loaded model, each on its own port).
|
|||||||
|
|
||||||
## neuron API
|
## neuron API
|
||||||
|
|
||||||
neuron exposes an HTTP API on port 9090 that cortex polls and calls.
|
neuron exposes an HTTP API on port 13131 that cortex polls and calls.
|
||||||
|
|
||||||
```
|
```
|
||||||
GET /discovery
|
GET /discovery
|
||||||
@@ -424,8 +425,8 @@ endpoint. cortex.toml shrinks to:
|
|||||||
|
|
||||||
```toml
|
```toml
|
||||||
[gateway]
|
[gateway]
|
||||||
listen = "0.0.0.0:8000"
|
listen = "0.0.0.0:31313"
|
||||||
metrics_listen = "0.0.0.0:9100"
|
metrics_listen = "0.0.0.0:31314"
|
||||||
|
|
||||||
[eviction]
|
[eviction]
|
||||||
strategy = "lru"
|
strategy = "lru"
|
||||||
@@ -433,15 +434,15 @@ defrag_after_cycles = 50
|
|||||||
|
|
||||||
[[neurons]]
|
[[neurons]]
|
||||||
name = "beast"
|
name = "beast"
|
||||||
endpoint = "http://beast.hanzalova.internal:9090"
|
endpoint = "http://beast.hanzalova.internal:13131"
|
||||||
|
|
||||||
[[neurons]]
|
[[neurons]]
|
||||||
name = "benjy"
|
name = "benjy"
|
||||||
endpoint = "http://benjy.kosherinata.internal:9090"
|
endpoint = "http://benjy.hanzalova.internal:13131"
|
||||||
|
|
||||||
[[neurons]]
|
[[neurons]]
|
||||||
name = "quadbrat"
|
name = "quadbrat"
|
||||||
endpoint = "http://quadbrat.hanzalova.internal:9090"
|
endpoint = "http://quadbrat.hanzalova.internal:13131"
|
||||||
```
|
```
|
||||||
|
|
||||||
On startup and periodically, cortex calls `GET /discovery` and
|
On startup and periodically, cortex calls `GET /discovery` and
|
||||||
@@ -521,7 +522,7 @@ cortex/
|
|||||||
│ │ └── metrics.rs # prometheus exporter (unchanged)
|
│ │ └── metrics.rs # prometheus exporter (unchanged)
|
||||||
│ ├── neuron/ # node plane (replaces cortex-agent)
|
│ ├── neuron/ # node plane (replaces cortex-agent)
|
||||||
│ │ └── src/
|
│ │ └── src/
|
||||||
│ │ ├── main.rs # binary entrypoint, axum server on :9090
|
│ │ ├── main.rs # binary entrypoint, axum server on :13131
|
||||||
│ │ ├── discovery.rs # nvidia-smi, device enumeration
|
│ │ ├── discovery.rs # nvidia-smi, device enumeration
|
||||||
│ │ ├── health.rs # runtime GPU polling
|
│ │ ├── health.rs # runtime GPU polling
|
||||||
│ │ ├── api.rs # HTTP handlers for /discovery, /models, etc.
|
│ │ ├── api.rs # HTTP handlers for /discovery, /models, etc.
|
||||||
|
|||||||
8
Cargo.lock
generated
8
Cargo.lock
generated
@@ -351,7 +351,7 @@ checksum = "773648b94d0e5d620f64f280777445740e61fe701025087ec8b57f45c791888b"
|
|||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "cortex-cli"
|
name = "cortex-cli"
|
||||||
version = "0.1.12"
|
version = "0.1.16"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"anyhow",
|
"anyhow",
|
||||||
"clap",
|
"clap",
|
||||||
@@ -366,7 +366,7 @@ dependencies = [
|
|||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "cortex-core"
|
name = "cortex-core"
|
||||||
version = "0.1.12"
|
version = "0.1.16"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"anyhow",
|
"anyhow",
|
||||||
"async-trait",
|
"async-trait",
|
||||||
@@ -381,7 +381,7 @@ dependencies = [
|
|||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "cortex-gateway"
|
name = "cortex-gateway"
|
||||||
version = "0.1.12"
|
version = "0.1.16"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"anyhow",
|
"anyhow",
|
||||||
"axum",
|
"axum",
|
||||||
@@ -1184,7 +1184,7 @@ dependencies = [
|
|||||||
|
|
||||||
[[package]]
|
[[package]]
|
||||||
name = "neuron"
|
name = "neuron"
|
||||||
version = "0.1.12"
|
version = "0.1.16"
|
||||||
dependencies = [
|
dependencies = [
|
||||||
"anyhow",
|
"anyhow",
|
||||||
"async-trait",
|
"async-trait",
|
||||||
|
|||||||
@@ -8,7 +8,7 @@ members = [
|
|||||||
]
|
]
|
||||||
|
|
||||||
[workspace.package]
|
[workspace.package]
|
||||||
version = "0.1.12"
|
version = "0.1.16"
|
||||||
edition = "2024"
|
edition = "2024"
|
||||||
license = "GPL-3.0-or-later"
|
license = "GPL-3.0-or-later"
|
||||||
repository = "https://git.lair.cafe/helexa/cortex"
|
repository = "https://git.lair.cafe/helexa/cortex"
|
||||||
|
|||||||
@@ -88,8 +88,8 @@ WantedBy=multi-user.target
|
|||||||
```toml
|
```toml
|
||||||
# cortex.toml
|
# cortex.toml
|
||||||
[gateway]
|
[gateway]
|
||||||
listen = "0.0.0.0:8000"
|
listen = "0.0.0.0:31313"
|
||||||
metrics_listen = "0.0.0.0:9100"
|
metrics_listen = "0.0.0.0:31314"
|
||||||
|
|
||||||
[eviction]
|
[eviction]
|
||||||
strategy = "lru" # lru | priority
|
strategy = "lru" # lru | priority
|
||||||
@@ -143,7 +143,7 @@ cortex serve --config cortex.toml
|
|||||||
cortex status
|
cortex status
|
||||||
|
|
||||||
# list all models across nodes
|
# list all models across nodes
|
||||||
curl http://localhost:8000/v1/models
|
curl http://localhost:31313/v1/models
|
||||||
```
|
```
|
||||||
|
|
||||||
## License
|
## License
|
||||||
|
|||||||
@@ -3,11 +3,11 @@
|
|||||||
# Copy to cortex.toml and adjust for your environment.
|
# Copy to cortex.toml and adjust for your environment.
|
||||||
#
|
#
|
||||||
# Environment variable overrides use CORTEX_ prefix with __ separators:
|
# Environment variable overrides use CORTEX_ prefix with __ separators:
|
||||||
# CORTEX_GATEWAY__LISTEN=0.0.0.0:9000
|
# CORTEX_GATEWAY__LISTEN=0.0.0.0:31313
|
||||||
|
|
||||||
[gateway]
|
[gateway]
|
||||||
listen = "0.0.0.0:8000"
|
listen = "0.0.0.0:31313"
|
||||||
metrics_listen = "0.0.0.0:9100"
|
metrics_listen = "0.0.0.0:31314"
|
||||||
|
|
||||||
[eviction]
|
[eviction]
|
||||||
strategy = "lru"
|
strategy = "lru"
|
||||||
|
|||||||
15
cortex.spec
15
cortex.spec
@@ -1,5 +1,5 @@
|
|||||||
Name: cortex
|
Name: cortex
|
||||||
Version: 0.1.12
|
Version: 0.1.16
|
||||||
Release: 1%{?dist}
|
Release: 1%{?dist}
|
||||||
Summary: Inference gateway for multi-node GPU clusters
|
Summary: Inference gateway for multi-node GPU clusters
|
||||||
|
|
||||||
@@ -21,6 +21,7 @@ BuildRequires: systemd-rpm-macros
|
|||||||
|
|
||||||
Requires(pre): shadow-utils
|
Requires(pre): shadow-utils
|
||||||
Requires: systemd
|
Requires: systemd
|
||||||
|
Requires: firewalld-filesystem
|
||||||
|
|
||||||
# systemd-rpm-macros ships a unit dep generator that parses User=/Group=
|
# systemd-rpm-macros ships a unit dep generator that parses User=/Group=
|
||||||
# from our .service file and emits Requires: user(cortex)/group(cortex).
|
# from our .service file and emits Requires: user(cortex)/group(cortex).
|
||||||
@@ -56,6 +57,7 @@ cargo build --release -p cortex-cli
|
|||||||
install -Dm755 target/release/cortex %{buildroot}%{_bindir}/cortex
|
install -Dm755 target/release/cortex %{buildroot}%{_bindir}/cortex
|
||||||
install -Dm644 data/cortex.service %{buildroot}%{_unitdir}/cortex.service
|
install -Dm644 data/cortex.service %{buildroot}%{_unitdir}/cortex.service
|
||||||
install -Dm644 data/cortex-sysusers.conf %{buildroot}%{_sysusersdir}/cortex.conf
|
install -Dm644 data/cortex-sysusers.conf %{buildroot}%{_sysusersdir}/cortex.conf
|
||||||
|
install -Dm644 data/cortex-firewalld.xml %{buildroot}%{_prefix}/lib/firewalld/services/cortex.xml
|
||||||
install -dm755 %{buildroot}%{_sysconfdir}/cortex
|
install -dm755 %{buildroot}%{_sysconfdir}/cortex
|
||||||
install -Dm644 cortex.example.toml %{buildroot}%{_sysconfdir}/cortex/cortex.toml
|
install -Dm644 cortex.example.toml %{buildroot}%{_sysconfdir}/cortex/cortex.toml
|
||||||
install -Dm644 models.example.toml %{buildroot}%{_sysconfdir}/cortex/models.toml
|
install -Dm644 models.example.toml %{buildroot}%{_sysconfdir}/cortex/models.toml
|
||||||
@@ -78,10 +80,21 @@ install -Dm644 models.example.toml %{buildroot}%{_sysconfdir}/cortex/models.toml
|
|||||||
%{_bindir}/cortex
|
%{_bindir}/cortex
|
||||||
%{_unitdir}/cortex.service
|
%{_unitdir}/cortex.service
|
||||||
%{_sysusersdir}/cortex.conf
|
%{_sysusersdir}/cortex.conf
|
||||||
|
%{_prefix}/lib/firewalld/services/cortex.xml
|
||||||
%dir %{_sysconfdir}/cortex
|
%dir %{_sysconfdir}/cortex
|
||||||
%config(noreplace) %{_sysconfdir}/cortex/cortex.toml
|
%config(noreplace) %{_sysconfdir}/cortex/cortex.toml
|
||||||
%config(noreplace) %{_sysconfdir}/cortex/models.toml
|
%config(noreplace) %{_sysconfdir}/cortex/models.toml
|
||||||
|
|
||||||
%changelog
|
%changelog
|
||||||
|
* Thu Apr 16 2026 Gitea Actions <actions@git.lair.cafe> - 0.1.16-1
|
||||||
|
- chore: ignore local deploy script
|
||||||
|
- chore: move default ports out of common-collision ranges
|
||||||
|
- ci: drop actions/cache for cargo registry and target
|
||||||
|
|
||||||
|
* Thu Apr 16 2026 Gitea Actions <actions@git.lair.cafe> - 0.1.14-1
|
||||||
|
- ci: publish both packages to a single helexa/helexa COPR project
|
||||||
|
- fix(rpm): rename neuron package to helexa-neuron
|
||||||
|
- ci: commit generated %changelog entries back to main
|
||||||
|
|
||||||
* Wed Apr 15 2026 Rob Thijssen <grenade@rob.tn> - 0.1.0-1
|
* Wed Apr 15 2026 Rob Thijssen <grenade@rob.tn> - 0.1.0-1
|
||||||
- Initial package
|
- Initial package
|
||||||
|
|||||||
@@ -23,7 +23,7 @@ enum Commands {
|
|||||||
/// Print the fleet status (models, nodes, health).
|
/// Print the fleet status (models, nodes, health).
|
||||||
Status {
|
Status {
|
||||||
/// Gateway API endpoint to query.
|
/// Gateway API endpoint to query.
|
||||||
#[arg(short, long, default_value = "http://localhost:8000")]
|
#[arg(short, long, default_value = "http://localhost:31313")]
|
||||||
endpoint: String,
|
endpoint: String,
|
||||||
},
|
},
|
||||||
}
|
}
|
||||||
|
|||||||
@@ -22,9 +22,9 @@ fn default_models_path() -> String {
|
|||||||
|
|
||||||
#[derive(Debug, Clone, Serialize, Deserialize)]
|
#[derive(Debug, Clone, Serialize, Deserialize)]
|
||||||
pub struct GatewaySettings {
|
pub struct GatewaySettings {
|
||||||
/// Address to listen on for API requests (e.g. "0.0.0.0:8000")
|
/// Address to listen on for API requests (e.g. "0.0.0.0:31313")
|
||||||
pub listen: String,
|
pub listen: String,
|
||||||
/// Address to listen on for Prometheus metrics (e.g. "0.0.0.0:9100")
|
/// Address to listen on for Prometheus metrics (e.g. "0.0.0.0:31314")
|
||||||
pub metrics_listen: String,
|
pub metrics_listen: String,
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -50,7 +50,7 @@ pub enum EvictionStrategy {
|
|||||||
pub struct NeuronEndpoint {
|
pub struct NeuronEndpoint {
|
||||||
/// Human-readable node name (e.g. "beast")
|
/// Human-readable node name (e.g. "beast")
|
||||||
pub name: String,
|
pub name: String,
|
||||||
/// Base URL of the neuron daemon (e.g. "http://beast.internal:9090")
|
/// Base URL of the neuron daemon (e.g. "http://beast.internal:13131")
|
||||||
pub endpoint: String,
|
pub endpoint: String,
|
||||||
}
|
}
|
||||||
|
|
||||||
@@ -70,8 +70,8 @@ impl Default for GatewayConfig {
|
|||||||
fn default() -> Self {
|
fn default() -> Self {
|
||||||
Self {
|
Self {
|
||||||
gateway: GatewaySettings {
|
gateway: GatewaySettings {
|
||||||
listen: "0.0.0.0:8000".into(),
|
listen: "0.0.0.0:31313".into(),
|
||||||
metrics_listen: "0.0.0.0:9100".into(),
|
metrics_listen: "0.0.0.0:31314".into(),
|
||||||
},
|
},
|
||||||
eviction: EvictionSettings {
|
eviction: EvictionSettings {
|
||||||
strategy: EvictionStrategy::Lru,
|
strategy: EvictionStrategy::Lru,
|
||||||
|
|||||||
@@ -6,7 +6,7 @@ use std::collections::HashMap;
|
|||||||
#[derive(Debug, Clone)]
|
#[derive(Debug, Clone)]
|
||||||
pub struct NodeState {
|
pub struct NodeState {
|
||||||
pub name: String,
|
pub name: String,
|
||||||
/// Base URL of the neuron daemon (e.g. "http://beast.internal:9090").
|
/// Base URL of the neuron daemon (e.g. "http://beast.internal:13131").
|
||||||
pub endpoint: String,
|
pub endpoint: String,
|
||||||
pub healthy: bool,
|
pub healthy: bool,
|
||||||
pub models: HashMap<String, ModelEntry>,
|
pub models: HashMap<String, ModelEntry>,
|
||||||
|
|||||||
@@ -17,7 +17,7 @@ pub struct NeuronConfig {
|
|||||||
}
|
}
|
||||||
|
|
||||||
fn default_port() -> u16 {
|
fn default_port() -> u16 {
|
||||||
9090
|
13131
|
||||||
}
|
}
|
||||||
|
|
||||||
impl NeuronConfig {
|
impl NeuronConfig {
|
||||||
@@ -33,7 +33,7 @@ impl NeuronConfig {
|
|||||||
impl Default for NeuronConfig {
|
impl Default for NeuronConfig {
|
||||||
fn default() -> Self {
|
fn default() -> Self {
|
||||||
Self {
|
Self {
|
||||||
port: 9090,
|
port: 13131,
|
||||||
harnesses: vec![],
|
harnesses: vec![],
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|||||||
7
data/cortex-firewalld.xml
Normal file
7
data/cortex-firewalld.xml
Normal file
@@ -0,0 +1,7 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
|
||||||
|
<service>
|
||||||
|
<short>cortex</short>
|
||||||
|
<description>Cortex — inference gateway for multi-node GPU clusters</description>
|
||||||
|
<port protocol="tcp" port="31313"/>
|
||||||
|
<port protocol="tcp" port="31314"/>
|
||||||
|
</service>
|
||||||
6
data/neuron-firewalld.xml
Normal file
6
data/neuron-firewalld.xml
Normal file
@@ -0,0 +1,6 @@
|
|||||||
|
<?xml version="1.0" encoding="utf-8"?>
|
||||||
|
<service>
|
||||||
|
<short>helexa-neuron</short>
|
||||||
|
<description>Neuron — per-node GPU discovery and harness daemon for cortex</description>
|
||||||
|
<port protocol="tcp" port="13131"/>
|
||||||
|
</service>
|
||||||
@@ -1,5 +1,5 @@
|
|||||||
Name: helexa-neuron
|
Name: helexa-neuron
|
||||||
Version: 0.1.12
|
Version: 0.1.16
|
||||||
Release: 1%{?dist}
|
Release: 1%{?dist}
|
||||||
Summary: Per-node GPU discovery and harness management daemon for cortex
|
Summary: Per-node GPU discovery and harness management daemon for cortex
|
||||||
# Package name disambiguates from Fedora's existing "neuron" package
|
# Package name disambiguates from Fedora's existing "neuron" package
|
||||||
@@ -24,6 +24,7 @@ BuildRequires: systemd-rpm-macros
|
|||||||
|
|
||||||
Requires(pre): shadow-utils
|
Requires(pre): shadow-utils
|
||||||
Requires: systemd
|
Requires: systemd
|
||||||
|
Requires: firewalld-filesystem
|
||||||
|
|
||||||
# systemd-rpm-macros ships a unit dep generator that parses User=/Group=
|
# systemd-rpm-macros ships a unit dep generator that parses User=/Group=
|
||||||
# from our .service file and emits Requires: user(neuron)/group(neuron).
|
# from our .service file and emits Requires: user(neuron)/group(neuron).
|
||||||
@@ -58,6 +59,7 @@ cargo build --release -p neuron
|
|||||||
install -Dm755 target/release/neuron %{buildroot}%{_bindir}/neuron
|
install -Dm755 target/release/neuron %{buildroot}%{_bindir}/neuron
|
||||||
install -Dm644 data/neuron.service %{buildroot}%{_unitdir}/neuron.service
|
install -Dm644 data/neuron.service %{buildroot}%{_unitdir}/neuron.service
|
||||||
install -Dm644 data/neuron-sysusers.conf %{buildroot}%{_sysusersdir}/neuron.conf
|
install -Dm644 data/neuron-sysusers.conf %{buildroot}%{_sysusersdir}/neuron.conf
|
||||||
|
install -Dm644 data/neuron-firewalld.xml %{buildroot}%{_prefix}/lib/firewalld/services/helexa-neuron.xml
|
||||||
install -dm755 %{buildroot}%{_sysconfdir}/neuron
|
install -dm755 %{buildroot}%{_sysconfdir}/neuron
|
||||||
install -Dm644 neuron.example.toml %{buildroot}%{_sysconfdir}/neuron/neuron.toml
|
install -Dm644 neuron.example.toml %{buildroot}%{_sysconfdir}/neuron/neuron.toml
|
||||||
|
|
||||||
@@ -79,9 +81,20 @@ install -Dm644 neuron.example.toml %{buildroot}%{_sysconfdir}/neuron/neuron.toml
|
|||||||
%{_bindir}/neuron
|
%{_bindir}/neuron
|
||||||
%{_unitdir}/neuron.service
|
%{_unitdir}/neuron.service
|
||||||
%{_sysusersdir}/neuron.conf
|
%{_sysusersdir}/neuron.conf
|
||||||
|
%{_prefix}/lib/firewalld/services/helexa-neuron.xml
|
||||||
%dir %{_sysconfdir}/neuron
|
%dir %{_sysconfdir}/neuron
|
||||||
%config(noreplace) %{_sysconfdir}/neuron/neuron.toml
|
%config(noreplace) %{_sysconfdir}/neuron/neuron.toml
|
||||||
|
|
||||||
%changelog
|
%changelog
|
||||||
|
* Thu Apr 16 2026 Gitea Actions <actions@git.lair.cafe> - 0.1.16-1
|
||||||
|
- chore: ignore local deploy script
|
||||||
|
- chore: move default ports out of common-collision ranges
|
||||||
|
- ci: drop actions/cache for cargo registry and target
|
||||||
|
|
||||||
|
* Thu Apr 16 2026 Gitea Actions <actions@git.lair.cafe> - 0.1.14-1
|
||||||
|
- ci: publish both packages to a single helexa/helexa COPR project
|
||||||
|
- fix(rpm): rename neuron package to helexa-neuron
|
||||||
|
- ci: commit generated %changelog entries back to main
|
||||||
|
|
||||||
* Wed Apr 15 2026 Rob Thijssen <grenade@rob.tn> - 0.1.0-1
|
* Wed Apr 15 2026 Rob Thijssen <grenade@rob.tn> - 0.1.0-1
|
||||||
- Initial package
|
- Initial package
|
||||||
|
|||||||
@@ -3,9 +3,9 @@
|
|||||||
# Copy to /etc/neuron/neuron.toml and adjust for your environment.
|
# Copy to /etc/neuron/neuron.toml and adjust for your environment.
|
||||||
#
|
#
|
||||||
# Environment variable overrides use NEURON_ prefix with __ separators:
|
# Environment variable overrides use NEURON_ prefix with __ separators:
|
||||||
# NEURON_PORT=9090
|
# NEURON_PORT=13131
|
||||||
|
|
||||||
port = 9090
|
port = 13131
|
||||||
|
|
||||||
# -- Harnesses ---------------------------------------------------------------
|
# -- Harnesses ---------------------------------------------------------------
|
||||||
# Each [[harnesses]] entry declares an inference engine managed by neuron.
|
# Each [[harnesses]] entry declares an inference engine managed by neuron.
|
||||||
|
|||||||
Reference in New Issue
Block a user