fix(rpm): drop %attr(,,user) on config files to avoid dnf silent filter

Using %attr(,,cortex) / %attr(,,neuron) on config files caused rpm's auto-dep-generator to emit Requires: user(name) and group(name) on each package. When those Requires couldn't be resolved — whether due to sysusers Provides mismatches, missing GPG keys, or dnf5 cache state — dnf5 silently filtered the package out of the candidate set and reported "Nothing to do" rather than an unsatisfied-dep error. Adopt the pattern that already works reliably across our infra (grenade/monsoon): ship config files as default root:root with 0644 perms, don't declare user/group ownership in the rpm file list. systemd-sysusers still creates the service user via the shipped sysusers.d file; the service drops to that user at runtime via the User= directive in the unit. This removes the user(cortex)/user(neuron) Requires entirely, which is the root cause of the dnf5 filtering. File permission tightening can be reintroduced later — either via a separate secrets file with different mode bits, or by moving secret material to /var/lib/<svc>/ where the service drop-privileges account already has write access. Co-Authored-By: Claude Opus 4.6 (1M context) <noreply@anthropic.com>
2026-04-16 14:33:08 +03:00
13 changed files with 69 additions and 124 deletions
--- a/.gitea/workflows/ci.yml
+++ b/.gitea/workflows/ci.yml
@@ -24,6 +24,19 @@ jobs:
    steps:
      - uses: actions/checkout@v4

+      - name: Cache cargo registry and target
+        uses: actions/cache@v4
+        with:
+          path: |
+            ~/.cargo/bin
+            ~/.cargo/registry/index
+            ~/.cargo/registry/cache
+            ~/.cargo/git/db
+            target
+          key: ${{ runner.os }}-cargo-${{ hashFiles('**/Cargo.lock') }}
+          restore-keys: |
+            ${{ runner.os }}-cargo-
+
      - name: Ensure sccache with S3 support
        env:
          RUSTC_WRAPPER: ""
@@ -53,8 +66,6 @@ jobs:
    if: startsWith(github.ref, 'refs/tags/v')
    steps:
      - uses: actions/checkout@v4
-        with:
-          fetch-depth: 0

      - name: Determine version
        id: version
@@ -68,12 +79,6 @@ jobs:
          sed -i '/\[workspace\.package\]/,/\[/{ s/^version = ".*"/version = "'"${VERSION}"'"/ }' Cargo.toml
          sed -i "s/^Version:.*/Version:        ${VERSION}/" cortex.spec

-      - name: Generate changelog entry
-        uses: https://git.lair.cafe/actions/rpm-changelog@v1
-        with:
-          spec: cortex.spec
-          version: ${{ steps.version.outputs.VERSION }}
-
      - name: Generate source tarball
        run: |
          set -ex
@@ -113,8 +118,6 @@ jobs:
    if: startsWith(github.ref, 'refs/tags/v')
    steps:
      - uses: actions/checkout@v4
-        with:
-          fetch-depth: 0

      - name: Determine version
        id: version
@@ -126,37 +129,31 @@ jobs:
        run: |
          VERSION="${{ steps.version.outputs.VERSION }}"
          sed -i '/\[workspace\.package\]/,/\[/{ s/^version = ".*"/version = "'"${VERSION}"'"/ }' Cargo.toml
-          sed -i "s/^Version:.*/Version:        ${VERSION}/" helexa-neuron.spec
-
-      - name: Generate changelog entry
-        uses: https://git.lair.cafe/actions/rpm-changelog@v1
-        with:
-          spec: helexa-neuron.spec
-          version: ${{ steps.version.outputs.VERSION }}
+          sed -i "s/^Version:.*/Version:        ${VERSION}/" neuron.spec

      - name: Generate source tarball
        run: |
          set -ex
          VERSION="${{ steps.version.outputs.VERSION }}"
-          tar czf /tmp/helexa-neuron-${VERSION}.tar.gz \
-            --transform "s,^\.,helexa-neuron-${VERSION}," \
+          tar czf /tmp/neuron-${VERSION}.tar.gz \
+            --transform "s,^\.,neuron-${VERSION}," \
            --exclude='./target' \
            --exclude='./.git' \
            --exclude='*.tar.gz' \
            --exclude='*.src.rpm' \
            .
-          mv /tmp/helexa-neuron-${VERSION}.tar.gz .
+          mv /tmp/neuron-${VERSION}.tar.gz .

      - name: Vendor Rust dependencies
        run: |
          VERSION="${{ steps.version.outputs.VERSION }}"
          cargo vendor vendor/
-          tar czf helexa-neuron-${VERSION}-vendor.tar.gz vendor/
+          tar czf neuron-${VERSION}-vendor.tar.gz vendor/
          rm -rf vendor/

      - name: Build SRPM
        run: |
-          rpmbuild -bs helexa-neuron.spec \
+          rpmbuild -bs neuron.spec \
            --define "_sourcedir $(pwd)" \
            --define "_srcrpmdir $(pwd)"

@@ -179,7 +176,7 @@ jobs:
      - name: Publish to COPR
        uses: https://git.lair.cafe/actions/copr-publish@v1
        with:
-          project: helexa/helexa
+          project: helexa/cortex
          srpm: "*.src.rpm"
          copr-config: ${{ secrets.COPR_CONFIG }}

@@ -196,7 +193,7 @@ jobs:
      - name: Publish to COPR
        uses: https://git.lair.cafe/actions/copr-publish@v1
        with:
-          project: helexa/helexa
+          project: helexa/neuron
          srpm: "*.src.rpm"
          copr-config: ${{ secrets.COPR_CONFIG }}

@@ -206,43 +203,21 @@ jobs:
    needs: [copr-cortex, copr-neuron]
    steps:
      - uses: actions/checkout@v4
-        with:
-          fetch-depth: 0

-      - name: Determine version
-        id: version
-        run: echo "VERSION=${GITHUB_REF#refs/tags/v}" >> "$GITHUB_OUTPUT"
-
-      - name: Stamp version
-        run: |
-          VERSION="${{ steps.version.outputs.VERSION }}"
-          sed -i '/\[workspace\.package\]/,/\[/{ s/^version = ".*"/version = "'"${VERSION}"'"/ }' Cargo.toml
-          sed -i "s/^Version:.*/Version:        ${VERSION}/" cortex.spec
-          sed -i "s/^Version:.*/Version:        ${VERSION}/" helexa-neuron.spec
-          cargo check --workspace 2>/dev/null || true
-
-      - name: Generate cortex changelog entry
-        uses: https://git.lair.cafe/actions/rpm-changelog@v1
-        with:
-          spec: cortex.spec
-          version: ${{ steps.version.outputs.VERSION }}
-
-      - name: Generate helexa-neuron changelog entry
-        uses: https://git.lair.cafe/actions/rpm-changelog@v1
-        with:
-          spec: helexa-neuron.spec
-          version: ${{ steps.version.outputs.VERSION }}
-
-      - name: Commit and push
+      - name: Stamp version and push
        env:
          GITEA_TOKEN: ${{ secrets.GITEA_TOKEN }}
        run: |
-          VERSION="${{ steps.version.outputs.VERSION }}"
+          VERSION="${GITHUB_REF#refs/tags/v}"
+          sed -i '/\[workspace\.package\]/,/\[/{ s/^version = ".*"/version = "'"${VERSION}"'"/ }' Cargo.toml
+          sed -i "s/^Version:.*/Version:        ${VERSION}/" cortex.spec
+          sed -i "s/^Version:.*/Version:        ${VERSION}/" neuron.spec
+          cargo check --workspace 2>/dev/null || true
          git config user.name "Gitea Actions"
          git config user.email "actions@git.lair.cafe"
-          git add Cargo.toml Cargo.lock cortex.spec helexa-neuron.spec
+          git add Cargo.toml Cargo.lock cortex.spec neuron.spec
          if git diff --cached --quiet; then
-            echo "Nothing to commit for ${VERSION}"
+            echo "Version already at ${VERSION}"
          else
            git commit -m "chore: bump version to ${VERSION}"
            git remote set-url origin "https://gitea-actions:${GITEA_TOKEN}@git.lair.cafe/helexa/cortex.git"
--- a/CLAUDE.md
+++ b/CLAUDE.md
@@ -125,8 +125,7 @@ automatically. Clippy warnings must be resolved, not suppressed with
  - One or more GPU nodes running mistral.rs on port 8080
  - Optionally a metrics-only node (no GPU) for Prometheus/Grafana
 - Each node runs `mistralrs serve` on port 8080
- Gateway listens on port 31313 (API) and 31314 (metrics)
- neuron listens on port 13131 on each GPU host
+- Gateway listens on port 8000 (API) and 9100 (metrics)
 - TLS terminated at gateway or via nginx; internal traffic is plaintext over WireGuard

 ## Conventions
@@ -381,7 +380,7 @@ processes (one process per loaded model, each on its own port).

 ## neuron API

-neuron exposes an HTTP API on port 13131 that cortex polls and calls.
+neuron exposes an HTTP API on port 9090 that cortex polls and calls.

 ```
 GET  /discovery
@@ -425,8 +424,8 @@ endpoint. cortex.toml shrinks to:

 ```toml
 [gateway]
-listen = "0.0.0.0:31313"
-metrics_listen = "0.0.0.0:31314"
+listen = "0.0.0.0:8000"
+metrics_listen = "0.0.0.0:9100"

 [eviction]
 strategy = "lru"
@@ -434,15 +433,15 @@ defrag_after_cycles = 50

 [[neurons]]
 name = "beast"
-endpoint = "http://beast.hanzalova.internal:13131"
+endpoint = "http://beast.hanzalova.internal:9090"

 [[neurons]]
 name = "benjy"
-endpoint = "http://benjy.hanzalova.internal:13131"
+endpoint = "http://benjy.kosherinata.internal:9090"

 [[neurons]]
 name = "quadbrat"
-endpoint = "http://quadbrat.hanzalova.internal:13131"
+endpoint = "http://quadbrat.hanzalova.internal:9090"
 ```

 On startup and periodically, cortex calls `GET /discovery` and
@@ -522,7 +521,7 @@ cortex/
 │   │       └── metrics.rs      # prometheus exporter (unchanged)
 │   ├── neuron/                 # node plane (replaces cortex-agent)
 │   │   └── src/
-│   │       ├── main.rs         # binary entrypoint, axum server on :13131
+│   │       ├── main.rs         # binary entrypoint, axum server on :9090
 │   │       ├── discovery.rs    # nvidia-smi, device enumeration
 │   │       ├── health.rs       # runtime GPU polling
 │   │       ├── api.rs          # HTTP handlers for /discovery, /models, etc.
@@ -596,24 +595,16 @@ placement matching can be added incrementally.
 Completed. Both packages have RPM specs, systemd units, and example configs.
 CI builds parallel SRPMs on tag push and publishes to separate COPR repos.

- `cortex.spec` — installs the `cortex` binary. Package name keeps the
-  short `cortex` because no Fedora package collides with it.
- `helexa-neuron.spec` — installs the `neuron` binary under package name
-  `helexa-neuron`. Renamed from bare `neuron` to avoid collision with
-  Fedora's NEURON neural-simulation package
-  (https://src.fedoraproject.org/rpms/neuron); binary, systemd unit,
-  system user, and config dir all stay named `neuron` since those are
-  project-local contexts.
+- `cortex.spec` → `helexa/cortex` COPR: binary, systemd unit, config files
+- `neuron.spec` → `helexa/neuron` COPR: binary, systemd unit, config
 - `data/cortex.service`, `data/neuron.service` — systemd units
 - `cortex.example.toml`, `neuron.example.toml`, `models.example.toml`
- CI: parallel `srpm-cortex` + `srpm-neuron` jobs, then parallel COPR
-  publish to a single project `helexa/helexa` hosting both packages.
+- CI: parallel `srpm-cortex` + `srpm-neuron` jobs, then parallel COPR publish

 Install:
 ```sh
-dnf copr enable helexa/helexa
-dnf install cortex                # gateway host
-dnf install helexa-neuron         # GPU nodes
+dnf copr enable helexa/cortex && dnf install cortex    # gateway host
+dnf copr enable helexa/neuron && dnf install neuron    # GPU nodes
 ```

 ### Phase 11: llama.cpp harness stub
--- a/Cargo.lock
+++ b/Cargo.lock
@@ -351,7 +351,7 @@ checksum = "773648b94d0e5d620f64f280777445740e61fe701025087ec8b57f45c791888b"

 [[package]]
 name = "cortex-cli"
-version = "0.1.12"
+version = "0.1.7"
 dependencies = [
 "anyhow",
 "clap",
@@ -366,7 +366,7 @@ dependencies = [

 [[package]]
 name = "cortex-core"
-version = "0.1.12"
+version = "0.1.7"
 dependencies = [
 "anyhow",
 "async-trait",
@@ -381,7 +381,7 @@ dependencies = [

 [[package]]
 name = "cortex-gateway"
-version = "0.1.12"
+version = "0.1.7"
 dependencies = [
 "anyhow",
 "axum",
@@ -1184,7 +1184,7 @@ dependencies = [

 [[package]]
 name = "neuron"
-version = "0.1.12"
+version = "0.1.7"
 dependencies = [
 "anyhow",
 "async-trait",
--- a/Cargo.toml
+++ b/Cargo.toml
@@ -8,7 +8,7 @@ members = [
 ]

 [workspace.package]
-version = "0.1.12"
+version = "0.1.7"
 edition = "2024"
 license = "GPL-3.0-or-later"
 repository = "https://git.lair.cafe/helexa/cortex"
--- a/README.md
+++ b/README.md
@@ -88,8 +88,8 @@ WantedBy=multi-user.target
 ```toml
 # cortex.toml
 [gateway]
-listen = "0.0.0.0:31313"
-metrics_listen = "0.0.0.0:31314"
+listen = "0.0.0.0:8000"
+metrics_listen = "0.0.0.0:9100"

 [eviction]
 strategy = "lru"        # lru | priority
@@ -143,7 +143,7 @@ cortex serve --config cortex.toml
 cortex status

 # list all models across nodes
-curl http://localhost:31313/v1/models
+curl http://localhost:8000/v1/models
 ```

 ## License
--- a/cortex.example.toml
+++ b/cortex.example.toml
@@ -3,11 +3,11 @@
 # Copy to cortex.toml and adjust for your environment.
 #
 # Environment variable overrides use CORTEX_ prefix with __ separators:
-#   CORTEX_GATEWAY__LISTEN=0.0.0.0:31313
+#   CORTEX_GATEWAY__LISTEN=0.0.0.0:9000

 [gateway]
-listen = "0.0.0.0:31313"
-metrics_listen = "0.0.0.0:31314"
+listen = "0.0.0.0:8000"
+metrics_listen = "0.0.0.0:9100"

 [eviction]
 strategy = "lru"
--- a/cortex.spec
+++ b/cortex.spec
@@ -1,5 +1,5 @@
 Name:           cortex
-Version:        0.1.12
+Version:        0.1.7
 Release:        1%{?dist}
 Summary:        Inference gateway for multi-node GPU clusters

@@ -22,15 +22,6 @@ BuildRequires:  systemd-rpm-macros
 Requires(pre):  shadow-utils
 Requires:       systemd

-# systemd-rpm-macros ships a unit dep generator that parses User=/Group=
-# from our .service file and emits Requires: user(cortex)/group(cortex).
-# rpm's sysusers provides-generator emits the unversioned form for groups
-# but only a versioned user(cortex) = <base64> for users with GECOS/home/
-# shell. Provide the unversioned user(cortex) explicitly so dnf can resolve
-# the auto-generated Requires. Without this, dnf5 silently filters the
-# package and reports "Nothing to do".
-Provides:       user(cortex)
-
 %description
 Cortex is a Rust reverse-proxy that sits in front of multiple inference
 nodes (via neuron daemons) and presents a unified OpenAI and Anthropic
@@ -83,5 +74,5 @@ install -Dm644 models.example.toml %{buildroot}%{_sysconfdir}/cortex/models.toml
 %config(noreplace) %{_sysconfdir}/cortex/models.toml

 %changelog
-* Wed Apr 15 2026 Rob Thijssen <grenade@rob.tn> - 0.1.0-1
+* Tue Apr 15 2026 Rob Thijssen <grenade@rob.tn> - 0.1.0-1
 - Initial package
--- a/crates/cortex-cli/src/main.rs
+++ b/crates/cortex-cli/src/main.rs
@@ -23,7 +23,7 @@ enum Commands {
    /// Print the fleet status (models, nodes, health).
    Status {
        /// Gateway API endpoint to query.
-        #[arg(short, long, default_value = "http://localhost:31313")]
+        #[arg(short, long, default_value = "http://localhost:8000")]
        endpoint: String,
    },
 }
--- a/crates/cortex-core/src/config.rs
+++ b/crates/cortex-core/src/config.rs
@@ -22,9 +22,9 @@ fn default_models_path() -> String {

 #[derive(Debug, Clone, Serialize, Deserialize)]
 pub struct GatewaySettings {
-    /// Address to listen on for API requests (e.g. "0.0.0.0:31313")
+    /// Address to listen on for API requests (e.g. "0.0.0.0:8000")
    pub listen: String,
-    /// Address to listen on for Prometheus metrics (e.g. "0.0.0.0:31314")
+    /// Address to listen on for Prometheus metrics (e.g. "0.0.0.0:9100")
    pub metrics_listen: String,
 }

@@ -50,7 +50,7 @@ pub enum EvictionStrategy {
 pub struct NeuronEndpoint {
    /// Human-readable node name (e.g. "beast")
    pub name: String,
-    /// Base URL of the neuron daemon (e.g. "http://beast.internal:13131")
+    /// Base URL of the neuron daemon (e.g. "http://beast.internal:9090")
    pub endpoint: String,
 }

@@ -70,8 +70,8 @@ impl Default for GatewayConfig {
    fn default() -> Self {
        Self {
            gateway: GatewaySettings {
-                listen: "0.0.0.0:31313".into(),
-                metrics_listen: "0.0.0.0:31314".into(),
+                listen: "0.0.0.0:8000".into(),
+                metrics_listen: "0.0.0.0:9100".into(),
            },
            eviction: EvictionSettings {
                strategy: EvictionStrategy::Lru,
--- a/crates/cortex-core/src/node.rs
+++ b/crates/cortex-core/src/node.rs
@@ -6,7 +6,7 @@ use std::collections::HashMap;
 #[derive(Debug, Clone)]
 pub struct NodeState {
    pub name: String,
-    /// Base URL of the neuron daemon (e.g. "http://beast.internal:13131").
+    /// Base URL of the neuron daemon (e.g. "http://beast.internal:9090").
    pub endpoint: String,
    pub healthy: bool,
    pub models: HashMap<String, ModelEntry>,
--- a/crates/neuron/src/config.rs
+++ b/crates/neuron/src/config.rs
@@ -17,7 +17,7 @@ pub struct NeuronConfig {
 }

 fn default_port() -> u16 {
-    13131
+    9090
 }

 impl NeuronConfig {
@@ -33,7 +33,7 @@ impl NeuronConfig {
 impl Default for NeuronConfig {
    fn default() -> Self {
        Self {
-            port: 13131,
+            port: 9090,
            harnesses: vec![],
        }
    }
--- a/neuron.example.toml
+++ b/neuron.example.toml
@@ -3,9 +3,9 @@
 # Copy to /etc/neuron/neuron.toml and adjust for your environment.
 #
 # Environment variable overrides use NEURON_ prefix with __ separators:
-#   NEURON_PORT=13131
+#   NEURON_PORT=9090

-port = 13131
+port = 9090

 # -- Harnesses ---------------------------------------------------------------
 # Each [[harnesses]] entry declares an inference engine managed by neuron.
--- a/helexa-neuron.spec
+++ b/helexa-neuron.spec
@@ -1,10 +1,7 @@
-Name:           helexa-neuron
-Version:        0.1.12
+Name:           neuron
+Version:        0.1.7
 Release:        1%{?dist}
 Summary:        Per-node GPU discovery and harness management daemon for cortex
-# Package name disambiguates from Fedora's existing "neuron" package
-# (NEURON neural simulation environment from Yale). Binary, systemd
-# unit, and system user are still called "neuron" for brevity.

 License:        GPL-3.0-or-later
 URL:            https://git.lair.cafe/helexa/cortex
@@ -25,15 +22,6 @@ BuildRequires:  systemd-rpm-macros
 Requires(pre):  shadow-utils
 Requires:       systemd

-# systemd-rpm-macros ships a unit dep generator that parses User=/Group=
-# from our .service file and emits Requires: user(neuron)/group(neuron).
-# rpm's sysusers provides-generator emits the unversioned form for groups
-# but only a versioned user(neuron) = <base64> for users with GECOS/home/
-# shell. Provide the unversioned user(neuron) explicitly so dnf can resolve
-# the auto-generated Requires. Without this, dnf5 silently filters the
-# package and reports "Nothing to do".
-Provides:       user(neuron)
-
 %description
 Neuron is a per-node daemon for cortex inference clusters. It discovers
 local GPU hardware via nvidia-smi, manages inference harnesses (mistral.rs,
@@ -83,5 +71,5 @@ install -Dm644 neuron.example.toml %{buildroot}%{_sysconfdir}/neuron/neuron.toml
 %config(noreplace) %{_sysconfdir}/neuron/neuron.toml

 %changelog
-* Wed Apr 15 2026 Rob Thijssen <grenade@rob.tn> - 0.1.0-1
+* Tue Apr 15 2026 Rob Thijssen <grenade@rob.tn> - 0.1.0-1
 - Initial package