Compare commits

..

20 Commits

Author SHA1 Message Date
renovate-bot 05b3c8f279 Update Helm release rabbitmq to v16
renovate/stability-days Updates have met minimum release age requirement
2026-03-17 14:57:30 +00:00
mrtz b39b3aefc8 fix(cilium): Disable clustermesh again 2026-03-17 13:00:55 +01:00
mrtz a9c658466f feat(cilium): Enable clustermesh 2026-03-17 10:56:43 +01:00
mrtz 730dc2b865 Add kueuectl via nix 2026-03-17 10:14:18 +01:00
mrtz 5eea620225 fix(kueue): Cohort is deprecated 2026-03-16 15:24:21 +01:00
mrtz 863c242a50 fix(kueue): Remove alpha and beta features 2026-03-16 15:22:40 +01:00
mrtz 1cf2303c62 fix(kueue): Use cert-manager 2026-03-16 15:21:46 +01:00
mrtz 81e6823f3d fix(kueue): Disable internal cert 2026-03-16 15:17:52 +01:00
mrtz 2f2d6c1b70 fix(kueue): Bump CRDs 2026-03-16 15:12:11 +01:00
mrtz c99ed29e62 fix(kueue): Wrong crd 2026-03-16 15:09:12 +01:00
mrtz 7eda27cdd6 fix(kueue): Add sync-wave hooks 2026-03-16 15:05:10 +01:00
mrtz bf6542398c fix(kueue): Correct repo 2026-03-16 14:59:17 +01:00
mrtz be7954d499 feat: Add Kueue and JobSet to ekman 2026-03-16 14:52:43 +01:00
mrtz cc8a121bf6 chore: Bump velero to bitnami free version 2026-03-16 10:32:54 +01:00
Gitea Actions 88d21ba674 ci(staging): deploy docs 0d279bb9-debug 2026-03-15 19:45:40 +00:00
Gitea Actions 1eb5249f64 ci(staging): deploy docs 8d2cafc0-debug 2026-03-15 17:35:07 +00:00
Gitea Actions 3ee37fc0f7 ci(staging): deploy docs 1a0619f9-debug 2026-03-15 15:48:21 +00:00
renovate-bot ea4d9f3003 Update Helm release kube-prometheus-stack to v82.10.3 2026-03-15 08:49:11 +00:00
renovate-bot 4566ac7c28 Update Helm release openfga to v0.2.56 2026-03-15 08:47:57 +00:00
renovate-bot c13d4519bd Update Helm release umami to v7.7.3 2026-03-15 00:03:38 +00:00
21 changed files with 116 additions and 176 deletions
+1 -1
View File
@@ -8,7 +8,7 @@ releases:
- name: kueue
namespace: kueue-system
chart: oci://registry.k8s.io/kueue/charts/kueue
version: 0.15.0
version: 0.16.2
condition: kueue.enabled
values:
- ../values/kueue/values/values.yaml
+1 -1
View File
@@ -16,7 +16,7 @@ releases:
namespace: {{ .Environment.Name }}-openfga
{{- end }}
chart: openfga/openfga
version: 0.2.55
version: 0.2.56
condition: openfga.enabled
values:
- ../values/openfga/values/values.yaml
+1 -1
View File
@@ -15,7 +15,7 @@ releases:
- name: prometheus
namespace: prometheus
chart: prometheus/kube-prometheus-stack
version: 82.10.1
version: 82.10.3
condition: prometheus.enabled
values:
- ../values/prometheus/values/prometheus.yaml.gotmpl
+1 -1
View File
@@ -14,7 +14,7 @@ releases:
- name: umami
namespace: analytics
chart: umami/umami
version: 7.7.2
version: 7.7.3
condition: umami.enabled
values:
- ../values/umami/values/values.yaml
+1 -1
View File
@@ -15,7 +15,7 @@ releases:
- name: velero
namespace: velero
chart: velero/velero
version: 11.4.0
version: 12.0.0
condition: velero.enabled
values:
- ../values/velero/values/velero.yaml.gotmpl
+19
View File
@@ -0,0 +1,19 @@
# Nix package for the kueuectl CLI, built from the kubernetes-sigs/kueue sources.
# Written as a function so it can be instantiated with `pkgs.callPackage`,
# which supplies the two arguments below.
{
buildGoModule,
fetchFromGitHub,
}:
# `rec` allows `rev` below to refer to `version`.
buildGoModule rec {
pname = "kueuectl";
# NOTE(review): the kueue Helm release in this changeset is pinned to 0.16.2 --
# confirm the CLI/controller version skew is intended.
version = "0.16.3";
src = fetchFromGitHub {
owner = "kubernetes-sigs";
repo = "kueue";
# The source is fetched at the Git ref "v<version>".
rev = "v${version}";
# Content hash pinning the fetched source; must be refreshed whenever
# `version` changes.
hash = "sha256-JbU+ZoQ+YriaiIbbVCe45OTYycxYRanLhmQAdpE+xQ4=";
};
# No Go-module hash is pinned here; presumably this relies on a vendor/
# directory shipped in the upstream repository -- confirm against the
# nixpkgs buildGoModule documentation.
vendorHash = null;
# Restrict the build to the kueuectl command instead of every package in
# the repository.
subPackages = [ "cmd/kueuectl" ];
}
+3 -1
View File
@@ -7,6 +7,7 @@ let
overlays = [ ];
};
treefmt = import ./nix/treefmt.nix { };
kueuectl = pkgs.callPackage ./nix/kueuectl.nix { };
in
pkgs.mkShellNoCC {
packages = [
@@ -27,6 +28,7 @@ pkgs.mkShellNoCC {
pkgs.kubectl-rook-ceph
# other tools activate when needed
kueuectl
# pkgs.step-cli
# pkgs.linkerd
# pkgs.cmctl
@@ -40,7 +42,7 @@ pkgs.mkShellNoCC {
];
# Environment variables
ARGOCD_ENV_CLUSTER_NAME = "hel1";
ARGOCD_ENV_CLUSTER_NAME = "ekman";
HELM_GIT_ACCESS_TOKEN = "glpat-xxx";
API_SERVER_IP = "localhost";
API_SERVER_PORT = "7445";
+6 -3
View File
@@ -1,8 +1,11 @@
cilium:
enabled: true
# WireGuard cannot be used during migration -- Flannel nodes have no WireGuard
# keys so encrypted traffic is unreadable by them.
# TODO: re-enable after migration
clustermesh:
enabled: false
clusterId: 2
# NodePort until L2LB is available (kubeproxyless)
apiserverServiceType: NodePort
# TODO: WireGuard blocks all traffic on ekman -- disable until root cause is found.
encryption:
enabled: false
envoy:
+3
View File
@@ -1,5 +1,8 @@
cilium:
enabled: true
clustermesh:
enabled: false
clusterId: 1
nodePort:
enabled: true
l2announcement:
+4
View File
@@ -30,4 +30,8 @@ cilium:
loadbalancerPool:
enabled: false
cidr: []
clustermesh:
enabled: false
clusterId: 0
apiserverServiceType: LoadBalancer
cluster: {{ requiredEnv "ARGOCD_ENV_CLUSTER_NAME" }}
+14 -1
View File
@@ -1,3 +1,16 @@
cluster:
name: {{ .Values.cilium.cluster }}
id: {{ .Values.cilium.clustermesh.clusterId }}
{{- if .Values.cilium.clustermesh.enabled }}
clustermesh:
useAPIServer: true
apiserver:
service:
type: {{ .Values.cilium.clustermesh.apiserverServiceType }}
tls:
auto:
method: helm
{{- end }}
authentication:
mutual:
spire:
@@ -90,7 +103,7 @@ operator:
prometheus:
enabled: true
port: 12301
serviceMointor:
serviceMonitor:
enabled: true
port: 12302
rollOutPods: true
+1 -1
View File
@@ -1,6 +1,6 @@
replicaCount: 1
image:
tag: "e9fd3fc6-debug"
tag: "0d279bb9-debug"
env:
- name: APP_VERSION
value: "0.0.0"
+1 -1
View File
@@ -38,7 +38,7 @@ spec:
- group: ""
kind: Secret
name: jobset-webhook-server-cert
namespace: default
namespace: jobset-system
jsonPointers:
- /data
{{- end }}
-3
View File
@@ -1,3 +0,0 @@
kueue:
enabled: true
autosync: false
+47 -30
View File
@@ -1,51 +1,68 @@
apiVersion: kueue.x-k8s.io/v1beta1
apiVersion: kueue.x-k8s.io/v1beta2
kind: ResourceFlavor
metadata:
name: compute # Just needs to exist, can be managed with taints/tolerations
name: compute # Just needs to exist, can be managed with taints/tolerations
annotations:
argocd.argoproj.io/sync-wave: "2"
spec:
nodeLabels:
node-role.kubernetes.io/compute: compute
topology.kubernetes.io/group: c1 # Only run on C1 for now
---
apiVersion: kueue.x-k8s.io/v1beta1
apiVersion: kueue.x-k8s.io/v1beta2
kind: ClusterQueue
metadata:
name: jobs
name: cluster-queue
annotations:
argocd.argoproj.io/sync-wave: "2"
spec:
cohort: general
namespaceSelector: {} # Accept workloads from any namespace
preemption:
withinClusterQueue: "LowerPriority" # Allow higher priority to preempt lower
queueingStrategy: BestEffortFIFO
# preemption:
# withinClusterQueue: "LowerPriority" # Allow higher priority to preempt lower
resourceGroups:
- coveredResources: ["cpu", "memory"] # Cover both memory and cpu resources
flavors:
- name: compute
resources:
- name: "cpu"
nominalQuota: '4'
nominalQuota: '32'
- name: "memory"
nominalQuota: 8Gi
nominalQuota: 64Gi
# ---
# apiVersion: kueue.x-k8s.io/v1beta2
# kind: LocalQueue
# metadata:
# name: prod-queue
# namespace: prod-queue
# spec:
# clusterQueue: cluster-queue
---
apiVersion: kueue.x-k8s.io/v1beta1
kind: LocalQueue
apiVersion: v1
kind: Namespace
metadata:
name: prod-queue
namespace: prod-sorcerer
spec:
clusterQueue: jobs
name: dev-queue
annotations:
argocd.argoproj.io/sync-wave: "2"
---
apiVersion: kueue.x-k8s.io/v1beta1
apiVersion: kueue.x-k8s.io/v1beta2
kind: LocalQueue
metadata:
name: staging-queue
namespace: staging-sorcerer
namespace: dev-queue
annotations:
argocd.argoproj.io/sync-wave: "2"
spec:
clusterQueue: jobs
---
apiVersion: kueue.x-k8s.io/v1beta1
kind: WorkloadPriorityClass
metadata:
name: "normal"
value: 100
---
apiVersion: kueue.x-k8s.io/v1beta1
kind: WorkloadPriorityClass
metadata:
name: "high"
value: 200 # Higher value = higher priority
clusterQueue: cluster-queue
# ---
# apiVersion: kueue.x-k8s.io/v1beta2
# kind: WorkloadPriorityClass
# metadata:
# name: "normal"
# value: 100
# ---
# apiVersion: kueue.x-k8s.io/v1beta2
# kind: WorkloadPriorityClass
# metadata:
# name: "high"
# value: 200 # Higher value = higher priority
-89
View File
@@ -1,89 +0,0 @@
{{- if eq .Values.clusterConfig.cluster "ekman"}}
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
name: kueueviz-ingress
namespace: kueue-system
annotations:
cert-manager.io/cluster-issuer: ca-issuer
nginx.ingress.kubernetes.io/backend-protocol: HTTP
nginx.ingress.kubernetes.io/proxy-buffer-size: 128k
nginx.ingress.kubernetes.io/proxy-read-timeout: "3600"
nginx.ingress.kubernetes.io/proxy-send-timeout: "3600"
nginx.ingress.kubernetes.io/ssl-passthrough: "true"
nginx.ingress.kubernetes.io/ssl-redirect: "true"
nginx.ingress.kubernetes.io/websocket-services: kueue-kueueviz-backend
spec:
rules:
- host: kueue.dev.tos.obx
http:
paths:
- path: /ws
pathType: Prefix
backend:
service:
name: kueue-kueueviz-backend
port:
number: 8080
- path: /api(/|$)(.*)
pathType: Prefix
backend:
service:
name: kueue-kueueviz-backend
port:
number: 8080
- path: /
pathType: Prefix
backend:
service:
name: kueue-kueueviz-frontend
port:
number: 8080
tls:
- hosts:
- kueue.dev.tos.obx
secretName: kueueviz-tls
{{- end}}
---
{{- if eq .Values.clusterConfig.cluster "rossby"}}
apiVersion: networking.k8s.io/v1
kind: Ingress
metadata:
name: kueueviz-ingress
namespace: kueue-system
annotations:
cert-manager.io/cluster-issuer: ca-issuer
nginx.ingress.kubernetes.io/websocket-services: kueue-kueueviz-backend
nginx.ingress.kubernetes.io/proxy-read-timeout: "3600"
nginx.ingress.kubernetes.io/proxy-send-timeout: "3600"
spec:
rules:
- host: kueue.dev.vtn.obx
http:
paths:
- path: /ws
pathType: Prefix
backend:
service:
name: kueue-kueueviz-backend
port:
number: 8080
- path: /api(/|$)(.*)
pathType: Prefix
backend:
service:
name: kueue-kueueviz-backend
port:
number: 8080
- path: /
pathType: Prefix
backend:
service:
name: kueue-kueueviz-frontend
port:
number: 8080
tls:
- hosts:
- kueue.dev.vtn.obx
secretName: kueueviz-tls
{{- end}}
+2 -2
View File
@@ -5,6 +5,7 @@ metadata:
name: kueue
namespace: argocd
annotations:
argocd.argoproj.io/sync-wave: "1"
argocd.argoproj.io/sync-options: SkipDryRunOnMissingResource=true
argocd.argoproj.io/compare-options: ServerSideDiff=true
finalizers:
@@ -27,7 +28,7 @@ spec:
value: {{ .Values.kueue.env }}
- name: HELMFILE_FILE_PATH
value: kueue.yaml.gotmpl
- repoURL: https://gitlab.com/oceanbox/manifests.git
- repoURL: {{ .Values.clusterConfig.manifests }}
targetRevision: main
ref: values
syncPolicy:
@@ -41,4 +42,3 @@ spec:
selfHeal: false
{{- end }}
{{- end }}
-9
View File
@@ -1,9 +0,0 @@
kueueViz:
backend:
env:
- name: KUEUEVIZ_ALLOWED_ORIGINS
value: "https://kueue.dev.tos.obx"
frontend:
env:
- name: REACT_APP_WEBSOCKET_URL
value: "wss://kueue.dev.tos.obx"
-9
View File
@@ -1,9 +0,0 @@
kueueViz:
backend:
env:
- name: KUEUEVIZ_ALLOWED_ORIGINS
value: "https://kueue.dev.vtn.obx"
frontend:
env:
- name: REACT_APP_WEBSOCKET_URL
value: "wss://kueue.dev.vtn.obx"
+11 -18
View File
@@ -1,21 +1,14 @@
controllerManager:
featureGates:
- name: TopologyAwareScheduling
enabled: true
- name: LocalQueueMetrics
enabled: true
managerConfig:
controllerManagerConfigYaml: |
apiVersion: config.kueue.x-k8s.io/v1beta1
kind: Configuration
integrations:
frameworks:
- batch/job
- jobset.x-k8s.io/jobset
internalCertManagement:
enable: false
enableCertManager: false
managerConfig:
controllerManagerConfigYaml: |
apiVersion: config.kueue.x-k8s.io/v1beta2
kind: Configuration
integrations:
frameworks:
- batch/job
- jobset.x-k8s.io/jobset
internalCertManagement:
enable: false
enableCertManager: true
enablePrometheus: true
metrics:
prometheusNamespace: prometheus
enableKueueViz: true
-4
View File
@@ -72,7 +72,3 @@ metrics:
for: 15m
labels:
severity: critical
kubectl:
image:
repository: docker.io/bitnamilegacy/kubectl
tag: 1.33.4