Compare commits

..

161 Commits

Author SHA1 Message Date
373823e565 chore(deps): update helm release argo-cd to v9.4.7 2026-03-03 12:00:55 +00:00
d36dd7735f chore(deps): update helm release argo-cd to v9.4.6 2026-03-01 21:00:31 +00:00
1a0aeb0e64 chore(deps): update helm release kube-prometheus-stack to v82.4.3 2026-02-27 19:00:32 +00:00
e6e63b5b2c chore(deps): update ghcr.io/siderolabs/discovery-service docker tag to v1.0.15 2026-02-27 11:00:50 +00:00
0fcb071122 chore(deps): update helm release kube-prometheus-stack to v82.4.2 2026-02-27 10:00:35 +00:00
e0f4fc71af chore(deps): update helm release kube-prometheus-stack to v82.4.1 2026-02-26 20:00:31 +00:00
e747bbe519 chore(deps): update helm release argo-cd to v9.4.5 2026-02-26 09:00:25 +00:00
067c3cbc59 Merge pull request 'chore(deps): update helm release velero to v11.4.0' (#252) from renovate/velero-11.x into main
Reviewed-on: #252
2026-02-26 02:07:55 +00:00
27fcdd6bac Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v82.4.0' (#253) from renovate/kube-prometheus-stack-82.x into main
Reviewed-on: #253
2026-02-26 02:07:34 +00:00
67a7c32675 chore(deps): update helm release kube-prometheus-stack to v82.4.0 2026-02-25 08:00:57 +00:00
c352c07f7b chore(deps): update helm release velero to v11.4.0 2026-02-25 05:01:07 +00:00
3397d80865 chore(deps): update helm release rook-ceph to v1.19.2 2026-02-24 20:00:39 +00:00
39548b9b31 chore(deps): update helm release cert-manager to v1.19.4 2026-02-24 16:01:20 +00:00
9b75b8d4bf chore(deps): update helm release argo-cd to v9.4.4 2026-02-22 20:00:35 +00:00
8d29dd8bd1 chore(deps): update helm release kube-prometheus-stack to v82.2.1 2026-02-22 18:00:23 +00:00
4090830d95 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v82.2.0' (#245) from renovate/kube-prometheus-stack-82.x into main
Reviewed-on: #245
2026-02-20 16:40:41 +00:00
21790a5a41 chore(deps): update helm release kube-prometheus-stack to v82.2.0 2026-02-20 15:00:59 +00:00
4ab5ecdd6f chore(deps): update helm release traefik to v39.0.2 2026-02-20 15:00:48 +00:00
c11f7897d7 chore(deps): update helm release external-secrets to v2.0.1 2026-02-20 14:00:24 +00:00
8839dd6eb1 chore(deps): update helm release kube-prometheus-stack to v82.1.1 2026-02-19 17:00:39 +00:00
cc57178974 chore(deps): update helm release argo-cd to v9.4.3 2026-02-18 17:00:59 +00:00
3d95158244 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v82.1.0' (#240) from renovate/kube-prometheus-stack-82.x into main
Reviewed-on: #240
2026-02-17 19:36:08 +00:00
141f05c6ae chore(deps): update helm release kube-prometheus-stack to v82.1.0 2026-02-17 15:00:31 +00:00
3651f23c72 chore(deps): update helm release kube-prometheus-stack to v82.0.2 2026-02-17 01:00:25 +00:00
b4cbbd97a6 chore(deps): update helm release kube-prometheus-stack to v82.0.1 2026-02-16 19:00:19 +00:00
ede26d9c1d Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v82' (#237) from renovate/kube-prometheus-stack-82.x into main
Reviewed-on: #237
2026-02-16 14:14:15 +00:00
cc14ef66ed chore(deps): update helm release kube-prometheus-stack to v82 2026-02-15 08:00:27 +00:00
35b3f6cc42 chore(deps): update helm release kube-prometheus-stack to v81.6.9 2026-02-13 23:00:30 +00:00
033a3b95ad chore(deps): update helm release kube-prometheus-stack to v81.6.8 2026-02-13 22:00:24 +00:00
f90060e366 chore(deps): update helm release kube-prometheus-stack to v81.6.7 2026-02-13 15:00:25 +00:00
1f074a7087 chore(deps): update helm release kube-prometheus-stack to v81.6.6 2026-02-13 13:01:24 +00:00
c6cf3b7d84 chore(deps): update helm release argo-cd to v9.4.2 2026-02-13 13:00:24 +00:00
e611c68342 chore(deps): update ghcr.io/siderolabs/discovery-service docker tag to v1.0.14 2026-02-13 12:00:30 +00:00
d828d88078 chore(deps): update helm release traefik to v39.0.1 2026-02-13 10:00:29 +00:00
8fa00efc16 chore(deps): update helm release kube-prometheus-stack to v81.6.5 2026-02-13 06:00:24 +00:00
fbe2274182 chore(deps): update helm release kube-prometheus-stack to v81.6.4 2026-02-13 02:00:37 +00:00
bf4985040a chore(deps): update helm release kubernetes-replicator to v2.12.3 2026-02-12 11:00:46 +00:00
ce3a367ec9 chore(deps): update helm release kube-prometheus-stack to v81.6.3 2026-02-12 09:00:20 +00:00
6006e75db9 chore(deps): update helm release kube-prometheus-stack to v81.6.2 2026-02-11 19:00:31 +00:00
db590d1d2c Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v81.6.1' (#224) from renovate/kube-prometheus-stack-81.x into main
Reviewed-on: #224
2026-02-10 18:52:20 +00:00
7b6f92646f chore(deps): update helm release kube-prometheus-stack to v81.6.1 2026-02-10 14:00:27 +00:00
6bbd9748a2 chore(deps): update helm release kube-prometheus-stack to v81.5.2 2026-02-09 19:00:20 +00:00
b22ff17c1d chore(deps): update helm release kube-prometheus-stack to v81.5.1 2026-02-09 13:00:43 +00:00
96900bea0c add README 2026-02-07 13:47:45 -05:00
0f84c335de omni: use ipvs for kube-proxy 2026-02-06 21:31:00 -05:00
5e1b5dc007 omni: try to use iptables mode instead of nftables for kube-proxy in attempt to fix TLS timeout issues 2026-02-06 14:48:53 -05:00
f0f1b45c93 Merge pull request 'chore(deps): update cloudflare/cloudflared docker tag to v2026.2.0' (#220) from renovate/cloudflare-cloudflared-2026.x into main
Reviewed-on: #220
2026-02-06 19:42:42 +00:00
46c4e7b50f Merge pull request 'chore(deps): update helm release external-secrets to v2' (#221) from renovate/external-secrets-2.x into main
Reviewed-on: #221
2026-02-06 19:42:18 +00:00
dbba05d7b6 chore(deps): update helm release external-secrets to v2 2026-02-06 16:00:30 +00:00
db9aa7c99d chore(deps): update cloudflare/cloudflared docker tag to v2026.2.0 2026-02-06 16:00:22 +00:00
8f0d73946f traefik: update traefik-local service to have a 3600 second timeout 2026-02-05 19:43:20 -05:00
d0ac6145e0 chore(deps): update helm release rook-ceph to v1.19.1 2026-02-05 22:00:37 +00:00
b9830a2153 chore(deps): update helm release argo-cd to v9.4.1 2026-02-05 20:00:24 +00:00
4f51cc5799 chore(deps): update helm release external-secrets to v1.3.2 2026-02-03 21:00:24 +00:00
fe1707d078 argocd: add default values to externalsecrets 2026-02-03 13:30:51 -05:00
df154d3b8b Merge pull request 'chore(deps): update helm release argo-cd to v9.4.0' (#214) from renovate/argo-cd-9.x into main
Reviewed-on: #214
2026-02-03 18:21:55 +00:00
49d6684d0a Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v81.5.0' (#216) from renovate/kube-prometheus-stack-81.x into main
Reviewed-on: #216
2026-02-03 18:21:37 +00:00
179cdaffd7 chore(deps): update helm release kube-prometheus-stack to v81.5.0 2026-02-03 17:00:42 +00:00
396c998336 chore(deps): update helm release kube-prometheus-stack to v81.4.3 2026-02-03 08:00:23 +00:00
1829d76a07 omni: rewrite git.dubyatp.xyz to traefik local 2026-02-02 22:22:19 -05:00
4315074427 traefik: add traefik-local svc 2026-02-02 21:21:53 -05:00
289a51fd7d chore(deps): update helm release argo-cd to v9.4.0 2026-02-03 00:00:39 +00:00
b6f178ef88 chore(deps): update helm release cert-manager to v1.19.3 2026-02-02 15:00:30 +00:00
eb021c1510 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v81.4.2' (#212) from renovate/kube-prometheus-stack-81.x into main
Reviewed-on: #212
2026-01-31 02:36:02 +00:00
99e7e0ae30 chore(deps): update helm release kube-prometheus-stack to v81.4.2 2026-01-30 22:00:50 +00:00
e80fb62fd7 chore(deps): update helm release kube-prometheus-stack to v81.3.2 2026-01-30 09:00:57 +00:00
b6cf261505 chore(deps): update helm release kube-prometheus-stack to v81.3.1 2026-01-29 18:01:21 +00:00
cc2b1825d5 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v81.3.0' (#209) from renovate/kube-prometheus-stack-81.x into main
Reviewed-on: #209
2026-01-29 00:01:54 +00:00
5b15d78da0 chore(deps): update helm release kube-prometheus-stack to v81.3.0 2026-01-28 20:01:08 +00:00
3e54d7c96d chore(deps): update helm release kube-prometheus-stack to v81.2.5 2026-01-28 18:00:32 +00:00
52d680a143 chore(deps): update cloudflare/cloudflared docker tag to v2026.1.2 2026-01-27 12:00:39 +00:00
a5a604a496 chore(deps): update helm release argo-cd to v9.3.7 2026-01-27 08:00:41 +00:00
9194de2325 chore(deps): update helm release argo-cd to v9.3.6 2026-01-26 12:00:29 +00:00
ce5a5c63e3 Merge pull request 'chore(deps): update helm release external-secrets to v1.3.1' (#203) from renovate/external-secrets-1.x into main
Reviewed-on: #203
2026-01-23 23:45:20 +00:00
6a4c3e2253 chore(deps): update helm release kube-prometheus-stack to v81.2.2 2026-01-23 21:00:22 +00:00
65013f6720 chore(deps): update helm release external-secrets to v1.3.1 2026-01-23 19:00:19 +00:00
9426dbeb71 traefik: remove unnecessary line 2026-01-23 10:11:23 -05:00
ca3234cb79 traefik: fix syntax for new version 2026-01-23 10:09:43 -05:00
6d2d895b67 Merge pull request 'chore(deps): update helm release traefik to v39' (#201) from renovate/traefik-39.x into main
Reviewed-on: #201
2026-01-23 15:01:10 +00:00
c2bd9b23ac Merge pull request 'chore(deps): update helm release kite to v0.7.8' (#202) from renovate/kite-0.x into main
Reviewed-on: #202
2026-01-23 14:54:06 +00:00
0790ccd2ad kite: add deployment strategy 2026-01-23 09:52:40 -05:00
ddcadddaaa chore(deps): update helm release kite to v0.7.8 2026-01-23 12:00:32 +00:00
8fabc526ad chore(deps): update helm release traefik to v39 2026-01-23 08:00:24 +00:00
e285b581f3 chore(deps): update helm release argo-cd to v9.3.5 2026-01-23 07:00:21 +00:00
3f614405c8 chore(deps): update helm release kube-prometheus-stack to v81.2.1 2026-01-22 18:00:53 +00:00
079fdd4da2 rook-ceph: upgrade ceph to v20.2.0-20251104 2026-01-21 11:26:16 -05:00
6e22223c4b Merge pull request 'chore(deps): update helm release rook-ceph to v1.19.0' (#198) from renovate/rook-ceph-1.x into main
Reviewed-on: #198
2026-01-21 00:54:55 +00:00
61d5ad7071 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v81.2.0' (#196) from renovate/kube-prometheus-stack-81.x into main
Reviewed-on: #196
2026-01-21 00:45:04 +00:00
cd3f663549 Merge pull request 'chore(deps): update cloudflare/cloudflared docker tag to v2026' (#197) from renovate/cloudflare-cloudflared-2026.x into main
Reviewed-on: #197
2026-01-21 00:42:35 +00:00
f1fd7c6cb1 chore(deps): update helm release rook-ceph to v1.19.0 2026-01-20 20:00:57 +00:00
175b2c13f9 chore(deps): update helm release kube-prometheus-stack to v81.2.0 2026-01-20 19:00:21 +00:00
a643de1085 chore(deps): update cloudflare/cloudflared docker tag to v2026 2026-01-20 12:00:55 +00:00
e5aab6948d Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v81' (#195) from renovate/kube-prometheus-stack-81.x into main
Reviewed-on: #195
2026-01-20 00:08:08 +00:00
30456b3817 chore(deps): update helm release kube-prometheus-stack to v81 2026-01-19 22:00:23 +00:00
ab12531084 chore(deps): update velero/velero-plugin-for-aws docker tag to v1.13.2 2026-01-16 08:00:27 +00:00
b789b7be21 chore(deps): update helm release kube-prometheus-stack to v80.14.4 2026-01-15 15:00:53 +00:00
3a2cfdb84e chore(deps): update helm release argo-cd to v9.3.4 2026-01-14 22:00:23 +00:00
506c034948 argocd: remove unnecessary and annoying prometheus alert 2026-01-14 13:27:50 -05:00
7cbc80906e chore(deps): update helm release kube-prometheus-stack to v80.14.3 2026-01-14 15:00:53 +00:00
3fd705520c chore(deps): update helm release kube-prometheus-stack to v80.14.2 2026-01-14 04:00:53 +00:00
94d65decd1 chore(deps): update helm release argo-cd to v9.3.3 2026-01-13 23:00:55 +00:00
e06a1be194 chore(deps): update helm release kube-prometheus-stack to v80.14.1 2026-01-13 21:01:40 +00:00
dc926c31de chore(deps): update helm release rook-ceph to v1.18.9 2026-01-13 20:00:23 +00:00
af31507e8c Merge branch 'renovate/argo-cd-9.x' 2026-01-13 11:28:24 -05:00
c0ca549393 Merge branch 'renovate/kube-prometheus-stack-80.x' 2026-01-13 11:26:09 -05:00
a113c84c9d chore(deps): update helm release kube-prometheus-stack to v80.14.0 2026-01-13 16:00:44 +00:00
a7cc46ed8a chore(deps): update helm release argo-cd to v9.3.1 2026-01-13 11:00:29 +00:00
54e6a76aab chore(deps): update helm release kube-prometheus-stack to v80.13.3 2026-01-09 10:00:58 +00:00
33ef2866e9 chore(deps): update helm release traefik to v38.0.2 2026-01-08 09:00:26 +00:00
b609e87dd3 chore(deps): update helm release kube-prometheus-stack to v80.13.2 2026-01-07 23:00:59 +00:00
e1ffafc161 chore(deps): update helm release kube-prometheus-stack to v80.13.1 2026-01-07 18:00:29 +00:00
4170dfa26c Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v80.13.0' (#180) from renovate/kube-prometheus-stack-80.x into main
Reviewed-on: #180
2026-01-06 22:56:17 +00:00
5fcb92ee8b chore(deps): update helm release kube-prometheus-stack to v80.13.0 2026-01-06 22:00:55 +00:00
c5acc2416f chore(deps): update helm release velero to v11.3.2 2026-01-06 12:00:56 +00:00
87b667b2ab chore(deps): update helm release kube-prometheus-stack to v80.11.1 2026-01-06 11:00:55 +00:00
d68d2db3bc Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v80.11.0' (#177) from renovate/kube-prometheus-stack-80.x into main
Reviewed-on: #177
2026-01-06 01:46:43 +00:00
ad68a17eb5 Merge pull request 'chore(deps): update helm release kite to v0.7.7' (#176) from renovate/kite-0.x into main
Reviewed-on: #176
2026-01-06 01:46:28 +00:00
b07c7bf3a0 chore(deps): update helm release kube-prometheus-stack to v80.11.0 2026-01-05 15:00:58 +00:00
78fc45ae6c chore(deps): update helm release kite to v0.7.7 2026-01-05 13:00:27 +00:00
2fa1594e99 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v80.10.0' (#173) from renovate/kube-prometheus-stack-80.x into main
Reviewed-on: #173
2026-01-03 16:53:26 +00:00
b211327516 chore(deps): update helm release external-secrets to v1.2.1 2026-01-02 23:00:55 +00:00
6885ec790c chore(deps): update helm release argo-cd to v9.2.4 2026-01-02 23:00:27 +00:00
664cace62e chore(deps): update helm release kube-prometheus-stack to v80.10.0 2026-01-02 18:00:26 +00:00
dae06b2c05 chore(deps): update helm release kube-prometheus-stack to v80.9.2 2025-12-31 11:00:57 +00:00
583831273d kite: create volume backups 2025-12-31 00:15:20 -05:00
f327b23001 try automerging patches 2025-12-31 00:01:26 -05:00
6f2603d3a0 remove redundant node alerts 2025-12-30 23:50:18 -05:00
c26ea4e139 Merge pull request 'chore(deps): update helm release velero to v11.3.1' (#170) from renovate/velero-11.x into main
Reviewed-on: #170
2025-12-31 04:44:22 +00:00
b521924f00 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v80.9.1' (#171) from renovate/kube-prometheus-stack-80.x into main
Reviewed-on: #171
2025-12-31 04:44:07 +00:00
19f203e374 re-add weyma-talos-cp04 2025-12-30 23:43:11 -05:00
bb251462fb update omni cluster template 2025-12-30 22:44:13 -05:00
9a9d108e7c chore(deps): update helm release kube-prometheus-stack to v80.9.1 2025-12-30 19:00:56 +00:00
70d5ae2e48 chore(deps): update helm release velero to v11.3.1 2025-12-29 11:00:24 +00:00
e6e25baee1 Merge pull request 'chore(deps): update helm release argo-cd to v9.2.3' (#168) from renovate/argo-cd-9.x into main
Reviewed-on: #168
2025-12-29 00:55:53 +00:00
a08e9930d5 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v80.8.0' (#169) from renovate/kube-prometheus-stack-80.x into main
Reviewed-on: #169
2025-12-29 00:55:41 +00:00
94bb98b4ed chore(deps): update helm release argo-cd to v9.2.3 2025-12-28 13:00:26 +00:00
07f863b0a7 chore(deps): update helm release kube-prometheus-stack to v80.8.0 2025-12-28 01:08:47 +00:00
79669aaf16 Merge pull request 'chore(deps): update helm release external-secrets to v1.2.0' (#164) from renovate/external-secrets-1.x into main
Reviewed-on: #164
2025-12-23 20:45:46 +00:00
7237e23151 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v80.6.0' (#165) from renovate/kube-prometheus-stack-80.x into main
Reviewed-on: #165
2025-12-23 20:45:33 +00:00
f4cc060de7 Merge pull request 'chore(deps): update helm release argo-cd to v9.2.0' (#166) from renovate/argo-cd-9.x into main
Reviewed-on: #166
2025-12-23 20:44:27 +00:00
15f5cb1cbc Merge pull request 'chore(deps): update helm release kite to v0.7.6' (#167) from renovate/kite-0.x into main
Reviewed-on: #167
2025-12-23 20:44:16 +00:00
373b418601 chore(deps): update helm release kite to v0.7.6 2025-12-23 17:03:22 +00:00
95af55533e chore(deps): update helm release argo-cd to v9.2.0 2025-12-23 12:00:27 +00:00
24b29cc9a9 consolidate everything into main file, needed for import 2025-12-22 16:49:31 -05:00
ba292377ab derp 2025-12-20 17:19:37 -05:00
9ee0e419a0 fix dispatcharr route 2025-12-20 17:16:49 -05:00
0ee35ec27c im tar 2025-12-20 17:13:04 -05:00
9697736ed3 traefik: add rule to dispatcharr route 2025-12-20 17:10:35 -05:00
1dea2edfcc traefik: add static route for dispatcharr 2025-12-20 17:00:13 -05:00
ae3d90eb10 chore(deps): update helm release kube-prometheus-stack to v80.6.0 2025-12-19 16:00:23 +00:00
72e16276b8 chore(deps): update helm release external-secrets to v1.2.0 2025-12-19 15:00:19 +00:00
f1fe246f14 Merge pull request 'chore(deps): update helm release traefik to v38' (#161) from renovate/traefik-38.x into main
Reviewed-on: #161
2025-12-19 14:59:37 +00:00
afe3aaf866 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v80.5.0' (#163) from renovate/kube-prometheus-stack-80.x into main
Reviewed-on: #163
2025-12-19 14:58:25 +00:00
603b6fdbd3 Merge pull request 'chore(deps): update helm release argo-cd to v9.1.9' (#162) from renovate/argo-cd-9.x into main
Reviewed-on: #162
2025-12-19 14:56:05 +00:00
b4fa24c8d1 chore(deps): update helm release traefik to v38 2025-12-19 14:01:27 +00:00
1c344f11c4 chore(deps): update helm release kube-prometheus-stack to v80.5.0 2025-12-18 16:01:00 +00:00
a9f1a7cf69 chore(deps): update helm release argo-cd to v9.1.9 2025-12-18 13:00:55 +00:00
335563a895 Merge pull request 'chore(deps): update helm release kube-prometheus-stack to v80.4.2' (#160) from renovate/kube-prometheus-stack-80.x into main
Reviewed-on: #160
2025-12-17 15:34:06 +00:00
72df8103f2 Merge pull request 'chore(deps): update helm release argo-cd to v9.1.8' (#159) from renovate/argo-cd-9.x into main
Reviewed-on: #159
2025-12-17 15:33:19 +00:00
22dbbaf64f chore(deps): update helm release kube-prometheus-stack to v80.4.2 2025-12-17 15:01:09 +00:00
ecba2195b6 chore(deps): update helm release argo-cd to v9.1.8 2025-12-16 02:00:20 +00:00
29 changed files with 397 additions and 277 deletions

37
README.md Normal file
View File

@@ -0,0 +1,37 @@
# Main Infrastructure: weyma-talos
**Production Kubernetes infrastructure with disaster recovery capabilities**
This repository contains the foundational infrastructure for my Kubernetes homelab, designed with reliability and rapid recovery as core principles.
## Architecture
My infrastructure follows a layered "black start" approach - essential services run outside the Kubernetes cluster to enable cluster bootstrapping and recovery from total failures.
### Black Start Layer
Static services (Docker Compose on TrueNAS/Proxmox) that provide cluster dependencies:
- Image cache for faster deployments and offline capability
- Talos discovery server for node bootstrapping
- HashiCorp Vault for secrets management (external to cluster)
- Future: Self-hosted Sidero Omni server (migrating from SaaS)
### System Apps Layer
Applications running within Kubernetes that provide core cluster functionality, managed via ArgoCD with GitOps principles.
## Repository Structure
- **`black-start/`** - Docker Compose services for cluster dependencies
- **`config-patches/`** - Talos Linux configuration patches for cluster and individual machines
- **`omni/`** - Sidero Omni [cluster template](https://docs.siderolabs.com/omni/reference/cluster-templates)
- **`system-apps/`** - System applications (ArgoCD projects) - monitoring, ingress, certificates, storage
## Tech Stack
**OS:** Talos Linux | **Orchestration:** Kubernetes | **GitOps:** ArgoCD | **Secrets:** Vault | **Storage:** Rook-Ceph
## Recovery Process
The "black start" architecture enables ~15-20 minute automated recovery from complete infrastructure failure:
1. Start black-start services → 2. Bootstrap Talos → 3. Deploy system apps → 4. Deploy core apps
For application deployments, see [core-apps](https://git.dubyatp.xyz/core-apps).

View File

@@ -2,7 +2,7 @@ version: "3.8"
services:
discovery:
restart: unless-stopped
image: ghcr.io/siderolabs/discovery-service:v1.0.13
image: ghcr.io/siderolabs/discovery-service:v1.0.15
ports:
- 10.105.6.215:3000:3000
- 10.105.6.215:3001:3001

View File

@@ -1,5 +0,0 @@
kind: ControlPlane
machines:
- 20b4c826-e699-43b3-826d-73eb5173680b
- 30303031-3030-3030-6335-303731636665
- 5fdea709-56ad-45f2-966d-5e344dbe4fdf

View File

@@ -1,16 +0,0 @@
kind: Machine
systemExtensions:
- siderolabs/nut-client
- siderolabs/qemu-guest-agent
name: 5fdea709-56ad-45f2-966d-5e344dbe4fdf
patches:
- idOverride: 400-cm-5fdea709-56ad-45f2-966d-5e344dbe4fdf
inline:
machine:
network:
hostname: weyma-talos-cp01
interfaces:
- deviceSelector:
driver: virtio*
hardwareAddr: bc:24:11:e6:ff:7b
dhcp: true

View File

@@ -1,13 +0,0 @@
kind: Machine
name: 20b4c826-e699-43b3-826d-73eb5173680b
patches:
- idOverride: 400-cm-20b4c826-e699-43b3-826d-73eb5173680b
inline:
machine:
network:
hostname: weyma-talos-cp02
interfaces:
- deviceSelector:
driver: virtio*
hardwareAddr: 00:16:3e:9c:01:27
dhcp: true

View File

@@ -1,14 +0,0 @@
kind: Machine
systemExtensions:
- siderolabs/nut-client
name: 30303031-3030-3030-6335-303731636665
patches:
- idOverride: 400-cm-30303031-3030-3030-6335-303731636665
inline:
machine:
network:
hostname: weyma-talos-cp04
interfaces:
- deviceSelector:
hardwareAddr: dc:a6:32:95:0f:cb
dhcp: true

View File

@@ -1,30 +0,0 @@
kind: Machine
systemExtensions:
- siderolabs/i915
- siderolabs/nut-client
name: 03000200-0400-0500-0006-000700080009
install:
disk: /dev/sda
patches:
- idOverride: 400-cm-03000200-0400-0500-0006-000700080009
inline:
machine:
network:
hostname: weyma-talos-testw01
interfaces:
- deviceSelector:
driver: igc
hardwareAddr: e8:ff:1e:d5:f8:22
dhcp: true
vlans:
- dhcp: false
vlanId: 50
- deviceSelector:
hardwareAddr: e8:ff:1e:d5:f8:21
dhcp: true
mtu: 9000
- bridge:
interfaces:
- enp2s0.50
dhcp: false
interface: br0

View File

@@ -1,25 +0,0 @@
kind: Machine
name: 1006b91a-ecbf-11ea-aed4-046ba1ee3700
patches:
- idOverride: 400-cm-1006b91a-ecbf-11ea-aed4-046ba1ee3700
inline:
machine:
network:
hostname: weyma-talos-testw04
interfaces:
- deviceSelector:
driver: mlx4_core
hardwareAddr: f4:52:14:60:5e:30
dhcp: true
vlans:
- dhcp: false
vlanId: 50
- deviceSelector:
hardwareAddr: f4:52:14:60:5e:31
dhcp: true
mtu: 9000
- bridge:
interfaces:
- eno1.50
dhcp: false
interface: br0

View File

@@ -1,24 +0,0 @@
kind: Machine
name: 5f0cd701-0784-4fcc-8e52-3b3304049972
patches:
- idOverride: 400-cm-5f0cd701-0784-4fcc-8e52-3b3304049972
inline:
machine:
network:
hostname: weyma-talos-testw05
interfaces:
- deviceSelector:
hardwareAddr: 00:16:3e:b3:dd:f8
dhcp: true
- deviceSelector:
hardwareAddr: 00:16:3e:e5:79:0a
dhcp: true
mtu: 9000
- deviceSelector:
hardwareAddr: 00:16:3e:6b:1c:1d
dhcp: false
- bridge:
interfaces:
- enx00163e6b1c1d
dhcp: false
interface: br0

View File

@@ -1,25 +0,0 @@
kind: Machine
name: 02c02200-f403-11ef-9372-70f446672600
patches:
- idOverride: 400-cm-02c02200-f403-11ef-9372-70f446672600
inline:
machine:
network:
hostname: weyma-talos-w02
interfaces:
- deviceSelector:
driver: igc
hardwareAddr: e8:ff:1e:d4:b8:89
dhcp: true
vlans:
- dhcp: false
vlanId: 50
- deviceSelector:
hardwareAddr: e8:ff:1e:d4:b8:8a
dhcp: true
mtu: 9000
- bridge:
interfaces:
- enp1s0.50
dhcp: false
interface: br0

View File

@@ -1,27 +0,0 @@
kind: Machine
name: da507021-8912-4337-86a3-94a05bd1cf05
patches:
- idOverride: 400-cm-da507021-8912-4337-86a3-94a05bd1cf05
inline:
machine:
network:
hostname: weyma-talos-w03
interfaces:
- deviceSelector:
driver: virtio*
hardwareAddr: bc:24:11:be:6c:08
dhcp: true
- deviceSelector:
driver: virtio*
hardwareAddr: bc:24:11:f8:4a:92
dhcp: true
mtu: 8996
- deviceSelector:
driver: virtio*
hardwareAddr: bc:24:11:93:02:0e
dhcp: false
- bridge:
interfaces:
- enxbc241193020e
dhcp: false
interface: br0

View File

@@ -52,6 +52,7 @@ patches:
bind-address: 0.0.0.0
proxy:
extraArgs:
proxy-mode: ipvs
metrics-bind-address: 0.0.0.0:10249
scheduler:
extraArgs:
@@ -287,3 +288,245 @@ patches:
selector:
k8s-app: metrics-server
name: metrics-lb
- contents: |-
apiVersion: v1
data:
Corefile: |
.:53 {
errors
health {
lameduck 5s
}
ready
log . {
class error
}
prometheus :9153
kubernetes cluster.local in-addr.arpa ip6.arpa {
pods insecure
fallthrough in-addr.arpa ip6.arpa
ttl 30
}
rewrite name git.dubyatp.xyz traefik-local.traefik.svc.cluster.local
forward . /etc/resolv.conf {
max_concurrent 1000
}
cache 30 {
disable success cluster.local
disable denial cluster.local
}
loop
reload
loadbalance
}
kind: ConfigMap
metadata:
name: coredns
namespace: kube-system
name: coredns-config
---
kind: ControlPlane
machines:
- 20b4c826-e699-43b3-826d-73eb5173680b
- 5fdea709-56ad-45f2-966d-5e344dbe4fdf
- 30303031-3030-3030-6335-303731636665
---
kind: Workers
machines:
- 02c02200-f403-11ef-9372-70f446672600
- 03000200-0400-0500-0006-000700080009
- 1006b91a-ecbf-11ea-aed4-046ba1ee3700
- 5f0cd701-0784-4fcc-8e52-3b3304049972
- da507021-8912-4337-86a3-94a05bd1cf05
---
kind: Machine
name: 02c02200-f403-11ef-9372-70f446672600
patches:
- idOverride: 400-cm-02c02200-f403-11ef-9372-70f446672600
annotations:
name: ""
inline:
machine:
network:
hostname: weyma-talos-w02
interfaces:
- deviceSelector:
driver: igc
hardwareAddr: e8:ff:1e:d4:b8:89
dhcp: true
vlans:
- dhcp: false
vlanId: 50
- deviceSelector:
hardwareAddr: e8:ff:1e:d4:b8:8a
dhcp: true
mtu: 9000
- bridge:
interfaces:
- enp1s0.50
dhcp: false
interface: br0
---
kind: Machine
name: 03000200-0400-0500-0006-000700080009
patches:
- idOverride: 400-cm-03000200-0400-0500-0006-000700080009
annotations:
name: ""
inline:
machine:
network:
hostname: weyma-talos-testw01
interfaces:
- deviceSelector:
driver: igc
hardwareAddr: e8:ff:1e:d5:f8:22
dhcp: true
vlans:
- dhcp: false
vlanId: 50
- deviceSelector:
hardwareAddr: e8:ff:1e:d5:f8:21
dhcp: true
mtu: 9000
- bridge:
interfaces:
- enp2s0.50
dhcp: false
interface: br0
---
kind: Machine
name: 1006b91a-ecbf-11ea-aed4-046ba1ee3700
patches:
- idOverride: 400-cm-1006b91a-ecbf-11ea-aed4-046ba1ee3700
annotations:
name: ""
inline:
machine:
network:
hostname: weyma-talos-testw04
interfaces:
- deviceSelector:
driver: mlx4_core
hardwareAddr: f4:52:14:60:5e:30
dhcp: true
vlans:
- dhcp: false
vlanId: 50
- deviceSelector:
hardwareAddr: f4:52:14:60:5e:31
dhcp: true
mtu: 9000
- bridge:
interfaces:
- eno1.50
dhcp: false
interface: br0
---
kind: Machine
name: 30303031-3030-3030-6335-303731636665
patches:
- idOverride: 400-cm-30303031-3030-3030-6335-303731636665
inline:
machine:
network:
hostname: weyma-talos-cp04
interfaces:
- deviceSelector:
hardwareAddr: dc:a6:32:95:0f:cb
dhcp: true
---
kind: Machine
name: 20b4c826-e699-43b3-826d-73eb5173680b
patches:
- idOverride: 400-cm-20b4c826-e699-43b3-826d-73eb5173680b
annotations:
name: ""
inline:
machine:
network:
hostname: weyma-talos-cp02
interfaces:
- deviceSelector:
driver: virtio*
hardwareAddr: 00:16:3e:9c:01:27
dhcp: true
---
kind: Machine
name: 5f0cd701-0784-4fcc-8e52-3b3304049972
patches:
- idOverride: 400-cm-5f0cd701-0784-4fcc-8e52-3b3304049972
annotations:
name: ""
inline:
machine:
network:
hostname: weyma-talos-testw05
interfaces:
- deviceSelector:
hardwareAddr: 00:16:3e:b3:dd:f8
dhcp: true
- deviceSelector:
hardwareAddr: 00:16:3e:e5:79:0a
dhcp: true
mtu: 9000
- deviceSelector:
hardwareAddr: 00:16:3e:6b:1c:1d
dhcp: false
- bridge:
interfaces:
- enx00163e6b1c1d
dhcp: false
interface: br0
---
kind: Machine
systemExtensions:
- siderolabs/nut-client
- siderolabs/qemu-guest-agent
name: 5fdea709-56ad-45f2-966d-5e344dbe4fdf
patches:
- idOverride: 400-cm-5fdea709-56ad-45f2-966d-5e344dbe4fdf
annotations:
name: ""
inline:
machine:
network:
hostname: weyma-talos-cp01
interfaces:
- deviceSelector:
driver: virtio*
hardwareAddr: bc:24:11:e6:ff:7b
dhcp: true
---
kind: Machine
name: da507021-8912-4337-86a3-94a05bd1cf05
patches:
- idOverride: 400-cm-da507021-8912-4337-86a3-94a05bd1cf05
annotations:
name: ""
inline:
machine:
network:
hostname: weyma-talos-w03
interfaces:
- deviceSelector:
driver: virtio*
hardwareAddr: bc:24:11:be:6c:08
dhcp: true
- deviceSelector:
driver: virtio*
hardwareAddr: bc:24:11:f8:4a:92
dhcp: true
mtu: 8996
- deviceSelector:
driver: virtio*
hardwareAddr: bc:24:11:93:02:0e
dhcp: false
- bridge:
interfaces:
- enxbc241193020e
dhcp: false
interface: br0

View File

@@ -1,7 +0,0 @@
kind: Workers
machines:
- 02c02200-f403-11ef-9372-70f446672600
- 03000200-0400-0500-0006-000700080009
- 1006b91a-ecbf-11ea-aed4-046ba1ee3700
- 5f0cd701-0784-4fcc-8e52-3b3304049972
- da507021-8912-4337-86a3-94a05bd1cf05

View File

@@ -14,6 +14,12 @@
}
],
"packageRules": [
{
"description": "Automerge patch updates",
"matchUpdateTypes": ["patch"],
"matchCurrentVersion": "!/^0/",
"automerge": true
},
{
"description": "Rook Ceph - auto-update minor and patch versions only",
"matchDatasources": ["docker"],

View File

@@ -24,5 +24,5 @@ appVersion: "1.0"
dependencies:
- name: argo-cd
version: 9.1.7
version: 9.4.7
repository: https://argoproj.github.io/argo-helm

View File

@@ -56,18 +56,6 @@ argo-cd:
Argo CD has not reported any applications data for the past 15 minutes which
means that it must be down or not functioning properly. This needs to be
resolved for this cloud to continue to maintain state.
- alert: ArgoAppNotSynced
expr: |
argocd_app_info{sync_status!="Synced"} == 1
for: 12h
labels:
severity: warning
annotations:
summary: '{{ $labels.name }} Application not synchronized'
description: >
The application {{ $labels.name }} has not been synchronized for over
12 hours which means that the state of this cloud has drifted away from the
state inside Git.
server:
ingress:
enabled: true
@@ -140,18 +128,30 @@ argo-cd:
remoteRef:
key: argo-cd
property: webhook.gitea.secret
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: admin.password
remoteRef:
key: argo-cd
property: admin.password
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: admin.passwordMtime
remoteRef:
key: argo-cd
property: admin.passwordMtime
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: dex.authentik.clientSecret
remoteRef:
key: argo-cd
property: dex.authentik.clientSecret
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- apiVersion: external-secrets.io/v1
kind: ExternalSecret
metadata:
@@ -172,14 +172,23 @@ argo-cd:
remoteRef:
key: argo-cd-git
property: sshPrivateKey
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: type
remoteRef:
key: argo-cd-git
property: type
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: url
remoteRef:
key: argo-cd-git
property: url.core-apps
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- apiVersion: external-secrets.io/v1
kind: ExternalSecret
metadata:
@@ -200,14 +209,23 @@ argo-cd:
remoteRef:
key: argo-cd-git
property: sshPrivateKey
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: type
remoteRef:
key: argo-cd-git
property: type
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: url
remoteRef:
key: argo-cd-git
property: url.weyma-talos
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- apiVersion: external-secrets.io/v1
kind: ExternalSecret
metadata:
@@ -228,14 +246,23 @@ argo-cd:
remoteRef:
key: argo-cd-git
property: sshPrivateKey
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: type
remoteRef:
key: argo-cd-git
property: type
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: url
remoteRef:
key: argo-cd-git
property: url.williamp-sites
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- apiVersion: external-secrets.io/v1
kind: ExternalSecret
metadata:
@@ -256,11 +283,20 @@ argo-cd:
remoteRef:
key: argo-cd-git
property: sshPrivateKey
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: type
remoteRef:
key: argo-cd-git
property: type
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None
- secretKey: url
remoteRef:
key: argo-cd-git
property: url.db-operators
conversionStrategy: Default
decodingStrategy: None
metadataPolicy: None

View File

@@ -24,5 +24,5 @@ appVersion: "1.0"
dependencies:
- name: cert-manager
version: v1.19.2
version: v1.19.4
repository: https://charts.jetstack.io

View File

@@ -24,5 +24,5 @@ appVersion: "1.0"
dependencies:
- name: external-secrets
version: 1.1.1
version: 2.0.1
repository: https://charts.external-secrets.io

View File

@@ -24,5 +24,5 @@ appVersion: "1.0"
dependencies:
- name: kite
version: 0.7.5
version: 0.7.8
repository: https://zxh326.github.io/kite

View File

@@ -1,5 +1,7 @@
kite:
host: "https://weyma-kite.infra.dubyatp.xyz"
deploymentStrategy:
type: Recreate
secret:
create: false
existingSecret: kite-secret
@@ -16,3 +18,5 @@ kite:
paths:
- path: /
pathType: ImplementationSpecific
podAnnotations:
backup.velero.io/backup-volumes: kite-storage

View File

@@ -24,5 +24,5 @@ appVersion: "1.0"
dependencies:
- name: kubernetes-replicator
version: 2.12.2
version: 2.12.3
repository: https://helm.mittwald.de

View File

@@ -24,5 +24,5 @@ appVersion: "1.0"
dependencies:
- name: kube-prometheus-stack
version: 80.4.1
version: 82.4.3
repository: https://prometheus-community.github.io/helm-charts

View File

@@ -21,7 +21,7 @@ spec:
# versions running within the cluster. See tags available at https://hub.docker.com/r/ceph/ceph/tags/.
# If you want to be more precise, you can always use a timestamp tag such as quay.io/ceph/ceph:v19.2.1-20250202
# This tag might not contain a new Ceph version, just security fixes from the underlying operating system, which will reduce vulnerabilities
image: quay.io/ceph/ceph:v19.2.3-20250717
image: quay.io/ceph/ceph:v20.2.0-20251104
# Whether to allow unsupported versions of Ceph. Currently Reef and Squid are supported.
# Future versions such as Tentacle (v20) would require this to be set to `true`.
# Do not set to true in production.

View File

@@ -24,5 +24,5 @@ appVersion: "1.0"
dependencies:
- name: rook-ceph
version: v1.18.8
version: v1.19.2
repository: https://charts.rook.io/release

View File

@@ -497,61 +497,6 @@ spec:
oid: "1.3.6.1.4.1.50495.1.2.1.8.1"
severity: "critical"
type: "ceph_default"
- alert: "CephNodeNetworkPacketDrops"
annotations:
description: "Node {{ "{{" }} $labels.instance {{ "}}" }} experiences packet drop > 0.5% or > 10 packets/s on interface {{ "{{" }} $labels.device {{ "}}" }}."
summary: "One or more NICs reports packet drops"
expr: |
(
rate(node_network_receive_drop_total{device!="lo"}[1m]) +
rate(node_network_transmit_drop_total{device!="lo"}[1m])
) / (
rate(node_network_receive_packets_total{device!="lo"}[1m]) +
rate(node_network_transmit_packets_total{device!="lo"}[1m])
) >= 0.0050000000000000001 and (
rate(node_network_receive_drop_total{device!="lo"}[1m]) +
rate(node_network_transmit_drop_total{device!="lo"}[1m])
) >= 10
labels:
oid: "1.3.6.1.4.1.50495.1.2.1.8.2"
severity: "warning"
type: "ceph_default"
- alert: "CephNodeNetworkPacketErrors"
annotations:
description: "Node {{ "{{" }} $labels.instance {{ "}}" }} experiences packet errors > 0.01% or > 10 packets/s on interface {{ "{{" }} $labels.device {{ "}}" }}."
summary: "One or more NICs reports packet errors"
expr: |
(
rate(node_network_receive_errs_total{device!="lo"}[1m]) +
rate(node_network_transmit_errs_total{device!="lo"}[1m])
) / (
rate(node_network_receive_packets_total{device!="lo"}[1m]) +
rate(node_network_transmit_packets_total{device!="lo"}[1m])
) >= 0.0001 or (
rate(node_network_receive_errs_total{device!="lo"}[1m]) +
rate(node_network_transmit_errs_total{device!="lo"}[1m])
) >= 10
labels:
oid: "1.3.6.1.4.1.50495.1.2.1.8.3"
severity: "warning"
type: "ceph_default"
- alert: "CephNodeNetworkBondDegraded"
annotations:
description: "Bond {{ "{{" }} $labels.master {{ "}}" }} is degraded on Node {{ "{{" }} $labels.instance {{ "}}" }}."
summary: "Degraded Bond on Node {{ "{{" }} $labels.instance {{ "}}" }}"
expr: |
node_bonding_slaves - node_bonding_active != 0
labels:
severity: "warning"
type: "ceph_default"
- alert: "CephNodeInconsistentMTU"
annotations:
description: "Node {{ "{{" }} $labels.instance {{ "}}" }} has a different MTU size ({{ "{{" }} $value {{ "}}" }}) than the median of devices named {{ "{{" }} $labels.device {{ "}}" }}."
summary: "MTU settings across Ceph hosts are inconsistent"
expr: "node_network_mtu_bytes * (node_network_up{device!=\"lo\"} > 0) == scalar( max by (device) (node_network_mtu_bytes * (node_network_up{device!=\"lo\"} > 0)) != quantile by (device) (.5, node_network_mtu_bytes * (node_network_up{device!=\"lo\"} > 0)) )or node_network_mtu_bytes * (node_network_up{device!=\"lo\"} > 0) == scalar( min by (device) (node_network_mtu_bytes * (node_network_up{device!=\"lo\"} > 0)) != quantile by (device) (.5, node_network_mtu_bytes * (node_network_up{device!=\"lo\"} > 0)) )"
labels:
severity: "warning"
type: "ceph_default"
- name: "pools"
rules:
- alert: "CephPoolGrowthWarning"

View File

@@ -24,5 +24,5 @@ appVersion: "1.0"
dependencies:
- name: traefik
version: 37.4.0
version: 39.0.2
repository: https://traefik.github.io/charts

View File

@@ -4,18 +4,17 @@ traefik:
- --entryPoints.websecure.transport.respondingTimeouts.readTimeout=0
ports:
web:
redirections:
entryPoint:
to: websecure
scheme: https
permanent: true
http:
redirections:
entryPoint:
to: websecure
scheme: https
permanent: true
gitssh:
port: 2222
exposedPort: 22
expose:
default: true
tls:
passthrough: true
metrics:
prometheus:
service:
@@ -38,7 +37,7 @@ traefik:
kind: DaemonSet
additionalContainers:
- name: cloudflared
image: cloudflare/cloudflared:2025.11.1
image: cloudflare/cloudflared:2026.2.0
command:
- cloudflared
- tunnel
@@ -81,6 +80,19 @@ traefik:
traefik-real-ip:
excludednets:
- "1.1.1.1/24"
routers:
dispatcharr:
entryPoints:
- websecure
service: dispatcharr
tls:
options: default
rule: 'Host(`dispatcharr.dubyatp.xyz`) && PathPrefix(`/`)'
services:
dispatcharr:
loadBalancer:
servers:
- url: http://10.105.15.20:9191
service:
spec:
externalTrafficPolicy: Local
@@ -117,3 +129,26 @@ traefik:
data:
tls.crt: ""
tls.key: ""
- apiVersion: v1
kind: Service
metadata:
name: traefik-local
spec:
sessionAffinity: ClientIP
sessionAffinityConfig:
clientIP:
timeoutSeconds: 3600
selector:
app.kubernetes.io/name: traefik
app.kubernetes.io/instance: traefik-traefik
ports:
- name: gitssh
port: 22
targetPort: gitssh
- name: web
port: 80
targetPort: web
- name: websecure
port: 443
targetPort: websecure
type: ClusterIP

View File

@@ -24,5 +24,5 @@ appVersion: "1.0"
dependencies:
- name: velero
version: 11.2.0
version: 11.4.0
repository: https://vmware-tanzu.github.io/helm-charts

View File

@@ -59,7 +59,7 @@ velero:
insecureSkipTLSVerify: "true"
initContainers:
- name: velero-plugin-for-aws
image: velero/velero-plugin-for-aws:v1.13.1
image: velero/velero-plugin-for-aws:v1.13.2
imagePullPolicy: IfNotPresent
volumeMounts:
- mountPath: /target