blob: 2249daebfaab8d1a66938aabd838a585b188a14c [file] [log] [blame]
Sergiusz Bazanskidbfa9882020-06-06 01:21:45 +02001// k0.hswaw.net kubernetes cluster
2// This defines the cluster as a single object.
3// Use the sibling k0*.jsonnet 'view' files to actually apply the configuration.
4
5local kube = import "../../kube/kube.libsonnet";
6local policies = import "../../kube/policies.libsonnet";
7
8local cluster = import "cluster.libsonnet";
9
Serge Bazanski3c5d8362021-02-06 17:27:02 +000010local admitomatic = import "lib/admitomatic.libsonnet";
Sergiusz Bazanskidbfa9882020-06-06 01:21:45 +020011local cockroachdb = import "lib/cockroachdb.libsonnet";
12local registry = import "lib/registry.libsonnet";
13local rook = import "lib/rook.libsonnet";
14
15{
16 k0: {
17 local k0 = self,
cluster: cluster.Cluster("k0", "hswaw.net") {
    // Point the 'paranoid' storage class name at the waw3 blockRedundant pool.
    cfg+: { storageClassNameParanoid: k0.ceph.waw3Pools.blockRedundant.name },

    metallb+: {
        cfg+: {
            // Builds one BGP-protocol address pool entry.
            local bgpPool(poolName, cidrs) = {
                name: poolName,
                protocol: "bgp",
                addresses: cidrs,
            },

            // Peer with calico running on same node.
            peers: [
                { "my-asn": 65002, "peer-asn": 65003, "peer-address": "127.0.0.1" },
            ],

            // Public IP address pools. Keep in sync with k0.calico.yaml.
            addressPools: [
                bgpPool("public-v4-1", ["185.236.240.48/28"]),
                bgpPool("public-v4-2", ["185.236.240.112/28"]),
            ],
        },
    },
},
52
53 // Docker registry
registry: registry.Environment {
    cfg+: {
        // Served under the cluster's FQDN as registry.<fqdn>.
        domain: std.format("registry.%s", [k0.cluster.fqdn]),
        // Object storage backing the registry; the name matches the
        // waw3 S3 object store declared under k0.ceph.waw3Pools.
        objectStorageName: "waw-hdd-redundant-3-object",
        // Block storage uses the cluster-wide 'paranoid' storage class.
        storageClassName: k0.cluster.cfg.storageClassNameParanoid,
    },
},
61
// CockroachDB, running on bc01n{01,02} and dcr01s22.
cockroach: {
    // Shorthand for the (only) CockroachDB cluster; clients are minted from it.
    local crdb = k0.cockroach.waw2,

    // NOTE(review): the field is called waw2 but the cluster itself is
    // named crdb-waw1 - presumably historical; confirm before renaming
    // either one.
    waw2: cockroachdb.Cluster("crdb-waw1") {
        cfg+: {
            // One entry per node; the node FQDN is the short name under hswaw.net.
            topology: [
                { name: host, node: host + ".hswaw.net" }
                for host in ["bc01n01", "bc01n02", "dcr01s22"]
            ],
            // Host path on SSD.
            hostPath: "/var/db/crdb-waw1",
            extraDNS: ["crdb-waw1.hswaw.net"],
        },
    },

    // Per-application database clients.
    clients: {
        cccampix: crdb.Client("cccampix"),
        cccampixDev: crdb.Client("cccampix-dev"),
        buglessDev: crdb.Client("bugless-dev"),
        sso: crdb.Client("sso"),
        herpDev: crdb.Client("herp-dev"),
        gitea: crdb.Client("gitea"),
        issues: crdb.Client("issues"),
        dns: crdb.Client("dns"),
    },
},
89
90 ceph: {
91 // waw1 cluster - dead as of 2019/08/06, data corruption
Serge Bazanski61f978a2021-01-22 16:26:07 +010092 // waw2 cluster - dead as of 2021/01/22, torn down (horrible M610 RAID controllers are horrible)
Sergiusz Bazanskidbfa9882020-06-06 01:21:45 +020093
// waw3: 6TB SAS 3.5" HDDs, internal Rook cluster.
//
// Suffers from rook going apeshit and nuking all mons: if enough of
// the control plane is up for rook to run, but nodes are unavailable
// to the point of it deciding that no mon exists, it creates some
// new ones, fully nuking the monmap and making recovery a pain.
//
// Supposedly new versions of Rook slowly fix these issues, but q3k
// doesn't personally trust this codebase anymore. He'd rather
// manage the actual Ceph cluster himself; we don't need all of this
// magic.
//
// See: b.hswaw.net/6
waw3: rook.Cluster(k0.cluster.rook, "ceph-waw3") {
    // Turns a list of WWN suffixes into Rook device entries addressed
    // by their stable /dev/disk/by-id path.
    local wwnDevices(wwns) = [
        { name: "/dev/disk/by-id/wwn-0x" + wwn }
        for wwn in wwns
    ],
    // Returns the text up to the first newline (secret files are read
    // whole via importstr).
    local firstLine(text) = std.split(text, '\n')[0],

    spec: {
        mon: { count: 1, allowMultiplePerNode: false },

        resources: {
            osd: {
                requests: { cpu: "2", memory: "6G" },
                limits: { cpu: "2", memory: "8G" },
            },
        },

        storage: {
            // Only the nodes and devices listed explicitly below are used.
            useAllNodes: false,
            useAllDevices: false,
            config: {
                databaseSizeMB: "1024",
                journalSizeMB: "1024",
            },

            nodes: [
                {
                    name: "dcr01s22.hswaw.net",
                    devices: wwnDevices([
                        "5000c5008508c433",
                        "5000c500850989cf",
                        "5000c5008508f843",
                        "5000c5008508baf7",
                    ]),
                },
                {
                    name: "dcr01s24.hswaw.net",
                    devices: wwnDevices([
                        "5000c5008508ee03",
                        "5000c5008508c9ef",
                        "5000c5008508df33",
                        "5000c5008508dd3b",
                    ]),
                },
            ],
        },

        // Benji backup settings. Hidden field (::), so it is not
        // manifested as part of spec itself.
        benji:: {
            metadataStorageClass: "waw-hdd-redundant-3",
            encryptionPassword: firstLine(importstr "../secrets/plain/k0-benji-encryption-password"),
            pools: [
                "waw-hdd-redundant-3",
                "waw-hdd-redundant-3-metadata",
                "waw-hdd-yolo-3",
            ],
            s3Configuration: {
                awsAccessKeyId: "RPYZIROFXNLQVU2WJ4R3",
                awsSecretAccessKey: firstLine(importstr "../secrets/plain/k0-benji-secret-access-key"),
                bucketName: "benji-k0-backups-waw3",
                endpointUrl: "https://s3.eu-central-1.wasabisys.com/",
            },
        },
    },
},
waw3Pools: {
    // Pool layout shared by every host-redundant pool below: two
    // replicas, spread across hosts.
    local hostReplicated2 = {
        failureDomain: "host",
        replicated: { size: 2 },
    },

    // NOTE(review): blockRedundant/q3kRedundant use rook.ECBlockPool
    // with a `replicated` spec, while blockYolo uses
    // rook.ReplicatedBlockPool with an `erasureCoded` spec. The
    // constructor names look swapped relative to the specs - confirm
    // against lib/rook.libsonnet before touching, as changing the
    // layout of a live pool is destructive.

    // redundant block storage
    blockRedundant: rook.ECBlockPool(k0.ceph.waw3, "waw-hdd-redundant-3") {
        metadataReplicas: 2,
        spec: hostReplicated2,
    },

    // yolo block storage (low usage, no host redundancy)
    blockYolo: rook.ReplicatedBlockPool(k0.ceph.waw3, "waw-hdd-yolo-3") {
        spec: {
            failureDomain: "osd",
            erasureCoded: { dataChunks: 2, codingChunks: 1 },
        },
    },

    // q3k's personal pool, used externally from k8s.
    q3kRedundant: rook.ECBlockPool(k0.ceph.waw3, "waw-hdd-redundant-q3k-3") {
        metadataReplicas: 2,
        spec: hostReplicated2,
    },

    // S3 object store; both its metadata and data pools are host-redundant.
    objectRedundant: rook.S3ObjectStore(k0.ceph.waw3, "waw-hdd-redundant-3-object") {
        spec: {
            metadataPool: hostReplicated2,
            dataPool: hostReplicated2,
        },
    },
},
223
224 // Clients for S3/radosgw storage.
clients: {
    // Declares one radosgw user in the ceph-waw3 namespace on the
    // waw-hdd-redundant-3-object store. The display name is always the
    // same as the user name.
    local objectUser(userName) = kube.CephObjectStoreUser(userName) {
        metadata+: { namespace: "ceph-waw3" },
        spec: {
            store: "waw-hdd-redundant-3-object",
            displayName: userName,
        },
    },

    # Used for owncloud.hackerspace.pl, which for now lives on boston-packets.hackerspace.pl.
    nextcloudWaw3: objectUser("nextcloud"),

    # issues.hackerspace.pl (redmine) attachments bucket
    issuesWaw3: objectUser("issues"),

    # nuke@hackerspace.pl's personal storage.
    nukePersonalWaw3: objectUser("nuke-personal"),

    # patryk@hackerspace.pl's ArmA3 mod bucket.
    cz2ArmaModsWaw3: objectUser("cz2-arma3mods"),

    # Buckets for spark pipelines
    # TODO(implr): consider a second yolo-backed one for temp data
    implrSparkWaw3: objectUser("implr-spark"),

    # q3k's personal user
    q3kWaw3: objectUser("q3k"),

    # woju's personal user
    wojuWaw3: objectUser("woju"),

    # cz3's (patryk@hackerspace.pl) personal user
    cz3Waw3: objectUser("cz3"),
},
310 },
311
312
313 # These are policies allowing for Insecure pods in some namespaces.
314 # A lot of them are spurious and come from the fact that we deployed
315 # these namespaces before we deployed the draconian PodSecurityPolicy
316 # we have now. This should be fixed by setting up some more granular
317 # policies, or fixing the workloads to not need some of the permission
318 # bits they use, whatever those might be.
319 # TODO(q3k): fix this?
unnecessarilyInsecureNamespaces: [
    // One insecure-pods allowance per namespace, in the order listed.
    policies.AllowNamespaceInsecure(ns)
    for ns in [
        "ceph-waw3",
        "matrix",
        "registry",
        "internet",
        # TODO(implr): restricted policy with CAP_NET_ADMIN and tuntap, but no full root
        "implr-vpn",
    ]
],
Serge Bazanski3c5d8362021-02-06 17:27:02 +0000328
329 # Admission controller that permits non-privileged users to manage
330 # their namespaces without danger of hijacking important URLs.
admitomatic: admitomatic.Environment {
    cfg+: {
        // Builds one allow_domain entry: `host` may be used by
        // ingresses in namespace `ns`.
        local allow(ns, host) = { namespace: ns, dns: host },

        proto: {
            // Domains allowed in given namespaces. If a domain exists
            // anywhere, ingresses will only be permitted to be created
            // within namespaces in which it appears here. This works
            // the same way for wildcards, if a wildcard exists in this
            // list it blocks all unauthorized uses of that domain
            // elsewhere.
            //
            // See //cluster/admitomatic for more information.
            //
            // Or, tl;dr:
            //
            // If you do a wildcard CNAME onto the k0 ingress, you
            // should explicitly state *.your.name.com here.
            //
            // If you just want to protect your host from being
            // hijacked by other cluster users, you should also state
            // it here (either as a wildcard, or unary domains).
            allow_domain: [
                allow("covid-formity", "covid19.hackerspace.pl"),
                allow("covid-formity", "covid.hackerspace.pl"),
                allow("covid-formity", "www.covid.hackerspace.pl"),
                allow("devtools-prod", "hackdoc.hackerspace.pl"),
                allow("devtools-prod", "cs.hackerspace.pl"),
                allow("engelsystem-prod", "engelsystem.hackerspace.pl"),
                allow("gerrit", "gerrit.hackerspace.pl"),
                allow("gitea-prod", "gitea.hackerspace.pl"),
                allow("hswaw-prod", "*.hackerspace.pl"),
                allow("hswaw-prod", "*.hswaw.net"),
                allow("internet", "internet.hackerspace.pl"),
                allow("matrix", "matrix.hackerspace.pl"),
                allow("onlyoffice-prod", "office.hackerspace.pl"),
                allow("redmine", "issues.hackerspace.pl"),
                allow("redmine", "b.hackerspace.pl"),
                allow("redmine", "b.hswaw.net"),
                allow("redmine", "xn--137h.hackerspace.pl"),
                allow("redmine", "xn--137h.hswaw.net"),
                allow("speedtest", "speedtest.hackerspace.pl"),
                allow("sso", "sso.hackerspace.pl"),

                allow("ceph-waw3", "ceph-waw3.hswaw.net"),
                allow("ceph-waw3", "object.ceph-waw3.hswaw.net"),
                allow("monitoring-global-k0", "*.hswaw.net"),
                allow("registry", "*.hswaw.net"),

                // q3k's legacy namespace (pre-prodvider)
                allow("q3k", "*.q3k.org"),
                allow("personal-q3k", "*.q3k.org"),
            ],
        },
    },
},
Sergiusz Bazanskidbfa9882020-06-06 01:21:45 +0200385 },
386}