Fork 0

362 lines
12 KiB
Raw Normal View History

2019-01-13 21:06:33 +00:00
# Top level cluster configuration.
local kube = import "../../kube/kube.libsonnet";
local policies = import "../../kube/policies.libsonnet";
2019-06-20 22:24:09 +00:00
local calico = import "lib/calico.libsonnet";
2019-06-20 22:24:09 +00:00
local certmanager = import "lib/cert-manager.libsonnet";
local cockroachdb = import "lib/cockroachdb.libsonnet";
local coredns = import "lib/coredns.libsonnet";
2019-01-18 08:40:59 +00:00
local metallb = import "lib/metallb.libsonnet";
2019-06-20 22:24:09 +00:00
local metrics = import "lib/metrics.libsonnet";
local nginx = import "lib/nginx.libsonnet";
local prodvider = import "lib/prodvider.libsonnet";
local registry = import "lib/registry.libsonnet";
2019-04-01 16:40:50 +00:00
local rook = import "lib/rook.libsonnet";
local pki = import "lib/pki.libsonnet";
2019-01-13 21:06:33 +00:00
local Cluster(short, realm) = {
2019-01-13 21:06:33 +00:00
local cluster = self,
local cfg = cluster.cfg,
short:: short,
realm:: realm,
fqdn:: "%s.%s" % [cluster.short, cluster.realm],
cfg:: {
// Storage class used for internal services (like registry). This must
// be set to a valid storage class. This can either be a cloud provider class
// (when running on GKE &co) or a storage class created using rook.
storageClassNameRedundant: error "storageClassNameRedundant must be set",
2019-01-13 21:06:33 +00:00
// These are required to let the API Server contact kubelets.
crAPIServerToKubelet: kube.ClusterRole("system:kube-apiserver-to-kubelet") {
metadata+: {
annotations+: {
"rbac.authorization.kubernetes.io/autoupdate": "true",
labels+: {
"kubernetes.io/bootstrapping": "rbac-defaults",
2019-01-13 21:06:33 +00:00
rules: [
apiGroups: [""],
resources: ["nodes/%s" % r for r in [ "proxy", "stats", "log", "spec", "metrics" ]],
verbs: ["*"],
2019-01-13 21:08:05 +00:00
crbAPIServer: kube.ClusterRoleBinding("system:kube-apiserver") {
2019-01-13 21:06:33 +00:00
roleRef: {
apiGroup: "rbac.authorization.k8s.io",
kind: "ClusterRole",
name: cluster.crAPIServerToKubelet.metadata.name,
subjects: [
apiGroup: "rbac.authorization.k8s.io",
kind: "User",
# A cluster API Server authenticates with a certificate whose CN is equal to the FQDN of the cluster.
name: cluster.fqdn,
2019-01-13 21:06:33 +00:00
2019-01-13 23:02:59 +00:00
// This ClusterRole is bound to all humans that log in via prodaccess/prodvider/SSO.
// It should allow viewing of non-sensitive data for debuggability and openness.
crViewer: kube.ClusterRole("system:viewer") {
rules: [
apiGroups: [""],
resources: [
verbs: ["list"],
apiGroups: ["metrics.k8s.io"],
resources: [
verbs: ["list"],
apiGroups: ["apps"],
resources: [
verbs: ["list"],
apiGroups: ["extensions"],
resources: [
verbs: ["list"],
// This ClusterRole is applied (scoped to personal namespace) to all humans.
crFullInNamespace: kube.ClusterRole("system:admin-namespace") {
rules: [
apiGroups: ["*"],
resources: ["*"],
verbs: ["*"],
// This ClusterRoleBinding grants root access to cluster admins.
crbAdmins: kube.ClusterRoleBinding("system:admins") {
roleRef: {
apiGroup: "rbac.authorization.k8s.io",
kind: "ClusterRole",
name: "cluster-admin",
subjects: [
apiGroup: "rbac.authorization.k8s.io",
kind: "User",
name: user + "@hackerspace.pl",
} for user in [
podSecurityPolicies: policies.Cluster {},
allowInsecureNamespaces: [
# TODO(q3k): fix this?
// Allow all service accounts (thus all controllers) to create secure pods.
crbAllowServiceAccountsSecure: kube.ClusterRoleBinding("policy:allow-all-secure") {
roleRef_: cluster.podSecurityPolicies.secureRole,
subjects: [
kind: "Group",
apiGroup: "rbac.authorization.k8s.io",
name: "system:serviceaccounts",
// Calico network fabric
calico: calico.Environment {},
2019-01-13 23:02:59 +00:00
// CoreDNS for this cluster.
dns: coredns.Environment {
cfg+: {
cluster_domains: [
// Metrics Server
metrics: metrics.Environment {},
2019-01-18 08:40:59 +00:00
// Metal Load Balancer
metallb: metallb.Environment {
cfg+: {
addressPools: [
{ name: "public-v4-1", protocol: "layer2", addresses: [""] },
// Main nginx Ingress Controller
nginx: nginx.Environment {},
certmanager: certmanager.Environment {},
issuer: kube.ClusterIssuer("letsencrypt-prod") {
spec: {
acme: {
server: "https://acme-v02.api.letsencrypt.org/directory",
email: "bofh@hackerspace.pl",
privateKeySecretRef: {
name: "letsencrypt-prod"
http01: {},
2019-04-01 22:06:13 +00:00
2019-04-01 16:40:50 +00:00
// Rook Ceph storage
rook: rook.Operator {
operator+: {
spec+: {
// TODO(q3k): Bring up the operator again when stability gets fixed
// See: https://github.com/rook/rook/issues/3059#issuecomment-492378873
replicas: 1,
// Docker registry
registry: registry.Environment {
cfg+: {
// Registry hostname, built from the cluster FQDN ("registry.<short>.<realm>").
domain: "registry.%s" % [cluster.fqdn],
// NOTE(review): this reads cfg.storageClassNameParanoid, but the cluster cfg
// above only declares storageClassNameRedundant as a required field, while k0
// sets storageClassNameParanoid. The required-field declaration and its
// consumer appear to disagree on the key name - confirm which one is intended.
storageClassName: cfg.storageClassNameParanoid,
// Presumably refers to the S3 object store of the same name declared under
// k0.ceph (objectRedundant) - verify the two stay in sync.
objectStorageName: "waw-hdd-redundant-2-object",
// TLS PKI machinery
pki: pki.Environment(cluster.short, cluster.realm),
// Prodvider
prodvider: prodvider.Environment {
cfg+: {
apiEndpoint: "kubernetes.default.svc.%s" % [cluster.fqdn],
2019-06-20 22:24:09 +00:00
k0: {
local k0 = self,
cluster: Cluster("k0", "hswaw.net") {
cfg+: {
storageClassNameParanoid: k0.ceph.blockParanoid.name,
2019-06-20 22:24:09 +00:00
cockroach: {
waw2: cockroachdb.Cluster("crdb-waw1") {
2019-06-20 22:24:09 +00:00
cfg+: {
topology: [
{ name: "bc01n01", node: "bc01n01.hswaw.net" },
{ name: "bc01n02", node: "bc01n02.hswaw.net" },
{ name: "bc01n03", node: "bc01n03.hswaw.net" },
2019-06-20 22:24:09 +00:00
hostPath: "/var/db/crdb-waw1",
2019-04-01 22:06:13 +00:00
clients: {
cccampix: k0.cockroach.waw2.Client("cccampix"),
cccampixDev: k0.cockroach.waw2.Client("cccampix-dev"),
2019-04-01 22:06:13 +00:00
2019-06-20 22:24:09 +00:00
ceph: {
// waw1 cluster - dead as of 2019/08/06, data corruption
// waw2 cluster
waw2: rook.Cluster(k0.cluster.rook, "ceph-waw2") {
2019-06-20 22:24:09 +00:00
spec: {
mon: {
count: 3,
allowMultiplePerNode: false,
storage: {
useAllNodes: false,
useAllDevices: false,
config: {
databaseSizeMB: "1024",
journalSizeMB: "1024",
nodes: [
name: "bc01n01.hswaw.net",
location: "rack=dcr01 chassis=bc01 host=bc01n01",
devices: [ { name: "sda" } ],
name: "bc01n02.hswaw.net",
location: "rack=dcr01 chassis=bc01 host=bc01n02",
devices: [ { name: "sda" } ],
name: "bc01n03.hswaw.net",
location: "rack=dcr01 chassis=bc01 host=bc01n03",
devices: [ { name: "sda" } ],
benji:: {
metadataStorageClass: "waw-hdd-paranoid-2",
encryptionPassword: std.split((importstr "../secrets/plain/k0-benji-encryption-password"), '\n')[0],
pools: [
s3Configuration: {
awsSecretAccessKey: std.split((importstr "../secrets/plain/k0-benji-secret-access-key"), '\n')[0],
bucketName: "benji-k0-backups",
endpointUrl: "https://s3.eu-central-1.wasabisys.com/",
2019-06-20 22:24:09 +00:00
2019-06-20 22:24:09 +00:00
// redundant block storage
blockRedundant: rook.ECBlockPool(k0.ceph.waw2, "waw-hdd-redundant-2") {
2019-06-20 22:24:09 +00:00
spec: {
failureDomain: "host",
erasureCoded: {
dataChunks: 2,
codingChunks: 1,
// paranoid block storage (3 replicas)
blockParanoid: rook.ReplicatedBlockPool(k0.ceph.waw2, "waw-hdd-paranoid-2") {
spec: {
failureDomain: "host",
replicated: {
size: 3,
2019-06-20 22:24:09 +00:00
// yolo block storage (no replicas!)
blockYolo: rook.ReplicatedBlockPool(k0.ceph.waw2, "waw-hdd-yolo-2") {
2019-06-20 22:24:09 +00:00
spec: {
failureDomain: "host",
replicated: {
size: 1,
2019-04-07 16:49:41 +00:00
objectRedundant: rook.S3ObjectStore(k0.ceph.waw2, "waw-hdd-redundant-2-object") {
2019-06-20 22:24:09 +00:00
spec: {
metadataPool: {
failureDomain: "host",
replicated: { size: 3 },
dataPool: {
failureDomain: "host",
erasureCoded: {
dataChunks: 2,
codingChunks: 1,
2019-04-07 16:49:41 +00:00
# Used for owncloud.hackerspace.pl, which for now lives on boston-packets.hackerspace.pl.
nextcloud: kube._Object("ceph.rook.io/v1", "CephObjectStoreUser", "nextcloud") {
metadata+: {
namespace: "ceph-waw2",
spec: {
store: "waw-hdd-redundant-2-object",
displayName: "nextcloud",
2019-04-07 16:49:41 +00:00
2019-01-13 21:06:33 +00:00