Skip to content

Commit d974095

Browse files
authored
Merge pull request #831 from lsst-it/IT-6035_reprovision_kueyen_rke2
(cluster/kueyen) Move Kueyen to RKE2 folder.
2 parents b36583e + 10d8e39 commit d974095

Some content is hidden

Large Commits have some content hidden by default. Use the searchbox below for content that may be hidden.

47 files changed

+424
-95
lines changed

fleet/lib/kube-prometheus-stack-pre/fleet.yaml

Lines changed: 1 addition & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -31,6 +31,7 @@ targetCustomizations:
3131
values:
3232
- pillan
3333
- ruka
34+
- kueyen
3435
yaml:
3536
overlays:
3637
- prod

fleet/lib/kube-prometheus-stack/aggregator/values.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -100,7 +100,7 @@ grafana:
100100
name: $__file{/etc/secrets/keycloak-credentials/url}
101101
role_attribute_path: contains(groups[*], 'grafana-admin') && 'GrafanaAdmin' || contains(groups[*], 'grafana-admin') && 'Admin' || contains(groups[*], 'grafana-editor') && 'Editor' || 'Viewer'
102102
scopes: openid profile email groups roles offline_access
103-
token_url: https://keycloak.ls.lsst.org/realms/master/protocol/openid-connect/token
103+
token_url: $__file{/etc/secrets/keycloak-credentials/url}/realms/master/protocol/openid-connect/token
104104
use_refresh_token: true
105105
ingress:
106106
enabled: true

fleet/lib/kube-prometheus-stack/fleet.yaml

Lines changed: 13 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -43,6 +43,19 @@ diff:
4343
jsonPointers:
4444
- /spec/automountServiceAccountToken
4545
targetCustomizations:
46+
- name: kueyen
47+
clusterSelector:
48+
matchExpressions:
49+
- key: management.cattle.io/cluster-display-name
50+
operator: In
51+
values:
52+
- kueyen
53+
helm:
54+
valuesFiles:
55+
- pvc/values.yaml
56+
- aggregator/values.yaml
57+
- ldap/values.yaml
58+
- overlays/kueyen/values.yaml
4659
- name: pillan
4760
clusterSelector:
4861
matchExpressions:
Lines changed: 179 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,179 @@
1+
---
2+
prometheus:
3+
prometheusSpec:
4+
configMaps:
5+
- sd-snmp-network
6+
- sd-snmp-power
7+
- sd-snmp-raritan-pdu
8+
secrets:
9+
- puppetdb
10+
additionalScrapeConfigs:
11+
- job_name: blackbox-ping-dev
12+
metrics_path: /probe
13+
params:
14+
module: [icmp]
15+
puppetdb_sd_configs:
16+
- url: https://puppetdb.${ .ClusterLabels.site }.lsst.org:8443
17+
basic_auth:
18+
username: svc_prometheus
19+
password_file: /etc/prometheus/secrets/puppetdb/password
20+
query: resources { type = "Class" and title = "Prometheus::Node_exporter" }
21+
refresh_interval: 30s
22+
follow_redirects: true
23+
include_parameters: true
24+
enable_http2: true
25+
relabel_configs:
26+
- source_labels: [__meta_puppetdb_certname]
27+
target_label: __param_target
28+
- source_labels: [__param_target]
29+
target_label: instance
30+
- target_label: __address__
31+
replacement: prometheus-blackbox-exporter.blackbox-exporter:9115
32+
- job_name: node-exporter-dev
33+
puppetdb_sd_configs:
34+
- url: https://puppetdb.${ .ClusterLabels.site }.lsst.org:8443
35+
basic_auth:
36+
username: svc_prometheus
37+
password_file: /etc/prometheus/secrets/puppetdb/password
38+
query: |
39+
resources {
40+
type = "Class" and title = "Profile::Core::Node_info" and
41+
certname in resources[certname] {
42+
type = "Class" and title = "Prometheus::Node_exporter"
43+
}
44+
}
45+
refresh_interval: 30s
46+
follow_redirects: true
47+
include_parameters: true
48+
enable_http2: true
49+
port: 9100
50+
relabel_configs:
51+
- source_labels: [__meta_puppetdb_certname]
52+
target_label: instance
53+
- source_labels: [__meta_puppetdb_environment]
54+
target_label: environment
55+
- source_labels: [__meta_puppetdb_parameter_site]
56+
target_label: site
57+
- source_labels: [__meta_puppetdb_parameter_role]
58+
target_label: role
59+
- source_labels: [__meta_puppetdb_parameter_cluster]
60+
target_label: cluster
61+
- job_name: blackbox-ping-ls
62+
puppetdb_sd_configs:
63+
- url: https://puppetdb.ls.lsst.org:8443
64+
basic_auth:
65+
username: svc_prometheus
66+
password_file: /etc/prometheus/secrets/puppetdb/password
67+
query: resources { type = "Class" and title = "Prometheus::Node_exporter" }
68+
refresh_interval: 30s
69+
follow_redirects: true
70+
include_parameters: true
71+
enable_http2: true
72+
relabel_configs:
73+
- source_labels: [__meta_puppetdb_certname]
74+
target_label: __param_target
75+
- source_labels: [__param_target]
76+
target_label: instance
77+
- target_label: __address__
78+
replacement: prometheus-blackbox-exporter.blackbox-exporter:9115
79+
- job_name: node-exporter-ls
80+
puppetdb_sd_configs:
81+
- url: https://puppetdb.ls.lsst.org:8443
82+
basic_auth:
83+
username: svc_prometheus
84+
password_file: /etc/prometheus/secrets/puppetdb/password
85+
query: |
86+
resources {
87+
type = "Class" and title = "Profile::Core::Node_info" and
88+
certname in resources[certname] {
89+
type = "Class" and title = "Prometheus::Node_exporter"
90+
}
91+
}
92+
refresh_interval: 30s
93+
follow_redirects: true
94+
include_parameters: true
95+
enable_http2: true
96+
port: 9100
97+
relabel_configs:
98+
- source_labels: [__meta_puppetdb_certname]
99+
target_label: instance
100+
- source_labels: [__meta_puppetdb_environment]
101+
target_label: environment
102+
- source_labels: [__meta_puppetdb_parameter_site]
103+
target_label: site
104+
- source_labels: [__meta_puppetdb_parameter_role]
105+
target_label: role
106+
- source_labels: [__meta_puppetdb_parameter_cluster]
107+
target_label: cluster
108+
- job_name: snmp-network
109+
metrics_path: /snmp
110+
params:
111+
module: [if_mib]
112+
auth: [rubin_v2]
113+
file_sd_configs:
114+
- files:
115+
- /etc/prometheus/configmaps/sd-snmp-network/snmp-network.json
116+
relabel_configs:
117+
- source_labels: [__address__]
118+
target_label: __param_target
119+
- source_labels: [__meta_hostname]
120+
target_label: instance
121+
- source_labels: [__meta_network_function]
122+
target_label: network_function
123+
- target_label: __address__
124+
replacement: prometheus-snmp-exporter.snmp-exporter:9116
125+
- job_name: blackbox-network
126+
metrics_path: /probe
127+
params:
128+
module: [icmp]
129+
file_sd_configs:
130+
- files:
131+
- /etc/prometheus/configmaps/sd-snmp-network/snmp-network.json
132+
- /etc/prometheus/configmaps/sd-snmp-power/snmp-power.json
133+
- /etc/prometheus/configmaps/sd-snmp-raritan-pdu/snmp-raritan-pdu.json
134+
relabel_configs:
135+
- source_labels: [__address__]
136+
target_label: __param_target
137+
- source_labels: [__meta_hostname]
138+
target_label: instance
139+
- source_labels: [__meta_network_function]
140+
target_label: network_function
141+
- target_label: __address__
142+
replacement: prometheus-blackbox-exporter.blackbox-exporter:9115
143+
- job_name: snmp-power
144+
metrics_path: /snmp
145+
file_sd_configs:
146+
- files:
147+
- /etc/prometheus/configmaps/sd-snmp-power/snmp-power.json
148+
relabel_configs:
149+
- source_labels: [__address__]
150+
target_label: __param_target
151+
- source_labels: [__meta_hostname]
152+
target_label: instance
153+
- source_labels: [__meta_auth]
154+
target_label: __param_auth
155+
- source_labels: [__meta_module]
156+
target_label: __param_module
157+
- target_label: __address__
158+
replacement: prometheus-snmp-exporter.snmp-exporter:9116
159+
- job_name: snmp-raritan-pdu
160+
metrics_path: /snmp
161+
params:
162+
module: [raritan]
163+
auth: [rubin_v2]
164+
file_sd_configs:
165+
- files:
166+
- /etc/prometheus/configmaps/sd-snmp-raritan-pdu/snmp-raritan-pdu.json
167+
relabel_configs:
168+
- source_labels: [__address__]
169+
target_label: __param_target
170+
- source_labels: [__meta_hostname]
171+
target_label: instance
172+
173+
grafana:
174+
grafana.ini:
175+
auth.generic_oauth:
176+
api_url: https://keycloak.ls.lsst.org/realms/master/protocol/openid-connect/userinfo
177+
auth_url: https://keycloak.ls.lsst.org/realms/master/protocol/openid-connect/auth
178+
name: keycloak.ls.lsst.org
179+
token_url: https://keycloak.ls.lsst.org/realms/master/protocol/openid-connect/token

fleet/lib/mimir-pre/fleet.yaml

Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -49,3 +49,13 @@ targetCustomizations:
4949
yaml:
5050
overlays:
5151
- antu
52+
- name: kueyen
53+
clusterSelector:
54+
matchExpressions:
55+
- key: management.cattle.io/cluster-display-name
56+
operator: In
57+
values:
58+
- kueyen
59+
yaml:
60+
overlays:
61+
- kueyen
Lines changed: 18 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,18 @@
1+
---
2+
apiVersion: external-secrets.io/v1beta1
3+
kind: ExternalSecret
4+
metadata:
5+
name: mimir-s3
6+
spec:
7+
secretStoreRef:
8+
kind: ClusterSecretStore
9+
name: onepassword
10+
data:
11+
- secretKey: AWS_ACCESS_KEY_ID
12+
remoteRef:
13+
key: &item mimir
14+
property: AWS_ACCESS_KEY_ID
15+
- secretKey: AWS_SECRET_ACCESS_KEY
16+
remoteRef:
17+
key: *item
18+
property: AWS_SECRET_ACCESS_KEY

fleet/lib/mimir/fleet.yaml

Lines changed: 11 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -32,6 +32,17 @@ targetCustomizations:
3232
helm:
3333
valuesFiles:
3434
- overlays/ayekan/values.yaml
35+
- name: kueyen
36+
clusterSelector:
37+
matchExpressions:
38+
- key: management.cattle.io/cluster-display-name
39+
operator: In
40+
values:
41+
- kueyen
42+
helm:
43+
valuesFiles:
44+
- overlays/kueyen/values.yaml
45+
- overlays/rke2/values.yaml
3546
- name: rke2
3647
clusterSelector:
3748
matchExpressions:
Lines changed: 10 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,10 @@
1+
---
2+
mimir:
3+
structuredConfig:
4+
common:
5+
storage:
6+
s3:
7+
region: o11y
8+
endpoint: s3.o11y.kueyen.dev.lsst.org
9+
limits:
10+
compactor_blocks_retention_period: 90d

fleet/lib/rook-ceph-cluster/overlays/kueyen/values.yaml

Lines changed: 16 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -6,27 +6,37 @@ cephClusterSpec:
66
useAllNodes: false
77
useAllDevices: false
88
config:
9-
osdsPerDevice: "4"
9+
osdsPerDevice: "1"
1010
nodes:
1111
- name: kueyen01
1212
devices:
13-
- name: /dev/nvme0n1
13+
- name: /dev/disk/by-id/scsi-35000c500a15cf937
1414
- name: kueyen02
1515
devices:
16-
- name: /dev/nvme0n1
16+
- name: /dev/disk/by-id/scsi-35000c500a15847b7
1717
- name: kueyen03
1818
devices:
19-
- name: /dev/nvme0n1
19+
- name: /dev/disk/by-id/scsi-35000c500a15ca7af
20+
- name: kueyen04
21+
devices:
22+
- name: /dev/disk/by-id/scsi-35000c500a15ce4d3
23+
- name: /dev/disk/by-id/scsi-35000c500a1588b9b
24+
- name: kueyen05
25+
devices:
26+
- name: /dev/disk/by-id/scsi-35000c500a157854b
27+
- name: kueyen06
28+
devices:
29+
- name: /dev/disk/by-id/scsi-35000c500a1584f37
2030

2131
cephBlockPools:
2232
- name: replicapool
2333
spec:
2434
failureDomain: host
2535
replicated:
26-
size: 3
36+
size: 2
2737
requireSafeReplicaSize: true
2838
quotas:
29-
maxSize: 1.5Ti
39+
maxSize: 2Ti
3040
enableRBDStats: true
3141
storageClass:
3242
name: rook-ceph-block

fleet/lib/rook-ceph-conf/charts/kueyen/templates/cephobjectstore-lfa.yaml renamed to fleet/lib/rook-ceph-conf/charts/kueyen/templates/cephobjectstore-o11y.yaml

Lines changed: 15 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -2,7 +2,7 @@
22
apiVersion: ceph.rook.io/v1
33
kind: CephObjectStore
44
metadata:
5-
name: lfa
5+
name: o11y
66
namespace: rook-ceph
77
spec:
88
metadataPool:
@@ -17,36 +17,43 @@ spec:
1717
dataChunks: 2
1818
codingChunks: 1
1919
quotas:
20-
maxSize: 1Ti
20+
maxSize: 40Ti
2121
preservePoolsOnDelete: false
2222
gateway:
2323
sslCertificateRef:
2424
port: 80
2525
# securePort: 443
2626
instances: 3
27+
resources:
28+
limits:
29+
cpu: "4"
30+
memory: 4Gi
31+
requests:
32+
cpu: "4"
33+
memory: 4Gi
2734
---
2835
apiVersion: networking.k8s.io/v1
2936
kind: Ingress
3037
metadata:
31-
name: rook-ceph-rgw-ingress
38+
name: rook-ceph-rgw-ingress-o11y
3239
namespace: rook-ceph
3340
annotations:
34-
cert-manager.io/cluster-issuer: letsencrypt-staging
41+
cert-manager.io/cluster-issuer: letsencrypt
3542
nginx.ingress.kubernetes.io/proxy-body-size: 1024m
3643
spec:
3744
ingressClassName: nginx
3845
tls:
3946
- hosts:
40-
- s3.kueyen.dev.lsst.org
41-
secretName: rook-ceph-rgw-ingress-tls
47+
- &host s3.o11y.kueyen.dev.lsst.org
48+
secretName: rook-ceph-rgw-ingress-tls-o11y
4249
rules:
43-
- host: s3.kueyen.dev.lsst.org
50+
- host: *host
4451
http:
4552
paths:
4653
- path: /
4754
pathType: Prefix
4855
backend:
4956
service:
50-
name: rook-ceph-rgw-lfa
57+
name: rook-ceph-rgw-o11y
5158
port:
5259
number: 80

0 commit comments

Comments
 (0)