diff --git a/README.md b/README.md index 6cf39221..ad92f583 100644 --- a/README.md +++ b/README.md @@ -42,6 +42,7 @@ The cluster-deployment tools here include helm charts and ansible playbooks to s * Pod security policies * Automatic certificate issuing/renewal with Letsencrypt * PostgreSQL-operator from CrunchyData +* Grafana with prometheus-based alerting ### Resource definitions @@ -70,6 +71,7 @@ The cluster-deployment tools here include helm charts and ansible playbooks to s | duplicati | [![](https://img.shields.io/docker/v/instantlinux/duplicati?sort=date)](https://hub.docker.com/r/instantlinux/duplicati "Version badge") | backups | | ez-ipupdate | [![](https://img.shields.io/docker/v/instantlinux/ez-ipupdate?sort=date)](https://hub.docker.com/r/instantlinux/ez-ipupdate "Version badge") | Dynamic DNS client | | haproxy-keepalived | [![](https://img.shields.io/docker/v/instantlinux/haproxy-keepalived?sort=date)](https://hub.docker.com/r/instantlinux/haproxy-keepalived "Version badge") | load balancer | +| grafana | ** | monitoring dashboard with prometheus-based alerting | | guacamole | ** | authenticated remote-desktop server | | logspout | ** | central logging for Docker | | mysqldump | [![](https://img.shields.io/docker/v/instantlinux/mysqldump?sort=date)](https://hub.docker.com/r/instantlinux/mysqldump "Version badge") | per-database alternative to xtrabackup | diff --git a/ansible/roles/monitoring_agent/defaults/main.yml b/ansible/roles/monitoring_agent/defaults/main.yml index 5a576298..0b85bc15 100644 --- a/ansible/roles/monitoring_agent/defaults/main.yml +++ b/ansible/roles/monitoring_agent/defaults/main.yml @@ -83,6 +83,7 @@ syslog: "{{ syslog_defaults | combine(syslog_override) }}" ubuntu_packages: - bc - nagios-nrpe-server + - prometheus-node-exporter - python3-pip - rsyslog - smartmontools diff --git a/k8s/Makefile b/k8s/Makefile index 46b39c72..f0e83b4d 100644 --- a/k8s/Makefile +++ b/k8s/Makefile @@ -95,14 +95,14 @@ $(STACKS):: .PHONY: envsubst 
imports install namespace_config node_labels \ persistent remote_volumes secrets sops untaint_master -IMPORTS = cert-manager flannel metrics +IMPORTS = cert-manager flannel INSTALL_YAML = $(basename $(wildcard install/*.yaml)) \ $(addprefix imports/, $(IMPORTS)) VOLUMES_YAML = $(basename $(wildcard volumes/*.yaml)) install: install/admin-user cluster_network \ install/local-storage storage_localdefault imports \ - install_imports namespace_config install/gitlab-rbac \ + install_imports namespace_config install/prometheus-rbac \ install/k8s-backup install/logspout remote_volumes \ sops data-sync-ssh persistent secrets install/ingress-nginx \ install/cert-manager @@ -219,10 +219,14 @@ cert-manager-helm: helm_install imports: $(foreach file,$(IMPORTS),imports/$(file).yaml) install_imports: $(foreach file, $(IMPORTS), imports/$(file)) -imports/metrics.yaml: imports/metrics-$(VERSION_METRICS).yaml +imports/kube-state-metrics: imports/kube-state-metrics-$(VERSION_METRICS) ln -s $(notdir $<) $@ -imports/metrics-$(VERSION_METRICS).yaml: - curl -sLo $@ https://github.com/kubernetes-sigs/metrics-server/releases/download/v$(VERSION_METRICS)/components.yaml +imports/kube-state-metrics-$(VERSION_METRICS): + git clone --depth 1 --branch v$(VERSION_METRICS) \ + https://github.com/kubernetes/kube-state-metrics \ + imports/kube-state-metrics-$(VERSION_METRICS) +install_metrics: imports/kube-state-metrics + kubectl apply --context=sudo -k $< + smtp_smarthost: smtp:587 + route: + group_by: [ alertname ] + group_wait: 10s + group_interval: 1m + repeat_interval: 1d + receiver: SMTP + receivers: + - name: SMTP + email_configs: + - require_tls: true + send_resolved: true + to: monitor@example.com + inhibit_rules: + - source_match: + severity: critical + target_match: + severity: warning + equal: [ alertname, dev, instance ] diff --git a/k8s/helm/grafana/subcharts/prometheus/.helmignore b/k8s/helm/grafana/subcharts/prometheus/.helmignore new file mode 100644 index 00000000..839de881 ---
/dev/null +++ b/k8s/helm/grafana/subcharts/prometheus/.helmignore @@ -0,0 +1,2 @@ +*~ +.git diff --git a/k8s/helm/grafana/subcharts/prometheus/Chart.yaml b/k8s/helm/grafana/subcharts/prometheus/Chart.yaml new file mode 100644 index 00000000..58bbd3e6 --- /dev/null +++ b/k8s/helm/grafana/subcharts/prometheus/Chart.yaml @@ -0,0 +1,14 @@ +apiVersion: v2 +name: prometheus +description: Prometheus metrics and alerting +home: https://github.com/instantlinux/docker-tools +sources: +- https://github.com/instantlinux/docker-tools +- https://hub.docker.com/r/prom/prometheus +type: application +version: 0.1.0 +appVersion: "v3.3.1" +dependencies: +- name: chartlib + version: 0.1.8 + repository: https://instantlinux.github.io/docker-tools diff --git a/k8s/helm/grafana/subcharts/prometheus/templates/NOTES.txt b/k8s/helm/grafana/subcharts/prometheus/templates/NOTES.txt new file mode 100644 index 00000000..62ea3f4b --- /dev/null +++ b/k8s/helm/grafana/subcharts/prometheus/templates/NOTES.txt @@ -0,0 +1,28 @@ +{{- if hasKey .Values "service" }} +{{- if or .Values.service.enabled (not (hasKey .Values.service "enabled")) }} +1. Get the application URL by running these commands: +{{- if hasKey .Values "ingress" }} +{{- if .Values.ingress.enabled }} +{{- range $host := .Values.ingress.hosts }} + {{- range .paths }} + http{{ if $.Values.ingress.tls }}s{{ end }}://{{ $host.host }}{{ .path }} + {{- end }} +{{- end }} +{{- else if contains "NodePort" .Values.service.type }} + export NODE_PORT=$(kubectl get --namespace {{ .Release.Namespace }} -o jsonpath="{.spec.ports[0].nodePort}" services {{ include "local.fullname" . }}) + export NODE_IP=$(kubectl get nodes --namespace {{ .Release.Namespace }} -o jsonpath="{.items[0].status.addresses[0].address}") + echo http://$NODE_IP:$NODE_PORT +{{- else if contains "LoadBalancer" .Values.service.type }} + NOTE: It may take a few minutes for the LoadBalancer IP to be available. 
+ You can watch the status of by running 'kubectl get --namespace {{ .Release.Namespace }} svc -w {{ include "local.fullname" . }}' + export SERVICE_IP=$(kubectl get svc --namespace {{ .Release.Namespace }} {{ include "local.fullname" . }} --template "{{"{{ range (index .status.loadBalancer.ingress 0) }}{{.}}{{ end }}"}}") + echo http://$SERVICE_IP:{{ .Values.service.port }} +{{- else if contains "ClusterIP" .Values.service.type }} + export POD_NAME=$(kubectl get pods --namespace {{ .Release.Namespace }} -l "app.kubernetes.io/name={{ include "local.name" . }},app.kubernetes.io/instance={{ .Release.Name }}" -o jsonpath="{.items[0].metadata.name}") + export CONTAINER_PORT=$(kubectl get pod --namespace {{ .Release.Namespace }} $POD_NAME -o jsonpath="{.spec.containers[0].ports[0].containerPort}") + echo "Visit http://127.0.0.1:8080 to use your application" + kubectl --namespace {{ .Release.Namespace }} port-forward $POD_NAME 8080:$CONTAINER_PORT +{{- end }} +{{- end }} +{{- end }} +{{- end }} diff --git a/k8s/helm/grafana/subcharts/prometheus/templates/app.yaml b/k8s/helm/grafana/subcharts/prometheus/templates/app.yaml new file mode 100644 index 00000000..5a01911b --- /dev/null +++ b/k8s/helm/grafana/subcharts/prometheus/templates/app.yaml @@ -0,0 +1,15 @@ +{{- include "chartlib.configmap" . }} +--- +{{- include "chartlib.deployment" . }} +--- +{{- include "chartlib.hpa" . }} +--- +{{- include "chartlib.ingress" . }} +--- +{{- include "chartlib.ingresstotp" . }} +--- +{{- include "chartlib.service" . }} +--- +{{- include "chartlib.serviceaccount" . }} +--- +{{- include "chartlib.statefulset" . 
}} diff --git a/k8s/helm/grafana/subcharts/prometheus/templates/tests/test-connection.yaml b/k8s/helm/grafana/subcharts/prometheus/templates/tests/test-connection.yaml new file mode 100644 index 00000000..ae159a4f --- /dev/null +++ b/k8s/helm/grafana/subcharts/prometheus/templates/tests/test-connection.yaml @@ -0,0 +1,17 @@ +{{- if hasKey .Values "service" }} +apiVersion: v1 +kind: Pod +metadata: + name: "{{ include "local.fullname" . }}-test-connection" + labels: + {{- include "local.labels" . | nindent 4 }} + annotations: + "helm.sh/hook": test +spec: + containers: + - name: wget + image: busybox + command: ['wget'] + args: ['{{ include "local.fullname" . }}:{{ .Values.service.port }}'] + restartPolicy: Never +{{- end }} diff --git a/k8s/helm/grafana/subcharts/prometheus/values.yaml b/k8s/helm/grafana/subcharts/prometheus/values.yaml new file mode 100644 index 00000000..e276f45a --- /dev/null +++ b/k8s/helm/grafana/subcharts/prometheus/values.yaml @@ -0,0 +1,138 @@ +# Default values for prometheus. 
+deployment: + command: + - /bin/prometheus + - --config.file=/etc/prometheus/prometheus.yml + - --storage.tsdb.path=/prometheus + - --storage.tsdb.retention.time=90d + - --web.external-url=http://10.101.1.21:9090 + containerPorts: [ containerPort: 9090 ] + nodeSelector: + service.prometheus: allow +volumeMounts: +- mountPath: /etc/prometheus/prometheus.yml + name: config + readOnly: true + subPath: prometheus.yml +- mountPath: /etc/prometheus/alert-rules.yml + name: config + readOnly: true + subPath: alert-rules.yml +- mountPath: /etc/prometheus/targets.json + name: config + readOnly: true + subPath: targets.json +- mountPath: /prometheus + name: data +volumes: +- name: config + configMap: + name: grafana-prometheus +- name: data + hostPath: { path: /var/lib/docker/k8s-volumes/prometheus } +image: + repository: prom/prometheus + pullPolicy: IfNotPresent + # tag: default + +nameOverride: "" +fullnameOverride: "" + +serviceAccount: + enabled: true + create: true +service: + clusterIP: 10.101.1.21 + ports: [ port: 9090 ] + type: ClusterIP +autoscaling: + enabled: false + +configmap: + data: + prometheus.yml: | + global: + scrape_interval: 1m + evaluation_interval: 1m + alerting: + alertmanagers: + - static_configs: + - targets: + - grafana-alertmanager:9093 + rule_files: [ alert-rules.yml ] + scrape_configs: + - job_name: prometheus + static_configs: + - targets: [ localhost:9090 ] + - job_name: hw-nodes + file_sd_configs: + - files: [ targets.json ] + relabel_configs: + - source_labels: [__address__] + target_label: instance + - source_labels: [ __address__ ] + target_label: __address__ + replacement: '${1}:9100' + # Next two directives define label alertSuppress and apply + # it to nodes with a specified hostname prefix + - source_labels: [ instance ] + target_label: alertSuppress + replacement: 'false' + - source_labels: [ instance ] + regex: ^myth.* + target_label: alertSuppress + replacement: 'true' + targets.json: | + # Override the targets with your nodes list,
comma-separated + [ + { + "labels": { + "job": "hw-nodes" + }, + "targets": [ + "localhost" + ] + } + ] + alert-rules.yml: | + groups: + - name: systems + rules: + - alert: InstanceDown + expr: up{alertSuppress="false"} == 0 + for: 15s + labels: + severity: critical + annotations: + summary: "Instance [{{ $labels.instance }}] down" + description: "[{{ $labels.instance }}] of {{ $labels.job }} is down" + + - alert: DiskSpaceLow + # To skip volumes on a monitored node, add to that node's config + # /etc/defaults/prometheus-node-exporter + # ARGS="--collector.filesystem.ignored-mount-points=" + expr: (node_filesystem_avail_bytes{fstype!~"^(fuse.*|tmpfs|cifs|nfs)"} / node_filesystem_size_bytes < .10 and on (instance, device, mountpoint) node_filesystem_readonly == 0) + for: 2m + labels: + severity: critical + annotations: + summary: Low disk space (instance {{ $labels.instance }}) + description: "Disk is almost full (> 90%) Value = {{ $value }}" + + - alert: CPULoadHigh + expr: sum by (instance) (node_load1) > node:cpu_core:count + for: 10m + labels: + severity: warning + annotations: + summary: Host high CPU load (instance {{ $labels.instance }}) + description: "CPU load average is high Value = {{ $value }}" + + - alert: NTPClockSkew + expr: ((node_timex_offset_seconds > 0.05 and deriv(node_timex_offset_seconds[5m]) >= 0) or (node_timex_offset_seconds < -0.05 and deriv(node_timex_offset_seconds[5m]) <= 0)) + for: 10m + labels: + severity: warning + annotations: + summary: Host clock skew (instance {{ $labels.instance }}) + description: "Clock is out of sync, ensure NTP is configured correctly on this host. Value = {{ $value }}" diff --git a/k8s/helm/grafana/templates/NOTES.txt b/k8s/helm/grafana/templates/NOTES.txt new file mode 100644 index 00000000..62ea3f4b --- /dev/null +++ b/k8s/helm/grafana/templates/NOTES.txt @@ -0,0 +1,28 @@ +{{- if hasKey .Values "service" }} +{{- if or .Values.service.enabled (not (hasKey .Values.service "enabled")) }} +1. 
Get the application URL by running these commands: +{{- if hasKey .Values "ingress" }} +{{- if .Values.ingress.enabled }} +{{- range $host := .Values.ingress.hosts }} + {{- range .paths }} + http{{ if $.Values.ingress.tls }}s{{ end }}://{{ $host.host }}{{ .path }} + {{- end }} +{{- end }} +{{- else if contains "NodePort" .Values.service.type }} + export NODE_PORT=$(kubectl get --namespace {{ .Release.Namespace }} -o jsonpath="{.spec.ports[0].nodePort}" services {{ include "local.fullname" . }}) + export NODE_IP=$(kubectl get nodes --namespace {{ .Release.Namespace }} -o jsonpath="{.items[0].status.addresses[0].address}") + echo http://$NODE_IP:$NODE_PORT +{{- else if contains "LoadBalancer" .Values.service.type }} + NOTE: It may take a few minutes for the LoadBalancer IP to be available. + You can watch the status of by running 'kubectl get --namespace {{ .Release.Namespace }} svc -w {{ include "local.fullname" . }}' + export SERVICE_IP=$(kubectl get svc --namespace {{ .Release.Namespace }} {{ include "local.fullname" . }} --template "{{"{{ range (index .status.loadBalancer.ingress 0) }}{{.}}{{ end }}"}}") + echo http://$SERVICE_IP:{{ .Values.service.port }} +{{- else if contains "ClusterIP" .Values.service.type }} + export POD_NAME=$(kubectl get pods --namespace {{ .Release.Namespace }} -l "app.kubernetes.io/name={{ include "local.name" . 
}},app.kubernetes.io/instance={{ .Release.Name }}" -o jsonpath="{.items[0].metadata.name}") + export CONTAINER_PORT=$(kubectl get pod --namespace {{ .Release.Namespace }} $POD_NAME -o jsonpath="{.spec.containers[0].ports[0].containerPort}") + echo "Visit http://127.0.0.1:8080 to use your application" + kubectl --namespace {{ .Release.Namespace }} port-forward $POD_NAME 8080:$CONTAINER_PORT +{{- end }} +{{- end }} +{{- end }} +{{- end }} diff --git a/k8s/helm/grafana/templates/app.yaml b/k8s/helm/grafana/templates/app.yaml new file mode 100644 index 00000000..5a01911b --- /dev/null +++ b/k8s/helm/grafana/templates/app.yaml @@ -0,0 +1,15 @@ +{{- include "chartlib.configmap" . }} +--- +{{- include "chartlib.deployment" . }} +--- +{{- include "chartlib.hpa" . }} +--- +{{- include "chartlib.ingress" . }} +--- +{{- include "chartlib.ingresstotp" . }} +--- +{{- include "chartlib.service" . }} +--- +{{- include "chartlib.serviceaccount" . }} +--- +{{- include "chartlib.statefulset" . }} diff --git a/k8s/helm/grafana/templates/tests/test-connection.yaml b/k8s/helm/grafana/templates/tests/test-connection.yaml new file mode 100644 index 00000000..ae159a4f --- /dev/null +++ b/k8s/helm/grafana/templates/tests/test-connection.yaml @@ -0,0 +1,17 @@ +{{- if hasKey .Values "service" }} +apiVersion: v1 +kind: Pod +metadata: + name: "{{ include "local.fullname" . }}-test-connection" + labels: + {{- include "local.labels" . | nindent 4 }} + annotations: + "helm.sh/hook": test +spec: + containers: + - name: wget + image: busybox + command: ['wget'] + args: ['{{ include "local.fullname" . }}:{{ .Values.service.port }}'] + restartPolicy: Never +{{- end }} diff --git a/k8s/helm/grafana/values.yaml b/k8s/helm/grafana/values.yaml new file mode 100644 index 00000000..1ba4cabe --- /dev/null +++ b/k8s/helm/grafana/values.yaml @@ -0,0 +1,97 @@ +# Default values for grafana. 
+tlsHostname: grafana.example.com +deployment: + env: + gf_analytics_reporting_enabled: false + gf_analytics_check_for_updates: false + gf_database_type: mysql + gf_database_host: db00 + gf_database_name: grafana + gf_database_password__file: /run/secrets/grafana-db-password + gf_database_user: grafana + gf_remote_cache_type: redis + gf_remote_cache_connstr: addr=grafana-redis:6379,pool_size=100,db=0,ssl=false + # See note in volumeMounts below + # gf_security_admin_password__file: /run/secrets/admin_password + gf_security_admin_email: admin@example.com + gf_server_domain: grafana.example.com + gf_server_root_url: https://grafana.example.com + gf_smtp_enabled: true + gf_smtp_host: smtp:25 + gf_users_allow_sign_up: false + tz: America/Los_Angeles + uid: 472 + containerPorts: + - containerPort: 3000 + livenessProbe: + httpGet: + path: /api/health + port: 3000 + initialDelaySeconds: 60 + timeoutSeconds: 30 + failureThreshold: 10 + resources: + limits: + memory: 256Mi + requests: + cpu: 100m + memory: 64Mi +volumeMounts: +- mountPath: /var/lib/grafana + name: data + subPath: data +- mountPath: /run/secrets/grafana-db-password + name: grafana-db-password + readOnly: true + subPath: grafana-db-password +# Add an admin_password key in the secret and override volumeMounts to +# include this mountPath at first run if you want to set the admin pw +# automatically. This value is not used after initial setup. 
+# +# - mountPath: /run/secrets/admin_password +# name: grafana-db-password +# readOnly: true +# subPath: admin_password +volumes: +- name: data + hostPath: { path: /var/lib/docker/k8s-volumes/share/grafana } +- name: grafana-db-password + secret: + secretName: grafana-db-password + +image: + repository: grafana/grafana-enterprise + pullPolicy: IfNotPresent + # tag: default + +nameOverride: "" +fullnameOverride: "" + +serviceAccount: {} +service: + clusterIP: None + ports: + - { port: 80, targetPort: 3000, name: grafana } + type: ClusterIP +autoscaling: + enabled: false + +authelia: + fqdn: authtotp.example.com + ip: 10.101.1.5 + path: /login +ingress: + annotations: + cert-manager.io/cluster-issuer: letsencrypt-prod + kubernetes.io/ingress.class: nginx + nginx.ingress.kubernetes.io/enable-access-log: "false" +ingressTOTP: + enabled: true + +# Subchart parameters +prometheus: + enabled: true +alertmanager: + enabled: true +redis: + enabled: false diff --git a/k8s/install/prometheus-rbac.yaml b/k8s/install/prometheus-rbac.yaml new file mode 100644 index 00000000..c02e37fc --- /dev/null +++ b/k8s/install/prometheus-rbac.yaml @@ -0,0 +1,32 @@ +--- +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRoleBinding +metadata: + name: $K8S_NAMESPACE:prometheus-scraper-binding +roleRef: + apiGroup: rbac.authorization.k8s.io + kind: ClusterRole + name: $K8S_NAMESPACE:prometheus-scraper +subjects: +- kind: ServiceAccount + name: grafana-prometheus + namespace: $K8S_NAMESPACE +--- +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRole +metadata: + name: $K8S_NAMESPACE:prometheus-scraper +rules: +- apiGroups: [""] + resources: + - endpoints + - nodes + - pods + - services + verbs: [get, list, watch] +- apiGroups: [extensions] + resources: + - ingresses + verbs: [get, list, watch] +- nonResourceURLs: ["/metrics"] + verbs: [get]