From c261526c040ceeb2b0ea2b81ed43b5e556c46702 Mon Sep 17 00:00:00 2001 From: Nicolas Takashi Date: Thu, 10 Aug 2023 22:34:18 +0100 Subject: [PATCH] [CHORE] adding eBPF helm chart Signed-off-by: Nicolas Takashi --- .github/workflows/ebpf-test.yaml | 37 +++ charts/opentelemetry-ebpf/.helmignore | 23 ++ charts/opentelemetry-ebpf/CONTRIBUTING.md | 12 + charts/opentelemetry-ebpf/Chart.yaml | 14 + charts/opentelemetry-ebpf/README.md | 0 .../rendered/cloud-collector-deployment.yaml | 44 +++ .../cloud-collector-serviceaccount.yaml | 12 + .../cloud-collector/rendered/configmap.yaml | 16 + .../rendered/k8s-collector-clusterrole.yaml | 29 ++ .../k8s-collector-clusterrolebinding.yaml | 20 ++ .../rendered/k8s-collector-deployment.yaml | 75 +++++ .../k8s-collector-serviceaccount.yaml | 12 + .../kernel-collector-clusterrole.yaml | 21 ++ .../kernel-collector-clusterrolebinding.yaml | 20 ++ .../rendered/kernel-collector-daemonset.yaml | 90 ++++++ .../kernel-collector-podsecuritypolicy.yaml | 42 +++ .../kernel-collector-serviceaccount.yaml | 12 + .../rendered/reducer-deployment.yaml | 53 ++++ .../rendered/reducer-service.yaml | 22 ++ .../examples/cloud-collector/values.yaml | 5 + .../opentelemetry-ebpf/templates/_helpers.tpl | 138 +++++++++ .../templates/cloud-collector-deployment.yaml | 115 ++++++++ .../cloud-collector-serviceaccount.yaml | 12 + .../templates/configmap.yaml | 10 + .../templates/k8s-collector-clusterrole.yaml | 25 ++ .../k8s-collector-clusterrolebinding.yaml | 16 + .../templates/k8s-collector-deployment.yaml | 160 ++++++++++ .../k8s-collector-serviceaccount.yaml | 8 + .../kernel-collector-clusterrole.yaml | 17 ++ .../kernel-collector-clusterrolebinding.yaml | 16 + .../templates/kernel-collector-daemonset.yaml | 197 +++++++++++++ .../kernel-collector-podsecuritypolicy.yaml | 38 +++ .../kernel-collector-serviceaccount.yaml | 8 + .../templates/reducer-deployment.yaml | 121 ++++++++ .../templates/reducer-service.yaml | 22 ++ charts/opentelemetry-ebpf/values.schema.json 
| 176 +++++++++++ charts/opentelemetry-ebpf/values.yaml | 275 ++++++++++++++++++ 37 files changed, 1913 insertions(+) create mode 100644 .github/workflows/ebpf-test.yaml create mode 100644 charts/opentelemetry-ebpf/.helmignore create mode 100644 charts/opentelemetry-ebpf/CONTRIBUTING.md create mode 100644 charts/opentelemetry-ebpf/Chart.yaml create mode 100644 charts/opentelemetry-ebpf/README.md create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/cloud-collector-deployment.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/cloud-collector-serviceaccount.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/configmap.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-clusterrole.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-clusterrolebinding.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-deployment.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-serviceaccount.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-clusterrole.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-clusterrolebinding.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-daemonset.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-podsecuritypolicy.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-serviceaccount.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/reducer-deployment.yaml create mode 100644 charts/opentelemetry-ebpf/examples/cloud-collector/rendered/reducer-service.yaml create mode 100644 
charts/opentelemetry-ebpf/examples/cloud-collector/values.yaml create mode 100644 charts/opentelemetry-ebpf/templates/_helpers.tpl create mode 100644 charts/opentelemetry-ebpf/templates/cloud-collector-deployment.yaml create mode 100644 charts/opentelemetry-ebpf/templates/cloud-collector-serviceaccount.yaml create mode 100644 charts/opentelemetry-ebpf/templates/configmap.yaml create mode 100644 charts/opentelemetry-ebpf/templates/k8s-collector-clusterrole.yaml create mode 100644 charts/opentelemetry-ebpf/templates/k8s-collector-clusterrolebinding.yaml create mode 100644 charts/opentelemetry-ebpf/templates/k8s-collector-deployment.yaml create mode 100644 charts/opentelemetry-ebpf/templates/k8s-collector-serviceaccount.yaml create mode 100644 charts/opentelemetry-ebpf/templates/kernel-collector-clusterrole.yaml create mode 100644 charts/opentelemetry-ebpf/templates/kernel-collector-clusterrolebinding.yaml create mode 100644 charts/opentelemetry-ebpf/templates/kernel-collector-daemonset.yaml create mode 100644 charts/opentelemetry-ebpf/templates/kernel-collector-podsecuritypolicy.yaml create mode 100644 charts/opentelemetry-ebpf/templates/kernel-collector-serviceaccount.yaml create mode 100644 charts/opentelemetry-ebpf/templates/reducer-deployment.yaml create mode 100644 charts/opentelemetry-ebpf/templates/reducer-service.yaml create mode 100644 charts/opentelemetry-ebpf/values.schema.json create mode 100644 charts/opentelemetry-ebpf/values.yaml diff --git a/.github/workflows/ebpf-test.yaml b/.github/workflows/ebpf-test.yaml new file mode 100644 index 000000000..608811915 --- /dev/null +++ b/.github/workflows/ebpf-test.yaml @@ -0,0 +1,37 @@ +name: Test eBPF Chart + +on: + pull_request: + paths: + - "charts/opentelemetry-ebpf/**" + branches: + - main + +jobs: + collector-test: + runs-on: ubuntu-latest + steps: + - name: Checkout + uses: actions/checkout@v3 + with: + fetch-depth: 0 + - name: Setup + uses: ./.github/actions/setup + with: + create-kind-cluster: "true" + + 
- name: Run chart-testing (install) + run: ct install --charts charts/opentelemetry-ebpf + + - name: Run daemonset and deployment install test + run: | + kubectl apply -f ./charts/opentelemetry-collector/examples/daemonset-and-deployment/rendered + + kubectl rollout status deployment example-opentelemetry-collector --timeout=30s + + kubectl apply -f ./charts/opentelemetry-ebpf/examples/cloud-collector/rendered + + kubectl rollout status daemonset example-opentelemetry-ebpf-kernel-collector --timeout=30s + kubectl rollout status deployment example-opentelemetry-ebpf-cloud-collector --timeout=30s + kubectl rollout status deployment example-opentelemetry-ebpf-k8s-collector --timeout=30s + kubectl rollout status deployment example-opentelemetry-ebpf-reducer --timeout=30s diff --git a/charts/opentelemetry-ebpf/.helmignore b/charts/opentelemetry-ebpf/.helmignore new file mode 100644 index 000000000..0e8a0eb36 --- /dev/null +++ b/charts/opentelemetry-ebpf/.helmignore @@ -0,0 +1,23 @@ +# Patterns to ignore when building packages. +# This supports shell glob matching, relative path matching, and +# negation (prefixed with !). Only one pattern per line. +.DS_Store +# Common VCS dirs +.git/ +.gitignore +.bzr/ +.bzrignore +.hg/ +.hgignore +.svn/ +# Common backup files +*.swp +*.bak +*.tmp +*.orig +*~ +# Various IDEs +.project +.idea/ +*.tmproj +.vscode/ diff --git a/charts/opentelemetry-ebpf/CONTRIBUTING.md b/charts/opentelemetry-ebpf/CONTRIBUTING.md new file mode 100644 index 000000000..aa0bf2663 --- /dev/null +++ b/charts/opentelemetry-ebpf/CONTRIBUTING.md @@ -0,0 +1,12 @@ +# eBPF Chart Contributing Guide + +All changes to the chart require a bump to the version in `Chart.yaml`. See the [Contributing Guide](https://github.com/open-telemetry/opentelemetry-helm-charts/blob/main/CONTRIBUTING.md#versioning) for our versioning requirements. + +Once the chart version is bumped, the examples must be regenerated. 
You can regenerate examples by running `make generate-examples CHARTS=opentelemetry-ebpf`. + +## Bumping Default Collector Version + +1. Increase the minor version of the chart by one and set the patch version to zero. +2. Update the chart's `appVersion` to match the new collector version. This version will be used as the image tag by default. +3. Review the corresponding release notes in [Collector Core](https://github.com/open-telemetry/opentelemetry-collector/releases), [Collector Contrib](https://github.com/open-telemetry/opentelemetry-collector-contrib/releases), and [Collector Releases](https://github.com/open-telemetry/opentelemetry-collector-releases/releases). If any changes affect the helm charts, adjust the helm chart accordingly. +4. Run `make generate-examples CHARTS=opentelemetry-ebpf`. diff --git a/charts/opentelemetry-ebpf/Chart.yaml b/charts/opentelemetry-ebpf/Chart.yaml new file mode 100644 index 000000000..24e3c3776 --- /dev/null +++ b/charts/opentelemetry-ebpf/Chart.yaml @@ -0,0 +1,14 @@ +apiVersion: v2 +name: opentelemetry-ebpf +version: 0.1.0 +description: OpenTelemetry eBPF Helm chart for Kubernetes +type: application +home: https://opentelemetry.io/ +sources: + - https://github.com/open-telemetry/opentelemetry-collector + - https://github.com/open-telemetry/opentelemetry-collector-contrib + - https://github.com/open-telemetry/opentelemetry-ebpf +maintainers: + - name: dmitryax +icon: https://opentelemetry.io/img/logos/opentelemetry-logo-nav.png +appVersion: 0.10.0 diff --git a/charts/opentelemetry-ebpf/README.md b/charts/opentelemetry-ebpf/README.md new file mode 100644 index 000000000..e69de29bb diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/cloud-collector-deployment.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/cloud-collector-deployment.yaml new file mode 100644 index 000000000..0d6b82886 --- /dev/null +++ 
b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/cloud-collector-deployment.yaml @@ -0,0 +1,44 @@ +--- +# Source: opentelemetry-ebpf/templates/cloud-collector-deployment.yaml +apiVersion: apps/v1 +kind: Deployment +metadata: + name: example-opentelemetry-ebpf-cloud-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +spec: + progressDeadlineSeconds: 600 + replicas: 1 + revisionHistoryLimit: 3 + selector: + matchLabels: + app.kubernetes.io/name: example-opentelemetry-ebpf-cloud-collector + app.kubernetes.io/instance: example + strategy: + type: RollingUpdate + template: + metadata: + labels: + app.kubernetes.io/name: example-opentelemetry-ebpf-cloud-collector + app.kubernetes.io/instance: example + spec: + containers: + - image: "otel/opentelemetry-ebpf-cloud-collector:v0.10.0" + imagePullPolicy: IfNotPresent + name: cloud-collector + args: + - --warning + env: + - name: "EBPF_NET_CLUSTER_NAME" + value: "" + - name: "EBPF_NET_INTAKE_HOST" + value: example-opentelemetry-ebpf-reducer + - name: "EBPF_NET_INTAKE_PORT" + value: "7000" + terminationGracePeriodSeconds: 30 + securityContext: {} + serviceAccountName: example-opentelemetry-ebpf-cloud-collector diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/cloud-collector-serviceaccount.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/cloud-collector-serviceaccount.yaml new file mode 100644 index 000000000..87fa62739 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/cloud-collector-serviceaccount.yaml @@ -0,0 +1,12 @@ +--- +# Source: opentelemetry-ebpf/templates/cloud-collector-serviceaccount.yaml +apiVersion: v1 +kind: ServiceAccount +metadata: + name: example-opentelemetry-ebpf-cloud-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: 
opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/configmap.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/configmap.yaml new file mode 100644 index 000000000..d9b34b8c8 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/configmap.yaml @@ -0,0 +1,16 @@ +--- +# Source: opentelemetry-ebpf/templates/configmap.yaml +apiVersion: v1 +kind: ConfigMap +metadata: + name: example-opentelemetry-ebpf-config + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +data: + config.yaml: | + labels: + environment: "" diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-clusterrole.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-clusterrole.yaml new file mode 100644 index 000000000..d3ddf3c09 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-clusterrole.yaml @@ -0,0 +1,29 @@ +--- +# Source: opentelemetry-ebpf/templates/k8s-collector-clusterrole.yaml +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRole +metadata: + name: example-opentelemetry-ebpf-k8s-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +rules: +- apiGroups: + - "" + resources: + - pods + verbs: + - get + - list + - watch +- apiGroups: + - apps + resources: + - replicasets + verbs: + - get + - list + - watch diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-clusterrolebinding.yaml 
b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-clusterrolebinding.yaml new file mode 100644 index 000000000..bce0e8a87 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-clusterrolebinding.yaml @@ -0,0 +1,20 @@ +--- +# Source: opentelemetry-ebpf/templates/k8s-collector-clusterrolebinding.yaml +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRoleBinding +metadata: + name: example-opentelemetry-ebpf-k8s-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +roleRef: + apiGroup: rbac.authorization.k8s.io + kind: ClusterRole + name: example-opentelemetry-ebpf-k8s-collector +subjects: +- kind: ServiceAccount + name: example-opentelemetry-ebpf-k8s-collector + namespace: default diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-deployment.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-deployment.yaml new file mode 100644 index 000000000..7b4196f56 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-deployment.yaml @@ -0,0 +1,75 @@ +--- +# Source: opentelemetry-ebpf/templates/k8s-collector-deployment.yaml +# The k8s-collector consists of two services: +# 1) k8s-watcher: talks to the Kubernetes API server to determine the current state of +# the cluster; sets up watches to be notified of subsequent changes to pods, services +# and other resources. +# 2) k8s-relay: relays the information collected by k8s-watcher to the reducer. 
+apiVersion: apps/v1 +kind: Deployment +metadata: + name: example-opentelemetry-ebpf-k8s-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +spec: + progressDeadlineSeconds: 600 + replicas: 1 + revisionHistoryLimit: 3 + selector: + matchLabels: + app.kubernetes.io/name: example-opentelemetry-ebpf-k8s-collector + app.kubernetes.io/instance: example + strategy: + type: RollingUpdate + template: + metadata: + annotations: + # This is here to allow us to do "zero-downtime" updates without an image change. + rollingUpdateVersion: "1" + charts.flowmill.com/version: 0.1.0 + labels: + app.kubernetes.io/name: example-opentelemetry-ebpf-k8s-collector + app.kubernetes.io/instance: example + spec: + containers: + - image: "otel/opentelemetry-ebpf-k8s-watcher:v0.10.0" + imagePullPolicy: IfNotPresent + name: k8s-watcher + args: + - --log-console + - --log-level=warning + # k8s-relay, which is a service that the k8s-watcher talks to. + # Currently not configurable, has to be reachable on localhost:8172, so must + # share a pod with the k8s-watcher above. 
+ - image: "otel/opentelemetry-ebpf-k8s-relay:v0.10.0" + imagePullPolicy: IfNotPresent + name: k8s-relay + args: + - --config-file=/etc/network-explorer/config.yaml + - --warning + env: + - name: "EBPF_NET_CLUSTER_NAME" + value: "" + - name: "EBPF_NET_INTAKE_HOST" + value: example-opentelemetry-ebpf-reducer + - name: "EBPF_NET_INTAKE_PORT" + value: "7000" + volumeMounts: + - mountPath: /etc/network-explorer + name: k8s-relay-config + terminationGracePeriodSeconds: 30 + volumes: + - name: k8s-relay-config + projected: + sources: + - configMap: + name: example-opentelemetry-ebpf-config + items: + - key: config.yaml + path: config.yaml + securityContext: {} + serviceAccountName: example-opentelemetry-ebpf-k8s-collector diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-serviceaccount.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-serviceaccount.yaml new file mode 100644 index 000000000..1454daa4b --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/k8s-collector-serviceaccount.yaml @@ -0,0 +1,12 @@ +--- +# Source: opentelemetry-ebpf/templates/k8s-collector-serviceaccount.yaml +apiVersion: v1 +kind: ServiceAccount +metadata: + name: example-opentelemetry-ebpf-k8s-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-clusterrole.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-clusterrole.yaml new file mode 100644 index 000000000..d5540b459 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-clusterrole.yaml @@ -0,0 +1,21 @@ +--- +# Source: opentelemetry-ebpf/templates/kernel-collector-clusterrole.yaml +apiVersion: rbac.authorization.k8s.io/v1 
+kind: ClusterRole +metadata: + name: example-opentelemetry-ebpf-kernel-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +rules: +- apiGroups: + - policy + resourceNames: + - example-opentelemetry-ebpf-kernel-collector + resources: + - podsecuritypolicies + verbs: + - use diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-clusterrolebinding.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-clusterrolebinding.yaml new file mode 100644 index 000000000..196220dd6 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-clusterrolebinding.yaml @@ -0,0 +1,20 @@ +--- +# Source: opentelemetry-ebpf/templates/kernel-collector-clusterrolebinding.yaml +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRoleBinding +metadata: + name: example-opentelemetry-ebpf-kernel-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +roleRef: + apiGroup: rbac.authorization.k8s.io + kind: ClusterRole + name: example-opentelemetry-ebpf-kernel-collector +subjects: +- kind: ServiceAccount + name: example-opentelemetry-ebpf-kernel-collector + namespace: default diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-daemonset.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-daemonset.yaml new file mode 100644 index 000000000..5eb6a1265 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-daemonset.yaml @@ -0,0 +1,90 @@ +--- +# Source: opentelemetry-ebpf/templates/kernel-collector-daemonset.yaml +# kernel collector daemonset: deploys the 
kernel collector to each node in the cluster. +# The kernel collector needs to be able to compile and install +# eBPF programs in the node's kernel, so needs to run as root and +# needs to mount /lib/modules and /usr/src from the node itself. +apiVersion: apps/v1 +kind: DaemonSet +metadata: + name: example-opentelemetry-ebpf-kernel-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +spec: + selector: + matchLabels: + app.kubernetes.io/name: example-opentelemetry-ebpf-kernel-collector + app.kubernetes.io/instance: example + template: + metadata: + annotations: + release_number: "3" + charts.flowmill.com/version: 0.1.0 + labels: + app.kubernetes.io/name: example-opentelemetry-ebpf-kernel-collector + app.kubernetes.io/instance: example + spec: + containers: + - name: kernel-collector + image: "otel/opentelemetry-ebpf-kernel-collector:v0.10.0" + imagePullPolicy: IfNotPresent + args: + - --config-file=/etc/network-explorer/config.yaml + - --disable-nomad-metadata + - --warning + # TODO: liveness probe + env: + - name: "EBPF_NET_CLUSTER_NAME" + value: "" + - name: "EBPF_NET_DISABLE_HTTP_METRICS" + value: "false" + - name: "EBPF_NET_KERNEL_HEADERS_AUTO_FETCH" + value: "true" + - name: "EBPF_NET_INTAKE_HOST" + value: example-opentelemetry-ebpf-reducer + - name: "EBPF_NET_INTAKE_PORT" + value: "7000" + - name: "EBPF_NET_HOST_DIR" + value: "/hostfs" + securityContext: + privileged: true + volumeMounts: + - mountPath: /hostfs/ + name: host-root + readOnly: true + - mountPath: /hostfs/var/cache + name: host-var-cache + readOnly: false + - mountPath: /etc/network-explorer + name: example-opentelemetry-ebpf-config + readOnly: true + dnsPolicy: ClusterFirstWithHostNet + hostNetwork: true + hostPID: true + serviceAccountName: example-opentelemetry-ebpf-kernel-collector + volumes: + - name: 
example-opentelemetry-ebpf-config + projected: + sources: + - configMap: + name: example-opentelemetry-ebpf-config + items: + - key: config.yaml + path: config.yaml + - name: host-root + hostPath: + path: / + type: Directory + - name: host-var-cache + hostPath: + path: /var/cache + type: DirectoryOrCreate + tolerations: + - effect: NoExecute + operator: Exists + - effect: NoSchedule + operator: Exists diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-podsecuritypolicy.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-podsecuritypolicy.yaml new file mode 100644 index 000000000..2fe4813be --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-podsecuritypolicy.yaml @@ -0,0 +1,42 @@ +--- +# Source: opentelemetry-ebpf/templates/kernel-collector-podsecuritypolicy.yaml +apiVersion: policy/v1beta1 +kind: PodSecurityPolicy +metadata: + name: example-opentelemetry-ebpf-kernel-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +spec: + privileged: true + allowPrivilegeEscalation: true + allowedHostPaths: + - pathPrefix: /usr/src + readOnly: true + - pathPrefix: /lib/modules + readOnly: true + - pathPrefix: /etc + readOnly: true + - pathPrefix: /var/cache + readOnly: false + - pathPrefix: /sys/fs/cgroup + readOnly: true + fsGroup: + rule: RunAsAny + hostNetwork: true + hostPorts: + - max: 65535 + min: 0 + hostPID: true + readOnlyRootFilesystem: false + runAsUser: + rule: RunAsAny + seLinux: + rule: RunAsAny + supplementalGroups: + rule: RunAsAny + volumes: + - "*" diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-serviceaccount.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-serviceaccount.yaml new file mode 100644 index 
000000000..9d9736307 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/kernel-collector-serviceaccount.yaml @@ -0,0 +1,12 @@ +--- +# Source: opentelemetry-ebpf/templates/kernel-collector-serviceaccount.yaml +apiVersion: v1 +kind: ServiceAccount +metadata: + name: example-opentelemetry-ebpf-kernel-collector + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/reducer-deployment.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/reducer-deployment.yaml new file mode 100644 index 000000000..e450dc245 --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/reducer-deployment.yaml @@ -0,0 +1,53 @@ +--- +# Source: opentelemetry-ebpf/templates/reducer-deployment.yaml +apiVersion: apps/v1 +kind: Deployment +metadata: + name: example-opentelemetry-ebpf-reducer + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +spec: + replicas: 1 + strategy: + type: RollingUpdate + selector: + matchLabels: + app.kubernetes.io/name: example-opentelemetry-ebpf-reducer + app.kubernetes.io/instance: example + template: + metadata: + labels: + app.kubernetes.io/name: example-opentelemetry-ebpf-reducer + app.kubernetes.io/instance: example + spec: + containers: + - name: reducer + image: "otel/opentelemetry-ebpf-reducer:v0.10.0" + imagePullPolicy: IfNotPresent + args: + - --port=7000 + - --log-console + - --no-log-file + - --warning + - --enable-aws-enrichment + - --disable-prometheus-metrics + - --enable-otlp-grpc-metrics + - --otlp-grpc-metrics-host=example-opentelemetry-collector + - --otlp-grpc-metrics-port=4317 + - --num-ingest-shards=1 + - 
--num-matching-shards=1 + - --num-aggregation-shards=1 + ports: + - name: telemetry + containerPort: 7000 + protocol: TCP + readinessProbe: + initialDelaySeconds: 5 + periodSeconds: 20 + timeoutSeconds: 5 + exec: + command: ['/srv/health_check.sh', 'readiness_probe', 'localhost', "7000"] diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/reducer-service.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/reducer-service.yaml new file mode 100644 index 000000000..b825616aa --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/rendered/reducer-service.yaml @@ -0,0 +1,22 @@ +--- +# Source: opentelemetry-ebpf/templates/reducer-service.yaml +apiVersion: v1 +kind: Service +metadata: + name: example-opentelemetry-ebpf-reducer + labels: + helm.sh/chart: opentelemetry-ebpf-0.1.0 + app.kubernetes.io/name: opentelemetry-ebpf + app.kubernetes.io/instance: example + app.kubernetes.io/version: "0.10.0" + app.kubernetes.io/managed-by: Helm +spec: + type: ClusterIP + selector: + app.kubernetes.io/name: example-opentelemetry-ebpf-reducer + app.kubernetes.io/instance: example + ports: + - name: telemetry + port: 7000 + targetPort: telemetry + protocol: TCP diff --git a/charts/opentelemetry-ebpf/examples/cloud-collector/values.yaml b/charts/opentelemetry-ebpf/examples/cloud-collector/values.yaml new file mode 100644 index 000000000..f02009cbb --- /dev/null +++ b/charts/opentelemetry-ebpf/examples/cloud-collector/values.yaml @@ -0,0 +1,5 @@ +cloudCollector: + enabled: true + +otelCollector: + address: example-opentelemetry-collector diff --git a/charts/opentelemetry-ebpf/templates/_helpers.tpl b/charts/opentelemetry-ebpf/templates/_helpers.tpl new file mode 100644 index 000000000..63aa19686 --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/_helpers.tpl @@ -0,0 +1,138 @@ +{{/* +Expand the name of the chart. 
+*/}} +{{- define "opentelemetry-ebpf.name" -}} +{{- default .Chart.Name .Values.nameOverride | trunc 63 | trimSuffix "-" }} +{{- end }} + +{{- define "opentelemetry-ebpf.lowercase_chartname" -}} +{{- .Chart.Name | lower }} +{{- end }} + +{{/* +Create a default fully qualified app name. +We truncate at 63 chars because some Kubernetes name fields are limited to this (by the DNS naming spec). +If release name contains chart name it will be used as a full name. +*/}} +{{- define "opentelemetry-ebpf.fullname" -}} +{{- if .Values.fullnameOverride }} +{{- .Values.fullnameOverride | trunc 63 | trimSuffix "-" }} +{{- else }} +{{- $name := default .Chart.Name .Values.nameOverride }} +{{- if contains $name .Release.Name }} +{{- .Release.Name | trunc 63 | trimSuffix "-" }} +{{- else }} +{{- printf "%s-%s" .Release.Name $name | trunc 63 | trimSuffix "-" }} +{{- end }} +{{- end }} +{{- end }} + +{{/* +Create chart name and version as used by the chart label. +*/}} +{{- define "opentelemetry-ebpf.chart" -}} +{{- printf "%s-%s" .Chart.Name .Chart.Version | replace "+" "_" | trunc 63 | trimSuffix "-" }} +{{- end }} + +{{/* +Common labels +*/}} +{{- define "opentelemetry-ebpf.labels" -}} +helm.sh/chart: {{ include "opentelemetry-ebpf.chart" . }} +{{ include "opentelemetry-ebpf.selectorLabels" . }} +{{- if .Chart.AppVersion }} +app.kubernetes.io/version: {{ .Chart.AppVersion | quote }} +{{- end }} +app.kubernetes.io/managed-by: {{ .Release.Service }} +{{- end }} + +{{/* +Selector labels +*/}} +{{- define "opentelemetry-ebpf.selectorLabels" -}} +app.kubernetes.io/name: {{ include "opentelemetry-ebpf.name" . }} +app.kubernetes.io/instance: {{ .Release.Name }} +{{- end }} + +{{/* +Fully qualified app name for the cloud-collector deployment. 
+*/}} +{{- define "opentelemetry-collector-cloud-collector.fullname" -}} +{{- /* +Build on "opentelemetry-ebpf.fullname" so that fullnameOverride and nameOverride +are honored here as well. The base is cut to 47 chars before the 16-char suffix +is appended, so the result fits in 63 chars and the suffix is never truncated. +*/ -}} +{{- printf "%s-cloud-collector" (include "opentelemetry-ebpf.fullname" . | trunc 47 | trimSuffix "-") -}} +{{- end -}} + +{{/* +Create the name of the service account to use for the cloud-collector +*/}} +{{- define "opentelemetry-collector-cloud-collector.serviceAccountName" -}} +{{- if .Values.cloudCollector.serviceAccount.create }} +{{- default (include "opentelemetry-collector-cloud-collector.fullname" .) .Values.cloudCollector.serviceAccount.name }} +{{- else }} +{{- default "default" .Values.cloudCollector.serviceAccount.name }} +{{- end }} +{{- end }} + +{{/* +Fully qualified app name for the k8s-collector deployment. +*/}} +{{- define "opentelemetry-collector-k8s-collector.fullname" -}} +{{- /* +Build on "opentelemetry-ebpf.fullname" so that fullnameOverride and nameOverride +are honored here as well. The base is cut to 49 chars before the 14-char suffix +is appended, so the result fits in 63 chars and the suffix is never truncated. +*/ -}} +{{- printf "%s-k8s-collector" (include "opentelemetry-ebpf.fullname" . | trunc 49 | trimSuffix "-") -}} +{{- end -}} + +{{/* +Create the name of the service account to use for the k8s-collector +*/}} +{{- define "opentelemetry-collector-k8s-collector.serviceAccountName" -}} +{{- if .Values.k8sCollector.serviceAccount.create }} +{{- default (include "opentelemetry-collector-k8s-collector.fullname" .) .Values.k8sCollector.serviceAccount.name }} +{{- else }} +{{- default "default" .Values.k8sCollector.serviceAccount.name }} +{{- end }} +{{- end }} + +{{/* +Fully qualified app name for the kernel-collector daemonset. +We truncate at 63 chars because some Kubernetes name fields are limited to this (by the DNS naming spec). +If release name contains chart name it will be used as a full name. 
+*/}} +{{- define "opentelemetry-collector-kernel-collector.fullname" -}} +{{- /* +Build on "opentelemetry-ebpf.fullname" so that fullnameOverride and nameOverride +are honored here as well. The base is cut to 46 chars before the 17-char suffix +is appended, so the result fits in 63 chars and the suffix is never truncated. +*/ -}} +{{- printf "%s-kernel-collector" (include "opentelemetry-ebpf.fullname" . | trunc 46 | trimSuffix "-") -}} +{{- end -}} + +{{/* +Create the name of the service account to use for the kernel-collector +*/}} +{{- define "opentelemetry-collector-kernel-collector.serviceAccountName" -}} +{{- if .Values.kernelCollector.serviceAccount.create }} +{{- default (include "opentelemetry-collector-kernel-collector.fullname" .) .Values.kernelCollector.serviceAccount.name }} +{{- else }} +{{- default "default" .Values.kernelCollector.serviceAccount.name }} +{{- end }} +{{- end }} + +{{/* +Fully qualified app name for the reducer deployment. +*/}} +{{- define "opentelemetry-collector-reducer.fullname" -}} +{{- /* +Build on "opentelemetry-ebpf.fullname" so that fullnameOverride and nameOverride +are honored here as well. The base is cut to 55 chars before the 8-char suffix +is appended, so the result fits in 63 chars and the suffix is never truncated. +*/ -}} +{{- printf "%s-reducer" (include "opentelemetry-ebpf.fullname" . | trunc 55 | trimSuffix "-") -}} +{{- end -}} \ No newline at end of file diff --git a/charts/opentelemetry-ebpf/templates/cloud-collector-deployment.yaml b/charts/opentelemetry-ebpf/templates/cloud-collector-deployment.yaml new file mode 100644 index 000000000..2dfff97df --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/cloud-collector-deployment.yaml @@ -0,0 +1,115 @@ +{{- if .Values.cloudCollector.enabled }} +apiVersion: apps/v1 +kind: Deployment +metadata: + name: {{ include "opentelemetry-collector-cloud-collector.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . 
| nindent 4 }} +spec: + progressDeadlineSeconds: 600 + replicas: 1 + revisionHistoryLimit: 3 + selector: + matchLabels: + app.kubernetes.io/name: {{ include "opentelemetry-collector-cloud-collector.fullname" . }} + app.kubernetes.io/instance: {{ .Release.Name }} + strategy: + type: RollingUpdate + template: + metadata: + labels: + app.kubernetes.io/name: {{ include "opentelemetry-collector-cloud-collector.fullname" . }} + app.kubernetes.io/instance: {{ .Release.Name }} + spec: +{{- if .Values.imagePullSecrets }} + imagePullSecrets: +{{- range .Values.imagePullSecrets }} + - name: {{ . }} +{{- end }} +{{- end }} + containers: + - image: "{{ default .Values.images.repository .Values.cloudCollector.image.repository }}/{{ .Values.cloudCollector.image.name }}:{{ default .Values.images.tag .Values.cloudCollector.image.tag }}" + imagePullPolicy: {{ .Values.images.pullPolicy }} + name: cloud-collector +{{- if hasKey .Values.cloudCollector "resources" }} + resources: +{{ toYaml .Values.cloudCollector.resources | indent 10 }} +{{- end }} + args: +{{- if .Values.log.console }} + - --log-console +{{- end }} +{{- if hasKey .Values.log "level" }} + - --{{ .Values.log.level }} +{{- end }} +{{- if hasKey .Values.cloudCollector "log" -}} +{{- if hasKey .Values.cloudCollector.log "whitelist" }} +{{- if hasKey .Values.cloudCollector.log.whitelist "channel" }} + - --log-whitelist-channel={{ .Values.cloudCollector.log.whitelist.channel }} +{{- end }} +{{- if hasKey .Values.cloudCollector.log.whitelist "component" }} + - --log-whitelist-component={{ .Values.cloudCollector.log.whitelist.component }} +{{- end }} +{{- if hasKey .Values.cloudCollector.log.whitelist "cloudPlatform" }} + - --log-whitelist-cloud-platform={{ .Values.cloudCollector.log.whitelist.cloudPlatform }} +{{- end }} +{{- end }} +{{- end }} +{{- if .Values.cloudCollector.additionalArgs }} +{{ toYaml .Values.cloudCollector.additionalArgs | indent 10 }} +{{- end }} + env: + - name: "EBPF_NET_CLUSTER_NAME" + value: {{ tpl 
(.Values.clusterName | toYaml) . }} +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.enabled) }} + - name: "EBPF_NET_DEBUG_MODE" + value: "true" +{{- end }} +{{- end }} +{{- if (default false .Values.cloudCollector.runUnderGDB) }} + - name: "EBPF_NET_RUN_UNDER_GDB" + value: "gdb" +{{- end }} + - name: "EBPF_NET_INTAKE_HOST" + value: {{ include "opentelemetry-collector-reducer.fullname" . }} + - name: "EBPF_NET_INTAKE_PORT" + value: "{{ default 7000 .Values.reducer.telemetryPort }}" +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.storeMinidump) }} + - name: "EBPF_NET_MINIDUMP_DIR" + value: "/hostfs/var/run/network-explorer/minidump" +{{- end }} +{{- end }} +{{- if .Values.cloudCollector.env }} +{{ toYaml .Values.cloudCollector.env | indent 10 }} +{{- end }} +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.storeMinidump) }} + volumeMounts: + - mountPath: /hostfs/var/run/network-explorer + name: host-var-run-network-explorer + readOnly: false + volumes: + - name: host-var-run-network-explorer + hostPath: + path: /var/run/network-explorer + type: DirectoryOrCreate +{{- end }} +{{- end }} + terminationGracePeriodSeconds: 30 + securityContext: {} + serviceAccountName: {{ include "opentelemetry-collector-cloud-collector.serviceAccountName" . }} + {{- with .Values.cloudCollector.nodeSelector }} + nodeSelector: +{{ toYaml . | indent 8}} + {{- end }} + {{- with .Values.cloudCollector.affinity }} + affinity: +{{ toYaml . | indent 8 }} + {{- end }} + {{- with .Values.cloudCollector.tolerations }} + tolerations: +{{ toYaml . 
| indent 8 }} + {{- end }} +{{- end }} diff --git a/charts/opentelemetry-ebpf/templates/cloud-collector-serviceaccount.yaml b/charts/opentelemetry-ebpf/templates/cloud-collector-serviceaccount.yaml new file mode 100644 index 000000000..a5e1156cb --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/cloud-collector-serviceaccount.yaml @@ -0,0 +1,12 @@ +{{- if and .Values.cloudCollector.enabled .Values.cloudCollector.serviceAccount.create -}} +apiVersion: v1 +kind: ServiceAccount +metadata: + name: {{ include "opentelemetry-collector-cloud-collector.serviceAccountName" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . | nindent 4 }} + {{- with .Values.cloudCollector.serviceAccount.annotations }} + annotations: + {{- toYaml . | nindent 4 }} + {{- end }} +{{- end -}} diff --git a/charts/opentelemetry-ebpf/templates/configmap.yaml b/charts/opentelemetry-ebpf/templates/configmap.yaml new file mode 100644 index 000000000..42c4ab32c --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/configmap.yaml @@ -0,0 +1,10 @@ +apiVersion: v1 +kind: ConfigMap +metadata: + name: {{ include "opentelemetry-ebpf.fullname" . }}-config + labels: + {{- include "opentelemetry-ebpf.labels" . | nindent 4 }} +data: + config.yaml: | + labels: + environment: {{ tpl (.Values.clusterName | toYaml) . }} diff --git a/charts/opentelemetry-ebpf/templates/k8s-collector-clusterrole.yaml b/charts/opentelemetry-ebpf/templates/k8s-collector-clusterrole.yaml new file mode 100644 index 000000000..1a4641174 --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/k8s-collector-clusterrole.yaml @@ -0,0 +1,25 @@ +{{- if .Values.rbac.create -}} +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRole +metadata: + name: {{ include "opentelemetry-collector-k8s-collector.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . 
| nindent 4 }} +rules: +- apiGroups: + - "" + resources: + - pods + verbs: + - get + - list + - watch +- apiGroups: + - apps + resources: + - replicasets + verbs: + - get + - list + - watch +{{- end -}} diff --git a/charts/opentelemetry-ebpf/templates/k8s-collector-clusterrolebinding.yaml b/charts/opentelemetry-ebpf/templates/k8s-collector-clusterrolebinding.yaml new file mode 100644 index 000000000..7f4fbca5a --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/k8s-collector-clusterrolebinding.yaml @@ -0,0 +1,16 @@ +{{- if .Values.rbac.create -}} +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRoleBinding +metadata: + name: {{ include "opentelemetry-collector-k8s-collector.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . | nindent 4 }} +roleRef: + apiGroup: rbac.authorization.k8s.io + kind: ClusterRole + name: {{ include "opentelemetry-collector-k8s-collector.fullname" . }} +subjects: +- kind: ServiceAccount + name: {{ include "opentelemetry-collector-k8s-collector.serviceAccountName" . }} + namespace: {{ .Release.Namespace }} +{{- end -}} diff --git a/charts/opentelemetry-ebpf/templates/k8s-collector-deployment.yaml b/charts/opentelemetry-ebpf/templates/k8s-collector-deployment.yaml new file mode 100644 index 000000000..253c1a0a5 --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/k8s-collector-deployment.yaml @@ -0,0 +1,160 @@ +{{- if .Values.k8sCollector.enabled }} +# The k8s-collector consists of two services: +# 1) k8s-watcher: talks to the Kubernetes API server to determine the current state of +# the cluster; sets up watches to be notified of subsequent changes to pods, services +# and other resources. +# 2) k8s-relay: relays the information collected by k8s-watcher to the reducer. +apiVersion: apps/v1 +kind: Deployment +metadata: + name: {{ include "opentelemetry-collector-k8s-collector.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . 
| nindent 4 }} +spec: + progressDeadlineSeconds: 600 + replicas: 1 + revisionHistoryLimit: 3 + selector: + matchLabels: + app.kubernetes.io/name: {{ include "opentelemetry-collector-k8s-collector.fullname" . }} + app.kubernetes.io/instance: {{ .Release.Name }} + strategy: + type: RollingUpdate + template: + metadata: + annotations: + # This is here to allow us to do "zero-downtime" updates without an image change. + rollingUpdateVersion: "1" + charts.flowmill.com/version: {{ .Chart.Version }} + labels: + app.kubernetes.io/name: {{ include "opentelemetry-collector-k8s-collector.fullname" . }} + app.kubernetes.io/instance: {{ .Release.Name }} + spec: +{{- if .Values.imagePullSecrets }} + imagePullSecrets: +{{- range .Values.imagePullSecrets }} + - name: {{ . }} +{{- end }} +{{- end }} + containers: + - image: "{{ default .Values.images.repository .Values.k8sCollector.watcher.image.repository }}/{{ .Values.k8sCollector.watcher.image.name }}:{{ default .Values.images.tag .Values.k8sCollector.watcher.image.tag }}" + imagePullPolicy: {{ .Values.images.pullPolicy }} + name: k8s-watcher +{{- if hasKey .Values.k8sCollector.watcher "resources" }} + resources: +{{ toYaml .Values.k8sCollector.watcher.resources | indent 10 }} +{{- end }} + args: + - --log-console + {{- if hasKey .Values.log "level" }} + - --log-level={{ .Values.log.level }} + {{- end }} + # k8s-relay, which is a service that the k8s-watcher talks to. + # Currently not configurable, has to be reachable on localhost:8172, so must + # share a pod with the k8s-watcher above. 
+ - image: "{{ default .Values.images.repository .Values.k8sCollector.relay.image.repository }}/{{ .Values.k8sCollector.relay.image.name }}:{{ default .Values.images.tag .Values.k8sCollector.relay.image.tag }}" + imagePullPolicy: {{ .Values.images.pullPolicy }} + name: k8s-relay +{{- if hasKey .Values.k8sCollector.relay "resources" }} + resources: +{{ toYaml .Values.k8sCollector.relay.resources | indent 10 }} +{{- end }} + args: + - --config-file=/etc/network-explorer/config.yaml +{{- if .Values.log.console }} + - --log-console +{{- end }} +{{- if hasKey .Values.log "level" }} + - --{{ .Values.log.level }} +{{- end }} +{{- if hasKey .Values.k8sCollector.relay "log" -}} +{{- if hasKey .Values.k8sCollector.relay.log "whitelist" }} +{{- if hasKey .Values.k8sCollector.relay.log.whitelist "channel" }} + - --log-whitelist-channel={{ .Values.k8sCollector.relay.log.whitelist.channel }} +{{- end }} +{{- if hasKey .Values.k8sCollector.relay.log.whitelist "component" }} + - --log-whitelist-component={{ .Values.k8sCollector.relay.log.whitelist.component }} +{{- end }} +{{- if hasKey .Values.k8sCollector.relay.log.whitelist "cloudPlatform" }} + - --log-whitelist-cloud-platform={{ .Values.k8sCollector.relay.log.whitelist.cloudPlatform }} +{{- end }} +{{- end }} +{{- end }} +{{- if .Values.k8sCollector.relay.additionalArgs }} +{{ toYaml .Values.k8sCollector.relay.additionalArgs | indent 10 }} +{{- end }} + env: + - name: "EBPF_NET_CLUSTER_NAME" + value: {{ tpl (.Values.clusterName | toYaml) . }} +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.enabled) }} + - name: "EBPF_NET_DEBUG_MODE" + value: "true" +{{- end }} +{{- end }} +{{- if (default false .Values.k8sCollector.relay.runUnderGDB) }} + - name: "EBPF_NET_RUN_UNDER_GDB" + value: "gdb" +{{- end }} + - name: "EBPF_NET_INTAKE_HOST" + value: {{ include "opentelemetry-collector-reducer.fullname" . 
}} + - name: "EBPF_NET_INTAKE_PORT" + value: "{{ default 7000 .Values.reducer.telemetryPort }}" +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.storeMinidump) }} + - name: "EBPF_NET_MINIDUMP_DIR" + value: "/hostfs/var/run/network-explorer/minidump" +{{- end }} +{{- end }} +{{- if and .Values.debug.enabled .Values.debug.sendUnplannedExitMetric }} + - name: "EBPF_NET_CRASH_METRIC_HOST" + value: {{ .Values.otelCollector.address | quote }}{{/* env values must be YAML strings */}} + - name: "EBPF_NET_CRASH_METRIC_PORT" + value: {{ .Values.otelCollector.port | default 4317 | quote }}{{/* quoted: a bare 4317 is an int and is rejected by the API server */}} +{{- end }} +{{- if .Values.k8sCollector.relay.env }} +{{ toYaml .Values.k8sCollector.relay.env | indent 10 }} +{{- end }} + volumeMounts: + - mountPath: /etc/network-explorer + name: k8s-relay-config +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.storeMinidump) }} + - mountPath: /hostfs/var/run/network-explorer + name: host-var-run-network-explorer + readOnly: false +{{- end }} +{{- end }} + terminationGracePeriodSeconds: 30 + volumes: +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.storeMinidump) }} + - name: host-var-run-network-explorer + hostPath: + path: /var/run/network-explorer + type: DirectoryOrCreate +{{- end }} +{{- end }} + - name: k8s-relay-config + projected: + sources: + - configMap: + name: {{ include "opentelemetry-ebpf.fullname" . }}-config + items: + - key: config.yaml + path: config.yaml + securityContext: {} + serviceAccountName: {{ include "opentelemetry-collector-k8s-collector.serviceAccountName" . }} + {{- with .Values.k8sCollector.nodeSelector }} + nodeSelector: +{{ toYaml . | indent 8}} + {{- end }} + {{- with .Values.k8sCollector.affinity }} + affinity: +{{ toYaml . | indent 8 }} + {{- end }} + {{- with .Values.k8sCollector.tolerations }} + tolerations: +{{ toYaml . 
| indent 8 }} + {{- end }} +{{- end }} diff --git a/charts/opentelemetry-ebpf/templates/k8s-collector-serviceaccount.yaml b/charts/opentelemetry-ebpf/templates/k8s-collector-serviceaccount.yaml new file mode 100644 index 000000000..db5bd148e --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/k8s-collector-serviceaccount.yaml @@ -0,0 +1,8 @@ +{{- if and .Values.k8sCollector.enabled .Values.k8sCollector.serviceAccount.create -}} +apiVersion: v1 +kind: ServiceAccount +metadata: + name: {{ include "opentelemetry-collector-k8s-collector.serviceAccountName" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . | nindent 4 }} +{{- end -}} diff --git a/charts/opentelemetry-ebpf/templates/kernel-collector-clusterrole.yaml b/charts/opentelemetry-ebpf/templates/kernel-collector-clusterrole.yaml new file mode 100644 index 000000000..d0675a991 --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/kernel-collector-clusterrole.yaml @@ -0,0 +1,17 @@ +{{- if .Values.rbac.create -}} +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRole +metadata: + name: {{ include "opentelemetry-collector-kernel-collector.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . | nindent 4 }} +rules: +- apiGroups: + - policy + resourceNames: + - {{ include "opentelemetry-collector-kernel-collector.fullname" . }} + resources: + - podsecuritypolicies + verbs: + - use +{{- end -}} diff --git a/charts/opentelemetry-ebpf/templates/kernel-collector-clusterrolebinding.yaml b/charts/opentelemetry-ebpf/templates/kernel-collector-clusterrolebinding.yaml new file mode 100644 index 000000000..ca40a54f1 --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/kernel-collector-clusterrolebinding.yaml @@ -0,0 +1,16 @@ +{{- if .Values.rbac.create -}} +apiVersion: rbac.authorization.k8s.io/v1 +kind: ClusterRoleBinding +metadata: + name: {{ include "opentelemetry-collector-kernel-collector.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . 
| nindent 4 }} +roleRef: + apiGroup: rbac.authorization.k8s.io + kind: ClusterRole + name: {{ include "opentelemetry-collector-kernel-collector.fullname" . }} +subjects: +- kind: ServiceAccount + name: {{ include "opentelemetry-collector-kernel-collector.serviceAccountName" . }} + namespace: {{ .Release.Namespace }} +{{- end -}} diff --git a/charts/opentelemetry-ebpf/templates/kernel-collector-daemonset.yaml b/charts/opentelemetry-ebpf/templates/kernel-collector-daemonset.yaml new file mode 100644 index 000000000..32ea0e2ab --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/kernel-collector-daemonset.yaml @@ -0,0 +1,197 @@ +{{- if .Values.kernelCollector.enabled }} +# kernel collector daemonset: deploys the kernel collector to each node in the cluster. +# The kernel collector needs to be able to compile and install +# eBPF programs in the node's kernel, so needs to run as root and +# needs to mount /lib/modules and /usr/src from the node itself. +apiVersion: apps/v1 +kind: DaemonSet +metadata: + name: {{ include "opentelemetry-collector-kernel-collector.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . | nindent 4 }} +spec: + selector: + matchLabels: + app.kubernetes.io/name: {{ include "opentelemetry-collector-kernel-collector.fullname" . }} + app.kubernetes.io/instance: {{ .Release.Name }} + template: + metadata: + annotations: + release_number: "3" + charts.flowmill.com/version: {{ .Chart.Version }} + labels: + app.kubernetes.io/name: {{ include "opentelemetry-collector-kernel-collector.fullname" . }} + app.kubernetes.io/instance: {{ .Release.Name }} + spec: +{{- if .Values.imagePullSecrets }} + imagePullSecrets: +{{- range .Values.imagePullSecrets }} + - name: {{ . 
}} +{{- end }} +{{- end }} + containers: + - name: kernel-collector + image: "{{ default .Values.images.repository .Values.kernelCollector.image.repository }}/{{ .Values.kernelCollector.image.name }}:{{ default .Values.images.tag .Values.kernelCollector.image.tag }}" + imagePullPolicy: {{ .Values.images.pullPolicy }} + args: + - --config-file=/etc/network-explorer/config.yaml +{{- if .Values.kernelCollector.bpfDumpFile }} + - --bpf-dump-file={{ .Values.kernelCollector.bpfDumpFile }} +{{- end }} +{{- if (default false .Values.kernelCollector.useDockerMetadata) }} + - --force-docker-metadata +{{- end }} +{{- if not (default false .Values.kernelCollector.collectNomadMetadata) }} + - --disable-nomad-metadata +{{- end }} +{{- if .Values.kernelCollector.userlandTcp }} + - --enable-userland-tcp +{{- end }} +{{- if .Values.log.console }} + - --log-console +{{- end }} +{{- if hasKey .Values.log "level" }} + - --{{ .Values.log.level }} +{{- end }} +{{- if hasKey .Values.kernelCollector "log" }} +{{- if hasKey .Values.kernelCollector.log "whitelist" }} +{{- if hasKey .Values.kernelCollector.log.whitelist "agentLog" }} + - --log-whitelist-agent-log={{ .Values.kernelCollector.log.whitelist.agentLog }} +{{- end }} +{{- if hasKey .Values.kernelCollector.log.whitelist "channel" }} + - --log-whitelist-channel={{ .Values.kernelCollector.log.whitelist.channel }} +{{- end }} +{{- if hasKey .Values.kernelCollector.log.whitelist "component" }} + - --log-whitelist-component={{ .Values.kernelCollector.log.whitelist.component }} +{{- end }} +{{- if hasKey .Values.kernelCollector.log.whitelist "cloudPlatform" }} + - --log-whitelist-cloud-platform={{ .Values.kernelCollector.log.whitelist.cloudPlatform }} +{{- end }} +{{- end }} +{{- end }} +{{- if .Values.kernelCollector.additionalArgs }} +{{ toYaml .Values.kernelCollector.additionalArgs | indent 12 }} +{{- end }} + # TODO: liveness probe + env: + - name: "EBPF_NET_CLUSTER_NAME" + value: {{ tpl (.Values.clusterName | toYaml) . 
}} +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.enabled) }} + - name: "EBPF_NET_DEBUG_MODE" + value: "true" +{{- end }} +{{- end }} + - name: "EBPF_NET_DISABLE_HTTP_METRICS" + value: {{ quote (default false .Values.kernelCollector.disableHttpMetrics) }} +{{- if (default false .Values.kernelCollector.runUnderGDB) }} + - name: "EBPF_NET_RUN_UNDER_GDB" + value: "gdb" +{{- end }} + - name: "EBPF_NET_KERNEL_HEADERS_AUTO_FETCH" + value: {{ ne (toString .Values.kernelCollector.fetchKernelHeaders) "false" | quote }}{{/* sprig "default" treats false as unset, so compare explicitly; unset still means true */}} + - name: "EBPF_NET_INTAKE_HOST" + value: {{ include "opentelemetry-collector-reducer.fullname" . }} + - name: "EBPF_NET_INTAKE_PORT" + value: "{{ default 7000 .Values.reducer.telemetryPort }}" +{{- if .Values.kernelCollector.exportBpfSrcFile }} + - name: "EBPF_NET_EXPORT_BPF_SRC_FILE" + value: {{ quote .Values.kernelCollector.exportBpfSrcFile }} +{{- end }} + - name: "EBPF_NET_HOST_DIR" + value: "/hostfs" +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.storeMinidump) }} + - name: "EBPF_NET_MINIDUMP_DIR" + value: "/hostfs/var/run/network-explorer/minidump" +{{- end }} +{{- end }} +{{- if and .Values.debug.enabled .Values.debug.sendUnplannedExitMetric }} + - name: "EBPF_NET_CRASH_METRIC_HOST" + value: {{ .Values.otelCollector.address | quote }}{{/* env values must be YAML strings */}} + - name: "EBPF_NET_CRASH_METRIC_PORT" + value: {{ .Values.otelCollector.port | default 4317 | quote }}{{/* quoted: a bare 4317 is an int and is rejected by the API server */}} +{{- end }} +{{- if .Values.kernelCollector.env }} +{{ toYaml .Values.kernelCollector.env | indent 12 }} +{{- end }} +{{- if .Values.kernelCollector.resources }} + resources: +{{ toYaml .Values.kernelCollector.resources | indent 12 }} +{{- end }} + securityContext: + privileged: true + volumeMounts: + - mountPath: /hostfs/ + name: host-root + readOnly: true +{{- if ne (toString .Values.kernelCollector.fetchKernelHeaders) "false" }}{{/* must match the host-var-cache volume condition below */}} + - mountPath: /hostfs/var/cache + name: host-var-cache + readOnly: false +{{- end }} + - mountPath: /etc/network-explorer + name: {{ include "opentelemetry-ebpf.fullname" . 
}}-config + readOnly: true +{{- if (default false .Values.kernelCollector.useDockerMetadata) }} + - mountPath: /var/run/docker.sock + name: docker-sock + readOnly: false +{{- end }} +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.storeMinidump) }} + - mountPath: /hostfs/var/run/network-explorer + name: host-var-run-network-explorer + readOnly: false +{{- end }} +{{- end }} + dnsPolicy: ClusterFirstWithHostNet + hostNetwork: true + hostPID: true + serviceAccountName: {{ include "opentelemetry-collector-kernel-collector.serviceAccountName" . }} + volumes: + - name: {{ include "opentelemetry-ebpf.fullname" . }}-config + projected: + sources: + - configMap: + name: {{ include "opentelemetry-ebpf.fullname" . }}-config + items: + - key: config.yaml + path: config.yaml + - name: host-root + hostPath: + path: / + type: Directory +{{- if ne (toString .Values.kernelCollector.fetchKernelHeaders) "false" }}{{/* must match the host-var-cache volumeMount condition above */}} + - name: host-var-cache + hostPath: + path: /var/cache + type: DirectoryOrCreate +{{- end }} +{{- if hasKey .Values "debug" }} +{{- if (default false .Values.debug.storeMinidump) }} + - name: host-var-run-network-explorer + hostPath: + path: /var/run/network-explorer + type: DirectoryOrCreate +{{- end }} +{{- end }} +{{- if (default false .Values.kernelCollector.useDockerMetadata) }} + - name: docker-sock + hostPath: + path: /var/run/docker.sock + type: Socket +{{- end }} + {{- with .Values.kernelCollector.nodeSelector }} + nodeSelector: +{{ toYaml . | indent 8 }} + {{- end }} + {{- with .Values.kernelCollector.affinity }} + affinity: +{{ toYaml . | indent 8 }} + {{- end }} + {{- with .Values.kernelCollector.tolerations }} + tolerations: +{{ toYaml . 
| indent 8 }} + {{- end }} +{{- end }} diff --git a/charts/opentelemetry-ebpf/templates/kernel-collector-podsecuritypolicy.yaml b/charts/opentelemetry-ebpf/templates/kernel-collector-podsecuritypolicy.yaml new file mode 100644 index 000000000..c73112dbc --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/kernel-collector-podsecuritypolicy.yaml @@ -0,0 +1,38 @@ +{{- if .Values.podSecurityPolicy.enabled }} +apiVersion: policy/v1beta1 +kind: PodSecurityPolicy +metadata: + name: {{ include "opentelemetry-collector-kernel-collector.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . | nindent 4 }} +spec: + privileged: true + allowPrivilegeEscalation: true + allowedHostPaths: + - pathPrefix: /usr/src + readOnly: true + - pathPrefix: /lib/modules + readOnly: true + - pathPrefix: /etc + readOnly: true + - pathPrefix: /var/cache + readOnly: false + - pathPrefix: /sys/fs/cgroup + readOnly: true + fsGroup: + rule: RunAsAny + hostNetwork: true + hostPorts: + - max: 65535 + min: 0 + hostPID: true + readOnlyRootFilesystem: false + runAsUser: + rule: RunAsAny + seLinux: + rule: RunAsAny + supplementalGroups: + rule: RunAsAny + volumes: + - "*" +{{- end }} diff --git a/charts/opentelemetry-ebpf/templates/kernel-collector-serviceaccount.yaml b/charts/opentelemetry-ebpf/templates/kernel-collector-serviceaccount.yaml new file mode 100644 index 000000000..456136d5b --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/kernel-collector-serviceaccount.yaml @@ -0,0 +1,8 @@ +{{- if and .Values.kernelCollector.enabled .Values.kernelCollector.serviceAccount.create -}} +apiVersion: v1 +kind: ServiceAccount +metadata: + name: {{ include "opentelemetry-collector-kernel-collector.serviceAccountName" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . 
| nindent 4 }} +{{- end -}} diff --git a/charts/opentelemetry-ebpf/templates/reducer-deployment.yaml b/charts/opentelemetry-ebpf/templates/reducer-deployment.yaml new file mode 100644 index 000000000..6bc589cf4 --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/reducer-deployment.yaml @@ -0,0 +1,121 @@ +apiVersion: apps/v1 +kind: Deployment +metadata: + name: {{ include "opentelemetry-collector-reducer.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . | nindent 4 }} +spec: + replicas: 1 + strategy: + type: RollingUpdate + selector: + matchLabels: + app.kubernetes.io/name: {{ include "opentelemetry-collector-reducer.fullname" . }} + app.kubernetes.io/instance: {{ .Release.Name }} + template: + metadata: + labels: + app.kubernetes.io/name: {{ include "opentelemetry-collector-reducer.fullname" . }} + app.kubernetes.io/instance: {{ .Release.Name }} + spec: +{{- if .Values.imagePullSecrets }} + imagePullSecrets: +{{- range .Values.imagePullSecrets }} + - name: {{ . }} +{{- end }} +{{- end }} + containers: + - name: reducer + image: "{{ default .Values.images.repository .Values.reducer.image.repository }}/{{ .Values.reducer.image.name }}:{{ default .Values.images.tag .Values.reducer.image.tag }}" + imagePullPolicy: {{ .Values.images.pullPolicy }} + args: + - --port={{- .Values.reducer.telemetryPort }} + - --log-console + - --no-log-file + {{- if hasKey .Values.log "level" }} + - --{{ .Values.log.level }} + {{- end }} + - --enable-aws-enrichment + - --disable-prometheus-metrics + - --enable-otlp-grpc-metrics + - --otlp-grpc-metrics-host={{ .Values.otelCollector.address }} + - --otlp-grpc-metrics-port={{ .Values.otelCollector.port | default 4317 }} + {{- if .Values.reducer.disableMetrics }} + - --disable-metrics={{join "," .Values.reducer.disableMetrics}} + {{- end }} + {{- if .Values.reducer.enableMetrics }} + - --enable-metrics={{join "," .Values.reducer.enableMetrics}} + {{- end }} + {{- if .Values.reducer.ingestShards }} + - 
--num-ingest-shards={{- .Values.reducer.ingestShards }} + {{- end }} + {{- if .Values.reducer.matchingShards }} + - --num-matching-shards={{- .Values.reducer.matchingShards }} + {{- end }} + {{- if .Values.reducer.aggregationShards }} + - --num-aggregation-shards={{- .Values.reducer.aggregationShards }} + {{- end }} + {{- if .Values.reducer.extraArgs }} + {{- toYaml .Values.reducer.extraArgs | nindent 12 }} + {{- end }} + {{- if .Values.debug.enabled }} + env: + {{- if (default false .Values.debug.storeMinidump) }} + - name: "EBPF_NET_MINIDUMP_DIR" + value: "/hostfs/var/run/network-explorer/minidump" + {{- end }} + {{- if .Values.debug.sendUnplannedExitMetric }} + - name: "EBPF_NET_CRASH_METRIC_HOST" + value: {{ .Values.otelCollector.address | quote }}{{/* env values must be YAML strings */}} + - name: "EBPF_NET_CRASH_METRIC_PORT" + value: {{ .Values.otelCollector.port | default 4317 | quote }}{{/* quoted: a bare 4317 is an int and is rejected by the API server */}} + {{- end }} + {{- end }} + ports: + - name: telemetry + containerPort: {{ .Values.reducer.telemetryPort }} + protocol: TCP + {{- if not .Values.reducer.disableInternalMetrics }} + - name: stats + containerPort: {{ .Values.reducer.statsPromPort }} + protocol: TCP + {{- end }} + {{- if .Values.debug.enabled }} + volumeMounts: + {{- if (default false .Values.debug.storeMinidump) }} + - mountPath: /hostfs/var/run/network-explorer + name: host-var-run-network-explorer + readOnly: false + {{- end }} + {{- end }} + readinessProbe: + initialDelaySeconds: 5 + periodSeconds: 20 + timeoutSeconds: 5 + exec: + command: ['/srv/health_check.sh', 'readiness_probe', 'localhost', {{ quote .Values.reducer.telemetryPort }}] + {{- if .Values.resources }} + resources: + {{- toYaml .Values.resources | nindent 12 }} + {{- end }} + {{- with .Values.reducer.nodeSelector }} + nodeSelector: + {{- toYaml . | nindent 8 }} + {{- end }} + {{- with .Values.reducer.affinity }} + affinity: + {{- toYaml . | nindent 8 }} + {{- end }} + {{- with .Values.reducer.tolerations }} + tolerations: + {{- toYaml . 
| nindent 8 }} + {{- end }} + {{- if .Values.debug.enabled }} + volumes: + {{- if (default false .Values.debug.storeMinidump) }} + - name: host-var-run-network-explorer + hostPath: + path: /var/run/network-explorer + type: DirectoryOrCreate + {{- end }} + {{- end }} diff --git a/charts/opentelemetry-ebpf/templates/reducer-service.yaml b/charts/opentelemetry-ebpf/templates/reducer-service.yaml new file mode 100644 index 000000000..0f7028e10 --- /dev/null +++ b/charts/opentelemetry-ebpf/templates/reducer-service.yaml @@ -0,0 +1,22 @@ +apiVersion: v1 +kind: Service +metadata: + name: {{ include "opentelemetry-collector-reducer.fullname" . }} + labels: + {{- include "opentelemetry-ebpf.labels" . | nindent 4 }} +spec: + type: ClusterIP + selector: + app.kubernetes.io/name: {{ include "opentelemetry-collector-reducer.fullname" . }} + app.kubernetes.io/instance: {{ .Release.Name }} + ports: + - name: telemetry + port: {{ .Values.reducer.telemetryPort }} + targetPort: telemetry + protocol: TCP + {{- if not .Values.reducer.disableInternalMetrics }} + - name: stats + port: {{ .Values.reducer.statsPromPort }} + targetPort: stats + protocol: TCP + {{- end }} diff --git a/charts/opentelemetry-ebpf/values.schema.json b/charts/opentelemetry-ebpf/values.schema.json new file mode 100644 index 000000000..0eae4b477 --- /dev/null +++ b/charts/opentelemetry-ebpf/values.schema.json @@ -0,0 +1,176 @@ +{ + "$schema": "http://json-schema.org/schema#", + "type": "object", + "title": "Values", + "additionalProperties": false, + "properties": { + "global": { + "type": "object" + }, + "nameOverride": { + "description": "Override name of the chart used in Kubernetes object names.", + "type": "string" + }, + "fullnameOverride": { + "description": "Override fully qualified app name.", + "type": "string" + }, + "clusterName": { + "description": "Cluster Name", + "type": "string" + }, + "otelCollector": { + "type": "object", + "additionalProperties": false, + "required": [ + "address" + ], + 
"properties": { + "address": { + "type": "string" + }, + "port": { + "type": ["string", "integer"] + } + } + }, + "resources": { + "type": "object", + "additionalProperties": false, + "properties": { + "limits": { + "type": "object", + "additionalProperties": false, + "properties": { + "cpu": { + "type": [ + "string", + "integer" + ] + }, + "memory": { + "type": "string" + } + } + }, + "requests": { + "type": "object", + "additionalProperties": false, + "properties": { + "cpu": { + "type": [ + "string", + "integer" + ] + }, + "memory": { + "type": "string" + } + } + } + } + }, + "images": { + "description": "images", + "type": "object", + "additionalProperties": false, + "properties": { + "tag": { + "type": "string" + }, + "repository": { + "type": "string" + }, + "pullPolicy": { + "type": "string", + "enum": [ + "IfNotPresent", + "Always", + "Never" + ] + } + } + }, + "imagePullSecrets": { + "type": "array", + "items": { + "type": "string" + } + }, + "log": { + "type": "object", + "additionalProperties": false, + "properties": { + "console": { + "type": "boolean" + }, + "level": { + "type": "string", + "enum": [ + "error", + "warning", + "info", + "debug", + "trace" + ] + } + } + }, + "debug": { + "type": "object", + "additionalProperties": false, + "properties": { + "enabled": { + "type": "boolean" + }, + "storeMinidump": { + "type": "boolean" + }, + "sendUnplannedExitMetric": { + "type": "boolean" + } + } + }, + "kernelCollector": { + "type": "object", + "additionalProperties": true + }, + "cloudCollector": { + "type": "object", + "additionalProperties": true + }, + "k8sCollector": { + "type": "object", + "additionalProperties": true + }, + "reducer": { + "type": "object", + "additionalProperties": true + }, + "rbac": { + "type": "object", + "additionalProperties": false, + "properties": { + "create": { + "type": "boolean" + } + } + }, + "podSecurityPolicy": { + "type": "object", + "additionalProperties": false, + "properties": { + "enabled": { + "type": "boolean" + }, + 
"annotations": { + "type": "object", + "additionalProperties": true + } + } + } + }, + "required": [ + "clusterName" + ] +} diff --git a/charts/opentelemetry-ebpf/values.yaml b/charts/opentelemetry-ebpf/values.yaml new file mode 100644 index 000000000..6d02e918d --- /dev/null +++ b/charts/opentelemetry-ebpf/values.yaml @@ -0,0 +1,275 @@ +# Default values for opentelemetry-ebpf. +# This is a YAML-formatted file. +# Declare variables to be passed into your templates. + +nameOverride: "" +fullnameOverride: "" + +clusterName: ""  # listed as required in values.schema.json + +images: + tag: "v0.10.0" + repository: otel + pullPolicy: IfNotPresent + +imagePullSecrets: [] + +resources: {} + +otelCollector: + address: ""  # listed as required in values.schema.json + port: "" + +log: + console: false + # possible values: { error | warning | info | debug | trace } + level: warning + +debug: + enabled: false + storeMinidump: false + sendUnplannedExitMetric: false + +kernelCollector: + enabled: true + serviceAccount: + create: true + name: "" + image: + repository: "" + tag: "" + name: opentelemetry-ebpf-kernel-collector + + nodeSelector: {} + disableHttpMetrics: false + + tolerations: + - operator: "Exists" + effect: "NoExecute" + - operator: "Exists" + effect: "NoSchedule" + + affinity: {} + resources: {} + + # uncomment the line below to disable automatic kernel headers fetching + # fetchKernelHeaders: false + + # uncomment to enable enrichment using Docker metadata + # useDockerMetadata: true + + # uncomment to enable enrichment using Nomad metadata (https://www.nomadproject.io/) + # collectNomadMetadata: true + +cloudCollector: + enabled: false + image: + repository: "" + tag: "" + name: opentelemetry-ebpf-cloud-collector + + serviceAccount: + create: true + name: "" + annotations: + {} + ## eks.amazonaws.com/role-arn: "role-arn-name" + + tolerations: [] + affinity: {} + +k8sCollector: + enabled: true + serviceAccount: + create: true + name: "" + relay: + image: + repository: "" + tag: "" + name: opentelemetry-ebpf-k8s-relay +
watcher: + image: + repository: "" + tag: "" + name: opentelemetry-ebpf-k8s-watcher + + tolerations: [] + affinity: {} + +reducer: + image: + repository: "" + tag: "" + name: opentelemetry-ebpf-reducer + extraArgs: {} + ingestShards: 1 + matchingShards: 1 + aggregationShards: 1 + disableInternalMetrics: true  # when false, the reducer Service also exposes the "stats" port (statsPromPort) + disableMetrics: + [] + ### to disable an entire metric category: ### + # - tcp.all + # - udp.all + # - dns.all + # - http.all + ### to disable an individual metric: ### + ### tcp ### + # - tcp.bytes + # - tcp.rtt.num_measurements + # - tcp.active + # - tcp.rtt.average + # - tcp.packets + # - tcp.retrans + # - tcp.syn_timeouts + # - tcp.new_sockets + # - tcp.resets + ### udp ### + # - udp.bytes + # - udp.packets + # - udp.active + # - udp.drops + ### dns ### + # - dns.client.duration.average + # - dns.server.duration.average + # - dns.active_sockets + # - dns.responses + # - dns.timeouts + ### http ### + # - http.client.duration.average + # - http.server.duration.average + # - http.active_sockets + # - http.status_code + ### ebpf_net ### + # - ebpf_net.span_utilization_fraction + # - ebpf_net.pipeline_metric_bytes_discarded + # - ebpf_net.codetiming_min_ns + # - ebpf_net.entrypoint_info + # - ebpf_net.otlp_grpc.requests_sent + # - ebpf_net.connections + # - ebpf_net.rpc_queue_elem_utilization_fraction + # - ebpf_net.disconnects + # - ebpf_net.codetiming_avg_ns + # - ebpf_net.client_handle_pool + # - ebpf_net.otlp_grpc.successful_requests + # - ebpf_net.span_utilization + # - ebpf_net.up + # - ebpf_net.rpc_queue_buf_utilization_fraction + # - ebpf_net.collector_log_count + # - ebpf_net.time_since_last_message_ns + # - ebpf_net.bpf_log + # - ebpf_net.codetiming_count + # - ebpf_net.message + # - ebpf_net.otlp_grpc.bytes_sent + # - ebpf_net.pipeline_message_error + # - ebpf_net.pipeline_metric_bytes_written + # - ebpf_net.codetiming_max_ns + # - ebpf_net.span_utilization_max + # - ebpf_net.client_handle_pool_fraction + # - ebpf_net.span_utilization_fraction + # -
ebpf_net.rpc_latency_ns + # - ebpf_net.agg_root_truncation + # - ebpf_net.clock_offset_ns + # - ebpf_net.otlp_grpc.metrics_sent + # - ebpf_net.otlp_grpc.unknown_response_tags + # - ebpf_net.collector_health + # - ebpf_net.codetiming_sum_ns + # - ebpf_net.otlp_grpc.failed_requests + # - ebpf_net.rpc_queue_buf_utilization + ### to enable all metrics (including metrics turned off by default): ### + # - none + enableMetrics: + [] + ### disableMetrics is evaluated first; enableMetrics is applied afterwards. ### + ### to enable an entire metric category: ### + # - tcp.all + # - udp.all + # - dns.all + # - http.all + # - ebpf_net.all + ### to enable an individual metric: ### + ### tcp ### + # - tcp.bytes + # - tcp.rtt.num_measurements + # - tcp.active + # - tcp.rtt.average + # - tcp.packets + # - tcp.retrans + # - tcp.syn_timeouts + # - tcp.new_sockets + # - tcp.resets + ### udp ### + # - udp.bytes + # - udp.packets + # - udp.active + # - udp.drops + ### dns ### + # - dns.client.duration.average + # - dns.server.duration.average + # - dns.active_sockets + # - dns.responses + # - dns.timeouts + ### http ### + # - http.client.duration.average + # - http.server.duration.average + # - http.active_sockets + # - http.status_code + ### ebpf_net ### + # - ebpf_net.span_utilization_fraction + # - ebpf_net.pipeline_metric_bytes_discarded + # - ebpf_net.codetiming_min_ns + # - ebpf_net.entrypoint_info + # - ebpf_net.otlp_grpc.requests_sent + # - ebpf_net.connections + # - ebpf_net.rpc_queue_elem_utilization_fraction + # - ebpf_net.disconnects + # - ebpf_net.codetiming_avg_ns + # - ebpf_net.client_handle_pool + # - ebpf_net.otlp_grpc.successful_requests + # - ebpf_net.span_utilization + # - ebpf_net.up + # - ebpf_net.rpc_queue_buf_utilization_fraction + # - ebpf_net.collector_log_count + # - ebpf_net.time_since_last_message_ns + # - ebpf_net.bpf_log + # - ebpf_net.codetiming_count + # - ebpf_net.message + # - ebpf_net.otlp_grpc.bytes_sent + # -
ebpf_net.pipeline_message_error + # - ebpf_net.pipeline_metric_bytes_written + # - ebpf_net.codetiming_max_ns + # - ebpf_net.span_utilization_max + # - ebpf_net.client_handle_pool_fraction + # - ebpf_net.span_utilization_fraction + # - ebpf_net.rpc_latency_ns + # - ebpf_net.agg_root_truncation + # - ebpf_net.clock_offset_ns + # - ebpf_net.otlp_grpc.metrics_sent + # - ebpf_net.otlp_grpc.unknown_response_tags + # - ebpf_net.collector_health + # - ebpf_net.codetiming_sum_ns + # - ebpf_net.otlp_grpc.failed_requests + # - ebpf_net.rpc_queue_buf_utilization + telemetryPort: 7000  # port of the reducer Service's "telemetry" entry + statsPromPort: 7001  # port of the reducer Service's "stats" entry (rendered only when disableInternalMetrics is false) + resources: {} + nodeSelector: {} + tolerations: [] + affinity: {} + +rbac: + create: true + +podSecurityPolicy: + enabled: true  # NOTE(review): PodSecurityPolicy was removed in Kubernetes v1.25 - confirm this default on newer clusters + annotations: + {} + ## Specify pod annotations + ## Ref: https://kubernetes.io/docs/concepts/policy/pod-security-policy/#apparmor + ## Ref: https://kubernetes.io/docs/concepts/policy/pod-security-policy/#seccomp + ## Ref: https://kubernetes.io/docs/concepts/policy/pod-security-policy/#sysctl + ## + # seccomp.security.alpha.kubernetes.io/allowedProfileNames: '*' + # seccomp.security.alpha.kubernetes.io/defaultProfileName: 'docker/default' + # apparmor.security.beta.kubernetes.io/defaultProfileName: 'runtime/default'