3554 lines
133 KiB
YAML
3554 lines
133 KiB
YAML
|
global:
|
|||
|
# zone: cluster.local (use only if your DNS server doesn't live in the same zone as kubecost)
|
|||
|
prometheus:
|
|||
|
enabled: true # Kubecost depends on Prometheus data, it is not optional. When enabled: false, Prometheus will not be installed and you must configure your own Prometheus to scrape kubecost as well as provide the fqdn below. -- Warning: Before changing this setting, please read to understand the risks https://docs.kubecost.com/install-and-configure/install/custom-prom
|
|||
|
fqdn: http://cost-analyzer-prometheus-server.default.svc # example address of a prometheus to connect to. Include protocol (http:// or https://) Ignored if enabled: true
|
|||
|
# insecureSkipVerify: false # If true, kubecost will not check the TLS cert of prometheus
|
|||
|
# queryServiceBasicAuthSecretName: dbsecret # kubectl create secret generic dbsecret -n kubecost --from-file=USERNAME --from-file=PASSWORD
|
|||
|
# queryServiceBearerTokenSecretName: mcdbsecret # kubectl create secret generic mcdbsecret -n kubecost --from-file=TOKEN
|
|||
|
|
|||
|
grafana:
|
|||
|
enabled: true # If false, Grafana will not be installed
|
|||
|
domainName: cost-analyzer-grafana.default.svc # example grafana domain Ignored if enabled: true
|
|||
|
scheme: "http" # http or https, for the domain name above.
|
|||
|
proxy: true # If true, the kubecost frontend will route to your grafana through its service endpoint
|
|||
|
# fqdn: cost-analyzer-grafana.default.svc
|
|||
|
|
|||
|
# Enable only when you are using GCP Marketplace ENT listing. Learn more at https://console.cloud.google.com/marketplace/product/kubecost-public/kubecost-ent
|
|||
|
gcpstore:
|
|||
|
enabled: false
|
|||
|
|
|||
|
# Google Cloud Managed Service for Prometheus
|
|||
|
gmp:
|
|||
|
# Remember to set up these parameters when install the Kubecost Helm chart with `global.gmp.enabled=true` if you want to use GMP self-deployed collection (Recommended) to utilize Kubecost scrape configs.
|
|||
|
# If enabling GMP, it is highly recommended to utilize Google's distribution of Prometheus.
|
|||
|
# Learn more at https://cloud.google.com/stackdriver/docs/managed-prometheus/setup-unmanaged
|
|||
|
# --set prometheus.server.image.repository="gke.gcr.io/prometheus-engine/prometheus" \
|
|||
|
# --set prometheus.server.image.tag="v2.35.0-gmp.2-gke.0"
|
|||
|
enabled: false # If true, kubecost will be configured to use GMP Prometheus image and query from Google Cloud Managed Service for Prometheus.
|
|||
|
prometheusServerEndpoint: http://localhost:8085/ # The prometheus service endpoint used by kubecost. The calls are forwarded through the GMP Prom proxy side car to the GMP database.
|
|||
|
gmpProxy:
|
|||
|
enabled: false
|
|||
|
image: gke.gcr.io/prometheus-engine/frontend:v0.4.1-gke.0 # GMP Prometheus proxy image that serve as an endpoint to query metrics from GMP
|
|||
|
imagePullPolicy: IfNotPresent
|
|||
|
name: gmp-proxy
|
|||
|
port: 8085
|
|||
|
projectId: YOUR_PROJECT_ID # example GCP project ID
|
|||
|
|
|||
|
# Amazon Managed Service for Prometheus
|
|||
|
amp:
|
|||
|
enabled: false # If true, kubecost will be configured to remote_write and query from Amazon Managed Service for Prometheus.
|
|||
|
prometheusServerEndpoint: http://localhost:8005/workspaces/<workspaceId>/ # The prometheus service endpoint used by kubecost. The calls are forwarded through the SigV4Proxy side car to the AMP workspace.
|
|||
|
remoteWriteService: https://aps-workspaces.us-west-2.amazonaws.com/workspaces/<workspaceId>/api/v1/remote_write # The remote_write endpoint for the AMP workspace.
|
|||
|
sigv4:
|
|||
|
region: us-west-2
|
|||
|
# access_key: ACCESS_KEY # AWS Access key
|
|||
|
# secret_key: SECRET_KEY # AWS Secret key
|
|||
|
# role_arn: ROLE_ARN # AWS role arn
|
|||
|
# profile: PROFILE # AWS profile
|
|||
|
|
|||
|
# Mimir Proxy to help Kubecost to query metrics from multi-tenant Grafana Mimir.
|
|||
|
# Set `global.mimirProxy.enabled=true` and `global.prometheus.enabled=false` to enable Mimir Proxy.
|
|||
|
# You also need to set `global.prometheus.fqdn=http://kubecost-cost-analyzer-mimir-proxy.kubecost.svc:8085/prometheus`
|
|||
|
# or `global.prometheus.fqdn=http://{{ template "cost-analyzer.fullname" . }}-mimir-proxy.{{ .Release.Namespace }}.svc:8085/prometheus'
|
|||
|
# Learn more at https://grafana.com/docs/mimir/latest/operators-guide/secure/authentication-and-authorization/#without-an-authenticating-reverse-proxy
|
|||
|
mimirProxy:
|
|||
|
enabled: false
|
|||
|
name: mimir-proxy
|
|||
|
image: nginxinc/nginx-unprivileged
|
|||
|
port: 8085
|
|||
|
mimirEndpoint: $mimir_endpoint # Your Mimir query endpoint. If your Mimir query endpoint is http://example.com/prometheus, replace $mimir_endpoint with http://example.com/
|
|||
|
orgIdentifier: $your_tenant_ID # Your Grafana Mimir tenant ID
|
|||
|
# basicAuth:
|
|||
|
# username: user
|
|||
|
# password: pwd
|
|||
|
|
|||
|
# Azure Monitor Managed Service for Prometheus
|
|||
|
# See https://github.com/MicrosoftDocs/azure-docs/blob/main/articles/azure-monitor/essentials/prometheus-metrics-overview.md for information
|
|||
|
# and https://learn.microsoft.com/en-us/azure/azure-monitor/essentials/prometheus-remote-write-virtual-machines for more information on setting this up
|
|||
|
ammsp:
|
|||
|
enabled: false
|
|||
|
prometheusServerEndpoint: http://localhost:8081/
|
|||
|
remoteWriteService: $<AMMSP_METRICS_INGESTION_ENDPOINT>
|
|||
|
queryEndpoint: $<AMMSP_QUERY_ENDPOINT>
|
|||
|
|
|||
|
aadAuthProxy:
|
|||
|
enabled: false
|
|||
|
# per https://github.com/Azure/aad-auth-proxy/releases/tag/0.1.0-main-04-10-2024-7067ac84
|
|||
|
image: $<IMAGE> # Example: mcr.microsoft.com/azuremonitor/auth-proxy/prod/aad-auth-proxy/images/aad-auth-proxy:0.1.0-main-04-10-2024-7067ac84
|
|||
|
imagePullPolicy: IfNotPresent
|
|||
|
name: aad-auth-proxy
|
|||
|
port: 8081
|
|||
|
audience: https://prometheus.monitor.azure.com/.default
|
|||
|
identityType: userAssigned
|
|||
|
aadClientId: $<AZURE_MANAGED_IDENTITY_CLIENT_ID>
|
|||
|
aadTenantId: $<AZURE_MANAGED_IDENTITY_TENANT_ID>
|
|||
|
|
|||
|
notifications:
|
|||
|
# Kubecost alerting configuration
|
|||
|
# Ref: http://docs.kubecost.com/alerts
|
|||
|
# alertConfigs:
|
|||
|
# frontendUrl: http://localhost:9090 # optional, used for linkbacks
|
|||
|
# globalSlackWebhookUrl: https://hooks.slack.com/services/T00000000/B00000000/XXXXXXXXXXXXXXXXXXXXXXXX # optional, used for Slack alerts
|
|||
|
# globalMsTeamsWebhookUrl: https://xxxxx.webhook.office.com/webhookb2/XXXXXXXXXXXXXXXXXXXXXXXX/IncomingWebhook/XXXXXXXXXXXXXXXXXXXXXXXX # optional, used for Microsoft Teams alerts
|
|||
|
# globalAlertEmails:
|
|||
|
# - recipient@example.com
|
|||
|
# - additionalRecipient@example.com
|
|||
|
# globalEmailSubject: Custom Subject
|
|||
|
# Alerts generated by kubecost, about cluster data
|
|||
|
# alerts:
|
|||
|
# Daily namespace budget alert on namespace `kubecost`
|
|||
|
# - type: budget # supported: budget, recurringUpdate
|
|||
|
# threshold: 50 # optional, required for budget alerts
|
|||
|
# window: daily # or 1d
|
|||
|
# aggregation: namespace
|
|||
|
# filter: kubecost
|
|||
|
# ownerContact: # optional, overrides globalAlertEmails default
|
|||
|
# - owner@example.com
|
|||
|
# - owner2@example.com
|
|||
|
# # optional, used for alert-specific Slack and Microsoft Teams alerts
|
|||
|
# slackWebhookUrl: https://hooks.slack.com/services/T00000000/B00000000/XXXXXXXXXXXXXXXXXXXXXXXX
|
|||
|
# msTeamsWebhookUrl: https://xxxxx.webhook.office.com/webhookb2/XXXXXXXXXXXXXXXXXXXXXXXX/IncomingWebhook/XXXXXXXXXXXXXXXXXXXXXXXX
|
|||
|
|
|||
|
# Daily cluster budget alert on cluster `cluster-one`
|
|||
|
# - type: budget
|
|||
|
# threshold: 200.8 # optional, required for budget alerts
|
|||
|
# window: daily # or 1d
|
|||
|
# aggregation: cluster
|
|||
|
# filter: cluster-one # does not accept csv
|
|||
|
|
|||
|
# Recurring weekly update (weeklyUpdate alert)
|
|||
|
# - type: recurringUpdate
|
|||
|
# window: weekly # or 7d
|
|||
|
# aggregation: namespace
|
|||
|
# filter: '*'
|
|||
|
|
|||
|
# Recurring weekly namespace update on kubecost namespace
|
|||
|
# - type: recurringUpdate
|
|||
|
# window: weekly # or 7d
|
|||
|
# aggregation: namespace
|
|||
|
# filter: kubecost
|
|||
|
|
|||
|
# Spend Change Alert
|
|||
|
# - type: spendChange # change relative to moving avg
|
|||
|
# relativeThreshold: 0.20 # Proportional change relative to baseline. Must be greater than -1 (can be negative)
|
|||
|
# window: 1d # accepts ‘d’, ‘h’
|
|||
|
# baselineWindow: 30d # previous window, offset by window
|
|||
|
# aggregation: namespace
|
|||
|
# filter: kubecost, default # accepts csv
|
|||
|
|
|||
|
# Health Score Alert
|
|||
|
# - type: health # Alerts when health score changes by a threshold
|
|||
|
# window: 10m
|
|||
|
# threshold: 5 # Send Alert if health scores changes by 5 or more
|
|||
|
|
|||
|
# Kubecost Health Diagnostic
|
|||
|
# - type: diagnostic # Alerts when kubecost is unable to compute costs - ie: Prometheus unreachable
|
|||
|
# window: 10m
|
|||
|
|
|||
|
alertmanager: # Supply an alertmanager FQDN to receive notifications from the app.
|
|||
|
enabled: false # If true, allow kubecost to write to your alertmanager
|
|||
|
fqdn: http://cost-analyzer-prometheus-server.default.svc # example fqdn. Ignored if prometheus.enabled: true
|
|||
|
|
|||
|
# Set saved Cost Allocation report(s) accessible from /reports
|
|||
|
# Ref: http://docs.kubecost.com/saved-reports
|
|||
|
savedReports:
|
|||
|
enabled: false # If true, overwrites report parameters set through UI
|
|||
|
reports:
|
|||
|
- title: "Example Saved Report 0"
|
|||
|
window: "today"
|
|||
|
aggregateBy: "namespace"
|
|||
|
chartDisplay: "category"
|
|||
|
idle: "separate"
|
|||
|
rate: "cumulative"
|
|||
|
accumulate: false # daily resolution
|
|||
|
filters: # Ref: https://docs.kubecost.com/apis/filters-api
|
|||
|
- key: "cluster" # Ref: https://docs.kubecost.com/apis/filters-api#allocation-apis-request-sizing-v2-api
|
|||
|
operator: ":" # Ref: https://docs.kubecost.com/apis/filters-api#filter-operators
|
|||
|
value: "dev"
|
|||
|
- title: "Example Saved Report 1"
|
|||
|
window: "month"
|
|||
|
aggregateBy: "controllerKind"
|
|||
|
chartDisplay: "category"
|
|||
|
idle: "share"
|
|||
|
rate: "monthly"
|
|||
|
accumulate: false
|
|||
|
filters: # Ref: https://docs.kubecost.com/apis/filters-api
|
|||
|
- key: "namespace" # Ref: https://docs.kubecost.com/apis/filters-api#allocation-apis-request-sizing-v2-api
|
|||
|
operator: "!:" # Ref: https://docs.kubecost.com/apis/filters-api#filter-operators
|
|||
|
value: "kubecost"
|
|||
|
- title: "Example Saved Report 2"
|
|||
|
window: "2020-11-11T00:00:00Z,2020-12-09T23:59:59Z"
|
|||
|
aggregateBy: "service"
|
|||
|
chartDisplay: "category"
|
|||
|
idle: "hide"
|
|||
|
rate: "daily"
|
|||
|
accumulate: true # entire window resolution
|
|||
|
filters: [] # if no filters, specify empty array
|
|||
|
|
|||
|
# Set saved Asset report(s) accessible from /reports
|
|||
|
# Ref: http://docs.kubecost.com/saved-reports
|
|||
|
assetReports:
|
|||
|
enabled: false # If true, overwrites report parameters set through UI
|
|||
|
reports:
|
|||
|
- title: "Example Asset Report 0"
|
|||
|
window: "today"
|
|||
|
aggregateBy: "type"
|
|||
|
accumulate: false # daily resolution
|
|||
|
filters:
|
|||
|
- property: "cluster"
|
|||
|
value: "cluster-one"
|
|||
|
|
|||
|
# Set saved Cloud Cost report(s) accessible from /reports
|
|||
|
# Ref: http://docs.kubecost.com/saved-reports
|
|||
|
cloudCostReports:
|
|||
|
enabled: false # If true, overwrites report parameters set through UI
|
|||
|
reports:
|
|||
|
- title: "Cloud Cost Report 0"
|
|||
|
window: "today"
|
|||
|
aggregateBy: "service"
|
|||
|
accumulate: false # daily resolution
|
|||
|
# filters:
|
|||
|
# - property: "service"
|
|||
|
# value: "service1" # corresponds to a value to filter cloud cost aggregate by service data on.
|
|||
|
|
|||
|
podAnnotations: {}
|
|||
|
# iam.amazonaws.com/role: role-arn
|
|||
|
|
|||
|
# Applies these labels to all Deployments, StatefulSets, DaemonSets, and their pod templates.
|
|||
|
additionalLabels: {}
|
|||
|
|
|||
|
securityContext:
|
|||
|
runAsNonRoot: true
|
|||
|
seccompProfile:
|
|||
|
type: RuntimeDefault
|
|||
|
fsGroup: 1001
|
|||
|
runAsGroup: 1001
|
|||
|
runAsUser: 1001
|
|||
|
fsGroupChangePolicy: OnRootMismatch
|
|||
|
containerSecurityContext:
|
|||
|
allowPrivilegeEscalation: false
|
|||
|
privileged: false
|
|||
|
readOnlyRootFilesystem: true
|
|||
|
capabilities:
|
|||
|
drop:
|
|||
|
- ALL
|
|||
|
|
|||
|
# Platforms is a higher-level abstraction for platform-specific values and settings.
|
|||
|
platforms:
|
|||
|
# Deploying to OpenShift (OCP) requires enabling this option.
|
|||
|
openshift:
|
|||
|
enabled: false # Deploy Kubecost to OpenShift.
|
|||
|
route:
|
|||
|
enabled: false # Create an OpenShift Route.
|
|||
|
annotations: {} # Add annotations to the Route.
|
|||
|
# host: kubecost.apps.okd4.example.com # Add a custom host for your Route.
|
|||
|
# Create Security Context Constraint resources for the DaemonSets requiring additional privileges.
|
|||
|
scc:
|
|||
|
nodeExporter: false # Creates an SCC for Prometheus Node Exporter. This requires Node Exporter be enabled.
|
|||
|
networkCosts: false # Creates an SCC for Kubecost network-costs. This requires network-costs be enabled.
|
|||
|
# When OpenShift is enabled, the following securityContext will be applied to all resources unless they define their own.
|
|||
|
securityContext:
|
|||
|
runAsNonRoot: true
|
|||
|
seccompProfile:
|
|||
|
type: RuntimeDefault
|
|||
|
# Set options for deploying with CI/CD tools like Argo CD.
|
|||
|
cicd:
|
|||
|
enabled: false # Set to true when using affected CI/CD tools for access to the below configuration options.
|
|||
|
skipSanityChecks: false # If true, skip all sanity/existence checks for resources like Secrets.
|
|||
|
|
|||
|
## Kubecost Integrations
|
|||
|
## Ref: https://docs.kubecost.com/integrations
|
|||
|
##
|
|||
|
integrations:
|
|||
|
postgres:
|
|||
|
enabled: false
|
|||
|
runInterval: "12h" # How frequently to run the integration.
|
|||
|
databaseHost: "" # REQUIRED. ex: my.postgres.database.azure.com
|
|||
|
databasePort: "" # REQUIRED. ex: 5432
|
|||
|
databaseName: "" # REQUIRED. ex: postgres
|
|||
|
databaseUser: "" # REQUIRED. ex: myusername
|
|||
|
databasePassword: "" # REQUIRED. ex: mypassword
|
|||
|
databaseSecretName: "" # OPTIONAL. Specify your own k8s secret containing the above credentials. Must have key "creds.json".
|
|||
|
|
|||
|
## Configure what Postgres table to write to, and what parameters to pass
|
|||
|
## when querying Kubecost's APIs. Ensure all parameters are enclosed in
|
|||
|
## quotes. Ref: https://docs.kubecost.com/apis/apis-overview
|
|||
|
queryConfigs:
|
|||
|
allocations: []
|
|||
|
# - databaseTable: "kubecost_allocation_data"
|
|||
|
# window: "7d"
|
|||
|
# aggregate: "namespace"
|
|||
|
# idle: "true"
|
|||
|
# shareIdle: "true"
|
|||
|
# shareNamespaces: "kubecost,kube-system"
|
|||
|
# shareLabels: ""
|
|||
|
# - databaseTable: "kubecost_allocation_data_by_cluster"
|
|||
|
# window: "10d"
|
|||
|
# aggregate: "cluster"
|
|||
|
# idle: "true"
|
|||
|
# shareIdle: "false"
|
|||
|
# shareNamespaces: ""
|
|||
|
# shareLabels: ""
|
|||
|
assets: []
|
|||
|
# - databaseTable: "kubecost_assets_data"
|
|||
|
# window: "7d"
|
|||
|
# aggregate: "cluster"
|
|||
|
cloudCosts: []
|
|||
|
# - databaseTable: "kubecost_cloudcosts_data"
|
|||
|
# window: "7d"
|
|||
|
# aggregate: "service"
|
|||
|
|
|||
|
## Provide a name override for the chart.
|
|||
|
# nameOverride: ""
|
|||
|
## Provide a full name override option for the chart.
|
|||
|
# fullnameOverride: ""
|
|||
|
|
|||
|
## This flag is only required for users upgrading to a new version of Kubecost.
|
|||
|
## The flag is used to ensure users are aware of important
|
|||
|
## (potentially breaking) changes included in the new version.
|
|||
|
##
|
|||
|
upgrade:
|
|||
|
toV2: false
|
|||
|
|
|||
|
# generated at http://kubecost.com/install, used for alerts tracking and free trials
|
|||
|
kubecostToken: # ""
|
|||
|
|
|||
|
# Advanced pipeline for custom prices, enterprise key required
|
|||
|
pricingCsv:
|
|||
|
enabled: false
|
|||
|
location:
|
|||
|
provider: "AWS"
|
|||
|
region: "us-east-1"
|
|||
|
URI: s3://kc-csv-test/pricing_schema.csv # a valid file URI
|
|||
|
csvAccessCredentials: pricing-schema-access-secret
|
|||
|
|
|||
|
# SAML integration for user management and RBAC, enterprise key required
|
|||
|
# Ref: https://github.com/kubecost/docs/blob/main/user-management.md
|
|||
|
saml:
|
|||
|
enabled: false
|
|||
|
# secretName: "kubecost-authzero"
|
|||
|
# metadataSecretName: "kubecost-authzero-metadata" # One of metadataSecretName or idpMetadataURL must be set. defaults to metadataURL if set
|
|||
|
# idpMetadataURL: "https://dev-elu2z98r.auth0.com/samlp/metadata/c6nY4M37rBP0qSO1IYIqBPPyIPxLS8v2"
|
|||
|
# appRootURL: "http://localhost:9090" # sample URL
|
|||
|
# authTimeout: 1440 # number of minutes the JWT will be valid
|
|||
|
# redirectURL: "https://dev-elu2z98r.auth0.com/v2/logout" # callback URL redirected to after logout
|
|||
|
# audienceURI: "http://localhost:9090" # by convention, the same as the appRootURL, but any string uniquely identifying kubecost to your samp IDP. Optional if you follow the convention
|
|||
|
# nameIDFormat: "urn:oasis:names:tc:SAML:1.1:nameid-format:unspecified" If your SAML provider requires a specific nameid format
|
|||
|
# isGLUUProvider: false # An additional URL parameter must be appended for GLUU providers
|
|||
|
# encryptionCertSecret: "kubecost-saml-cert" # k8s secret where the x509 certificate used to encrypt an Okta saml response is stored
|
|||
|
# decryptionKeySecret: "kubecost-sank-decryption-key" # k8s secret where the private key associated with the encryptionCertSecret is stored
|
|||
|
# authSecret: "random-string" # value of SAML secret used to issue tokens, will be autogenerated as random string if not provided
|
|||
|
# authSecretName: "kubecost-saml-secret" # name of k8s secret where the authSecret will be stored, defaults to "kubecost-saml-secret" if not provided
|
|||
|
rbac:
|
|||
|
enabled: false
|
|||
|
# groups:
|
|||
|
# - name: admin
|
|||
|
# enabled: false # if admin is disabled, all SAML users will be able to make configuration changes to the kubecost frontend
|
|||
|
# assertionName: "http://schemas.auth0.com/userType" # a SAML Assertion, one of whose elements has a value that matches on of the values in assertionValues
|
|||
|
# assertionValues:
|
|||
|
# - "admin"
|
|||
|
# - "superusers"
|
|||
|
# - name: readonly
|
|||
|
# enabled: false # if readonly is disabled, all users authorized on SAML will default to readonly
|
|||
|
# assertionName: "http://schemas.auth0.com/userType"
|
|||
|
# assertionValues:
|
|||
|
# - "readonly"
|
|||
|
# - name: editor
|
|||
|
# enabled: true # if editor is enabled, editors will be allowed to edit reports/alerts scoped to them, and act as readers otherwise. Users will never default to editor.
|
|||
|
# assertionName: "http://schemas.auth0.com/userType"
|
|||
|
# assertionValues:
|
|||
|
# - "editor"
|
|||
|
|
|||
|
oidc:
|
|||
|
enabled: false
|
|||
|
clientID: "" # application/client client_id parameter obtained from provider, used to make requests to server
|
|||
|
clientSecret: "" # application/client client_secret parameter obtained from provider, used to make requests to server
|
|||
|
# secretName: "kubecost-oidc-secret" # k8s secret where clientsecret will be stored
|
|||
|
# For use to provide a custom OIDC Secret. Overrides the usage of oidc.clientSecret and oidc.secretName.
|
|||
|
# Should contain the field directly.
|
|||
|
# Can be created using raw k8s secrets, external secrets, sealed secrets, or any other method.
|
|||
|
existingCustomSecret:
|
|||
|
enabled: false
|
|||
|
name: "" # name of the secret containing the client secret
|
|||
|
|
|||
|
# authURL: "https://my.auth.server/authorize" # endpoint for login to auth server
|
|||
|
# loginRedirectURL: "http://my.kubecost.url/model/oidc/authorize" # Kubecost url configured in provider for redirect after authentication
|
|||
|
# discoveryURL: "https://my.auth.server/.well-known/openid-configuration" # url for OIDC endpoint discovery
|
|||
|
skipOnlineTokenValidation: false # if true, will skip accessing OIDC introspection endpoint for online token verification, and instead try to locally validate JWT claims
|
|||
|
useClientSecretPost: false # if true, client secret will specifically only use client_secret_post method, otherwise it will attempt to send the secret in both the header and the body.
|
|||
|
# hostedDomain: "example.com" # optional, blocks access to the auth domain specified in the hd claim of the provider ID token
|
|||
|
rbac:
|
|||
|
enabled: false
|
|||
|
# groups:
|
|||
|
# - name: admin
|
|||
|
# enabled: false # if admin is disabled, all authenticated users will be able to make configuration changes to the kubecost frontend
|
|||
|
# claimName: "roles" # Kubecost matches this string against the JWT's payload key containing RBAC info (this value is unique across identity providers)
|
|||
|
# claimValues: # Kubecost matches these strings with the roles created in your identity provider
|
|||
|
# - "admin"
|
|||
|
# - "superusers"
|
|||
|
# - name: readonly
|
|||
|
# enabled: false # if readonly is disabled, all authenticated users will default to readonly
|
|||
|
# claimName: "roles"
|
|||
|
# claimValues:
|
|||
|
# - "readonly"
|
|||
|
# - name: editor
|
|||
|
# enabled: false # if editor is enabled, editors will be allowed to edit reports/alerts scoped to them, and act as readers otherwise. Users will never default to editor.
|
|||
|
# claimName: "roles"
|
|||
|
# claimValues:
|
|||
|
# - "editor"
|
|||
|
|
|||
|
## Adds the HTTP_PROXY, HTTPS_PROXY, and NO_PROXY environment variables to all
|
|||
|
## containers. Typically used in environments that have firewall rules which
|
|||
|
## prevent kubecost from accessing cloud provider resources.
|
|||
|
## Ref: https://www.oreilly.com/library/view/security-with-go/9781788627917/5ea6a02b-3d96-44b1-ad3c-6ab60fcbbe4f.xhtml
|
|||
|
##
|
|||
|
systemProxy:
|
|||
|
enabled: false
|
|||
|
httpProxyUrl: ""
|
|||
|
httpsProxyUrl: ""
|
|||
|
noProxy: ""
|
|||
|
|
|||
|
# imagePullSecrets:
|
|||
|
# - name: "image-pull-secret"
|
|||
|
|
|||
|
# imageVersion uses the base image name (image:) but overrides the version
|
|||
|
# pulled. It should be avoided. If non-default behavior is needed, use
|
|||
|
# fullImageName for the relevant component.
|
|||
|
# imageVersion:
|
|||
|
|
|||
|
kubecostFrontend:
|
|||
|
enabled: true
|
|||
|
deployMethod: singlepod # haMode or singlepod - haMode is currently only supported with Enterprise tier
|
|||
|
haReplicas: 2 # only used with haMode
|
|||
|
image: "gcr.io/kubecost1/frontend"
|
|||
|
imagePullPolicy: IfNotPresent
|
|||
|
# fullImageName overrides the default image construction logic. The exact
|
|||
|
# image provided (registry, image, tag) will be used for the frontend.
|
|||
|
# fullImageName:
|
|||
|
|
|||
|
# extraEnv:
|
|||
|
# - name: NGINX_ENTRYPOINT_WORKER_PROCESSES_AUTOTUNE
|
|||
|
# value: "1"
|
|||
|
# securityContext:
|
|||
|
# readOnlyRootFilesystem: true
|
|||
|
resources:
|
|||
|
requests:
|
|||
|
cpu: "10m"
|
|||
|
memory: "55Mi"
|
|||
|
# limits:
|
|||
|
# cpu: "100m"
|
|||
|
# memory: "256Mi"
|
|||
|
deploymentStrategy: {}
|
|||
|
# rollingUpdate:
|
|||
|
# maxSurge: 1
|
|||
|
# maxUnavailable: 1
|
|||
|
# type: RollingUpdate
|
|||
|
|
|||
|
# Define a readiness probe for the Kubecost frontend container.
|
|||
|
readinessProbe:
|
|||
|
enabled: true
|
|||
|
initialDelaySeconds: 1
|
|||
|
periodSeconds: 5
|
|||
|
failureThreshold: 6
|
|||
|
|
|||
|
# Define a liveness probe for the Kubecost frontend container.
|
|||
|
livenessProbe:
|
|||
|
enabled: true
|
|||
|
initialDelaySeconds: 1
|
|||
|
periodSeconds: 5
|
|||
|
failureThreshold: 6
|
|||
|
ipv6:
|
|||
|
enabled: true # disable if the cluster does not support ipv6
|
|||
|
# timeoutSeconds: 600 # should be rarely used, but can be increased if needed
|
|||
|
# allow customizing nginx-conf server block
|
|||
|
# extraServerConfig: |-
|
|||
|
# proxy_busy_buffers_size 512k;
|
|||
|
# proxy_buffers 4 512k;
|
|||
|
# proxy_buffer_size 256k;
|
|||
|
# large_client_header_buffers 4 64k;
|
|||
|
# hideDiagnostics: false # useful if the primary is not monitored. Supported in limited environments.
|
|||
|
# hideOrphanedResources: false # OrphanedResources works on the primary-cluster's cloud-provider only.
|
|||
|
|
|||
|
# set to true to set all upstreams to use <service>.<namespace>.svc.cluster.local instead of just <service>.<namespace>
|
|||
|
useDefaultFqdn: false
|
|||
|
# api:
|
|||
|
# fqdn: kubecost-api.kubecost.svc.cluster.local:9001
|
|||
|
# model:
|
|||
|
# fqdn: kubecost-model.kubecost.svc.cluster.local:9003
|
|||
|
# forecasting:
|
|||
|
# fqdn: kubecost-forcasting.kubecost.svc.cluster.local:5000
|
|||
|
# aggregator:
|
|||
|
# fqdn: kubecost-aggregator.kubecost.svc.cluster.local:9004
|
|||
|
# cloudCost:
|
|||
|
# fqdn: kubecost-cloud-cost.kubecost.svc.cluster.local:9005
|
|||
|
# multiClusterDiagnostics:
|
|||
|
# fqdn: kubecost-multi-diag.kubecost.svc.cluster.local:9007
|
|||
|
# clusterController:
|
|||
|
# fqdn: cluster-controller.kubecost.svc.cluster.local:9731
|
|||
|
|
|||
|
# Kubecost Metrics deploys a separate pod which will emit kubernetes specific metrics required
|
|||
|
# by the cost-model. This pod is designed to remain active and decoupled from the cost-model itself.
|
|||
|
# However, disabling this service/pod deployment will flag the cost-model to emit the metrics instead.
|
|||
|
kubecostMetrics:
|
|||
|
# emitPodAnnotations: false
|
|||
|
# emitNamespaceAnnotations: false
|
|||
|
# emitKsmV1Metrics: true # emit all KSM metrics in KSM v1.
|
|||
|
# emitKsmV1MetricsOnly: false # emit only the KSM metrics missing from KSM v2. Advanced users only.
|
|||
|
|
|||
|
# Optional
|
|||
|
# The metrics exporter is a separate deployment and service (for prometheus scrape auto-discovery)
|
|||
|
# which emits metrics cost-model relies on. Enabling this deployment also removes the KSM dependency
|
|||
|
# from the cost-model. If the deployment is not enabled, the metrics will continue to be emitted from
|
|||
|
# the cost-model.
|
|||
|
exporter:
|
|||
|
enabled: false
|
|||
|
port: 9005
|
|||
|
# Adds the default Prometheus scrape annotations to the metrics exporter service.
|
|||
|
# Set to false and use service.annotations (below) to set custom scrape annotations.
|
|||
|
prometheusScrape: true
|
|||
|
resources: {}
|
|||
|
# requests:
|
|||
|
# cpu: "200m"
|
|||
|
# memory: "55Mi"
|
|||
|
## Node tolerations for server scheduling to nodes with taints
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/assign-pod-node/
|
|||
|
tolerations: []
|
|||
|
|
|||
|
# - key: "key"
|
|||
|
# operator: "Equal|Exists"
|
|||
|
# value: "value"
|
|||
|
# effect: "NoSchedule|PreferNoSchedule|NoExecute(1.6 only)"
|
|||
|
affinity: {}
|
|||
|
|
|||
|
service:
|
|||
|
annotations: {}
|
|||
|
|
|||
|
# Service Monitor for Kubecost Metrics
|
|||
|
serviceMonitor: # the kubecost included prometheus uses scrapeConfigs and does not support service monitors. The following options assume an existing prometheus that supports serviceMonitors.
|
|||
|
enabled: false
|
|||
|
additionalLabels: {}
|
|||
|
metricRelabelings: []
|
|||
|
relabelings: []
|
|||
|
## PriorityClassName
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/pod-priority-preemption/#priorityclass
|
|||
|
priorityClassName: ""
|
|||
|
additionalLabels: {}
|
|||
|
nodeSelector: {}
|
|||
|
extraArgs: []
|
|||
|
|
|||
|
sigV4Proxy:
|
|||
|
image: public.ecr.aws/aws-observability/aws-sigv4-proxy:latest
|
|||
|
imagePullPolicy: IfNotPresent
|
|||
|
name: aps
|
|||
|
port: 8005
|
|||
|
region: us-west-2 # The AWS region
|
|||
|
host: aps-workspaces.us-west-2.amazonaws.com # The hostname for AMP service.
|
|||
|
# role_arn: arn:aws:iam::<account>:role/role-name # The AWS IAM role to assume.
|
|||
|
extraEnv: # Pass extra env variables to sigV4Proxy
|
|||
|
# - name: AWS_ACCESS_KEY_ID
|
|||
|
# value: <access_key>
|
|||
|
# - name: AWS_SECRET_ACCESS_KEY
|
|||
|
# value: <secret_key>
|
|||
|
# Optional resource requests and limits for the sigV4proxy container.
|
|||
|
resources: {}
|
|||
|
|
|||
|
kubecostModel:
|
|||
|
image: "gcr.io/kubecost1/cost-model"
|
|||
|
imagePullPolicy: IfNotPresent
|
|||
|
# fullImageName overrides the default image construction logic. The exact
|
|||
|
# image provided (registry, image, tag) will be used for cost-model.
|
|||
|
# fullImageName:
|
|||
|
|
|||
|
# securityContext:
|
|||
|
# readOnlyRootFilesystem: true
|
|||
|
|
|||
|
# Build local cost allocation cache
|
|||
|
warmCache: false
|
|||
|
# Run allocation ETL pipelines
|
|||
|
etl: true
|
|||
|
# Enable the ETL filestore backing storage
|
|||
|
etlFileStoreEnabled: true
|
|||
|
# The total number of days the ETL pipelines will build
|
|||
|
# Set to 0 to disable daily ETL (not recommended)
|
|||
|
etlDailyStoreDurationDays: 91
|
|||
|
# The total number of hours the ETL pipelines will build
|
|||
|
# Set to 0 to disable hourly ETL (recommended for large environments)
|
|||
|
# Must be < prometheus server retention, otherwise empty data may overwrite
|
|||
|
# known-good data
|
|||
|
etlHourlyStoreDurationHours: 49
|
|||
|
# For deploying kubecost in a cluster that does not self-monitor
|
|||
|
etlReadOnlyMode: false
|
|||
|
|
|||
|
## The name of the Secret containing a bucket config for Federated storage.
|
|||
|
## The contents should be stored under a key named federated-store.yaml.
|
|||
|
## Ref: https://docs.kubecost.com/install-and-configure/install/multi-cluster/long-term-storage-configuration
|
|||
|
# federatedStorageConfigSecret: federated-store
|
|||
|
|
|||
|
## Federated storage config can be supplied via a secret or the yaml block
|
|||
|
## below when using the block below, only a single provider is supported,
|
|||
|
## others are for example purposes.
|
|||
|
## Ref: https://docs.kubecost.com/install-and-configure/install/multi-cluster/long-term-storage-configuration
|
|||
|
# federatedStorageConfig: |-
|
|||
|
# # AWS EXAMPLE
|
|||
|
# type: S3
|
|||
|
# config:
|
|||
|
# bucket: kubecost-federated-storage-bucket
|
|||
|
# endpoint: s3.amazonaws.com
|
|||
|
# region: us-east-1
|
|||
|
# # best practice is to use pod identities to access AWS resources. Otherwise it is possible to use an access_key and secret_key
|
|||
|
# access_key: "<your-access-key>"
|
|||
|
# secret_key: "<your-secret-key>"
|
|||
|
# # AZURE EXAMPLE
|
|||
|
# type: AZURE
|
|||
|
# config:
|
|||
|
# storage_account: ""
|
|||
|
# storage_account_key: ""
|
|||
|
# container: ""
|
|||
|
# max_retries: 0
|
|||
|
# # GCP EXAMPLE
|
|||
|
# type: GCS
|
|||
|
# config:
|
|||
|
# bucket: kubecost-federated-storage-bucket
|
|||
|
# service_account: |-
|
|||
|
# {
|
|||
|
# "type": "service_account",
|
|||
|
# "project_id": "...",
|
|||
|
# "private_key_id": "...",
|
|||
|
# "private_key": "...",
|
|||
|
# "client_email": "...",
|
|||
|
# "client_id": "...",
|
|||
|
# "auth_uri": "https://accounts.google.com/o/oauth2/auth",
|
|||
|
# "token_uri": "https://oauth2.googleapis.com/token",
|
|||
|
# "auth_provider_x509_cert_url": "https://www.googleapis.com/oauth2/v1/certs",
|
|||
|
# "client_x509_cert_url": ""
|
|||
|
# }
|
|||
|
|
|||
|
# Installs Kubecost/OpenCost plugins
|
|||
|
plugins:
|
|||
|
enabled: false
|
|||
|
install:
|
|||
|
enabled: false
|
|||
|
fullImageName: curlimages/curl:latest
|
|||
|
securityContext:
|
|||
|
allowPrivilegeEscalation: false
|
|||
|
seccompProfile:
|
|||
|
type: RuntimeDefault
|
|||
|
capabilities:
|
|||
|
drop:
|
|||
|
- ALL
|
|||
|
readOnlyRootFilesystem: true
|
|||
|
runAsNonRoot: true
|
|||
|
runAsUser: 1001
|
|||
|
folder: /opt/opencost/plugin
|
|||
|
|
|||
|
# leave this commented to always download most recent version of plugins
|
|||
|
# version: <INSERT_SPECIFIC_PLUGINS_VERSION>
|
|||
|
|
|||
|
# the list of enabled plugins
|
|||
|
enabledPlugins: []
|
|||
|
# - datadog
|
|||
|
|
|||
|
# pre-existing secret for plugin configuration
|
|||
|
existingCustomSecret:
|
|||
|
enabled: false
|
|||
|
name: "" # name of the secret containing plugin config
|
|||
|
|
|||
|
secretName: kubecost-plugin-secret
|
|||
|
|
|||
|
# uncomment this to define plugin configuration via the values file
|
|||
|
# configs:
|
|||
|
# datadog: |
|
|||
|
# {
|
|||
|
# "datadog_site": "<INSERT_DATADOG_SITE>",
|
|||
|
# "datadog_api_key": "<INSERT_DATADOG_API_KEY>",
|
|||
|
# "datadog_app_key": "<INSERT_DATADOG_APP_KEY>"
|
|||
|
# }
|
|||
|
|
|||
|
allocation:
|
|||
|
# Enables or disables adding node labels to allocation data (i.e. workloads).
|
|||
|
# Defaults to "true" and starts with a sensible includeList for basics like
|
|||
|
# topology (e.g. zone, region) and instance type labels.
|
|||
|
# nodeLabels:
|
|||
|
# enabled: true
|
|||
|
# includeList: "node.kubernetes.io/instance-type,topology.kubernetes.io/region,topology.kubernetes.io/zone"
|
|||
|
|
|||
|
# Enables or disables the ContainerStats pipeline, used for quantile-based
|
|||
|
# queries like for request sizing recommendations.
|
|||
|
# ContainerStats provides support for quantile-based request right-sizing
|
|||
|
# recommendations.
|
|||
|
#
|
|||
|
# It is disabled by default to avoid problems in extremely high-scale Thanos
|
|||
|
# environments. If you would like to try quantile-based request-sizing
|
|||
|
# recommendations, enable this! If you are in a high-scale environment,
|
|||
|
# please monitor Kubecost logs, Thanos query logs, and Thanos load closely.
|
|||
|
# We hope to make major improvements at scale here soon!
|
|||
|
#
|
|||
|
containerStatsEnabled: true # enabled by default as of v2.2.0
|
|||
|
|
|||
|
# max number of concurrent Prometheus queries
|
|||
|
maxQueryConcurrency: 5
|
|||
|
resources:
|
|||
|
requests:
|
|||
|
cpu: "200m"
|
|||
|
memory: "55Mi"
|
|||
|
# limits:
|
|||
|
# cpu: "800m"
|
|||
|
# memory: "256Mi"
|
|||
|
|
|||
|
# Define a readiness probe for the Kubecost cost-model container.
|
|||
|
readinessProbe:
|
|||
|
enabled: true
|
|||
|
initialDelaySeconds: 10
|
|||
|
periodSeconds: 10
|
|||
|
failureThreshold: 200
|
|||
|
|
|||
|
# Define a liveness probe for the Kubecost cost-model container.
|
|||
|
livenessProbe:
|
|||
|
enabled: true
|
|||
|
initialDelaySeconds: 10
|
|||
|
periodSeconds: 10
|
|||
|
failureThreshold: 200
|
|||
|
extraArgs: []
|
|||
|
|
|||
|
# Optional. A list of extra environment variables to be added to the cost-model container.
|
|||
|
# extraEnv:
|
|||
|
# - name: LOG_LEVEL
|
|||
|
# value: trace
|
|||
|
# - name: LOG_FORMAT
|
|||
|
# value: json
|
|||
|
# # When false, Kubecost will not show Asset costs for local disks physically
|
|||
|
# # attached to nodes (e.g. ephemeral storage). This needs to be applied to
|
|||
|
# # each cluster monitored.
|
|||
|
# - name: ASSET_INCLUDE_LOCAL_DISK_COST
|
|||
|
# value: "true"
|
|||
|
|
|||
|
# creates an ingress directly to the model container, for API access
|
|||
|
ingress:
|
|||
|
enabled: false
|
|||
|
# className: nginx
|
|||
|
labels:
|
|||
|
# kubernetes.io/ingress.class: nginx
|
|||
|
# kubernetes.io/tls-acme: "true"
|
|||
|
annotations:
|
|||
|
# kubernetes.io/ingress.class: nginx
|
|||
|
# kubernetes.io/tls-acme: "true"
|
|||
|
paths: ["/"]
|
|||
|
pathType: ImplementationSpecific
|
|||
|
hosts:
|
|||
|
- cost-analyzer-model.local
|
|||
|
tls: []
|
|||
|
# - secretName: cost-analyzer-model-tls
|
|||
|
# hosts:
|
|||
|
# - cost-analyzer-model.local
|
|||
|
utcOffset: "+00:00"
|
|||
|
# Optional - add extra ports to the cost-model container. For kubecost development purposes only - not recommended for users.
|
|||
|
extraPorts: []
|
|||
|
# - name: debug
|
|||
|
# port: 40000
|
|||
|
# targetPort: 40000
|
|||
|
# containerPort: 40000
|
|||
|
|
|||
|
## etlUtils is a utility typically used by Enterprise customers transitioning
|
|||
|
## from v1 to v2 of Kubecost. It translates the data from the "/etl" dir of the
|
|||
|
## bucket, to the "/federated" dir of the bucket.
|
|||
|
## Ref: https://docs.kubecost.com/install-and-configure/install/multi-cluster/federated-etl/thanos-migration-guide
|
|||
|
##
|
|||
|
etlUtils:
|
|||
|
enabled: false
|
|||
|
fullImageName: null
|
|||
|
resources: {}
|
|||
|
env: {}
|
|||
|
nodeSelector: {}
|
|||
|
tolerations: []
|
|||
|
affinity: {}
|
|||
|
|
|||
|
# Basic Kubecost ingress, more examples available at https://docs.kubecost.com/install-and-configure/install/ingress-examples
|
|||
|
ingress:
|
|||
|
enabled: false
|
|||
|
# className: nginx
|
|||
|
labels:
|
|||
|
# kubernetes.io/ingress.class: nginx
|
|||
|
# kubernetes.io/tls-acme: "true"
|
|||
|
annotations:
|
|||
|
# kubernetes.io/ingress.class: nginx
|
|||
|
# kubernetes.io/tls-acme: "true"
|
|||
|
paths: ["/"] # There's no need to route specifically to the pods-- we have an nginx deployed that handles routing
|
|||
|
pathType: ImplementationSpecific
|
|||
|
hosts:
|
|||
|
- cost-analyzer.local
|
|||
|
tls: []
|
|||
|
# - secretName: cost-analyzer-tls
|
|||
|
# hosts:
|
|||
|
# - cost-analyzer.local
|
|||
|
|
|||
|
nodeSelector: {}
|
|||
|
|
|||
|
tolerations: []
|
|||
|
# - key: "key"
|
|||
|
# operator: "Equal|Exists"
|
|||
|
# value: "value"
|
|||
|
# effect: "NoSchedule|PreferNoSchedule|NoExecute(1.6 only)"
|
|||
|
|
|||
|
affinity: {}
|
|||
|
|
|||
|
topologySpreadConstraints: []
|
|||
|
|
|||
|
# If true, creates a PriorityClass to be used by the cost-analyzer pod
|
|||
|
priority:
|
|||
|
enabled: false
|
|||
|
name: "" # Provide name of existing priority class only. If left blank, upstream chart will create one from default template.
|
|||
|
|
|||
|
# If true, enable creation of NetworkPolicy resources.
|
|||
|
networkPolicy:
|
|||
|
enabled: false
|
|||
|
denyEgress: true # create a network policy that denies egress from kubecost
|
|||
|
sameNamespace: true # Set to true if cost analyzer and prometheus are on the same namespace
|
|||
|
# namespace: kubecost # Namespace where prometheus is installed
|
|||
|
|
|||
|
# Cost-analyzer specific vars using the new template
|
|||
|
costAnalyzer:
|
|||
|
enabled: false # If true, create a network policy for cost-analyzer
|
|||
|
annotations: {} # annotations to be added to the network policy
|
|||
|
additionalLabels: {} # additional labels to be added to the network policy
|
|||
|
# Examples rules:
|
|||
|
# ingressRules:
|
|||
|
# - selectors: # allow ingress from self on all ports
|
|||
|
# - podSelector:
|
|||
|
# matchLabels:
|
|||
|
# app.kubernetes.io/name: cost-analyzer
|
|||
|
# - selectors: # allow egress access to prometheus
|
|||
|
# - namespaceSelector:
|
|||
|
# matchLabels:
|
|||
|
# name: prometheus
|
|||
|
# podSelector:
|
|||
|
# matchLabels:
|
|||
|
# app: prometheus
|
|||
|
# ports:
|
|||
|
# - protocol: TCP
|
|||
|
# port: 9090
|
|||
|
# egressRules:
|
|||
|
# - selectors: # restrict egress to inside cluster
|
|||
|
# - namespaceSelector: {}
|
|||
|
|
|||
|
## @param extraVolumes A list of volumes to be added to the pod
|
|||
|
##
|
|||
|
extraVolumes: []
|
|||
|
## @param extraVolumeMounts A list of volume mounts to be added to the pod
|
|||
|
##
|
|||
|
extraVolumeMounts: []
|
|||
|
|
|||
|
# Define persistence volume for cost-analyzer, more information at https://docs.kubecost.com/install-and-configure/install/storage
|
|||
|
persistentVolume:
|
|||
|
size: 32Gi
|
|||
|
dbSize: 32.0Gi
|
|||
|
enabled: true # Note that setting this to false means configurations will be wiped out on pod restart.
|
|||
|
# storageClass: "-" #
|
|||
|
# existingClaim: kubecost-cost-analyzer # a claim in the same namespace as kubecost
|
|||
|
labels: {}
|
|||
|
annotations: {}
|
|||
|
# helm.sh/resource-policy: keep # https://helm.sh/docs/howto/charts_tips_and_tricks/#tell-helm-not-to-uninstall-a-resource
|
|||
|
|
|||
|
# Enables a separate PV specifically for ETL data. This should be avoided, but
|
|||
|
# is kept for legacy compatibility.
|
|||
|
dbPVEnabled: false
|
|||
|
|
|||
|
service:
|
|||
|
type: ClusterIP
|
|||
|
port: 9090
|
|||
|
targetPort: 9090
|
|||
|
nodePort: {}
|
|||
|
labels: {}
|
|||
|
annotations: {}
|
|||
|
# loadBalancerSourceRanges: []
|
|||
|
sessionAffinity:
|
|||
|
enabled: false # Makes sure that connections from a client are passed to the same Pod each time, when set to `true`. You should set it when you enabled authentication through OIDC or SAML integration.
|
|||
|
timeoutSeconds: 10800
|
|||
|
|
|||
|
prometheus:
|
|||
|
## Provide a full name override for Prometheus.
|
|||
|
# fullnameOverride: ""
|
|||
|
## Provide a name override for Prometheus.
|
|||
|
# nameOverride: ""
|
|||
|
|
|||
|
rbac:
|
|||
|
create: true # Create the RBAC resources for Prometheus.
|
|||
|
|
|||
|
## Define serviceAccount names for components. Defaults to component's fully qualified name.
|
|||
|
##
|
|||
|
serviceAccounts:
|
|||
|
alertmanager:
|
|||
|
create: true
|
|||
|
name:
|
|||
|
nodeExporter:
|
|||
|
create: true
|
|||
|
name:
|
|||
|
pushgateway:
|
|||
|
create: true
|
|||
|
name:
|
|||
|
server:
|
|||
|
create: true
|
|||
|
name:
|
|||
|
## Prometheus server ServiceAccount annotations.
|
|||
|
## Can be used for AWS IRSA annotations when using Remote Write mode with Amazon Managed Prometheus.
|
|||
|
annotations: {}
|
|||
|
|
|||
|
## Specify an existing ConfigMap to be used by Prometheus when using self-signed certificates.
|
|||
|
##
|
|||
|
# selfsignedCertConfigMapName: ""
|
|||
|
|
|||
|
imagePullSecrets:
|
|||
|
# - name: "image-pull-secret"
|
|||
|
|
|||
|
extraScrapeConfigs: |
|
|||
|
- job_name: kubecost
|
|||
|
honor_labels: true
|
|||
|
scrape_interval: 1m
|
|||
|
scrape_timeout: 60s
|
|||
|
metrics_path: /metrics
|
|||
|
scheme: http
|
|||
|
dns_sd_configs:
|
|||
|
- names:
|
|||
|
- {{ template "cost-analyzer.serviceName" . }}
|
|||
|
type: 'A'
|
|||
|
port: 9003
|
|||
|
- job_name: kubecost-networking
|
|||
|
kubernetes_sd_configs:
|
|||
|
- role: pod
|
|||
|
relabel_configs:
|
|||
|
# Scrape only the the targets matching the following metadata
|
|||
|
- source_labels: [__meta_kubernetes_pod_label_app_kubernetes_io_instance]
|
|||
|
action: keep
|
|||
|
regex: kubecost
|
|||
|
- source_labels: [__meta_kubernetes_pod_label_app_kubernetes_io_name]
|
|||
|
action: keep
|
|||
|
regex: network-costs
|
|||
|
- job_name: kubecost-aggregator
|
|||
|
scrape_interval: 1m
|
|||
|
scrape_timeout: 60s
|
|||
|
metrics_path: /metrics
|
|||
|
scheme: http
|
|||
|
dns_sd_configs:
|
|||
|
- names:
|
|||
|
- {{ template "aggregator.serviceName" . }}
|
|||
|
type: 'A'
|
|||
|
{{- if or .Values.saml.enabled .Values.oidc.enabled }}
|
|||
|
port: 9008
|
|||
|
{{- else }}
|
|||
|
port: 9004
|
|||
|
{{- end }}
|
|||
|
## Enables scraping of NVIDIA GPU metrics via dcgm-exporter. Scrapes all
|
|||
|
## endpoints which contain "dcgm-exporter" in labels "app",
|
|||
|
## "app.kubernetes.io/component", or "app.kubernetes.io/name" with a case
|
|||
|
## insensitive match.
|
|||
|
## Refs:
|
|||
|
## https://github.com/NVIDIA/gpu-operator/blob/d4316a415bbd684ce8416a88042305fc1a093aa4/assets/state-dcgm-exporter/0600_service.yaml#L7
|
|||
|
## https://github.com/NVIDIA/dcgm-exporter/blob/54fd1ca137c66511a87a720390613680b9bdabdd/deployment/templates/service.yaml#L23
|
|||
|
- job_name: kubecost-dcgm-exporter
|
|||
|
kubernetes_sd_configs:
|
|||
|
- role: endpoints
|
|||
|
relabel_configs:
|
|||
|
- source_labels: [__meta_kubernetes_pod_label_app, __meta_kubernetes_pod_label_app_kubernetes_io_component, __meta_kubernetes_pod_label_app_kubernetes_io_name]
|
|||
|
action: keep
|
|||
|
regex: (?i)(.*dcgm-exporter.*|.*dcgm-exporter.*|.*dcgm-exporter.*)
|
|||
|
|
|||
|
server:
|
|||
|
# If clusterIDConfigmap is defined, instead use user-generated configmap with key CLUSTER_ID
|
|||
|
# to use as unique cluster ID in kubecost cost-analyzer deployment.
|
|||
|
# This overrides the cluster_id set in prometheus.server.global.external_labels.
|
|||
|
# NOTE: This does not affect the external_labels set in prometheus config.
|
|||
|
# clusterIDConfigmap: cluster-id-configmap
|
|||
|
|
|||
|
## Provide a full name override for the Prometheus server.
|
|||
|
# fullnameOverride: ""
|
|||
|
|
|||
|
## Prometheus server container name
|
|||
|
##
|
|||
|
enabled: true
|
|||
|
name: server
|
|||
|
sidecarContainers:
|
|||
|
strategy:
|
|||
|
type: Recreate
|
|||
|
rollingUpdate: null
|
|||
|
|
|||
|
## Prometheus server container image
|
|||
|
##
|
|||
|
image:
|
|||
|
repository: cgr.dev/chainguard/prometheus
|
|||
|
tag: latest
|
|||
|
pullPolicy: IfNotPresent
|
|||
|
|
|||
|
## prometheus server priorityClassName
|
|||
|
##
|
|||
|
priorityClassName: ""
|
|||
|
|
|||
|
## The URL prefix at which the container can be accessed. Useful in the case the '-web.external-url' includes a slug
|
|||
|
## so that the various internal URLs are still able to access as they are in the default case.
|
|||
|
## (Optional)
|
|||
|
prefixURL: ""
|
|||
|
|
|||
|
## External URL which can access alertmanager
|
|||
|
## Maybe same with Ingress host name
|
|||
|
baseURL: ""
|
|||
|
|
|||
|
## Additional server container environment variables
|
|||
|
##
|
|||
|
## You specify this manually like you would a raw deployment manifest.
|
|||
|
## This means you can bind in environment variables from secrets.
|
|||
|
##
|
|||
|
## e.g. static environment variable:
|
|||
|
## - name: DEMO_GREETING
|
|||
|
## value: "Hello from the environment"
|
|||
|
##
|
|||
|
## e.g. secret environment variable:
|
|||
|
## - name: USERNAME
|
|||
|
## valueFrom:
|
|||
|
## secretKeyRef:
|
|||
|
## name: mysecret
|
|||
|
## key: username
|
|||
|
env: []
|
|||
|
|
|||
|
extraFlags:
|
|||
|
- web.enable-lifecycle
|
|||
|
## web.enable-admin-api flag controls access to the administrative HTTP API which includes functionality such as
|
|||
|
## deleting time series. This is disabled by default.
|
|||
|
# - web.enable-admin-api
|
|||
|
##
|
|||
|
## storage.tsdb.no-lockfile flag controls BD locking
|
|||
|
# - storage.tsdb.no-lockfile
|
|||
|
##
|
|||
|
## storage.tsdb.wal-compression flag enables compression of the write-ahead log (WAL)
|
|||
|
# - storage.tsdb.wal-compression
|
|||
|
|
|||
|
## Path to a configuration file on prometheus server container FS
|
|||
|
configPath: /etc/config/prometheus.yml
|
|||
|
|
|||
|
global:
|
|||
|
## How frequently to scrape targets by default
|
|||
|
##
|
|||
|
scrape_interval: 1m
|
|||
|
## How long until a scrape request times out
|
|||
|
##
|
|||
|
scrape_timeout: 60s
|
|||
|
## How frequently to evaluate rules
|
|||
|
##
|
|||
|
evaluation_interval: 1m
|
|||
|
external_labels:
|
|||
|
cluster_id: cluster-one # Each cluster should have a unique ID
|
|||
|
## https://prometheus.io/docs/prometheus/latest/configuration/configuration/#remote_write
|
|||
|
##
|
|||
|
remoteWrite: {}
|
|||
|
## https://prometheus.io/docs/prometheus/latest/configuration/configuration/#remote_read
|
|||
|
##
|
|||
|
remoteRead: {}
|
|||
|
|
|||
|
## Additional Prometheus server container arguments
|
|||
|
##
|
|||
|
extraArgs:
|
|||
|
query.max-concurrency: 1
|
|||
|
query.max-samples: 100000000
|
|||
|
|
|||
|
## Additional InitContainers to initialize the pod
|
|||
|
##
|
|||
|
extraInitContainers: []
|
|||
|
|
|||
|
## Additional Prometheus server Volume mounts
|
|||
|
##
|
|||
|
extraVolumeMounts: []
|
|||
|
|
|||
|
## Additional Prometheus server Volumes
|
|||
|
##
|
|||
|
extraVolumes: []
|
|||
|
|
|||
|
## Additional Prometheus server hostPath mounts
|
|||
|
##
|
|||
|
extraHostPathMounts: []
|
|||
|
# - name: certs-dir
|
|||
|
# mountPath: /etc/kubernetes/certs
|
|||
|
# subPath: ""
|
|||
|
# hostPath: /etc/kubernetes/certs
|
|||
|
# readOnly: true
|
|||
|
|
|||
|
extraConfigmapMounts: []
|
|||
|
# - name: certs-configmap
|
|||
|
# mountPath: /prometheus
|
|||
|
# subPath: ""
|
|||
|
# configMap: certs-configmap
|
|||
|
# readOnly: true
|
|||
|
|
|||
|
## Additional Prometheus server Secret mounts
|
|||
|
# Defines additional mounts with secrets. Secrets must be manually created in the namespace.
|
|||
|
extraSecretMounts: []
|
|||
|
# - name: secret-files
|
|||
|
# mountPath: /etc/secrets
|
|||
|
# subPath: ""
|
|||
|
# secretName: prom-secret-files
|
|||
|
# readOnly: true
|
|||
|
|
|||
|
## ConfigMap override where fullname is {{.Release.Name}}-{{.Values.server.configMapOverrideName}}
|
|||
|
## Defining configMapOverrideName will cause templates/server-configmap.yaml
|
|||
|
## to NOT generate a ConfigMap resource
|
|||
|
##
|
|||
|
configMapOverrideName: ""
|
|||
|
|
|||
|
ingress:
|
|||
|
## If true, Prometheus server Ingress will be created
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
# className: nginx
|
|||
|
|
|||
|
## Prometheus server Ingress annotations
|
|||
|
##
|
|||
|
annotations: {}
|
|||
|
# kubernetes.io/ingress.class: nginx
|
|||
|
# kubernetes.io/tls-acme: 'true'
|
|||
|
|
|||
|
## Prometheus server Ingress additional labels
|
|||
|
##
|
|||
|
extraLabels: {}
|
|||
|
|
|||
|
## Prometheus server Ingress hostnames with optional path
|
|||
|
## Must be provided if Ingress is enabled
|
|||
|
##
|
|||
|
hosts: []
|
|||
|
# - prometheus.domain.com
|
|||
|
# - domain.com/prometheus
|
|||
|
|
|||
|
## PathType determines the interpretation of the Path matching
|
|||
|
pathType: "Prefix"
|
|||
|
|
|||
|
## Extra paths to prepend to every host configuration. This is useful when working with annotation based services.
|
|||
|
extraPaths: []
|
|||
|
# - path: /*
|
|||
|
# backend:
|
|||
|
# serviceName: ssl-redirect
|
|||
|
# servicePort: use-annotation
|
|||
|
|
|||
|
## Prometheus server Ingress TLS configuration
|
|||
|
## Secrets must be manually created in the namespace
|
|||
|
##
|
|||
|
tls: []
|
|||
|
# - secretName: prometheus-server-tls
|
|||
|
# hosts:
|
|||
|
# - prometheus.domain.com
|
|||
|
|
|||
|
## Server Deployment Strategy type
|
|||
|
# strategy:
|
|||
|
# type: Recreate
|
|||
|
|
|||
|
## Node tolerations for server scheduling to nodes with taints
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/assign-pod-node/
|
|||
|
##
|
|||
|
tolerations: []
|
|||
|
# - key: "key"
|
|||
|
# operator: "Equal|Exists"
|
|||
|
# value: "value"
|
|||
|
# effect: "NoSchedule|PreferNoSchedule|NoExecute(1.6 only)"
|
|||
|
|
|||
|
## Node labels for Prometheus server pod assignment
|
|||
|
## Ref: https://kubernetes.io/docs/user-guide/node-selection/
|
|||
|
##
|
|||
|
nodeSelector: {}
|
|||
|
|
|||
|
## Pod affinity
|
|||
|
##
|
|||
|
affinity: {}
|
|||
|
|
|||
|
## PodDisruptionBudget settings
|
|||
|
## ref: https://kubernetes.io/docs/concepts/workloads/pods/disruptions/
|
|||
|
##
|
|||
|
podDisruptionBudget:
|
|||
|
enabled: false
|
|||
|
maxUnavailable: 1
|
|||
|
|
|||
|
## Use an alternate scheduler, e.g. "stork".
|
|||
|
## ref: https://kubernetes.io/docs/tasks/administer-cluster/configure-multiple-schedulers/
|
|||
|
##
|
|||
|
# schedulerName:
|
|||
|
|
|||
|
persistentVolume:
|
|||
|
## If true, Prometheus server will create/use a Persistent Volume Claim
|
|||
|
## If false, use emptyDir
|
|||
|
##
|
|||
|
enabled: true
|
|||
|
|
|||
|
## Prometheus server data Persistent Volume access modes
|
|||
|
## Must match those of existing PV or dynamic provisioner
|
|||
|
## Ref: http://kubernetes.io/docs/user-guide/persistent-volumes/
|
|||
|
##
|
|||
|
accessModes:
|
|||
|
- ReadWriteOnce
|
|||
|
|
|||
|
## Prometheus server data Persistent Volume annotations
|
|||
|
##
|
|||
|
annotations: {}
|
|||
|
# helm.sh/resource-policy: keep # https://helm.sh/docs/howto/charts_tips_and_tricks/#tell-helm-not-to-uninstall-a-resource
|
|||
|
|
|||
|
## Prometheus server data Persistent Volume existing claim name
|
|||
|
## Requires server.persistentVolume.enabled: true
|
|||
|
## If defined, PVC must be created manually before volume will be bound
|
|||
|
existingClaim: ""
|
|||
|
|
|||
|
## Prometheus server data Persistent Volume mount root path
|
|||
|
##
|
|||
|
mountPath: /data
|
|||
|
|
|||
|
## Prometheus server data Persistent Volume size
|
|||
|
##
|
|||
|
size: 32Gi
|
|||
|
|
|||
|
## Prometheus server data Persistent Volume Storage Class
|
|||
|
## If defined, storageClassName: <storageClass>
|
|||
|
## If set to "-", storageClassName: "", which disables dynamic provisioning
|
|||
|
## If undefined (the default) or set to null, no storageClassName spec is
|
|||
|
## set, choosing the default provisioner. (gp2 on AWS, standard on
|
|||
|
## GKE, AWS & OpenStack)
|
|||
|
##
|
|||
|
# storageClass: "-"
|
|||
|
|
|||
|
## Prometheus server data Persistent Volume Binding Mode
|
|||
|
## If defined, volumeBindingMode: <volumeBindingMode>
|
|||
|
## If undefined (the default) or set to null, no volumeBindingMode spec is
|
|||
|
## set, choosing the default mode.
|
|||
|
##
|
|||
|
# volumeBindingMode: ""
|
|||
|
|
|||
|
## Subdirectory of Prometheus server data Persistent Volume to mount
|
|||
|
## Useful if the volume's root directory is not empty
|
|||
|
##
|
|||
|
subPath: ""
|
|||
|
|
|||
|
emptyDir:
|
|||
|
sizeLimit: ""
|
|||
|
|
|||
|
## Annotations to be added to Prometheus server pods
|
|||
|
##
|
|||
|
podAnnotations: {}
|
|||
|
# iam.amazonaws.com/role: prometheus
|
|||
|
|
|||
|
## Annotations to be added to the Prometheus Server deployment
|
|||
|
##
|
|||
|
deploymentAnnotations: {}
|
|||
|
|
|||
|
## Labels to be added to Prometheus server pods
|
|||
|
##
|
|||
|
podLabels: {}
|
|||
|
|
|||
|
## Prometheus AlertManager configuration
|
|||
|
##
|
|||
|
alertmanagers: []
|
|||
|
|
|||
|
## Use a StatefulSet if replicaCount needs to be greater than 1 (see below)
|
|||
|
##
|
|||
|
replicaCount: 1
|
|||
|
|
|||
|
statefulSet:
|
|||
|
## If true, use a statefulset instead of a deployment for pod management.
|
|||
|
## This allows to scale replicas to more than 1 pod
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
annotations: {}
|
|||
|
labels: {}
|
|||
|
podManagementPolicy: OrderedReady
|
|||
|
|
|||
|
## Alertmanager headless service to use for the statefulset
|
|||
|
##
|
|||
|
headless:
|
|||
|
annotations: {}
|
|||
|
labels: {}
|
|||
|
servicePort: 80
|
|||
|
|
|||
|
## Prometheus server readiness and liveness probe initial delay and timeout
|
|||
|
## Ref: https://kubernetes.io/docs/tasks/configure-pod-container/configure-liveness-readiness-startup-probes/
|
|||
|
##
|
|||
|
readinessProbeInitialDelay: 5
|
|||
|
readinessProbeTimeout: 3
|
|||
|
readinessProbeFailureThreshold: 3
|
|||
|
readinessProbeSuccessThreshold: 1
|
|||
|
livenessProbeInitialDelay: 5
|
|||
|
livenessProbeTimeout: 3
|
|||
|
livenessProbeFailureThreshold: 3
|
|||
|
livenessProbeSuccessThreshold: 1
|
|||
|
|
|||
|
## Prometheus server resource requests and limits
|
|||
|
## Ref: http://kubernetes.io/docs/user-guide/compute-resources/
|
|||
|
##
|
|||
|
resources: {}
|
|||
|
# limits:
|
|||
|
# cpu: 500m
|
|||
|
# memory: 512Mi
|
|||
|
# requests:
|
|||
|
# cpu: 500m
|
|||
|
# memory: 512Mi
|
|||
|
|
|||
|
## Vertical Pod Autoscaler config
|
|||
|
## Ref: https://github.com/kubernetes/autoscaler/tree/master/vertical-pod-autoscaler
|
|||
|
verticalAutoscaler:
|
|||
|
## If true a VPA object will be created for the controller (either StatefulSet or Deployment, based on above configs)
|
|||
|
enabled: false
|
|||
|
## Optional. Defaults to "Auto" if not specified.
|
|||
|
# updateMode: "Auto"
|
|||
|
## Mandatory. Without, VPA will not be created.
|
|||
|
# containerPolicies:
|
|||
|
# - containerName: 'prometheus-server'
|
|||
|
|
|||
|
## Security context to be added to server pods
|
|||
|
##
|
|||
|
securityContext: {}
|
|||
|
# runAsUser: 1001
|
|||
|
# runAsNonRoot: true
|
|||
|
# runAsGroup: 1001
|
|||
|
# fsGroup: 1001
|
|||
|
|
|||
|
containerSecurityContext: {}
|
|||
|
|
|||
|
service:
|
|||
|
annotations: {}
|
|||
|
labels: {}
|
|||
|
clusterIP: ""
|
|||
|
# nodePort: ""
|
|||
|
|
|||
|
## List of IP addresses at which the Prometheus server service is available
|
|||
|
## Ref: https://kubernetes.io/docs/user-guide/services/#external-ips
|
|||
|
##
|
|||
|
externalIPs: []
|
|||
|
|
|||
|
loadBalancerIP: ""
|
|||
|
loadBalancerSourceRanges: []
|
|||
|
servicePort: 80
|
|||
|
sessionAffinity: None
|
|||
|
type: ClusterIP
|
|||
|
|
|||
|
## Enable gRPC port on service to allow auto discovery with thanos-querier
|
|||
|
gRPC:
|
|||
|
enabled: false
|
|||
|
servicePort: 10901
|
|||
|
# nodePort: 10901
|
|||
|
|
|||
|
## If using a statefulSet (statefulSet.enabled=true), configure the
|
|||
|
## service to connect to a specific replica to have a consistent view
|
|||
|
## of the data.
|
|||
|
statefulsetReplica:
|
|||
|
enabled: false
|
|||
|
replica: 0
|
|||
|
|
|||
|
## Prometheus server pod termination grace period
|
|||
|
##
|
|||
|
terminationGracePeriodSeconds: 300
|
|||
|
|
|||
|
## Prometheus data retention period (default if not specified is 97 hours)
|
|||
|
##
|
|||
|
## Kubecost builds up its own persistent store of metric data on the
|
|||
|
## filesystem (usually a PV) and, when using ETL Backup and/or Federated
|
|||
|
## ETL, in more durable object storage like S3 or GCS. Kubecost's data
|
|||
|
## retention is _not_ tied to the configured Prometheus retention.
|
|||
|
##
|
|||
|
## For data durability, we recommend using ETL Backup instead of relying on
|
|||
|
## Prometheus retention.
|
|||
|
##
|
|||
|
## Lower retention values will affect Prometheus by reducing resource
|
|||
|
## consumption and increasing stability. It _must not_ be set below or equal
|
|||
|
## to kubecostModel.etlHourlyStoreDurationHours, otherwise empty data sets
|
|||
|
## may overwrite good data sets. For now, it must also be >= 49h for Daily
|
|||
|
## ETL stability.
|
|||
|
##
|
|||
|
## "ETL Rebuild" and "ETL Repair" is only possible on data available within
|
|||
|
## this retention window. This is an extremely rare operation.
|
|||
|
##
|
|||
|
## If you want maximum security in the event of a Kubecost agent
|
|||
|
## (cost-model) outage, increase this value. The current default of 97h is
|
|||
|
## intended to balance Prometheus stability and resource consumption
|
|||
|
## against the event of an outage in Kubecost which would necessitate a
|
|||
|
## version change. 4 days should provide enough time for most users to
|
|||
|
## notice a problem and initiate corrective action.
|
|||
|
retention: 97h
|
|||
|
# retentionSize: should be significantly greater than the storage used in the number of hours set in etlHourlyStoreDurationHours
|
|||
|
|
|||
|
# Install Prometheus Alert Manager
|
|||
|
alertmanager:
|
|||
|
## If false, alertmanager will not be installed
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
## Provide a full name override for Prometheus alertmanager.
|
|||
|
# fullnameOverride: ""
|
|||
|
|
|||
|
strategy:
|
|||
|
type: Recreate
|
|||
|
rollingUpdate: null
|
|||
|
|
|||
|
## alertmanager container name
|
|||
|
##
|
|||
|
name: alertmanager
|
|||
|
|
|||
|
## alertmanager container image
|
|||
|
##
|
|||
|
image:
|
|||
|
repository: cgr.dev/chainguard/prometheus-alertmanager
|
|||
|
tag: latest
|
|||
|
pullPolicy: IfNotPresent
|
|||
|
|
|||
|
## alertmanager priorityClassName
|
|||
|
##
|
|||
|
priorityClassName: ""
|
|||
|
|
|||
|
## Additional alertmanager container arguments
|
|||
|
##
|
|||
|
extraArgs: {}
|
|||
|
|
|||
|
## The URL prefix at which the container can be accessed. Useful in the case the '-web.external-url' includes a slug
|
|||
|
## so that the various internal URLs are still able to access as they are in the default case.
|
|||
|
## (Optional)
|
|||
|
prefixURL: ""
|
|||
|
|
|||
|
## External URL which can access alertmanager
|
|||
|
baseURL: "http://localhost:9093"
|
|||
|
|
|||
|
## Additional alertmanager container environment variable
|
|||
|
## For instance to add a http_proxy
|
|||
|
##
|
|||
|
extraEnv: {}
|
|||
|
|
|||
|
## Additional alertmanager Secret mounts
|
|||
|
# Defines additional mounts with secrets. Secrets must be manually created in the namespace.
|
|||
|
extraSecretMounts: []
|
|||
|
# - name: secret-files
|
|||
|
# mountPath: /etc/secrets
|
|||
|
# subPath: ""
|
|||
|
# secretName: alertmanager-secret-files
|
|||
|
# readOnly: true
|
|||
|
|
|||
|
## ConfigMap override where fullname is {{.Release.Name}}-{{.Values.alertmanager.configMapOverrideName}}
|
|||
|
## Defining configMapOverrideName will cause templates/alertmanager-configmap.yaml
|
|||
|
## to NOT generate a ConfigMap resource
|
|||
|
##
|
|||
|
configMapOverrideName: ""
|
|||
|
|
|||
|
## The name of a secret in the same kubernetes namespace which contains the Alertmanager config
|
|||
|
## Defining configFromSecret will cause templates/alertmanager-configmap.yaml
|
|||
|
## to NOT generate a ConfigMap resource
|
|||
|
##
|
|||
|
configFromSecret: ""
|
|||
|
|
|||
|
## The configuration file name to be loaded to alertmanager
|
|||
|
## Must match the key within configuration loaded from ConfigMap/Secret
|
|||
|
##
|
|||
|
configFileName: alertmanager.yml
|
|||
|
|
|||
|
ingress:
|
|||
|
## If true, alertmanager Ingress will be created
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
## alertmanager Ingress annotations
|
|||
|
##
|
|||
|
annotations: {}
|
|||
|
# kubernetes.io/ingress.class: nginx
|
|||
|
# kubernetes.io/tls-acme: 'true'
|
|||
|
|
|||
|
## alertmanager Ingress additional labels
|
|||
|
##
|
|||
|
extraLabels: {}
|
|||
|
|
|||
|
## alertmanager Ingress hostnames with optional path
|
|||
|
## Must be provided if Ingress is enabled
|
|||
|
##
|
|||
|
hosts: []
|
|||
|
# - alertmanager.domain.com
|
|||
|
# - domain.com/alertmanager
|
|||
|
|
|||
|
## Extra paths to prepend to every host configuration. This is useful when working with annotation based services.
|
|||
|
extraPaths: []
|
|||
|
# - path: /*
|
|||
|
# backend:
|
|||
|
# serviceName: ssl-redirect
|
|||
|
# servicePort: use-annotation
|
|||
|
|
|||
|
## alertmanager Ingress TLS configuration
|
|||
|
## Secrets must be manually created in the namespace
|
|||
|
##
|
|||
|
tls: []
|
|||
|
# - secretName: prometheus-alerts-tls
|
|||
|
# hosts:
|
|||
|
# - alertmanager.domain.com
|
|||
|
|
|||
|
## Alertmanager Deployment Strategy type
|
|||
|
# strategy:
|
|||
|
# type: Recreate
|
|||
|
|
|||
|
## Node tolerations for alertmanager scheduling to nodes with taints
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/assign-pod-node/
|
|||
|
##
|
|||
|
tolerations: []
|
|||
|
# - key: "key"
|
|||
|
# operator: "Equal|Exists"
|
|||
|
# value: "value"
|
|||
|
# effect: "NoSchedule|PreferNoSchedule|NoExecute(1.6 only)"
|
|||
|
|
|||
|
## Node labels for alertmanager pod assignment
|
|||
|
## Ref: https://kubernetes.io/docs/user-guide/node-selection/
|
|||
|
##
|
|||
|
nodeSelector: {}
|
|||
|
|
|||
|
## Pod affinity
|
|||
|
##
|
|||
|
affinity: {}
|
|||
|
|
|||
|
## PodDisruptionBudget settings
|
|||
|
## ref: https://kubernetes.io/docs/concepts/workloads/pods/disruptions/
|
|||
|
##
|
|||
|
podDisruptionBudget:
|
|||
|
enabled: false
|
|||
|
maxUnavailable: 1
|
|||
|
|
|||
|
## Use an alternate scheduler, e.g. "stork".
|
|||
|
## ref: https://kubernetes.io/docs/tasks/administer-cluster/configure-multiple-schedulers/
|
|||
|
##
|
|||
|
# schedulerName:
|
|||
|
|
|||
|
persistentVolume:
|
|||
|
## If true, alertmanager will create/use a Persistent Volume Claim
|
|||
|
## If false, use emptyDir
|
|||
|
##
|
|||
|
enabled: true
|
|||
|
|
|||
|
## alertmanager data Persistent Volume access modes
|
|||
|
## Must match those of existing PV or dynamic provisioner
|
|||
|
## Ref: http://kubernetes.io/docs/user-guide/persistent-volumes/
|
|||
|
##
|
|||
|
accessModes:
|
|||
|
- ReadWriteOnce
|
|||
|
|
|||
|
## alertmanager data Persistent Volume Claim annotations
|
|||
|
##
|
|||
|
annotations: {}
|
|||
|
|
|||
|
## alertmanager data Persistent Volume existing claim name
|
|||
|
## Requires alertmanager.persistentVolume.enabled: true
|
|||
|
## If defined, PVC must be created manually before volume will be bound
|
|||
|
existingClaim: ""
|
|||
|
|
|||
|
## alertmanager data Persistent Volume mount root path
|
|||
|
##
|
|||
|
mountPath: /data
|
|||
|
|
|||
|
## alertmanager data Persistent Volume size
|
|||
|
##
|
|||
|
size: 2Gi
|
|||
|
|
|||
|
## alertmanager data Persistent Volume Storage Class
|
|||
|
## If defined, storageClassName: <storageClass>
|
|||
|
## If set to "-", storageClassName: "", which disables dynamic provisioning
|
|||
|
## If undefined (the default) or set to null, no storageClassName spec is
|
|||
|
## set, choosing the default provisioner. (gp2 on AWS, standard on
|
|||
|
## GKE, AWS & OpenStack)
|
|||
|
##
|
|||
|
# storageClass: "-"
|
|||
|
|
|||
|
## alertmanager data Persistent Volume Binding Mode
|
|||
|
## If defined, volumeBindingMode: <volumeBindingMode>
|
|||
|
## If undefined (the default) or set to null, no volumeBindingMode spec is
|
|||
|
## set, choosing the default mode.
|
|||
|
##
|
|||
|
# volumeBindingMode: ""
|
|||
|
|
|||
|
## Subdirectory of alertmanager data Persistent Volume to mount
|
|||
|
## Useful if the volume's root directory is not empty
|
|||
|
##
|
|||
|
subPath: ""
|
|||
|
|
|||
|
## Annotations to be added to alertmanager pods
|
|||
|
##
|
|||
|
podAnnotations: {}
|
|||
|
## Tell prometheus to use a specific set of alertmanager pods
|
|||
|
## instead of all alertmanager pods found in the same namespace
|
|||
|
## Useful if you deploy multiple releases within the same namespace
|
|||
|
##
|
|||
|
## prometheus.io/probe: alertmanager-teamA
|
|||
|
|
|||
|
## Labels to be added to Prometheus AlertManager pods
|
|||
|
##
|
|||
|
podLabels: {}
|
|||
|
|
|||
|
## Use a StatefulSet if replicaCount needs to be greater than 1 (see below)
|
|||
|
##
|
|||
|
replicaCount: 1
|
|||
|
|
|||
|
statefulSet:
|
|||
|
## If true, use a statefulset instead of a deployment for pod management.
|
|||
|
## This allows to scale replicas to more than 1 pod
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
podManagementPolicy: OrderedReady
|
|||
|
|
|||
|
## Alertmanager headless service to use for the statefulset
|
|||
|
##
|
|||
|
headless:
|
|||
|
annotations: {}
|
|||
|
labels: {}
|
|||
|
|
|||
|
## Enabling peer mesh service end points for enabling the HA alert manager
|
|||
|
## Ref: https://github.com/prometheus/alertmanager/blob/master/README.md
|
|||
|
# enableMeshPeer : true
|
|||
|
|
|||
|
servicePort: 80
|
|||
|
|
|||
|
## alertmanager resource requests and limits
|
|||
|
## Ref: http://kubernetes.io/docs/user-guide/compute-resources/
|
|||
|
##
|
|||
|
resources: {}
|
|||
|
# limits:
|
|||
|
# cpu: 10m
|
|||
|
# memory: 32Mi
|
|||
|
# requests:
|
|||
|
# cpu: 10m
|
|||
|
# memory: 32Mi
|
|||
|
|
|||
|
## Security context to be added to alertmanager pods
|
|||
|
##
|
|||
|
securityContext:
|
|||
|
runAsUser: 1001
|
|||
|
runAsNonRoot: true
|
|||
|
runAsGroup: 1001
|
|||
|
fsGroup: 1001
|
|||
|
|
|||
|
service:
|
|||
|
annotations: {}
|
|||
|
labels: {}
|
|||
|
clusterIP: ""
|
|||
|
|
|||
|
## Enabling peer mesh service end points for enabling the HA alert manager
|
|||
|
## Ref: https://github.com/prometheus/alertmanager/blob/master/README.md
|
|||
|
# enableMeshPeer : true
|
|||
|
|
|||
|
## List of IP addresses at which the alertmanager service is available
|
|||
|
## Ref: https://kubernetes.io/docs/user-guide/services/#external-ips
|
|||
|
##
|
|||
|
externalIPs: []
|
|||
|
|
|||
|
loadBalancerIP: ""
|
|||
|
loadBalancerSourceRanges: []
|
|||
|
servicePort: 80
|
|||
|
# nodePort: 30000
|
|||
|
sessionAffinity: None
|
|||
|
type: ClusterIP
|
|||
|
|
|||
|
# Define a custom scheduler for Alertmanager pods
|
|||
|
# schedulerName: default-scheduler
|
|||
|
|
|||
|
## alertmanager ConfigMap entries
|
|||
|
##
|
|||
|
alertmanagerFiles:
|
|||
|
alertmanager.yml:
|
|||
|
global: {}
|
|||
|
# slack_api_url: ''
|
|||
|
|
|||
|
receivers:
|
|||
|
- name: default-receiver
|
|||
|
# slack_configs:
|
|||
|
# - channel: '@you'
|
|||
|
# send_resolved: true
|
|||
|
|
|||
|
route:
|
|||
|
group_wait: 10s
|
|||
|
group_interval: 5m
|
|||
|
receiver: default-receiver
|
|||
|
repeat_interval: 3h
|
|||
|
|
|||
|
## Monitors ConfigMap changes and POSTs to a URL
|
|||
|
configmapReload:
|
|||
|
prometheus:
|
|||
|
## If false, the configmap-reload container will not be deployed
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
## configmap-reload container name
|
|||
|
##
|
|||
|
name: configmap-reload
|
|||
|
|
|||
|
## configmap-reload container image
|
|||
|
##
|
|||
|
image:
|
|||
|
repository: cgr.dev/chainguard/prometheus-config-reloader
|
|||
|
tag: latest
|
|||
|
pullPolicy: IfNotPresent
|
|||
|
|
|||
|
## Additional configmap-reload container arguments
|
|||
|
##
|
|||
|
extraArgs: {}
|
|||
|
## Additional configmap-reload volume directories
|
|||
|
##
|
|||
|
extraVolumeDirs: []
|
|||
|
|
|||
|
## Additional configmap-reload mounts
|
|||
|
##
|
|||
|
extraConfigmapMounts: []
|
|||
|
# - name: prometheus-alerts
|
|||
|
# mountPath: /etc/alerts.d
|
|||
|
# subPath: ""
|
|||
|
# configMap: prometheus-alerts
|
|||
|
# readOnly: true
|
|||
|
|
|||
|
## configmap-reload resource requests and limits
|
|||
|
## Ref: http://kubernetes.io/docs/user-guide/compute-resources/
|
|||
|
##
|
|||
|
resources: {}
|
|||
|
|
|||
|
## configmap-reload container securityContext
|
|||
|
containerSecurityContext: {}
|
|||
|
|
|||
|
alertmanager:
|
|||
|
## If false, the configmap-reload container will not be deployed
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
## configmap-reload container name
|
|||
|
##
|
|||
|
name: configmap-reload
|
|||
|
|
|||
|
## configmap-reload container image
|
|||
|
##
|
|||
|
image:
|
|||
|
repository: cgr.dev/chainguard/prometheus-config-reloader
|
|||
|
tag: latest
|
|||
|
pullPolicy: IfNotPresent
|
|||
|
|
|||
|
## Additional configmap-reload container arguments
|
|||
|
##
|
|||
|
extraArgs: {}
|
|||
|
## Additional configmap-reload volume directories
|
|||
|
##
|
|||
|
extraVolumeDirs: []
|
|||
|
|
|||
|
|
|||
|
## Additional configmap-reload mounts
|
|||
|
##
|
|||
|
extraConfigmapMounts: []
|
|||
|
# - name: prometheus-alerts
|
|||
|
# mountPath: /etc/alerts.d
|
|||
|
# subPath: ""
|
|||
|
# configMap: prometheus-alerts
|
|||
|
# readOnly: true
|
|||
|
|
|||
|
|
|||
|
## configmap-reload resource requests and limits
|
|||
|
## Ref: http://kubernetes.io/docs/user-guide/compute-resources/
|
|||
|
##
|
|||
|
resources: {}
|
|||
|
|
|||
|
# node-export must be disabled if there is an existing daemonset: https://guide.kubecost.com/hc/en-us/articles/4407601830679-Troubleshoot-Install#a-name-node-exporter-a-issue-failedscheduling-kubecost-prometheus-node-exporter
|
|||
|
nodeExporter:
|
|||
|
## If false, node-exporter will not be installed.
|
|||
|
## This is disabled by default in Kubecost 2.0, though it can be enabled as needed.
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
## Provide a full name override for node exporter.
|
|||
|
# fullnameOverride: ""
|
|||
|
|
|||
|
## If true, node-exporter pods share the host network namespace
|
|||
|
##
|
|||
|
hostNetwork: true
|
|||
|
|
|||
|
## If true, node-exporter pods share the host PID namespace
|
|||
|
##
|
|||
|
hostPID: true
|
|||
|
|
|||
|
## node-exporter dns policy
|
|||
|
##
|
|||
|
dnsPolicy: ClusterFirstWithHostNet
|
|||
|
|
|||
|
## node-exporter container name
|
|||
|
##
|
|||
|
name: node-exporter
|
|||
|
|
|||
|
## node-exporter container image
|
|||
|
##
|
|||
|
image:
|
|||
|
repository: prom/node-exporter
|
|||
|
tag: v1.8.2
|
|||
|
pullPolicy: IfNotPresent
|
|||
|
|
|||
|
## node-exporter priorityClassName
|
|||
|
##
|
|||
|
priorityClassName: ""
|
|||
|
|
|||
|
## Custom Update Strategy
|
|||
|
##
|
|||
|
updateStrategy:
|
|||
|
type: RollingUpdate
|
|||
|
|
|||
|
## Additional node-exporter container arguments
|
|||
|
##
|
|||
|
extraArgs: {}
|
|||
|
|
|||
|
## Additional node-exporter hostPath mounts
|
|||
|
##
|
|||
|
extraHostPathMounts: []
|
|||
|
# - name: textfile-dir
|
|||
|
# mountPath: /srv/txt_collector
|
|||
|
# hostPath: /var/lib/node-exporter
|
|||
|
# readOnly: true
|
|||
|
# mountPropagation: HostToContainer
|
|||
|
|
|||
|
extraConfigmapMounts: []
|
|||
|
# - name: certs-configmap
|
|||
|
# mountPath: /prometheus
|
|||
|
# configMap: certs-configmap
|
|||
|
# readOnly: true
|
|||
|
|
|||
|
## Set a custom affinity for node-exporter
|
|||
|
##
|
|||
|
# affinity:
|
|||
|
|
|||
|
## Node tolerations for node-exporter scheduling to nodes with taints
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/assign-pod-node/
|
|||
|
##
|
|||
|
tolerations: []
|
|||
|
# - key: "key"
|
|||
|
# operator: "Equal|Exists"
|
|||
|
# value: "value"
|
|||
|
# effect: "NoSchedule|PreferNoSchedule|NoExecute(1.6 only)"
|
|||
|
|
|||
|
## Node labels for node-exporter pod assignment
|
|||
|
## Ref: https://kubernetes.io/docs/user-guide/node-selection/
|
|||
|
##
|
|||
|
nodeSelector: {}
|
|||
|
|
|||
|
## Annotations to be added to node-exporter pods
|
|||
|
##
|
|||
|
podAnnotations: {}
|
|||
|
|
|||
|
## Annotations to be added to the node-exporter DaemonSet
|
|||
|
##
|
|||
|
deploymentAnnotations: {}
|
|||
|
|
|||
|
## Labels to be added to node-exporter pods
|
|||
|
##
|
|||
|
pod:
|
|||
|
labels: {}
|
|||
|
|
|||
|
## PodDisruptionBudget settings
|
|||
|
## ref: https://kubernetes.io/docs/concepts/workloads/pods/disruptions/
|
|||
|
##
|
|||
|
podDisruptionBudget:
|
|||
|
enabled: false
|
|||
|
maxUnavailable: 1
|
|||
|
|
|||
|
## node-exporter resource limits & requests
|
|||
|
## Ref: https://kubernetes.io/docs/user-guide/compute-resources/
|
|||
|
##
|
|||
|
resources: {}
|
|||
|
# limits:
|
|||
|
# cpu: 200m
|
|||
|
# memory: 50Mi
|
|||
|
# requests:
|
|||
|
# cpu: 100m
|
|||
|
# memory: 30Mi
|
|||
|
|
|||
|
## Security context to be added to node-exporter pods
|
|||
|
##
|
|||
|
securityContext: {}
|
|||
|
# runAsUser: 0
|
|||
|
|
|||
|
service:
|
|||
|
annotations:
|
|||
|
prometheus.io/scrape: "true"
|
|||
|
labels: {}
|
|||
|
|
|||
|
# Exposed as a headless service:
|
|||
|
# https://kubernetes.io/docs/concepts/services-networking/service/#headless-services
|
|||
|
clusterIP: None
|
|||
|
|
|||
|
## List of IP addresses at which the node-exporter service is available
|
|||
|
## Ref: https://kubernetes.io/docs/user-guide/services/#external-ips
|
|||
|
##
|
|||
|
externalIPs: []
|
|||
|
|
|||
|
hostPort: 9100
|
|||
|
loadBalancerIP: ""
|
|||
|
loadBalancerSourceRanges: []
|
|||
|
servicePort: 9100
|
|||
|
type: ClusterIP
|
|||
|
|
|||
|
# Install Prometheus Push Gateway.
|
|||
|
pushgateway:
|
|||
|
## If false, pushgateway will not be installed
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
## Provide a full name override for Prometheus push gateway.
|
|||
|
# fullnameOverride: ""
|
|||
|
|
|||
|
## Use an alternate scheduler, e.g. "stork".
|
|||
|
## ref: https://kubernetes.io/docs/tasks/administer-cluster/configure-multiple-schedulers/
|
|||
|
##
|
|||
|
# schedulerName:
|
|||
|
|
|||
|
## pushgateway container name
|
|||
|
##
|
|||
|
name: pushgateway
|
|||
|
|
|||
|
## pushgateway container image
|
|||
|
##
|
|||
|
image:
|
|||
|
repository: prom/pushgateway
|
|||
|
tag: v1.9.0
|
|||
|
pullPolicy: IfNotPresent
|
|||
|
|
|||
|
## pushgateway priorityClassName
|
|||
|
##
|
|||
|
priorityClassName: ""
|
|||
|
|
|||
|
## Additional pushgateway container arguments
|
|||
|
##
|
|||
|
## for example: persistence.file: /data/pushgateway.data
|
|||
|
extraArgs: {}
|
|||
|
|
|||
|
ingress:
|
|||
|
## If true, pushgateway Ingress will be created
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
## pushgateway Ingress annotations
|
|||
|
##
|
|||
|
annotations: {}
|
|||
|
# kubernetes.io/ingress.class: nginx
|
|||
|
# kubernetes.io/tls-acme: 'true'
|
|||
|
|
|||
|
## pushgateway Ingress hostnames with optional path
|
|||
|
## Must be provided if Ingress is enabled
|
|||
|
##
|
|||
|
hosts: []
|
|||
|
# - pushgateway.domain.com
|
|||
|
# - domain.com/pushgateway
|
|||
|
|
|||
|
## Extra paths to prepend to every host configuration. This is useful when working with annotation based services.
|
|||
|
extraPaths: []
|
|||
|
# - path: /*
|
|||
|
# backend:
|
|||
|
# serviceName: ssl-redirect
|
|||
|
# servicePort: use-annotation
|
|||
|
|
|||
|
## pushgateway Ingress TLS configuration
|
|||
|
## Secrets must be manually created in the namespace
|
|||
|
##
|
|||
|
tls: []
|
|||
|
# - secretName: prometheus-alerts-tls
|
|||
|
# hosts:
|
|||
|
# - pushgateway.domain.com
|
|||
|
|
|||
|
## Node tolerations for pushgateway scheduling to nodes with taints
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/assign-pod-node/
|
|||
|
##
|
|||
|
tolerations: []
|
|||
|
# - key: "key"
|
|||
|
# operator: "Equal|Exists"
|
|||
|
# value: "value"
|
|||
|
# effect: "NoSchedule|PreferNoSchedule|NoExecute(1.6 only)"
|
|||
|
|
|||
|
## Node labels for pushgateway pod assignment
|
|||
|
## Ref: https://kubernetes.io/docs/user-guide/node-selection/
|
|||
|
##
|
|||
|
nodeSelector: {}
|
|||
|
|
|||
|
## Annotations to be added to pushgateway pods
|
|||
|
##
|
|||
|
podAnnotations: {}
|
|||
|
|
|||
|
replicaCount: 1
|
|||
|
|
|||
|
## PodDisruptionBudget settings
|
|||
|
## ref: https://kubernetes.io/docs/concepts/workloads/pods/disruptions/
|
|||
|
##
|
|||
|
podDisruptionBudget:
|
|||
|
enabled: false
|
|||
|
maxUnavailable: 1
|
|||
|
|
|||
|
## pushgateway resource requests and limits
|
|||
|
## Ref: http://kubernetes.io/docs/user-guide/compute-resources/
|
|||
|
##
|
|||
|
resources: {}
|
|||
|
# limits:
|
|||
|
# cpu: 10m
|
|||
|
# memory: 32Mi
|
|||
|
# requests:
|
|||
|
# cpu: 10m
|
|||
|
# memory: 32Mi
|
|||
|
|
|||
|
## Security context to be added to push-gateway pods
|
|||
|
##
|
|||
|
securityContext:
|
|||
|
runAsUser: 1001
|
|||
|
runAsNonRoot: true
|
|||
|
|
|||
|
service:
|
|||
|
annotations:
|
|||
|
prometheus.io/probe: pushgateway
|
|||
|
labels: {}
|
|||
|
clusterIP: ""
|
|||
|
|
|||
|
## List of IP addresses at which the pushgateway service is available
|
|||
|
## Ref: https://kubernetes.io/docs/user-guide/services/#external-ips
|
|||
|
##
|
|||
|
externalIPs: []
|
|||
|
|
|||
|
loadBalancerIP: ""
|
|||
|
loadBalancerSourceRanges: []
|
|||
|
servicePort: 9091
|
|||
|
type: ClusterIP
|
|||
|
|
|||
|
strategy:
|
|||
|
type: Recreate
|
|||
|
rollingUpdate: null
|
|||
|
|
|||
|
|
|||
|
persistentVolume:
|
|||
|
## If true, pushgateway will create/use a Persistent Volume Claim
|
|||
|
## If false, use emptyDir
|
|||
|
##
|
|||
|
enabled: true
|
|||
|
|
|||
|
## pushgateway data Persistent Volume access modes
|
|||
|
## Must match those of existing PV or dynamic provisioner
|
|||
|
## Ref: http://kubernetes.io/docs/user-guide/persistent-volumes/
|
|||
|
##
|
|||
|
accessModes:
|
|||
|
- ReadWriteOnce
|
|||
|
|
|||
|
## pushgateway data Persistent Volume Claim annotations
|
|||
|
##
|
|||
|
annotations: {}
|
|||
|
|
|||
|
## pushgateway data Persistent Volume existing claim name
|
|||
|
## Requires pushgateway.persistentVolume.enabled: true
|
|||
|
## If defined, PVC must be created manually before volume will be bound
|
|||
|
existingClaim: ""
|
|||
|
|
|||
|
## pushgateway data Persistent Volume mount root path
|
|||
|
##
|
|||
|
mountPath: /data
|
|||
|
|
|||
|
## pushgateway data Persistent Volume size
|
|||
|
##
|
|||
|
size: 2Gi
|
|||
|
|
|||
|
## pushgateway data Persistent Volume Storage Class
|
|||
|
## If defined, storageClassName: <storageClass>
|
|||
|
## If set to "-", storageClassName: "", which disables dynamic provisioning
|
|||
|
## If undefined (the default) or set to null, no storageClassName spec is
|
|||
|
## set, choosing the default provisioner. (gp2 on AWS, standard on
|
|||
|
## GKE, AWS & OpenStack)
|
|||
|
##
|
|||
|
# storageClass: "-"
|
|||
|
|
|||
|
## pushgateway data Persistent Volume Binding Mode
|
|||
|
## If defined, volumeBindingMode: <volumeBindingMode>
|
|||
|
## If undefined (the default) or set to null, no volumeBindingMode spec is
|
|||
|
## set, choosing the default mode.
|
|||
|
##
|
|||
|
# volumeBindingMode: ""
|
|||
|
|
|||
|
## Subdirectory of pushgateway data Persistent Volume to mount
|
|||
|
## Useful if the volume's root directory is not empty
|
|||
|
##
|
|||
|
subPath: ""
|
|||
|
|
|||
|
serverFiles:
|
|||
|
## Alerts configuration
|
|||
|
## Ref: https://prometheus.io/docs/prometheus/latest/configuration/alerting_rules/
|
|||
|
alerting_rules.yml: {}
|
|||
|
# groups:
|
|||
|
# - name: Instances
|
|||
|
# rules:
|
|||
|
# - alert: InstanceDown
|
|||
|
# expr: up == 0
|
|||
|
# for: 5m
|
|||
|
# labels:
|
|||
|
# severity: page
|
|||
|
# annotations:
|
|||
|
# description: '{{ $labels.instance }} of job {{ $labels.job }} has been down for more than 5 minutes.'
|
|||
|
# summary: 'Instance {{ $labels.instance }} down'
|
|||
|
## DEPRECATED DEFAULT VALUE, unless explicitly naming your files, please use alerting_rules.yml
|
|||
|
alerts: {}
|
|||
|
|
|||
|
## Records configuration
|
|||
|
## Ref: https://prometheus.io/docs/prometheus/latest/configuration/recording_rules/
|
|||
|
recording_rules.yml: {}
|
|||
|
## DEPRECATED DEFAULT VALUE, unless explicitly naming your files, please use recording_rules.yml
|
|||
|
|
|||
|
prometheus.yml:
|
|||
|
rule_files:
|
|||
|
- /etc/config/recording_rules.yml
|
|||
|
- /etc/config/alerting_rules.yml
|
|||
|
## Below two files are DEPRECATED will be removed from this default values file
|
|||
|
- /etc/config/rules
|
|||
|
- /etc/config/alerts
|
|||
|
|
|||
|
scrape_configs:
|
|||
|
- job_name: prometheus
|
|||
|
static_configs:
|
|||
|
- targets:
|
|||
|
- localhost:9090
|
|||
|
|
|||
|
# A scrape configuration for running Prometheus on a Kubernetes cluster.
|
|||
|
# This uses separate scrape configs for cluster components (i.e. API server, node)
|
|||
|
# and services to allow each to use different authentication configs.
|
|||
|
#
|
|||
|
# Kubernetes labels will be added as Prometheus labels on metrics via the
|
|||
|
# `labelmap` relabeling action.
|
|||
|
|
|||
|
- job_name: 'kubernetes-nodes-cadvisor'
|
|||
|
|
|||
|
# Default to scraping over https. If required, just disable this or change to
|
|||
|
# `http`.
|
|||
|
scheme: https
|
|||
|
|
|||
|
# This TLS & bearer token file config is used to connect to the actual scrape
|
|||
|
# endpoints for cluster components. This is separate to discovery auth
|
|||
|
# configuration because discovery & scraping are two separate concerns in
|
|||
|
# Prometheus. The discovery auth config is automatic if Prometheus runs inside
|
|||
|
# the cluster. Otherwise, more config options have to be provided within the
|
|||
|
# <kubernetes_sd_config>.
|
|||
|
tls_config:
|
|||
|
ca_file: /var/run/secrets/kubernetes.io/serviceaccount/ca.crt
|
|||
|
# If your node certificates are self-signed or use a different CA to the
|
|||
|
# master CA, then disable certificate verification below. Note that
|
|||
|
# certificate verification is an integral part of a secure infrastructure
|
|||
|
# so this should only be disabled in a controlled environment. You can
|
|||
|
# disable certificate verification by uncommenting the line below.
|
|||
|
#
|
|||
|
insecure_skip_verify: true
|
|||
|
bearer_token_file: /var/run/secrets/kubernetes.io/serviceaccount/token
|
|||
|
|
|||
|
kubernetes_sd_configs:
|
|||
|
- role: node
|
|||
|
|
|||
|
# This configuration will work only on kubelet 1.7.3+
|
|||
|
# As the scrape endpoints for cAdvisor have changed
|
|||
|
# if you are using older version you need to change the replacement to
|
|||
|
# replacement: /api/v1/nodes/$1:4194/proxy/metrics
|
|||
|
# more info here https://github.com/coreos/prometheus-operator/issues/633
|
|||
|
relabel_configs:
|
|||
|
- action: labelmap
|
|||
|
regex: __meta_kubernetes_node_label_(.+)
|
|||
|
- target_label: __address__
|
|||
|
replacement: kubernetes.default.svc:443
|
|||
|
- source_labels: [__meta_kubernetes_node_name]
|
|||
|
regex: (.+)
|
|||
|
target_label: __metrics_path__
|
|||
|
replacement: /api/v1/nodes/$1/proxy/metrics/cadvisor
|
|||
|
|
|||
|
metric_relabel_configs:
|
|||
|
- source_labels: [__name__]
|
|||
|
regex: (container_cpu_usage_seconds_total|container_memory_working_set_bytes|container_network_receive_errors_total|container_network_transmit_errors_total|container_network_receive_packets_dropped_total|container_network_transmit_packets_dropped_total|container_memory_usage_bytes|container_cpu_cfs_throttled_periods_total|container_cpu_cfs_periods_total|container_fs_usage_bytes|container_fs_limit_bytes|container_cpu_cfs_periods_total|container_fs_inodes_free|container_fs_inodes_total|container_fs_usage_bytes|container_fs_limit_bytes|container_cpu_cfs_throttled_periods_total|container_cpu_cfs_periods_total|container_network_receive_bytes_total|container_network_transmit_bytes_total|container_fs_inodes_free|container_fs_inodes_total|container_fs_usage_bytes|container_fs_limit_bytes|container_spec_cpu_shares|container_spec_memory_limit_bytes|container_network_receive_bytes_total|container_network_transmit_bytes_total|container_fs_reads_bytes_total|container_network_receive_bytes_total|container_fs_writes_bytes_total|container_fs_reads_bytes_total|cadvisor_version_info|kubecost_pv_info)
|
|||
|
action: keep
|
|||
|
- source_labels: [container]
|
|||
|
target_label: container_name
|
|||
|
regex: (.+)
|
|||
|
action: replace
|
|||
|
- source_labels: [pod]
|
|||
|
target_label: pod_name
|
|||
|
regex: (.+)
|
|||
|
action: replace
|
|||
|
|
|||
|
# A scrape configuration for running Prometheus on a Kubernetes cluster.
|
|||
|
# This uses separate scrape configs for cluster components (i.e. API server, node)
|
|||
|
# and services to allow each to use different authentication configs.
|
|||
|
#
|
|||
|
# Kubernetes labels will be added as Prometheus labels on metrics via the
|
|||
|
# `labelmap` relabeling action.
|
|||
|
|
|||
|
- job_name: 'kubernetes-nodes'
|
|||
|
|
|||
|
# Default to scraping over https. If required, just disable this or change to
|
|||
|
# `http`.
|
|||
|
scheme: https
|
|||
|
|
|||
|
# This TLS & bearer token file config is used to connect to the actual scrape
|
|||
|
# endpoints for cluster components. This is separate to discovery auth
|
|||
|
# configuration because discovery & scraping are two separate concerns in
|
|||
|
# Prometheus. The discovery auth config is automatic if Prometheus runs inside
|
|||
|
# the cluster. Otherwise, more config options have to be provided within the
|
|||
|
# <kubernetes_sd_config>.
|
|||
|
tls_config:
|
|||
|
ca_file: /var/run/secrets/kubernetes.io/serviceaccount/ca.crt
|
|||
|
# If your node certificates are self-signed or use a different CA to the
|
|||
|
# master CA, then disable certificate verification below. Note that
|
|||
|
# certificate verification is an integral part of a secure infrastructure
|
|||
|
# so this should only be disabled in a controlled environment. You can
|
|||
|
# disable certificate verification by uncommenting the line below.
|
|||
|
#
|
|||
|
insecure_skip_verify: true
|
|||
|
bearer_token_file: /var/run/secrets/kubernetes.io/serviceaccount/token
|
|||
|
|
|||
|
kubernetes_sd_configs:
|
|||
|
- role: node
|
|||
|
|
|||
|
relabel_configs:
|
|||
|
- action: labelmap
|
|||
|
regex: __meta_kubernetes_node_label_(.+)
|
|||
|
- target_label: __address__
|
|||
|
replacement: kubernetes.default.svc:443
|
|||
|
- source_labels: [__meta_kubernetes_node_name]
|
|||
|
regex: (.+)
|
|||
|
target_label: __metrics_path__
|
|||
|
replacement: /api/v1/nodes/$1/proxy/metrics
|
|||
|
|
|||
|
metric_relabel_configs:
|
|||
|
- source_labels: [__name__]
|
|||
|
regex: (kubelet_volume_stats_used_bytes) # this metric is in alpha
|
|||
|
action: keep
|
|||
|
|
|||
|
# Scrape config for service endpoints.
|
|||
|
#
|
|||
|
# The relabeling allows the actual service scrape endpoint to be configured
|
|||
|
# via the following annotations:
|
|||
|
#
|
|||
|
# * `prometheus.io/scrape`: Only scrape services that have a value of `true`
|
|||
|
# * `prometheus.io/scheme`: If the metrics endpoint is secured then you will need
|
|||
|
# to set this to `https` & most likely set the `tls_config` of the scrape config.
|
|||
|
# * `prometheus.io/path`: If the metrics path is not `/metrics` override this.
|
|||
|
# * `prometheus.io/port`: If the metrics are exposed on a different port to the
|
|||
|
# service then set this appropriately.
|
|||
|
- job_name: 'kubernetes-service-endpoints'
|
|||
|
|
|||
|
kubernetes_sd_configs:
|
|||
|
- role: endpoints
|
|||
|
|
|||
|
relabel_configs:
|
|||
|
- source_labels: [__meta_kubernetes_service_annotation_prometheus_io_scrape]
|
|||
|
action: keep
|
|||
|
regex: true
|
|||
|
- source_labels: [__meta_kubernetes_endpoints_name]
|
|||
|
action: keep
|
|||
|
regex: (.*node-exporter|kubecost-network-costs)
|
|||
|
- source_labels: [__meta_kubernetes_service_annotation_prometheus_io_scheme]
|
|||
|
action: replace
|
|||
|
target_label: __scheme__
|
|||
|
regex: (https?)
|
|||
|
- source_labels: [__meta_kubernetes_service_annotation_prometheus_io_path]
|
|||
|
action: replace
|
|||
|
target_label: __metrics_path__
|
|||
|
regex: (.+)
|
|||
|
- source_labels: [__address__, __meta_kubernetes_service_annotation_prometheus_io_port]
|
|||
|
action: replace
|
|||
|
target_label: __address__
|
|||
|
regex: ([^:]+)(?::\d+)?;(\d+)
|
|||
|
replacement: $1:$2
|
|||
|
- action: labelmap
|
|||
|
regex: __meta_kubernetes_service_label_(.+)
|
|||
|
- source_labels: [__meta_kubernetes_namespace]
|
|||
|
action: replace
|
|||
|
target_label: kubernetes_namespace
|
|||
|
- source_labels: [__meta_kubernetes_service_name]
|
|||
|
action: replace
|
|||
|
target_label: kubernetes_name
|
|||
|
- source_labels: [__meta_kubernetes_pod_node_name]
|
|||
|
action: replace
|
|||
|
target_label: kubernetes_node
|
|||
|
metric_relabel_configs:
|
|||
|
- source_labels: [__name__]
|
|||
|
regex: (container_cpu_allocation|container_cpu_usage_seconds_total|container_fs_limit_bytes|container_fs_writes_bytes_total|container_gpu_allocation|container_memory_allocation_bytes|container_memory_usage_bytes|container_memory_working_set_bytes|container_network_receive_bytes_total|container_network_transmit_bytes_total|DCGM_FI_DEV_GPU_UTIL|deployment_match_labels|kube_daemonset_status_desired_number_scheduled|kube_daemonset_status_number_ready|kube_deployment_spec_replicas|kube_deployment_status_replicas|kube_deployment_status_replicas_available|kube_job_status_failed|kube_namespace_annotations|kube_namespace_labels|kube_node_info|kube_node_labels|kube_node_status_allocatable|kube_node_status_allocatable_cpu_cores|kube_node_status_allocatable_memory_bytes|kube_node_status_capacity|kube_node_status_capacity_cpu_cores|kube_node_status_capacity_memory_bytes|kube_node_status_condition|kube_persistentvolume_capacity_bytes|kube_persistentvolume_status_phase|kube_persistentvolumeclaim_info|kube_persistentvolumeclaim_resource_requests_storage_bytes|kube_pod_container_info|kube_pod_container_resource_limits|kube_pod_container_resource_limits_cpu_cores|kube_pod_container_resource_limits_memory_bytes|kube_pod_container_resource_requests|kube_pod_container_resource_requests_cpu_cores|kube_pod_container_resource_requests_memory_bytes|kube_pod_container_status_restarts_total|kube_pod_container_status_running|kube_pod_container_status_terminated_reason|kube_pod_labels|kube_pod_owner|kube_pod_status_phase|kube_replicaset_owner|kube_statefulset_replicas|kube_statefulset_status_replicas|kubecost_cluster_info|kubecost_cluster_management_cost|kubecost_cluster_memory_working_set_bytes|kubecost_load_balancer_cost|kubecost_network_internet_egress_cost|kubecost_network_region_egress_cost|kubecost_network_zone_egress_cost|kubecost_node_is_spot|kubecost_pod_network_egress_bytes_total|node_cpu_hourly_cost|node_cpu_seconds_total|node_disk_reads_completed|node_disk_reads_completed_total|node_disk_writes_completed|node_disk_writes_completed_total|node_filesystem_device_error|node_gpu_count|node_gpu_hourly_cost|node_memory_Buffers_bytes|node_memory_Cached_bytes|node_memory_MemAvailable_bytes|node_memory_MemFree_bytes|node_memory_MemTotal_bytes|node_network_transmit_bytes_total|node_ram_hourly_cost|node_total_hourly_cost|pod_pvc_allocation|pv_hourly_cost|service_selector_labels|statefulSet_match_labels|kubecost_pv_info|up)
|
|||
|
action: keep
|
|||
|
|
|||
|
|
|||
|
# prometheus.yml: # Sample block -- enable if using an in cluster durable store.
|
|||
|
# remote_write:
|
|||
|
# - url: "http://pgprometheus-adapter:9201/write"
|
|||
|
# write_relabel_configs:
|
|||
|
# - source_labels: [__name__]
|
|||
|
# regex: 'container_.*_allocation|container_.*_allocation_bytes|.*_hourly_cost|kube_pod_container_resource_requests{resource="memory", unit="byte"}|container_memory_working_set_bytes|kube_pod_container_resource_requests{resource="cpu", unit="core"}|kube_pod_container_resource_requests|pod_pvc_allocation|kube_namespace_labels|kube_pod_labels'
|
|||
|
# action: keep
|
|||
|
# queue_config:
|
|||
|
# max_samples_per_send: 1000
|
|||
|
# remote_read:
|
|||
|
# - url: "http://pgprometheus-adapter:9201/read"
|
|||
|
rules:
|
|||
|
groups:
|
|||
|
- name: CPU
|
|||
|
rules:
|
|||
|
- expr: sum(rate(container_cpu_usage_seconds_total{container!=""}[5m]))
|
|||
|
record: cluster:cpu_usage:rate5m
|
|||
|
- expr: rate(container_cpu_usage_seconds_total{container!=""}[5m])
|
|||
|
record: cluster:cpu_usage_nosum:rate5m
|
|||
|
- expr: avg(irate(container_cpu_usage_seconds_total{container!="POD", container!=""}[5m])) by (container,pod,namespace)
|
|||
|
record: kubecost_container_cpu_usage_irate
|
|||
|
- expr: sum(container_memory_working_set_bytes{container!="POD",container!=""}) by (container,pod,namespace)
|
|||
|
record: kubecost_container_memory_working_set_bytes
|
|||
|
- expr: sum(container_memory_working_set_bytes{container!="POD",container!=""})
|
|||
|
record: kubecost_cluster_memory_working_set_bytes
|
|||
|
- name: Savings
|
|||
|
rules:
|
|||
|
- expr: sum(avg(kube_pod_owner{owner_kind!="DaemonSet"}) by (pod) * sum(container_cpu_allocation) by (pod))
|
|||
|
record: kubecost_savings_cpu_allocation
|
|||
|
labels:
|
|||
|
daemonset: "false"
|
|||
|
- expr: sum(avg(kube_pod_owner{owner_kind="DaemonSet"}) by (pod) * sum(container_cpu_allocation) by (pod)) / sum(kube_node_info)
|
|||
|
record: kubecost_savings_cpu_allocation
|
|||
|
labels:
|
|||
|
daemonset: "true"
|
|||
|
- expr: sum(avg(kube_pod_owner{owner_kind!="DaemonSet"}) by (pod) * sum(container_memory_allocation_bytes) by (pod))
|
|||
|
record: kubecost_savings_memory_allocation_bytes
|
|||
|
labels:
|
|||
|
daemonset: "false"
|
|||
|
- expr: sum(avg(kube_pod_owner{owner_kind="DaemonSet"}) by (pod) * sum(container_memory_allocation_bytes) by (pod)) / sum(kube_node_info)
|
|||
|
record: kubecost_savings_memory_allocation_bytes
|
|||
|
labels:
|
|||
|
daemonset: "true"
|
|||
|
|
|||
|
# Adds option to add alert_relabel_configs to avoid duplicate alerts in alertmanager
|
|||
|
# useful in H/A prometheus with different external labels but the same alerts
|
|||
|
alertRelabelConfigs:
|
|||
|
# alert_relabel_configs:
|
|||
|
# - source_labels: [dc]
|
|||
|
# regex: (.+)\d+
|
|||
|
# target_label: dc
|
|||
|
|
|||
|
networkPolicy:
|
|||
|
## Enable creation of NetworkPolicy resources.
|
|||
|
##
|
|||
|
enabled: false
|
|||
|
|
|||
|
|
|||
|
## Optional daemonset to more accurately attribute network costs to the correct workload
|
|||
|
## https://docs.kubecost.com/install-and-configure/advanced-configuration/network-costs-configuration
|
|||
|
networkCosts:
|
|||
|
enabled: false
|
|||
|
image:
|
|||
|
repository: gcr.io/kubecost1/kubecost-network-costs
|
|||
|
tag: v0.17.6
|
|||
|
imagePullPolicy: IfNotPresent
|
|||
|
updateStrategy:
|
|||
|
type: RollingUpdate
|
|||
|
# For existing Prometheus Installs, use the serviceMonitor: or prometheusScrape below.
|
|||
|
# the below setting annotates the networkCost service endpoints for each of the network-costs pods.
|
|||
|
# The Service is annotated with prometheus.io/scrape: "true" to automatically get picked up by the prometheus config.
|
|||
|
# NOTE: Setting this option to true and leaving the above extraScrapeConfig "job_name: kubecost-networking" configured will cause the
|
|||
|
# NOTE: pods to be scraped twice.
|
|||
|
prometheusScrape: false
|
|||
|
# Traffic Logging will enable logging the top 5 destinations for each source
|
|||
|
# every 30 minutes.
|
|||
|
trafficLogging: true
|
|||
|
|
|||
|
logLevel: info
|
|||
|
|
|||
|
# Port will set both the containerPort and hostPort to this value.
|
|||
|
# These must be identical due to network-costs being run on hostNetwork
|
|||
|
port: 3001
|
|||
|
# this daemonset can use significant resources on large clusters: https://guide.kubecost.com/hc/en-us/articles/4407595973527-Network-Traffic-Cost-Allocation
|
|||
|
resources:
|
|||
|
limits: # remove the limits by setting cpu: null
|
|||
|
cpu: 500m # can be less, will depend on cluster size
|
|||
|
# memory: it is not recommended to set a memory limit
|
|||
|
requests:
|
|||
|
cpu: 50m
|
|||
|
memory: 20Mi
|
|||
|
extraArgs: []
|
|||
|
config:
|
|||
|
# Configuration for traffic destinations, including specific classification
|
|||
|
# for IPs and CIDR blocks. This configuration will act as an override to the
|
|||
|
# automatic classification provided by network-costs.
|
|||
|
destinations:
|
|||
|
# In Zone contains a list of address/range that will be
|
|||
|
# classified as in zone.
|
|||
|
in-zone:
|
|||
|
# Loopback Addresses in "IANA IPv4 Special-Purpose Address Registry"
|
|||
|
- "127.0.0.0/8"
|
|||
|
# IPv4 Link Local Address Space
|
|||
|
- "169.254.0.0/16"
|
|||
|
# Private Address Ranges in RFC-1918
|
|||
|
- "10.0.0.0/8" # Remove this entry if using Multi-AZ Kubernetes
|
|||
|
- "172.16.0.0/12"
|
|||
|
- "192.168.0.0/16"
|
|||
|
|
|||
|
# In Region contains a list of address/range that will be
|
|||
|
# classified as in region. This is synonymous with cross
|
|||
|
# zone traffic, where the regions between source and destinations
|
|||
|
# are the same, but the zone is different.
|
|||
|
in-region: []
|
|||
|
|
|||
|
# Cross Region contains a list of address/range that will be
|
|||
|
# classified as non-internet egress from one region to another.
|
|||
|
cross-region: []
|
|||
|
|
|||
|
# Internet contains a list of address/range that will be
|
|||
|
# classified as internet traffic. This is synonymous with traffic
|
|||
|
# that cannot be classified within the cluster.
|
|||
|
# NOTE: Internet classification filters are executed _after_
|
|||
|
# NOTE: direct-classification, but before in-zone, in-region,
|
|||
|
# NOTE: and cross-region.
|
|||
|
internet: []
|
|||
|
|
|||
|
# Direct Classification specifically maps an ip address or range
|
|||
|
# to a region (required) and/or zone (optional). This classification
|
|||
|
# takes priority over in-zone, in-region, and cross-region configurations.
|
|||
|
direct-classification: []
|
|||
|
# - region: "us-east1"
|
|||
|
# zone: "us-east1-c"
|
|||
|
# ips:
|
|||
|
# - "10.0.0.0/24"
|
|||
|
services:
|
|||
|
# google-cloud-services: when set to true, enables labeling traffic metrics with google cloud
|
|||
|
# service endpoints
|
|||
|
google-cloud-services: true
|
|||
|
# amazon-web-services: when set to true, enables labeling traffic metrics with amazon web service
|
|||
|
# endpoints.
|
|||
|
amazon-web-services: true
|
|||
|
# azure-cloud-services: when set to true, enables labeling traffic metrics with azure cloud service
|
|||
|
# endpoints
|
|||
|
azure-cloud-services: true
|
|||
|
# user defined services provide a way to define custom service endpoints which will label traffic metrics
|
|||
|
# falling within the defined address range.
|
|||
|
# services:
|
|||
|
# - service: "test-service-1"
|
|||
|
# ips:
|
|||
|
# - "19.1.1.2"
|
|||
|
# - service: "test-service-2"
|
|||
|
# ips:
|
|||
|
# - "15.128.15.2"
|
|||
|
# - "20.0.0.0/8"
|
|||
|
|
|||
|
## Node tolerations for server scheduling to nodes with taints
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/assign-pod-node/
|
|||
|
##
|
|||
|
tolerations: []
|
|||
|
# - key: "key"
|
|||
|
# operator: "Equal|Exists"
|
|||
|
# value: "value"
|
|||
|
# effect: "NoSchedule|PreferNoSchedule|NoExecute(1.6 only)"
|
|||
|
|
|||
|
affinity: {}
|
|||
|
|
|||
|
service:
|
|||
|
annotations: {}
|
|||
|
labels: {}
|
|||
|
|
|||
|
## PriorityClassName
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/pod-priority-preemption/#priorityclass
|
|||
|
priorityClassName: ""
|
|||
|
## PodMonitor
|
|||
|
## Allows scraping of network metrics from a dedicated prometheus operator setup
|
|||
|
podMonitor:
|
|||
|
enabled: false
|
|||
|
additionalLabels: {}
|
|||
|
# match the default extraScrapeConfig
|
|||
|
additionalLabels: {}
|
|||
|
nodeSelector: {}
|
|||
|
annotations: {}
|
|||
|
healthCheckProbes: {}
|
|||
|
# readinessProbe:
|
|||
|
# tcpSocket:
|
|||
|
# port: 3001
|
|||
|
# initialDelaySeconds: 5
|
|||
|
# periodSeconds: 10
|
|||
|
# failureThreshold: 5
|
|||
|
# livenessProbe:
|
|||
|
# tcpSocket:
|
|||
|
# port: 3001
|
|||
|
# initialDelaySeconds: 5
|
|||
|
# periodSeconds: 10
|
|||
|
# failureThreshold: 5
|
|||
|
additionalSecurityContext: {}
|
|||
|
# readOnlyRootFilesystem: true
|
|||
|
|
|||
|
## Kubecost Deployment Configuration
|
|||
|
## Used for HA mode in Business & Enterprise tier
|
|||
|
##
|
|||
|
kubecostDeployment:
|
|||
|
replicas: 1
|
|||
|
# deploymentStrategy:
|
|||
|
# rollingUpdate:
|
|||
|
# maxSurge: 1
|
|||
|
# maxUnavailable: 1
|
|||
|
# type: RollingUpdate
|
|||
|
labels: {}
|
|||
|
annotations: {}
|
|||
|
|
|||
|
|
|||
|
## Kubecost Forecasting forecasts future cost patterns based on historical
|
|||
|
## patterns observed by Kubecost.
|
|||
|
forecasting:
|
|||
|
enabled: true
|
|||
|
|
|||
|
# fullImageName overrides the default image construction logic. The exact
|
|||
|
# image provided (registry, image, tag) will be used for the forecasting
|
|||
|
# container.
|
|||
|
# Example: fullImageName: gcr.io/kubecost1/forecasting:v0.0.1
|
|||
|
fullImageName: gcr.io/kubecost1/kubecost-modeling:v0.1.16
|
|||
|
imagePullPolicy: IfNotPresent
|
|||
|
|
|||
|
# Resource specification block for the forecasting container.
|
|||
|
resources:
|
|||
|
requests:
|
|||
|
cpu: 200m
|
|||
|
memory: 300Mi
|
|||
|
limits:
|
|||
|
cpu: 1500m
|
|||
|
memory: 1Gi
|
|||
|
|
|||
|
# Set environment variables for the forecasting container as key/value pairs.
|
|||
|
env:
|
|||
|
# -t is the worker timeout which primarily affects model training time;
|
|||
|
# if it is not high enough, training workers may die mid training
|
|||
|
"GUNICORN_CMD_ARGS": "--log-level info -t 1200"
|
|||
|
|
|||
|
# Define a priority class for the forecasting Deployment.
|
|||
|
priority:
|
|||
|
enabled: false
|
|||
|
name: ""
|
|||
|
|
|||
|
# Define a nodeSelector for the forecasting Deployment.
|
|||
|
nodeSelector: {}
|
|||
|
|
|||
|
# Define tolerations for the forecasting Deployment.
|
|||
|
tolerations: []
|
|||
|
|
|||
|
# Define Pod affinity for the forecasting Deployment.
|
|||
|
affinity: {}
|
|||
|
|
|||
|
# Define a readiness probe for the forecasting container
|
|||
|
readinessProbe:
|
|||
|
enabled: true
|
|||
|
initialDelaySeconds: 10
|
|||
|
periodSeconds: 10
|
|||
|
failureThreshold: 200
|
|||
|
|
|||
|
# Define a liveness probe for the forecasting container.
|
|||
|
livenessProbe:
|
|||
|
enabled: true
|
|||
|
initialDelaySeconds: 10
|
|||
|
periodSeconds: 10
|
|||
|
failureThreshold: 200
|
|||
|
|
|||
|
## The Kubecost Aggregator is the primary query backend for Kubecost
|
|||
|
## Ref: https://docs.kubecost.com/install-and-configure/install/multi-cluster/federated-etl/aggregator
|
|||
|
##
|
|||
|
kubecostAggregator:
|
|||
|
# deployMethod determines how Aggregator is deployed. Current options are
|
|||
|
# "singlepod" (within cost-analyzer Pod) "statefulset" (separate
|
|||
|
# StatefulSet), and "disabled". Only use "disabled" if this is a secondary
|
|||
|
# Federated ETL cluster which does not need to answer queries.
|
|||
|
deployMethod: singlepod
|
|||
|
|
|||
|
# fullImageName overrides the default image construction logic. The exact
|
|||
|
# image provided (registry, image, tag) will be used for aggregator.
|
|||
|
# fullImageName:
|
|||
|
imagePullPolicy: IfNotPresent
|
|||
|
|
|||
|
# For legacy configuration support, `enabled: true` overrides deployMethod
|
|||
|
# and causes `deployMethod: "statefulset"`
|
|||
|
enabled: false
|
|||
|
|
|||
|
# Replicas sets the number of Aggregator replicas. It only has an effect if
|
|||
|
# `deployMethod: "statefulset"`
|
|||
|
replicas: 1
|
|||
|
|
|||
|
logLevel: info
|
|||
|
|
|||
|
# stagingEmptyDirSizeLimit changes how large the "staging"
|
|||
|
# /var/configs/waterfowl emptyDir is. It only takes effect in StatefulSet
|
|||
|
# configurations of Aggregator, other configurations are unaffected.
|
|||
|
#
|
|||
|
# It should be set to approximately 8x the size of the largest bingen file in
|
|||
|
# object storage. For example, if your largest bingen file is a daily
|
|||
|
# Allocation file with size 300MiB, this value should be set to approximately
|
|||
|
# 2400Mi. In most environments, the default should suffice.
|
|||
|
stagingEmptyDirSizeLimit: 2Gi
|
|||
|
|
|||
|
# this is the number of partitions the datastore is split into for copying
|
|||
|
# the higher this number, the lower the ram usage but the longer it takes for
|
|||
|
# new data to show in the kubecost UI
|
|||
|
# set to 0 for max partitioning (minimum possible ram usage, but the slowest)
|
|||
|
# the default of 25 is sufficient for 95%+ of users. This should only be modified
|
|||
|
# after consulting with Kubecost's support team
|
|||
|
numDBCopyPartitions: 25
|
|||
|
|
|||
|
# How many threads the read database is configured with (i.e. Kubecost API /
|
|||
|
# UI queries). If increasing this value, it is recommended to increase the
|
|||
|
# aggregator's memory requests & limits.
|
|||
|
# default: 1
|
|||
|
dbReadThreads: 1
|
|||
|
|
|||
|
# How many threads the write database is configured with (i.e. ingestion of
|
|||
|
# new data from S3). If increasing this value, it is recommended to increase
|
|||
|
# the aggregator's memory requests & limits.
|
|||
|
# default: 1
|
|||
|
dbWriteThreads: 1
|
|||
|
|
|||
|
# How many threads to use when ingesting Asset/Allocation/CloudCost data
|
|||
|
# from the federated store bucket. In most cases the default is sufficient,
|
|||
|
# but can be increased if trying to backfill historical data.
|
|||
|
# default: 1
|
|||
|
dbConcurrentIngestionCount: 1
|
|||
|
|
|||
|
# Memory limit applied to read database and write database connections. The
|
|||
|
# default of "no limit" is appropriate when first establishing a baseline of
|
|||
|
# resource usage required. It is eventually recommended to set these values
|
|||
|
# such that dbMemoryLimit + dbWriteMemoryLimit < the total memory available
|
|||
|
# to the aggregator pod.
|
|||
|
# default: 0GB is no limit
|
|||
|
dbMemoryLimit: 0GB
|
|||
|
dbWriteMemoryLimit: 0GB
|
|||
|
|
|||
|
# How much data to ingest from the federated store bucket, and how much data
|
|||
|
# to keep in the DB before rolling the data off.
|
|||
|
#
|
|||
|
# Note: If increasing this value to backfill historical data, it will take
|
|||
|
# time to gradually ingest and process those historical ETL files. Consider
|
|||
|
# also increasing the resources available to the aggregator as well as the
|
|||
|
# refresh and concurrency env vars.
|
|||
|
#
|
|||
|
# default: 91
|
|||
|
etlDailyStoreDurationDays: 91
|
|||
|
|
|||
|
# How much hourly data to ingest from the federated store bucket, and how much
|
|||
|
# to keep in the DB before rolling the data off.
|
|||
|
#
|
|||
|
# In high scale environments setting this to `0` can improve performance if hourly
|
|||
|
# resolution is not a requirement.
|
|||
|
#
|
|||
|
# default: 49
|
|||
|
etlHourlyStoreDurationHours: 49
|
|||
|
|
|||
|
# How much container resource usage data to retain in the DB, in terms of days.
|
|||
|
#
|
|||
|
# In high scale environments setting this to `0` can improve performance if hourly
|
|||
|
# resolution is not a requirement.
|
|||
|
#
|
|||
|
# default: 1
|
|||
|
containerResourceUsageRetentionDays: 1
|
|||
|
|
|||
|
# Trim memory on close, only change if advised by Kubecost support.
|
|||
|
dbTrimMemoryOnClose: true
|
|||
|
|
|||
|
persistentConfigsStorage:
|
|||
|
storageClass: "" # default storage class
|
|||
|
storageRequest: 1Gi
|
|||
|
aggregatorDbStorage:
|
|||
|
storageClass: "" # default storage class
|
|||
|
storageRequest: 128Gi
|
|||
|
|
|||
|
resources: {}
|
|||
|
# requests:
|
|||
|
# cpu: 1000m
|
|||
|
# memory: 1Gi
|
|||
|
|
|||
|
readinessProbe:
|
|||
|
enabled: true
|
|||
|
initialDelaySeconds: 10
|
|||
|
periodSeconds: 10
|
|||
|
failureThreshold: 200
|
|||
|
|
|||
|
## Set additional environment variables for the aggregator pod
|
|||
|
# extraEnv:
|
|||
|
# - name: SOME_VARIABLE
|
|||
|
# value: "some_value"
|
|||
|
|
|||
|
## Add a priority class to the aggregator pod
|
|||
|
# priority:
|
|||
|
# enabled: false
|
|||
|
# name: ""
|
|||
|
|
|||
|
## Optional - add extra ports to the aggregator container. For kubecost development purposes only - not recommended for users.
|
|||
|
# extraPorts: []
|
|||
|
# - name: debug
|
|||
|
# port: 40000
|
|||
|
# targetPort: 40000
|
|||
|
# containerPort: 40000
|
|||
|
|
|||
|
## Define a securityContext for the aggregator pod. This will take highest precedence.
|
|||
|
# securityContext: {}
|
|||
|
|
|||
|
## Define the container-level security context for the aggregator pod. This will take highest precedence.
|
|||
|
# containerSecurityContext: {}
|
|||
|
|
|||
|
## Provide a Service Account name for aggregator.
|
|||
|
# serviceAccountName: ""
|
|||
|
|
|||
|
## Define a nodeSelector for the aggregator pod
|
|||
|
# nodeSelector: {}
|
|||
|
|
|||
|
## Define tolerations for the aggregator pod
|
|||
|
# tolerations: []
|
|||
|
|
|||
|
## Define Pod affinity for the aggregator pod
|
|||
|
# affinity: {}
|
|||
|
|
|||
|
## Define extra volumes for the aggregator pod
|
|||
|
# extraVolumes: []
|
|||
|
|
|||
|
## Define extra volumemounts for the aggregator pod
|
|||
|
# extraVolumeMounts: []
|
|||
|
|
|||
|
## Creates a new container/pod to retrieve CloudCost data. By default it uses
|
|||
|
## the same serviceaccount as the cost-analyzer pod. A custom serviceaccount
|
|||
|
## can be specified.
|
|||
|
cloudCost:
|
|||
|
# The cloudCost component of Aggregator depends on
|
|||
|
# kubecostAggregator.deployMethod:
|
|||
|
# kA.dM = "singlepod" -> cloudCost is run as container inside cost-analyzer
|
|||
|
# kA.dM = "statefulset" -> cloudCost is run as single-replica Deployment
|
|||
|
resources: {}
|
|||
|
# requests:
|
|||
|
# cpu: 1000m
|
|||
|
# memory: 1Gi
|
|||
|
# refreshRateHours:
|
|||
|
# queryWindowDays:
|
|||
|
# runWindowDays:
|
|||
|
# serviceAccountName:
|
|||
|
readinessProbe:
|
|||
|
enabled: true
|
|||
|
initialDelaySeconds: 10
|
|||
|
periodSeconds: 10
|
|||
|
failureThreshold: 200
|
|||
|
|
|||
|
## Add a nodeSelector for aggregator cloud costs
|
|||
|
# nodeSelector: {}
|
|||
|
|
|||
|
## Tolerations for the aggregator cloud costs
|
|||
|
# tolerations: []
|
|||
|
|
|||
|
## Affinity for the aggregator cloud costs
|
|||
|
# affinity: {}
|
|||
|
|
|||
|
## ServiceAccount for the aggregator cloud costs
|
|||
|
# serviceAccountName: ""
|
|||
|
|
|||
|
## Define environment variables for cloud cost
|
|||
|
# env: {}
|
|||
|
|
|||
|
## Define extra volumes for the cloud cost pod
|
|||
|
# extraVolumes: []
|
|||
|
|
|||
|
## Define extra volumemounts for the cloud cost pod
|
|||
|
# extraVolumeMounts: []
|
|||
|
|
|||
|
## Configure the Collections service for aggregator.
|
|||
|
# collections:
|
|||
|
# cache:
|
|||
|
# enabled: false
|
|||
|
|
|||
|
# Jaeger is an optional container attached to wherever the Aggregator
|
|||
|
# container is running. It is used for performance investigation. Enable if
|
|||
|
# Kubecost Support asks.
|
|||
|
jaeger:
|
|||
|
enabled: false
|
|||
|
image: jaegertracing/all-in-one
|
|||
|
imageVersion: latest
|
|||
|
# containerSecurityContext:
|
|||
|
|
|||
|
service:
|
|||
|
labels: {}
|
|||
|
|
|||
|
## Kubecost Multi-cluster Diagnostics (beta)
|
|||
|
## A single view into the health of all agent clusters. Each agent cluster sends
|
|||
|
## its diagnostic data to a storage bucket. Future versions may include
|
|||
|
## repairing & alerting from the primary.
|
|||
|
## Ref: https://docs.kubecost.com/install-and-configure/install/multi-cluster/multi-cluster-diagnostics
|
|||
|
##
|
|||
|
diagnostics:
|
|||
|
enabled: true
|
|||
|
|
|||
|
## The primary aggregates all diagnostic data and handles API requests. It's
|
|||
|
## also responsible for deleting diagnostic data (on disk & bucket) beyond
|
|||
|
## retention. When in readonly mode it does not push its own diagnostic data
|
|||
|
## to the bucket.
|
|||
|
primary:
|
|||
|
enabled: false
|
|||
|
retention: "7d"
|
|||
|
readonly: false
|
|||
|
|
|||
|
## How frequently to run & push diagnostics. Defaults to 5 minutes.
|
|||
|
pollingInterval: "300s"
|
|||
|
|
|||
|
## Creates a new Diagnostic file in the bucket for every run.
|
|||
|
keepDiagnosticHistory: false
|
|||
|
|
|||
|
## Pushes the cluster's Kubecost Helm Values to the bucket once upon startup.
|
|||
|
## This may contain sensitive information and is roughly 30kb per cluster.
|
|||
|
collectHelmValues: false
|
|||
|
|
|||
|
## By default, the Multi-cluster Diagnostics service runs within the
|
|||
|
## cost-model container in the cost-analyzer pod. For higher availability, it
|
|||
|
## can be run as a separate deployment.
|
|||
|
deployment:
|
|||
|
enabled: false
|
|||
|
resources:
|
|||
|
requests:
|
|||
|
cpu: "10m"
|
|||
|
memory: "20Mi"
|
|||
|
env: {}
|
|||
|
labels: {}
|
|||
|
securityContext: {}
|
|||
|
containerSecurityContext: {}
|
|||
|
nodeSelector: {}
|
|||
|
tolerations: []
|
|||
|
affinity: {}
|
|||
|
|
|||
|
## Provide a full name override for the diagnostics Deployment.
|
|||
|
# diagnosticsFullnameOverride: ""
|
|||
|
|
|||
|
# Kubecost Cluster Controller for Right Sizing and Cluster Turndown
|
|||
|
clusterController:
|
|||
|
enabled: false
|
|||
|
image:
|
|||
|
repository: gcr.io/kubecost1/cluster-controller
|
|||
|
tag: v0.16.9
|
|||
|
imagePullPolicy: IfNotPresent
|
|||
|
## PriorityClassName
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/pod-priority-preemption/#priorityclass
|
|||
|
priorityClassName: ""
|
|||
|
# Set custom tolerations for the cluster controller.
|
|||
|
tolerations: []
|
|||
|
resources: {}
|
|||
|
actionConfigs:
|
|||
|
# this configures the Kubecost Cluster Turndown action
|
|||
|
# for more details, see documentation at https://github.com/kubecost/cluster-turndown/tree/develop?tab=readme-ov-file#setting-a-turndown-schedule
|
|||
|
clusterTurndown: []
|
|||
|
# - name: my-schedule
|
|||
|
# start: "2024-02-09T00:00:00Z"
|
|||
|
# end: "2024-02-09T12:00:00Z"
|
|||
|
# repeat: daily
|
|||
|
# - name: my-schedule2
|
|||
|
# start: "2024-02-09T00:00:00Z"
|
|||
|
# end: "2024-02-09T01:00:00Z"
|
|||
|
# repeat: weekly
|
|||
|
# this configures the Kubecost Namespace Turndown action
|
|||
|
# for more details, see documentation at https://docs.kubecost.com/using-kubecost/navigating-the-kubecost-ui/savings/savings-actions#namespace-turndown
|
|||
|
namespaceTurndown:
|
|||
|
# - name: my-ns-turndown-action
|
|||
|
# dryRun: false
|
|||
|
# schedule: "0 0 * * *"
|
|||
|
# type: Scheduled
|
|||
|
# targetObjs:
|
|||
|
# - namespace
|
|||
|
# keepPatterns:
|
|||
|
# - ignorednamespace
|
|||
|
# keepLabels:
|
|||
|
# turndown: ignore
|
|||
|
# params:
|
|||
|
# minNamespaceAge: 4h
|
|||
|
# this configures the Kubecost Cluster Sizing action
|
|||
|
# for more details, see documentation at https://docs.kubecost.com/using-kubecost/navigating-the-kubecost-ui/savings/savings-actions#cluster-sizing
|
|||
|
clusterRightsize:
|
|||
|
# startTime: '2024-01-02T15:04:05Z'
|
|||
|
# frequencyMinutes: 1440
|
|||
|
# lastCompleted: ''
|
|||
|
# recommendationParams:
|
|||
|
# window: 48h
|
|||
|
# architecture: ''
|
|||
|
# targetUtilization: 0.8
|
|||
|
# minNodeCount: 1
|
|||
|
# allowSharedCore: false
|
|||
|
# allowCostIncrease: false
|
|||
|
# recommendationType: ''
|
|||
|
# This configures the Kubecost Continuous Request Sizing Action
|
|||
|
#
|
|||
|
# Using this configuration overrides annotation-based configuration of
|
|||
|
# Continuous Request Sizing. Annotation configuration will be ignored while
|
|||
|
# this configuration method is present in the cluster.
|
|||
|
#
|
|||
|
# For more details, see documentation at https://docs.kubecost.com/using-kubecost/navigating-the-kubecost-ui/savings/savings-actions#automated-request-sizing
|
|||
|
containerRightsize:
|
|||
|
# Workloads can be selected by an _exact_ key (namespace, controllerKind,
|
|||
|
# controllerName). This will only match a single controller. The cluster
|
|||
|
# ID is current irrelevant because Cluster Controller can only modify
|
|||
|
# workloads within the cluster it is running in.
|
|||
|
# workloads:
|
|||
|
# - clusterID: cluster-one
|
|||
|
# namespace: my-namespace
|
|||
|
# controllerKind: deployment
|
|||
|
# controllerName: my-controller
|
|||
|
# An alternative to exact key selection is filter selection. The filters
|
|||
|
# are syntactically identical to Kubecost's "v2" filters [1] but only
|
|||
|
# support a small set of filter fields, those being:
|
|||
|
# - namespace
|
|||
|
# - controllerKind
|
|||
|
# - controllerName
|
|||
|
# - label
|
|||
|
# - annotation
|
|||
|
#
|
|||
|
# If multiple filters are listed, they will be ORed together at the top
|
|||
|
# level.
|
|||
|
#
|
|||
|
# See the examples below.
|
|||
|
#
|
|||
|
# [1] https://docs.kubecost.com/apis/filters-api
|
|||
|
# filterConfig:
|
|||
|
# - filter: |
|
|||
|
# namespace:"abc"+controllerKind:"deployment"
|
|||
|
# - filter: |
|
|||
|
# controllerName:"abc123"+controllerKind:"daemonset"
|
|||
|
# - filter: |
|
|||
|
# namespace:"foo"+controllerKind!:"statefulset"
|
|||
|
# - filter: |
|
|||
|
# namespace:"bar","baz"
|
|||
|
# schedule:
|
|||
|
# start: "2024-01-30T15:04:05Z"
|
|||
|
# frequencyMinutes: 5
|
|||
|
# recommendationQueryWindow: "48h"
|
|||
|
# lastModified: ''
|
|||
|
# targetUtilizationCPU: 0.8 # results in a cpu request setting that is 20% higher than the max seen over last 48h
|
|||
|
# targetUtilizationMemory: 0.8 # results in a RAM request setting that is 20% higher than the max seen over last 48h
|
|||
|
|
|||
|
kubescaler:
|
|||
|
# If true, will cause all (supported) workloads to be have their requests
|
|||
|
# automatically right-sized on a regular basis.
|
|||
|
defaultResizeAll: false
|
|||
|
# fqdn: kubecost-cluster-controller.kubecost.svc.cluster.local:9731
|
|||
|
namespaceTurndown:
|
|||
|
rbac:
|
|||
|
enabled: true
|
|||
|
|
|||
|
reporting:
|
|||
|
# Kubecost bug report feature: Logs access/collection limited to .Release.Namespace
|
|||
|
# Ref: http://docs.kubecost.com/bug-report
|
|||
|
logCollection: true
|
|||
|
# Basic frontend analytics
|
|||
|
productAnalytics: true
|
|||
|
|
|||
|
# Report Javascript errors
|
|||
|
errorReporting: true
|
|||
|
valuesReporting: true
|
|||
|
# googleAnalyticsTag allows you to embed your Google Global Site Tag to track usage of Kubecost.
|
|||
|
# googleAnalyticsTag is only included in our Enterprise offering.
|
|||
|
# googleAnalyticsTag: G-XXXXXXXXX
|
|||
|
|
|||
|
serviceMonitor: # the kubecost included prometheus uses scrapeConfigs and does not support service monitors. The following options assume an existing prometheus that supports serviceMonitors.
|
|||
|
enabled: false
|
|||
|
interval: 1m
|
|||
|
scrapeTimeout: 10s
|
|||
|
additionalLabels: {}
|
|||
|
metricRelabelings: []
|
|||
|
relabelings: []
|
|||
|
networkCosts:
|
|||
|
enabled: false
|
|||
|
interval: 1m
|
|||
|
scrapeTimeout: 10s
|
|||
|
additionalLabels: {}
|
|||
|
metricRelabelings: []
|
|||
|
relabelings: []
|
|||
|
aggregatorMetrics:
|
|||
|
enabled: false
|
|||
|
interval: 1m
|
|||
|
scrapeTimeout: 10s
|
|||
|
additionalLabels: {}
|
|||
|
metricRelabelings: []
|
|||
|
relabelings:
|
|||
|
- action: replace
|
|||
|
sourceLabels:
|
|||
|
- __meta_kubernetes_namespace
|
|||
|
targetLabel: namespace
|
|||
|
prometheusRule:
|
|||
|
enabled: false
|
|||
|
additionalLabels: {}
|
|||
|
|
|||
|
supportNFS: false
|
|||
|
# initChownDataImage ensures all Kubecost filepath permissions on PV or local storage are set up correctly.
|
|||
|
initChownDataImage: "busybox" # Supports a fully qualified Docker image, e.g. registry.hub.docker.com/library/busybox:latest
|
|||
|
initChownData:
|
|||
|
resources: {}
|
|||
|
# requests:
|
|||
|
# cpu: "50m"
|
|||
|
# memory: "20Mi"
|
|||
|
|
|||
|
grafana:
|
|||
|
# namespace_datasources: kubecost # override the default namespace here
|
|||
|
# namespace_dashboards: kubecost # override the default namespace here
|
|||
|
rbac:
|
|||
|
create: true
|
|||
|
|
|||
|
serviceAccount:
|
|||
|
create: true
|
|||
|
name: ""
|
|||
|
|
|||
|
## Provide a full name override for the Grafana Deployment.
|
|||
|
# fullnameOverride: ""
|
|||
|
## Provide a name override for the Grafana Deployment.
|
|||
|
# nameOverride: ""
|
|||
|
|
|||
|
## Configure grafana datasources
|
|||
|
## ref: http://docs.grafana.org/administration/provisioning/#datasources
|
|||
|
##
|
|||
|
# datasources:
|
|||
|
# datasources.yaml:
|
|||
|
# apiVersion: 1
|
|||
|
# datasources:
|
|||
|
# - name: prometheus-kubecost
|
|||
|
# type: prometheus
|
|||
|
# url: http://kubecost-prometheus-server.kubecost.svc.cluster.local
|
|||
|
# access: proxy
|
|||
|
# isDefault: false
|
|||
|
# jsonData:
|
|||
|
# httpMethod: POST
|
|||
|
# prometheusType: Prometheus
|
|||
|
# prometheusVersion: 2.35.0
|
|||
|
# timeInterval: 1m
|
|||
|
|
|||
|
## Number of replicas for the Grafana deployment
|
|||
|
replicas: 1
|
|||
|
|
|||
|
## Deployment strategy for the Grafana deployment
|
|||
|
deploymentStrategy: RollingUpdate
|
|||
|
|
|||
|
## Readiness probe for the Grafana deployment
|
|||
|
readinessProbe:
|
|||
|
httpGet:
|
|||
|
path: /api/health
|
|||
|
port: 3000
|
|||
|
|
|||
|
## Liveness probe for the Grafana deployment
|
|||
|
livenessProbe:
|
|||
|
httpGet:
|
|||
|
path: /api/health
|
|||
|
port: 3000
|
|||
|
initialDelaySeconds: 60
|
|||
|
timeoutSeconds: 30
|
|||
|
failureThreshold: 10
|
|||
|
|
|||
|
## Container image settings for the Grafana deployment
|
|||
|
image:
|
|||
|
repository: cgr.dev/chainguard/grafana
|
|||
|
tag: latest
|
|||
|
pullPolicy: IfNotPresent
|
|||
|
|
|||
|
## Optionally specify an array of imagePullSecrets.
|
|||
|
## Secrets must be manually created in the namespace.
|
|||
|
# pullSecrets:
|
|||
|
# - myRegistrKeySecretName
|
|||
|
|
|||
|
## Pod-level security context for the Grafana deployment. Recommended let global defaults take effect.
|
|||
|
securityContext: {}
|
|||
|
# runAsUser: 472
|
|||
|
# fsGroup: 472
|
|||
|
|
|||
|
## PriorityClassName for the Grafana deployment
|
|||
|
priorityClassName: ""
|
|||
|
|
|||
|
## Container image settings for Grafana initContainer used to download dashboards. Will only be used when dashboards are present.
|
|||
|
downloadDashboardsImage:
|
|||
|
repository: curlimages/curl
|
|||
|
tag: latest
|
|||
|
pullPolicy: IfNotPresent
|
|||
|
|
|||
|
## Pod Annotations for the Grafana deployment
|
|||
|
podAnnotations: {}
|
|||
|
|
|||
|
## Deployment annotations for the Grafana deployment
|
|||
|
annotations: {}
|
|||
|
|
|||
|
## Expose the Grafana service to be accessed from outside the cluster (LoadBalancer service).
|
|||
|
## or access it from within the cluster (ClusterIP service). Set the service type and the port to serve it.
|
|||
|
service:
|
|||
|
type: ClusterIP
|
|||
|
port: 80
|
|||
|
annotations: {}
|
|||
|
labels: {}
|
|||
|
|
|||
|
## This template is not needed and is not supported.
|
|||
|
## It is here for backwards compatibility.
|
|||
|
## Kubecost exposes grafana by default with the
|
|||
|
## top level ingress template under /grafana/
|
|||
|
ingress:
|
|||
|
enabled: false
|
|||
|
annotations: {}
|
|||
|
# kubernetes.io/ingress.class: nginx
|
|||
|
# kubernetes.io/tls-acme: "true"
|
|||
|
labels: {}
|
|||
|
path: /
|
|||
|
pathType: Prefix
|
|||
|
hosts:
|
|||
|
- chart-example.local
|
|||
|
tls: []
|
|||
|
# - secretName: chart-example-tls
|
|||
|
# hosts:
|
|||
|
# - chart-example.local
|
|||
|
|
|||
|
## Resource requests and limits for the Grafana deployment
|
|||
|
resources: {}
|
|||
|
# limits:
|
|||
|
# cpu: 100m
|
|||
|
# memory: 128Mi
|
|||
|
# requests:
|
|||
|
# cpu: 100m
|
|||
|
# memory: 128Mi
|
|||
|
|
|||
|
## Node labels for pod assignment of the Grafana deployment
|
|||
|
nodeSelector: {}
|
|||
|
|
|||
|
## Tolerations for pod assignment of the Grafana deployment
|
|||
|
tolerations: []
|
|||
|
|
|||
|
## Affinity for pod assignment of the Grafana deployment
|
|||
|
affinity: {}
|
|||
|
|
|||
|
## Enable persistence using Persistent Volume Claims of the Grafana deployment
|
|||
|
persistence:
|
|||
|
enabled: false
|
|||
|
# storageClassName: default
|
|||
|
# accessModes:
|
|||
|
# - ReadWriteOnce
|
|||
|
# size: 10Gi
|
|||
|
# annotations: {}
|
|||
|
# subPath: ""
|
|||
|
# existingClaim:
|
|||
|
|
|||
|
## Admin user for Grafana
|
|||
|
adminUser: admin
|
|||
|
|
|||
|
## Admin password for Grafana
|
|||
|
adminPassword: strongpassword
|
|||
|
|
|||
|
## Use an alternate scheduler for the Grafana deployment
|
|||
|
# schedulerName:
|
|||
|
|
|||
|
## Extra environment variables that will be passed onto Grafana deployment pods
|
|||
|
env: {}
|
|||
|
|
|||
|
## The name of a secret for Grafana in the same Kubernetes namespace which contain values to be added to the environment
|
|||
|
## This can be useful for auth tokens, etc
|
|||
|
envFromSecret: ""
|
|||
|
|
|||
|
## Additional Grafana server secret mounts
|
|||
|
## Defines additional mounts with secrets. Secrets must be manually created in the namespace.
|
|||
|
extraSecretMounts: []
|
|||
|
# - name: secret-files
|
|||
|
# mountPath: /etc/secrets
|
|||
|
# secretName: grafana-secret-files
|
|||
|
# readOnly: true
|
|||
|
|
|||
|
## List of Grafana plugins
|
|||
|
plugins: []
|
|||
|
# - digrich-bubblechart-panel
|
|||
|
# - grafana-clock-panel
|
|||
|
|
|||
|
## Grafana dashboard providers
|
|||
|
## ref: http://docs.grafana.org/administration/provisioning/#dashboards
|
|||
|
##
|
|||
|
## `path` must be /var/lib/grafana/dashboards/<provider_name>
|
|||
|
##
|
|||
|
dashboardProviders: {}
|
|||
|
# dashboardproviders.yaml:
|
|||
|
# apiVersion: 1
|
|||
|
# providers:
|
|||
|
# - name: 'default'
|
|||
|
# orgId: 1
|
|||
|
# folder: ''
|
|||
|
# type: file
|
|||
|
# disableDeletion: false
|
|||
|
# editable: true
|
|||
|
# options:
|
|||
|
# path: /var/lib/grafana/dashboards/default
|
|||
|
|
|||
|
## Configure Grafana dashboard to import
|
|||
|
## NOTE: To use dashboards you must also enable/configure dashboardProviders
|
|||
|
## ref: https://grafana.com/dashboards
|
|||
|
##
|
|||
|
## dashboards per provider, use provider name as key.
|
|||
|
##
|
|||
|
dashboards: {}
|
|||
|
# default:
|
|||
|
# prometheus-stats:
|
|||
|
# gnetId: 3662
|
|||
|
# revision: 2
|
|||
|
# datasource: Prometheus
|
|||
|
|
|||
|
## Reference to external Grafana ConfigMap per provider. Use provider name as key and ConfiMap name as value.
|
|||
|
## A provider dashboards must be defined either by external ConfigMaps or in values.yaml, not in both.
|
|||
|
## ConfigMap data example:
|
|||
|
##
|
|||
|
## data:
|
|||
|
## example-dashboard.json: |
|
|||
|
## RAW_JSON
|
|||
|
##
|
|||
|
dashboardsConfigMaps: {}
|
|||
|
# default: ""
|
|||
|
|
|||
|
## LDAP Authentication for Grafana can be enabled with the following values on grafana.ini
|
|||
|
## NOTE: Grafana will fail to start if the value for ldap.toml is invalid
|
|||
|
# auth.ldap:
|
|||
|
# enabled: true
|
|||
|
# allow_sign_up: true
|
|||
|
# config_file: /etc/grafana/ldap.toml
|
|||
|
|
|||
|
## Grafana's LDAP configuration
|
|||
|
## Templated by the template in _helpers.tpl
|
|||
|
## NOTE: To enable the grafana.ini must be configured with auth.ldap.enabled
|
|||
|
## ref: http://docs.grafana.org/installation/configuration/#auth-ldap
|
|||
|
## ref: http://docs.grafana.org/installation/ldap/#configuration
|
|||
|
ldap:
|
|||
|
# `existingSecret` is a reference to an existing secret containing the ldap configuration
|
|||
|
# for Grafana in a key `ldap-toml`.
|
|||
|
existingSecret: ""
|
|||
|
# `config` is the content of `ldap.toml` that will be stored in the created secret
|
|||
|
config: ""
|
|||
|
# config: |-
|
|||
|
# verbose_logging = true
|
|||
|
|
|||
|
# [[servers]]
|
|||
|
# host = "my-ldap-server"
|
|||
|
# port = 636
|
|||
|
# use_ssl = true
|
|||
|
# start_tls = false
|
|||
|
# ssl_skip_verify = false
|
|||
|
# bind_dn = "uid=%s,ou=users,dc=myorg,dc=com"
|
|||
|
|
|||
|
## Grafana's SMTP configuration
|
|||
|
## NOTE: To enable, grafana.ini must be configured with smtp.enabled
|
|||
|
## ref: http://docs.grafana.org/installation/configuration/#smtp
|
|||
|
smtp:
|
|||
|
# `existingSecret` is a reference to an existing secret containing the smtp configuration
|
|||
|
# for Grafana in keys `user` and `password`.
|
|||
|
existingSecret: ""
|
|||
|
|
|||
|
## Grafana sidecars that collect the configmaps with specified label and stores the included files them into the respective folders
|
|||
|
## Requires at least Grafana 5 to work and can't be used together with parameters dashboardProviders, datasources and dashboards
|
|||
|
sidecar:
|
|||
|
image:
|
|||
|
repository: cgr.dev/chainguard/k8s-sidecar
|
|||
|
tag: latest
|
|||
|
pullPolicy: IfNotPresent
|
|||
|
resources: {}
|
|||
|
dashboards:
|
|||
|
enabled: true
|
|||
|
# label that the configmaps with dashboards are marked with
|
|||
|
label: grafana_dashboard
|
|||
|
labelValue: "1"
|
|||
|
# set sidecar ERROR_THROTTLE_SLEEP env var from default 5s to 0s -> fixes https://github.com/kubecost/cost-analyzer-helm-chart/issues/877
|
|||
|
annotations: {}
|
|||
|
error_throttle_sleep: 0
|
|||
|
folder: /tmp/dashboards
|
|||
|
datasources:
|
|||
|
# dataSourceFilename: foo.yml # If you need to change the name of the datasource file
|
|||
|
enabled: false
|
|||
|
error_throttle_sleep: 0
|
|||
|
# label that the configmaps with datasources are marked with
|
|||
|
label: grafana_datasource
|
|||
|
|
|||
|
## Grafana's primary configuration
|
|||
|
## NOTE: values in map will be converted to ini format
|
|||
|
## ref: http://docs.grafana.org/installation/configuration/
|
|||
|
##
|
|||
|
## For grafana to be accessible, add the path to root_url. For example, if you run kubecost at www.foo.com:9090/kubecost
|
|||
|
## set root_url to "%(protocol)s://%(domain)s:%(http_port)s/kubecost/grafana". No change is necessary here if kubecost runs at a root URL
|
|||
|
grafana.ini:
|
|||
|
server:
|
|||
|
serve_from_sub_path: false # Set to false on Grafana v10+
|
|||
|
root_url: "%(protocol)s://%(domain)s:%(http_port)s/grafana"
|
|||
|
paths:
|
|||
|
data: /var/lib/grafana/data
|
|||
|
logs: /var/log/grafana
|
|||
|
plugins: /var/lib/grafana/plugins
|
|||
|
provisioning: /etc/grafana/provisioning
|
|||
|
analytics:
|
|||
|
check_for_updates: true
|
|||
|
log:
|
|||
|
mode: console
|
|||
|
grafana_net:
|
|||
|
url: https://grafana.net
|
|||
|
auth.anonymous:
|
|||
|
enabled: true
|
|||
|
org_role: Editor
|
|||
|
org_name: Main Org.
|
|||
|
|
|||
|
serviceAccount:
|
|||
|
create: true # Set this to false if you're bringing your own service account.
|
|||
|
annotations: {}
|
|||
|
# name: kc-test
|
|||
|
|
|||
|
awsstore:
|
|||
|
useAwsStore: false
|
|||
|
imageNameAndVersion: gcr.io/kubecost1/awsstore:latest # Name and version of the container image for AWSStore.
|
|||
|
createServiceAccount: false
|
|||
|
## PriorityClassName
|
|||
|
## Ref: https://kubernetes.io/docs/concepts/configuration/pod-priority-preemption/#priorityclass
|
|||
|
priorityClassName: ""
|
|||
|
# Use a custom nodeSelector for AWSStore.
|
|||
|
nodeSelector: {}
|
|||
|
# kubernetes.io/arch: amd64
|
|||
|
## Annotations for the AWSStore ServiceAccount.
|
|||
|
annotations: {}
|
|||
|
|
|||
|
## Federated ETL Architecture
|
|||
|
## Ref: https://docs.kubecost.com/install-and-configure/install/multi-cluster/federated-etl
|
|||
|
##
|
|||
|
federatedETL:
|
|||
|
|
|||
|
## If true, installs the minimal set of components required for a Federated ETL cluster.
|
|||
|
agentOnly: false
|
|||
|
|
|||
|
## If true, push ETL data to the federated storage bucket
|
|||
|
federatedCluster: false
|
|||
|
|
|||
|
## If true, this cluster will be able to read from the federated-store but will
|
|||
|
## not write to it. This is useful in situations when you want to deploy a
|
|||
|
## primary cluster, but don't want the primary cluster's ETL data to be
|
|||
|
## pushed to the bucket
|
|||
|
readOnlyPrimary: false
|
|||
|
|
|||
|
## If true, changes the dir of S3 backup to the Federated combined store.
|
|||
|
## Commonly used when transitioning from Thanos to Federated ETL architecture.
|
|||
|
redirectS3Backup: false
|
|||
|
|
|||
|
## If true, will query metrics from a central PromQL DB (e.g. Amazon Managed
|
|||
|
## Prometheus)
|
|||
|
useMultiClusterDB: false
|
|||
|
|
|||
|
## Kubecost Admission Controller (beta feature)
|
|||
|
## To use this feature, ensure you have run the `create-admission-controller.sh`
|
|||
|
## script. This generates a k8s secret with TLS keys/certificats and a
|
|||
|
## corresponding CA bundle.
|
|||
|
##
|
|||
|
kubecostAdmissionController:
|
|||
|
enabled: false
|
|||
|
secretName: webhook-server-tls
|
|||
|
caBundle: ${CA_BUNDLE}
|
|||
|
|
|||
|
# Enables or disables the Cost Event Audit pipeline, which tracks recent changes at cluster level
|
|||
|
# and provides an estimated cost impact via the Kubecost Predict API.
|
|||
|
#
|
|||
|
# It is disabled by default to avoid problems in high-scale environments.
|
|||
|
costEventsAudit:
|
|||
|
enabled: false
|
|||
|
|
|||
|
## Disable updates to kubecost from the frontend UI and via POST request
|
|||
|
## This feature is considered beta, entrprise users should use teams:
|
|||
|
## https://docs.kubecost.com/using-kubecost/navigating-the-kubecost-ui/teams
|
|||
|
# readonly: false
|
|||
|
|
|||
|
# # These configs can also be set from the Settings page in the Kubecost product
|
|||
|
# # UI. Values in this block override config changes in the Settings UI on pod
|
|||
|
# # restart
|
|||
|
# kubecostProductConfigs:
|
|||
|
# # An optional list of cluster definitions that can be added for frontend
|
|||
|
# # access. The local cluster is *always* included by default, so this list is
|
|||
|
# # for non-local clusters.
|
|||
|
# clusters:
|
|||
|
# - name: "Cluster A"
|
|||
|
# address: http://cluster-a.kubecost.com:9090
|
|||
|
# # Optional authentication credentials - only basic auth is currently supported.
|
|||
|
# auth:
|
|||
|
# type: basic
|
|||
|
# # Secret name should be a secret formatted based on: https://github.com/kubecost/docs/blob/main/ingress-examples.md
|
|||
|
# secretName: cluster-a-auth
|
|||
|
# # Or pass auth directly as base64 encoded user:pass
|
|||
|
# data: YWRtaW46YWRtaW4=
|
|||
|
# # Or user and pass directly
|
|||
|
# user: admin
|
|||
|
# pass: admin
|
|||
|
# - name: "Cluster B"
|
|||
|
# address: http://cluster-b.kubecost.com:9090
|
|||
|
# # Enabling customPricesEnabled and defaultModelPricing instructs Kubecost to
|
|||
|
# # use these custom monthly resource prices when reporting node costs. Note,
|
|||
|
# # that the below configuration is for the monthly cost of the resource.
|
|||
|
# # Kubecost considers there to be 730 hours in a month. Also note, that these
|
|||
|
# # configurations will have no effect on metrics emitted such as
|
|||
|
# # `node_ram_hourly_cost` or `node_cpu_hourly_cost`.
|
|||
|
# # Ref: https://docs.kubecost.com/install-and-configure/install/provider-installations/air-gapped
|
|||
|
# customPricesEnabled: false
|
|||
|
# defaultModelPricing:
|
|||
|
# enabled: true
|
|||
|
# CPU: "28.0"
|
|||
|
# spotCPU: "4.86"
|
|||
|
# RAM: "3.09"
|
|||
|
# spotRAM: "0.65"
|
|||
|
# GPU: "693.50"
|
|||
|
# spotGPU: "225.0"
|
|||
|
# storage: "0.04"
|
|||
|
# zoneNetworkEgress: "0.01"
|
|||
|
# regionNetworkEgress: "0.01"
|
|||
|
# internetNetworkEgress: "0.12"
|
|||
|
# # The cluster profile represents a predefined set of parameters to use when calculating savings.
|
|||
|
# # Possible values are: [ development, production, high-availability ]
|
|||
|
# clusterProfile: production
|
|||
|
# spotLabel: lifecycle
|
|||
|
# spotLabelValue: Ec2Spot
|
|||
|
# gpuLabel: gpu
|
|||
|
# gpuLabelValue: true
|
|||
|
# alibabaServiceKeyName: ""
|
|||
|
# alibabaServiceKeyPassword: ""
|
|||
|
# awsServiceKeyName: ACCESSKEYID
|
|||
|
# awsServiceKeyPassword: fakepassword # Only use if your values.yaml are stored encrypted. Otherwise provide an existing secret via serviceKeySecretName
|
|||
|
# awsSpotDataRegion: us-east-1
|
|||
|
# awsSpotDataBucket: spot-data-feed-s3-bucket
|
|||
|
# awsSpotDataPrefix: dev
|
|||
|
# athenaProjectID: "530337586277" # The AWS AccountID where the Athena CUR is. Generally your masterpayer account
|
|||
|
# athenaBucketName: "s3://aws-athena-query-results-530337586277-us-east-1"
|
|||
|
# athenaRegion: us-east-1
|
|||
|
# athenaDatabase: athenacurcfn_athena_test1
|
|||
|
# athenaTable: "athena_test1"
|
|||
|
# athenaWorkgroup: "primary" # The default workgroup in AWS is 'primary'
|
|||
|
# masterPayerARN: ""
|
|||
|
# projectID: "123456789" # Also known as AccountID on AWS -- the current account/project that this instance of Kubecost is deployed on.
|
|||
|
# gcpSecretName: gcp-secret # Name of a secret representing the gcp service key
|
|||
|
# gcpSecretKeyName: compute-viewer-kubecost-key.json # Name of the secret's key containing the gcp service key
|
|||
|
# bigQueryBillingDataDataset: billing_data.gcp_billing_export_v1_01AC9F_74CF1D_5565A2
|
|||
|
# labelMappingConfigs: # names of k8s labels or annotations used to designate different allocation concepts
|
|||
|
# enabled: true
|
|||
|
# owner_label: "owner"
|
|||
|
# team_label: "team"
|
|||
|
# department_label: "dept"
|
|||
|
# product_label: "product"
|
|||
|
# environment_label: "env"
|
|||
|
# namespace_external_label: "kubernetes_namespace" # external labels/tags are used to map external cloud costs to kubernetes concepts
|
|||
|
# cluster_external_label: "kubernetes_cluster"
|
|||
|
# controller_external_label: "kubernetes_controller"
|
|||
|
# product_external_label: "kubernetes_label_app"
|
|||
|
# service_external_label: "kubernetes_service"
|
|||
|
# deployment_external_label: "kubernetes_deployment"
|
|||
|
# owner_external_label: "kubernetes_label_owner"
|
|||
|
# team_external_label: "kubernetes_label_team"
|
|||
|
# environment_external_label: "kubernetes_label_env"
|
|||
|
# department_external_label: "kubernetes_label_department"
|
|||
|
# statefulset_external_label: "kubernetes_statefulset"
|
|||
|
# daemonset_external_label: "kubernetes_daemonset"
|
|||
|
# pod_external_label: "kubernetes_pod"
|
|||
|
# grafanaURL: ""
|
|||
|
# # Provide a mapping from Account ID to a readable Account Name in a key/value object. Provide Account IDs as they are displayed in CloudCost
|
|||
|
# # as the 'key' and the Account Name associated with it as the 'value'
|
|||
|
# cloudAccountMapping:
|
|||
|
# EXAMPLE_ACCOUNT_ID: EXAMPLE_ACCOUNT_NAME
|
|||
|
# clusterName: "" # clusterName is the default context name in settings.
|
|||
|
# clusterAccountID: "" # Manually set Account property for assets
|
|||
|
# currencyCode: "USD" # official support for USD, AUD, BRL, CAD, CHF, CNY, DKK, EUR, GBP, IDR, INR, JPY, NOK, PLN, SEK
|
|||
|
# azureBillingRegion: US # Represents 2-letter region code, e.g. West Europe = NL, Canada = CA. ref: https://en.wikipedia.org/wiki/List_of_ISO_3166_country_codes
|
|||
|
# azureSubscriptionID: 0bd50fdf-c923-4e1e-850c-196dd3dcc5d3
|
|||
|
# azureClientID: f2ef6f7d-71fb-47c8-b766-8d63a19db017
|
|||
|
# azureTenantID: 72faf3ff-7a3f-4597-b0d9-7b0b201bb23a
|
|||
|
# azureClientPassword: fake key # Only use if your values.yaml are stored encrypted. Otherwise provide an existing secret via serviceKeySecretName
|
|||
|
# azureOfferDurableID: "MS-AZR-0003p"
|
|||
|
# discount: "" # percentage discount applied to compute
|
|||
|
# negotiatedDiscount: "" # custom negotiated cloud provider discount
|
|||
|
# standardDiscount: "" # custom negotiated cloud provider discount, applied to all incoming asset compute costs in a federated environment. Overrides negotiatedDiscount on any cluster in the federated environment.
|
|||
|
# defaultIdle: false
|
|||
|
# serviceKeySecretName: "" # Use an existing AWS or Azure secret with format as in aws-service-key-secret.yaml or azure-service-key-secret.yaml. Leave blank if using createServiceKeySecret
|
|||
|
# createServiceKeySecret: true # Creates a secret representing your cloud service key based on data in values.yaml. If you are storing unencrypted values, add a secret manually
|
|||
|
# sharedNamespaces: "" # namespaces with shared workloads, example value: "kube-system\,ingress-nginx\,kubecost\,monitoring"
|
|||
|
# sharedOverhead: "" # value representing a fixed external cost per month to be distributed among aggregations.
|
|||
|
# shareTenancyCosts: true # enable or disable sharing costs such as cluster management fees (defaults to "true" on Settings page)
|
|||
|
# metricsConfigs: # configuration for metrics emitted by Kubecost
|
|||
|
# disabledMetrics: [] # list of metrics that Kubecost will not emit. Note that disabling metrics can lead to unexpected behavior in the cost-model.
|
|||
|
# productKey: # Apply enterprise product license
|
|||
|
# enabled: false
|
|||
|
# key: ""
|
|||
|
# secretname: productkeysecret # Reference an existing k8s secret created from a file named productkey.json of format { "key": "enterprise-key-here" }. If the secretname is specified, a configmap with the key will not be created.
|
|||
|
# mountPath: "/some/custom/path/productkey.json" # (use instead of secretname) Declare the path at which the product key file is mounted (eg. by a secrets provisioner). The file must be of format { "key": "enterprise-key-here" }.
|
|||
|
# # The following block enables the use of a custom SMTP server which overrides Kubecost's built-in, external SMTP server for alerts and reports
|
|||
|
# smtp:
|
|||
|
# config: |
|
|||
|
# {
|
|||
|
# "sender_email": "",
|
|||
|
# "host": "",
|
|||
|
# "port": 587,
|
|||
|
# "authentication": true,
|
|||
|
# "username": "",
|
|||
|
# "password": "",
|
|||
|
# "secure": true
|
|||
|
# }
|
|||
|
# secretname: smtpconfigsecret # Reference an existing k8s secret created from a file named smtp.json of format specified by config above. If the secretname is specified, a configmap with the key will not be created.
|
|||
|
# mountPath: "/some/custom/path/smtp.json" # (use instead of secretname) Declare the path at which the SMTP config file is mounted (eg. by a secrets provisioner). The file must be of format specified by config above.
|
|||
|
# carbonEstimates: false # Enables Kubecost beta carbon estimation endpoints /assets/carbon and /allocations/carbon
|
|||
|
# The below options to hide UI elements are only supported in Enterprise
|
|||
|
# hideDiagnostics: false # useful if the primary is not monitored. Supported in limited environments.
|
|||
|
# hideOrphanedResources: false # OrphanedResources works on the primary-cluster's cloud-provider only.
|
|||
|
# hideKubecostActions: false
|
|||
|
# hideReservedInstances: false
|
|||
|
# hideSpotCommander: false
|
|||
|
# hideUnclaimedVolumes: false
|
|||
|
# hideCloudIntegrationsUI: false
|
|||
|
# hideBellIcon: false
|
|||
|
# hideTeams: false
|
|||
|
# savingsRecommendationsAllowLists: # Define select list of instance types to be evaluated in computing Savings Recommendations
|
|||
|
# AWS: []
|
|||
|
# GCP: []
|
|||
|
# Azure: []
|
|||
|
|
|||
|
## Specify an existing Kubernetes Secret holding the cloud integration information. This Secret must contain
|
|||
|
## a key with name `cloud-integration.json` and the contents must be in a specific format. It is expected
|
|||
|
## to exist in the release Namespace. This is mutually exclusive with cloudIntegrationJSON where only one must be defined.
|
|||
|
# cloudIntegrationSecret: "cloud-integration"
|
|||
|
|
|||
|
## Specify the cloud integration information in JSON form if pointing to an existing Secret is not desired or you'd rather
|
|||
|
## define the cloud integration information directly in the values file. This will result in a new Secret being created
|
|||
|
## named `cloud-integration` in the release Namespace. It is mutually exclusive with the cloudIntegrationSecret where only one must be defined.
|
|||
|
# cloudIntegrationJSON: |-
|
|||
|
# {
|
|||
|
# "aws": [
|
|||
|
# {
|
|||
|
# "athenaBucketName": "s3://AWS_cloud_integration_athenaBucketName",
|
|||
|
# "athenaRegion": "AWS_cloud_integration_athenaRegion",
|
|||
|
# "athenaDatabase": "AWS_cloud_integration_athenaDatabase",
|
|||
|
# "athenaTable": "AWS_cloud_integration_athenaBucketName",
|
|||
|
# "projectID": "AWS_cloud_integration_athena_projectID",
|
|||
|
# "serviceKeyName": "AWS_cloud_integration_athena_serviceKeyName",
|
|||
|
# "serviceKeySecret": "AWS_cloud_integration_athena_serviceKeySecret"
|
|||
|
# }
|
|||
|
# ],
|
|||
|
# "azure": [
|
|||
|
# {
|
|||
|
# "azureSubscriptionID": "my-subscription-id",
|
|||
|
# "azureStorageAccount": "my-storage-account",
|
|||
|
# "azureStorageAccessKey": "my-storage-access-key",
|
|||
|
# "azureStorageContainer": "my-storage-container"
|
|||
|
# }
|
|||
|
# ],
|
|||
|
# "gcp": [
|
|||
|
# {
|
|||
|
# "projectID": "my-project-id",
|
|||
|
# "billingDataDataset": "detailedbilling.my-billing-dataset",
|
|||
|
# "key": {
|
|||
|
# "type": "service_account",
|
|||
|
# "project_id": "my-project-id",
|
|||
|
# "private_key_id": "my-private-key-id",
|
|||
|
# "private_key": "my-pem-encoded-private-key",
|
|||
|
# "client_email": "my-service-account-name@my-project-id.iam.gserviceaccount.com",
|
|||
|
# "client_id": "my-client-id",
|
|||
|
# "auth_uri": "auth-uri",
|
|||
|
# "token_uri": "token-uri",
|
|||
|
# "auth_provider_x509_cert_url": "my-x509-provider-cert",
|
|||
|
# "client_x509_cert_url": "my-x509-cert-url"
|
|||
|
# }
|
|||
|
# }
|
|||
|
# ]
|
|||
|
# }
|
|||
|
|
|||
|
# ingestPodUID: false # Enables using UIDs to uniquely ID pods. This requires either Kubecost's replicated KSM metrics, or KSM v2.1.0+. This may impact performance, and changes the default cost-model allocation behavior.
|
|||
|
# regionOverrides: "region1,region2,region3" # list of regions which will override default costmodel provider regions
|
|||
|
|
|||
|
# Explicit names of various ConfigMaps to use. If not set, a default will apply.
|
|||
|
# pricingConfigmapName: ""
|
|||
|
# productConfigmapName: ""
|
|||
|
# smtpConfigmapName: ""
|
|||
|
|
|||
|
# -- Array of extra K8s manifests to deploy
|
|||
|
## Note: Supports use of custom Helm templates
|
|||
|
extraObjects: []
|
|||
|
# Cloud Billing Integration:
|
|||
|
# - apiVersion: v1
|
|||
|
# kind: Secret
|
|||
|
# metadata:
|
|||
|
# name: cloud-integration
|
|||
|
# namespace: kubecost
|
|||
|
# type: Opaque
|
|||
|
# data:
|
|||
|
# cloud-integration.json: BASE64_SECRET
|
|||
|
# Istio:
|
|||
|
# - apiVersion: networking.istio.io/v1alpha3
|
|||
|
# kind: VirtualService
|
|||
|
# metadata:
|
|||
|
# name: my-virtualservice
|
|||
|
# spec:
|
|||
|
# hosts:
|
|||
|
# - kubecost.myorg.com
|
|||
|
# gateways:
|
|||
|
# - my-gateway
|
|||
|
# http:
|
|||
|
# - route:
|
|||
|
# - destination:
|
|||
|
# host: kubecost.kubecost.svc.cluster.local
|
|||
|
# port:
|
|||
|
# number: 80
|