/* Copyright 2018 The Knative Authors Licensed under the Apache License, Version 2.0 (the "License"); you may not use this file except in compliance with the License. You may obtain a copy of the License at http://www.apache.org/licenses/LICENSE-2.0 Unless required by applicable law or agreed to in writing, software distributed under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. See the License for the specific language governing permissions and limitations under the License. */ package metrics import ( "context" "encoding/json" "errors" "fmt" "os" "path" "strconv" "strings" "time" "go.opencensus.io/stats" corev1 "k8s.io/api/core/v1" "knative.dev/pkg/metrics/metricskey" ) // metricsBackend specifies the backend to use for metrics type metricsBackend string const ( // BackendDestinationKey points to the config map entry key for metrics backend destination. BackendDestinationKey = "metrics.backend-destination" // DomainEnv points to the metrics domain env var. DomainEnv = "METRICS_DOMAIN" // The following keys are used to configure metrics reporting. // See https://github.com/knative/serving/blob/master/config/config-observability.yaml // for details. allowStackdriverCustomMetricsKey = "metrics.allow-stackdriver-custom-metrics" collectorAddressKey = "metrics.opencensus-address" collectorSecureKey = "metrics.opencensus-require-tls" reportingPeriodKey = "metrics.reporting-period-seconds" // Stackdriver client configuration keys stackdriverClusterNameKey = "metrics.stackdriver-cluster-name" stackdriverCustomMetricSubDomainKey = "metrics.stackdriver-custom-metrics-subdomain" stackdriverGCPLocationKey = "metrics.stackdriver-gcp-location" stackdriverProjectIDKey = "metrics.stackdriver-project-id" stackdriverUseSecretKey = "metrics.stackdriver-use-secret" defaultBackendEnvName = "DEFAULT_METRICS_BACKEND" defaultPrometheusPort = 9090 maxPrometheusPort = 65535 minPrometheusPort = 1024 prometheusPortEnvName = "METRICS_PROMETHEUS_PORT" ) // Metrics backend "enum". const ( // stackdriver is used for Stackdriver backend stackdriver metricsBackend = "stackdriver" // prometheus is used for Prometheus backend prometheus metricsBackend = "prometheus" // openCensus is used to export to the OpenCensus Agent / Collector, // which can send to many other services. openCensus metricsBackend = "opencensus" // none is used to export, well, nothing. none metricsBackend = "none" ) type metricsConfig struct { // The metrics domain. e.g. "serving.knative.dev" or "build.knative.dev". domain string // The component that emits the metrics. e.g. "activator", "autoscaler". component string // The metrics backend destination. backendDestination metricsBackend // reportingPeriod specifies the interval between reporting aggregated views. // If duration is less than or equal to zero, it enables the default behavior. reportingPeriod time.Duration // recorder provides a hook for performing custom transformations before // writing the metrics to the stats.RecordWithOptions interface. recorder func(context.Context, []stats.Measurement, ...stats.Options) error // secret contains credentials for an exporter to use for authentication. secret *corev1.Secret // ---- OpenCensus specific below ---- // collectorAddress is the address of the collector, if not `localhost:55678` collectorAddress string // Require mutual TLS. Defaults to "false" because mutual TLS is hard to set up. requireSecure bool // ---- Prometheus specific below ---- // prometheusPort is the port where metrics are exposed in Prometheus // format. It defaults to 9090. prometheusPort int // ---- Stackdriver specific below ---- // True if backendDestination equals to "stackdriver". Store this in a variable // to reduce string comparison operations. isStackdriverBackend bool // stackdriverMetricTypePrefix is the metric domain joins component, e.g. // "knative.dev/serving/activator". Store this in a variable to reduce string // join operations. stackdriverMetricTypePrefix string // stackdriverCustomMetricTypePrefix is "custom.googleapis.com" joined with the subdomain and component. // E.g., "custom.googleapis.com//". // Store this in a variable to reduce string join operations. stackdriverCustomMetricTypePrefix string // stackdriverClientConfig is the metadata to configure the metrics exporter's Stackdriver client. stackdriverClientConfig StackdriverClientConfig } // StackdriverClientConfig encapsulates the metadata required to configure a Stackdriver client. type StackdriverClientConfig struct { // ProjectID is the stackdriver project ID to which data is uploaded. // This is not necessarily the GCP project ID where the Kubernetes cluster is hosted. // Required when the Kubernetes cluster is not hosted on GCE. ProjectID string // GCPLocation is the GCP region or zone to which data is uploaded. // This is not necessarily the GCP location where the Kubernetes cluster is hosted. // Required when the Kubernetes cluster is not hosted on GCE. GCPLocation string // ClusterName is the cluster name with which the data will be associated in Stackdriver. // Required when the Kubernetes cluster is not hosted on GCE. ClusterName string // UseSecret is whether the credentials stored in a Kubernetes Secret should be used to // authenticate with Stackdriver. The Secret name and namespace can be specified by calling // metrics.SetStackdriverSecretLocation. // If UseSecret is false, Google Application Default Credentials // will be used (https://cloud.google.com/docs/authentication/production). UseSecret bool } // NewStackdriverClientConfigFromMap creates a stackdriverClientConfig from the given map func NewStackdriverClientConfigFromMap(config map[string]string) *StackdriverClientConfig { return &StackdriverClientConfig{ ProjectID: config[stackdriverProjectIDKey], GCPLocation: config[stackdriverGCPLocationKey], ClusterName: config[stackdriverClusterNameKey], UseSecret: strings.EqualFold(config[stackdriverUseSecretKey], "true"), } } // record applies the `ros` Options to each measurement in `mss` and then records the resulting // measurements in the metricsConfig's designated backend. func (mc *metricsConfig) record(ctx context.Context, mss []stats.Measurement, ros ...stats.Options) error { if mc == nil || mc.backendDestination == none { // Don't record data points if the metric config is not initialized yet or if // the defined backend is "none" explicitly. return nil } if mc.recorder == nil { opt, err := optionForResource(metricskey.GetResource(ctx)) if err != nil { return err } ros = append(ros, opt) return stats.RecordWithOptions(ctx, append(ros, stats.WithMeasurements(mss...))...) } return mc.recorder(ctx, mss, ros...) } func createMetricsConfig(ctx context.Context, ops ExporterOptions) (*metricsConfig, error) { var mc metricsConfig if ops.Domain == "" { return nil, errors.New("metrics domain cannot be empty") } mc.domain = ops.Domain if ops.Component == "" { return nil, errors.New("metrics component name cannot be empty") } mc.component = ops.Component if ops.ConfigMap == nil { return nil, errors.New("metrics config map cannot be empty") } m := ops.ConfigMap // Read backend setting from environment variable first backend := os.Getenv(defaultBackendEnvName) if backend == "" { // Use Prometheus if DEFAULT_METRICS_BACKEND does not exist or is empty backend = string(prometheus) } // Override backend if it is set in the config map. if backendFromConfig, ok := m[BackendDestinationKey]; ok { backend = backendFromConfig } lb := metricsBackend(strings.ToLower(backend)) switch lb { case stackdriver, prometheus, openCensus: mc.backendDestination = lb default: return nil, fmt.Errorf("unsupported metrics backend value %q", backend) } if mc.backendDestination == openCensus { mc.collectorAddress = ops.ConfigMap[collectorAddressKey] if isSecure := ops.ConfigMap[collectorSecureKey]; isSecure != "" { var err error if mc.requireSecure, err = strconv.ParseBool(isSecure); err != nil { return nil, fmt.Errorf("invalid %s value %q", collectorSecureKey, isSecure) } if mc.requireSecure { mc.secret, err = getOpenCensusSecret(ops.Component, ops.Secrets) if err != nil { return nil, err } } } } if mc.backendDestination == prometheus { pp := ops.PrometheusPort if pp == 0 { var err error pp, err = prometheusPort() if err != nil { return nil, fmt.Errorf("failed to determine Prometheus port: %w", err) } } if pp < minPrometheusPort || pp > maxPrometheusPort { return nil, fmt.Errorf("invalid port %d, should be between %d and %d", pp, minPrometheusPort, maxPrometheusPort) } mc.prometheusPort = pp } // If stackdriverClientConfig is not provided for stackdriver backend destination, OpenCensus will try to // use the application default credentials. If that is not available, Opencensus would fail to create the // metrics exporter. if mc.backendDestination == stackdriver { scc := NewStackdriverClientConfigFromMap(m) mc.stackdriverClientConfig = *scc mc.isStackdriverBackend = true var allowCustomMetrics bool var err error mc.stackdriverMetricTypePrefix = path.Join(mc.domain, mc.component) customMetricsSubDomain := m[stackdriverCustomMetricSubDomainKey] if customMetricsSubDomain == "" { customMetricsSubDomain = defaultCustomMetricSubDomain } mc.stackdriverCustomMetricTypePrefix = path.Join(customMetricTypePrefix, customMetricsSubDomain, mc.component) if ascmStr := m[allowStackdriverCustomMetricsKey]; ascmStr != "" { allowCustomMetrics, err = strconv.ParseBool(ascmStr) if err != nil { return nil, fmt.Errorf("invalid %s value %q", allowStackdriverCustomMetricsKey, ascmStr) } } mc.recorder = sdCustomMetricsRecorder(mc, allowCustomMetrics) if scc.UseSecret { secret, err := getStackdriverSecret(ctx, ops.Secrets) if err != nil { return nil, err } mc.secret = secret } } // If reporting period is specified, use the value from the configuration. // If not, set a default value based on the selected backend. // Each exporter makes different promises about what the lowest supported // reporting period is. For Stackdriver, this value is 1 minute. // For Prometheus, we will use a lower value since the exporter doesn't // push anything but just responds to pull requests, and shorter durations // do not really hurt the performance and we rely on the scraping configuration. if repStr, ok := m[reportingPeriodKey]; ok && repStr != "" { repInt, err := strconv.Atoi(repStr) if err != nil { return nil, fmt.Errorf("invalid %s value %q", reportingPeriodKey, repStr) } mc.reportingPeriod = time.Duration(repInt) * time.Second } else { switch mc.backendDestination { case stackdriver, openCensus: mc.reportingPeriod = time.Minute case prometheus: mc.reportingPeriod = 5 * time.Second } } return &mc, nil } // Domain holds the metrics domain to use for surfacing metrics. func Domain() string { if domain := os.Getenv(DomainEnv); domain != "" { return domain } panic(fmt.Sprintf(`The environment variable %q is not set If this is a process running on Kubernetes, then it should be specifying this via: env: - name: %s value: knative.dev/some-repository If this is a Go unit test consuming metric.Domain() then it should add the following import: import ( _ "knative.dev/pkg/metrics/testing" )`, DomainEnv, DomainEnv)) } // prometheusPort returns the TCP port number configured via the environment // for the Prometheus metrics exporter if it's set, a default value otherwise. // No validation is performed on the port value, other than ensuring that value // is a valid port number (16-bit unsigned integer). func prometheusPort() (int, error) { ppStr := os.Getenv(prometheusPortEnvName) if ppStr == "" { return defaultPrometheusPort, nil } pp, err := strconv.ParseUint(ppStr, 10, 16) if err != nil { return -1, fmt.Errorf("the environment variable %q could not be parsed as a port number: %w", prometheusPortEnvName, err) } return int(pp), nil } // JsonToMetricsOptions converts a json string of a // ExporterOptions. Returns a non-nil ExporterOptions always. func JsonToMetricsOptions(jsonOpts string) (*ExporterOptions, error) { // nolint No rename due to backwards incompatibility. var opts ExporterOptions if jsonOpts == "" { return nil, errors.New("json options string is empty") } if err := json.Unmarshal([]byte(jsonOpts), &opts); err != nil { return nil, err } return &opts, nil } // MetricsOptionsToJson converts a ExporterOptions to a json string. func MetricsOptionsToJson(opts *ExporterOptions) (string, error) { // nolint No rename due to backwards incompatibility. if opts == nil { return "", nil } jsonOpts, err := json.Marshal(opts) if err != nil { return "", err } return string(jsonOpts), nil }