mirror of
https://github.com/open-telemetry/opentelemetry-go.git
synced 2024-12-16 10:19:23 +02:00
5461669733
* Checkpoint new pull controller * Tests pass * Fix example * Example fix * Add a test * Comment * address MrAlias's feedback
376 lines
12 KiB
Go
376 lines
12 KiB
Go
// Copyright The OpenTelemetry Authors
|
|
//
|
|
// Licensed under the Apache License, Version 2.0 (the "License");
|
|
// you may not use this file except in compliance with the License.
|
|
// You may obtain a copy of the License at
|
|
//
|
|
// http://www.apache.org/licenses/LICENSE-2.0
|
|
//
|
|
// Unless required by applicable law or agreed to in writing, software
|
|
// distributed under the License is distributed on an "AS IS" BASIS,
|
|
// WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
// See the License for the specific language governing permissions and
|
|
// limitations under the License.
|
|
|
|
package prometheus
|
|
|
|
import (
|
|
"context"
|
|
"fmt"
|
|
"net/http"
|
|
"sync"
|
|
|
|
"go.opentelemetry.io/otel/api/metric"
|
|
|
|
"github.com/prometheus/client_golang/prometheus"
|
|
"github.com/prometheus/client_golang/prometheus/promhttp"
|
|
|
|
"go.opentelemetry.io/otel/api/global"
|
|
"go.opentelemetry.io/otel/api/label"
|
|
export "go.opentelemetry.io/otel/sdk/export/metric"
|
|
"go.opentelemetry.io/otel/sdk/export/metric/aggregator"
|
|
"go.opentelemetry.io/otel/sdk/metric/controller/pull"
|
|
"go.opentelemetry.io/otel/sdk/metric/selector/simple"
|
|
)
|
|
|
|
// Exporter is an implementation of metric.Exporter that sends metrics to
|
|
// Prometheus.
|
|
//
|
|
// This exporter supports Prometheus pulls, as such it does not
|
|
// implement the export.Exporter interface.
|
|
type Exporter struct {
|
|
handler http.Handler
|
|
|
|
registerer prometheus.Registerer
|
|
gatherer prometheus.Gatherer
|
|
|
|
// lock protects access to the controller. The controller
|
|
// exposes its own lock, but using a dedicated lock in this
|
|
// struct allows the exporter to potentially support multiple
|
|
// controllers (e.g., with different resources).
|
|
lock sync.RWMutex
|
|
controller *pull.Controller
|
|
|
|
onError func(error)
|
|
|
|
defaultSummaryQuantiles []float64
|
|
defaultHistogramBoundaries []metric.Number
|
|
}
|
|
|
|
var _ http.Handler = &Exporter{}
|
|
|
|
// Config is a set of configs for the tally reporter.
|
|
type Config struct {
|
|
// Registry is the prometheus registry that will be used as the default Registerer and
|
|
// Gatherer if these are not specified.
|
|
//
|
|
// If not set a new empty Registry is created.
|
|
Registry *prometheus.Registry
|
|
|
|
// Registerer is the prometheus registerer to register
|
|
// metrics with.
|
|
//
|
|
// If not specified the Registry will be used as default.
|
|
Registerer prometheus.Registerer
|
|
|
|
// Gatherer is the prometheus gatherer to gather
|
|
// metrics with.
|
|
//
|
|
// If not specified the Registry will be used as default.
|
|
Gatherer prometheus.Gatherer
|
|
|
|
// DefaultSummaryQuantiles is the default summary quantiles
|
|
// to use. Use nil to specify the system-default summary quantiles.
|
|
DefaultSummaryQuantiles []float64
|
|
|
|
// DefaultHistogramBoundaries defines the default histogram bucket
|
|
// boundaries.
|
|
DefaultHistogramBoundaries []metric.Number
|
|
|
|
// OnError is a function that handle errors that may occur while exporting metrics.
|
|
// TODO: This should be refactored or even removed once we have a better error handling mechanism.
|
|
OnError func(error)
|
|
}
|
|
|
|
// NewExportPipeline sets up a complete export pipeline with the recommended setup,
|
|
// using the recommended selector and standard integrator. See the pull.Options.
|
|
func NewExportPipeline(config Config, options ...pull.Option) (*Exporter, error) {
|
|
if config.Registry == nil {
|
|
config.Registry = prometheus.NewRegistry()
|
|
}
|
|
|
|
if config.Registerer == nil {
|
|
config.Registerer = config.Registry
|
|
}
|
|
|
|
if config.Gatherer == nil {
|
|
config.Gatherer = config.Registry
|
|
}
|
|
|
|
if config.OnError == nil {
|
|
config.OnError = func(err error) {
|
|
fmt.Println(err.Error())
|
|
}
|
|
}
|
|
|
|
e := &Exporter{
|
|
handler: promhttp.HandlerFor(config.Gatherer, promhttp.HandlerOpts{}),
|
|
registerer: config.Registerer,
|
|
gatherer: config.Gatherer,
|
|
defaultSummaryQuantiles: config.DefaultSummaryQuantiles,
|
|
defaultHistogramBoundaries: config.DefaultHistogramBoundaries,
|
|
onError: config.OnError,
|
|
}
|
|
|
|
c := &collector{
|
|
exp: e,
|
|
}
|
|
e.SetController(config, options...)
|
|
if err := config.Registerer.Register(c); err != nil {
|
|
return nil, fmt.Errorf("cannot register the collector: %w", err)
|
|
}
|
|
|
|
return e, nil
|
|
}
|
|
|
|
// InstallNewPipeline instantiates a NewExportPipeline and registers it globally.
|
|
// Typically called as:
|
|
//
|
|
// hf, err := prometheus.InstallNewPipeline(prometheus.Config{...})
|
|
//
|
|
// if err != nil {
|
|
// ...
|
|
// }
|
|
// http.HandleFunc("/metrics", hf)
|
|
// defer pipeline.Stop()
|
|
// ... Done
|
|
func InstallNewPipeline(config Config, options ...pull.Option) (*Exporter, error) {
|
|
exp, err := NewExportPipeline(config, options...)
|
|
if err != nil {
|
|
return nil, err
|
|
}
|
|
global.SetMeterProvider(exp.Provider())
|
|
return exp, nil
|
|
}
|
|
|
|
// SetController sets up a standard *pull.Controller as the metric provider
|
|
// for this exporter.
|
|
func (e *Exporter) SetController(config Config, options ...pull.Option) {
|
|
e.lock.Lock()
|
|
defer e.lock.Unlock()
|
|
// Prometheus uses a stateful pull controller since instruments are
|
|
// cumulative and should not be reset after each collection interval.
|
|
//
|
|
// Prometheus uses this approach to be resilient to scrape failures.
|
|
// If a Prometheus server tries to scrape metrics from a host and fails for some reason,
|
|
// it could try again on the next scrape and no data would be lost, only resolution.
|
|
//
|
|
// Gauges (or LastValues) and Summaries are an exception to this and have different behaviors.
|
|
//
|
|
// TODO: Prometheus supports "Gauge Histogram" which are
|
|
// expressed as delta histograms.
|
|
e.controller = pull.New(
|
|
simple.NewWithHistogramDistribution(config.DefaultHistogramBoundaries),
|
|
append(options, pull.WithStateful(true))...,
|
|
)
|
|
}
|
|
|
|
// Provider returns the metric.Provider of this exporter.
|
|
func (e *Exporter) Provider() metric.Provider {
|
|
return e.controller.Provider()
|
|
}
|
|
|
|
// Controller returns the controller object that coordinates collection for the SDK.
|
|
func (e *Exporter) Controller() *pull.Controller {
|
|
e.lock.RLock()
|
|
defer e.lock.RUnlock()
|
|
return e.controller
|
|
}
|
|
|
|
func (e *Exporter) ServeHTTP(w http.ResponseWriter, r *http.Request) {
|
|
e.handler.ServeHTTP(w, r)
|
|
}
|
|
|
|
// collector implements prometheus.Collector interface.
|
|
type collector struct {
|
|
exp *Exporter
|
|
}
|
|
|
|
var _ prometheus.Collector = (*collector)(nil)
|
|
|
|
func (c *collector) Describe(ch chan<- *prometheus.Desc) {
|
|
c.exp.lock.RLock()
|
|
defer c.exp.lock.RUnlock()
|
|
|
|
_ = c.exp.Controller().ForEach(func(record export.Record) error {
|
|
ch <- c.toDesc(&record)
|
|
return nil
|
|
})
|
|
}
|
|
|
|
// Collect exports the last calculated CheckpointSet.
|
|
//
|
|
// Collect is invoked whenever prometheus.Gatherer is also invoked.
|
|
// For example, when the HTTP endpoint is invoked by Prometheus.
|
|
func (c *collector) Collect(ch chan<- prometheus.Metric) {
|
|
c.exp.lock.RLock()
|
|
defer c.exp.lock.RUnlock()
|
|
|
|
ctrl := c.exp.Controller()
|
|
ctrl.Collect(context.Background())
|
|
|
|
err := ctrl.ForEach(func(record export.Record) error {
|
|
agg := record.Aggregator()
|
|
numberKind := record.Descriptor().NumberKind()
|
|
// TODO: Use the resource value in this record.
|
|
labels := labelValues(record.Labels())
|
|
desc := c.toDesc(&record)
|
|
|
|
if hist, ok := agg.(aggregator.Histogram); ok {
|
|
if err := c.exportHistogram(ch, hist, numberKind, desc, labels); err != nil {
|
|
return fmt.Errorf("exporting histogram: %w", err)
|
|
}
|
|
} else if dist, ok := agg.(aggregator.Distribution); ok {
|
|
// TODO: summaries values are never being resetted.
|
|
// As measurements are recorded, new records starts to have less impact on these summaries.
|
|
// We should implement an solution that is similar to the Prometheus Clients
|
|
// using a rolling window for summaries could be a solution.
|
|
//
|
|
// References:
|
|
// https://www.robustperception.io/how-does-a-prometheus-summary-work
|
|
// https://github.com/prometheus/client_golang/blob/fa4aa9000d2863904891d193dea354d23f3d712a/prometheus/summary.go#L135
|
|
if err := c.exportSummary(ch, dist, numberKind, desc, labels); err != nil {
|
|
return fmt.Errorf("exporting summary: %w", err)
|
|
}
|
|
} else if sum, ok := agg.(aggregator.Sum); ok {
|
|
if err := c.exportCounter(ch, sum, numberKind, desc, labels); err != nil {
|
|
return fmt.Errorf("exporting counter: %w", err)
|
|
}
|
|
} else if lastValue, ok := agg.(aggregator.LastValue); ok {
|
|
if err := c.exportLastValue(ch, lastValue, numberKind, desc, labels); err != nil {
|
|
return fmt.Errorf("exporting last value: %w", err)
|
|
}
|
|
}
|
|
return nil
|
|
})
|
|
if err != nil {
|
|
c.exp.onError(err)
|
|
}
|
|
}
|
|
|
|
func (c *collector) exportLastValue(ch chan<- prometheus.Metric, lvagg aggregator.LastValue, kind metric.NumberKind, desc *prometheus.Desc, labels []string) error {
|
|
lv, _, err := lvagg.LastValue()
|
|
if err != nil {
|
|
return fmt.Errorf("error retrieving last value: %w", err)
|
|
}
|
|
|
|
m, err := prometheus.NewConstMetric(desc, prometheus.GaugeValue, lv.CoerceToFloat64(kind), labels...)
|
|
if err != nil {
|
|
return fmt.Errorf("error creating constant metric: %w", err)
|
|
}
|
|
|
|
ch <- m
|
|
return nil
|
|
}
|
|
|
|
func (c *collector) exportCounter(ch chan<- prometheus.Metric, sum aggregator.Sum, kind metric.NumberKind, desc *prometheus.Desc, labels []string) error {
|
|
v, err := sum.Sum()
|
|
if err != nil {
|
|
return fmt.Errorf("error retrieving counter: %w", err)
|
|
}
|
|
|
|
m, err := prometheus.NewConstMetric(desc, prometheus.CounterValue, v.CoerceToFloat64(kind), labels...)
|
|
if err != nil {
|
|
return fmt.Errorf("error creating constant metric: %w", err)
|
|
}
|
|
|
|
ch <- m
|
|
return nil
|
|
}
|
|
|
|
func (c *collector) exportSummary(ch chan<- prometheus.Metric, dist aggregator.Distribution, kind metric.NumberKind, desc *prometheus.Desc, labels []string) error {
|
|
count, err := dist.Count()
|
|
if err != nil {
|
|
return fmt.Errorf("error retrieving count: %w", err)
|
|
}
|
|
|
|
var sum metric.Number
|
|
sum, err = dist.Sum()
|
|
if err != nil {
|
|
return fmt.Errorf("error retrieving distribution sum: %w", err)
|
|
}
|
|
|
|
quantiles := make(map[float64]float64)
|
|
for _, quantile := range c.exp.defaultSummaryQuantiles {
|
|
q, _ := dist.Quantile(quantile)
|
|
quantiles[quantile] = q.CoerceToFloat64(kind)
|
|
}
|
|
|
|
m, err := prometheus.NewConstSummary(desc, uint64(count), sum.CoerceToFloat64(kind), quantiles, labels...)
|
|
if err != nil {
|
|
return fmt.Errorf("error creating constant summary: %w", err)
|
|
}
|
|
|
|
ch <- m
|
|
return nil
|
|
}
|
|
|
|
func (c *collector) exportHistogram(ch chan<- prometheus.Metric, hist aggregator.Histogram, kind metric.NumberKind, desc *prometheus.Desc, labels []string) error {
|
|
buckets, err := hist.Histogram()
|
|
if err != nil {
|
|
return fmt.Errorf("error retrieving histogram: %w", err)
|
|
}
|
|
sum, err := hist.Sum()
|
|
if err != nil {
|
|
return fmt.Errorf("error retrieving sum: %w", err)
|
|
}
|
|
|
|
var totalCount uint64
|
|
// counts maps from the bucket upper-bound to the cumulative count.
|
|
// The bucket with upper-bound +inf is not included.
|
|
counts := make(map[float64]uint64, len(buckets.Boundaries))
|
|
for i := range buckets.Boundaries {
|
|
boundary := buckets.Boundaries[i].CoerceToFloat64(kind)
|
|
totalCount += buckets.Counts[i].AsUint64()
|
|
counts[boundary] = totalCount
|
|
}
|
|
// Include the +inf bucket in the total count.
|
|
totalCount += buckets.Counts[len(buckets.Counts)-1].AsUint64()
|
|
|
|
m, err := prometheus.NewConstHistogram(desc, totalCount, sum.CoerceToFloat64(kind), counts, labels...)
|
|
if err != nil {
|
|
return fmt.Errorf("error creating constant histogram: %w", err)
|
|
}
|
|
|
|
ch <- m
|
|
return nil
|
|
}
|
|
|
|
func (c *collector) toDesc(record *export.Record) *prometheus.Desc {
|
|
desc := record.Descriptor()
|
|
labels := labelsKeys(record.Labels())
|
|
return prometheus.NewDesc(sanitize(desc.Name()), desc.Description(), labels, nil)
|
|
}
|
|
|
|
func labelsKeys(labels *label.Set) []string {
|
|
iter := labels.Iter()
|
|
keys := make([]string, 0, iter.Len())
|
|
for iter.Next() {
|
|
kv := iter.Label()
|
|
keys = append(keys, sanitize(string(kv.Key)))
|
|
}
|
|
return keys
|
|
}
|
|
|
|
func labelValues(labels *label.Set) []string {
|
|
// TODO(paivagustavo): parse the labels.Encoded() instead of calling `Emit()` directly
|
|
// this would avoid unnecessary allocations.
|
|
iter := labels.Iter()
|
|
values := make([]string, 0, iter.Len())
|
|
for iter.Next() {
|
|
label := iter.Label()
|
|
values = append(values, label.Value.Emit())
|
|
}
|
|
return values
|
|
}
|