Documentation ¶
Index ¶
- Constants
- func GroupKey(file, name string) string
- func NewOriginContext(ctx context.Context, rule RuleDetail) context.Context
- type Alert
- type AlertState
- type AlertingRule
- func (r *AlertingRule) ActiveAlerts() []*Alert
- func (r *AlertingRule) Annotations() labels.Labels
- func (r *AlertingRule) Eval(ctx context.Context, ts time.Time, query QueryFunc, externalURL *url.URL, ...) (promql.Vector, error)
- func (r *AlertingRule) ForEachActiveAlert(f func(*Alert))
- func (r *AlertingRule) GetEvaluationDuration() time.Duration
- func (r *AlertingRule) GetEvaluationTimestamp() time.Time
- func (r *AlertingRule) Health() RuleHealth
- func (r *AlertingRule) HoldDuration() time.Duration
- func (r *AlertingRule) KeepFiringFor() time.Duration
- func (r *AlertingRule) Labels() labels.Labels
- func (r *AlertingRule) LastError() error
- func (r *AlertingRule) Name() string
- func (r *AlertingRule) Query() parser.Expr
- func (r *AlertingRule) QueryforStateSeries(alert *Alert, q storage.Querier) (storage.Series, error)
- func (r *AlertingRule) Restored() bool
- func (r *AlertingRule) SetEvaluationDuration(dur time.Duration)
- func (r *AlertingRule) SetEvaluationTimestamp(ts time.Time)
- func (r *AlertingRule) SetHealth(health RuleHealth)
- func (r *AlertingRule) SetLastError(err error)
- func (r *AlertingRule) SetRestored(restored bool)
- func (r *AlertingRule) State() AlertState
- func (r *AlertingRule) String() string
- type FileLoader
- type Group
- func (g *Group) AlertingRules() []*AlertingRule
- func (g *Group) Context() context.Context
- func (g *Group) CopyState(from *Group)
- func (g *Group) Equals(ng *Group) bool
- func (g *Group) Eval(ctx context.Context, ts time.Time)
- func (g *Group) EvalTimestamp(startTime int64) time.Time
- func (g *Group) File() string
- func (g *Group) GetEvaluationTime() time.Duration
- func (g *Group) GetLastEvaluation() time.Time
- func (g *Group) HasAlertingRules() bool
- func (g *Group) Interval() time.Duration
- func (g *Group) Limit() int
- func (g *Group) Name() string
- func (g *Group) Queryable() storage.Queryable
- func (g *Group) RestoreForState(ts time.Time)
- func (g *Group) Rules() []Rule
- type GroupLoader
- type GroupOptions
- type Manager
- func (m *Manager) AlertingRules() []*AlertingRule
- func (m *Manager) LoadGroups(interval time.Duration, externalLabels labels.Labels, externalURL string, ...) (map[string]*Group, []error)
- func (m *Manager) RuleGroups() []*Group
- func (m *Manager) Rules() []Rule
- func (m *Manager) Run()
- func (m *Manager) Stop()
- func (m *Manager) Update(interval time.Duration, files []string, externalLabels labels.Labels, ...) error
- type ManagerOptions
- type Metrics
- type NotifyFunc
- type QueryFunc
- type RecordingRule
- func (rule *RecordingRule) Eval(ctx context.Context, ts time.Time, query QueryFunc, _ *url.URL, limit int) (promql.Vector, error)
- func (rule *RecordingRule) GetEvaluationDuration() time.Duration
- func (rule *RecordingRule) GetEvaluationTimestamp() time.Time
- func (rule *RecordingRule) Health() RuleHealth
- func (rule *RecordingRule) Labels() labels.Labels
- func (rule *RecordingRule) LastError() error
- func (rule *RecordingRule) Name() string
- func (rule *RecordingRule) Query() parser.Expr
- func (rule *RecordingRule) SetEvaluationDuration(dur time.Duration)
- func (rule *RecordingRule) SetEvaluationTimestamp(ts time.Time)
- func (rule *RecordingRule) SetHealth(health RuleHealth)
- func (rule *RecordingRule) SetLastError(err error)
- func (rule *RecordingRule) String() string
- type Rule
- type RuleDetail
- type RuleGroupPostProcessFunc
- type RuleHealth
- type Sender
Constants ¶
const ( KindAlerting = "alerting" KindRecording = "recording" )
Variables ¶
This section is empty.
Functions ¶
func NewOriginContext ¶
func NewOriginContext(ctx context.Context, rule RuleDetail) context.Context
NewOriginContext returns a new context with data about the origin attached.
Types ¶
type Alert ¶
type Alert struct { State AlertState Labels labels.Labels Annotations labels.Labels // The value at the last evaluation of the alerting expression. Value float64 // The interval during which the condition of this alert held true. // ResolvedAt will be 0 to indicate a still active alert. ActiveAt time.Time FiredAt time.Time ResolvedAt time.Time LastSentAt time.Time ValidUntil time.Time KeepFiringSince time.Time }
Alert is the user-level representation of a single instance of an alerting rule.
type AlertState ¶
type AlertState int
AlertState denotes the state of an active alert.
const ( // StateInactive is the state of an alert that is neither firing nor pending. StateInactive AlertState = iota // StatePending is the state of an alert that has been active for less than // the configured threshold duration. StatePending // StateFiring is the state of an alert that has been active for longer than // the configured threshold duration. StateFiring )
func (AlertState) String ¶
func (s AlertState) String() string
type AlertingRule ¶
type AlertingRule struct {
// contains filtered or unexported fields
}
An AlertingRule generates alerts from its vector expression.
func NewAlertingRule ¶
func NewAlertingRule( name string, vec parser.Expr, hold, keepFiringFor time.Duration, labels, annotations, externalLabels labels.Labels, externalURL string, restored bool, logger log.Logger, ) *AlertingRule
NewAlertingRule constructs a new AlertingRule.
func (*AlertingRule) ActiveAlerts ¶
func (r *AlertingRule) ActiveAlerts() []*Alert
ActiveAlerts returns a slice of active alerts.
func (*AlertingRule) Annotations ¶
func (r *AlertingRule) Annotations() labels.Labels
Annotations returns the annotations of the alerting rule.
func (*AlertingRule) Eval ¶
func (r *AlertingRule) Eval(ctx context.Context, ts time.Time, query QueryFunc, externalURL *url.URL, limit int) (promql.Vector, error)
Eval evaluates the rule expression and then creates pending alerts and fires or removes previously pending alerts accordingly.
func (*AlertingRule) ForEachActiveAlert ¶
func (r *AlertingRule) ForEachActiveAlert(f func(*Alert))
ForEachActiveAlert runs the given function on each active alert. Use this when you need to operate on the actual alerts held by the AlertingRule rather than on copies of them. If you want to work on copies of the alerts, get them from ActiveAlerts() instead.
func (*AlertingRule) GetEvaluationDuration ¶
func (r *AlertingRule) GetEvaluationDuration() time.Duration
GetEvaluationDuration returns the time it took to evaluate the alerting rule.
func (*AlertingRule) GetEvaluationTimestamp ¶
func (r *AlertingRule) GetEvaluationTimestamp() time.Time
GetEvaluationTimestamp returns the time the evaluation took place.
func (*AlertingRule) Health ¶
func (r *AlertingRule) Health() RuleHealth
Health returns the current health of the alerting rule.
func (*AlertingRule) HoldDuration ¶
func (r *AlertingRule) HoldDuration() time.Duration
HoldDuration returns the hold duration of the alerting rule.
func (*AlertingRule) KeepFiringFor ¶
func (r *AlertingRule) KeepFiringFor() time.Duration
KeepFiringFor returns the duration an alerting rule should keep firing for after resolution.
func (*AlertingRule) Labels ¶
func (r *AlertingRule) Labels() labels.Labels
Labels returns the labels of the alerting rule.
func (*AlertingRule) LastError ¶
func (r *AlertingRule) LastError() error
LastError returns the last error seen by the alerting rule.
func (*AlertingRule) Name ¶
func (r *AlertingRule) Name() string
Name returns the name of the alerting rule.
func (*AlertingRule) Query ¶
func (r *AlertingRule) Query() parser.Expr
Query returns the query expression of the alerting rule.
func (*AlertingRule) QueryforStateSeries ¶
QueryforStateSeries returns the series for ALERTS_FOR_STATE.
func (*AlertingRule) Restored ¶
func (r *AlertingRule) Restored() bool
Restored returns the restoration state of the alerting rule.
func (*AlertingRule) SetEvaluationDuration ¶
func (r *AlertingRule) SetEvaluationDuration(dur time.Duration)
SetEvaluationDuration updates evaluationDuration to the duration it took to evaluate the rule on its last evaluation.
func (*AlertingRule) SetEvaluationTimestamp ¶
func (r *AlertingRule) SetEvaluationTimestamp(ts time.Time)
SetEvaluationTimestamp updates evaluationTimestamp to the timestamp of when the rule was last evaluated.
func (*AlertingRule) SetHealth ¶
func (r *AlertingRule) SetHealth(health RuleHealth)
SetHealth sets the current health of the alerting rule.
func (*AlertingRule) SetLastError ¶
func (r *AlertingRule) SetLastError(err error)
SetLastError sets the current error seen by the alerting rule.
func (*AlertingRule) SetRestored ¶
func (r *AlertingRule) SetRestored(restored bool)
SetRestored updates the restoration state of the alerting rule.
func (*AlertingRule) State ¶
func (r *AlertingRule) State() AlertState
State returns the maximum state of alert instances for this rule. The ordering is StateFiring > StatePending > StateInactive.
func (*AlertingRule) String ¶
func (r *AlertingRule) String() string
type FileLoader ¶
type FileLoader struct{}
FileLoader is the default GroupLoader implementation. It defers to rulefmt.ParseFile and parser.ParseExpr.
func (FileLoader) Load ¶
func (FileLoader) Load(identifier string) (*rulefmt.RuleGroups, []error)
type Group ¶
type Group struct {
// contains filtered or unexported fields
}
Group is a set of rules that have a logical relation.
func NewGroup ¶
func NewGroup(o GroupOptions) *Group
NewGroup makes a new Group with the given name, options, and rules.
func (*Group) AlertingRules ¶
func (g *Group) AlertingRules() []*AlertingRule
AlertingRules returns the list of the group's alerting rules.
func (*Group) CopyState ¶
CopyState copies the alerting rule and staleness related state from the given group.
Rules are matched based on their name and labels. If there are duplicates, the first is matched with the first, second with the second etc.
func (*Group) Eval ¶
Eval runs a single evaluation cycle in which all rules are evaluated sequentially.
func (*Group) EvalTimestamp ¶
EvalTimestamp returns the immediately preceding consistently slotted evaluation time.
func (*Group) GetEvaluationTime ¶
GetEvaluationTime returns the time it took to evaluate the rule group.
func (*Group) GetLastEvaluation ¶
GetLastEvaluation returns the time the last evaluation of the rule group took place.
func (*Group) HasAlertingRules ¶
HasAlertingRules returns true if the group contains at least one AlertingRule.
func (*Group) RestoreForState ¶
RestoreForState restores the 'for' state of the alerts by looking up last ActiveAt from storage.
type GroupLoader ¶
type GroupLoader interface { Load(identifier string) (*rulefmt.RuleGroups, []error) Parse(query string) (parser.Expr, error) }
GroupLoader is responsible for loading rule groups from arbitrary sources and parsing them.
type GroupOptions ¶
type GroupOptions struct {
Name, File string
Interval time.Duration
Limit int
Rules []Rule
ShouldRestore bool
Opts *ManagerOptions
RuleGroupPostProcessFunc RuleGroupPostProcessFunc
// contains filtered or unexported fields
}
type Manager ¶
type Manager struct {
// contains filtered or unexported fields
}
The Manager manages recording and alerting rules.
func NewManager ¶
func NewManager(o *ManagerOptions) *Manager
NewManager returns an implementation of Manager, ready to be started by calling the Run method.
func (*Manager) AlertingRules ¶
func (m *Manager) AlertingRules() []*AlertingRule
AlertingRules returns the list of the manager's alerting rules.
func (*Manager) LoadGroups ¶
func (m *Manager) LoadGroups( interval time.Duration, externalLabels labels.Labels, externalURL string, ruleGroupPostProcessFunc RuleGroupPostProcessFunc, filenames ...string, ) (map[string]*Group, []error)
LoadGroups reads groups from a list of files.
func (*Manager) RuleGroups ¶
RuleGroups returns the list of manager's rule groups.
func (*Manager) Run ¶
func (m *Manager) Run()
Run starts processing of the rule manager. It is blocking.
func (*Manager) Update ¶
func (m *Manager) Update(interval time.Duration, files []string, externalLabels labels.Labels, externalURL string, ruleGroupPostProcessFunc RuleGroupPostProcessFunc) error
Update updates the rule manager's state as the config requires. If loading the new rules fails, the old rule set is restored.
type ManagerOptions ¶
type ManagerOptions struct { ExternalURL *url.URL QueryFunc QueryFunc NotifyFunc NotifyFunc Context context.Context Appendable storage.Appendable Queryable storage.Queryable Logger log.Logger Registerer prometheus.Registerer OutageTolerance time.Duration ForGracePeriod time.Duration ResendDelay time.Duration GroupLoader GroupLoader Metrics *Metrics }
ManagerOptions bundles options for the Manager.
type Metrics ¶
type Metrics struct { EvalDuration prometheus.Summary IterationDuration prometheus.Summary IterationsMissed *prometheus.CounterVec IterationsScheduled *prometheus.CounterVec EvalTotal *prometheus.CounterVec EvalFailures *prometheus.CounterVec GroupInterval *prometheus.GaugeVec GroupLastEvalTime *prometheus.GaugeVec GroupLastDuration *prometheus.GaugeVec GroupRules *prometheus.GaugeVec GroupSamples *prometheus.GaugeVec }
Metrics for rule evaluation.
func NewGroupMetrics ¶
func NewGroupMetrics(reg prometheus.Registerer) *Metrics
NewGroupMetrics creates a new instance of Metrics and registers it with the provided registerer, if not nil.
type NotifyFunc ¶
NotifyFunc sends notifications about a set of alerts generated by the given expression.
func SendAlerts ¶
func SendAlerts(s Sender, externalURL string) NotifyFunc
SendAlerts implements the rules.NotifyFunc for a Notifier.
type RecordingRule ¶
type RecordingRule struct {
// contains filtered or unexported fields
}
A RecordingRule records its vector expression into new timeseries.
func NewRecordingRule ¶
NewRecordingRule returns a new recording rule.
func (*RecordingRule) Eval ¶
func (rule *RecordingRule) Eval(ctx context.Context, ts time.Time, query QueryFunc, _ *url.URL, limit int) (promql.Vector, error)
Eval evaluates the rule and then overrides the metric names and labels accordingly.
func (*RecordingRule) GetEvaluationDuration ¶
func (rule *RecordingRule) GetEvaluationDuration() time.Duration
GetEvaluationDuration returns the time it took to evaluate the recording rule.
func (*RecordingRule) GetEvaluationTimestamp ¶
func (rule *RecordingRule) GetEvaluationTimestamp() time.Time
GetEvaluationTimestamp returns the time the evaluation took place.
func (*RecordingRule) Health ¶
func (rule *RecordingRule) Health() RuleHealth
Health returns the current health of the recording rule.
func (*RecordingRule) Labels ¶
func (rule *RecordingRule) Labels() labels.Labels
Labels returns the rule labels.
func (*RecordingRule) LastError ¶
func (rule *RecordingRule) LastError() error
LastError returns the last error seen by the recording rule.
func (*RecordingRule) Query ¶
func (rule *RecordingRule) Query() parser.Expr
Query returns the rule query expression.
func (*RecordingRule) SetEvaluationDuration ¶
func (rule *RecordingRule) SetEvaluationDuration(dur time.Duration)
SetEvaluationDuration updates evaluationDuration to the duration it took to evaluate the rule on its last evaluation.
func (*RecordingRule) SetEvaluationTimestamp ¶
func (rule *RecordingRule) SetEvaluationTimestamp(ts time.Time)
SetEvaluationTimestamp updates evaluationTimestamp to the timestamp of when the rule was last evaluated.
func (*RecordingRule) SetHealth ¶
func (rule *RecordingRule) SetHealth(health RuleHealth)
SetHealth sets the current health of the recording rule.
func (*RecordingRule) SetLastError ¶
func (rule *RecordingRule) SetLastError(err error)
SetLastError sets the current error seen by the recording rule.
func (*RecordingRule) String ¶
func (rule *RecordingRule) String() string
type Rule ¶
type Rule interface { Name() string // Labels of the rule. Labels() labels.Labels // Eval evaluates the rule, including any associated recording or alerting actions. Eval(context.Context, time.Time, QueryFunc, *url.URL, int) (promql.Vector, error) // String returns a human-readable string representation of the rule. String() string // Query returns the rule query expression. Query() parser.Expr // SetLastError sets the current error experienced by the rule. SetLastError(error) // LastError returns the last error experienced by the rule. LastError() error // SetHealth sets the current health of the rule. SetHealth(RuleHealth) // Health returns the current health of the rule. Health() RuleHealth SetEvaluationDuration(time.Duration) // GetEvaluationDuration returns last evaluation duration. // NOTE: Used dynamically by rules.html template. GetEvaluationDuration() time.Duration SetEvaluationTimestamp(time.Time) // GetEvaluationTimestamp returns last evaluation timestamp. // NOTE: Used dynamically by rules.html template. GetEvaluationTimestamp() time.Time }
A Rule encapsulates a vector expression which is evaluated at a specified interval and acted upon (currently either recorded or used for alerting).
type RuleDetail ¶
RuleDetail contains information about the rule that is being evaluated.
func FromOriginContext ¶
func FromOriginContext(ctx context.Context) RuleDetail
FromOriginContext returns the RuleDetail origin data from the context.
func NewRuleDetail ¶
func NewRuleDetail(r Rule) RuleDetail
NewRuleDetail creates a RuleDetail from a given Rule.
type RuleGroupPostProcessFunc ¶
RuleGroupPostProcessFunc is a function that, if not nil, is called before each rule group evaluation. Use this function type when post-processing of the rule group is needed.
type RuleHealth ¶
type RuleHealth string
RuleHealth describes the health state of a rule.
const ( HealthUnknown RuleHealth = "unknown" HealthGood RuleHealth = "ok" HealthBad RuleHealth = "err" )
The possible health states of a rule based on the last execution.