2020-09-19 22:29:08 +02:00
|
|
|
package pagerduty
|
2020-09-17 01:26:19 +02:00
|
|
|
|
2020-09-19 22:22:12 +02:00
|
|
|
import (
|
2021-12-03 03:05:17 +01:00
|
|
|
"bytes"
|
|
|
|
"encoding/json"
|
2024-12-17 02:32:13 +01:00
|
|
|
"errors"
|
2020-09-19 22:22:12 +02:00
|
|
|
"fmt"
|
2021-12-03 07:44:17 +01:00
|
|
|
"io"
|
2020-11-23 22:20:06 +01:00
|
|
|
"net/http"
|
|
|
|
|
2022-12-06 07:41:09 +01:00
|
|
|
"github.com/TwiN/gatus/v5/alerting/alert"
|
|
|
|
"github.com/TwiN/gatus/v5/client"
|
2024-05-10 04:56:16 +02:00
|
|
|
"github.com/TwiN/gatus/v5/config/endpoint"
|
2024-11-14 05:54:00 +01:00
|
|
|
"github.com/TwiN/logr"
|
2024-12-17 02:32:13 +01:00
|
|
|
"gopkg.in/yaml.v3"
|
2020-09-19 22:22:12 +02:00
|
|
|
)
|
|
|
|
|
2021-07-30 00:13:37 +02:00
|
|
|
// restAPIURL is the PagerDuty Events API v2 endpoint that Send POSTs every event to.
const restAPIURL = "https://events.pagerduty.com/v2/enqueue"
|
|
|
|
|
2024-12-17 02:32:13 +01:00
|
|
|
// Sentinel errors returned while validating the provider's configuration.
var (
	// ErrIntegrationKeyNotSet is returned by Config.Validate when the
	// integration key's length is not exactly 32.
	ErrIntegrationKeyNotSet = errors.New("integration-key must have exactly 32 characters")

	// ErrDuplicateGroupOverride is returned by AlertProvider.Validate when an
	// override has an empty group or a group already used by an earlier override.
	ErrDuplicateGroupOverride = errors.New("duplicate group override")
)
|
|
|
|
|
|
|
|
// Config holds the PagerDuty settings that exist on the provider itself and
// that can be overridden per group or per alert.
type Config struct {
	// IntegrationKey is sent as the event's routing key. Validate requires its
	// length (as reported by len) to be exactly 32.
	IntegrationKey string `yaml:"integration-key"`
}
|
|
|
|
|
|
|
|
func (cfg *Config) Validate() error {
|
|
|
|
if len(cfg.IntegrationKey) != 32 {
|
|
|
|
return ErrIntegrationKeyNotSet
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
|
|
|
func (cfg *Config) Merge(override *Config) {
|
|
|
|
if len(override.IntegrationKey) > 0 {
|
|
|
|
cfg.IntegrationKey = override.IntegrationKey
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
2020-09-26 21:15:50 +02:00
|
|
|
// AlertProvider is the configuration necessary for sending an alert using PagerDuty
|
2020-09-19 22:29:08 +02:00
|
|
|
type AlertProvider struct {
|
2024-12-17 02:32:13 +01:00
|
|
|
DefaultConfig Config `yaml:",inline"`
|
2021-05-16 03:31:32 +02:00
|
|
|
|
2021-10-23 22:47:12 +02:00
|
|
|
// DefaultAlert is the default alert configuration to use for endpoints with an alert of the appropriate type
|
2021-12-03 03:05:17 +01:00
|
|
|
DefaultAlert *alert.Alert `yaml:"default-alert,omitempty"`
|
2021-10-06 02:01:36 +02:00
|
|
|
|
2021-10-06 02:40:44 +02:00
|
|
|
// Overrides is a list of Override that may be prioritized over the default configuration
|
2021-12-03 03:05:17 +01:00
|
|
|
Overrides []Override `yaml:"overrides,omitempty"`
|
2021-10-06 02:40:44 +02:00
|
|
|
}
|
|
|
|
|
|
|
|
// Override is a case under which the default integration is overridden
|
|
|
|
type Override struct {
|
2024-12-17 02:32:13 +01:00
|
|
|
Group string `yaml:"group"`
|
|
|
|
Config `yaml:",inline"`
|
2020-09-19 22:22:12 +02:00
|
|
|
}
|
|
|
|
|
2024-12-17 02:32:13 +01:00
|
|
|
// Validate the provider's configuration
|
|
|
|
func (provider *AlertProvider) Validate() error {
|
2021-10-06 02:01:36 +02:00
|
|
|
registeredGroups := make(map[string]bool)
|
2021-10-06 02:40:44 +02:00
|
|
|
if provider.Overrides != nil {
|
|
|
|
for _, override := range provider.Overrides {
|
2024-12-17 02:32:13 +01:00
|
|
|
if isAlreadyRegistered := registeredGroups[override.Group]; isAlreadyRegistered || override.Group == "" {
|
|
|
|
return ErrDuplicateGroupOverride
|
2021-10-06 02:01:36 +02:00
|
|
|
}
|
2021-10-06 02:40:44 +02:00
|
|
|
registeredGroups[override.Group] = true
|
2021-10-06 02:01:36 +02:00
|
|
|
}
|
|
|
|
}
|
2021-10-06 02:40:44 +02:00
|
|
|
// Either the default integration key has the right length, or there are overrides who are properly configured.
|
2024-12-17 02:32:13 +01:00
|
|
|
return provider.DefaultConfig.Validate()
|
2020-09-19 22:22:12 +02:00
|
|
|
}
|
|
|
|
|
2021-12-03 03:05:17 +01:00
|
|
|
// Send an alert using the provider
|
2020-10-23 22:12:53 +02:00
|
|
|
//
|
2021-12-03 03:05:17 +01:00
|
|
|
// Relevant: https://developer.pagerduty.com/docs/events-api-v2/trigger-events/
|
2024-05-10 04:56:16 +02:00
|
|
|
func (provider *AlertProvider) Send(ep *endpoint.Endpoint, alert *alert.Alert, result *endpoint.Result, resolved bool) error {
|
2024-12-17 02:32:13 +01:00
|
|
|
cfg, err := provider.GetConfig(ep.Group, alert)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
buffer := bytes.NewBuffer(provider.buildRequestBody(cfg, ep, alert, result, resolved))
|
2021-12-03 03:05:17 +01:00
|
|
|
request, err := http.NewRequest(http.MethodPost, restAPIURL, buffer)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
|
|
|
request.Header.Set("Content-Type", "application/json")
|
|
|
|
response, err := client.GetHTTPClient(nil).Do(request)
|
|
|
|
if err != nil {
|
|
|
|
return err
|
|
|
|
}
|
2022-10-20 21:16:27 +02:00
|
|
|
defer response.Body.Close()
|
2021-12-03 03:05:17 +01:00
|
|
|
if response.StatusCode > 399 {
|
2021-12-03 07:44:17 +01:00
|
|
|
body, _ := io.ReadAll(response.Body)
|
2021-12-03 03:05:17 +01:00
|
|
|
return fmt.Errorf("call to provider alert returned status code %d: %s", response.StatusCode, string(body))
|
|
|
|
}
|
|
|
|
if alert.IsSendingOnResolved() {
|
|
|
|
if resolved {
|
|
|
|
// The alert has been resolved and there's no error, so we can clear the alert's ResolveKey
|
|
|
|
alert.ResolveKey = ""
|
|
|
|
} else {
|
|
|
|
// We need to retrieve the resolve key from the response
|
|
|
|
var payload pagerDutyResponsePayload
|
2024-11-14 05:54:00 +01:00
|
|
|
if err = json.NewDecoder(response.Body).Decode(&payload); err != nil {
|
2021-12-03 04:15:51 +01:00
|
|
|
// Silently fail. We don't want to create tons of alerts just because we failed to parse the body.
|
2024-11-14 05:54:00 +01:00
|
|
|
logr.Errorf("[pagerduty.Send] Ran into error decoding pagerduty response: %s", err.Error())
|
2021-12-03 03:05:17 +01:00
|
|
|
} else {
|
|
|
|
alert.ResolveKey = payload.DedupKey
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
return nil
|
|
|
|
}
|
|
|
|
|
2022-10-20 21:47:07 +02:00
|
|
|
type Body struct {
|
|
|
|
RoutingKey string `json:"routing_key"`
|
|
|
|
DedupKey string `json:"dedup_key"`
|
|
|
|
EventAction string `json:"event_action"`
|
|
|
|
Payload Payload `json:"payload"`
|
|
|
|
}
|
|
|
|
|
|
|
|
// Payload is the "payload" object nested inside Body.
type Payload struct {
	// Summary is the human-readable message built from the endpoint's display
	// name and the alert's description.
	Summary string `json:"summary"`

	// Source identifies the sender; buildRequestBody always sets it to "Gatus".
	Source string `json:"source"`

	// Severity is the event severity; buildRequestBody always sets it to "critical".
	Severity string `json:"severity"`
}
|
|
|
|
|
2021-12-03 03:05:17 +01:00
|
|
|
// buildRequestBody builds the request body for the provider
|
2024-12-17 02:32:13 +01:00
|
|
|
func (provider *AlertProvider) buildRequestBody(cfg *Config, ep *endpoint.Endpoint, alert *alert.Alert, result *endpoint.Result, resolved bool) []byte {
|
2020-09-26 20:23:43 +02:00
|
|
|
var message, eventAction, resolveKey string
|
|
|
|
if resolved {
|
2024-05-10 04:56:16 +02:00
|
|
|
message = fmt.Sprintf("RESOLVED: %s - %s", ep.DisplayName(), alert.GetDescription())
|
2020-09-26 20:23:43 +02:00
|
|
|
eventAction = "resolve"
|
|
|
|
resolveKey = alert.ResolveKey
|
|
|
|
} else {
|
2024-05-10 04:56:16 +02:00
|
|
|
message = fmt.Sprintf("TRIGGERED: %s - %s", ep.DisplayName(), alert.GetDescription())
|
2020-09-26 20:23:43 +02:00
|
|
|
eventAction = "trigger"
|
|
|
|
resolveKey = ""
|
|
|
|
}
|
2022-10-20 21:47:07 +02:00
|
|
|
body, _ := json.Marshal(Body{
|
2024-12-17 02:32:13 +01:00
|
|
|
RoutingKey: cfg.IntegrationKey,
|
2022-10-20 21:47:07 +02:00
|
|
|
DedupKey: resolveKey,
|
|
|
|
EventAction: eventAction,
|
|
|
|
Payload: Payload{
|
|
|
|
Summary: message,
|
|
|
|
Source: "Gatus",
|
|
|
|
Severity: "critical",
|
|
|
|
},
|
|
|
|
})
|
|
|
|
return body
|
2020-09-17 01:26:19 +02:00
|
|
|
}
|
2021-05-16 03:31:32 +02:00
|
|
|
|
2024-12-17 02:32:13 +01:00
|
|
|
// GetDefaultAlert returns the provider's default alert configuration
|
|
|
|
func (provider *AlertProvider) GetDefaultAlert() *alert.Alert {
|
|
|
|
return provider.DefaultAlert
|
|
|
|
}
|
|
|
|
|
|
|
|
// GetConfig returns the configuration for the provider with the overrides applied
|
|
|
|
func (provider *AlertProvider) GetConfig(group string, alert *alert.Alert) (*Config, error) {
|
|
|
|
cfg := provider.DefaultConfig
|
|
|
|
// Handle group overrides
|
2021-10-06 02:40:44 +02:00
|
|
|
if provider.Overrides != nil {
|
|
|
|
for _, override := range provider.Overrides {
|
|
|
|
if group == override.Group {
|
2024-12-17 02:32:13 +01:00
|
|
|
cfg.Merge(&override.Config)
|
|
|
|
break
|
2021-10-06 02:40:44 +02:00
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2024-12-17 02:32:13 +01:00
|
|
|
// Handle alert overrides
|
|
|
|
if len(alert.ProviderOverride) != 0 {
|
|
|
|
overrideConfig := Config{}
|
|
|
|
if err := yaml.Unmarshal(alert.ProviderOverrideAsBytes(), &overrideConfig); err != nil {
|
|
|
|
return nil, err
|
|
|
|
}
|
|
|
|
cfg.Merge(&overrideConfig)
|
|
|
|
}
|
|
|
|
// Validate the configuration
|
|
|
|
err := cfg.Validate()
|
|
|
|
return &cfg, err
|
2021-10-06 02:40:44 +02:00
|
|
|
}
|
|
|
|
|
2024-12-17 02:32:13 +01:00
|
|
|
// ValidateOverrides validates the alert's provider override and, if present, the group override
|
|
|
|
func (provider *AlertProvider) ValidateOverrides(group string, alert *alert.Alert) error {
|
|
|
|
_, err := provider.GetConfig(group, alert)
|
|
|
|
return err
|
2021-05-16 03:31:32 +02:00
|
|
|
}
|
2021-12-03 03:05:17 +01:00
|
|
|
|
|
|
|
// pagerDutyResponsePayload is the shape into which Send decodes the JSON body
// of a successful response.
type pagerDutyResponsePayload struct {
	// Status is decoded from the "status" key; nothing in this file reads it.
	Status string `json:"status"`

	// Message is decoded from the "message" key; nothing in this file reads it.
	Message string `json:"message"`

	// DedupKey is decoded from the "dedup_key" key. Send stores it as the
	// alert's ResolveKey so that a later resolve event can reference it.
	DedupKey string `json:"dedup_key"`
}
|