debian-mirror-gitlab/app/services/clusters/integrations/prometheus_health_check_service.rb

Ignoring revisions in .git-blame-ignore-revs. Click here to bypass and see the normal blame view.

102 lines
2.7 KiB
Ruby
Raw Normal View History

2020-04-22 19:07:51 +05:30
# frozen_string_literal: true
module Clusters
  module Integrations
    # Probes the Prometheus client of a project cluster's Prometheus
    # integration, logs the outcome, sends an alert through
    # Projects::Alerting::NotifyService when Prometheus has just become
    # unhealthy, and stores the new status in the integration's
    # `health_status` column.
    class PrometheusHealthCheckService
      include Gitlab::Utils::StrongMemoize
      include Gitlab::Routing

      # @param cluster the cluster whose Prometheus integration is checked
      #   (presumably a Clusters::Cluster record — TODO confirm against callers)
      def initialize(cluster)
        @cluster = cluster
        @logger = Gitlab::AppJsonLogger.build
      end

      # Runs the health check.
      #
      # Returns nil without doing anything when the cluster has no Prometheus
      # integration or the integration is not enabled. Otherwise returns the
      # result of the last statement (the `update_columns` call, or nil when
      # the status did not change).
      #
      # @raise [RuntimeError] when the cluster is not a project-type cluster
      def execute
        raise 'Invalid cluster type. Only project types are allowed.' unless @cluster.project_type?

        # Safe navigation: a cluster without an integration is treated the
        # same as a disabled integration instead of raising NoMethodError.
        return unless prometheus_integration&.enabled

        project = @cluster.clusterable

        @logger.info(
          message: 'Prometheus health check',
          cluster_id: @cluster.id,
          newly_unhealthy: became_unhealthy?,
          currently_healthy: currently_healthy?,
          was_healthy: was_healthy?
        )

        send_notification(project) if became_unhealthy?

        prometheus_integration.update_columns(health_status: current_health_status) if health_changed?
      end

      private

      # Memoized Prometheus integration of the cluster (may be nil).
      def prometheus_integration
        strong_memoize(:prometheus_integration) { @cluster.integration_prometheus }
      end

      # @return [Symbol] :healthy or :unhealthy, based on the live probe
      def current_health_status
        currently_healthy? ? :healthy : :unhealthy
      end

      # Memoized result of asking the integration's Prometheus client whether
      # it is healthy, so the client is queried at most once per service
      # instance.
      def currently_healthy?
        strong_memoize(:currently_healthy) do
          prometheus_integration.prometheus_client.healthy?
        end
      end

      # True when the stored status was healthy or unknown and the live probe
      # now reports unhealthy. This is the condition that triggers an alert.
      def became_unhealthy?
        strong_memoize(:became_unhealthy) do
          !currently_healthy? && (was_healthy? || was_unknown?)
        end
      end

      # Memoized: whether the stored status is healthy.
      def was_healthy?
        strong_memoize(:was_healthy) { prometheus_integration.healthy? }
      end

      # Memoized: whether the stored status is unknown.
      def was_unknown?
        strong_memoize(:was_unknown) { prometheus_integration.unknown? }
      end

      # Whether the stored status differs from the live probe result.
      #
      # A plain `was_healthy? != currently_healthy?` comparison misses the
      # unknown -> unhealthy transition (both sides are false), which would
      # leave the stored status at unknown and make `became_unhealthy?` fire
      # again, with a fresh notification, on every subsequent run.
      def health_changed?
        return !was_healthy? if currently_healthy?

        # Unhealthy now: a change only if the stored status was healthy or unknown.
        became_unhealthy?
      end

      # Sends the "Prometheus is unhealthy" alert for +project+ using the
      # project's first active alert-management HTTP integration. When there
      # is none, nil is passed for both the token and the integration.
      def send_notification(project)
        payload = build_notification_payload(project)
        http_integration = project.alert_management_http_integrations.active.first

        Projects::Alerting::NotifyService
          .new(project, payload)
          .execute(http_integration&.token, http_integration)

        # NOTE(review): the return value of NotifyService#execute is not
        # inspected, so this line is logged even if the notification was
        # rejected — confirm whether that is intended.
        @logger.info(message: 'Successfully notified of Prometheus newly unhealthy', cluster_id: @cluster.id, project_id: project.id)
      end

      # Builds the alert payload: a title naming the cluster and a description
      # that links the cluster name to its page under the project.
      #
      # @return [Hash] with :title and :description keys
      def build_notification_payload(project)
        cluster_path = namespace_project_cluster_path(
          project_id: project.path,
          namespace_id: project.namespace.path,
          id: @cluster.id
        )

        {
          title: "Prometheus is Unhealthy. Cluster Name: #{@cluster.name}",
          description: "Prometheus is unhealthy for the cluster: [#{@cluster.name}](#{cluster_path}) attached to project #{project.name}."
        }
      end
    end
  end
end