2021-02-03 16:09:17 -05:00
|
|
|
# frozen_string_literal: true
|
|
|
|
|
2022-03-31 11:08:32 -04:00
|
|
|
require Rails.root.join('metrics_server', 'metrics_server')
|
2022-03-15 08:07:44 -04:00
|
|
|
|
2019-07-02 03:36:33 -04:00
|
|
|
# Keep separate directories for separate processes.
#
# Chooses the local directory for Prometheus multiprocess metric files; used by
# `prometheus_metrics_dir` when the `prometheus_multiproc_dir` environment variable is unset.
#
# @return [Object, nil] the result of `Rails.root.join` for
#   `tmp/prometheus_multiproc_dir` (with a `sidekiq` or `puma` subdirectory when running
#   under that runtime), or nil outside the development and test environments
def metrics_temp_dir
  # Only development and test get an implicit directory.
  return unless Rails.env.development? || Rails.env.test?

  if Gitlab::Runtime.sidekiq?
    Rails.root.join('tmp/prometheus_multiproc_dir/sidekiq')
  elsif Gitlab::Runtime.puma?
    Rails.root.join('tmp/prometheus_multiproc_dir/puma')
  else
    Rails.root.join('tmp/prometheus_multiproc_dir')
  end
end
|
|
|
|
|
2022-03-25 08:07:52 -04:00
|
|
|
# Directory used for Prometheus multiprocess metric files.
#
# The `prometheus_multiproc_dir` environment variable takes precedence whenever it is set;
# otherwise the value of `metrics_temp_dir` is used.
#
# @return [Object, nil] the environment variable's value, or whatever `metrics_temp_dir`
#   returns (which may be nil)
def prometheus_metrics_dir
  ENV.fetch('prometheus_multiproc_dir') { metrics_temp_dir }
end
|
|
|
|
|
2022-03-31 11:08:32 -04:00
|
|
|
# Whether the worker id reported by Prometheus::PidProvider is 'puma_master'.
#
# @return [Boolean]
def puma_master?
  Prometheus::PidProvider.worker_id == 'puma_master'
end
|
|
|
|
|
2022-03-31 11:08:32 -04:00
|
|
|
# Whether a dedicated process should run that serves Rails application metrics, as opposed
# to using a Rails controller.
#
# @return [Object] the value of the `monitoring.web_exporter.enabled` setting, returned as-is
def puma_dedicated_metrics_server?
  Settings.monitoring.web_exporter.enabled
end
|
|
|
|
|
|
|
|
if puma_master?
  # The following is necessary to ensure stale Prometheus metrics don't accumulate over time.
  # It needs to be done as early as possible to ensure new metrics aren't being deleted.
  #
  # Note that this should not happen for Sidekiq. Since Sidekiq workers are spawned from the
  # sidekiq-cluster script, we perform this cleanup in `sidekiq_cluster/cli.rb` instead,
  # since it must happen prior to any worker processes or the metrics server starting up.
  Prometheus::CleanupMultiprocDirService.new(prometheus_metrics_dir).execute

  # Runs after the cleanup above, with `force: true` passed explicitly.
  ::Prometheus::Client.reinitialize_on_pid_change(force: true)
end
|
|
|
|
|
2021-06-18 11:10:16 -04:00
|
|
|
# Configure the Prometheus client: where it logs, where it keeps its multiprocess files,
# and how it obtains the identifier of the current process.
::Prometheus::Client.configure do |config|
  config.logger = Gitlab::AppLogger

  config.multiprocess_files_dir = prometheus_metrics_dir

  # Passed as a Method object, so the client can call it whenever it needs the id.
  config.pid_provider = ::Prometheus::PidProvider.method(:worker_id)
end
|
2017-08-07 13:13:02 -04:00
|
|
|
|
2017-11-22 18:26:50 -05:00
|
|
|
# Insert the requests metrics middleware directly after Labkit's Rack middleware.
Gitlab::Application.configure do |config|
  # 0 should be Sentry to catch errors in this middleware
  config.middleware.insert_after(Labkit::Middleware::Rack, Gitlab::Metrics::RequestsRackMiddleware)
end
|
|
|
|
|
2022-03-07 10:22:51 -05:00
|
|
|
# Any actions beyond this check should only execute outside of tests, when running in an application
# context (i.e. not in the Rails console or rspec) and when users have enabled metrics.
return if Rails.env.test? || !Gitlab::Runtime.application? || !Gitlab::Metrics.prometheus_metrics_enabled?
|
|
|
|
|
|
|
|
# Hook registered through LifecycleEvents.on_master_start: publishes the version gauge and,
# under Puma, starts the samplers and (when enabled) the dedicated metrics server.
Gitlab::Cluster::LifecycleEvents.on_master_start do
  # Gauge labelled with the running version and revision, set to 1.
  Gitlab::Metrics.gauge(:deployments, 'GitLab Version', {}, :max).set({ version: Gitlab::VERSION, revision: Gitlab.revision }, 1)

  if Gitlab::Runtime.puma?
    [
      Gitlab::Metrics::Samplers::RubySampler,
      Gitlab::Metrics::Samplers::ThreadsSampler
    ].each { |sampler| sampler.instance(logger: Gitlab::AppLogger).start }

    Gitlab::Metrics::Samplers::PumaSampler.instance.start

    MetricsServer.start_for_puma if puma_dedicated_metrics_server?
  end

  Gitlab::Ci::Parsers.instrument!
rescue IOError => e
  # An IOError raised anywhere in this hook is reported and flagged instead of propagating.
  Gitlab::ErrorTracking.track_exception(e)
  Gitlab::Metrics.error_detected!
end
|
2019-10-02 17:06:22 -04:00
|
|
|
|
2022-03-07 10:22:51 -05:00
|
|
|
# Hook registered through LifecycleEvents.on_worker_start: re-initializes the Prometheus
# client if it supports that, then starts the samplers relevant to the current runtime.
Gitlab::Cluster::LifecycleEvents.on_worker_start do
  # Only call reinitialize_on_pid_change when the client actually defines it.
  defined?(::Prometheus::Client.reinitialize_on_pid_change) && ::Prometheus::Client.reinitialize_on_pid_change
  logger = Gitlab::AppLogger
  # Since we also run these samplers in the Puma primary, we need to re-create them each time we fork.
  # For Sidekiq, this does not make any difference, since there is no primary.
  [
    Gitlab::Metrics::Samplers::RubySampler,
    Gitlab::Metrics::Samplers::ThreadsSampler
  ].each { |sampler| sampler.initialize_instance(logger: logger, recreate: true).start }

  Gitlab::Metrics::Samplers::DatabaseSampler.initialize_instance(logger: logger).start

  if Gitlab::Runtime.puma?
    # Since we are observing a metrics server from the Puma primary, we would inherit
    # this supervision thread after forking into workers, so we need to explicitly stop it here.
    ::MetricsServer::PumaProcessSupervisor.instance.stop if puma_dedicated_metrics_server?

    Gitlab::Metrics::Samplers::ActionCableSampler.instance(logger: logger).start
  end

  if Gitlab.ee? && Gitlab::Runtime.sidekiq?
    Gitlab::Metrics::Samplers::GlobalSearchSampler.instance(logger: logger).start
  end

  Gitlab::Ci::Parsers.instrument!
rescue IOError => e
  # An IOError raised anywhere in this hook is reported and flagged instead of propagating.
  Gitlab::ErrorTracking.track_exception(e)
  Gitlab::Metrics.error_detected!
end
|
2019-10-04 02:06:05 -04:00
|
|
|
|
2022-03-31 11:08:32 -04:00
|
|
|
# Register the metrics server shutdown hooks only when running under Puma with the
# dedicated metrics server enabled.
if Gitlab::Runtime.puma? && puma_dedicated_metrics_server?
  Gitlab::Cluster::LifecycleEvents.on_before_graceful_shutdown do
    # We need to ensure that before we re-exec or shutdown server
    # we also stop the metrics server
    ::MetricsServer::PumaProcessSupervisor.instance.shutdown
  end

  Gitlab::Cluster::LifecycleEvents.on_before_master_restart do
    # We need to ensure that before we re-exec server
    # we also stop the metrics server
    #
    # We do it again, for being extra safe,
    # but it should not be needed
    ::MetricsServer::PumaProcessSupervisor.instance.shutdown
  end
end
|