usage_data.rb 19.6 KB
Newer Older
G
gfyoung 已提交
1 2
# frozen_string_literal: true

3 4 5
# To harden the usage ping and make it easier to add measures, the following helpers are in place:
#   * alt_usage_data method
#     handles StandardError and falls back to -1, so that not all measures fail if we encounter one exception
#
#     Examples:
#     alt_usage_data { Gitlab::VERSION }
#     alt_usage_data { Gitlab::CurrentSettings.uuid }
#
#   * redis_usage_data method
#     handles ::Redis::CommandError, Gitlab::UsageDataCounters::BaseCounter::UnknownEvent
#     returns -1 when a block is sent, or a hash with all values set to -1 when a counter is sent
#     (the behaviour differs because there are 2 different implementations of the redis counter)
#
#     Examples:
#     redis_usage_data(Gitlab::UsageDataCounters::WikiPageCounter)
#     redis_usage_data { ::Gitlab::UsageCounters::PodLogs.usage_totals[:total] }
19 20
module Gitlab
  class UsageData
21
    BATCH_SIZE = 100
22
    FALLBACK = -1
23

24
    class << self
25
      # Returns the usage data payload, stored in the Rails cache under the
      # 'usage_data' key with a two-week expiry.
      #
      # @param force_refresh [Boolean] forwarded to `Rails.cache.fetch` as `force:`
      # @return [Hash] the value produced by `uncached_data`
      def data(force_refresh: false)
        Rails.cache.fetch('usage_data', force: force_refresh, expires_in: 2.weeks) { uncached_data }
      end

      # Builds the complete usage payload without touching the cache.
      #
      # The sections are evaluated in the order listed: `license_usage_data`
      # runs first (it stamps `recorded_at`) and `recording_ce_finish_data`
      # runs last (it stamps `recording_ce_finished_at`). On key collisions
      # the later section wins.
      #
      # @return [Hash]
      def uncached_data
        license_usage_data.merge(
          system_usage_data,
          features_usage_data,
          components_usage_data,
          cycle_analytics_usage_data,
          object_store_usage_data,
          recording_ce_finish_data
        )
      end

41 42
      # Serialises the (possibly cached) usage payload by calling `to_json`
      # on the result of `data`.
      #
      # @param force_refresh [Boolean] passed through to `data`
      def to_json(force_refresh: false)
        data(force_refresh: force_refresh).to_json
      end

45
      # Instance-identifying section of the payload.
      #
      # `recorded_at` is deliberately the first entry so that the timestamp is
      # taken before any other value is computed. Most values are wrapped in
      # `alt_usage_data`, which substitutes its fallback if the block raises.
      #
      # @return [Hash{Symbol => Object}]
      def license_usage_data
        {
          recorded_at: Time.now, # should be calculated very first
          uuid: alt_usage_data { Gitlab::CurrentSettings.uuid },
          hostname: alt_usage_data { Gitlab.config.gitlab.host },
          version: alt_usage_data { Gitlab::VERSION },
          installation_type: alt_usage_data { installation_type },
          active_user_count: count(User.active),
          edition: 'CE'
        }
      end

57 58 59 60 61 62
      # Timestamp section merged last by `uncached_data`; it records when the
      # CE part of the payload finished being assembled.
      #
      # @return [Hash{Symbol => Time}]
      def recording_ce_finish_data
        { recording_ce_finished_at: Time.now }
      end

63
      # rubocop: disable Metrics/AbcSize
64
      # rubocop: disable CodeReuse/ActiveRecord
65
      # Instance-wide record counts, returned under the single `:counts` key.
      #
      # Each entry goes through `count` / `distinct_count`, which return
      # FALLBACK when the query raises ActiveRecord::StatementInvalid. The
      # literal counts are then merged with the service, Redis counter, user
      # preference, ModSecurity and container expiration policy sections.
      #
      # @return [Hash{Symbol => Hash}]
      def system_usage_data
        # Computed once: reported under both :incident_issues and :alert_bot_incident_issues.
        alert_bot_incident_count = count(::Issue.authored(::User.alert_bot))

        {
          counts: {
            assignee_lists: count(List.assignee),
            boards: count(Board),
            ci_builds: count(::Ci::Build),
            ci_internal_pipelines: count(::Ci::Pipeline.internal),
            ci_external_pipelines: count(::Ci::Pipeline.external),
            ci_pipeline_config_auto_devops: count(::Ci::Pipeline.auto_devops_source),
            ci_pipeline_config_repository: count(::Ci::Pipeline.repository_source),
            ci_runners: count(::Ci::Runner),
            ci_triggers: count(::Ci::Trigger),
            ci_pipeline_schedules: count(::Ci::PipelineSchedule),
            auto_devops_enabled: count(::ProjectAutoDevops.enabled),
            auto_devops_disabled: count(::ProjectAutoDevops.disabled),
            deploy_keys: count(DeployKey),
            deployments: count(Deployment),
            successful_deployments: count(Deployment.success),
            failed_deployments: count(Deployment.failed),
            environments: count(::Environment),
            clusters: count(::Clusters::Cluster),
            clusters_enabled: count(::Clusters::Cluster.enabled),
            project_clusters_enabled: count(::Clusters::Cluster.enabled.project_type),
            group_clusters_enabled: count(::Clusters::Cluster.enabled.group_type),
            instance_clusters_enabled: count(::Clusters::Cluster.enabled.instance_type),
            clusters_disabled: count(::Clusters::Cluster.disabled),
            project_clusters_disabled: count(::Clusters::Cluster.disabled.project_type),
            group_clusters_disabled: count(::Clusters::Cluster.disabled.group_type),
            instance_clusters_disabled: count(::Clusters::Cluster.disabled.instance_type),
            clusters_platforms_eks: count(::Clusters::Cluster.aws_installed.enabled),
            clusters_platforms_gke: count(::Clusters::Cluster.gcp_installed.enabled),
            clusters_platforms_user: count(::Clusters::Cluster.user_provided.enabled),
            clusters_applications_helm: count(::Clusters::Applications::Helm.available),
            clusters_applications_ingress: count(::Clusters::Applications::Ingress.available),
            clusters_applications_cert_managers: count(::Clusters::Applications::CertManager.available),
            clusters_applications_crossplane: count(::Clusters::Applications::Crossplane.available),
            clusters_applications_prometheus: count(::Clusters::Applications::Prometheus.available),
            clusters_applications_runner: count(::Clusters::Applications::Runner.available),
            clusters_applications_knative: count(::Clusters::Applications::Knative.available),
            clusters_applications_elastic_stack: count(::Clusters::Applications::ElasticStack.available),
            clusters_applications_jupyter: count(::Clusters::Applications::Jupyter.available),
            clusters_management_project: count(::Clusters::Cluster.with_management_project),
            in_review_folder: count(::Environment.in_review_folder),
            grafana_integrated_projects: count(GrafanaIntegration.enabled),
            groups: count(Group),
            issues: count(Issue),
            issues_created_from_gitlab_error_tracking_ui: count(SentryIssue),
            issues_with_associated_zoom_link: count(ZoomMeeting.added_to_issue),
            issues_using_zoom_quick_actions: distinct_count(ZoomMeeting, :issue_id),
            issues_with_embedded_grafana_charts_approx: grafana_embed_usage_data,
            issues_created_gitlab_alerts: count(Issue.with_alert_management_alerts.not_authored_by(::User.alert_bot)),
            incident_issues: alert_bot_incident_count,
            alert_bot_incident_issues: alert_bot_incident_count,
            incident_labeled_issues: count(::Issue.with_label_attributes(IncidentManagement::CreateIssueService::INCIDENT_LABEL)),
            keys: count(Key),
            label_lists: count(List.label),
            lfs_objects: count(LfsObject),
            milestone_lists: count(List.milestone),
            milestones: count(Milestone),
            pages_domains: count(PagesDomain),
            pool_repositories: count(PoolRepository),
            projects: count(Project),
            projects_imported_from_github: count(Project.where(import_type: 'github')),
            projects_with_repositories_enabled: count(ProjectFeature.where('repository_access_level > ?', ProjectFeature::DISABLED)),
            projects_with_error_tracking_enabled: count(::ErrorTracking::ProjectErrorTrackingSetting.where(enabled: true)),
            projects_with_alerts_service_enabled: count(AlertsService.active),
            projects_with_prometheus_alerts: distinct_count(PrometheusAlert, :project_id),
            projects_with_terraform_reports: distinct_count(::Ci::JobArtifact.terraform_reports, :project_id),
            projects_with_terraform_states: distinct_count(::Terraform::State, :project_id),
            protected_branches: count(ProtectedBranch),
            releases: count(Release),
            remote_mirrors: count(RemoteMirror),
            snippets: count(Snippet),
            suggestions: count(Suggestion),
            terraform_reports: count(::Ci::JobArtifact.terraform_reports),
            terraform_states: count(::Terraform::State),
            todos: count(Todo),
            uploads: count(Upload),
            web_hooks: count(WebHook),
            labels: count(Label),
            merge_requests: count(MergeRequest),
            notes: count(Note)
          }.merge(
            services_usage,
            usage_counters,
            user_preferences_usage,
            ingress_modsecurity_usage,
            container_expiration_policies_usage
          )
        }
      end
158
      # rubocop: enable CodeReuse/ActiveRecord
159
      # rubocop: enable Metrics/AbcSize
160

161
      # Cycle analytics section of the payload.
      #
      # NOTE(review): despite its name, `UsageData#to_json` is presumably
      # expected to return a Hash here, since the result is merged into the
      # payload by `uncached_data` — confirm against that class.
      #
      # @return [Hash] `{ avg_cycle_analytics: {} }` when the query raises
      #   ActiveRecord::StatementInvalid
      def cycle_analytics_usage_data
        Gitlab::CycleAnalytics::UsageData.new.to_json
      rescue ActiveRecord::StatementInvalid
        { avg_cycle_analytics: {} }
      end

167 168 169 170 171 172 173 174
      # rubocop:disable CodeReuse/ActiveRecord
      # Counts issues whose description contains the Grafana URL of an
      # enabled Grafana integration on the same project (joined on project_id).
      # The payload reports this as an approximate figure.
      def grafana_embed_usage_data
        issues_mentioning_grafana = Issue
          .joins('JOIN grafana_integrations USING (project_id)')
          .where("issues.description LIKE '%' || grafana_integrations.grafana_url || '%'")
          .where(grafana_integrations: { enabled: true })

        count(issues_mentioning_grafana)
      end
      # rubocop: enable CodeReuse/ActiveRecord

175 176 177 178 179 180
      # Feature-toggle section of the payload; in this file it simply returns
      # `features_usage_data_ce`.
      # NOTE(review): presumably kept separate so the EE module prepended at
      # the bottom of the file can extend it — confirm.
      def features_usage_data
        features_usage_data_ce
      end

      # Reports which instance-level features are switched on.
      #
      # Every lookup is wrapped in `alt_usage_data`, so a failing setting or
      # feature-flag lookup yields the fallback value for that key instead of
      # aborting the whole payload.
      #
      # @return [Hash{Symbol => Object}]
      def features_usage_data_ce
        {
          container_registry_enabled: alt_usage_data { Gitlab.config.registry.enabled },
          # `try` + `&.` keep this nil when the dependency_proxy section is absent.
          dependency_proxy_enabled: alt_usage_data { Gitlab.config.try(:dependency_proxy)&.enabled },
          gitlab_shared_runners_enabled: alt_usage_data { Gitlab.config.gitlab_ci.shared_runners_enabled },
          gravatar_enabled: alt_usage_data { Gitlab::CurrentSettings.gravatar_enabled? },
          ldap_enabled: alt_usage_data { Gitlab.config.ldap.enabled },
          mattermost_enabled: alt_usage_data { Gitlab.config.mattermost.enabled },
          omniauth_enabled: alt_usage_data { Gitlab::Auth.omniauth_enabled? },
          prometheus_metrics_enabled: alt_usage_data { Gitlab::Metrics.prometheus_metrics_enabled? },
          reply_by_email_enabled: alt_usage_data { Gitlab::IncomingEmail.enabled? },
          signup_enabled: alt_usage_data { Gitlab::CurrentSettings.allow_signup? },
          web_ide_clientside_preview_enabled: alt_usage_data { Gitlab::CurrentSettings.web_ide_clientside_preview_enabled? },
          ingress_modsecurity_enabled: alt_usage_data { Feature.enabled?(:ingress_modsecurity) },
          grafana_link_enabled: alt_usage_data { Gitlab::CurrentSettings.grafana_enabled? }
        }
      end
196

A
Alex Kalderimis 已提交
197
      # Merges the result of `redis_usage_data` for every counter listed in
      # `usage_data_counters` into one flat hash (later counters win on
      # duplicate keys).
      #
      # @return [Hash<Symbol, Integer>]
      def usage_counters
        usage_data_counters.each_with_object({}) do |counter, totals|
          totals.merge!(redis_usage_data(counter))
        end
      end

      # The counter classes whose totals `usage_counters` folds into the payload.
      #
      # @return [Array<#totals>] An array of objects that respond to `#totals`
      def usage_data_counters
        [
          Gitlab::UsageDataCounters::WikiPageCounter,
          Gitlab::UsageDataCounters::WebIdeCounter,
          Gitlab::UsageDataCounters::NoteCounter,
          Gitlab::UsageDataCounters::SnippetCounter,
          Gitlab::UsageDataCounters::SearchCounter,
          Gitlab::UsageDataCounters::CycleAnalyticsCounter,
          Gitlab::UsageDataCounters::ProductivityAnalyticsCounter,
          Gitlab::UsageDataCounters::SourceCodeCounter,
          Gitlab::UsageDataCounters::MergeRequestCounter,
          Gitlab::UsageDataCounters::DesignsCounter
        ]
      end

218 219
      # Versions and basic settings of the components GitLab runs on.
      #
      # Each lookup is wrapped in `alt_usage_data`, so an unavailable
      # component reports the fallback value rather than raising. The app
      # server type comes from `app_server_type`, which has its own rescue.
      #
      # @return [Hash{Symbol => Hash}]
      def components_usage_data
        {
          git: { version: alt_usage_data { Gitlab::Git.version } },
          gitaly: {
            version: alt_usage_data { Gitaly::Server.all.first.server_version },
            servers: alt_usage_data { Gitaly::Server.count },
            filesystems: alt_usage_data { Gitaly::Server.filesystems }
          },
          gitlab_pages: {
            enabled: alt_usage_data { Gitlab.config.pages.enabled },
            version: alt_usage_data { Gitlab::Pages::VERSION }
          },
          database: {
            adapter: alt_usage_data { Gitlab::Database.adapter_name },
            version: alt_usage_data { Gitlab::Database.version }
          },
          app_server: { type: app_server_type }
        }
      end
237

238 239 240 241 242 243 244 245
      # Name of the runtime reported by `Gitlab::Runtime.identify`, as a String.
      #
      # If identification raises Gitlab::Runtime::IdentificationError, the
      # error is logged and tracked, and a placeholder string is returned.
      #
      # @return [String]
      def app_server_type
        Gitlab::Runtime.identify.to_s
      rescue Gitlab::Runtime::IdentificationError => identification_error
        Gitlab::AppLogger.error(identification_error.message)
        Gitlab::ErrorTracking.track_exception(identification_error)

        'unknown_app_server_type'
      end

246 247 248 249 250 251 252 253 254 255 256 257 258 259 260 261 262 263 264 265 266 267 268 269 270 271 272 273 274 275 276 277 278 279
      # Summarises the settings of one storage component.
      #
      # @param component [String] key into `Settings`, e.g. 'artifacts'
      # @return [Hash] always contains `:enabled`; contains `:object_store`
      #   only when the component has a truthy 'object_store' section
      def object_store_config(component)
        # A nil fallback (instead of FALLBACK) lets a failed lookup read as "no object store section".
        store_settings = alt_usage_data(fallback: nil) { Settings[component]['object_store'] }
        summary = { enabled: alt_usage_data { Settings[component]['enabled'] } }
        return summary unless store_settings

        summary.merge(
          object_store: {
            enabled: alt_usage_data { store_settings['enabled'] },
            direct_upload: alt_usage_data { store_settings['direct_upload'] },
            background_upload: alt_usage_data { store_settings['background_upload'] },
            provider: alt_usage_data { store_settings['connection']['provider'] }
          }
        )
      end

      # Object storage section of the payload: one `object_store_config`
      # summary per storage component, keyed by component name.
      #
      # @return [Hash{Symbol => Hash}]
      def object_store_usage_data
        components = %w[artifacts external_diffs lfs uploads packages]

        summaries = components.each_with_object({}) do |component, by_name|
          by_name[component.to_sym] = object_store_config(component)
        end

        { object_store: summaries }
      end

280
      ##
      # This method measures usage of the Modsecurity Web Application Firewall across the entire
      # instance's deployed environments.
      #
      # NOTE: this service is an approximation as it does not yet take into account if environment
      # is enabled and only measures applications installed using GitLab Managed Apps (disregards
      # CI-based managed apps).
      #
      # More details: https://gitlab.com/gitlab-org/gitlab/-/merge_requests/28331#note_318621786
      #
      # Each figure is a distinct count of `deployments.environment_id` over the
      # scope returned by `successful_deployments_with_cluster`.
      ##
      def ingress_modsecurity_usage
        column = ::Deployment.arel_table[:environment_id]

        {
          ingress_modsecurity_logging: distinct_count(successful_deployments_with_cluster(::Clusters::Applications::Ingress.modsecurity_enabled.logging), column),
          ingress_modsecurity_blocking: distinct_count(successful_deployments_with_cluster(::Clusters::Applications::Ingress.modsecurity_enabled.blocking), column),
          ingress_modsecurity_disabled: distinct_count(successful_deployments_with_cluster(::Clusters::Applications::Ingress.modsecurity_disabled), column),
          ingress_modsecurity_not_installed: distinct_count(successful_deployments_with_cluster(::Clusters::Applications::Ingress.modsecurity_not_installed), column)
        }
      end

301 302 303 304 305 306 307 308 309 310 311 312 313 314 315 316 317 318 319 320 321 322 323
      # rubocop: disable CodeReuse/ActiveRecord
      # Distinct project counts for container expiration policies: disabled,
      # enabled, enabled per configured option value, and enabled with
      # `keep_n` / `older_than` left unset.
      #
      # Every count is bounded by the minimum and maximum project id, which
      # are looked up once and passed as `start:` / `finish:`.
      #
      # @return [Hash{Symbol => Object}]
      def container_expiration_policies_usage
        id_bounds = { start: ::Project.minimum(:id), finish: ::Project.maximum(:id) }
        projects_in = ->(scope) { distinct_count(scope, :project_id, **id_bounds) }

        usage = {}
        usage[:projects_with_expiration_policy_disabled] = projects_in.call(::ContainerExpirationPolicy.where(enabled: false))

        enabled_policies = ::ContainerExpirationPolicy.active
        usage[:projects_with_expiration_policy_enabled] = projects_in.call(enabled_policies)

        %i[keep_n cadence older_than].each do |option|
          choices = ::ContainerExpirationPolicy.public_send("#{option}_options") # rubocop: disable GitlabSecurity/PublicSend

          choices.keys.each do |value|
            usage[:"projects_with_expiration_policy_enabled_with_#{option}_set_to_#{value}"] = projects_in.call(enabled_policies.where(option => value))
          end
        end

        %i[keep_n older_than].each do |option|
          usage[:"projects_with_expiration_policy_enabled_with_#{option}_unset"] = projects_in.call(enabled_policies.where(option => nil))
        end

        usage
      end
      # rubocop: enable CodeReuse/ActiveRecord

324
      # rubocop: disable CodeReuse/ActiveRecord
325
      # Counts active, non-template services per service type, then appends
      # the Jira and Jira-import figures.
      #
      # Jira is excluded from the generic loop because `jira_usage` reports it
      # separately (split into server and cloud).
      #
      # @return [Hash{Symbol => Object}]
      def services_usage
        results = Service.available_services_names.without('jira').each_with_object({}) do |service_name, response|
          response["projects_#{service_name}_active".to_sym] = count(Service.active.where(template: false, type: "#{service_name}_service".camelize))
        end

        # Keep old Slack keys for backward compatibility, https://gitlab.com/gitlab-data/analytics/issues/3241
        results[:projects_slack_notifications_active] = results[:projects_slack_active]
        results[:projects_slack_slash_active] = results[:projects_slack_slash_commands_active]

        results.merge(jira_usage).merge(jira_import_usage)
      end

      # Counts active Jira services, split into Jira Cloud and Jira Server.
      #
      # Services are loaded in batches of BATCH_SIZE. If the query raises
      # ActiveRecord::StatementInvalid, all three figures are reported as
      # FALLBACK.
      #
      # @return [Hash{Symbol => Integer}]
      def jira_usage
        # Jira Cloud does not support custom domains as per https://jira.atlassian.com/browse/CLOUD-6999
        # so we can just check for subdomains of atlassian.net

        results = {
          projects_jira_server_active: 0,
          projects_jira_cloud_active: 0,
          projects_jira_active: 0
        }

        Service.active
          .by_type(:JiraService)
          .includes(:jira_tracker_data)
          .find_in_batches(batch_size: BATCH_SIZE) do |services|
          # Services without any URL count as server installs.
          cloud, server = services.partition do |service|
            # TODO: Simplify as part of https://gitlab.com/gitlab-org/gitlab/issues/29404
            service_url = service.data_fields&.url || (service.properties && service.properties['url'])
            service_url&.include?('.atlassian.net')
          end

          results[:projects_jira_server_active] += server.size
          results[:projects_jira_cloud_active] += cloud.size
          results[:projects_jira_active] += services.size
        end

        results
      rescue ActiveRecord::StatementInvalid
        { projects_jira_server_active: FALLBACK, projects_jira_cloud_active: FALLBACK, projects_jira_active: FALLBACK }
      end
366 367 368 369 370 371 372

      # Narrows `scope` to rows whose cluster is enabled and has at least one
      # successful deployment, by joining cluster -> deployments and merging
      # the `Clusters::Cluster.enabled` and `Deployment.success` scopes.
      #
      # @param scope [#joins] relation with a `cluster` association
      def successful_deployments_with_cluster(scope)
        with_deployments = scope.joins(cluster: :deployments)
        on_enabled_clusters = with_deployments.merge(Clusters::Cluster.enabled)

        on_enabled_clusters.merge(Deployment.success)
      end
373
      # rubocop: enable CodeReuse/ActiveRecord
374

375 376 377 378 379 380 381 382 383 384
      # Figures about finished Jira imports: number of imports, number of
      # distinct projects, and the value of
      # `JiraImportState.finished_imports_count` (fallback-protected).
      #
      # @return [Hash{Symbol => Object}]
      def jira_import_usage
        finished = JiraImportState.finished

        imports_total = count(finished)
        projects_total = distinct_count(finished, :project_id)
        issues_total = alt_usage_data { JiraImportState.finished_imports_count }

        {
          jira_imports_total_imported_count: imports_total,
          jira_imports_projects_count: projects_total,
          jira_imports_total_imported_issues_count: issues_total
        }
      end

385 386 387 388
      # User-preference figures merged into the `:counts` section by
      # `system_usage_data`. Returns an empty hash here.
      #
      # @return [Hash]
      def user_preferences_usage
        {} # augmented in EE
      end

389
      # Counts the rows of `relation`.
      #
      # Uses `Gitlab::Database::BatchCount.batch_count` when `batch` is true
      # and the `:usage_ping_batch_counter` feature flag is enabled; otherwise
      # calls `relation.count` directly (ignoring `column`, `start`, `finish`).
      #
      # @param relation [#count] the scope to count
      # @param column [Symbol, nil] forwarded to the batch counter
      # @param batch [Boolean] set to false to always use `relation.count`
      # @param start [Integer, nil] forwarded to the batch counter
      # @param finish [Integer, nil] forwarded to the batch counter
      # @return [Integer] FALLBACK when the query raises ActiveRecord::StatementInvalid
      def count(relation, column = nil, batch: true, start: nil, finish: nil)
        if batch && Feature.enabled?(:usage_ping_batch_counter, default_enabled: true)
          Gitlab::Database::BatchCount.batch_count(relation, column, start: start, finish: finish)
        else
          relation.count
        end
      rescue ActiveRecord::StatementInvalid
        FALLBACK
      end

399
      # Counts the distinct values of `column` within `relation`.
      #
      # Uses `Gitlab::Database::BatchCount.batch_distinct_count` when `batch`
      # is true and the `:usage_ping_batch_counter` feature flag is enabled;
      # otherwise calls `relation.distinct_count_by(column)`.
      #
      # @param relation [#distinct_count_by] the scope to count
      # @param column [Symbol, Object, nil] column whose distinct values are counted
      # @param batch [Boolean] set to false to skip the batch counter
      # @param start [Integer, nil] forwarded to the batch counter
      # @param finish [Integer, nil] forwarded to the batch counter
      # @return [Integer] FALLBACK when the query raises ActiveRecord::StatementInvalid
      def distinct_count(relation, column = nil, batch: true, start: nil, finish: nil)
        if batch && Feature.enabled?(:usage_ping_batch_counter, default_enabled: true)
          Gitlab::Database::BatchCount.batch_distinct_count(relation, column, start: start, finish: finish)
        else
          relation.distinct_count_by(column)
        end
      rescue ActiveRecord::StatementInvalid
        FALLBACK
      end
408

409
      # Evaluates a measure defensively so one failing measure cannot break
      # the whole payload.
      #
      # @param value [Object] returned as-is when no block is given
      # @param fallback [Object] returned when evaluation raises a StandardError
      # @yield the measure to evaluate; takes precedence over `value`
      # @return [Object] the block result, `value`, or `fallback`
      def alt_usage_data(value = nil, fallback: FALLBACK, &block)
        if block_given?
          yield
        else
          value
        end
      rescue StandardError
        fallback
      end

419 420 421 422 423 424 425 426
      # Reads Redis-backed usage figures, either from a block or from a counter.
      #
      # A block takes precedence and is run through `redis_usage_counter`;
      # otherwise a present `counter` is passed to `redis_usage_data_totals`.
      #
      # @param counter [#totals, nil] counter to read totals from
      # @return [Object, nil] nil when neither a block nor a counter is given
      def redis_usage_data(counter = nil, &block)
        return redis_usage_counter(&block) if block_given?

        redis_usage_data_totals(counter) if counter.present?
      end

427 428
      private

429 430 431
      # Runs the given block and returns its result, or FALLBACK when it
      # raises ::Redis::CommandError or an unknown counter event error.
      # Any other exception propagates to the caller.
      def redis_usage_counter
        yield
      rescue ::Redis::CommandError, Gitlab::UsageDataCounters::BaseCounter::UnknownEvent
        FALLBACK
      end

      # Returns `counter.totals`, or `counter.fallback_totals` when reading
      # the totals raises ::Redis::CommandError or an unknown counter event
      # error. Any other exception propagates to the caller.
      #
      # @param counter [#totals, #fallback_totals]
      def redis_usage_data_totals(counter)
        counter.totals
      rescue ::Redis::CommandError, Gitlab::UsageDataCounters::BaseCounter::UnknownEvent
        counter.fallback_totals
      end

441 442 443 444 445 446 447
      # Reports how this instance was installed: `Gitlab::INSTALLATION_TYPE`
      # in the production environment, a fixed development-kit label otherwise.
      #
      # @return [String]
      def installation_type
        return Gitlab::INSTALLATION_TYPE if Rails.env.production?

        "gitlab-development-kit"
      end
448 449 450
    end
  end
end
451 452

# NOTE(review): presumably prepends the EE module (when it is available) so its
# overrides run before the CE methods defined above — confirm against `prepend_if_ee`.
Gitlab::UsageData.prepend_if_ee('EE::Gitlab::UsageData')