repository.rb 31.0 KB
Newer Older
1 2
require 'securerandom'

3
class Repository
L
Lin Jen-Shin 已提交
4 5 6
  # Names used for the special refs this class refers to.
  REF_MERGE_REQUEST = 'merge-requests'.freeze
  REF_KEEP_AROUND = 'keep-around'.freeze
  REF_ENVIRONMENTS = 'environments'.freeze

  # Reserved ref names. Every name is listed exactly once.
  # NOTE(review): REF_MERGE_REQUEST is not part of this list -- confirm whether
  # that is intentional before adding it.
  RESERVED_REFS_NAMES = %W[
    heads
    tags
    #{REF_ENVIRONMENTS}
    #{REF_KEEP_AROUND}
  ].freeze

16
  include Gitlab::ShellAdapter
  include RepositoryMirroring

  attr_accessor :full_path, :disk_path, :project

  delegate :ref_name_for_sha, to: :raw_repository

  # Raised by #revert and #cherry_pick when no tree could be produced.
  CreateTreeError = Class.new(StandardError)
24

25 26 27 28 29 30
  # Methods that cache data from the Git repository.
  #
  # Each entry in this Array should have a corresponding method with the exact
  # same name. The cache key used by those methods must also match method's
  # name.
  #
  # For example, for entry `:commit_count` there's a method called `commit_count` which
  # stores its data in the `commit_count` cache key.
  CACHED_METHODS = %i(size commit_count rendered_readme contribution_guide
                      changelog license_blob license_key gitignore koding_yml
                      gitlab_ci_yml branch_names tag_names branch_count
                      tag_count avatar exists? empty? root_ref).freeze
37 38 39 40 41

  # Certain method caches should be refreshed when certain types of files are
  # changed. This Hash maps file types (as returned by Gitlab::FileDetector) to
  # the corresponding methods to call for refreshing caches.
  #
  # A value is either a single method name or an Array of method names.
  METHOD_CACHES_FOR_FILE_TYPES = {
    readme: :rendered_readme,
    changelog: :changelog,
    license: %i(license_blob license_key license),
    contributing: :contribution_guide,
    gitignore: :gitignore,
    koding: :koding_yml,
    gitlab_ci: :gitlab_ci_yml,
    avatar: :avatar
  }.freeze
51 52 53 54 55

  # Wraps around the given method and caches its output in Redis and an instance
  # variable.
  #
  # This only works for methods that do not take any arguments.
  #
  # name         - Name of an instance method that is already defined.
  # fallback     - Forwarded unchanged to `cache_method_output`.
  # memoize_only - Forwarded unchanged to `cache_method_output`.
  def self.cache_method(name, fallback: nil, memoize_only: false)
    original = :"_uncached_#{name}"

    # Keep the original implementation reachable under the aliased name so the
    # replacement defined below can still call it.
    alias_method(original, name)

    define_method(name) do
      cache_method_output(name, fallback: fallback, memoize_only: memoize_only) do
        __send__(original) # rubocop:disable GitlabSecurity/PublicSend
      end
    end
  end
67

68
  # full_path - Stored as `full_path`.
  # project   - Stored as `project`.
  # disk_path - Stored as `disk_path`; falls back to `full_path` when nil.
  def initialize(full_path, project, disk_path: nil)
    @full_path = full_path
    @disk_path = disk_path || full_path
    @project = project
  end
73

74
  # Two repositories are equal when they share the same disk path.
  #
  # Returns false, instead of raising NoMethodError, when `other` is not a
  # repository (for example `repository == nil`).
  def ==(other)
    other.is_a?(self.class) && @disk_path == other.disk_path
  end

78
  # Returns the memoized result of `initialize_raw_repository`, or nil when
  # this repository has no `full_path`.
  def raw_repository
    return nil unless full_path

    @raw_repository ||= initialize_raw_repository
  end

84 85
  alias_method :raw, :raw_repository

86
  # Return absolute path to repository
  #
  # The path is `disk_path` with a `.git` suffix, joined onto
  # `repository_storage_path` and expanded. The result is memoized.
  def path_to_repo
    @path_to_repo ||= File.expand_path(
      File.join(repository_storage_path, disk_path + '.git')
    )
  end

93 94 95 96 97 98
  # Defined here because the equivalent in ::Git is not cached, while this
  # method is called several times per request.
  #
  # Returns true when the repository has at least one branch.
  def has_visible_content?
    branch_count.positive?
  end

99 100 101 102
  def inspect
    "#<#{self.class.name}:#{@disk_path}>"
  end

L
Lin Jen-Shin 已提交
103
  # Finds a commit and wraps it in a ::Commit for this project.
  #
  # ref - A ref/SHA to look up, or a Gitlab::Git::Commit that is used as is.
  #
  # Returns nil when the repository does not exist, when nothing is found, or
  # when the lookup raises Rugged::OdbError / Rugged::TreeError.
  def commit(ref = 'HEAD')
    return nil unless exists?

    commit =
      if ref.is_a?(Gitlab::Git::Commit)
        ref
      else
        Gitlab::Git::Commit.find(raw_repository, ref)
      end

    commit = ::Commit.new(commit, @project) if commit
    commit
  rescue Rugged::OdbError, Rugged::TreeError
    nil
  end

119
  # Lists commits for `ref` through Gitlab::Git::Commit.where and decorates
  # them for this project.
  #
  # `follow` is only enabled when exactly one path is given.
  def commits(ref, path: nil, limit: nil, offset: nil, skip_merges: false, after: nil, before: nil)
    options = {
      repo: raw_repository,
      ref: ref,
      path: path,
      limit: limit,
      offset: offset,
      after: after,
      before: before,
      follow: Array(path).length == 1,
      skip_merges: skip_merges
    }

    commits = Gitlab::Git::Commit.where(options)
    commits = Commit.decorate(commits, @project) if commits.present?
    commits
  end

137 138
  # Returns the result of Gitlab::Git::Commit.between for `from` and `to`,
  # decorated for this project when it is not blank.
  def commits_between(from, to)
    commits = Gitlab::Git::Commit.between(raw_repository, from, to)
    commits = Commit.decorate(commits, @project) if commits.present?
    commits
  end

J
Jacob Vosmaer 已提交
143
  # Gitaly migration: https://gitlab.com/gitlab-org/gitaly/issues/384
  #
  # Returns an empty Array when the repository does not exist, has no visible
  # content, or when `query` is blank. Otherwise the lookup is dispatched to
  # the Gitaly or the shell-out implementation.
  def find_commits_by_message(query, ref = nil, path = nil, limit = 1000, offset = 0)
    return [] unless exists? && has_visible_content? && query.present?

    raw_repository.gitaly_migrate(:commits_by_message) do |is_enabled|
      if is_enabled
        find_commits_by_message_by_gitaly(query, ref, path, limit, offset)
      else
        find_commits_by_message_by_shelling_out(query, ref, path, limit, offset)
      end
    end
  end

158 159 160 161 162 163 164
  # Looks up a branch by name.
  #
  # fresh_repo - When true (the default) a new raw repository is instantiated
  #              for the lookup instead of reusing the memoized one.
  def find_branch(name, fresh_repo: true)
    # Since the Repository object may have in-memory index changes, invalidating the memoized Repository object may
    # cause unintended side effects. Because finding a branch is a read-only operation, we can safely instantiate
    # a new repo here to ensure a consistent state to avoid a libgit2 bug where concurrent access (e.g. via git gc)
    # may cause the branch to "disappear" erroneously or have the wrong SHA.
    #
    # See: https://github.com/libgit2/libgit2/issues/1534 and https://gitlab.com/gitlab-org/gitlab-ce/issues/15392
    raw_repo = fresh_repo ? initialize_raw_repository : raw_repository

    raw_repo.find_branch(name)
  end

  # Returns the first tag whose name equals `name`, or nil.
  def find_tag(name)
    tags.find { |tag| tag.name == name }
  end

174
  # Creates `branch_name` pointing at `ref` and runs the branch-creation hook.
  #
  # Returns the created branch, or false when the raw repository raises
  # Gitlab::Git::Repository::InvalidRef.
  def add_branch(user, branch_name, ref)
    branch = raw_repository.add_branch(branch_name, user: user, target: ref)

    after_create_branch

    branch
  rescue Gitlab::Git::Repository::InvalidRef
    false
  end

184
  # Creates a tag through the raw repository.
  #
  # Returns whatever the raw repository returns, or false when it raises
  # Gitlab::Git::Repository::InvalidRef.
  def add_tag(user, tag_name, target, message = nil)
    raw_repository.add_tag(tag_name, user: user, target: target, message: message)
  rescue Gitlab::Git::Repository::InvalidRef
    false
  end

190
  # Removes a branch, running the before/after removal hooks around it.
  #
  # Returns true.
  def rm_branch(user, branch_name)
    before_remove_branch

    raw_repository.rm_branch(branch_name, user: user)

    after_remove_branch
    true
  end

L
Lin Jen-Shin 已提交
199
  # Removes a tag, running the before/after removal hooks around it.
  #
  # Returns true.
  def rm_tag(user, tag_name)
    before_remove_tag

    raw_repository.rm_tag(tag_name, user: user)

    after_remove_tag
    true
  end

208 209 210 211
  # All branch names followed by all tag names, as a new Array.
  def ref_names
    branch_names.dup.concat(tag_names)
  end

212
  # Whether `branch_name` exists, memoized per branch name.
  #
  # Returns false when there is no raw repository.
  def branch_exists?(branch_name)
    return false unless raw_repository

    # The Hash default block performs the lookup once per name and stores it.
    @branch_exists_memo ||= Hash.new do |hash, key|
      hash[key] = raw_repository.branch_exists?(key)
    end

    @branch_exists_memo[branch_name]
  end

222
  # Whether `ref` exists in the raw repository.
  #
  # Returns false when there is no raw repository or when the lookup raises
  # ArgumentError.
  def ref_exists?(ref)
    !!raw_repository&.ref_exists?(ref)
  rescue ArgumentError
    false
  end

D
Douwe Maan 已提交
228 229 230 231
  # Makes sure a commit is kept around when Git garbage collection runs.
  # Git GC will delete commits from the repository that are no longer in any
  # branches or tags, but we want to keep some of these commits around, for
  # example if they have comments or CI builds.
  #
  # Does nothing when `sha` is nil, when the commit cannot be found, or when a
  # keep-around ref already exists for it.
  def keep_around(sha)
    return unless sha && commit(sha)

    return if kept_around?(sha)

    # This will still fail if the file is corrupted (e.g. 0 bytes)
    begin
      write_ref(keep_around_ref_name(sha), sha)
    rescue Rugged::ReferenceError => ex
      Rails.logger.error "Unable to create #{REF_KEEP_AROUND} reference for repository #{path}: #{ex}"
    rescue Rugged::OSError => ex
      # Only the "locked file already exists" failure is logged; any other
      # OS error is re-raised.
      raise unless ex.message =~ /Failed to create locked file/ && ex.message =~ /File exists/

      Rails.logger.error "Unable to create #{REF_KEEP_AROUND} reference for repository #{path}: #{ex}"
    end
  end

  # Whether the keep-around ref for `sha` already exists.
  def kept_around?(sha)
    ref_exists?(keep_around_ref_name(sha))
  end
251

252 253 254 255
  # Creates the reference `ref_path` pointing at `sha`, passing `force: true`.
  def write_ref(ref_path, sha)
    references = rugged.references
    references.create(ref_path, sha, force: true)
  end

256
  # Number of commits `branch` is behind and ahead of the root ref.
  #
  # The result is cached per branch name. The root ref is only resolved when
  # the cache has to be filled, so a cache hit performs no repository lookup.
  #
  # Returns a Hash with the keys :behind and :ahead.
  def diverging_commit_counts(branch)
    cache.fetch(:"diverging_commit_counts_#{branch.name}") do
      # Rugged seems to throw a `ReferenceError` when given branch_names rather
      # than SHA-1 hashes
      root_ref_hash = raw_repository.rev_parse_target(root_ref).oid
      branch_sha = branch.dereferenced_target.sha

      number_commits_behind = raw_repository
        .count_commits_between(branch_sha, root_ref_hash)

      number_commits_ahead = raw_repository
        .count_commits_between(root_ref_hash, branch_sha)

      { behind: number_commits_behind, ahead: number_commits_ahead }
    end
  end
270

271 272 273
  # Expires the cached tag names/count and drops the memoized tag list.
  def expire_tags_cache
    expire_method_caches(%i(tag_names tag_count))
    @tags = nil
  end
275

276 277 278
  # Expires the cached branch names/count and drops the memoized branch list
  # and the per-branch existence memo.
  def expire_branches_cache
    expire_method_caches(%i(branch_names branch_count))
    @local_branches = nil
    @branch_exists_memo = nil
  end

282 283
  # Expires the cached repository size and commit count.
  def expire_statistics_caches
    expire_method_caches(%i(size commit_count))
  end

286 287
  # Expires the caches of every method listed in CACHED_METHODS.
  def expire_all_method_caches
    expire_method_caches(CACHED_METHODS)
  end

290 291 292 293 294 295 296 297 298
  # Expires the caches of a specific set of methods
  #
  # methods - An Array of method names. For each one the cache entry with that
  #           key is expired and the matching instance variable is removed
  #           when it is set.
  def expire_method_caches(methods)
    methods.each do |key|
      cache.expire(key)

      ivar = cache_instance_variable_name(key)

      remove_instance_variable(ivar) if instance_variable_defined?(ivar)
    end
  end

301 302 303 304 305 306 307 308 309 310 311 312 313 314 315
  # Expires the cached value of #avatar.
  def expire_avatar_cache
    expire_method_caches(%i(avatar))
  end

  # Refreshes the method caches of this repository.
  #
  # types - An Array of file types (e.g. `:readme`) used to refresh extra
  #         caches.
  #
  # Types without an entry in METHOD_CACHES_FOR_FILE_TYPES are ignored. The
  # selected caches are expired first and then filled again by calling each
  # method once.
  def refresh_method_caches(types)
    to_refresh = []

    types.each do |type|
      methods = METHOD_CACHES_FOR_FILE_TYPES[type.to_sym]

      to_refresh.concat(Array(methods)) if methods
    end

    expire_method_caches(to_refresh)

    to_refresh.each { |method| send(method) } # rubocop:disable GitlabSecurity/PublicSend
  end
322

323 324 325 326 327 328 329
  # Expires the per-branch `diverging_commit_counts_*` and `commit_count_*`
  # cache entries.
  #
  # branch_name - The branch that changed. When nil or equal to the root ref,
  #               the entries of every branch are expired.
  def expire_branch_cache(branch_name = nil)
    names =
      if !branch_name || branch_name == root_ref
        # When we push to the root branch we have to flush the cache for all
        # other branches as their statistics are based on the commits relative
        # to the root branch.
        branches.map(&:name)
      else
        # In case a commit is pushed to a non-root branch we only have to flush
        # the cache for said branch.
        [branch_name]
      end

    names.each do |name|
      cache.expire(:"diverging_commit_counts_#{name}")
      cache.expire(:"commit_count_#{name}")
    end
  end

340
  # Expires the cached value of #root_ref.
  def expire_root_ref_cache
    expire_method_caches(%i(root_ref))
  end

344 345
  # Expires the cache(s) used to determine if a repository is empty or not.
  #
  # Nothing is expired unless the repository currently reports itself as empty.
  def expire_emptiness_caches
    return unless empty?

    expire_method_caches(%i(empty?))
  end

351 352 353 354
  # Memoized Hash used by #method_missing to store `lookup` results.
  def lookup_cache
    @lookup_cache ||= {}
  end

355
  # Expires the cached value of #exists?.
  def expire_exists_cache
    expire_method_caches(%i(exists?))
  end

359 360 361 362 363 364 365
  # expire cache that doesn't depend on repository data (when expiring)
  #
  # Covers the tag, branch, root ref, emptiness, existence and statistics
  # caches, in that order.
  def expire_content_cache
    expire_tags_cache
    expire_branches_cache
    expire_root_ref_cache
    expire_emptiness_caches
    expire_exists_cache
    expire_statistics_caches
  end

  # Runs code after a repository has been created.
  def after_create
    expire_exists_cache
    expire_root_ref_cache
    expire_emptiness_caches

    repository_event(:create_repository)
  end

378 379
  # Runs code just before a repository is deleted.
  #
  # The branch cache is only expired when the repository still exists.
  def before_delete
    expire_exists_cache
    expire_all_method_caches
    expire_branch_cache if exists?
    expire_content_cache

    repository_event(:remove_repository)
  end

  # Runs code just before the HEAD of a repository is changed.
  def before_change_head
    # Cached divergent commit counts are based on repository head
    expire_branch_cache
    expire_root_ref_cache

    repository_event(:change_default_branch)
  end

Y
Yorick Peterse 已提交
397 398
  # Runs code before pushing (= creating or removing) a tag.
  def before_push_tag
    expire_statistics_caches
    expire_emptiness_caches
    expire_tags_cache

    repository_event(:push_tag)
  end

  # Runs code before removing a tag.
  def before_remove_tag
    expire_tags_cache
    expire_statistics_caches

    repository_event(:remove_tag)
  end

L
Lin Jen-Shin 已提交
414 415 416 417 418
  # Runs code after removing a tag: the tag caches are expired again.
  def after_remove_tag
    expire_tags_cache
  end

419 420 421
  # Runs code after the HEAD of a repository is changed.
  #
  # Expires the caches of every method listed as a value in
  # METHOD_CACHES_FOR_FILE_TYPES. The Hash keys are file types, not method
  # names, so they cannot be handed to `expire_method_caches` directly.
  def after_change_head
    expire_method_caches(METHOD_CACHES_FOR_FILE_TYPES.values.flatten)
  end

424 425
  # Runs code after a repository has been forked/imported.
  def after_import
    expire_content_cache
  end

  # Runs code after a new commit has been pushed.
  #
  # branch_name - The branch the commit was pushed to.
  def after_push_commit(branch_name)
    expire_statistics_caches
    expire_branch_cache(branch_name)

    repository_event(:push_commit, branch: branch_name)
  end

  # Runs code after a new branch has been created.
  def after_create_branch
    expire_branches_cache

    repository_event(:push_branch)
  end

444 445 446
  # Runs code before removing an existing branch.
  def before_remove_branch
    expire_branches_cache

    repository_event(:remove_branch)
  end

451 452
  # Runs code after an existing branch has been removed.
  def after_remove_branch
    expire_branches_cache
  end

456
  # Forwards unknown methods to the raw repository.
  #
  # Calls to `lookup` without a block are memoized in `lookup_cache`, keyed by
  # the arguments joined with ":". Everything else is forwarded as is.
  def method_missing(m, *args, &block)
    if m == :lookup && !block_given?
      lookup_cache[m] ||= {}
      lookup_cache[m][args.join(":")] ||= raw_repository.__send__(m, *args, &block) # rubocop:disable GitlabSecurity/PublicSend
    else
      raw_repository.__send__(m, *args, &block) # rubocop:disable GitlabSecurity/PublicSend
    end
  end

465 466
  # Mirrors #method_missing: anything the raw repository responds to is
  # reported as supported.
  def respond_to_missing?(method, include_private = false)
    raw_repository.respond_to?(method, include_private) || super
  end
D
Dmitriy Zaporozhets 已提交
468 469

  # Finds the blob at `path` for `sha` and decorates it for this project.
  #
  # Returns nil for a blank ref and when the lookup raises
  # Gitlab::Git::Repository::NoRepository.
  def blob_at(sha, path)
    return if Gitlab::Git.blank_ref?(sha)

    Blob.decorate(Gitlab::Git::Blob.find(self, sha, path), project)
  rescue Gitlab::Git::Repository::NoRepository
    nil
  end
476

477 478 479 480 481 482 483
  # The root ref as reported by the raw repository.
  #
  # Raises Rugged::ReferenceError when there is no raw repository.
  def root_ref
    if raw_repository
      raw_repository.root_ref
    else
      # When the repo does not exist we raise this error so no data is cached.
      raise Rugged::ReferenceError
    end
  end
485
  cache_method :root_ref
486

487
  # Gitaly migration: https://gitlab.com/gitlab-org/gitaly/issues/314
  #
  # Returns false without any lookup when `full_path` is not set.
  def exists?
    return false unless full_path

    Gitlab::GitalyClient.migrate(:repository_exists) do |enabled|
      if enabled
        raw_repository.exists?
      else
        refs_directory_exists?
      end
    end
  end
  cache_method :exists?

D
Douwe Maan 已提交
501
  delegate :empty?, to: :raw_repository
  cache_method :empty?

  # The size of this repository in megabytes.
  #
  # Returns 0.0 when the repository does not exist.
  def size
    return 0.0 unless exists?

    raw_repository.size
  end
  cache_method :size, fallback: 0.0

  # Number of commits on the root ref, or 0 when there is no root ref.
  def commit_count
    return 0 unless root_ref

    raw_repository.commit_count(root_ref)
  end
  cache_method :commit_count, fallback: 0

515
  # Number of commits on `ref`, cached under `commit_count_<ref>`.
  #
  # Returns 0 when the repository does not exist or when the lookup raises
  # Rugged::ReferenceError.
  def commit_count_for_ref(ref)
    return 0 unless exists?

    begin
      cache.fetch(:"commit_count_#{ref}") { raw_repository.commit_count(ref) }
    rescue Rugged::ReferenceError
      0
    end
  end

525
  delegate :branch_names, to: :raw_repository
  cache_method :branch_names, fallback: []

  delegate :tag_names, to: :raw_repository
  cache_method :tag_names, fallback: []

  delegate :branch_count, :tag_count, to: :raw_repository
  cache_method :branch_count, fallback: 0
  cache_method :tag_count, fallback: 0

  # Path of the avatar file found on HEAD, or nil when there is none.
  def avatar
    tree = file_on_head(:avatar)

    tree.path if tree
  end
540
  cache_method :avatar
541

542
  # The README of the HEAD tree wrapped in a ReadmeBlob, or nil when the tree
  # or its README is missing.
  def readme
    head_readme = tree(:head)&.readme

    ReadmeBlob.new(head_readme, self) if head_readme
  end

548
  # The README rendered through MarkupHelper.markup_unsafe, or nil when there
  # is no README.
  def rendered_readme
    MarkupHelper.markup_unsafe(readme.name, readme.data, project: project) if readme
  end
  cache_method :rendered_readme
552

553
  # Result of `file_on_head(:contributing)`.
  def contribution_guide
    file_on_head(:contributing)
  end
556
  cache_method :contribution_guide
557 558

  # Result of `file_on_head(:changelog)`.
  def changelog
    file_on_head(:changelog)
  end
561
  cache_method :changelog
562

563
  # Result of `file_on_head(:license)`.
  def license_blob
    file_on_head(:license)
  end
566
  cache_method :license_blob
Z
Zeger-Jan van de Weg 已提交
567

568
  # Key of the license detected by Licensee for this repository.
  #
  # Returns nil when the repository does not exist or no license is detected.
  def license_key
    return unless exists?

    Licensee.license(path).try(:key)
  end
573
  cache_method :license_key
574

D
Douwe Maan 已提交
575 576
  # A Licensee::License built from #license_key, or nil without a key.
  def license
    return unless license_key

    Licensee::License.new(license_key)
  end
580
  cache_method :license, memoize_only: true
581 582

  # Result of `file_on_head(:gitignore)`.
  def gitignore
    file_on_head(:gitignore)
  end
585
  cache_method :gitignore
586 587

  # Result of `file_on_head(:koding)`.
  def koding_yml
    file_on_head(:koding)
  end
590
  cache_method :koding_yml
591

592
  # Result of `file_on_head(:gitlab_ci)`.
  def gitlab_ci_yml
    file_on_head(:gitlab_ci)
  end
595
  cache_method :gitlab_ci_yml
596

597
  # The commit the root ref points at, memoized once one has been found.
  def head_commit
    @head_commit ||= commit(self.root_ref)
  end

  # The root Tree of the head commit, memoized. Returns nil when there is no
  # head commit.
  def head_tree
    return unless head_commit

    @head_tree ||= Tree.new(self, head_commit.sha, nil)
  end

607
  # Builds a Tree for `sha` and `path`.
  #
  # sha       - A SHA, or `:head` to use the head commit.
  # path      - Path inside the tree; nil selects the root.
  # recursive - Forwarded to Tree.new.
  #
  # With `:head` this returns nil when there is no head commit, and the
  # memoized #head_tree when no path is given.
  def tree(sha = :head, path = nil, recursive: false)
    if sha == :head
      return unless head_commit
      return head_tree if path.nil?

      sha = head_commit.sha
    end

    Tree.new(self, sha, path, recursive: recursive)
  end
D
Dmitriy Zaporozhets 已提交
620 621

  # The blob at `path` on the commit `branch_name` resolves to, or nil when
  # that commit cannot be found.
  def blob_at_branch(branch_name, path)
    last_commit = commit(branch_name)
    return unless last_commit

    blob_at(last_commit.sha, path)
  end
D
Dmitriy Zaporozhets 已提交
630

631
  # Last commit that touched `path` as of `sha`, dispatched to the Gitaly or
  # the Rugged implementation.
  def last_commit_for_path(sha, path)
    raw_repository.gitaly_migrate(:last_commit_for_path) do |is_enabled|
      if is_enabled
        last_commit_for_path_by_gitaly(sha, path)
      else
        last_commit_for_path_by_rugged(sha, path)
      end
    end
  end
640

H
Hiroyuki Sato 已提交
641 642
  # ID of the last commit that touched `path` as of `sha`.
  #
  # The result is cached. The cache key contains `sha` and, for a non-blank
  # path, the SHA1 digest of that path.
  def last_commit_id_for_path(sha, path)
    key = path.blank? ? "last_commit_id_for_path:#{sha}" : "last_commit_id_for_path:#{sha}:#{Digest::SHA1.hexdigest(path)}"

    cache.fetch(key) do
      raw_repository.gitaly_migrate(:last_commit_for_path) do |is_enabled|
        if is_enabled
          last_commit_for_path_by_gitaly(sha, path).id
        else
          last_commit_id_for_path_by_shelling_out(sha, path)
        end
      end
    end
  end

655
  # Suggests the next free branch name of the form `<name>-<number>`.
  #
  # name - Base branch name. It is matched literally: characters that have a
  #        meaning in a regular expression are escaped.
  # opts - Hash of options. With `mild: true` the plain `name` is returned
  #        when neither `name` nor any `<name>-<number>` branch exists.
  #
  # An existing branch called exactly `name` counts as number 1.
  def next_branch(name, opts = {})
    numbered = /\A#{Regexp.escape(name)}-([0-9]+)\z/

    branch_ids = branch_names.map do |n|
      next 1 if n == name

      result = n.match(numbered)
      result[1].to_i if result
    end.compact

    highest_branch_id = branch_ids.max || 0

    return name if opts[:mild] && highest_branch_id.zero?

    "#{name}-#{highest_branch_id + 1}"
  end

669
  # Local branches, with `value` passed to the raw repository as `sort_by`.
  def branches_sorted_by(value)
    raw_repository.local_branches(sort_by: value)
  end
672

673 674 675
  # Tags in the requested order.
  #
  # value - 'name' sorts with VersionSorter.rsort on the tag name,
  #         'updated_desc' / 'updated_asc' use `tags_sorted_by_committed_date`;
  #         any other value returns the tags unsorted.
  def tags_sorted_by(value)
    case value
    when 'name'
      VersionSorter.rsort(tags) { |tag| tag.name }
    when 'updated_desc'
      tags_sorted_by_committed_date.reverse
    when 'updated_asc'
      tags_sorted_by_committed_date
    else
      tags
    end
  end

686
  # Builds one Gitlab::Contributor per author email from up to 2000 non-merge
  # commits.
  #
  # Each contributor gets the first non-blank author name found for that
  # email and a commit counter incremented once per commit.
  def contributors
    recent_commits = commits(nil, limit: 2000, offset: 0, skip_merges: true)

    recent_commits.group_by(&:author_email).map do |email, author_commits|
      contributor = Gitlab::Contributor.new
      contributor.email = email

      author_commits.each do |commit|
        contributor.name = commit.author_name if contributor.name.blank?

        contributor.commits += 1
      end

      contributor
    end
  end
D
Dmitriy Zaporozhets 已提交
704

705
  # Names of the refs of `ref_type` that contain `sha`.
  #
  # Runs `git <ref_type> --contains <sha>` and returns one stripped name per
  # output line, with a leading "* " marker removed. Returns an empty Array
  # when the command produced no splittable output.
  def refs_contains_sha(ref_type, sha)
    args = %W(#{ref_type} --contains #{sha})
    names = run_git(args).first

    return [] unless names.respond_to?(:split)

    names.split("\n").map(&:strip).each { |name| name.slice! '* ' }
  end
H
Hannes Rosenögger 已提交
721

722 723 724
  # Names of the branches that contain `sha`.
  def branch_names_contains(sha)
    refs_contains_sha('branch', sha)
  end
H
Hannes Rosenögger 已提交
725

726 727
  # Names of the tags that contain `sha`.
  def tag_names_contains(sha)
    refs_contains_sha('tag', sha)
  end
729

730
  # Local branches of the raw repository, memoized until
  # #expire_branches_cache resets them.
  def local_branches
    @local_branches ||= raw_repository.local_branches
  end

734 735
  alias_method :branches, :local_branches

736 737 738 739
  # Tags of the raw repository, memoized until #expire_tags_cache resets them.
  def tags
    @tags ||= raw_repository.tags
  end

D
Douwe Maan 已提交
740 741 742
  # Commits the creation of directory `path` through #multi_action.
  #
  # options - Remaining keyword arguments, forwarded to #multi_action.
  def create_dir(user, path, **options)
    options[:user] = user
    options[:actions] = [{ action: :create_dir, file_path: path }]

    multi_action(**options)
  end

D
Douwe Maan 已提交
747 748 749
  # Commits the creation of file `path` with `content` through #multi_action.
  #
  # options - Remaining keyword arguments, forwarded to #multi_action.
  def create_file(user, path, content, **options)
    options[:user] = user
    options[:actions] = [{ action: :create, file_path: path, content: content }]

    multi_action(**options)
  end
753

D
Douwe Maan 已提交
754 755 756
  # Commits an update of file `path` through #multi_action.
  #
  # options - Remaining keyword arguments, forwarded to #multi_action. A
  #           `:previous_path` entry is removed from them first; when it is
  #           set and differs from `path` the action is a :move instead of an
  #           :update.
  def update_file(user, path, content, **options)
    previous_path = options.delete(:previous_path)
    action = previous_path && previous_path != path ? :move : :update

    options[:user] = user
    options[:actions] = [{ action: action, file_path: path, previous_path: previous_path, content: content }]

    multi_action(**options)
  end

D
Douwe Maan 已提交
764 765 766
  # Commits the deletion of file `path` through #multi_action.
  #
  # options - Remaining keyword arguments, forwarded to #multi_action.
  def delete_file(user, path, **options)
    options[:user] = user
    options[:actions] = [{ action: :delete, file_path: path }]

    multi_action(**options)
  end

771 772
  # Yields and runs the cache hooks that match the yielded operation result.
  #
  # The block must return nil/false or an object responding to
  # `repo_created?`, `branch_created?` and `newrev`.
  #
  # Returns nil when the block returned nothing, otherwise `result.newrev`.
  def with_cache_hooks
    result = yield

    return unless result

    after_create if result.repo_created?
    after_create_branch if result.branch_created?

    result.newrev
  end

  # Runs the block through Gitlab::Git::OperationService#with_branch and
  # applies the cache hooks to its result.
  #
  # args - Forwarded unchanged to OperationService#with_branch.
  #
  # Yields the start commit provided by the operation service.
  def with_branch(user, *args)
    with_cache_hooks do
      Gitlab::Git::OperationService.new(user, raw_repository).with_branch(*args) do |start_commit|
        yield start_commit
      end
    end
  end

790
  # rubocop:disable Metrics/ParameterLists
  # Applies several index actions and commits the result on `branch_name`.
  #
  # actions - An Array of Hashes. Each Hash has an :action key naming the
  #           Gitlab::Git::Index method to call; the remaining keys are passed
  #           to that method. The Hashes are not modified.
  #
  # Author details default to the committer derived from `user`.
  def multi_action(
    user:, branch_name:, message:, actions:,
    author_email: nil, author_name: nil,
    start_branch_name: nil, start_project: project)

    with_branch(
      user,
      branch_name,
      start_branch_name: start_branch_name,
      start_repository: start_project.repository.raw_repository) do |start_commit|

      index = Gitlab::Git::Index.new(raw_repository)

      if start_commit
        index.read_tree(start_commit.rugged_commit.tree)
        parents = [start_commit.sha]
      else
        parents = []
      end

      actions.each do |action|
        # Work on a copy so the caller's Hash keeps its :action key.
        params = action.dup
        index.public_send(params.delete(:action), params) # rubocop:disable GitlabSecurity/PublicSend
      end

      commit_options = {
        tree: index.write_tree,
        message: message,
        parents: parents
      }
      commit_options.merge!(get_committer_and_author(user, email: author_email, name: author_name))

      create_commit(commit_options)
    end
  end
  # rubocop:enable Metrics/ParameterLists
M
Marc Siegfriedt 已提交
826

827 828
  # Builds the :author and :committer entries for a commit.
  #
  # The committer is derived from `user`. The author is built from `email`
  # and `name`, falling back to the committer when
  # Gitlab::Git.committer_hash returns nothing for them.
  def get_committer_and_author(user, email: nil, name: nil)
    committer = user_to_committer(user)
    author = Gitlab::Git.committer_hash(email: email, name: name) || committer

    {
      author: author,
      committer: committer
    }
  end

837
  # Committer hash built from the user's email and name.
  def user_to_committer(user)
    Gitlab::Git.committer_hash(email: user.email, name: user.name)
  end

841 842 843 844 845 846 847 848 849 850 851
  # Whether `source_sha` merges into `target_branch` without conflicts.
  #
  # Returns false when the target branch or the source commit cannot be
  # found.
  def can_be_merged?(source_sha, target_branch)
    # `branches[...]` is nil for an unknown branch, so guard the `.target` call.
    our_commit = rugged.branches[target_branch]&.target
    their_commit = rugged.lookup(source_sha)

    if our_commit && their_commit
      !rugged.merge_commits(our_commit, their_commit).conflicts?
    else
      false
    end
  end

852 853 854 855 856 857
  # Merges `source_sha` into the merge request's target branch.
  #
  # The merge commit ID yielded by the raw repository is stored on the merge
  # request as `in_progress_merge_commit_sha`. Cache hooks are applied to the
  # result.
  def merge(user, source_sha, merge_request, message)
    with_cache_hooks do
      raw_repository.merge(user, source_sha, merge_request.target_branch, message) do |commit_id|
        merge_request.update(in_progress_merge_commit_sha: commit_id)
        nil # Return value does not matter.
      end
    end
  end

861
  # Creates a commit on `branch_name` that reverts `commit`.
  #
  # The user is both author and committer of the new commit.
  #
  # Raises Repository::CreateTreeError when no revert tree can be produced.
  def revert(
    user, commit, branch_name,
    start_branch_name: nil, start_project: project)
    with_branch(
      user,
      branch_name,
      start_branch_name: start_branch_name,
      start_repository: start_project.repository.raw_repository) do |start_commit|

      revert_tree_id = check_revert_content(commit, start_commit.sha)
      unless revert_tree_id
        raise Repository::CreateTreeError, 'Failed to revert commit'
      end

      committer = user_to_committer(user)

      create_commit(message: commit.revert_message(user),
                    author: committer,
                    committer: committer,
                    tree: revert_tree_id,
                    parents: [start_commit.sha])
    end
  end

885
  # Creates a commit on `branch_name` that cherry-picks `commit`.
  #
  # The new commit keeps the original author (email, name and authored date);
  # the user becomes the committer.
  #
  # Raises Repository::CreateTreeError when no cherry-pick tree can be
  # produced.
  def cherry_pick(
    user, commit, branch_name,
    start_branch_name: nil, start_project: project)
    with_branch(
      user,
      branch_name,
      start_branch_name: start_branch_name,
      start_repository: start_project.repository.raw_repository) do |start_commit|

      cherry_pick_tree_id = check_cherry_pick_content(commit, start_commit.sha)
      unless cherry_pick_tree_id
        raise Repository::CreateTreeError, 'Failed to cherry-pick commit'
      end

      committer = user_to_committer(user)

      create_commit(message: commit.cherry_pick_message(user),
                    author: {
                        email: commit.author_email,
                        name: commit.author_name,
                        time: commit.authored_date
                    },
                    committer: committer,
                    tree: cherry_pick_tree_id,
                    parents: [start_commit.sha])
    end
  end

913
  # Commits `params` on `branch_name` with the user as author and committer.
  def resolve_conflicts(user, branch_name, params)
    with_branch(user, branch_name) do
      committer = user_to_committer(user)

      create_commit(params.merge(author: committer, committer: committer))
    end
  end

921 922
  # Computes the tree that results from reverting `target_commit` on top of
  # `source_sha`.
  #
  # Returns the tree ID, or false when the revert conflicts or would not
  # change anything.
  def check_revert_content(target_commit, source_sha)
    args = [target_commit.sha, source_sha]
    # For merge commits the mainline is passed as an options Hash here.
    args << { mainline: 1 } if target_commit.merge_commit?

    revert_index = rugged.revert_commit(*args)
    return false if revert_index.conflicts?

    tree_id = revert_index.write_tree(rugged)
    return false unless diff_exists?(source_sha, tree_id)

    tree_id
  end

934 935
  # Computes the tree that results from cherry-picking `target_commit` on top
  # of `source_sha`.
  #
  # Returns the tree ID, or false when the cherry-pick conflicts or would not
  # change anything.
  def check_cherry_pick_content(target_commit, source_sha)
    args = [target_commit.sha, source_sha]
    # For merge commits the mainline is passed as a plain positional 1 here.
    args << 1 if target_commit.merge_commit?

    cherry_pick_index = rugged.cherrypick_commit(*args)
    return false if cherry_pick_index.conflicts?

    tree_id = cherry_pick_index.write_tree(rugged)
    return false unless diff_exists?(source_sha, tree_id)

    tree_id
  end

947 948
  # Whether the diff between `sha1` and `sha2` contains at least one entry.
  def diff_exists?(sha1, sha2)
    rugged.diff(sha1, sha2).size > 0
  end

F
Florent (HP) 已提交
951 952 953 954 955
  # Whether `branch_name` has been merged into the root ref.
  #
  # A branch pointing at the same commit as the root ref does not count as
  # merged.
  #
  # Returns nil when the branch commit or the root ref commit cannot be
  # found. The root ref is only looked up once the branch commit is known.
  def merged_to_root_ref?(branch_name)
    branch_commit = commit(branch_name)
    return unless branch_commit

    root_ref_commit = commit(root_ref)
    return unless root_ref_commit

    same_head = branch_commit.id == root_ref_commit.id
    !same_head && ancestor?(branch_commit.id, root_ref_commit.id)
  end

S
Stan Hu 已提交
963
  # Merge base of two commits.
  #
  # Each argument is resolved through #commit first; when that yields nothing
  # the argument is used unchanged.
  #
  # Returns nil when Rugged raises a ReferenceError.
  def merge_base(first_commit_id, second_commit_id)
    first_commit_id = commit(first_commit_id).try(:id) || first_commit_id
    second_commit_id = commit(second_commit_id).try(:id) || second_commit_id
    rugged.merge_base(first_commit_id, second_commit_id)
  rescue Rugged::ReferenceError
    nil
  end

971
  # Whether `ancestor_id` is an ancestor of `descendant_id`, dispatched to the
  # Gitaly or the Rugged implementation.
  #
  # Returns false when either ID is nil.
  def ancestor?(ancestor_id, descendant_id)
    return false if ancestor_id.nil? || descendant_id.nil?

    Gitlab::GitalyClient.migrate(:is_ancestor) do |is_enabled|
      if is_enabled
        raw_repository.ancestor?(ancestor_id, descendant_id)
      else
        rugged_is_ancestor?(ancestor_id, descendant_id)
      end
    end
  end

V
Valery Sizov 已提交
983 984 985
  # True unless the repository both exists and has visible content.
  def empty_repo?
    !(exists? && has_visible_content?)
  end
986
  cache_method :empty_repo?, memoize_only: true
V
Valery Sizov 已提交
987 988 989

  # Searches file contents with `git grep`.
  #
  # The query is regexp-escaped and matched case-insensitively; binary files
  # are skipped and two lines of context are requested on either side.
  # Searches `ref`, or the root ref when `ref` is nil.
  #
  # Returns the scrubbed output split on its `--` separator lines, or an empty
  # Array for an empty repository or a blank query.
  def search_files_by_content(query, ref)
    return [] if empty_repo? || query.blank?

    offset = 2
    args = %W(grep -i -I -n --before-context #{offset} --after-context #{offset} -E -e #{Regexp.escape(query)} #{ref || root_ref})

    run_git(args).first.scrub.split(/^--$/)
  end

V
Valery Sizov 已提交
997 998
  # Searches file names with `git ls-tree` on `ref`, or on the root ref when
  # `ref` is nil.
  #
  # Returns the stripped output lines, or an empty Array for an empty
  # repository or a blank query.
  def search_files_by_name(query, ref)
    return [] if empty_repo? || query.blank?

    # NOTE(review): the "|" below is handed to git as a literal argument, not
    # interpreted as a pipe -- confirm that this is the intended filter.
    args = %W(ls-tree --full-tree -r #{ref || root_ref} --name-status | #{Regexp.escape(query)})

    run_git(args).first.lines.map(&:strip)
  end

1005 1006 1007 1008 1009 1010 1011 1012 1013 1014 1015 1016 1017 1018
  # Adds a remote to the raw repository.
  #
  # name - The name of the remote.
  # url  - The URL of the remote.
  #
  # When adding raises Rugged::ConfigError, the remote of that name is
  # updated with the given URL instead.
  def add_remote(name, url)
    raw_repository.remote_add(name, url)
  rescue Rugged::ConfigError
    raw_repository.remote_update(name, url: url)
  end

  # Deletes a remote from the raw repository.
  #
  # name - The name of the remote.
  #
  # Returns true when the deletion call completes, false when it raises
  # Rugged::ConfigError.
  def remove_remote(name)
    raw_repository.remote_delete(name)
    true
  rescue Rugged::ConfigError
    false
  end

  # Fetches a remote through gitlab-shell.
  #
  # remote  - The remote to fetch.
  # forced  - Forwarded as the `forced:` option (default: false).
  # no_tags - Forwarded as the `no_tags:` option (default: false).
  #
  # Returns whatever `gitlab_shell.fetch_remote` returns.
  def fetch_remote(remote, forced: false, no_tags: false)
    fetch_options = { forced: forced, no_tags: no_tags }
    gitlab_shell.fetch_remote(raw_repository, remote, **fetch_options)
  end

1022 1023 1024
  # Delegates to `fetch_source_branch` on this repository's raw repository,
  # passing the raw repository of `source_repository` as the source.
  #
  # source_repository - An object responding to `raw_repository`.
  # source_branch     - The branch to fetch from the source.
  # local_ref         - The local ref passed on to the raw repository.
  def fetch_source_branch(source_repository, source_branch, local_ref)
    target_raw = raw_repository
    source_raw = source_repository.raw_repository

    target_raw.fetch_source_branch(source_raw, source_branch, local_ref)
  end
1025

1026 1027
  # Delegates to `compare_source_branch` on this repository's raw
  # repository, passing the raw repository of `source_repository`.
  #
  # target_branch_name - The branch name on this repository.
  # source_repository  - An object responding to `raw_repository`.
  # source_branch_name - The branch name on the source repository.
  # straight           - Forwarded unchanged as the `straight:` option.
  def compare_source_branch(target_branch_name, source_repository, source_branch_name, straight:)
    target_raw = raw_repository
    source_raw = source_repository.raw_repository

    target_raw.compare_source_branch(target_branch_name, source_raw, source_branch_name, straight: straight)
  end
1029

1030 1031
  # Calls `fetch_ref` with this repository's own path as the first argument.
  #
  # ref      - Passed to `fetch_ref` as the second argument.
  # ref_path - Passed to `fetch_ref` as the third argument.
  def create_ref(ref, ref_path)
    repo_path = path_to_repo
    fetch_ref(repo_path, ref, ref_path)
  end

1034 1035 1036 1037 1038
  # Lists files through the raw repository.
  #
  # ref - The ref to list; falls back to `root_ref` when nil/false.
  #
  # Returns whatever `raw_repository.ls_files` returns.
  def ls_files(ref)
    raw_repository.ls_files(ref || root_ref)
  end

1039 1040 1041 1042
  # Reads a single attribute for a path.
  #
  # path - The path passed to `raw_repository.attributes`.
  # name - The key looked up in the returned attributes.
  def gitattribute(path, name)
    attributes = raw_repository.attributes(path)
    attributes[name]
  end

1043 1044 1045 1046 1047 1048 1049 1050 1051 1052
  # Asks the raw repository to copy the gitattributes for a ref.
  #
  # ref - The ref to use; falls back to `root_ref` when nil/false.
  #
  # Returns true when the copy call completes, false when it raises
  # Gitlab::Git::Repository::InvalidRef.
  def copy_gitattributes(ref)
    # Resolved outside the rescue scope: only the copy itself is guarded.
    target_ref = ref || root_ref

    begin
      raw_repository.copy_gitattributes(target_ref)
    rescue Gitlab::Git::Repository::InvalidRef
      return false
    end

    true
  end

1053 1054 1055 1056 1057 1058 1059 1060 1061 1062 1063
  # Caches the result of the supplied block in a cache and in an instance
  # variable.
  #
  # Both the cache key and the instance variable are derived from the `key`
  # argument.
  #
  # Once the instance variable has been set, its value is returned without
  # yielding again, even when that value is `nil`. This keeps a block that
  # returns `nil` from being re-run on every call.
  #
  # key          - The name of the key to cache the data in.
  # fallback     - A value to fall back to in the event of a Git error.
  # memoize_only - When true the block is called directly and only the
  #                instance variable is populated; `cache` is not consulted.
  def cache_method_output(key, fallback: nil, memoize_only: false, &block)
    ivar = cache_instance_variable_name(key)
    return instance_variable_get(ivar) if instance_variable_defined?(ivar)

    begin
      value = memoize_only ? yield : cache.fetch(key, &block)
      instance_variable_set(ivar, value)
    rescue Rugged::ReferenceError, Gitlab::Git::Repository::NoRepository
      # If e.g. HEAD or the entire repository doesn't exist, handle it
      # gracefully: nothing is memoized and the fallback is returned.
      fallback
    end
  end
1085

1086 1087 1088
  # Builds the instance variable name used to memoize a cached method.
  #
  # key - The cache key (anything responding to `to_s`).
  #
  # Returns a Symbol of the form `:@name`, with any `?` and `!` characters
  # removed since they are not valid in instance variable names.
  def cache_instance_variable_name(key)
    sanitized = key.to_s.delete('?!')
    "@#{sanitized}".to_sym
  end
1089

1090 1091
  # Finds the first blob in the head tree whose detected file type matches.
  #
  # type - The file type to compare against the result of
  #        `Gitlab::FileDetector.type_of` for each blob path.
  #
  # Returns the matching blob, or nil when `tree(:head)` yields nothing or
  # no blob matches.
  def file_on_head(type)
    head_tree = tree(:head)
    return unless head_tree

    head_tree.blobs.find { |blob| Gitlab::FileDetector.type_of(blob.path) == type }
  end

D
Douwe Maan 已提交
1098 1099 1100 1101
  # Returns the data of `.gitlab/route-map.yml` at the given sha, as
  # produced by `blob_data_at`.
  def route_map_for(sha)
    route_map_path = '.gitlab/route-map.yml'
    blob_data_at(sha, route_map_path)
  end

1102 1103
  # Returns the data of the CI configuration file at the given sha, as
  # produced by `blob_data_at`.
  #
  # sha  - The revision to read from.
  # path - The path of the configuration file (default: '.gitlab-ci.yml').
  def gitlab_ci_yml_for(sha, path = '.gitlab-ci.yml')
    blob_data_at(sha, path)
  end

1106 1107
  private

D
Douwe Maan 已提交
1108 1109
  # Reads the data of the blob at the given sha and path.
  #
  # Returns nil when `blob_at` finds nothing; otherwise calls
  # `load_all_data!` on the blob and then returns its `data`.
  def blob_data_at(sha, path)
    blob = blob_at(sha, path)

    if blob
      blob.load_all_data!
      blob.data
    end
  end
1115

1116
  # Checks, inside the storage circuit breaker, whether a `refs` entry
  # exists under the repository path.
  def refs_directory_exists?
    circuit_breaker.perform { File.exist?(File.join(path_to_repo, 'refs')) }
  end
1121

1122
  # Returns the memoized RepositoryCache for this repository, built from
  # the full path and the project id on first use.
  def cache
    # TODO: should we use UUIDs here? We could move repositories without clearing this cache
    @cache ||= begin
      cache_path = full_path
      RepositoryCache.new(cache_path, @project.id)
    end
  end
1126 1127

  # Returns the tags sorted by the committed date of their dereferenced
  # target.
  def tags_sorted_by_committed_date
    tags.sort_by do |tag|
      # Annotated tags can point to any object (e.g. a blob), but generally
      # tags point to a commit. Without a target, the current time is used as
      # the sort key so that the tag is placed at the end of the list.
      target = tag.dereferenced_target
      target ? target.committed_date : Time.now
    end
  end
D
Douwe Maan 已提交
1141 1142

  # Builds the keep-around ref name for a sha:
  # `refs/<REF_KEEP_AROUND>/<sha>`.
  def keep_around_ref_name(sha)
    namespace = "refs/#{REF_KEEP_AROUND}"
    "#{namespace}/#{sha}"
  end
Y
Yorick Peterse 已提交
1145 1146

  # Records a metrics event for this repository.
  #
  # event - The event passed to `Gitlab::Metrics.add_event`.
  # tags  - Extra tags merged over `{ path: full_path }`; a `:path` key in
  #         `tags` therefore takes precedence (default: {}).
  def repository_event(event, tags = {})
    event_tags = { path: full_path }.merge(tags)
    Gitlab::Metrics.add_event(event, event_tags)
  end
1149

1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160
  # Asks the Gitaly commit client for the last commit touching a path and
  # passes the result through `commit`.
  #
  # sha  - The revision to start from.
  # path - The path to look up.
  def last_commit_for_path_by_gitaly(sha, path)
    client = raw_repository.gitaly_commit_client
    commit(client.last_commit_for_path(sha, path))
  end

  # Resolves the id of the last commit touching a path via
  # `last_commit_id_for_path_by_shelling_out` and passes it to `commit`.
  #
  # sha  - The revision to start from.
  # path - The path to look up.
  def last_commit_for_path_by_rugged(sha, path)
    commit(last_commit_id_for_path_by_shelling_out(sha, path))
  end

  # Runs `git rev-list --max-count=1 <sha> -- <path>` through `run_git`.
  #
  # Returns the first element of the `run_git` result with surrounding
  # whitespace stripped.
  def last_commit_id_for_path_by_shelling_out(sha, path)
    output = run_git(%W(rev-list --max-count=1 #{sha} -- #{path})).first
    output.strip
  end

1165 1166 1167
  # Returns the repository storage path reported by the project.
  def repository_storage_path
    @project.repository_storage_path
  end
1168

1169
  # Builds the Gitlab::Git::Repository for this repository from the
  # project's repository storage, the disk path with a `.git` suffix, and
  # the identifier returned by `Gitlab::GlRepository.gl_repository`.
  def initialize_raw_repository
    storage = project.repository_storage
    relative_path = disk_path + '.git'
    gl_repository = Gitlab::GlRepository.gl_repository(project, false)

    Gitlab::Git::Repository.new(storage, relative_path, gl_repository)
  end
1172 1173 1174 1175

  # Returns the memoized circuit breaker obtained from
  # `Gitlab::Git::Storage::CircuitBreaker.for_storage` for the project's
  # repository storage.
  def circuit_breaker
    @circuit_breaker ||= Gitlab::Git::Storage::CircuitBreaker.for_storage(project.repository_storage)
  end
1176 1177 1178 1179 1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196

  # Finds commits whose message matches a query by running `git log`.
  #
  # query  - The value given to `--grep` (matched case-insensitively).
  # ref    - The ref to search; falls back to `root_ref` when nil/false.
  # path   - When present, restricts the log to this path.
  # limit  - The value given to `--max-count`.
  # offset - The value given to `--skip`.
  #
  # Returns an Array with the result of `commit` for every output line,
  # with nil results dropped.
  def find_commits_by_message_by_shelling_out(query, ref, path, limit, offset)
    revision = ref || root_ref

    args = %W(
      log #{revision} --pretty=%H --skip #{offset}
      --max-count #{limit} --grep=#{query} --regexp-ignore-case
    )
    args += %W(-- #{path}) if path.present?

    output = run_git(args).first
    shas = output.lines.map(&:chomp)

    shas.map { |sha| commit(sha) }.compact
  end

  # Finds commits whose message matches a query through the Gitaly commit
  # client.
  #
  # query  - The query passed to `commits_by_message`.
  # ref    - Forwarded as the `revision:` option.
  # path   - Forwarded as the `path:` option.
  # limit  - Forwarded as the `limit:` option.
  # offset - Forwarded as the `offset:` option.
  #
  # Returns an Array with the result of `commit` for every returned entry.
  def find_commits_by_message_by_gitaly(query, ref, path, limit, offset)
    client = raw_repository.gitaly_commit_client
    found = client.commits_by_message(query, revision: ref, path: path, limit: limit, offset: offset)

    found.map { |gitaly_commit| commit(gitaly_commit) }
  end
1197
end