repository.rb 30.8 KB
Newer Older
1 2
require 'securerandom'

3
class Repository
L
Lin Jen-Shin 已提交
4 5 6
  # Names of the ref namespaces GitLab manages itself.
  REF_MERGE_REQUEST = 'merge-requests'.freeze
  REF_KEEP_AROUND = 'keep-around'.freeze
  REF_ENVIRONMENTS = 'environments'.freeze

  # Ref namespace names that are reserved. Each internal namespace above is
  # listed exactly once (previously REF_ENVIRONMENTS appeared twice and
  # REF_MERGE_REQUEST was missing).
  RESERVED_REFS_NAMES = %W[
    heads
    tags
    replace
    #{REF_MERGE_REQUEST}
    #{REF_ENVIRONMENTS}
    #{REF_KEEP_AROUND}
  ].freeze

17 18
  include Gitlab::ShellAdapter

  # Read/write accessors for the values assigned in #initialize.
  attr_accessor :full_path, :disk_path, :project, :is_wiki

  # `ref_name_for_sha` is answered by the raw repository.
  delegate :ref_name_for_sha, to: :raw_repository

  class CreateTreeError < StandardError; end
24

25 26 27 28 29 30
  # Names of the methods whose results are cached from the Git repository.
  #
  # Every symbol listed here must have a method of exactly the same name, and
  # that method must store its data under a cache key of that same name. For
  # instance, `:commit_count` pairs with the `commit_count` method, which
  # caches under the `commit_count` key.
  CACHED_METHODS = %i[
    size commit_count rendered_readme contribution_guide
    changelog license_blob license_key gitignore koding_yml
    gitlab_ci_yml branch_names tag_names branch_count
    tag_count avatar exists? empty? root_ref has_visible_content?
    issue_template_names merge_request_template_names
  ].freeze
38 39 40

  # Methods wrapped with cache_method that are only memoized (memoize_only).
  MEMOIZED_CACHED_METHODS = %i[license empty_repo?].freeze
41 42 43 44 45

  # Maps a file type (as returned by Gitlab::FileDetector) to the cached
  # method, or list of cached methods, that must be refreshed when a file of
  # that type changes.
  METHOD_CACHES_FOR_FILE_TYPES = {
    readme: :rendered_readme,
    changelog: :changelog,
    license: %i[license_blob license_key license],
    contributing: :contribution_guide,
    gitignore: :gitignore,
    koding: :koding_yml,
    gitlab_ci: :gitlab_ci_yml,
    avatar: :avatar,
    issue_template: :issue_template_names,
    merge_request_template: :merge_request_template_names
  }.freeze
57 58 59 60 61

  # Replaces the method `name` with a wrapper that caches its output in Redis
  # and in an instance variable (via #cache_method_output).
  #
  # The original implementation stays reachable as `_uncached_<name>`.
  # Only usable for methods that take no arguments.
  #
  # name         - Symbol name of an already-defined method.
  # fallback     - Forwarded to #cache_method_output.
  # memoize_only - Forwarded to #cache_method_output.
  def self.cache_method(name, fallback: nil, memoize_only: false)
    uncached_name = :"_uncached_#{name}"
    alias_method(uncached_name, name)

    define_method(name) do
      cache_method_output(name, fallback: fallback, memoize_only: memoize_only) do
        __send__(uncached_name) # rubocop:disable GitlabSecurity/PublicSend
      end
    end
  end
73

74
  # full_path - Stored as-is; also used as the disk path when none is given.
  # project   - Stored as-is.
  # disk_path - Optional; defaults to full_path.
  # is_wiki   - Stored as-is.
  def initialize(full_path, project, disk_path: nil, is_wiki: false)
    @project = project
    @is_wiki = is_wiki
    @full_path = full_path
    @disk_path = disk_path || full_path
    # Per-instance commit lookup cache, see #commit_by.
    @commit_cache = {}
  end
81

82
  def ==(other)
H
http://jneen.net/ 已提交
83 84 85
    @disk_path == other.disk_path
  end

86
  # Memoized raw repository; nil when no full_path is set.
  def raw_repository
    return unless full_path

    @raw_repository ||= initialize_raw_repository
  end

  alias_method :raw, :raw_repository

94
  # Absolute path to the repository: `<disk_path>.git` under the repository
  # storage path. Memoized.
  def path_to_repo
    @path_to_repo ||= begin
      git_dir = File.join(repository_storage_path, disk_path + '.git')
      File.expand_path(git_dir)
    end
  end

101 102 103 104
  # Short representation: class name plus disk path.
  def inspect
    class_name = self.class.name
    "#<#{class_name}:#{@disk_path}>"
  end

L
Lin Jen-Shin 已提交
105
  # Resolves `ref` (default 'HEAD') to a commit.
  #
  # Returns nil when the repository does not exist, and returns `ref` itself
  # when it already is a ::Commit.
  def commit(ref = 'HEAD')
    return unless exists?

    ref.is_a?(::Commit) ? ref : find_commit(ref)
  end
111

112 113 114 115 116 117
  # Looks up a commit by SHA, caching the result (including nil) per SHA in
  # @commit_cache.
  def commit_by(oid:)
    @commit_cache.fetch(oid) { @commit_cache[oid] = find_commit(oid) }
  end

120
  # Queries Gitlab::Git::Commit.where with the given filters and wraps the
  # result in a CommitCollection. `follow` is enabled only when exactly one
  # path is given.
  def commits(ref, path: nil, limit: nil, offset: nil, skip_merges: false, after: nil, before: nil)
    found = Gitlab::Git::Commit.where(
      repo: raw_repository,
      ref: ref,
      path: path,
      limit: limit,
      offset: offset,
      after: after,
      before: before,
      follow: Array(path).length == 1,
      skip_merges: skip_merges
    )
    found = Commit.decorate(found, @project) if found.present?

    CommitCollection.new(project, found, ref)
  end

139 140
  # Commits between `from` and `to`, decorated when any were found; a blank
  # result is returned undecorated.
  def commits_between(from, to)
    raw_commits = Gitlab::Git::Commit.between(raw_repository, from, to)
    return raw_commits if raw_commits.blank?

    Commit.decorate(raw_commits, @project)
  end

J
Jacob Vosmaer 已提交
145
  # Gitaly migration: https://gitlab.com/gitlab-org/gitaly/issues/384
  #
  # Searches commits by message. Returns an empty Array when the repository
  # does not exist, has no visible content, or the query is blank; otherwise
  # a CommitCollection.
  def find_commits_by_message(query, ref = nil, path = nil, limit = 1000, offset = 0)
    return [] unless exists? && has_visible_content? && query.present?

    raw_repository.gitaly_migrate(:commits_by_message) do |is_enabled|
      if is_enabled
        matches = find_commits_by_message_by_gitaly(query, ref, path, limit, offset)
      else
        matches = find_commits_by_message_by_shelling_out(query, ref, path, limit, offset)
      end

      CommitCollection.new(project, matches, ref)
    end
  end

163 164 165 166 167 168 169
  # Finds a branch by name.
  #
  # With `fresh_repo` (the default) a new raw repository is instantiated for
  # the lookup instead of reusing the memoized one. The memoized object may
  # carry in-memory index changes, so invalidating it could have side
  # effects; a read-only lookup on a fresh instance avoids a libgit2 bug
  # where concurrent access (e.g. via git gc) makes a branch "disappear" or
  # report the wrong SHA.
  #
  # See: https://github.com/libgit2/libgit2/issues/1534 and https://gitlab.com/gitlab-org/gitlab-ce/issues/15392
  def find_branch(name, fresh_repo: true)
    lookup_repo =
      if fresh_repo
        initialize_raw_repository
      else
        raw_repository
      end

    lookup_repo.find_branch(name)
  end

  # First tag whose name equals `name`, or nil.
  def find_tag(name)
    tags.find do |candidate|
      candidate.name == name
    end
  end

179
  # Creates `branch_name` pointing at `ref` and runs the after-create hook.
  #
  # Returns the created branch, or false on an invalid ref.
  def add_branch(user, branch_name, ref)
    raw_repository
      .add_branch(branch_name, user: user, target: ref)
      .tap { after_create_branch }
  rescue Gitlab::Git::Repository::InvalidRef
    false
  end

189
  # Creates a tag on `target`; returns false on an invalid ref.
  def add_tag(user, tag_name, target, message = nil)
    tag_options = { user: user, target: target, message: message }

    raw_repository.add_tag(tag_name, **tag_options)
  rescue Gitlab::Git::Repository::InvalidRef
    false
  end

195
  # Removes a branch, running the before/after removal hooks around the
  # raw operation. Always returns true when no error is raised.
  def rm_branch(user, branch_name)
    before_remove_branch
    raw_repository.rm_branch(branch_name, user: user)
    after_remove_branch

    true
  end

L
Lin Jen-Shin 已提交
204
  # Removes a tag, running the before/after removal hooks around the raw
  # operation. Always returns true when no error is raised.
  def rm_tag(user, tag_name)
    before_remove_tag
    raw_repository.rm_tag(tag_name, user: user)
    after_remove_tag

    true
  end

213 214 215 216
  # Branch names followed by tag names.
  def ref_names
    branch_names + tag_names
  end

217
  # Whether the branch exists. Answers are memoized per branch name in
  # @branch_exists_memo; false when there is no raw repository.
  def branch_exists?(branch_name)
    return false unless raw_repository

    @branch_exists_memo ||= Hash.new do |memo, name|
      memo[name] = raw_repository.branch_exists?(name)
    end

    @branch_exists_memo[branch_name]
  end

227
  # Boolean: whether `ref` exists. False when there is no raw repository or
  # when the lookup raises ArgumentError.
  def ref_exists?(ref)
    repo = raw_repository
    repo.nil? ? false : !!repo.ref_exists?(ref)
  rescue ArgumentError
    false
  end

D
Douwe Maan 已提交
233 234 235 236
  # Protects a commit from Git garbage collection by writing a keep-around
  # ref for it. Git GC deletes commits that are no longer reachable from any
  # branch or tag, but some of them must survive, for example when they have
  # comments or CI builds.
  #
  # Does nothing when `sha` is blank, the commit cannot be found, or the
  # keep-around ref already exists.
  def keep_around(sha)
    return unless sha && commit_by(oid: sha)
    return if kept_around?(sha)

    # This will still fail if the file is corrupted (e.g. 0 bytes)
    begin
      write_ref(keep_around_ref_name(sha), sha)
    rescue Rugged::ReferenceError => error
      Rails.logger.error "Unable to create #{REF_KEEP_AROUND} reference for repository #{path}: #{error}"
    rescue Rugged::OSError => error
      # Only a lock-file collision is tolerated; anything else is re-raised.
      lock_collision = error.message =~ /Failed to create locked file/ && error.message =~ /File exists/
      raise unless lock_collision

      Rails.logger.error "Unable to create #{REF_KEEP_AROUND} reference for repository #{path}: #{error}"
    end
  end

  # Whether the keep-around ref for `sha` exists.
  def kept_around?(sha)
    ref_name = keep_around_ref_name(sha)
    ref_exists?(ref_name)
  end
257

258 259 260 261
  # Creates the reference `ref_path` pointing at `sha` through Rugged,
  # overwriting an existing one (force: true).
  def write_ref(ref_path, sha)
    rugged.references.create(ref_path, sha, force: true)
  end

262
  # Returns `{ behind:, ahead: }` commit counts of `branch` relative to the
  # root ref. Cached per branch name.
  def diverging_commit_counts(branch)
    root_ref_hash = raw_repository.rev_parse_target(root_ref).oid

    cache.fetch(:"diverging_commit_counts_#{branch.name}") do
      # Rugged seems to throw a `ReferenceError` when given branch_names rather
      # than SHA-1 hashes
      behind = raw_repository.count_commits_between(branch.dereferenced_target.sha, root_ref_hash)
      ahead = raw_repository.count_commits_between(root_ref_hash, branch.dereferenced_target.sha)

      { behind: behind, ahead: ahead }
    end
  end
276

277 278 279
  # Expires the cached tag names/count and drops the memoized tag list.
  def expire_tags_cache
    expire_method_caches([:tag_names, :tag_count])
    @tags = nil
  end
281

282
  # Expires the branch-related method caches and resets the memoized local
  # branches and branch-existence lookups.
  def expire_branches_cache
    expire_method_caches([:branch_names, :branch_count, :has_visible_content?])
    @local_branches = nil
    @branch_exists_memo = nil
  end

288 289
  # Expires the cached repository size and commit count.
  def expire_statistics_caches
    expire_method_caches([:size, :commit_count])
  end

292 293
  # Expires the cache of every method listed in CACHED_METHODS.
  def expire_all_method_caches
    expire_method_caches(CACHED_METHODS)
  end

296 297 298 299 300 301 302 303 304
  # Expires the caches of the given methods: the cache entry keyed by each
  # method name, plus its memoizing instance variable when one is set.
  def expire_method_caches(methods)
    methods.each do |method_name|
      cache.expire(method_name)

      ivar_name = cache_instance_variable_name(method_name)
      next unless instance_variable_defined?(ivar_name)

      remove_instance_variable(ivar_name)
    end
  end

307 308 309 310 311 312 313 314 315 316 317 318 319 320 321
  # Expires the cached avatar.
  def expire_avatar_cache
    expire_method_caches([:avatar])
  end

  # Refreshes the method caches of this repository: expires the caches tied
  # to the given file types, then calls each method again to repopulate them.
  #
  # types - An Array of file types (e.g. `:readme`) used to refresh extra
  #         caches. Types without an entry in METHOD_CACHES_FOR_FILE_TYPES
  #         are ignored.
  def refresh_method_caches(types)
    to_refresh = types.flat_map do |type|
      Array(METHOD_CACHES_FOR_FILE_TYPES[type.to_sym])
    end

    expire_method_caches(to_refresh)

    to_refresh.each { |method| send(method) } # rubocop:disable GitlabSecurity/PublicSend
  end
328

329 330 331 332 333 334 335
  # Expires the per-branch diverging-commit and commit-count caches.
  #
  # branch_name - Branch that was pushed to; nil or the root ref flushes the
  #               caches of every branch.
  def expire_branch_cache(branch_name = nil)
    if branch_name && branch_name != root_ref
      # In case a commit is pushed to a non-root branch we only have to flush
      # the cache for said branch.
      cache.expire(:"diverging_commit_counts_#{branch_name}")
      cache.expire(:"commit_count_#{branch_name}")
    else
      # When we push to the root branch we have to flush the cache for all
      # other branches as their statistics are based on the commits relative
      # to the root branch.
      branches.each do |branch|
        cache.expire(:"diverging_commit_counts_#{branch.name}")
        cache.expire(:"commit_count_#{branch.name}")
      end
    end
  end

346
  # Expires the cached root ref.
  def expire_root_ref_cache
    expire_method_caches([:root_ref])
  end

350 351
  # Expires the cache(s) used to determine if a repository is empty or not.
  # Nothing is expired unless the repository currently reports as empty.
  def expire_emptiness_caches
    return unless empty?

    expire_method_caches([:empty?, :has_visible_content?])
  end

357 358 359 360
  # Memoized Hash used by #method_missing to cache `lookup` results.
  def lookup_cache
    @lookup_cache ||= {}
  end

361
  # Expires the cached `exists?` answer.
  def expire_exists_cache
    expire_method_caches([:exists?])
  end

365 366 367 368 369 370 371
  # Expires the caches that don't depend on repository data (when expiring):
  # tags, branches, root ref, emptiness, existence and statistics.
  def expire_content_cache
    expire_tags_cache
    expire_branches_cache
    expire_root_ref_cache
    expire_emptiness_caches
    expire_exists_cache
    expire_statistics_caches
  end

  # Hook run after a repository has been created: expires the existence,
  # root-ref and emptiness caches, then records the event.
  def after_create
    expire_exists_cache
    expire_root_ref_cache
    expire_emptiness_caches

    repository_event(:create_repository)
  end

384 385
  # Hook run just before a repository is deleted: expires every cache
  # (branch caches only when the repository still exists), then records the
  # event.
  def before_delete
    expire_exists_cache
    expire_all_method_caches
    expire_branch_cache if exists?
    expire_content_cache

    repository_event(:remove_repository)
  end

  # Hook run just before the HEAD of a repository is changed.
  def before_change_head
    # Cached divergent commit counts are based on repository head
    expire_branch_cache
    expire_root_ref_cache

    repository_event(:change_default_branch)
  end

Y
Yorick Peterse 已提交
403 404
  # Hook run before pushing (= creating or removing) a tag: expires the
  # statistics, emptiness and tag caches, then records the event.
  def before_push_tag
    expire_statistics_caches
    expire_emptiness_caches
    expire_tags_cache

    repository_event(:push_tag)
  end

  # Hook run before removing a tag: expires the tag and statistics caches,
  # then records the event.
  def before_remove_tag
    expire_tags_cache
    expire_statistics_caches

    repository_event(:remove_tag)
  end

L
Lin Jen-Shin 已提交
420 421 422 423 424
  # Hook run after removing a tag: expires the tag caches once more.
  def after_remove_tag
    expire_tags_cache
  end

425 426 427
  # Runs code after the HEAD of a repository is changed.
  #
  # Expires the caches of every method tied to a file type. The cache names
  # are the VALUES of METHOD_CACHES_FOR_FILE_TYPES (a Symbol or an Array of
  # Symbols per entry); its keys are file types such as `:readme`, which are
  # not cache names, so passing them left e.g. `rendered_readme` stale.
  def after_change_head
    expire_method_caches(METHOD_CACHES_FOR_FILE_TYPES.values.flatten)
  end

430 431
  # Hook run after a repository has been forked/imported.
  def after_import
    expire_content_cache
  end

  # Hook run after a new commit has been pushed to `branch_name`: expires
  # the statistics and that branch's caches, then records the event.
  def after_push_commit(branch_name)
    expire_statistics_caches
    expire_branch_cache(branch_name)

    repository_event(:push_commit, branch: branch_name)
  end

  # Hook run after a new branch has been created.
  def after_create_branch
    expire_branches_cache

    repository_event(:push_branch)
  end

450 451 452
  # Hook run before removing an existing branch.
  def before_remove_branch
    expire_branches_cache

    repository_event(:remove_branch)
  end

457 458
  # Hook run after an existing branch has been removed.
  def after_remove_branch
    expire_branches_cache
  end

462
  # Forwards unknown messages to the raw repository. Block-less `lookup`
  # calls are additionally cached in #lookup_cache, keyed by the arguments
  # joined with ":".
  def method_missing(m, *args, &block)
    unless m == :lookup && !block_given?
      return raw_repository.__send__(m, *args, &block) # rubocop:disable GitlabSecurity/PublicSend
    end

    lookup_cache[m] ||= {}
    lookup_cache[m][args.join(":")] ||= raw_repository.__send__(m, *args, &block) # rubocop:disable GitlabSecurity/PublicSend
  end

471 472
  # Mirrors #method_missing: true for anything the raw repository responds to.
  def respond_to_missing?(method, include_private = false)
    raw_repository.respond_to?(method, include_private) || super
  end
D
Dmitriy Zaporozhets 已提交
474 475

  # Decorated blob at `path` in `sha`; nil when the repository is missing.
  def blob_at(sha, path)
    raw_blob = raw_repository.blob_at(sha, path)
    Blob.decorate(raw_blob, project)
  rescue Gitlab::Git::Repository::NoRepository
    nil
  end
480

481 482 483 484 485
  # Batch variant of #blob_at.
  #
  # items - An Array like: [[oid, path], [oid1, path1]]
  def blobs_at(items)
    raw_repository.batch_blobs(items).map do |raw_blob|
      Blob.decorate(raw_blob, project)
    end
  end

486 487 488 489 490 491 492
  # Root ref as reported by the raw repository (cached).
  def root_ref
    # When the repo does not exist we raise this error so no data is cached.
    raise Rugged::ReferenceError unless raw_repository

    raw_repository.root_ref
  end
  cache_method :root_ref
495

496
  # Gitaly migration: https://gitlab.com/gitlab-org/gitaly/issues/314
  #
  # Whether the repository exists (cached); false without a full_path.
  def exists?
    full_path ? raw_repository.exists? : false
  end
  cache_method :exists?

D
Douwe Maan 已提交
504
  # `empty?` is answered by the raw repository and cached.
  delegate :empty?, to: :raw_repository
  cache_method :empty?

  # The size of this repository in megabytes; 0.0 when it does not exist.
  def size
    return 0.0 unless exists?

    raw_repository.size
  end
  cache_method :size, fallback: 0.0

  # Number of commits on the root ref; 0 when there is no root ref.
  def commit_count
    return 0 unless root_ref

    raw_repository.commit_count(root_ref)
  end
  cache_method :commit_count, fallback: 0

518
  # Cached number of commits on `ref`; 0 when the repository does not exist
  # or the lookup raises Rugged::ReferenceError.
  def commit_count_for_ref(ref)
    return 0 unless exists?

    begin
      cache.fetch(:"commit_count_#{ref}") do
        raw_repository.commit_count(ref)
      end
    rescue Rugged::ReferenceError
      0
    end
  end

528
  # Branch/tag listings and counters are answered by the raw repository and
  # cached, each with a fallback value.
  delegate :branch_names, :tag_names, :branch_count, :tag_count,
           :has_visible_content?, to: :raw_repository
  cache_method :branch_names, fallback: []
  cache_method :tag_names, fallback: []
  cache_method :branch_count, fallback: 0
  cache_method :tag_count, fallback: 0
  cache_method :has_visible_content?, fallback: false
538 539

  # Path of the avatar file on HEAD, or nil when there is none (cached).
  def avatar
    # n+1: https://gitlab.com/gitlab-org/gitlab-ce/issues/38327
    Gitlab::GitalyClient.allow_n_plus_1_calls do
      avatar_file = file_on_head(:avatar)
      avatar_file.path if avatar_file
    end
  end
  cache_method :avatar
548

S
Sean McGivern 已提交
549 550 551 552 553 554 555 556 557 558
  # Dropdown names of the project's issue templates (cached).
  def issue_template_names
    Gitlab::Template::IssueTemplate.dropdown_names(project)
  end
  cache_method :issue_template_names, fallback: []

  # Dropdown names of the project's merge request templates (cached).
  def merge_request_template_names
    Gitlab::Template::MergeRequestTemplate.dropdown_names(project)
  end
  cache_method :merge_request_template_names, fallback: []

559
  # ReadmeBlob for the readme of the head tree, or nil when there is none.
  def readme
    head_readme = tree(:head)&.readme
    return unless head_readme

    ReadmeBlob.new(head_readme, self)
  end

565
  # Rendered markup of the readme, or nil without a readme (cached).
  def rendered_readme
    return unless readme

    MarkupHelper.markup_unsafe(readme.name, readme.data, project: project)
  end
  cache_method :rendered_readme
569

570
  # The `:contributing` file on HEAD (cached).
  def contribution_guide
    file_on_head(:contributing)
  end
  cache_method :contribution_guide
574 575

  # The `:changelog` file on HEAD (cached).
  def changelog
    file_on_head(:changelog)
  end
  cache_method :changelog
579

580
  # The `:license` file on HEAD (cached).
  def license_blob
    file_on_head(:license)
  end
  cache_method :license_blob
Z
Zeger-Jan van de Weg 已提交
584

585
  # Key of the license Licensee detects at `path`; nil when the repository
  # does not exist or no license is detected (cached).
  def license_key
    return unless exists?

    detected = Licensee.license(path)
    detected.try(:key)
  end
  cache_method :license_key
591

D
Douwe Maan 已提交
592 593
  # Licensee::License built from #license_key, or nil without a key.
  # Memoized only.
  def license
    Licensee::License.new(license_key) if license_key
  end
  cache_method :license, memoize_only: true
598 599

  # The `:gitignore` file on HEAD (cached).
  def gitignore
    file_on_head(:gitignore)
  end
  cache_method :gitignore
603 604

  # The `:koding` file on HEAD (cached).
  def koding_yml
    file_on_head(:koding)
  end
  cache_method :koding_yml
608

609
  # The `:gitlab_ci` file on HEAD (cached).
  def gitlab_ci_yml
    file_on_head(:gitlab_ci)
  end
  cache_method :gitlab_ci_yml
613

614
  # Memoized commit the root ref points at.
  def head_commit
    @head_commit ||= commit(root_ref)
  end

  # Memoized Tree of the head commit; nil when there is no head commit.
  def head_tree
    return unless head_commit

    @head_tree ||= Tree.new(self, head_commit.sha, nil)
  end

624
  # Builds a Tree for `sha` and `path`.
  #
  # With `sha == :head` the head commit is used: nil is returned when there
  # is none, and the memoized #head_tree is returned when no path is given.
  def tree(sha = :head, path = nil, recursive: false)
    if sha == :head
      return unless head_commit
      return head_tree if path.nil?

      sha = head_commit.sha
    end

    Tree.new(self, sha, path, recursive: recursive)
  end
D
Dmitriy Zaporozhets 已提交
637 638

  # Blob at `path` on the commit `branch_name` resolves to; nil when the
  # branch has no commit.
  def blob_at_branch(branch_name, path)
    last_commit = commit(branch_name)

    blob_at(last_commit.sha, path) if last_commit
  end
D
Dmitriy Zaporozhets 已提交
647

648
  # Last commit touching `path` as of `sha`, via Gitaly when the migration
  # is enabled and via Rugged otherwise.
  def last_commit_for_path(sha, path)
    raw_repository.gitaly_migrate(:last_commit_for_path) do |is_enabled|
      next last_commit_for_path_by_gitaly(sha, path) if is_enabled

      last_commit_for_path_by_rugged(sha, path)
    end
  end
657

H
Hiroyuki Sato 已提交
658 659
  # Cached id of the last commit touching `path` as of `sha`. The cache key
  # embeds the SHA and, for a non-blank path, the SHA1 digest of the path.
  def last_commit_id_for_path(sha, path)
    key =
      if path.blank?
        "last_commit_id_for_path:#{sha}"
      else
        "last_commit_id_for_path:#{sha}:#{Digest::SHA1.hexdigest(path)}"
      end

    cache.fetch(key) do
      raw_repository.gitaly_migrate(:last_commit_for_path) do |is_enabled|
        next last_commit_for_path_by_gitaly(sha, path).id if is_enabled

        last_commit_id_for_path_by_shelling_out(sha, path)
      end
    end
  end

672
  # Suggests the next free branch name of the form `<name>-<n>`.
  #
  # Existing branches named exactly `name` count as id 1, and branches named
  # `<name>-<digits>` count as that number; the result uses the highest id
  # plus one.
  #
  # name - Base branch name. It is escaped before being used in the match
  #        pattern, so names containing Regexp metacharacters (`+`, `.`, ...)
  #        are compared literally.
  # opts - Hash; with `mild: true` the bare `name` is returned when no
  #        matching branch exists yet.
  def next_branch(name, opts = {})
    numbered = /\A#{Regexp.escape(name.to_s)}-([0-9]+)\z/

    branch_ids = branch_names.map do |existing|
      next 1 if existing == name

      suffix = existing[numbered, 1]
      suffix.to_i if suffix
    end.compact

    highest_branch_id = branch_ids.max || 0

    return name if opts[:mild] && highest_branch_id == 0

    "#{name}-#{highest_branch_id + 1}"
  end

687
  # Local branches of the raw repository, sorted by `value`.
  def branches_sorted_by(value)
    raw_repository.local_branches(sort_by: value)
  end
690

691 692 693
  # Tags ordered according to `value`: 'name', 'updated_desc' or
  # 'updated_asc'. Any other value returns the tags unsorted.
  def tags_sorted_by(value)
    case value
    when 'name' then VersionSorter.rsort(tags) { |tag| tag.name }
    when 'updated_desc' then tags_sorted_by_committed_date.reverse
    when 'updated_asc' then tags_sorted_by_committed_date
    else tags
    end
  end

704
  # Builds one Gitlab::Contributor per author email from up to 2000
  # non-merge commits. Each contributor gets the first non-blank author name
  # seen and a count of their commits.
  def contributors
    recent_commits = commits(nil, limit: 2000, offset: 0, skip_merges: true)

    recent_commits.group_by(&:author_email).map do |email, authored|
      contributor = Gitlab::Contributor.new
      contributor.email = email

      authored.each do |commit|
        contributor.name = commit.author_name if contributor.name.blank?
        contributor.commits += 1
      end

      contributor
    end
  end
D
Dmitriy Zaporozhets 已提交
722

723
  # Runs `git <ref_type> --contains <sha>` and returns the listed ref names,
  # stripped and without the leading '* ' marker. Returns [] when the command
  # output cannot be split.
  def refs_contains_sha(ref_type, sha)
    output = run_git(%W(#{ref_type} --contains #{sha})).first
    return [] unless output.respond_to?(:split)

    output.split("\n").map(&:strip).each do |name|
      name.slice! '* '
    end
  end
H
Hannes Rosenögger 已提交
739

740 741 742
  # Names of the branches that contain `sha`.
  def branch_names_contains(sha)
    refs_contains_sha('branch', sha)
  end
H
Hannes Rosenögger 已提交
743

744 745
  # Names of the tags that contain `sha`.
  def tag_names_contains(sha)
    refs_contains_sha('tag', sha)
  end
747

748
  # Memoized local branches of the raw repository (also available as
  # #branches).
  def local_branches
    @local_branches ||= raw_repository.local_branches
  end

  alias_method :branches, :local_branches

754 755 756 757
  # Memoized tags of the raw repository.
  def tags
    @tags ||= raw_repository.tags
  end

D
Douwe Maan 已提交
758 759 760
  # Commits a single `:create_dir` action through #multi_action. Remaining
  # keyword options are forwarded to #multi_action.
  def create_dir(user, path, **options)
    dir_action = { action: :create_dir, file_path: path }

    multi_action(**options.merge(user: user, actions: [dir_action]))
  end

D
Douwe Maan 已提交
765 766 767
  # Commits a single `:create` action through #multi_action. Remaining
  # keyword options are forwarded to #multi_action.
  def create_file(user, path, content, **options)
    file_action = { action: :create, file_path: path, content: content }

    multi_action(**options.merge(user: user, actions: [file_action]))
  end
771

D
Douwe Maan 已提交
772 773 774
  # Commits a file update through #multi_action. When `previous_path:` is
  # given and differs from `path`, the action is a `:move` instead of an
  # `:update`. Remaining keyword options are forwarded to #multi_action.
  def update_file(user, path, content, **options)
    previous_path = options.delete(:previous_path)
    moved = previous_path && previous_path != path

    file_action = {
      action: moved ? :move : :update,
      file_path: path,
      previous_path: previous_path,
      content: content
    }

    multi_action(**options.merge(user: user, actions: [file_action]))
  end

D
Douwe Maan 已提交
782 783 784
  # Commits a single `:delete` action through #multi_action. Remaining
  # keyword options are forwarded to #multi_action.
  def delete_file(user, path, **options)
    file_action = { action: :delete, file_path: path }

    multi_action(**options.merge(user: user, actions: [file_action]))
  end

789 790
  # Yields, then runs the cache hooks that match the yielded operation
  # result: #after_create when it created the repository and
  # #after_create_branch when it created a branch.
  #
  # Returns the result's `newrev`, or nil when the block returned nothing.
  def with_cache_hooks
    operation = yield
    return unless operation

    after_create if operation.repo_created?
    after_create_branch if operation.branch_created?

    operation.newrev
  end

  def with_branch(user, *args)
    with_cache_hooks do
      Gitlab::Git::OperationService.new(user, raw_repository).with_branch(*args) do |start_commit|
        yield start_commit
      end
    end
806 807
  end

808
  # Applies `actions` to an index seeded from the start commit (when there
  # is one) and commits the resulting tree on `branch_name`.
  #
  # actions - Array of Hashes; each one's `:action` names the index method to
  #           call and the rest of the Hash is passed to it. NOTE: the
  #           `:action` key is deleted from each Hash.
  # rubocop:disable Metrics/ParameterLists
  def multi_action(
    user:, branch_name:, message:, actions:,
    author_email: nil, author_name: nil,
    start_branch_name: nil, start_project: project)

    with_branch(
      user,
      branch_name,
      start_branch_name: start_branch_name,
      start_repository: start_project.repository.raw_repository) do |start_commit|

      index = Gitlab::Git::Index.new(raw_repository)
      parents = []

      if start_commit
        index.read_tree(start_commit.rugged_commit.tree)
        parents = [start_commit.sha]
      end

      actions.each do |action_options|
        index.public_send(action_options.delete(:action), action_options) # rubocop:disable GitlabSecurity/PublicSend
      end

      commit_options = { tree: index.write_tree, message: message, parents: parents }
      commit_options.merge!(get_committer_and_author(user, email: author_email, name: author_name))

      create_commit(commit_options)
    end
  end
  # rubocop:enable Metrics/ParameterLists
M
Marc Siegfriedt 已提交
844

845 846
  # Returns `{ author:, committer: }`. The committer is derived from `user`;
  # the author comes from `email`/`name` and falls back to the committer
  # when no author hash is produced.
  def get_committer_and_author(user, email: nil, name: nil)
    committer = user_to_committer(user)
    explicit_author = Gitlab::Git.committer_hash(email: email, name: name)

    { author: explicit_author || committer, committer: committer }
  end

  # Whether merging `source_sha` into `target_branch` is conflict-free.
  # False when either commit cannot be resolved.
  def can_be_merged?(source_sha, target_branch)
    ours = rugged.branches[target_branch].target
    theirs = rugged.lookup(source_sha)
    return false unless ours && theirs

    !rugged.merge_commits(ours, theirs).conflicts?
  end

866 867 868 869 870 871
  # Merges `source_sha` into the merge request's target branch inside
  # #with_cache_hooks. The merge commit id yielded by the raw repository is
  # stored on the merge request as `in_progress_merge_commit_sha`.
  def merge(user, source_sha, merge_request, message)
    target_branch = merge_request.target_branch

    with_cache_hooks do
      raw_repository.merge(user, source_sha, target_branch, message) do |commit_id|
        merge_request.update(in_progress_merge_commit_sha: commit_id)
        nil # Return value does not matter.
      end
    end
  end

875
  # Fast-forward merges `source` into `target_branch` inside
  # #with_cache_hooks. When a merge request is given, the source commit id
  # is stored on it as `in_progress_merge_commit_sha` first.
  #
  # Raises RuntimeError ('Invalid merge source') when `source` does not
  # resolve to a commit.
  def ff_merge(user, source, target_branch, merge_request: nil)
    source_commit_id = commit(source)&.id
    raise 'Invalid merge source' if source_commit_id.nil?

    merge_request&.update(in_progress_merge_commit_sha: source_commit_id)

    with_cache_hooks do
      raw.ff_merge(user, source_commit_id, target_branch)
    end
  end

884
  # Reverts `commit` on `branch_name` via the raw repository, inside
  # #with_cache_hooks. The start repository defaults to this project's.
  def revert(
    user, commit, branch_name, message,
    start_branch_name: nil, start_project: project)

    with_cache_hooks do
      revert_params = {
        user: user,
        commit: commit.raw,
        branch_name: branch_name,
        message: message,
        start_branch_name: start_branch_name,
        start_repository: start_project.repository.raw_repository
      }

      raw_repository.revert(**revert_params)
    end
  end

900
  # Cherry-picks `commit` onto `branch_name` via the raw repository, inside
  # #with_cache_hooks. The start repository defaults to this project's.
  def cherry_pick(
    user, commit, branch_name, message,
    start_branch_name: nil, start_project: project)

    with_cache_hooks do
      pick_params = {
        user: user,
        commit: commit.raw,
        branch_name: branch_name,
        message: message,
        start_branch_name: start_branch_name,
        start_repository: start_project.repository.raw_repository
      }

      raw_repository.cherry_pick(**pick_params)
    end
  end

916 917 918 919
  # Whether the branch is merged into the root ref without pointing at the
  # same commit as the root ref. Returns nil when the branch is not found.
  #
  # pre_loaded_merged_branches - Optional collection of merged branch names;
  #                              when given it replaces the ancestry check.
  def merged_to_root_ref?(branch_or_name, pre_loaded_merged_branches = nil)
    branch = Gitlab::Git::Branch.find(self, branch_or_name)
    return unless branch

    @root_ref_sha ||= commit(root_ref).sha
    same_head = branch.target == @root_ref_sha

    if pre_loaded_merged_branches
      merged = pre_loaded_merged_branches.include?(branch.name)
    else
      merged = ancestor?(branch.target, @root_ref_sha)
    end

    !same_head && merged
  end

935 936
  # `merged_branch_names` is answered by the raw repository.
  delegate :merged_branch_names, to: :raw_repository

S
Stan Hu 已提交
937
  # Merge base of two commits. Each argument is first resolved through
  # #commit; when that yields no id the argument is used unchanged. Returns
  # nil on Rugged::ReferenceError.
  def merge_base(first_commit_id, second_commit_id)
    first_id = commit(first_commit_id).try(:id) || first_commit_id
    second_id = commit(second_commit_id).try(:id) || second_commit_id

    rugged.merge_base(first_id, second_id)
  rescue Rugged::ReferenceError
    nil
  end

945
  # Whether `ancestor_id` is an ancestor of `descendant_id`; false when
  # either id is nil. Uses Gitaly when the migration is enabled, Rugged
  # otherwise.
  def ancestor?(ancestor_id, descendant_id)
    return false if [ancestor_id, descendant_id].any?(&:nil?)

    Gitlab::GitalyClient.migrate(:is_ancestor) do |is_enabled|
      next raw_repository.ancestor?(ancestor_id, descendant_id) if is_enabled

      rugged_is_ancestor?(ancestor_id, descendant_id)
    end
  end

V
Valery Sizov 已提交
957 958 959
  # True when the repository does not exist or has no visible content.
  # Memoized only.
  def empty_repo?
    !(exists? && has_visible_content?)
  end
  cache_method :empty_repo?, memoize_only: true
V
Valery Sizov 已提交
961 962 963

  # Greps file contents on `ref` (default: root ref) for the regexp-escaped
  # query, case-insensitively, with two lines of context on each side.
  # Returns the output split on `--` separator lines, or [] for an empty
  # repository or blank query.
  def search_files_by_content(query, ref)
    return [] if empty_repo? || query.blank?

    context_lines = 2
    grep_args = %W(grep -i -I -n --before-context #{context_lines} --after-context #{context_lines} -E -e #{Regexp.escape(query)} #{ref || root_ref})

    output = run_git(grep_args).first
    output.scrub.split(/^--$/)
  end

V
Valery Sizov 已提交
971 972
  # Lists file names on `ref` (default: root ref) through `git ls-tree` and
  # returns the stripped output lines, or [] for an empty repository or
  # blank query.
  #
  # NOTE(review): the `|` and the escaped query are passed to git as plain
  # arguments (no shell is involved in building `args`) - confirm this is
  # the intended filtering.
  def search_files_by_name(query, ref)
    return [] if empty_repo? || query.blank?

    ls_tree_args = %W(ls-tree --full-tree -r #{ref || root_ref} --name-status | #{Regexp.escape(query)})

    output = run_git(ls_tree_args).first
    output.lines.map(&:strip)
  end

979 980
  # Fetches `remote` into the raw repository through gitlab_shell.
  def fetch_remote(remote, forced: false, ssh_auth: nil, no_tags: false)
    fetch_options = { ssh_auth: ssh_auth, forced: forced, no_tags: no_tags }

    gitlab_shell.fetch_remote(raw_repository, remote, **fetch_options)
  end

983 984
  # Delegates to the raw repository, passing the source's raw repository.
  def fetch_source_branch!(source_repository, source_branch, local_ref)
    source_raw = source_repository.raw_repository

    raw_repository.fetch_source_branch!(source_raw, source_branch, local_ref)
  end
986

987 988 989 990
  # Whether the raw repository has a remote called `name`.
  def remote_exists?(name)
    raw_repository.remote_exists?(name)
  end

991 992
  # Delegates to the raw repository, passing the source's raw repository.
  def compare_source_branch(target_branch_name, source_repository, source_branch_name, straight:)
    source_raw = source_repository.raw_repository

    raw_repository.compare_source_branch(target_branch_name, source_raw, source_branch_name, straight: straight)
  end
994

995
  # Writes `ref` under `ref_path` through `raw_repository.write_ref`.
  #
  # Note the argument order is swapped for the underlying call: the path goes
  # first, the value it should hold second.
  def create_ref(ref, ref_path)
    raw = raw_repository
    raw.write_ref(ref_path, ref)
  end

999 1000 1001 1002 1003
  # Returns whatever `raw_repository.ls_files` reports for `ref`; `root_ref`
  # is used when no ref is given.
  def ls_files(ref)
    target_ref = ref ? ref : root_ref

    raw_repository.ls_files(target_ref)
  end

1004 1005 1006 1007 1008 1009 1010 1011 1012 1013
  # Asks the raw repository to copy the gitattributes of `ref` (or of
  # `root_ref` when no ref is given).
  #
  # Returns true on success and false when the raw repository reports the ref
  # as invalid. Only the copy itself is guarded; an error raised while
  # resolving `root_ref` is not rescued here.
  def copy_gitattributes(ref)
    target_ref = ref ? ref : root_ref

    begin
      raw_repository.copy_gitattributes(target_ref)
    rescue Gitlab::Git::Repository::InvalidRef
      return false
    end

    true
  end

1014 1015 1016 1017 1018 1019 1020 1021 1022 1023 1024
  # Caches the result of the supplied block both in the repository cache and
  # in an instance variable.
  #
  # The cache key is `key`; the instance variable name is derived from `key`
  # by `cache_instance_variable_name`.
  #
  # Once the instance variable is defined its value is returned as-is, even
  # when that value is `nil`. This ensures we don't keep yielding the block
  # when it returns `nil`.
  #
  # key          - The name of the key to cache the data in.
  # fallback     - A value to fall back to in the event of a Git error.
  # memoize_only - When true the block result is only stored in the instance
  #                variable and the repository cache is bypassed.
  def cache_method_output(key, fallback: nil, memoize_only: false, &block)
    ivar_name = cache_instance_variable_name(key)

    return instance_variable_get(ivar_name) if instance_variable_defined?(ivar_name)

    # If the repository doesn't exist and a fallback was specified we return
    # that value immediately. This saves us Rugged/gRPC invocations.
    return fallback if !fallback.nil? && !exists?

    begin
      computed = memoize_only ? yield : cache.fetch(key, &block)

      instance_variable_set(ivar_name, computed)
    rescue Rugged::ReferenceError, Gitlab::Git::Repository::NoRepository
      # Even if the above `#exists?` check passes these errors might still
      # occur (for example because of a non-existing HEAD). We want to
      # gracefully handle this and not cache anything
      fallback
    end
  end
1051

1052 1053 1054
  # Builds the instance variable name (a Symbol such as :@exists) used to
  # memoize the value for `key`. `?` and `!` are removed because they are not
  # allowed in instance variable names.
  def cache_instance_variable_name(key)
    "@#{key.to_s.delete('?!')}".to_sym
  end
1055

1056 1057
  # Finds the first blob in the tree of :head whose path is classified as
  # `type` by Gitlab::FileDetector.
  #
  # Returns nil when there is no tree for :head or no blob matches.
  def file_on_head(type)
    head_tree = tree(:head)
    return unless head_tree

    head_tree.blobs.find { |blob| Gitlab::FileDetector.type_of(blob.path) == type }
  end

D
Douwe Maan 已提交
1064 1065 1066 1067
  # Returns the data of `.gitlab/route-map.yml` as of `sha`, as provided by
  # `blob_data_at`.
  def route_map_for(sha)
    route_map_path = '.gitlab/route-map.yml'

    blob_data_at(sha, route_map_path)
  end

1068 1069
  # Returns the data of the CI configuration file as of `sha`, as provided by
  # `blob_data_at`.
  #
  # path - Location of the configuration file (default: '.gitlab-ci.yml').
  def gitlab_ci_yml_for(sha, path = '.gitlab-ci.yml')
    ci_config = blob_data_at(sha, path)
    ci_config
  end

1072 1073 1074 1075
  # Delegates to `raw_repository.fetch_ref`, passing the raw repository of
  # `source_repository` and forwarding `source_ref` / `target_ref` unchanged.
  def fetch_ref(source_repository, source_ref:, target_ref:)
    target_raw = raw_repository
    source_raw = source_repository.raw_repository

    target_raw.fetch_ref(source_raw, source_ref: source_ref, target_ref: target_ref)
  end

1076 1077
  private

1078 1079 1080 1081 1082 1083 1084 1085 1086 1087 1088 1089
  # TODO Generic finder, later split this on finders by Ref or Oid
  # gitlab-org/gitlab-ce#39239
  #
  # Wraps a commit in a ::Commit bound to @project.
  #
  # oid_or_ref - Either a Gitlab::Git::Commit (used as-is) or a value that is
  #              looked up with Gitlab::Git::Commit.find on the raw repository.
  #
  # Returns nil when no commit could be found.
  def find_commit(oid_or_ref)
    already_loaded = oid_or_ref.is_a?(Gitlab::Git::Commit)
    git_commit = already_loaded ? oid_or_ref : Gitlab::Git::Commit.find(raw_repository, oid_or_ref)

    return unless git_commit

    ::Commit.new(git_commit, @project)
  end

D
Douwe Maan 已提交
1090 1091
  # Returns the data of the blob at `path` as of `sha`, or nil when `blob_at`
  # finds no blob there. `load_all_data!` is called on the blob before its
  # data is read.
  def blob_data_at(sha, path)
    found = blob_at(sha, path)

    if found
      found.load_all_data!
      found.data
    end
  end
1097

1098
  # Memoized RepositoryCache built from `full_path` and the id of @project.
  def cache
    return @cache if @cache

    # TODO: should we use UUIDs here? We could move repositories without clearing this cache
    @cache = RepositoryCache.new(full_path, @project.id)
  end
1102 1103

  # Returns `tags` ordered by the committed date of each tag's dereferenced
  # target, oldest first.
  def tags_sorted_by_committed_date
    tags.sort_by do |tag|
      # Annotated tags can point to any object (e.g. a blob), but generally
      # tags point to a commit. Without a commit we sort by the current time
      # instead, which puts the tag at the end of the list (as long as no
      # commit is dated in the future).
      commit = tag.dereferenced_target

      commit ? commit.committed_date : Time.now
    end
  end
D
Douwe Maan 已提交
1117 1118

  # Full name of the keep-around ref for `sha`: "refs/<REF_KEEP_AROUND>/<sha>".
  def keep_around_ref_name(sha)
    format('refs/%s/%s', REF_KEEP_AROUND, sha)
  end
Y
Yorick Peterse 已提交
1121 1122

  # Records `event` through Gitlab::Metrics.add_event.
  #
  # tags - Extra tags for the event (default: {}). They are merged over
  #        `{ path: full_path }`, so a `:path` entry in `tags` takes
  #        precedence.
  def repository_event(event, tags = {})
    event_tags = { path: full_path }.merge(tags)

    Gitlab::Metrics.add_event(event, event_tags)
  end
1125

1126 1127
  # Asks the Gitaly commit client of the raw repository for the last commit
  # touching `path` as of `sha`, then resolves the answer via `commit_by`.
  def last_commit_for_path_by_gitaly(sha, path)
    commit_client = raw_repository.gitaly_commit_client
    last_commit = commit_client.last_commit_for_path(sha, path)

    commit_by(oid: last_commit)
  end

  # Resolves the id of the last commit touching `path` as of `sha` with
  # `last_commit_id_for_path_by_shelling_out`, then looks the commit up via
  # `commit_by`.
  def last_commit_for_path_by_rugged(sha, path)
    last_commit_id = last_commit_id_for_path_by_shelling_out(sha, path)

    commit_by(oid: last_commit_id)
  end

  # Runs `git rev-list --max-count=1 <sha> -- <path>` on the raw repository,
  # bounded by Gitlab::Git::Popen::FAST_GIT_PROCESS_TIMEOUT, and returns the
  # first element of the result with surrounding whitespace stripped.
  def last_commit_id_for_path_by_shelling_out(sha, path)
    git_args = ['rev-list', '--max-count=1', "#{sha}", '--', "#{path}"]
    timeout = Gitlab::Git::Popen::FAST_GIT_PROCESS_TIMEOUT

    raw_output = raw_repository.run_git_with_timeout(git_args, timeout).first
    raw_output.strip
  end

1141 1142 1143
  # Storage path of the repository, as reported by @project.
  def repository_storage_path
    owner = @project
    owner.repository_storage_path
  end
1144

1145
  # Builds the Gitlab::Git::Repository for this repository from the project's
  # repository storage, `disk_path` with a `.git` suffix, and the identifier
  # returned by Gitlab::GlRepository.gl_repository for the project / wiki flag.
  def initialize_raw_repository
    storage = project.repository_storage
    git_dir = disk_path + '.git'
    gl_repository = Gitlab::GlRepository.gl_repository(project, is_wiki)

    Gitlab::Git::Repository.new(storage, git_dir, gl_repository)
  end
1148

1149 1150 1151 1152 1153 1154 1155 1156 1157 1158 1159 1160 1161 1162 1163 1164 1165 1166 1167 1168
  # Finds commits whose message matches `query` by running `git log --grep`
  # (case-insensitive) through `run_git`.
  #
  # query  - Pattern handed to `--grep`.
  # ref    - Ref to start from; `root_ref` is used when it is nil.
  # path   - Optional path to restrict the log to.
  # limit  - Value for `--max-count`.
  # offset - Value for `--skip`.
  #
  # Each printed commit id is resolved with `commit`; ids that resolve to nil
  # are dropped from the returned Array.
  def find_commits_by_message_by_shelling_out(query, ref, path, limit, offset)
    start_ref = ref || root_ref

    git_args = [
      'log', "#{start_ref}", '--pretty=%H',
      '--skip', "#{offset}",
      '--max-count', "#{limit}",
      "--grep=#{query}", '--regexp-ignore-case'
    ]
    git_args.push('--', "#{path}") if path.present?

    commit_ids = run_git(git_args).first.lines

    commit_ids.map { |id_line| commit(id_line.chomp) }.compact
  end

  # Finds commits whose message matches `query` through the Gitaly commit
  # client of the raw repository (`commits_by_message`), then maps every
  # result through `commit`.
  #
  # `ref` is passed to the client as `revision`; `path`, `limit` and `offset`
  # are forwarded unchanged.
  def find_commits_by_message_by_gitaly(query, ref, path, limit, offset)
    commit_client = raw_repository.gitaly_commit_client
    matches = commit_client.commits_by_message(query, revision: ref, path: path, limit: limit, offset: offset)

    matches.map { |match| commit(match) }
  end
1169
end