repository.rb 17.7 KB
Newer Older
1 2
require 'securerandom'

3
class Repository
4 5
  # Raised by commit_with_hooks when no commit could be created or when the
  # target branch moved while hooks were running.
  class CommitError < StandardError; end

6 7
  include Gitlab::ShellAdapter

8
  attr_accessor :path_with_namespace, :project
9

J
Jacob Vosmaer 已提交
10 11 12 13 14 15 16 17
  # Remove downloaded archives older than 2 hours.
  #
  # Runs `find <dir> -not -path <dir> -mmin +120 -delete` against the
  # configured repository downloads directory, so the directory itself is
  # kept. Does nothing (returns nil) when that directory does not exist.
  def self.clean_old_archives
    downloads_dir = Gitlab.config.gitlab.repository_downloads_path

    if File.directory?(downloads_dir)
      find_command = %W(find #{downloads_dir} -not -path #{downloads_dir} -mmin +120 -delete)
      Gitlab::Popen.popen(find_command)
    end
  end

18
  # path_with_namespace - repository path relative to the repos root,
  #                       without the ".git" suffix (see path_to_repo)
  # project             - project passed along when wrapping commits
  def initialize(path_with_namespace, project)
    @path_with_namespace = path_with_namespace
    @project = project
  end
22

23 24
  # Memoized Gitlab::Git::Repository for path_to_repo.
  #
  # Returns nil when path_with_namespace is not set or when the repository
  # cannot be opened (Gitlab::Git::Repository::NoRepository). A nil result is
  # not memoized, so the lookup is retried on the next call.
  def raw_repository
    return nil unless path_with_namespace

    @raw_repository ||= begin
      Gitlab::Git::Repository.new(path_to_repo)
    rescue Gitlab::Git::Repository::NoRepository
      nil
    end
  end

33 34 35 36
  # Ensure the repository's autocrlf setting is :input, writing it only when
  # it currently has another value.
  def update_autocrlf_option
    return if raw_repository.autocrlf == :input

    raw_repository.autocrlf = :input
  end

37
  # Return absolute path to repository
38
  def path_to_repo
    # Memoized: <gitlab_shell repos_path>/<path_with_namespace>.git, expanded.
    @path_to_repo ||= File.expand_path(
      File.join(Gitlab.config.gitlab_shell.repos_path, path_with_namespace + ".git")
    )
  end

44 45 46 47 48
  # True when the underlying repository could be opened.
  #
  # Returns a real boolean rather than leaking the raw repository object (or
  # nil) out of a predicate method; truthiness is unchanged for callers.
  def exists?
    !raw_repository.nil?
  end

  # Whether the raw repository reports itself as empty.
  #
  # The answer is memoized in @empty and stored in the cache under :empty?;
  # expire_emptiness_caches clears both.
  def empty?
    return @empty unless @empty.nil?

    @empty = cache.fetch(:empty?) { raw_repository.empty? }
  end

54 55 56 57 58 59 60 61 62 63
  #
  # A Git repository can contain hidden refs such as:
  #   /refs/notes/*
  #   /refs/git-as-svn/*
  #   /refs/pulls/*
  # By default these refs are not visible on the project page and are not
  # cloned to the client side.
  #
  # This method returns true if the repository contains some content that is
  # visible on the project page.
  #
  def has_visible_content?
    # Memoized per instance and cached under :has_visible_content?.
    return @has_visible_content unless @has_visible_content.nil?

    # Visible content is defined here as "at least one branch exists".
    @has_visible_content = cache.fetch(:has_visible_content?) do
      raw_repository.branch_count > 0
    end
  end

71
  # Look up a single commit and wrap it in a Commit for @project.
  #
  # id - revision passed to Gitlab::Git::Commit.find (defaults to 'HEAD')
  #
  # Returns nil when there is no raw repository, when nothing is found, or
  # when the lookup raises Rugged::OdbError.
  def commit(id = 'HEAD')
    return nil unless raw_repository

    raw_commit = Gitlab::Git::Commit.find(raw_repository, id)
    raw_commit ? Commit.new(raw_commit, @project) : raw_commit
  rescue Rugged::OdbError
    nil
  end

D
Dmitriy Zaporozhets 已提交
80
  # List commits for +ref+ via Gitlab::Git::Commit.where and decorate them
  # for @project.
  #
  # path, limit, offset and skip_merges are passed through unchanged as the
  # :path, :limit, :offset and :skip_merges options.
  def commits(ref, path = nil, limit = nil, offset = nil, skip_merges = false)
    options = {
      repo: raw_repository,
      ref: ref,
      path: path,
      limit: limit,
      offset: offset,
      # --follow doesn't play well with --skip. See:
      # https://gitlab.com/gitlab-org/gitlab-ce/issues/3574#note_3040520
      follow: false,
      skip_merges: skip_merges
    }

    found = Gitlab::Git::Commit.where(options)
    found = Commit.decorate(found, @project) if found.present?
    found
  end

98 99
  # Commits returned by Gitlab::Git::Commit.between(from, to), decorated for
  # @project when the result is present.
  def commits_between(from, to)
    found = Gitlab::Git::Commit.between(raw_repository, from, to)
    found = Commit.decorate(found, @project) if found.present?
    found
  end

104 105 106
  # Find commits whose message matches +query+ using `git log --grep`.
  #
  # query  - pattern handed to --grep
  # ref    - ref to search (defaults to root_ref)
  # path   - optional path to restrict the log to
  # limit  - value for --max-count (1000 by default)
  # offset - value for --skip
  #
  # Returns one entry per SHA printed by git, each resolved through #commit.
  def find_commits_by_message(query, ref = nil, path = nil, limit = 1000, offset = 0)
    ref ||= root_ref

    # Arguments are passed as an array, so interpolated values are never
    # split on whitespace.
    args = %W(#{Gitlab.config.git.bin_path} log #{ref} --pretty=%H --skip #{offset} --max-count #{limit} --grep=#{query})
    args.concat(%W(-- #{path})) if path.present?

    shas = Gitlab::Popen.popen(args, path_to_repo).first.lines.map(&:chomp)
    shas.map { |sha| commit(sha) }
  end

116
  # First branch of the raw repository whose name equals +name+, or nil.
  def find_branch(name)
    raw_repository.branches.find { |branch| branch.name == name }
  end

  # First tag of the raw repository whose name equals +name+, or nil.
  def find_tag(name)
    raw_repository.tags.find { |tag| tag.name == name }
  end

124 125 126 127 128 129 130 131 132 133
  # Create +branch_name+ pointing at +target+, running git hooks around the
  # creation.
  #
  # target is resolved through #commit first; returns false when it does not
  # resolve. Otherwise the branch cache is expired and the new branch (as
  # found by find_branch) is returned.
  def add_branch(user, branch_name, target)
    oldrev = Gitlab::Git::BLANK_SHA
    ref    = Gitlab::Git::BRANCH_REF_PREFIX + branch_name
    target = commit(target).try(:id)

    return false unless target

    GitHooksService.new.execute(user, path_to_repo, oldrev, target, ref) do
      rugged.branches.create(branch_name, target)
    end

    expire_branches_cache
    find_branch(branch_name)
  end

139
  # Expire the tag cache, then create the tag through gitlab_shell.
  #
  # Returns whatever gitlab_shell.add_tag returns.
  def add_tag(tag_name, ref, message = nil)
    expire_tags_cache

    gitlab_shell.add_tag(path_with_namespace, tag_name, ref, message)
  end

145
  # Delete +branch_name+, running git hooks around the deletion.
  #
  # The branch cache is expired both before looking the branch up and after
  # deleting it. Always returns true when no exception is raised.
  def rm_branch(user, branch_name)
    expire_branches_cache

    branch = find_branch(branch_name)
    oldrev = branch.try(:target)
    newrev = Gitlab::Git::BLANK_SHA
    ref    = Gitlab::Git::BRANCH_REF_PREFIX + branch_name

    GitHooksService.new.execute(user, path_to_repo, oldrev, newrev, ref) do
      rugged.branches.delete(branch_name)
    end

    expire_branches_cache
    true
  end

161
  # Expire the tag cache, then remove the tag through gitlab_shell.
  #
  # Returns whatever gitlab_shell.rm_tag returns.
  def rm_tag(tag_name)
    expire_tags_cache

    gitlab_shell.rm_tag(path_with_namespace, tag_name)
  end

167
  # Branch names of the raw repository, cached under :branch_names.
  def branch_names
    cache.fetch(:branch_names) { raw_repository.branch_names }
  end

  # Tag names of the raw repository, cached under :tag_names.
  def tag_names
    cache.fetch(:tag_names) { raw_repository.tag_names }
  end

175
  # Number of commits on root_ref, cached under :commit_count.
  #
  # Any StandardError raised while counting is swallowed and 0 is returned
  # (and cached) instead.
  def commit_count
    cache.fetch(:commit_count) do
      begin
        raw_repository.commit_count(root_ref)
      rescue
        0
      end
    end
  end

185 186 187
  # Return repo size in megabytes
  # Cached in redis
  def size
    # Delegates to the raw repository; stored under the :size cache key.
    cache.fetch(:size) { raw_repository.size }
  end
190

191
  # How far +branch+ has diverged from the root ref.
  #
  # Returns a hash { behind: n, ahead: m }, cached per branch name under
  # :"diverging_commit_counts_<name>". The root ref is only resolved on a
  # cache miss.
  def diverging_commit_counts(branch)
    cache.fetch(:"diverging_commit_counts_#{branch.name}") do
      # Rugged seems to throw a `ReferenceError` when given branch_names rather
      # than SHA-1 hashes
      root_ref_hash = raw_repository.rev_parse_target(root_ref).oid

      number_commits_behind = raw_repository.
        count_commits_between(branch.target, root_ref_hash)

      number_commits_ahead = raw_repository.
        count_commits_between(root_ref_hash, branch.target)

      { behind: number_commits_behind, ahead: number_commits_ahead }
    end
  end
205

206
  # Cache keys that build_cache, rebuild_cache and expire_cache iterate over.
  # Each key is also the name of the method that populates it.
  def cache_keys
    %i(size branch_names tag_names commit_count
       readme version contribution_guide changelog license)
  end
210

211 212 213 214 215 216
  # Populate every cache entry that does not exist yet: one per cache key
  # (by calling the method of the same name) and one diverging-commit-count
  # entry per branch.
  def build_cache
    cache_keys.each do |key|
      send(key) unless cache.exist?(key)
    end

    branches.each do |branch|
      unless cache.exist?(:"diverging_commit_counts_#{branch.name}")
        diverging_commit_counts(branch)
      end
    end
  end

D
Douwe Maan 已提交
225 226 227 228 229 230 231 232 233 234
  # Drop the cached tag names and the memoized tag list (@tags).
  def expire_tags_cache
    cache.expire(:tag_names)
    @tags = nil
  end

  # Drop the cached branch names and the memoized branch list (@branches).
  def expire_branches_cache
    cache.expire(:branch_names)
    @branches = nil
  end

235
  # Expire every entry listed in cache_keys, then the diverging commit count
  # caches for +branch_name+ (see expire_branch_cache for how nil is handled).
  def expire_cache(branch_name = nil)
    cache_keys.each do |key|
      cache.expire(key)
    end

    expire_branch_cache(branch_name)
  end
242

243 244 245 246 247 248 249 250 251
  # Expires _all_ caches, including those that would normally only be expired
  # under specific conditions.
  def expire_all_caches!
    expire_cache
    expire_root_ref_cache
    expire_emptiness_caches
    # NOTE(review): expire_emptiness_caches already calls
    # expire_has_visible_content_cache, so this call looks redundant.
    expire_has_visible_content_cache
  end

252 253 254 255 256 257 258 259 260 261 262 263
  # Expire the diverging commit count cache for one branch or for all of them.
  #
  # branch_name - branch that was pushed to; nil means "all branches"
  def expire_branch_cache(branch_name = nil)
    if branch_name && branch_name != root_ref
      # In case a commit is pushed to a non-root branch we only have to flush
      # the cache for said branch.
      cache.expire(:"diverging_commit_counts_#{branch_name}")
    else
      # When we push to the root branch we have to flush the cache for all
      # other branches as their statistics are based on the commits relative
      # to the root branch.
      branches.each do |branch|
        cache.expire(:"diverging_commit_counts_#{branch.name}")
      end
    end
  end

267 268 269 270 271
  # Drop the cached root ref and its memoized copy (@root_ref).
  def expire_root_ref_cache
    cache.expire(:root_ref)
    @root_ref = nil
  end

272 273 274 275 276 277 278 279
  # Expires the cache(s) used to determine if a repository is empty or not.
  def expire_emptiness_caches
    # Clear both the cache entry and the memoized value used by #empty?.
    cache.expire(:empty?)
    @empty = nil

    # The visible-content cache is expired together with the emptiness cache.
    expire_has_visible_content_cache
  end

280 281 282 283 284
  # Drop the cached and memoized answer of #has_visible_content?.
  def expire_has_visible_content_cache
    cache.expire(:has_visible_content?)
    @has_visible_content = nil
  end

285 286
  # Expire and immediately recompute every cache_keys entry and every
  # per-branch diverging commit count.
  def rebuild_cache
    cache_keys.each do |key|
      cache.expire(key)
      send(key)
    end

    branches.each do |branch|
      cache.expire(:"diverging_commit_counts_#{branch.name}")
      diverging_commit_counts(branch)
    end
  end

297 298 299 300
  # Per-instance memo hash used by method_missing to remember :lookup results.
  def lookup_cache
    @lookup_cache ||= {}
  end

301 302 303 304
  # Expire the cached branch names.
  #
  # Delegates to expire_branches_cache so the memoized branch list is reset
  # as well; expiring only the cache entry would leave #branches stale.
  def expire_branch_names
    expire_branches_cache
  end

305
  # Forward unknown methods to the raw repository.
  #
  # Calls to :lookup without a block are memoized in lookup_cache, keyed by
  # the arguments joined with ":"; everything else is forwarded as is.
  def method_missing(m, *args, &block)
    if m == :lookup && !block_given?
      lookup_cache[m] ||= {}
      lookup_cache[m][args.join(":")] ||= raw_repository.send(m, *args, &block)
    else
      raw_repository.send(m, *args, &block)
    end
  end

314 315
  # Report the raw repository's methods as our own, matching method_missing.
  def respond_to_missing?(method, include_private = false)
    raw_repository.respond_to?(method, include_private) || super
  end
D
Dmitriy Zaporozhets 已提交
317 318

  # Blob at +path+ in revision +sha+, or nil when +sha+ is a blank ref.
  def blob_at(sha, path)
    unless Gitlab::Git.blank_ref?(sha)
      Gitlab::Git::Blob.find(self, sha, path)
    end
  end
323

324 325 326 327
  # Fetch a blob directly by its object id via Gitlab::Git::Blob.raw.
  def blob_by_oid(oid)
    Gitlab::Git::Blob.raw(self, oid)
  end

328
  # Readme of the head tree, cached under :readme.
  def readme
    cache.fetch(:readme) { tree(:head).readme }
  end
331

332
  # First blob in the head tree named "version" (case-insensitive), cached
  # under :version. nil when there is none.
  def version
    cache.fetch(:version) do
      tree(:head).blobs.find do |file|
        file.name.downcase == 'version'
      end
    end
  end

340
  # First blob in the head tree that answers true to #contributing?, cached
  # under :contribution_guide.
  def contribution_guide
    cache.fetch(:contribution_guide) do
      tree(:head).blobs.find do |file|
        file.contributing?
      end
    end
  end
347 348 349 350

  # First blob in the head tree whose name starts with "changelog" or
  # "history" (case-insensitive), cached under :changelog.
  def changelog
    cache.fetch(:changelog) do
      tree(:head).blobs.find do |file|
        file.name =~ /\A(changelog|history)/i
      end
    end
  end

356 357
  # Best license file in the head tree, cached under :license.
  #
  # Candidates are blobs whose name starts with "copying", "license" or
  # "licence" (case-insensitive). Among them the first one matching the
  # earliest entry of +preferences+ wins; nil when nothing matches.
  def license
    cache.fetch(:license) do
      candidates = tree(:head).blobs.find_all do |file|
        file.name =~ /\A(copying|license|licence)/i
      end

      # Ordered from most to least preferred.
      preferences = [
        /\Alicen[sc]e\z/i,        # LICENSE, LICENCE
        /\Alicen[sc]e\./i,        # LICENSE.md, LICENSE.txt
        /\Acopying\z/i,           # COPYING
        /\Acopying\.(?!lesser)/i, # COPYING.txt
        /\Acopying\.lesser/i      # COPYING.LESSER
      ]

      preferred = nil
      preferences.each do |pattern|
        preferred = candidates.find { |blob| blob.name =~ pattern }
        break if preferred
      end

      preferred
    end
  end

380
  # Memoized commit that root_ref points at.
  def head_commit
    @head_commit ||= commit(root_ref)
  end

  # Memoized root tree (path nil) of head_commit.
  def head_tree
    @head_tree ||= Tree.new(self, head_commit.sha, nil)
  end

  # Tree at +path+ for revision +sha+.
  #
  # sha  - revision, or :head for the head commit
  # path - path inside the tree (nil for the root)
  #
  # The root tree of :head is served from the memoized head_tree.
  def tree(sha = :head, path = nil)
    if sha == :head
      return head_tree if path.nil?

      sha = head_commit.sha
    end

    Tree.new(self, sha, path)
  end
D
Dmitriy Zaporozhets 已提交
399 400

  # Blob at +path+ in the commit that +branch_name+ resolves to, or nil when
  # the branch does not resolve to a commit.
  def blob_at_branch(branch_name, path)
    last_commit = commit(branch_name)

    blob_at(last_commit.sha, path) if last_commit
  end
D
Dmitriy Zaporozhets 已提交
409 410 411 412 413 414 415 416

  # Returns url for submodule
  #
  # Ex.
  #   @repository.submodule_url_for('master', 'rack')
  #   # => git@localhost:rack.git
  #
  def submodule_url_for(ref, path)
    # Fetch the submodule list once; it is resolved by the raw repository.
    modules = submodules(ref)
    return unless modules.any?

    submodule = modules[path]
    submodule['url'] if submodule
  end
425 426

  # Most recent commit reachable from +sha+ that touched +path+, found with
  # `git rev-list --max-count=1` and resolved through #commit.
  def last_commit_for_path(sha, path)
    args = %W(#{Gitlab.config.git.bin_path} rev-list --max-count=1 #{sha} -- #{path})
    last_sha = Gitlab::Popen.popen(args, path_to_repo).first.strip
    commit(last_sha)
  end
431

432 433 434 435 436 437 438 439 440 441 442
  # Name for the next "patch-N" branch: one more than the highest N among
  # existing branches named exactly "patch-<digits>", or "patch-1" when there
  # are none.
  def next_patch_branch
    highest_id = 0

    self.branch_names.each do |name|
      matched = name.match(/\Apatch-([0-9]+)\z/)
      next unless matched

      id = matched[1].to_i
      highest_id = id if id > highest_id
    end

    "patch-#{highest_id + 1}"
  end

443
  # Sort branches by the committed date of the commit they point at
444 445 446 447 448 449 450 451 452 453 454 455 456 457
  # value - 'recently_updated' orders newest commit first, 'last_updated'
  #         orders oldest commit first; any other value returns the branches
  #         unsorted.
  def branches_sorted_by(value)
    case value
    when 'recently_updated', 'last_updated'
      # Resolve each target's committed date at most once instead of on
      # every comparison.
      dates = Hash.new do |memo, target|
        memo[target] = commit(target).committed_date
      end

      if value == 'recently_updated'
        branches.sort { |a, b| dates[b.target] <=> dates[a.target] }
      else
        branches.sort { |a, b| dates[a.target] <=> dates[b.target] }
      end
    else
      branches
    end
  end
458 459

  # Build one Gitlab::Contributor per author email.
  #
  # Looks at up to 2000 commits with merges skipped (see the arguments passed
  # to #commits). Each contributor gets the email, the first non-blank author
  # name seen for that email, and a count of their commits.
  def contributors
    recent_commits = self.commits(nil, nil, 2000, 0, true)

    recent_commits.group_by(&:author_email).map do |email, authored|
      contributor = Gitlab::Contributor.new
      contributor.email = email

      authored.each do |authored_commit|
        if contributor.name.blank?
          contributor.name = authored_commit.author_name
        end

        contributor.commits += 1
      end

      contributor
    end
  end
D
Dmitriy Zaporozhets 已提交
477 478

  # Blob for the diff's file path as of +commit+.
  def blob_for_diff(commit, diff)
    blob_at(commit.id, diff.file_path)
  end

  # Blob for the diff's old path as of the commit's parent; nil when the
  # commit has no parent id.
  def prev_blob_for_diff(commit, diff)
    blob_at(commit.parent_id, diff.old_path) if commit.parent_id
  end
487

488 489
  # Names of refs of +ref_type+ that contain +sha+.
  #
  # ref_type - git subcommand to run with `--contains` ('branch' or 'tag' in
  #            the callers visible in this class)
  #
  # Returns an array of names with surrounding whitespace and the "* "
  # marker removed, or [] when git produced no splittable output.
  def refs_contains_sha(ref_type, sha)
    args = %W(#{Gitlab.config.git.bin_path} #{ref_type} --contains #{sha})
    output = Gitlab::Popen.popen(args, path_to_repo).first

    return [] unless output.respond_to?(:split)

    output.split("\n").map do |line|
      name = line.strip
      name.slice!('* ')
      name
    end
  end
H
Hannes Rosenögger 已提交
504

505 506 507
  # Names of the branches that contain +sha+ (via `git branch --contains`).
  def branch_names_contains(sha)
    refs_contains_sha('branch', sha)
  end
H
Hannes Rosenögger 已提交
508

509 510
  # Names of the tags that contain +sha+ (via `git tag --contains`).
  def tag_names_contains(sha)
    refs_contains_sha('tag', sha)
  end
512

513 514 515 516 517 518 519 520 521
  # Memoized branch list of the raw repository; reset by expire_branches_cache.
  def branches
    @branches ||= raw_repository.branches
  end

  # Memoized tag list of the raw repository; reset by expire_tags_cache.
  def tags
    @tags ||= raw_repository.tags
  end

  # Root ref of the raw repository, memoized in @root_ref and cached under
  # :root_ref; expire_root_ref_cache clears both.
  def root_ref
    @root_ref ||= cache.fetch(:root_ref) { raw_repository.root_ref }
  end

S
Stan Hu 已提交
525
  # Create directory +path+ on +branch+ in a new commit authored and
  # committed by +user+, going through commit_with_hooks.
  def commit_dir(user, path, message, branch)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        }
      }

      raw_repository.mkdir(path, options)
    end
  end
540

S
Stan Hu 已提交
541 542 543
  # Write +content+ to +path+ on +branch+ in a new commit authored and
  # committed by +user+, going through commit_with_hooks.
  #
  # update - passed through as the :update flag of the file options
  def commit_file(user, path, content, message, branch, update)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        },
        file: {
          content: content,
          path: path,
          update: update
        }
      }

      Gitlab::Git::Blob.commit(raw_repository, options)
    end
  end

562
  # Remove +path+ from +branch+ in a new commit authored and committed by
  # +user+, going through commit_with_hooks.
  def remove_file(user, path, message, branch)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        },
        file: {
          path: path
        }
      }

      Gitlab::Git::Blob.remove(raw_repository, options)
    end
  end

S
Stan Hu 已提交
581
  # Committer/author hash for +user+: their email and name plus the current
  # time.
  def user_to_committer(user)
    {
      email: user.email,
      name: user.name,
      time: Time.now
    }
  end

  # Whether +source_sha+ merges into +target_branch+ without conflicts.
  #
  # Returns false when the target branch does not exist, when either side
  # resolves to nothing, or when the trial merge reports conflicts.
  def can_be_merged?(source_sha, target_branch)
    # rugged.branches[...] is nil for an unknown branch; guard before
    # dereferencing so the nil check below is actually reachable.
    target = rugged.branches[target_branch]
    our_commit = target && target.target
    their_commit = rugged.lookup(source_sha)

    if our_commit && their_commit
      !rugged.merge_commits(our_commit, their_commit).conflicts?
    else
      false
    end
  end

600
  # Merge +source_sha+ into +target_branch+ as +user+.
  #
  # options - extra options for Rugged::Commit.create; :parents, :tree and
  #           :update_ref are always set here
  #
  # Returns false when the merge has conflicts, otherwise the result of
  # commit_with_hooks. Raises RuntimeError ("Invalid merge target" /
  # "Invalid merge source") when either side cannot be resolved.
  def merge(user, source_sha, target_branch, options = {})
    # An unknown branch yields nil; guard so the "Invalid merge target"
    # error below is raised instead of a NoMethodError.
    target = rugged.branches[target_branch]
    our_commit = target && target.target
    their_commit = rugged.lookup(source_sha)

    raise "Invalid merge target" if our_commit.nil?
    raise "Invalid merge source" if their_commit.nil?

    merge_index = rugged.merge_commits(our_commit, their_commit)
    return false if merge_index.conflicts?

    commit_with_hooks(user, target_branch) do |ref|
      actual_options = options.merge(
        parents: [our_commit, their_commit],
        tree: merge_index.write_tree(rugged),
        update_ref: ref
      )

      Rugged::Commit.create(rugged, actual_options)
    end
  end

F
Florent (HP) 已提交
621 622 623 624 625
  # Whether the commit +branch_name+ resolves to is an ancestor of the root
  # ref's commit. Returns nil when the branch does not resolve to a commit.
  def merged_to_root_ref?(branch_name)
    branch_commit = commit(branch_name)
    root_ref_commit = commit(root_ref)

    is_ancestor?(branch_commit.id, root_ref_commit.id) if branch_commit
  end

S
Stan Hu 已提交
632
  # Merge base of two revisions as reported by rugged.
  #
  # Each argument is first resolved through #commit; when that yields nothing
  # the argument is passed to rugged unchanged. Returns nil on
  # Rugged::ReferenceError.
  def merge_base(first_commit_id, second_commit_id)
    first_commit_id = commit(first_commit_id).try(:id) || first_commit_id
    second_commit_id = commit(second_commit_id).try(:id) || second_commit_id
    rugged.merge_base(first_commit_id, second_commit_id)
  rescue Rugged::ReferenceError
    nil
  end

640 641 642 643 644
  # True when the merge base of the two ids is +ancestor_id+ itself.
  def is_ancestor?(ancestor_id, descendant_id)
    merge_base(ancestor_id, descendant_id) == ancestor_id
  end


645 646
  # Case-insensitive `git grep` for +query+ in +ref+ (root_ref when nil),
  # skipping binary files, with two lines of context around each match.
  #
  # Returns the output split on git's "--" separator lines, one chunk per
  # group of matches; parse_search_result turns a chunk into a struct.
  def search_files(query, ref)
    context_lines = 2
    args = %W(#{Gitlab.config.git.bin_path} grep -i -I -n --before-context #{context_lines} --after-context #{context_lines} -e #{query} #{ref || root_ref})
    Gitlab::Popen.popen(args, path_to_repo).first.scrub.split(/^--$/)
  end

D
Dmitriy Zaporozhets 已提交
651
  # Turn one chunk of `git grep -n` output into a struct.
  #
  # The first line shaped like "<ref>:<file>:<line>:" supplies ref, filename
  # and the line number of the match; startline is that number minus the
  # line's index in the chunk. data is the chunk with the ref, filename and
  # line-number prefixes stripped from each line.
  #
  # Returns an OpenStruct with filename, ref, startline and data. When no
  # line matches, filename and ref are nil, startline is 0 and data is the
  # chunk with only the line-number prefixes stripped.
  def parse_search_result(result)
    ref = nil
    filename = nil
    startline = 0

    result.each_line.each_with_index do |line, index|
      if line =~ /^.*:.*:\d+:/
        ref, filename, startline = line.split(':')
        startline = startline.to_i - index
        break
      end
    end

    # to_s keeps String#sub from raising TypeError when nothing matched above.
    ref_prefix = ref.to_s
    file_prefix = filename.to_s

    data = result.each_line.map do |line|
      line.sub(ref_prefix, '').sub(file_prefix, '').sub(/^:-\d+-/, '').sub(/^::\d+:/, '')
    end.join

    OpenStruct.new(
      filename: filename,
      ref: ref,
      startline: startline,
      data: data
    )
  end

678
  # Force-fetch +source_ref+ from the repository at +source_path+ into
  # +target_ref+ of this repository. Returns the Gitlab::Popen.popen result.
  def fetch_ref(source_path, source_ref, target_ref)
    args = %W(#{Gitlab.config.git.bin_path} fetch -f #{source_path} #{source_ref}:#{target_ref})
    Gitlab::Popen.popen(args, path_to_repo)
  end

683
  # Yield the name of a temporary ref (refs/tmp/<random hex>/head) and delete
  # that ref afterwards.
  #
  # oldrev - when given and not a blank ref, the temporary ref is created
  #          pointing at it before yielding
  #
  # Returns the block's value.
  def with_tmp_ref(oldrev = nil)
    random_string = SecureRandom.hex
    tmp_ref = "refs/tmp/#{random_string}/head"

    if oldrev && !Gitlab::Git.blank_ref?(oldrev)
      rugged.references.create(tmp_ref, oldrev)
    end

    # Make commit in tmp ref
    yield(tmp_ref)
  ensure
    # Best-effort cleanup: failures while deleting the ref are ignored.
    begin
      rugged.references.delete(tmp_ref)
    rescue StandardError
      nil
    end
  end

  # Run a commit-producing block against a temporary ref, then move +branch+
  # to the new commit inside the git hooks.
  #
  # The block receives the temporary ref name and must return the new
  # revision. Raises CommitError when the block returns nothing, or when the
  # branch no longer points at the revision it had when this method started.
  def commit_with_hooks(current_user, branch)
    update_autocrlf_option

    oldrev = Gitlab::Git::BLANK_SHA
    ref = Gitlab::Git::BRANCH_REF_PREFIX + branch
    was_empty = empty?

    unless was_empty
      oldrev = find_branch(branch).target
    end

    with_tmp_ref(oldrev) do |tmp_ref|
      # Make commit in tmp ref
      newrev = yield(tmp_ref)

      unless newrev
        raise CommitError, 'Failed to create commit'
      end

      GitHooksService.new.execute(current_user, path_to_repo, oldrev, newrev, ref) do
        if was_empty
          # Create branch
          rugged.references.create(ref, newrev)
        else
          # Update head
          current_head = find_branch(branch).target

          # Make sure target branch was not changed during pre-receive hook
          if current_head == oldrev
            rugged.references.update(ref, newrev)
          else
            raise CommitError, 'Commit was rejected because branch received new push'
          end
        end
      end
    end
  end

735 736 737 738 739
  # File listing of the raw repository at +ref+, falling back to root_ref
  # when +ref+ is nil.
  def ls_files(ref)
    raw_repository.ls_files(ref || root_ref)
  end

740 741
  private

742 743 744
  # Memoized RepositoryCache for this repository's path_with_namespace.
  def cache
    @cache ||= RepositoryCache.new(path_with_namespace)
  end
745
end