repository.rb 17.7 KB
Newer Older
1 2
require 'securerandom'

3
class Repository
4 5
  # Error raised by this class when a commit cannot be created or applied.
  class CommitError < StandardError
  end

6 7
  include Gitlab::ShellAdapter

8
  attr_accessor :path_with_namespace, :project
9

J
Jacob Vosmaer 已提交
10 11 12 13 14 15 16 17
  # Removes entries below the configured repository downloads directory that
  # were last modified more than 120 minutes ago (`find ... -mmin +120 -delete`).
  # Returns nil without running anything when the directory does not exist.
  def self.clean_old_archives
    downloads_dir = Gitlab.config.gitlab.repository_downloads_path

    if File.directory?(downloads_dir)
      find_cmd = %W(find #{downloads_dir} -not -path #{downloads_dir} -mmin +120 -delete)
      Gitlab::Popen.popen(find_cmd)
    end
  end

18
  # Stores the namespaced repository path and the project this repository
  # belongs to.
  def initialize(path_with_namespace, project)
    @project = project
    @path_with_namespace = path_with_namespace
  end
22

23 24
  # Memoized Gitlab::Git::Repository built from path_to_repo.
  # Returns nil when path_with_namespace is not set.
  def raw_repository
    if path_with_namespace
      @raw_repository ||= Gitlab::Git::Repository.new(path_to_repo)
    end
  end

29 30 31 32
  # Sets the repository's autocrlf option to :input, writing only when the
  # current value differs.
  def update_autocrlf_option
    return if raw_repository.autocrlf == :input

    raw_repository.autocrlf = :input
  end

33
  # Absolute path to the repository: "<path_with_namespace>.git" joined onto
  # the configured gitlab-shell repos_path. The result is memoized.
  def path_to_repo
    @path_to_repo ||= begin
      repos_root = Gitlab.config.gitlab_shell.repos_path
      File.expand_path(File.join(repos_root, path_with_namespace + ".git"))
    end
  end

40
  # True when `raw_repository.rugged` can be accessed; false when that raises
  # Gitlab::Git::Repository::NoRepository.
  def exists?
    begin
      raw_repository.rugged
      true
    rescue Gitlab::Git::Repository::NoRepository
      false
    end
  end

  # Whether the raw repository is empty. The answer is kept both in the
  # repository cache (key :empty?) and in an instance variable.
  def empty?
    if @empty.nil?
      @empty = cache.fetch(:empty?) { raw_repository.empty? }
    end

    @empty
  end

53 54 55 56 57 58 59 60 61 62
  #
  # A Git repository can contain hidden refs such as:
  #   /refs/notes/*
  #   /refs/git-as-svn/*
  #   /refs/pulls/*
  # These refs are not visible on the project page by default and are not
  # cloned to the client side.
  #
  # This method returns true if the repository has at least one branch, i.e.
  # some content that is visible on the project page. The result is cached.
  #
  def has_visible_content?
    if @has_visible_content.nil?
      @has_visible_content = cache.fetch(:has_visible_content?) do
        raw_repository.branch_count > 0
      end
    end

    @has_visible_content
  end

70
  # Looks up a commit by id (defaults to 'HEAD') and wraps it in a Commit
  # bound to this project.
  #
  # Returns nil when there is no raw repository or when Rugged raises an
  # OdbError; a falsy lookup result is returned unchanged.
  def commit(id = 'HEAD')
    return nil unless raw_repository

    raw_commit = Gitlab::Git::Commit.find(raw_repository, id)
    raw_commit ? Commit.new(raw_commit, @project) : raw_commit
  rescue Rugged::OdbError
    nil
  end

D
Dmitriy Zaporozhets 已提交
79
  # Queries Gitlab::Git::Commit.where for commits on `ref`, optionally limited
  # to `path`, paginated by `limit`/`offset`, and optionally skipping merges.
  # A non-blank result is decorated with this project.
  def commits(ref, path = nil, limit = nil, offset = nil, skip_merges = false)
    found = Gitlab::Git::Commit.where(
      repo: raw_repository,
      ref: ref,
      path: path,
      limit: limit,
      offset: offset,
      # --follow doesn't play well with --skip. See:
      # https://gitlab.com/gitlab-org/gitlab-ce/issues/3574#note_3040520
      follow: false,
      skip_merges: skip_merges
    )

    found.present? ? Commit.decorate(found, @project) : found
  end

97 98
  # Commits between `from` and `to` as returned by Gitlab::Git::Commit.between,
  # decorated with this project when the result is not blank.
  def commits_between(from, to)
    range = Gitlab::Git::Commit.between(raw_repository, from, to)

    range.present? ? Commit.decorate(range, @project) : range
  end

103 104 105
  # Runs `git log --grep` for `query` on `ref` (the root ref by default),
  # optionally restricted to `path`, and returns the matching commits.
  #
  # limit  - maximum number of commits (--max-count), 1000 by default
  # offset - number of commits to skip (--skip), 0 by default
  def find_commits_by_message(query, ref = nil, path = nil, limit = 1000, offset = 0)
    ref ||= root_ref

    git_log = %W(#{Gitlab.config.git.bin_path} log #{ref} --pretty=%H --skip #{offset} --max-count #{limit} --grep=#{query})
    git_log = git_log.concat(%W(-- #{path})) if path.present?

    output = Gitlab::Popen.popen(git_log, path_to_repo).first
    shas = output.lines.map(&:chomp)
    shas.map { |sha| commit(sha) }
  end

115
  # First raw-repository branch whose name equals `name`, or nil.
  def find_branch(name)
    raw_repository.branches.detect do |candidate|
      candidate.name == name
    end
  end

  # First raw-repository tag whose name equals `name`, or nil.
  def find_tag(name)
    raw_repository.tags.detect do |candidate|
      candidate.name == name
    end
  end

123 124 125 126 127 128 129 130 131 132
  # Creates `branch_name` pointing at the commit that `target` resolves to,
  # running the Git hooks around the creation.
  #
  # Returns false when `target` cannot be resolved to a commit; otherwise
  # expires the branch cache and returns the branch found by name.
  def add_branch(user, branch_name, target)
    blank_sha  = Gitlab::Git::BLANK_SHA
    ref        = Gitlab::Git::BRANCH_REF_PREFIX + branch_name
    target_sha = commit(target).try(:id)

    return false unless target_sha

    GitHooksService.new.execute(user, path_to_repo, blank_sha, target_sha, ref) do
      rugged.branches.create(branch_name, target_sha)
    end

    expire_branches_cache
    find_branch(branch_name)
  end

138
  # Expires the tag cache, then asks gitlab-shell to create `tag_name` at
  # `ref` with an optional `message`.
  def add_tag(tag_name, ref, message = nil)
    expire_tags_cache
    gitlab_shell.add_tag(path_with_namespace, tag_name, ref, message)
  end

144
  # Deletes `branch_name` through Rugged, running the Git hooks around the
  # deletion. The branch cache is expired before and after. Returns true.
  def rm_branch(user, branch_name)
    expire_branches_cache

    oldrev = find_branch(branch_name).try(:target)
    ref    = Gitlab::Git::BRANCH_REF_PREFIX + branch_name

    GitHooksService.new.execute(user, path_to_repo, oldrev, Gitlab::Git::BLANK_SHA, ref) do
      rugged.branches.delete(branch_name)
    end

    expire_branches_cache
    true
  end

160
  # Expires the tag cache, then asks gitlab-shell to remove `tag_name`.
  def rm_tag(tag_name)
    expire_tags_cache
    gitlab_shell.rm_tag(path_with_namespace, tag_name)
  end

166
  # Branch names of the raw repository, served from the cache when present.
  def branch_names
    cache.fetch(:branch_names) do
      raw_repository.branch_names
    end
  end

  # Tag names of the raw repository, served from the cache when present.
  def tag_names
    cache.fetch(:tag_names) do
      raw_repository.tag_names
    end
  end

174
  # Cached number of commits on the root ref. Any StandardError raised while
  # counting is swallowed and reported as 0.
  def commit_count
    cache.fetch(:commit_count) do
      begin
        raw_repository.commit_count(root_ref)
      rescue StandardError
        0
      end
    end
  end

184 185 186
  # Repository size as reported by raw_repository.size (in megabytes, per the
  # original note), served from the repository cache when present.
  def size
    cache.fetch(:size) do
      raw_repository.size
    end
  end
189

190
  # Number of commits `branch` is behind and ahead of the root ref.
  #
  # branch - object responding to `name` and `target`
  #
  # Returns a Hash `{ behind: Integer, ahead: Integer }`, cached per branch
  # name under "diverging_commit_counts_<name>".
  def diverging_commit_counts(branch)
    cache.fetch(:"diverging_commit_counts_#{branch.name}") do
      # Resolve the root ref inside the block so a cache hit does not pay for
      # a rev-parse whose result would be thrown away.
      #
      # Rugged seems to throw a `ReferenceError` when given branch_names rather
      # than SHA-1 hashes
      root_ref_hash = raw_repository.rev_parse_target(root_ref).oid

      number_commits_behind = raw_repository.
        count_commits_between(branch.target, root_ref_hash)

      number_commits_ahead = raw_repository.
        count_commits_between(root_ref_hash, branch.target)

      { behind: number_commits_behind, ahead: number_commits_ahead }
    end
  end
204

205
  # Cache keys that are built, expired and rebuilt together by build_cache,
  # expire_cache and rebuild_cache. Each key is also the name of a method on
  # this class.
  def cache_keys
    [
      :size, :branch_names, :tag_names, :commit_count,
      :readme, :version, :contribution_guide, :changelog, :license
    ]
  end
209

210 211 212 213 214 215
  # Fills every cache entry that does not exist yet: the entries listed in
  # cache_keys plus the diverging commit counts of each branch.
  def build_cache
    cache_keys.each do |key|
      send(key) unless cache.exist?(key)
    end

    branches.each do |branch|
      next if cache.exist?(:"diverging_commit_counts_#{branch.name}")

      send(:diverging_commit_counts, branch)
    end
  end

D
Douwe Maan 已提交
224 225 226 227 228 229 230 231 232 233
  # Drops the cached tag names and the memoized tags list.
  def expire_tags_cache
    cache.expire(:tag_names)

    @tags = nil
  end

  # Drops the cached branch names and the memoized branches list.
  def expire_branches_cache
    cache.expire(:branch_names)

    @branches = nil
  end

234
  # Expires every entry listed in cache_keys, then the diverging-commit-count
  # cache for `branch_name` (see expire_branch_cache for the nil case).
  def expire_cache(branch_name = nil)
    cache_keys.each { |key| cache.expire(key) }

    expire_branch_cache(branch_name)
  end
241

242 243 244 245 246 247 248 249 250
  # Expires _all_ caches, including the ones that are normally only expired
  # under specific conditions (root ref, emptiness, visible content).
  def expire_all_caches!
    expire_cache

    expire_root_ref_cache
    expire_emptiness_caches
    expire_has_visible_content_cache
  end

251 252 253 254 255 256 257 258 259 260 261 262
  # Expires cached diverging commit counts.
  #
  # With a non-root `branch_name` only that branch's entry is flushed. With no
  # branch name, or with the root branch, every branch's entry is flushed
  # because their statistics are computed relative to the root branch.
  def expire_branch_cache(branch_name = nil)
    if branch_name && branch_name != root_ref
      # A push to a non-root branch only invalidates that branch.
      cache.expire(:"diverging_commit_counts_#{branch_name}")
    else
      branches.each do |branch|
        cache.expire(:"diverging_commit_counts_#{branch.name}")
      end
    end
  end

266 267 268 269 270
  # Drops the cached root ref and its memoized value.
  def expire_root_ref_cache
    cache.expire(:root_ref)

    @root_ref = nil
  end

271 272 273 274 275 276 277 278
  # Expires the cache(s) used to decide whether the repository is empty:
  # the :empty? entry, its memoized value, and the visible-content cache.
  def expire_emptiness_caches
    cache.expire(:empty?)
    @empty = nil
    expire_has_visible_content_cache
  end

279 280 281 282 283
  # Drops the cached has_visible_content? answer and its memoized value.
  def expire_has_visible_content_cache
    cache.expire(:has_visible_content?)

    @has_visible_content = nil
  end

284 285
  # Expires and immediately recomputes every entry in cache_keys and the
  # diverging commit counts of every branch.
  def rebuild_cache
    cache_keys.each do |key|
      cache.expire(key)
      send(key)
    end

    branches.each do |branch|
      counts_key = :"diverging_commit_counts_#{branch.name}"
      cache.expire(counts_key)
      diverging_commit_counts(branch)
    end
  end

296 297 298 299
  # Per-instance Hash used by method_missing to memoize `lookup` calls.
  def lookup_cache
    @lookup_cache = {} unless @lookup_cache
    @lookup_cache
  end

300 301 302 303
  # Expires only the cached branch names (the memoized branches list is kept).
  def expire_branch_names
    cache.expire(:branch_names)
  end

304
  # Forwards unknown methods to raw_repository. Block-less `lookup` calls are
  # memoized in lookup_cache, keyed by the arguments joined with ":".
  def method_missing(m, *args, &block)
    unless m == :lookup && !block_given?
      return raw_repository.send(m, *args, &block)
    end

    lookup_cache[m] ||= {}
    memo = lookup_cache[m]
    memo[args.join(":")] ||= raw_repository.send(m, *args, &block)
  end

313 314
  # Reports methods that method_missing can forward to raw_repository, falling
  # back to the default answer otherwise.
  def respond_to_missing?(method, include_private = false)
    forwardable = raw_repository.respond_to?(method, include_private)
    forwardable || super
  end
D
Dmitriy Zaporozhets 已提交
316 317

  # Blob at `path` in revision `sha`; nil when `sha` is a blank ref.
  def blob_at(sha, path)
    return nil if Gitlab::Git.blank_ref?(sha)

    Gitlab::Git::Blob.find(self, sha, path)
  end
322

323 324 325 326
  # Raw blob for the given object id, via Gitlab::Git::Blob.raw.
  def blob_by_oid(oid)
    Gitlab::Git::Blob.raw(self, oid)
  end

327
  # Cached readme of the head tree.
  def readme
    cache.fetch(:readme) do
      tree(:head).readme
    end
  end
330

331
  # Cached blob from the head tree whose name is "version" (case-insensitive),
  # or nil when there is none.
  def version
    cache.fetch(:version) do
      tree(:head).blobs.find { |blob| blob.name.downcase == 'version' }
    end
  end

339
  # Cached first blob in the head tree that reports `contributing?`, or nil.
  def contribution_guide
    cache.fetch(:contribution_guide) do
      tree(:head).blobs.find { |blob| blob.contributing? }
    end
  end
346 347 348 349

  # Cached first blob in the head tree whose name starts with "changelog" or
  # "history" (case-insensitive), or nil.
  def changelog
    cache.fetch(:changelog) do
      tree(:head).blobs.find { |blob| blob.name =~ /\A(changelog|history)/i }
    end
  end

355 356
  # Cached license blob of the head tree, or nil when none is found.
  #
  # Candidates are blobs whose name starts with "copying", "license" or
  # "licence" (case-insensitive). Among them the first match of the ordered
  # `preferences` list wins, so e.g. LICENSE is preferred over COPYING.LESSER.
  def license
    cache.fetch(:license) do
      candidates = tree(:head).blobs.select do |file|
        file.name =~ /\A(copying|license|licence)/i
      end

      preferences = [
        /\Alicen[sc]e\z/i,        # LICENSE, LICENCE
        /\Alicen[sc]e\./i,        # LICENSE.md, LICENSE.txt
        /\Acopying\z/i,           # COPYING
        /\Acopying\.(?!lesser)/i, # COPYING.txt
        # The anchor needs its backslash and the dot must be escaped, otherwise
        # the pattern looks for a literal "Acopying" and never matches.
        /\Acopying\.lesser/i      # COPYING.LESSER
      ]

      chosen = nil
      preferences.each do |pattern|
        chosen = candidates.find { |file| file.name =~ pattern }
        break if chosen
      end

      chosen
    end
  end

379
  # Memoized commit that the root ref points at.
  def head_commit
    @head_commit ||= commit(root_ref)
  end

  # Memoized root Tree of the head commit.
  def head_tree
    @head_tree ||= begin
      head_sha = head_commit.sha
      Tree.new(self, head_sha, nil)
    end
  end

  # Tree at `path` for revision `sha`.
  #
  # `:head` stands for the head commit; with `:head` and no path the memoized
  # head_tree is returned instead of building a new Tree.
  def tree(sha = :head, path = nil)
    return head_tree if sha == :head && path.nil?

    sha = head_commit.sha if sha == :head
    Tree.new(self, sha, path)
  end
D
Dmitriy Zaporozhets 已提交
398 399

  # Blob at `path` on the commit that `branch_name` resolves to; nil when the
  # branch cannot be resolved to a commit.
  def blob_at_branch(branch_name, path)
    last_commit = commit(branch_name)

    last_commit ? blob_at(last_commit.sha, path) : nil
  end
D
Dmitriy Zaporozhets 已提交
408 409 410 411 412 413 414 415

  # Returns the url of the submodule registered at `path` for `ref`, or nil
  # when `ref` has no submodules or none at that path.
  #
  # Ex.
  #   @repository.submodule_url_for('master', 'rack')
  #   # => git@localhost:rack.git
  #
  def submodule_url_for(ref, path)
    # Resolve the submodules once; the original asked for them twice per call.
    modules = submodules(ref)
    return unless modules.any?

    submodule = modules[path]
    submodule['url'] if submodule
  end
424 425

  # Most recent commit reachable from `sha` that touched `path`, resolved with
  # `git rev-list --max-count=1`.
  def last_commit_for_path(sha, path)
    rev_list = %W(#{Gitlab.config.git.bin_path} rev-list --max-count=1 #{sha} -- #{path})
    last_sha = Gitlab::Popen.popen(rev_list, path_to_repo).first.strip

    commit(last_sha)
  end
430

431 432 433 434 435 436 437 438 439 440 441
  # Name for the next "patch-N" branch: one more than the highest N among
  # existing branches named exactly "patch-<digits>", or "patch-1" if none.
  def next_patch_branch
    numbers = branch_names.map { |name| name[/\Apatch-([0-9]+)\z/, 1] }
    used_ids = numbers.compact.map(&:to_i)
    highest = used_ids.max || 0

    "patch-#{highest + 1}"
  end

442
  # Returns the branches ordered by the committed date of their target commit.
  #
  # value - 'recently_updated' sorts newest first, 'last_updated' sorts oldest
  #         first; any other value returns the branches in their stored order.
  def branches_sorted_by(value)
    # A comparison needs two commit dates. Memoize them per target so each
    # commit is looked up once instead of on every comparison.
    dates = Hash.new do |memo, target|
      memo[target] = commit(target).committed_date
    end

    case value
    when 'recently_updated'
      branches.sort { |a, b| dates[b.target] <=> dates[a.target] }
    when 'last_updated'
      branches.sort { |a, b| dates[a.target] <=> dates[b.target] }
    else
      branches
    end
  end
457 458

  # Builds one Gitlab::Contributor per author email from up to 2000 non-merge
  # commits. Each contributor gets the first non-blank author name seen and a
  # count of their commits.
  def contributors
    recent_commits = commits(nil, nil, 2000, 0, true)

    recent_commits.group_by(&:author_email).map do |email, authored|
      Gitlab::Contributor.new.tap do |contributor|
        contributor.email = email

        authored.each do |authored_commit|
          contributor.name = authored_commit.author_name if contributor.name.blank?
          contributor.commits += 1
        end
      end
    end
  end
D
Dmitriy Zaporozhets 已提交
476 477

  # Blob for the diff's file path as of `commit`.
  def blob_for_diff(commit, diff)
    path = diff.file_path
    blob_at(commit.id, path)
  end

  # Blob for the diff's old path as of the commit's parent; nil when the
  # commit has no parent id.
  def prev_blob_for_diff(commit, diff)
    return unless commit.parent_id

    blob_at(commit.parent_id, diff.old_path)
  end
486

487 488
  # Names printed by `git <ref_type> --contains <sha>`, one per output line,
  # stripped of whitespace and of the first "* " marker in each line.
  # Returns [] when the command output cannot be split.
  def refs_contains_sha(ref_type, sha)
    args = %W(#{Gitlab.config.git.bin_path} #{ref_type} --contains #{sha})
    output = Gitlab::Popen.popen(args, path_to_repo).first

    return [] unless output.respond_to?(:split)

    output.split("\n").map do |line|
      name = line.strip
      name.slice!('* ')
      name
    end
  end
H
Hannes Rosenögger 已提交
503

504 505 506
  # Names of the branches that contain `sha`.
  def branch_names_contains(sha)
    ref_type = 'branch'
    refs_contains_sha(ref_type, sha)
  end
H
Hannes Rosenögger 已提交
507

508 509
  # Names of the tags that contain `sha`.
  def tag_names_contains(sha)
    ref_type = 'tag'
    refs_contains_sha(ref_type, sha)
  end
511

512 513 514 515 516 517 518 519 520
  # Memoized branches of the raw repository (reset by expire_branches_cache).
  def branches
    @branches = raw_repository.branches unless @branches
    @branches
  end

  # Memoized tags of the raw repository (reset by expire_tags_cache).
  def tags
    @tags = raw_repository.tags unless @tags
    @tags
  end

  # Root ref of the raw repository, memoized on the instance and stored in the
  # repository cache under :root_ref.
  def root_ref
    @root_ref ||= cache.fetch(:root_ref) do
      raw_repository.root_ref
    end
  end

S
Stan Hu 已提交
524
  # Commits a new directory at `path` on `branch` on behalf of `user`, with
  # the Git hooks run by commit_with_hooks. The user is recorded as both
  # committer and author.
  def commit_dir(user, path, message, branch)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        }
      }

      raw_repository.mkdir(path, options)
    end
  end
539

S
Stan Hu 已提交
540 541 542
  # Commits `content` to `path` on `branch` on behalf of `user`, with the Git
  # hooks run by commit_with_hooks. `update` is passed through to
  # Gitlab::Git::Blob.commit as the file's :update option.
  def commit_file(user, path, content, message, branch, update)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        },
        file: {
          content: content,
          path: path,
          update: update
        }
      }

      Gitlab::Git::Blob.commit(raw_repository, options)
    end
  end

561
  # Commits the removal of `path` on `branch` on behalf of `user`, with the
  # Git hooks run by commit_with_hooks.
  def remove_file(user, path, message, branch)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        },
        file: {
          path: path
        }
      }

      Gitlab::Git::Blob.remove(raw_repository, options)
    end
  end

S
Stan Hu 已提交
580
  # Committer/author Hash for `user`: their email and name plus the current
  # time.
  def user_to_committer(user)
    committer = {}
    committer[:email] = user.email
    committer[:name] = user.name
    committer[:time] = Time.now
    committer
  end

  # Whether `source_sha` can be merged into `target_branch` without conflicts.
  #
  # Returns false when the target branch does not exist or either commit is
  # missing, and otherwise the negation of the merge index's `conflicts?`.
  def can_be_merged?(source_sha, target_branch)
    # A missing branch yields nil here; guard it so the method returns false
    # instead of raising NoMethodError on `nil.target`.
    target = rugged.branches[target_branch]
    our_commit = target && target.target
    their_commit = rugged.lookup(source_sha)

    return false unless our_commit && their_commit

    !rugged.merge_commits(our_commit, their_commit).conflicts?
  end

599
  # Merges `source_sha` into `target_branch` on behalf of `user`.
  #
  # options - extra attributes merged into the Rugged::Commit.create options
  #
  # Returns false when the merge has conflicts; otherwise the result of
  # commit_with_hooks.
  # Raises RuntimeError "Invalid merge target" / "Invalid merge source" when
  # the target branch (or its commit) or the source commit is missing.
  def merge(user, source_sha, target_branch, options = {})
    # A missing branch yields nil; guard it so the "Invalid merge target"
    # check below is reachable instead of failing with NoMethodError.
    target = rugged.branches[target_branch]
    our_commit = target && target.target
    their_commit = rugged.lookup(source_sha)

    raise "Invalid merge target" if our_commit.nil?
    raise "Invalid merge source" if their_commit.nil?

    merge_index = rugged.merge_commits(our_commit, their_commit)
    return false if merge_index.conflicts?

    commit_with_hooks(user, target_branch) do |ref|
      actual_options = options.merge(
        parents: [our_commit, their_commit],
        tree: merge_index.write_tree(rugged),
        update_ref: ref
      )

      Rugged::Commit.create(rugged, actual_options)
    end
  end

F
Florent (HP) 已提交
620 621 622 623 624
  # Whether the commit at `branch_name` is an ancestor of the root ref's
  # commit. Returns nil when the branch cannot be resolved to a commit.
  def merged_to_root_ref?(branch_name)
    branch_commit = commit(branch_name)
    root_ref_commit = commit(root_ref)

    return nil unless branch_commit

    is_ancestor?(branch_commit.id, root_ref_commit.id)
  end

S
Stan Hu 已提交
631
  # Merge base of the two revisions according to Rugged. Each argument is first
  # resolved to a commit id when possible and used as given otherwise.
  # Returns nil when Rugged raises a ReferenceError.
  def merge_base(first_commit_id, second_commit_id)
    first_sha, second_sha = [first_commit_id, second_commit_id].map do |revision|
      commit(revision).try(:id) || revision
    end

    rugged.merge_base(first_sha, second_sha)
  rescue Rugged::ReferenceError
    nil
  end

639 640 641 642 643
  # True when the merge base of the two commits is `ancestor_id` itself.
  def is_ancestor?(ancestor_id, descendant_id)
    common = merge_base(ancestor_id, descendant_id)
    common == ancestor_id
  end


644 645
  # Runs a case-insensitive `git grep` for `query` on `ref` (the root ref when
  # nil) with two lines of context before and after each hit, and returns the
  # scrubbed output split on the "--" separator lines.
  def search_files(query, ref)
    context_lines = 2
    grep_cmd = %W(#{Gitlab.config.git.bin_path} grep -i -I -n --before-context #{context_lines} --after-context #{context_lines} -e #{query} #{ref || root_ref})
    output = Gitlab::Popen.popen(grep_cmd, path_to_repo).first

    output.scrub.split(/^--$/)
  end

D
Dmitriy Zaporozhets 已提交
650
  # Parses one chunk of `git grep` output (see search_files) into an
  # OpenStruct with:
  #
  #   filename  - file name taken from the first matching line
  #   ref       - ref taken from the first matching line
  #   startline - line number of the first line of the chunk
  #   data      - the chunk with the "ref:filename" prefix and the line-number
  #               markers removed from each line
  #
  # When no line looks like "ref:filename:lineno:", filename and ref are nil,
  # startline is 0 and data only has line-number markers stripped.
  def parse_search_result(result)
    ref = nil
    filename = nil
    startline = 0

    result.each_line.each_with_index do |line, index|
      next unless line =~ /^.*:.*:\d+:/

      ref, filename, startline = line.split(':')
      # The match may be preceded by context lines; rewind to the chunk start.
      startline = startline.to_i - index
      break
    end

    data = ""

    result.each_line do |line|
      # Without a matching line there is no prefix to strip, and
      # String#sub(nil, ...) would raise a TypeError.
      line = line.sub(ref, '').sub(filename, '') if ref && filename
      data << line.sub(/^:-\d+-/, '').sub(/^::\d+:/, '')
    end

    OpenStruct.new(
      filename: filename,
      ref: ref,
      startline: startline,
      data: data
    )
  end

677
  # Force-fetches `source_ref` from the repository at `source_path` into
  # `target_ref` of this repository (`git fetch -f`).
  def fetch_ref(source_path, source_ref, target_ref)
    refspec = "#{source_ref}:#{target_ref}"
    fetch_cmd = %W(#{Gitlab.config.git.bin_path} fetch -f #{source_path} #{refspec})

    Gitlab::Popen.popen(fetch_cmd, path_to_repo)
  end

682
  # Yields a randomly named temporary ref ("refs/tmp/<hex>/head") and deletes
  # it afterwards, whether or not the block raised.
  #
  # When `oldrev` is given and is not a blank ref, the temporary ref is first
  # created pointing at it. Errors while deleting the ref are ignored.
  def with_tmp_ref(oldrev = nil)
    tmp_ref = "refs/tmp/#{SecureRandom.hex}/head"

    seed_ref = oldrev && !Gitlab::Git.blank_ref?(oldrev)
    rugged.references.create(tmp_ref, oldrev) if seed_ref

    # Make commit in tmp ref
    yield(tmp_ref)
  ensure
    begin
      rugged.references.delete(tmp_ref)
    rescue StandardError
      nil
    end
  end

  # Runs the given block to create a commit in a temporary ref, then moves
  # `branch` to that commit inside GitHooksService.
  #
  # The block receives the temporary ref name and must return the new
  # revision. On an empty repository the branch ref is created; otherwise it
  # is updated, but only if the branch still points at the revision it had
  # when this method started.
  #
  # Raises CommitError when the block returns no revision or when the branch
  # changed in the meantime.
  def commit_with_hooks(current_user, branch)
    update_autocrlf_option

    ref = Gitlab::Git::BRANCH_REF_PREFIX + branch
    was_empty = empty?
    oldrev = was_empty ? Gitlab::Git::BLANK_SHA : find_branch(branch).target

    with_tmp_ref(oldrev) do |tmp_ref|
      # Make commit in tmp ref
      newrev = yield(tmp_ref)

      raise CommitError.new('Failed to create commit') unless newrev

      GitHooksService.new.execute(current_user, path_to_repo, oldrev, newrev, ref) do
        if was_empty
          # Create branch
          rugged.references.create(ref, newrev)
        elsif find_branch(branch).target == oldrev
          # Target branch was not changed during the pre-receive hook: update head
          rugged.references.update(ref, newrev)
        else
          raise CommitError.new('Commit was rejected because branch received new push')
        end
      end
    end
  end

734 735 736 737 738
  # Files listed by the raw repository for `ref`, or for the root ref when
  # `ref` is nil.
  def ls_files(ref)
    raw_repository.ls_files(ref || root_ref)
  end

739 740
  private

741 742 743
  # Memoized RepositoryCache for this repository's namespaced path.
  def cache
    @cache = RepositoryCache.new(path_with_namespace) unless @cache
    @cache
  end
744
end