repository.rb 17.1 KB
Newer Older
1 2
require 'securerandom'

3
class Repository
4 5
  # Raised when a commit cannot be created or applied to a branch
  # (see the raise sites in #commit_with_hooks).
  class CommitError < StandardError
  end

6 7
  include Gitlab::ShellAdapter

8
  attr_accessor :path_with_namespace, :project
9

J
Jacob Vosmaer 已提交
10 11 12 13 14 15 16 17
  # Remove stale entries from the repository downloads directory.
  #
  # Shells out to `find` and deletes everything below the configured
  # downloads path (never the directory itself) that was last modified more
  # than 120 minutes ago. Does nothing when the directory does not exist.
  def self.clean_old_archives
    downloads_dir = Gitlab.config.gitlab.repository_downloads_path

    if File.directory?(downloads_dir)
      find_command = %W(find #{downloads_dir} -not -path #{downloads_dir} -mmin +120 -delete)
      Gitlab::Popen.popen(find_command)
    end
  end

18
  # Build a repository wrapper.
  #
  # path_with_namespace - repository path relative to the repos root, without
  #                       the ".git" suffix (see #path_to_repo).
  # default_branch      - accepted for caller compatibility; not used here.
  # project             - object handed to Commit.new / Commit.decorate.
  def initialize(path_with_namespace, default_branch = nil, project = nil)
    @path_with_namespace = path_with_namespace
    @project = project
  end
22

23 24
  # Lazily open the underlying Gitlab::Git::Repository.
  #
  # Returns nil when no path is set or when no repository exists at
  # #path_to_repo. A nil result is not memoized, so the lookup is retried on
  # the next call.
  def raw_repository
    return nil unless path_with_namespace

    @raw_repository ||= begin
      repo = Gitlab::Git::Repository.new(path_to_repo)
      repo.autocrlf = :input
      repo
    rescue Gitlab::Git::Repository::NoRepository
      nil
    end
  end

35
  # Return the absolute path to the repository.
  #
  # Built from the configured gitlab-shell repos_path joined with
  # "<path_with_namespace>.git"; the result is memoized.
  def path_to_repo
    @path_to_repo ||= File.expand_path(
      File.join(Gitlab.config.gitlab_shell.repos_path, path_with_namespace + ".git")
    )
  end

42 43 44 45 46
  # Whether the repository could be opened.
  #
  # Returns the raw repository object (truthy) when available, otherwise nil.
  def exists?
    repository = raw_repository
    repository
  end

  # Whether the repository is empty.
  #
  # The answer is memoized on the instance (false included) and read through
  # the repository cache under the :empty? key.
  def empty?
    return @empty unless @empty.nil?

    @empty = cache.fetch(:empty?) { raw_repository.empty? }
  end

52 53 54 55 56 57 58 59 60 61
  #
  # A Git repository can contain hidden refs such as:
  #   /refs/notes/*
  #   /refs/git-as-svn/*
  #   /refs/pulls/*
  # These refs are not visible on the project page by default and are not
  # cloned to the client side.
  #
  # Returns true if the repository has content visible on the project page,
  # i.e. at least one branch. The answer is memoized and read through the
  # repository cache.
  #
  def has_visible_content?
    return @has_visible_content unless @has_visible_content.nil?

    @has_visible_content = cache.fetch(:has_visible_content?) do
      raw_repository.branch_count > 0
    end
  end

69
  # Find a commit by id or ref name (defaults to 'HEAD').
  #
  # Returns a Commit wrapping the raw commit, or nil when there is no raw
  # repository, the commit is not found, or Rugged raises an OdbError.
  def commit(id = 'HEAD')
    return nil unless raw_repository

    raw_commit = Gitlab::Git::Commit.find(raw_repository, id)
    raw_commit ? Commit.new(raw_commit, @project) : raw_commit
  rescue Rugged::OdbError
    nil
  end

D
Dmitriy Zaporozhets 已提交
78
  # List commits for +ref+, optionally restricted to +path+ and paged with
  # +limit+ / +offset+. Merge commits are skipped when +skip_merges+ is true.
  #
  # Returns the result of Gitlab::Git::Commit.where, decorated as Commit
  # objects when it is present.
  def commits(ref, path = nil, limit = nil, offset = nil, skip_merges = false)
    options = {
      repo: raw_repository,
      ref: ref,
      path: path,
      limit: limit,
      offset: offset,
      # --follow doesn't play well with --skip. See:
      # https://gitlab.com/gitlab-org/gitlab-ce/issues/3574#note_3040520
      follow: false,
      skip_merges: skip_merges
    }

    commits = Gitlab::Git::Commit.where(options)
    commits = Commit.decorate(commits, @project) if commits.present?
    commits
  end

96 97
  # List the commits between +from+ and +to+ as reported by
  # Gitlab::Git::Commit.between, decorated as Commit objects when present.
  def commits_between(from, to)
    commits = Gitlab::Git::Commit.between(raw_repository, from, to)
    commits = Commit.decorate(commits, @project) if commits.present?
    commits
  end

102 103 104
  # Find commits whose message matches +query+ using `git log --grep`.
  #
  # ref    - ref to search; defaults to the root ref.
  # path   - optional path to restrict the log to.
  # limit  - maximum number of commits (passed as --max-count), default 1000.
  # offset - number of commits to skip (passed as --skip), default 0.
  #
  # Returns an Array with one #commit lookup result per SHA printed by git.
  def find_commits_by_message(query, ref = nil, path = nil, limit = 1000, offset = 0)
    ref ||= root_ref

    args = %W(#{Gitlab.config.git.bin_path} log #{ref} --pretty=%H --skip #{offset} --max-count #{limit} --grep=#{query})
    args.concat(%W(-- #{path})) if path.present?

    shas = Gitlab::Popen.popen(args, path_to_repo).first.lines.map(&:chomp)
    shas.map { |sha| commit(sha) }
  end

114
  # Return the raw branch called +name+, or nil when there is none.
  def find_branch(name)
    raw_repository.branches.find { |branch| branch.name == name }
  end

  # Return the raw tag called +name+, or nil when there is none.
  def find_tag(name)
    raw_repository.tags.find { |tag| tag.name == name }
  end

122 123 124 125 126 127 128 129 130 131
  # Create branch +branch_name+ pointing at +target+ on behalf of +user+.
  #
  # +target+ is resolved through #commit; the branch is created inside
  # GitHooksService#execute with a blank old revision.
  #
  # Returns false when +target+ does not resolve to a commit, otherwise the
  # newly created branch as found by #find_branch.
  def add_branch(user, branch_name, target)
    oldrev = Gitlab::Git::BLANK_SHA
    ref    = Gitlab::Git::BRANCH_REF_PREFIX + branch_name
    target = commit(target).try(:id)

    return false unless target

    GitHooksService.new.execute(user, path_to_repo, oldrev, target, ref) do
      rugged.branches.create(branch_name, target)
    end

    expire_branches_cache
    find_branch(branch_name)
  end

137
  # Expire the tag caches, then ask gitlab_shell to create tag +tag_name+ at
  # +ref+ with an optional +message+.
  def add_tag(tag_name, ref, message = nil)
    expire_tags_cache

    gitlab_shell.add_tag(path_with_namespace, tag_name, ref, message)
  end

143
  # Delete branch +branch_name+ on behalf of +user+.
  #
  # The deletion runs inside GitHooksService#execute with the branch's
  # current target as old revision and a blank new revision. Branch caches
  # are expired both before and after the deletion.
  #
  # Returns true.
  def rm_branch(user, branch_name)
    expire_branches_cache

    branch = find_branch(branch_name)
    oldrev = branch.try(:target)
    newrev = Gitlab::Git::BLANK_SHA
    ref    = Gitlab::Git::BRANCH_REF_PREFIX + branch_name

    GitHooksService.new.execute(user, path_to_repo, oldrev, newrev, ref) do
      rugged.branches.delete(branch_name)
    end

    expire_branches_cache
    true
  end

159
  # Expire the tag caches, then ask gitlab_shell to remove tag +tag_name+.
  def rm_tag(tag_name)
    expire_tags_cache

    gitlab_shell.rm_tag(path_with_namespace, tag_name)
  end

165
  # Branch names of the raw repository, read through the repository cache.
  def branch_names
    cache.fetch(:branch_names) { raw_repository.branch_names }
  end

  # Tag names of the raw repository, read through the repository cache.
  def tag_names
    cache.fetch(:tag_names) { raw_repository.tag_names }
  end

173
  # Number of commits on the root ref, read through the repository cache.
  #
  # Any StandardError raised while counting is deliberately swallowed and
  # reported as 0.
  def commit_count
    cache.fetch(:commit_count) do
      begin
        raw_repository.commit_count(root_ref)
      rescue
        0
      end
    end
  end

183 184 185
  # Return repo size in megabytes.
  # The value is read through the repository cache under the :size key.
  def size
    cache.fetch(:size) { raw_repository.size }
  end
188

189
  # Count how far +branch+ has diverged from the root ref.
  #
  # Returns a Hash { behind: Integer, ahead: Integer }, cached per branch
  # name under "diverging_commit_counts_<name>".
  def diverging_commit_counts(branch)
    root_ref_hash = raw_repository.rev_parse_target(root_ref).oid

    cache.fetch(:"diverging_commit_counts_#{branch.name}") do
      # Rugged seems to throw a `ReferenceError` when given branch_names rather
      # than SHA-1 hashes
      number_commits_behind = raw_repository.
        count_commits_between(branch.target, root_ref_hash)

      number_commits_ahead = raw_repository.
        count_commits_between(root_ref_hash, branch.target)

      { behind: number_commits_behind, ahead: number_commits_ahead }
    end
  end
203

204
  # Cache keys (each also the name of a reader method on this class) that
  # #build_cache, #expire_cache and #rebuild_cache iterate over.
  def cache_keys
    %i(size branch_names tag_names commit_count
       readme version contribution_guide changelog license)
  end
208

209 210 211 212 213 214
  # Populate every cache entry that does not exist yet: each key in
  # #cache_keys (by calling the reader of the same name) and the diverging
  # commit counts of every branch.
  def build_cache
    cache_keys.each do |key|
      send(key) unless cache.exist?(key)
    end

    branches.each do |branch|
      unless cache.exist?(:"diverging_commit_counts_#{branch.name}")
        diverging_commit_counts(branch)
      end
    end
  end

D
Douwe Maan 已提交
223 224 225 226 227 228 229 230 231 232
  # Drop the cached tag names and forget the memoized tag list.
  def expire_tags_cache
    cache.expire :tag_names
    @tags = nil
  end

  # Drop the cached branch names and forget the memoized branch list.
  def expire_branches_cache
    cache.expire :branch_names
    @branches = nil
  end

233
  # Expire every key listed in #cache_keys, then the per-branch diverging
  # commit counts (see #expire_branch_cache for how +branch_name+ is used).
  def expire_cache(branch_name = nil)
    cache_keys.each { |key| cache.expire(key) }

    expire_branch_cache(branch_name)
  end
240

241 242 243 244 245 246 247 248 249 250 251 252
  # Expire cached diverging commit counts.
  #
  # branch_name - branch that was pushed to; nil means "unknown", which is
  #               treated like a push to the root branch.
  def expire_branch_cache(branch_name = nil)
    # When we push to the root branch we have to flush the cache for all other
    # branches as their statistics are based on the commits relative to the
    # root branch.
    if !branch_name || branch_name == root_ref
      branches.each do |branch|
        cache.expire(:"diverging_commit_counts_#{branch.name}")
      end
    # In case a commit is pushed to a non-root branch we only have to flush the
    # cache for said branch.
    else
      cache.expire(:"diverging_commit_counts_#{branch_name}")
    end
  end

256 257 258 259 260 261 262 263 264 265
  # Drop the cached root ref and forget the memoized value.
  def expire_root_ref_cache
    cache.expire :root_ref
    @root_ref = nil
  end

  # Drop the cached "has visible content" flag and forget the memoized value.
  def expire_has_visible_content_cache
    cache.expire :has_visible_content?
    @has_visible_content = nil
  end

266 267
  # Expire and immediately recompute every key in #cache_keys, then do the
  # same for the diverging commit counts of every branch.
  def rebuild_cache
    cache_keys.each do |key|
      cache.expire(key)
      send(key)
    end

    branches.each do |branch|
      cache.expire(:"diverging_commit_counts_#{branch.name}")
      diverging_commit_counts(branch)
    end
  end

278 279 280 281
  # Per-instance Hash used by #method_missing to memoize `lookup` results.
  def lookup_cache
    @lookup_cache = {} unless @lookup_cache
    @lookup_cache
  end

282 283 284 285
  # Drop only the cached branch names; unlike #expire_branches_cache the
  # memoized branch list is left untouched.
  def expire_branch_names
    cache.expire :branch_names
  end

286
  # Delegate unknown methods to the raw repository.
  #
  # Calls to `lookup` made without a block are memoized in #lookup_cache,
  # keyed by the arguments joined with ":". Everything else is forwarded
  # as-is on every call.
  def method_missing(m, *args, &block)
    if m == :lookup && !block_given?
      lookup_cache[m] ||= {}
      lookup_cache[m][args.join(":")] ||= raw_repository.send(m, *args, &block)
    else
      raw_repository.send(m, *args, &block)
    end
  end

295 296
  # Counterpart of #method_missing: report the methods the raw repository
  # responds to as our own.
  def respond_to_missing?(method, include_private = false)
    raw_repository.respond_to?(method, include_private) || super
  end
D
Dmitriy Zaporozhets 已提交
298 299

  # Find the blob at +path+ in revision +sha+.
  #
  # Returns nil without looking anything up when Gitlab::Git.blank_ref?
  # reports +sha+ as blank.
  def blob_at(sha, path)
    unless Gitlab::Git.blank_ref?(sha)
      Gitlab::Git::Blob.find(self, sha, path)
    end
  end
304

305 306 307 308
  # Load a blob directly by its object id via Gitlab::Git::Blob.raw.
  def blob_by_oid(oid)
    blob_class = Gitlab::Git::Blob
    blob_class.raw(self, oid)
  end

309
  # Readme of the head tree, read through the repository cache.
  def readme
    cache.fetch(:readme) { tree(:head).readme }
  end
312

313
  # First blob in the head tree whose name is "version" (case-insensitive),
  # read through the repository cache. Returns nil when there is none.
  def version
    cache.fetch(:version) do
      tree(:head).blobs.find do |file|
        file.name.downcase == 'version'
      end
    end
  end

321
  # First blob in the head tree that reports itself as a contributing guide
  # (`contributing?`), read through the repository cache.
  def contribution_guide
    cache.fetch(:contribution_guide) do
      tree(:head).blobs.find(&:contributing?)
    end
  end
328 329 330 331

  # First blob in the head tree whose name starts with "changelog" or
  # "history" (case-insensitive), read through the repository cache.
  def changelog
    cache.fetch(:changelog) do
      tree(:head).blobs.find do |file|
        file.name =~ /\A(changelog|history)/i
      end
    end
  end

337 338
  # Pick the most relevant license file from the head tree.
  #
  # Candidates are blobs whose name starts with "copying", "license" or
  # "licence" (case-insensitive). Among them the first preference pattern
  # that matches any candidate wins. The result (possibly nil) is read
  # through the repository cache.
  def license
    cache.fetch(:license) do
      licenses = tree(:head).blobs.select do |file|
        file.name =~ /\A(copying|license|licence)/i
      end

      # Ordered from most to least preferred.
      preferences = [
        /\Alicen[sc]e\z/i,        # LICENSE, LICENCE
        /\Alicen[sc]e\./i,        # LICENSE.md, LICENSE.txt
        /\Acopying\z/i,           # COPYING
        /\Acopying\.(?!lesser)/i, # COPYING.txt
        /\Acopying.lesser/i       # COPYING.LESSER
      ]

      license = nil
      preferences.each do |pattern|
        license = licenses.find { |candidate| candidate.name =~ pattern }
        break if license
      end

      license
    end
  end

361
  # Commit the root ref points at (memoized).
  def head_commit
    @head_commit ||= commit(root_ref)
  end

  # Root tree of the head commit (memoized).
  def head_tree
    @head_tree ||= Tree.new(self, head_commit.sha, nil)
  end

  # Build the Tree for +sha+ at +path+.
  #
  # With sha == :head the memoized #head_tree is returned when no path is
  # given; otherwise :head is replaced by the head commit's SHA.
  def tree(sha = :head, path = nil)
    if sha == :head
      return head_tree if path.nil?

      sha = head_commit.sha
    end

    Tree.new(self, sha, path)
  end
D
Dmitriy Zaporozhets 已提交
380 381

  # Blob at +path+ on the tip of +branch_name+, or nil when the branch does
  # not resolve to a commit.
  def blob_at_branch(branch_name, path)
    last_commit = commit(branch_name)

    blob_at(last_commit.sha, path) if last_commit
  end
D
Dmitriy Zaporozhets 已提交
390 391 392 393 394 395 396 397

  # Returns the url of the submodule registered at +path+ in +ref+, or nil
  # when there is no such submodule.
  #
  # Ex.
  #   @repository.submodule_url_for('master', 'rack')
  #   # => git@localhost:rack.git
  #
  def submodule_url_for(ref, path)
    # Look the submodules up once; the original evaluated this call twice.
    modules = submodules(ref)
    return unless modules.any?

    submodule = modules[path]
    submodule['url'] if submodule
  end
406 407

  # Most recent commit reachable from +sha+ that touched +path+, determined
  # with `git rev-list --max-count=1`.
  def last_commit_for_path(sha, path)
    args = %W(#{Gitlab.config.git.bin_path} rev-list --max-count=1 #{sha} -- #{path})
    last_sha = Gitlab::Popen.popen(args, path_to_repo).first.strip
    commit(last_sha)
  end
412

413 414 415 416 417 418 419 420 421 422 423
  # Name for the next "patch-N" branch: one higher than the largest N among
  # existing branches named exactly "patch-<digits>", starting at "patch-1".
  def next_patch_branch
    patch_ids = branch_names.
      map { |name| name[/\Apatch-([0-9]+)\z/, 1] }.
      compact.
      map(&:to_i)

    "patch-#{(patch_ids.max || 0) + 1}"
  end

424
  # Return the branches ordered by the committed date of their target commit.
  #
  # value - 'recently_updated' sorts newest first, 'last_updated' sorts
  #         oldest first; any other value returns the branches unsorted.
  def branches_sorted_by(value)
    case value
    when 'recently_updated'
      branches.sort do |a, b|
        commit(b.target).committed_date <=> commit(a.target).committed_date
      end
    when 'last_updated'
      branches.sort do |a, b|
        commit(a.target).committed_date <=> commit(b.target).committed_date
      end
    else
      branches
    end
  end
439 440

  # Build one Gitlab::Contributor per author e-mail from up to 2000
  # non-merge commits returned by #commits.
  #
  # Each contributor gets the first non-blank author name seen for that
  # e-mail and a commit counter incremented once per commit.
  def contributors
    recent_commits = commits(nil, nil, 2000, 0, true)

    recent_commits.group_by(&:author_email).map do |email, authored_commits|
      contributor = Gitlab::Contributor.new
      contributor.email = email

      authored_commits.each do |authored_commit|
        if contributor.name.blank?
          contributor.name = authored_commit.author_name
        end

        contributor.commits += 1
      end

      contributor
    end
  end
D
Dmitriy Zaporozhets 已提交
458 459

  # Blob for the file of +diff+ as of +commit+.
  def blob_for_diff(commit, diff)
    blob_at(commit.id, diff.file_path)
  end

  # Blob for the old path of +diff+ as of the parent of +commit+; nil when
  # the commit has no parent.
  def prev_blob_for_diff(commit, diff)
    return unless commit.parent_id

    blob_at(commit.parent_id, diff.old_path)
  end
468

469 470
  # Names of the refs of +ref_type+ ('branch' or 'tag') that contain +sha+,
  # obtained from `git <ref_type> --contains <sha>`.
  #
  # Returns an Array of names with surrounding whitespace and the "* "
  # marker removed, or [] when the command output cannot be split.
  def refs_contains_sha(ref_type, sha)
    args = %W(#{Gitlab.config.git.bin_path} #{ref_type} --contains #{sha})
    names = Gitlab::Popen.popen(args, path_to_repo).first

    return [] unless names.respond_to?(:split)

    names.split("\n").map { |name| name.strip.sub('* ', '') }
  end
H
Hannes Rosenögger 已提交
485

486 487 488
  # Names of the branches that contain +sha+.
  def branch_names_contains(sha)
    ref_type = 'branch'
    refs_contains_sha(ref_type, sha)
  end
H
Hannes Rosenögger 已提交
489

490 491
  # Names of the tags that contain +sha+.
  def tag_names_contains(sha)
    refs_contains_sha('tag', sha)
  end
493

494 495 496 497 498 499 500 501 502
  # Branches of the raw repository, memoized until #expire_branches_cache.
  def branches
    @branches = raw_repository.branches unless @branches
    @branches
  end

  # Tags of the raw repository, memoized until #expire_tags_cache.
  def tags
    @tags = raw_repository.tags unless @tags
    @tags
  end

  # Root ref of the raw repository, memoized on the instance and read
  # through the repository cache.
  def root_ref
    @root_ref ||= cache.fetch(:root_ref) { raw_repository.root_ref }
  end

S
Stan Hu 已提交
506
  # Create directory +path+ on +branch+ in a commit authored and committed
  # by +user+ with the given +message+.
  #
  # The commit is made through #commit_with_hooks, which supplies the ref the
  # commit is written to.
  def commit_dir(user, path, message, branch)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        }
      }

      raw_repository.mkdir(path, options)
    end
  end
521

S
Stan Hu 已提交
522 523 524
  # Commit +content+ to +path+ on +branch+, authored and committed by +user+
  # with the given +message+.
  #
  # update - forwarded as the :update file option to Gitlab::Git::Blob.commit.
  #
  # The commit is made through #commit_with_hooks, which supplies the ref the
  # commit is written to.
  def commit_file(user, path, content, message, branch, update)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        },
        file: {
          content: content,
          path: path,
          update: update
        }
      }

      Gitlab::Git::Blob.commit(raw_repository, options)
    end
  end

543
  # Remove the file at +path+ from +branch+ in a commit authored and
  # committed by +user+ with the given +message+.
  #
  # The commit is made through #commit_with_hooks, which supplies the ref the
  # commit is written to.
  def remove_file(user, path, message, branch)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        },
        file: {
          path: path
        }
      }

      Gitlab::Git::Blob.remove(raw_repository, options)
    end
  end

S
Stan Hu 已提交
562
  # Build the committer/author Hash for +user+: e-mail, name and the current
  # time.
  def user_to_committer(user)
    {
      email: user.email,
      name: user.name,
      time: Time.now
    }
  end

  # Whether +source_sha+ can be merged into +target_branch+ without
  # conflicts.
  #
  # Returns false when the target branch does not exist, when either side
  # cannot be resolved, or when the trial merge reports conflicts.
  def can_be_merged?(source_sha, target_branch)
    # An unknown branch yields nil; guard before asking for its target so
    # the method answers false instead of raising NoMethodError.
    branch = rugged.branches[target_branch]
    return false unless branch

    our_commit = branch.target
    their_commit = rugged.lookup(source_sha)
    return false unless our_commit && their_commit

    !rugged.merge_commits(our_commit, their_commit).conflicts?
  end

581
  # Merge +source_sha+ into +target_branch+ on behalf of +user+.
  #
  # options - extra attributes merged into the Rugged::Commit.create call;
  #           :parents, :tree and :update_ref are always overridden here.
  #
  # Returns false when the merge has conflicts, otherwise the result of
  # #commit_with_hooks.
  # Raises RuntimeError ("Invalid merge target" / "Invalid merge source")
  # when either side cannot be resolved.
  def merge(user, source_sha, target_branch, options = {})
    # An unknown branch yields nil; resolve the target defensively so the
    # "Invalid merge target" error below is actually reachable.
    target = rugged.branches[target_branch]
    our_commit = target && target.target
    their_commit = rugged.lookup(source_sha)

    raise "Invalid merge target" if our_commit.nil?
    raise "Invalid merge source" if their_commit.nil?

    merge_index = rugged.merge_commits(our_commit, their_commit)
    return false if merge_index.conflicts?

    commit_with_hooks(user, target_branch) do |ref|
      actual_options = options.merge(
        parents: [our_commit, their_commit],
        tree: merge_index.write_tree(rugged),
        update_ref: ref
      )

      Rugged::Commit.create(rugged, actual_options)
    end
  end

F
Florent (HP) 已提交
602 603 604 605 606
  # Whether the tip of +branch_name+ is an ancestor of the root ref's tip.
  #
  # Returns nil when the branch does not resolve to a commit.
  def merged_to_root_ref?(branch_name)
    branch_commit = commit(branch_name)
    # Nothing to compare against; skip the root ref lookup entirely.
    return nil unless branch_commit

    root_ref_commit = commit(root_ref)
    is_ancestor?(branch_commit.id, root_ref_commit.id)
  end

S
Stan Hu 已提交
613 614
  # Merge base of the two commit ids as computed by Rugged, or nil when
  # Rugged raises a ReferenceError.
  def merge_base(first_commit_id, second_commit_id)
    rugged.merge_base(first_commit_id, second_commit_id)
  rescue Rugged::ReferenceError
    nil
  end

619 620 621 622 623
  # True when the merge base of the two commits is +ancestor_id+ itself.
  def is_ancestor?(ancestor_id, descendant_id)
    common_ancestor = merge_base(ancestor_id, descendant_id)
    common_ancestor == ancestor_id
  end


624 625
  # Search file contents for +query+ in +ref+ (defaults to the root ref)
  # using case-insensitive `git grep` with two lines of context on each side.
  #
  # Returns an Array with one String per result group, i.e. the command
  # output split on git's "--" separator lines.
  def search_files(query, ref)
    offset = 2
    args = %W(#{Gitlab.config.git.bin_path} grep -i -I -n --before-context #{offset} --after-context #{offset} -e #{query} #{ref || root_ref})
    Gitlab::Popen.popen(args, path_to_repo).first.scrub.split(/^--$/)
  end

D
Dmitriy Zaporozhets 已提交
630
  # Parse one result group produced by #search_files.
  #
  # The first line shaped like "<ref>:<filename>:<line>:" provides ref,
  # filename and line number; startline is that line number minus the line's
  # index within the group. The "<ref>:<filename>" prefix and the line-number
  # marker are then stripped from every line to build the data.
  #
  # Returns an OpenStruct with filename, ref, startline and data. When no
  # such line exists, ref and filename are nil, startline is 0 and data is
  # the unmodified input.
  def parse_search_result(result)
    ref = nil
    filename = nil
    startline = 0

    result.each_line.each_with_index do |line, index|
      next unless line =~ /^.*:.*:\d+:/

      ref, filename, startline = line.split(':')
      startline = startline.to_i - index
      break
    end

    data = result.each_line.map do |line|
      # Without a header line there is no prefix to strip; calling
      # String#sub with nil would raise TypeError.
      next line unless ref && filename

      line.sub(ref, '').sub(filename, '').sub(/^:-\d+-/, '').sub(/^::\d+:/, '')
    end.join

    OpenStruct.new(
      filename: filename,
      ref: ref,
      startline: startline,
      data: data
    )
  end

657
  # Force-fetch +source_ref+ from the repository at +source_path+ into
  # +target_ref+ of this repository via `git fetch -f`.
  def fetch_ref(source_path, source_ref, target_ref)
    args = %W(#{Gitlab.config.git.bin_path} fetch -f #{source_path} #{source_ref}:#{target_ref})
    Gitlab::Popen.popen(args, path_to_repo)
  end

662
  # Yield a randomly named temporary ref ("refs/tmp/<hex>/head") and delete
  # it afterwards.
  #
  # oldrev - when given and not blank, the temporary ref is first created
  #          pointing at this revision.
  #
  # Returns the block's value. Deleting the ref is best effort: any
  # StandardError raised while deleting is ignored.
  def with_tmp_ref(oldrev = nil)
    random_string = SecureRandom.hex
    tmp_ref = "refs/tmp/#{random_string}/head"

    if oldrev && !Gitlab::Git.blank_ref?(oldrev)
      rugged.references.create(tmp_ref, oldrev)
    end

    # Make commit in tmp ref
    yield(tmp_ref)
  ensure
    begin
      rugged.references.delete(tmp_ref)
    rescue StandardError
      nil
    end
  end

  # Create a commit on a temporary ref and then move +branch+ to it inside
  # GitHooksService#execute.
  #
  # The block receives the temporary ref and must return the new revision.
  # For an empty repository the branch ref is created; otherwise it is
  # updated, but only if the branch still points at the revision observed
  # before the commit was made.
  #
  # Raises CommitError when the block returns no revision or when the branch
  # moved in the meantime.
  #
  # NOTE(review): in a non-empty repository +branch+ is assumed to exist;
  # find_branch returning nil would raise NoMethodError here - confirm that
  # callers guarantee this.
  def commit_with_hooks(current_user, branch)
    oldrev = Gitlab::Git::BLANK_SHA
    ref = Gitlab::Git::BRANCH_REF_PREFIX + branch
    was_empty = empty?

    oldrev = find_branch(branch).target unless was_empty

    with_tmp_ref(oldrev) do |tmp_ref|
      # Make commit in tmp ref
      newrev = yield(tmp_ref)

      raise CommitError, 'Failed to create commit' unless newrev

      GitHooksService.new.execute(current_user, path_to_repo, oldrev, newrev, ref) do
        if was_empty
          # Create branch
          rugged.references.create(ref, newrev)
        else
          # Update head
          current_head = find_branch(branch).target

          # Make sure target branch was not changed during pre-receive hook
          if current_head == oldrev
            rugged.references.update(ref, newrev)
          else
            raise CommitError, 'Commit was rejected because branch received new push'
          end
        end
      end
    end
  end

712 713 714 715 716
  # List the files of +ref+, falling back to the root ref when +ref+ is nil.
  def ls_files(ref)
    raw_repository.ls_files(ref || root_ref)
  end

717 718
  private

719 720 721
  # RepositoryCache for this repository's path, created on first use.
  def cache
    @cache = RepositoryCache.new(path_with_namespace) unless @cache
    @cache
  end
722
end