repository.rb 31.7 KB
Newer Older
1
# coding: utf-8
2
require 'securerandom'
3
require 'forwardable'
4

5
class Repository
Valery Sizov's avatar
Valery Sizov committed
6
  include Elastic::RepositoriesSearch
Valery Sizov's avatar
Valery Sizov committed
7

8 9
  class CommitError < StandardError; end

10
  MIRROR_REMOTE = "upstream"
11
  MIRROR_GEO = "geo"
12

13 14 15 16
  # Files to use as a project avatar in case no avatar was uploaded via the web
  # UI.
  AVATAR_FILES = %w{logo.png logo.jpg logo.gif}

17 18
  include Gitlab::ShellAdapter

19
  attr_accessor :path_with_namespace, :project
20

21
  def initialize(path_with_namespace, project)
22
    @path_with_namespace = path_with_namespace
23
    @project = project
24
  end
25

26 27
  def raw_repository
    return nil unless path_with_namespace
28

29
    @raw_repository ||= Gitlab::Git::Repository.new(path_to_repo)
30 31
  end

32 33
  def update_autocrlf_option
    raw_repository.autocrlf = :input if raw_repository.autocrlf != :input
34 35
  end

36 37 38 39
  def storage_path
    @project.repository_storage_path
  end

40
  # Return absolute path to repository
41
  def path_to_repo
42
    @path_to_repo ||= File.expand_path(
43
      File.join(storage_path, path_with_namespace + ".git")
44
    )
45 46
  end

47
  def exists?
48
    return @exists unless @exists.nil?
49

50 51 52 53 54 55 56
    @exists = cache.fetch(:exists?) do
      begin
        raw_repository && raw_repository.rugged ? true : false
      rescue Gitlab::Git::Repository::NoRepository
        false
      end
    end
57 58 59
  end

  def empty?
60 61 62
    return @empty unless @empty.nil?

    @empty = cache.fetch(:empty?) { raw_repository.empty? }
63 64
  end

65 66 67 68 69 70 71 72 73 74
  #
  # Git repository can contains some hidden refs like:
  #   /refs/notes/*
  #   /refs/git-as-svn/*
  #   /refs/pulls/*
  # This refs by default not visible in project page and not cloned to client side.
  #
  # This method return true if repository contains some content visible in project page.
  #
  def has_visible_content?
75 76 77
    return @has_visible_content unless @has_visible_content.nil?

    @has_visible_content = cache.fetch(:has_visible_content?) do
78
      branch_count > 0
79
    end
80 81
  end

82
  def commit(ref = 'HEAD')
83
    return nil unless exists?
84 85 86 87 88 89
    commit =
      if ref.is_a?(Gitlab::Git::Commit)
        ref
      else
        Gitlab::Git::Commit.find(raw_repository, ref)
      end
90
    commit = ::Commit.new(commit, @project) if commit
91
    commit
92
  rescue Rugged::OdbError
93
    nil
94 95
  end

96
  def commits(ref, path: nil, limit: nil, offset: nil, skip_merges: false, after: nil, before: nil)
97
    options = {
98 99 100 101 102
      repo: raw_repository,
      ref: ref,
      path: path,
      limit: limit,
      offset: offset,
103 104
      after: after,
      before: before,
105 106
      # --follow doesn't play well with --skip. See:
      # https://gitlab.com/gitlab-org/gitlab-ce/issues/3574#note_3040520
107 108
      follow: false,
      skip_merges: skip_merges
109 110 111
    }

    commits = Gitlab::Git::Commit.where(options)
112
    commits = Commit.decorate(commits, @project) if commits.present?
113 114 115
    commits
  end

116 117
  def commits_between(from, to)
    commits = Gitlab::Git::Commit.between(raw_repository, from, to)
118
    commits = Commit.decorate(commits, @project) if commits.present?
119 120 121
    commits
  end

122 123 124
  def find_commits_by_message(query, ref = nil, path = nil, limit = 1000, offset = 0)
    ref ||= root_ref

125
    # Limited to 1000 commits for now, could be parameterized?
126 127
    args = %W(#{Gitlab.config.git.bin_path} log #{ref} --pretty=%H --skip #{offset} --max-count #{limit} --grep=#{query})
    args = args.concat(%W(-- #{path})) if path.present?
128

129 130
    git_log_results = Gitlab::Popen.popen(args, path_to_repo).first.lines.map(&:chomp)
    commits = git_log_results.map { |c| commit(c) }
131
    commits
132 133
  end

134 135 136 137 138 139 140 141 142 143 144 145 146 147 148
  def find_branch(name, fresh_repo: true)
    # Since the Repository object may have in-memory index changes, invalidating the memoized Repository object may
    # cause unintended side effects. Because finding a branch is a read-only operation, we can safely instantiate
    # a new repo here to ensure a consistent state to avoid a libgit2 bug where concurrent access (e.g. via git gc)
    # may cause the branch to "disappear" erroneously or have the wrong SHA.
    #
    # See: https://github.com/libgit2/libgit2/issues/1534 and https://gitlab.com/gitlab-org/gitlab-ce/issues/15392
    raw_repo =
      if fresh_repo
        Gitlab::Git::Repository.new(path_to_repo)
      else
        raw_repository
      end

    raw_repo.find_branch(name)
149 150 151
  end

  def find_tag(name)
152
    tags.find { |tag| tag.name == name }
153 154
  end

155 156 157 158 159 160 161 162
  def add_branch(user, branch_name, target)
    oldrev = Gitlab::Git::BLANK_SHA
    ref    = Gitlab::Git::BRANCH_REF_PREFIX + branch_name
    target = commit(target).try(:id)

    return false unless target

    GitHooksService.new.execute(user, path_to_repo, oldrev, target, ref) do
163
      update_ref!(ref, target, oldrev)
164
    end
165

166
    after_create_branch
167
    find_branch(branch_name)
168 169
  end

170 171 172 173
  def push_remote_branches(remote, branches)
    gitlab_shell.push_remote_branches(storage_path, path_with_namespace, remote, branches)
  end

174 175 176 177 178 179
  def add_tag(user, tag_name, target, message = nil)
    oldrev = Gitlab::Git::BLANK_SHA
    ref    = Gitlab::Git::TAG_REF_PREFIX + tag_name
    target = commit(target).try(:id)

    return false unless target
180

181 182
    options = { message: message, tagger: user_to_committer(user) } if message

183 184
    GitHooksService.new.execute(user, path_to_repo, oldrev, target, ref) do
      rugged.tags.create(tag_name, target, options)
185
    end
186

187
    find_tag(tag_name)
188 189
  end

190
  def rm_branch(user, branch_name)
191
    before_remove_branch
192

193
    branch = find_branch(branch_name)
194
    oldrev = branch.try(:target).try(:id)
195 196 197 198
    newrev = Gitlab::Git::BLANK_SHA
    ref    = Gitlab::Git::BRANCH_REF_PREFIX + branch_name

    GitHooksService.new.execute(user, path_to_repo, oldrev, newrev, ref) do
199
      update_ref!(ref, newrev, oldrev)
200 201
    end

202
    after_remove_branch
203
    true
204 205
  end

206 207 208 209
  def delete_remote_branches(remote, branches)
    gitlab_shell.delete_remote_branches(storage_path, path_with_namespace, remote, branches)
  end

210
  def rm_tag(tag_name)
211
    before_remove_tag
212

Robert Schilling's avatar
Robert Schilling committed
213 214 215 216 217 218
    begin
      rugged.tags.delete(tag_name)
      true
    rescue Rugged::ReferenceError
      false
    end
219 220
  end

221 222 223 224
  def config
    raw_repository.rugged.config
  end

225 226 227 228 229 230
  def add_remote(name, url)
    raw_repository.remote_add(name, url)
  rescue Rugged::ConfigError
    raw_repository.remote_update(name, url: url)
  end

231 232 233 234 235 236 237
  def remove_remote(name)
    raw_repository.remote_delete(name)
    true
  rescue Rugged::ConfigError
    false
  end

238 239
  def set_remote_as_mirror(name)
    # This is used by Gitlab Geo to define repository as equivalent as "git clone --mirror"
240 241 242
    config["remote.#{name}.fetch"] = 'refs/*:refs/*'
    config["remote.#{name}.mirror"] = true
    config["remote.#{name}.prune"] = true
243 244
  end

245
  def fetch_remote(remote, forced: false, no_tags: false)
246
    gitlab_shell.fetch_remote(storage_path, path_with_namespace, remote, forced: forced, no_tags: no_tags)
247 248
  end

249
  def remote_tags(remote)
250
    gitlab_shell.list_remote_tags(storage_path, path_with_namespace, remote).map do |name, target|
251 252 253
      # Is the tag annotated or lightweight?
      object = target.is_a?(Rugged::Tag::Annotation) ? target : nil
      Gitlab::Git::Tag.new(raw_repository, object, name, target)
254
    end
255 256
  end

257
  def fetch_remote_forced!(remote)
258
    gitlab_shell.fetch_remote(storage_path, path_with_namespace, remote, forced: true)
259 260
  end

261 262 263 264
  def ref_names
    branch_names + tag_names
  end

265
  def branch_names
266
    @branch_names ||= cache.fetch(:branch_names) { branches.map(&:name) }
267 268
  end

269 270
  def branch_exists?(branch_name)
    branch_names.include?(branch_name)
271 272
  end

273 274 275 276
  def ref_exists?(ref)
    rugged.references.exist?(ref)
  end

277 278 279 280 281 282
  def update_ref!(name, newrev, oldrev)
    # We use 'git update-ref' because libgit2/rugged currently does not
    # offer 'compare and swap' ref updates. Without compare-and-swap we can
    # (and have!) accidentally reset the ref to an earlier state, clobbering
    # commits. See also https://github.com/libgit2/libgit2/issues/1534.
    command = %w[git update-ref --stdin -z]
283
    _, status = Gitlab::Popen.popen(command, path_to_repo) do |stdin|
284 285 286 287 288
      stdin.write("update #{name}\x00#{newrev}\x00#{oldrev}\x00")
    end

    return if status.zero?

289
    raise CommitError.new("Could not update branch #{name.sub('refs/heads/', '')}. Please refresh and try again.")
290 291
  end

292 293 294 295
  # Makes sure a commit is kept around when Git garbage collection runs.
  # Git GC will delete commits from the repository that are no longer in any
  # branches or tags, but we want to keep some of these commits around, for
  # example if they have comments or CI builds.
296 297 298 299 300
  def keep_around(sha)
    return unless sha && commit(sha)

    return if kept_around?(sha)

301 302 303 304 305
    # This will still fail if the file is corrupted (e.g. 0 bytes)
    begin
      rugged.references.create(keep_around_ref_name(sha), sha, force: true)
    rescue Rugged::ReferenceError => ex
      Rails.logger.error "Unable to create keep-around reference for repository #{path}: #{ex}"
306 307 308
    rescue Rugged::OSError => ex
      raise unless ex.message =~ /Failed to create locked file/ && ex.message =~ /File exists/
      Rails.logger.error "Unable to create keep-around reference for repository #{path}: #{ex}"
309
    end
310 311 312
  end

  def kept_around?(sha)
313 314 315 316 317
    begin
      ref_exists?(keep_around_ref_name(sha))
    rescue Rugged::ReferenceError
      false
    end
318 319
  end

320
  def tag_names
321
    cache.fetch(:tag_names) { raw_repository.tag_names }
322 323
  end

324
  def commit_count
325
    cache.fetch(:commit_count) do
326
      begin
327
        raw_repository.commit_count(self.root_ref)
328 329 330
      rescue
        0
      end
331
    end
332 333
  end

334
  def branch_count
335
    @branch_count ||= cache.fetch(:branch_count) { branches.size }
336 337 338 339 340 341
  end

  def tag_count
    @tag_count ||= cache.fetch(:tag_count) { raw_repository.rugged.tags.count }
  end

342 343 344
  # Return repo size in megabytes
  # Cached in redis
  def size
345
    cache.fetch(:size) { raw_repository.size }
346 347
  end

348
  def diverging_commit_counts(branch)
349
    root_ref_hash = raw_repository.rev_parse_target(root_ref).oid
Jeff Stubler's avatar
Jeff Stubler committed
350
    cache.fetch(:"diverging_commit_counts_#{branch.name}") do
351 352
      # Rugged seems to throw a `ReferenceError` when given branch_names rather
      # than SHA-1 hashes
353
      number_commits_behind = raw_repository.
354
        count_commits_between(branch.target.sha, root_ref_hash)
355 356

      number_commits_ahead = raw_repository.
357
        count_commits_between(root_ref_hash, branch.target.sha)
358

359 360 361
      { behind: number_commits_behind, ahead: number_commits_ahead }
    end
  end
362

363
  # Keys for data that can be affected for any commit push.
364
  def cache_keys
365
    %i(size commit_count
366
       readme version contribution_guide changelog
367
       license_blob license_key gitignore koding_yml)
368 369
  end

370 371 372 373 374
  # Keys for data on branch/tag operations.
  def cache_keys_for_branches_and_tags
    %i(branch_names tag_names branch_count tag_count)
  end

375
  def build_cache
376
    (cache_keys + cache_keys_for_branches_and_tags).each do |key|
377 378 379 380 381 382
      unless cache.exist?(key)
        send(key)
      end
    end
  end

383 384 385 386 387 388 389
  def expire_tags_cache
    cache.expire(:tag_names)
    @tags = nil
  end

  def expire_branches_cache
    cache.expire(:branch_names)
390
    @branch_names = nil
391
    @local_branches = nil
392 393
  end

394
  def expire_cache(branch_name = nil, revision = nil)
395
    cache_keys.each do |key|
396 397
      cache.expire(key)
    end
398

399
    expire_branch_cache(branch_name)
400
    expire_avatar_cache(branch_name, revision)
401 402 403 404

    # This ensures this particular cache is flushed after the first commit to a
    # new repository.
    expire_emptiness_caches if empty?
405
  end
406

407 408 409 410 411 412 413 414 415 416 417 418
  def expire_branch_cache(branch_name = nil)
    # When we push to the root branch we have to flush the cache for all other
    # branches as their statistics are based on the commits relative to the
    # root branch.
    if !branch_name || branch_name == root_ref
      branches.each do |branch|
        cache.expire(:"diverging_commit_counts_#{branch.name}")
      end
    # In case a commit is pushed to a non-root branch we only have to flush the
    # cache for said branch.
    else
      cache.expire(:"diverging_commit_counts_#{branch_name}")
419
    end
Dmitriy Zaporozhets's avatar
Dmitriy Zaporozhets committed
420 421
  end

422 423 424 425 426
  def expire_root_ref_cache
    cache.expire(:root_ref)
    @root_ref = nil
  end

427 428 429 430 431 432 433 434
  # Expires the cache(s) used to determine if a repository is empty or not.
  def expire_emptiness_caches
    cache.expire(:empty?)
    @empty = nil

    expire_has_visible_content_cache
  end

435 436 437 438 439
  def expire_has_visible_content_cache
    cache.expire(:has_visible_content?)
    @has_visible_content = nil
  end

440 441 442 443 444 445 446 447 448 449
  def expire_branch_count_cache
    cache.expire(:branch_count)
    @branch_count = nil
  end

  def expire_tag_count_cache
    cache.expire(:tag_count)
    @tag_count = nil
  end

450 451 452 453
  def lookup_cache
    @lookup_cache ||= {}
  end

454 455 456 457 458 459 460 461
  def expire_avatar_cache(branch_name = nil, revision = nil)
    # Avatars are pulled from the default branch, thus if somebody pushes to a
    # different branch there's no need to expire anything.
    return if branch_name && branch_name != root_ref

    # We don't want to flush the cache if the commit didn't actually make any
    # changes to any of the possible avatar files.
    if revision && commit = self.commit(revision)
462
      return unless commit.raw_diffs(deltas_only: true).
463 464 465 466 467 468 469 470
        any? { |diff| AVATAR_FILES.include?(diff.new_path) }
    end

    cache.expire(:avatar)

    @avatar = nil
  end

471 472 473 474 475 476 477 478
  def expire_exists_cache
    cache.expire(:exists?)
    @exists = nil
  end

  # Runs code after a repository has been created.
  def after_create
    expire_exists_cache
479 480
    expire_root_ref_cache
    expire_emptiness_caches
481 482

    repository_event(:create_repository)
483 484
  end

485 486
  # Runs code just before a repository is deleted.
  def before_delete
487 488
    expire_exists_cache

489 490
    expire_cache if exists?

491 492 493 494 495
    # expire cache that don't depend on repository data (when expiring)
    expire_tags_cache
    expire_tag_count_cache
    expire_branches_cache
    expire_branch_count_cache
496 497
    expire_root_ref_cache
    expire_emptiness_caches
498
    expire_exists_cache
499 500

    repository_event(:remove_repository)
501 502 503 504 505 506 507
  end

  # Runs code just before the HEAD of a repository is changed.
  def before_change_head
    # Cached divergent commit counts are based on repository head
    expire_branch_cache
    expire_root_ref_cache
508 509

    repository_event(:change_default_branch)
510 511
  end

512 513
  # Runs code before pushing (= creating or removing) a tag.
  def before_push_tag
514
    expire_cache
515
    expire_tags_cache
516
    expire_tag_count_cache
517 518

    repository_event(:push_tag)
519 520 521 522 523 524
  end

  # Runs code before removing a tag.
  def before_remove_tag
    expire_tags_cache
    expire_tag_count_cache
525 526

    repository_event(:remove_tag)
527 528
  end

529 530 531 532 533
  def before_import
    expire_emptiness_caches
    expire_exists_cache
  end

534 535 536
  # Runs code after a repository has been forked/imported.
  def after_import
    expire_emptiness_caches
537
    expire_exists_cache
538 539 540
  end

  # Runs code after a new commit has been pushed.
541 542
  def after_push_commit(branch_name, revision)
    expire_cache(branch_name, revision)
543 544

    repository_event(:push_commit, branch: branch_name)
545 546 547 548
  end

  # Runs code after a new branch has been created.
  def after_create_branch
549
    expire_branches_cache
550
    expire_has_visible_content_cache
551
    expire_branch_count_cache
552 553

    repository_event(:push_branch)
554 555
  end

556 557 558
  # Runs code before removing an existing branch.
  def before_remove_branch
    expire_branches_cache
559 560

    repository_event(:remove_branch)
561 562 563 564 565
  end

  # Runs code after an existing branch has been removed.
  def after_remove_branch
    expire_has_visible_content_cache
566
    expire_branch_count_cache
567
    expire_branches_cache
568 569
  end

570
  def method_missing(m, *args, &block)
571 572 573 574 575 576
    if m == :lookup && !block_given?
      lookup_cache[m] ||= {}
      lookup_cache[m][args.join(":")] ||= raw_repository.send(m, *args, &block)
    else
      raw_repository.send(m, *args, &block)
    end
577 578
  end

579 580
  def respond_to_missing?(method, include_private = false)
    raw_repository.respond_to?(method, include_private) || super
581
  end
Dmitriy Zaporozhets's avatar
Dmitriy Zaporozhets committed
582 583

  def blob_at(sha, path)
584
    unless Gitlab::Git.blank_ref?(sha)
585
      Blob.decorate(Gitlab::Git::Blob.find(self, sha, path))
586
    end
Dmitriy Zaporozhets's avatar
Dmitriy Zaporozhets committed
587
  end
588

589 590 591 592
  def blob_by_oid(oid)
    Gitlab::Git::Blob.raw(self, oid)
  end

593
  def readme
594
    cache.fetch(:readme) { tree(:head).readme }
595
  end
596

597
  def version
598
    cache.fetch(:version) do
599
      tree(:head).blobs.find do |file|
600
        file.name.casecmp('version').zero?
601 602 603 604
      end
    end
  end

605
  def contribution_guide
606 607 608 609 610 611
    cache.fetch(:contribution_guide) do
      tree(:head).blobs.find do |file|
        file.contributing?
      end
    end
  end
612 613 614

  def changelog
    cache.fetch(:changelog) do
615
      file_on_head(/\A(changelog|history|changes|news)/i)
616
    end
617 618
  end

619
  def license_blob
620
    return nil unless head_exists?
621

622
    cache.fetch(:license_blob) do
623
      file_on_head(/\A(licen[sc]e|copying)(\..+|\z)/i)
624 625
    end
  end
626

627
  def license_key
628
    return nil unless head_exists?
629 630

    cache.fetch(:license_key) do
631
      Licensee.license(path).try(:key)
632
    end
633 634
  end

635 636 637 638 639 640 641 642
  def gitignore
    return nil if !exists? || empty?

    cache.fetch(:gitignore) do
      file_on_head(/\A\.gitignore\z/)
    end
  end

643 644 645 646 647 648 649 650
  def koding_yml
    return nil unless head_exists?

    cache.fetch(:koding_yml) do
      file_on_head(/\A\.koding\.yml\z/)
    end
  end

651
  def gitlab_ci_yml
652
    return nil unless head_exists?
653 654 655 656

    @gitlab_ci_yml ||= tree(:head).blobs.find do |file|
      file.name == '.gitlab-ci.yml'
    end
657 658 659 660
  rescue Rugged::ReferenceError
    # For unknow reason spinach scenario "Scenario: I change project path"
    # lead to "Reference 'HEAD' not found" exception from Repository#empty?
    nil
661 662
  end

663
  def head_commit
664 665 666 667 668
    @head_commit ||= commit(self.root_ref)
  end

  def head_tree
    @head_tree ||= Tree.new(self, head_commit.sha, nil)
669 670 671 672
  end

  def tree(sha = :head, path = nil)
    if sha == :head
673 674 675 676 677
      if path.nil?
        return head_tree
      else
        sha = head_commit.sha
      end
678 679 680 681
    end

    Tree.new(self, sha, path)
  end
682 683

  def blob_at_branch(branch_name, path)
684
    last_commit = commit(branch_name)
685

686 687 688 689 690
    if last_commit
      blob_at(last_commit.sha, path)
    else
      nil
    end
691
  end
692 693 694 695 696 697 698 699

  # Returns url for submodule
  #
  # Ex.
  #   @repository.submodule_url_for('master', 'rack')
  #   # => git@localhost:rack.git
  #
  def submodule_url_for(ref, path)
700
    if submodules(ref).any?
701 702 703 704 705 706 707
      submodule = submodules(ref)[path]

      if submodule
        submodule['url']
      end
    end
  end
708 709

  def last_commit_for_path(sha, path)
710
    args = %W(#{Gitlab.config.git.bin_path} rev-list --max-count=1 #{sha} -- #{path})
711 712
    sha = Gitlab::Popen.popen(args, path_to_repo).first.strip
    commit(sha)
713
  end
714

715 716 717 718 719 720 721 722 723
  # Returns a list of commits that are not present in any reference
  def new_commits(newrev)
    args = %W(#{Gitlab.config.git.bin_path} rev-list #{newrev} --not --all)

    Gitlab::Popen.popen(args, path_to_repo).first.split("\n").map do |sha|
      commit(sha.strip)
    end
  end

724
  def next_branch(name, opts = {})
725 726 727
    branch_ids = self.branch_names.map do |n|
      next 1 if n == name
      result = n.match(/\A#{name}-([0-9]+)\z/)
728 729 730
      result[1].to_i if result
    end.compact

731
    highest_branch_id = branch_ids.max || 0
732

733 734 735
    return name if opts[:mild] && 0 == highest_branch_id

    "#{name}-#{highest_branch_id + 1}"
736 737
  end

738
  # Remove archives older than 2 hours
739 740
  def branches_sorted_by(value)
    case value
741 742
    when 'name'
      branches.sort_by(&:name)
743
    when 'updated_desc'
744 745 746
      branches.sort do |a, b|
        commit(b.target).committed_date <=> commit(a.target).committed_date
      end
747
    when 'updated_asc'
748 749 750 751 752 753 754
      branches.sort do |a, b|
        commit(a.target).committed_date <=> commit(b.target).committed_date
      end
    else
      branches
    end
  end
755

756 757 758
  def tags_sorted_by(value)
    case value
    when 'name'
759
      VersionSorter.rsort(tags) { |tag| tag.name }
760 761 762 763 764 765 766 767 768
    when 'updated_desc'
      tags_sorted_by_committed_date.reverse
    when 'updated_asc'
      tags_sorted_by_committed_date
    else
      tags
    end
  end

769
  def contributors
770
    commits = self.commits(nil, limit: 2000, offset: 0, skip_merges: true)
771

Dmitriy Zaporozhets's avatar
Dmitriy Zaporozhets committed
772
    commits.group_by(&:author_email).map do |email, commits|
773 774
      contributor = Gitlab::Contributor.new
      contributor.email = email
775

Dmitriy Zaporozhets's avatar
Dmitriy Zaporozhets committed
776
      commits.each do |commit|
777
        if contributor.name.blank?
Dmitriy Zaporozhets's avatar
Dmitriy Zaporozhets committed
778
          contributor.name = commit.author_name
779 780
        end

781
        contributor.commits += 1
782 783
      end

784 785
      contributor
    end
786
  end
Dmitriy Zaporozhets's avatar
Dmitriy Zaporozhets committed
787

788 789
  def refs_contains_sha(ref_type, sha)
    args = %W(#{Gitlab.config.git.bin_path} #{ref_type} --contains #{sha})
790 791 792 793 794 795 796 797 798 799 800 801 802 803
    names = Gitlab::Popen.popen(args, path_to_repo).first

    if names.respond_to?(:split)
      names = names.split("\n").map(&:strip)

      names.each do |name|
        name.slice! '* '
      end

      names
    else
      []
    end
  end
804

805 806 807
  def branch_names_contains(sha)
    refs_contains_sha('branch', sha)
  end
808

809 810
  def tag_names_contains(sha)
    refs_contains_sha('tag', sha)
811
  end
812

813
  def local_branches
814
    @local_branches ||= raw_repository.local_branches
815 816
  end

817 818
  alias_method :branches, :local_branches

819
  def remote_branches(remote_name)
820 821 822 823 824 825
    branches = []

    rugged.references.each("refs/remotes/#{remote_name}/*").map do |ref|
      name = ref.name.sub(/\Arefs\/remotes\/#{remote_name}\//, '')

      begin
826
        branches << Gitlab::Git::Branch.new(raw_repository, name, ref.target)
827 828 829 830 831 832
      rescue Rugged::ReferenceError
        # Omit invalid branch
      end
    end

    branches
833 834
  end

835 836 837 838 839
  def tags
    @tags ||= raw_repository.tags
  end

  def root_ref
840
    @root_ref ||= cache.fetch(:root_ref) { raw_repository.root_ref }
841 842
  end

843
  def commit_dir(user, path, message, branch, author_email: nil, author_name: nil)
844
    update_branch_with_hooks(user, branch) do |ref|
845 846 847 848 849 850
      options = {
        commit: {
          branch: ref,
          message: message,
          update_ref: false
        }
Stan Hu's avatar
Stan Hu committed
851 852
      }

853 854
      options.merge!(get_committer_and_author(user, email: author_email, name: author_name))

Stan Hu's avatar
Stan Hu committed
855 856 857
      raw_repository.mkdir(path, options)
    end
  end
858

859
  def commit_file(user, path, content, message, branch, update, author_email: nil, author_name: nil)
860
    update_branch_with_hooks(user, branch) do |ref|
861 862 863 864 865 866 867 868 869 870 871
      options = {
        commit: {
          branch: ref,
          message: message,
          update_ref: false
        },
        file: {
          content: content,
          path: path,
          update: update
        }
872
      }
873

874
      options.merge!(get_committer_and_author(user, email: author_email, name: author_name))
875

876 877
      Gitlab::Git::Blob.commit(raw_repository, options)
    end
878 879
  end

880
  def update_file(user, path, content, branch:, previous_path:, message:, author_email: nil, author_name: nil)
881
    update_branch_with_hooks(user, branch) do |ref|
882 883 884 885 886 887 888 889 890 891 892
      options = {
        commit: {
          branch: ref,
          message: message,
          update_ref: false
        },
        file: {
          content: content,
          path: path,
          update: true
        }
893 894
      }

895
      options.merge!(get_committer_and_author(user, email: author_email, name: author_name))
896

897
      if previous_path && previous_path != path
898
        options[:file][:previous_path] = previous_path
899
        Gitlab::Git::Blob.rename(raw_repository, options)
tiagonbotelho's avatar
tiagonbotelho committed
900
      else
901
        Gitlab::Git::Blob.commit(raw_repository, options)
tiagonbotelho's avatar
tiagonbotelho committed
902
      end
903 904 905
    end
  end

906
  def remove_file(user, path, message, branch, author_email: nil, author_name: nil)
907
    update_branch_with_hooks(user, branch) do |ref|
908 909 910 911 912 913 914 915 916
      options = {
        commit: {
          branch: ref,
          message: message,
          update_ref: false
        },
        file: {
          path: path
        }
917
      }
918

919
      options.merge!(get_committer_and_author(user, email: author_email, name: author_name))
920

921 922
      Gitlab::Git::Blob.remove(raw_repository, options)
    end
923 924
  end

925 926
  def get_committer_and_author(user, email: nil, name: nil)
    committer = user_to_committer(user)
927
    author = Gitlab::Git::committer_hash(email: email, name: name) || committer
928

929
    {
930 931
      author: author,
      committer: committer
932 933 934
    }
  end

935 936 937 938
  def user_to_committer(user)
    Gitlab::Git::committer_hash(email: user.email, name: user.name)
  end

939 940 941 942 943 944 945 946 947 948 949
  def can_be_merged?(source_sha, target_branch)
    our_commit = rugged.branches[target_branch].target
    their_commit = rugged.lookup(source_sha)

    if our_commit && their_commit
      !rugged.merge_commits(our_commit, their_commit).conflicts?
    else
      false
    end
  end

950
  def ff_merge(user, source, target_branch, merge_request: nil)
951
    our_commit = rugged.branches[target_branch].target
952 953 954 955 956 957
    their_commit =
      if source.is_a?(Gitlab::Git::Commit)
        source.raw_commit
      else
        rugged.lookup(source)
      end
958 959 960 961

    raise "Invalid merge target" if our_commit.nil?
    raise "Invalid merge source" if their_commit.nil?

Ruben Davila's avatar
Ruben Davila committed
962
    update_branch_with_hooks(user, target_branch) do
963 964 965
      merge_request.update(in_progress_merge_commit_sha: their_commit.oid) if merge_request
      their_commit.oid
    end
966 967
  end

968 969 970
  def merge(user, merge_request, options = {})
    our_commit = rugged.branches[merge_request.target_branch].target
    their_commit = rugged.lookup(merge_request.diff_head_sha)
971 972 973 974 975 976 977

    raise "Invalid merge target" if our_commit.nil?
    raise "Invalid merge source" if their_commit.nil?

    merge_index = rugged.merge_commits(our_commit, their_commit)
    return false if merge_index.conflicts?

978
    update_branch_with_hooks(user, merge_request.target_branch) do
979 980 981 982
      actual_options = options.merge(
        parents: [our_commit, their_commit],
        tree: merge_index.write_tree(rugged),
      )
983

984 985 986
      commit_id = Rugged::Commit.create(rugged, actual_options)
      merge_request.update(in_progress_merge_commit_sha: commit_id)
      commit_id
987
    end
988 989
  end

990
  def revert(user, commit, base_branch, revert_tree_id = nil)
991
    source_sha = find_branch(base_branch).target.sha
992
    revert_tree_id ||= check_revert_content(commit, base_branch)
993

994
    return false unless revert_tree_id
995

996
    update_branch_with_hooks(user, base_branch) do
997
      committer = user_to_committer(user)
998
      source_sha = Rugged::Commit.create(rugged,
999
        message: commit.revert_message,
1000 1001
        author: committer,
        committer: committer,
1002
        tree: revert_tree_id,
1003
        parents: [rugged.lookup(source_sha)])
1004
    end
1005 1006
  end

1007
  def cherry_pick(user, commit, base_branch, cherry_pick_tree_id = nil)
1008
    source_sha = find_branch(base_branch).target.sha
1009 1010 1011 1012
    cherry_pick_tree_id ||= check_cherry_pick_content(commit, base_branch)

    return false unless cherry_pick_tree_id

1013
    update_branch_with_hooks(user, base_branch) do
1014 1015 1016 1017 1018 1019 1020 1021 1022 1023
      committer = user_to_committer(user)
      source_sha = Rugged::Commit.create(rugged,
        message: commit.message,
        author: {
          email: commit.author_email,
          name: commit.author_name,
          time: commit.authored_date
        },
        committer: committer,
        tree: cherry_pick_tree_id,
1024
        parents: [rugged.lookup(source_sha)])
1025 1026 1027
    end
  end

Douwe Maan's avatar
Douwe Maan committed
1028
  def resolve_conflicts(user, branch, params)
1029
    update_branch_with_hooks(user, branch) do
Douwe Maan's avatar
Douwe Maan committed
1030 1031 1032 1033 1034 1035
      committer = user_to_committer(user)

      Rugged::Commit.create(rugged, params.merge(author: committer, committer: committer))
    end
  end

1036
  def check_revert_content(commit, base_branch)
1037
    source_sha = find_branch(base_branch).target.sha
1038
    args       = [commit.id, source_sha]
1039
    args << { mainline: 1 } if commit.merge_commit?
1040 1041 1042 1043 1044 1045 1046 1047 1048 1049

    revert_index = rugged.revert_commit(*args)
    return false if revert_index.conflicts?

    tree_id = revert_index.write_tree(rugged)
    return false unless diff_exists?(source_sha, tree_id)

    tree_id
  end

1050
  def check_cherry_pick_content(commit, base_branch)
1051
    source_sha = find_branch(base_branch).target.sha
1052
    args       = [commit.id, source_sha]
1053
    args << 1 if commit.merge_commit?
1054 1055 1056 1057 1058 1059 1060 1061 1062 1063

    cherry_pick_index = rugged.cherrypick_commit(*args)
    return false if cherry_pick_index.conflicts?

    tree_id = cherry_pick_index.write_tree(rugged)
    return false unless diff_exists?(source_sha, tree_id)

    tree_id
  end

1064 1065
  def diff_exists?(sha1, sha2)
    rugged.diff(sha1, sha2).size > 0
1066 1067
  end

1068 1069 1070 1071 1072
  def merged_to_root_ref?(branch_name)
    branch_commit = commit(branch_name)
    root_ref_commit = commit(root_ref)

    if branch_commit
1073
      is_ancestor?(branch_commit.id, root_ref_commit.id)
1074 1075 1076 1077 1078
    else
      nil
    end
  end

1079 1080 1081 1082 1083
  def fetch_upstream(url)
    add_remote(Repository::MIRROR_REMOTE, url)
    fetch_remote(Repository::MIRROR_REMOTE)
  end

1084
  def fetch_geo_mirror(url)
1085 1086 1087
    add_remote(Repository::MIRROR_GEO, url)
    set_remote_as_mirror(Repository::MIRROR_GEO)
    fetch_remote_forced!(Repository::MIRROR_GEO)
1088 1089
  end

1090
  def upstream_branches
1091
    @upstream_branches ||= remote_branches(Repository::MIRROR_REMOTE)
1092 1093
  end

1094 1095 1096 1097 1098 1099
  def diverged_from_upstream?(branch_name)
    branch_commit = commit(branch_name)
    upstream_commit = commit("refs/remotes/#{MIRROR_REMOTE}/#{branch_name}")

    if upstream_commit
      !is_ancestor?(branch_commit.id, upstream_commit.id)
1100 1101 1102 1103 1104 1105 1106 1107 1108 1109 1110
    else
      false
    end
  end

  def upstream_has_diverged?(branch_name, remote_ref)
    branch_commit = commit(branch_name)
    upstream_commit = commit("refs/remotes/#{remote_ref}/#{branch_name}")

    if upstream_commit
      !is_ancestor?(upstream_commit.id, branch_commit.id)
1111 1112 1113 1114 1115
    else
      false
    end
  end

1116 1117 1118 1119 1120 1121 1122 1123 1124 1125 1126
  def up_to_date_with_upstream?(branch_name)
    branch_commit = commit(branch_name)
    upstream_commit = commit("refs/remotes/#{MIRROR_REMOTE}/#{branch_name}")

    if upstream_commit
      is_ancestor?(branch_commit.id, upstream_commit.id)
    else
      false
    end
  end

1127
  def merge_base(first_commit_id, second_commit_id)
1128 1129
    first_commit_id = commit(first_commit_id).try(:id) || first_commit_id
    second_commit_id = commit(second_commit_id).try(:id) || second_commit_id
1130
    rugged.merge_base(first_commit_id, second_commit_id)
Douwe Maan's avatar
Douwe Maan committed
1131 1132
  rescue Rugged::ReferenceError
    nil
1133 1134
  end

1135 1136 1137 1138
  def is_ancestor?(ancestor_id, descendant_id)
    merge_base(ancestor_id, descendant_id) == ancestor_id
  end

1139 1140
  def search_files(query, ref)
    offset = 2
1141
    args = %W(#{Gitlab.config.git.bin_path} grep -i -I -n --before-context #{offset} --after-context #{offset} -E -e #{Regexp.escape(query)} #{ref || root_ref})
1142 1143 1144
    Gitlab::Popen.popen(args, path_to_repo).first.scrub.split(/^--$/)
  end

1145
  def fetch_ref(source_path, source_ref, target_ref)
1146
    args = %W(#{Gitlab.config.git.bin_path} fetch --no-tags -f #{source_path} #{source_ref}:#{target_ref})
1147 1148 1149
    Gitlab::Popen.popen(args, path_to_repo)
  end

1150
  def update_branch_with_hooks(current_user, branch)
1151 1152
    update_autocrlf_option

1153
    ref = Gitlab::Git::BRANCH_REF_PREFIX + branch
1154
    target_branch = find_branch(branch)
1155
    was_empty = empty?
1156

1157 1158
    # Make commit
    newrev = yield(ref)
1159

1160 1161 1162 1163
    unless newrev
      raise CommitError.new('Failed to create commit')
    end

1164 1165 1166 1167 1168
    if rugged.lookup(newrev).parent_ids.empty? || target_branch.nil?
      oldrev = Gitlab::Git::BLANK_SHA
    else
      oldrev = rugged.merge_base(newrev, target_branch.target.sha)
    end
1169

1170
    GitHooksService.new.execute(current_user, path_to_repo, oldrev, newrev, ref) do
1171
      update_ref!(ref, newrev, oldrev)
Valery Sizov's avatar
Valery Sizov committed
1172

1173
      if was_empty || !target_branch
1174 1175 1176
        # If repo was empty expire cache
        after_create if was_empty
        after_create_branch
1177 1178
      end
    end
1179 1180

    newrev
1181 1182
  end

1183 1184 1185 1186 1187
  def ls_files(ref)
    actual_ref = ref || root_ref
    raw_repository.ls_files(actual_ref)
  end

1188 1189 1190 1191
  def gitattribute(path, name)
    raw_repository.attributes(path)[name]
  end

1192 1193 1194 1195 1196 1197 1198 1199 1200 1201
  def copy_gitattributes(ref)
    actual_ref = ref || root_ref
    begin
      raw_repository.copy_gitattributes(actual_ref)
      true
    rescue Gitlab::Git::Repository::InvalidRef
      false
    end
  end

1202
  def main_language
1203
    return unless head_exists?
1204 1205

    Linguist::Repository.new(rugged, rugged.head.target_id).language
1206 1207
  end

1208
  def avatar
1209 1210
    return nil unless exists?

1211 1212
    @avatar ||= cache.fetch(:avatar) do
      AVATAR_FILES.find do |file|
1213
        blob_at_branch(root_ref, file)
1214 1215 1216 1217
      end
    end
  end

1218 1219 1220 1221
  def head_exists?
    exists? && !empty? && !rugged.head_unborn?
  end

1222 1223
  private

1224
  def cache
1225
    @cache ||= RepositoryCache.new(path_with_namespace, @project.id)
1226
  end
1227

1228 1229 1230
  def file_on_head(regex)
    tree(:head).blobs.find { |file| file.name =~ regex }
  end
1231 1232

  def tags_sorted_by_committed_date
1233
    tags.sort_by { |tag| tag.target.committed_date }
1234
  end
1235 1236 1237 1238

  def keep_around_ref_name(sha)
    "refs/keep-around/#{sha}"
  end
1239 1240 1241 1242

  def repository_event(event, tags = {})
    Gitlab::Metrics.add_event(event, { path: path_with_namespace }.merge(tags))
  end
1243
end