BigW Consortium Gitlab

repository.rb 16.2 KB
Newer Older
1 2
require 'securerandom'

3
class Repository
4 5
  class CommitError < StandardError; end

6 7
  include Gitlab::ShellAdapter

8
  attr_accessor :path_with_namespace, :project
9

10 11 12 13 14 15 16 17
  # Remove archives older than 2 hours from the configured downloads
  # directory. Does nothing when that directory does not exist.
  def self.clean_old_archives
    downloads_dir = Gitlab.config.gitlab.repository_downloads_path

    if File.directory?(downloads_dir)
      # `-not -path <dir>` excludes the downloads directory itself
      find_args = %W(find #{downloads_dir} -not -path #{downloads_dir} -mmin +120 -delete)
      Gitlab::Popen.popen(find_args)
    end
  end

18
  # Build a repository wrapper.
  #
  # path_with_namespace - repository path relative to the repos root,
  #                       without the ".git" suffix
  # default_branch      - accepted but not used by this constructor
  # project             - project handed to decorated commits
  def initialize(path_with_namespace, default_branch = nil, project = nil)
    @path_with_namespace = path_with_namespace
    @project = project
  end
22

23 24
  # Lazily build and memoize the underlying Gitlab::Git::Repository.
  #
  # Returns nil when no path is set or when Gitlab::Git raises NoRepository.
  def raw_repository
    return nil unless path_with_namespace

    @raw_repository ||= begin
      repo = Gitlab::Git::Repository.new(path_to_repo)
      repo.autocrlf = :input
      repo
    rescue Gitlab::Git::Repository::NoRepository
      nil
    end
  end

35
  # Return absolute path to repository (memoized):
  # <repos_path>/<path_with_namespace>.git
  def path_to_repo
    @path_to_repo ||= File.expand_path(
      File.join(Gitlab.config.gitlab_shell.repos_path, path_with_namespace + ".git")
    )
  end

42 43 44 45 46 47
  # Truthy (the raw repository object) when the repository could be loaded,
  # nil otherwise.
  def exists?
    loaded_repository = raw_repository
    loaded_repository
  end

  # Whether the underlying raw repository reports itself as empty.
  def empty?
    raw_repository.empty?
  end

50 51 52 53 54 55 56 57 58 59 60 61 62
  #
  # A Git repository can contain hidden refs such as:
  #   /refs/notes/*
  #   /refs/git-as-svn/*
  #   /refs/pulls/*
  # By default these refs are not visible on the project page and are not
  # cloned to the client side.
  #
  # This method returns true if the repository has at least one branch,
  # i.e. some content visible on the project page.
  #
  def has_visible_content?
    branch_list = raw_repository.branches
    !branch_list.empty?
  end

63
  # Find a commit by id (SHA or ref name; defaults to 'HEAD') and wrap it in
  # a Commit bound to this repository's project.
  #
  # Returns nil when there is no raw repository, when nothing is found, or
  # when Rugged raises OdbError.
  def commit(id = 'HEAD')
    return nil unless raw_repository

    raw_commit = Gitlab::Git::Commit.find(raw_repository, id)
    raw_commit && Commit.new(raw_commit, @project)
  rescue Rugged::OdbError
    nil
  end

72
  # List commits reachable from `ref`, optionally restricted to `path` and
  # paged with `limit` / `offset`. Results are decorated with the project.
  #
  # NOTE(review): `skip_merges` is accepted but is not forwarded to
  # Gitlab::Git::Commit.where, so it currently has no effect.
  def commits(ref, path = nil, limit = nil, offset = nil, skip_merges = false)
    options = {
      repo: raw_repository,
      ref: ref,
      path: path,
      limit: limit,
      offset: offset,
      # --follow doesn't play well with --skip. See:
      # https://gitlab.com/gitlab-org/gitlab-ce/issues/3574#note_3040520
      follow: false
    }

    found = Gitlab::Git::Commit.where(options)
    found = Commit.decorate(found, @project) if found.present?
    found
  end

89 90
  # Commits returned by Gitlab::Git::Commit.between for `from` and `to`,
  # decorated with the project when any are present.
  def commits_between(from, to)
    found = Gitlab::Git::Commit.between(raw_repository, from, to)
    found = Commit.decorate(found, @project) if found.present?
    found
  end

95 96 97
  # Search commit messages with `git log --grep`.
  #
  # query  - pattern passed to --grep
  # ref    - ref to search (defaults to root_ref)
  # path   - optional path limiter
  # limit  - maximum number of commits (1000 by default)
  # offset - number of commits to skip
  #
  # Returns the result of `commit(sha)` for every SHA printed by git.
  def find_commits_by_message(query, ref = nil, path = nil, limit = 1000, offset = 0)
    ref ||= root_ref

    args = %W(#{Gitlab.config.git.bin_path} log #{ref} --pretty=%H --skip #{offset} --max-count #{limit} --grep=#{query})
    args = args.concat(%W(-- #{path})) if path.present?

    git_log_results = Gitlab::Popen.popen(args, path_to_repo).first.lines.map(&:chomp)
    git_log_results.map { |sha| commit(sha) }
  end

107
  # First raw branch whose name equals `name`, or nil.
  def find_branch(name)
    raw_repository.branches.find { |branch| branch.name == name }
  end

  # First raw tag whose name equals `name`, or nil.
  def find_tag(name)
    raw_repository.tags.find { |tag| tag.name == name }
  end

115 116 117 118 119 120 121 122 123 124
  # Create branch `branch_name` pointing at `target`, running Git hooks
  # around the creation.
  #
  # Returns false when `target` does not resolve to a commit; otherwise the
  # newly created branch as returned by find_branch.
  def add_branch(user, branch_name, target)
    oldrev = Gitlab::Git::BLANK_SHA
    ref    = Gitlab::Git::BRANCH_REF_PREFIX + branch_name
    target = commit(target).try(:id)

    return false unless target

    GitHooksService.new.execute(user, path_to_repo, oldrev, target, ref) do
      rugged.branches.create(branch_name, target)
    end

    expire_branches_cache
    find_branch(branch_name)
  end

130
  # Expire the cached tag names, then ask gitlab-shell to create the tag.
  def add_tag(tag_name, ref, message = nil)
    expire_tags_cache

    gitlab_shell.add_tag(path_with_namespace, tag_name, ref, message)
  end

136
  # Delete branch `branch_name`, running Git hooks around the deletion.
  # The branch cache is expired both before and after. Always returns true.
  def rm_branch(user, branch_name)
    expire_branches_cache

    branch = find_branch(branch_name)
    oldrev = branch.try(:target)
    newrev = Gitlab::Git::BLANK_SHA
    ref    = Gitlab::Git::BRANCH_REF_PREFIX + branch_name

    GitHooksService.new.execute(user, path_to_repo, oldrev, newrev, ref) do
      rugged.branches.delete(branch_name)
    end

    expire_branches_cache
    true
  end

152
  # Expire the cached tag names, then ask gitlab-shell to remove the tag.
  def rm_tag(tag_name)
    expire_tags_cache

    gitlab_shell.rm_tag(path_with_namespace, tag_name)
  end

158
  # Branch names, read through the repository cache.
  def branch_names
    cache.fetch(:branch_names) { raw_repository.branch_names }
  end

  # Tag names, read through the repository cache.
  def tag_names
    cache.fetch(:tag_names) { raw_repository.tag_names }
  end

166
  # Number of commits on the root ref, read through the repository cache.
  # Any StandardError raised while counting is swallowed and reported as 0.
  def commit_count
    cache.fetch(:commit_count) do
      begin
        raw_repository.commit_count(root_ref)
      rescue
        0
      end
    end
  end

176 177 178
  # Return repo size in megabytes
  # Read through the repository cache
  def size
    cache.fetch(:size) { raw_repository.size }
  end
181

182
  # How far `branch` has diverged from the root ref.
  #
  # Returns a hash { behind: Integer, ahead: Integer }, cached per branch
  # name. The root ref is resolved inside the cache block so a cache hit
  # does not pay for a rev-parse.
  def diverging_commit_counts(branch)
    cache.fetch(:"diverging_commit_counts_#{branch.name}") do
      # Rugged seems to throw a `ReferenceError` when given branch_names rather
      # than SHA-1 hashes
      root_ref_hash = raw_repository.rev_parse_target(root_ref).oid

      number_commits_behind = commits_between(branch.target, root_ref_hash).size
      number_commits_ahead = commits_between(root_ref_hash, branch.target).size

      { behind: number_commits_behind, ahead: number_commits_ahead }
    end
  end
193

194
  # Cache keys that double as the names of the methods computing them
  # (build_cache and rebuild_cache `send` each key).
  def cache_keys
    %i(size branch_names tag_names commit_count
       readme version contribution_guide changelog license)
  end
198

199
  # One diverging-commit-count cache key per branch.
  def branch_cache_keys
    branches.map { |branch| :"diverging_commit_counts_#{branch.name}" }
  end

  # Populate every cache entry that does not exist yet: the per-repository
  # keys first, then the diverging commit counts of each branch.
  def build_cache
    cache_keys.each do |key|
      send(key) unless cache.exist?(key)
    end

    branches.each do |branch|
      unless cache.exist?(:"diverging_commit_counts_#{branch.name}")
        diverging_commit_counts(branch)
      end
    end
  end

219 220 221 222 223 224 225 226 227 228
  # Drop the cached tag names and the memoized tag list.
  def expire_tags_cache
    tag_names_key = :tag_names
    cache.expire(tag_names_key)
    @tags = nil
  end

  # Drop the cached branch names and the memoized branch list.
  def expire_branches_cache
    branch_names_key = :branch_names
    cache.expire(branch_names_key)
    @branches = nil
  end

229
  # Expire every per-repository cache key, then the per-branch entries.
  def expire_cache
    cache_keys.each { |key| cache.expire(key) }

    expire_branch_cache
  end
236

237 238
  # Expire the diverging-commit-count entry of every branch.
  def expire_branch_cache
    branches.each do |branch|
      cache.expire(:"diverging_commit_counts_#{branch.name}")
    end
  end

243 244
  # Expire and immediately recompute every cache entry: the per-repository
  # keys first, then the diverging commit counts of each branch.
  def rebuild_cache
    cache_keys.each do |key|
      cache.expire(key)
      send(key)
    end

    branches.each do |branch|
      cache.expire(:"diverging_commit_counts_#{branch.name}")
      diverging_commit_counts(branch)
    end
  end

255 256 257 258
  # Per-instance memo used by method_missing to remember `lookup` results.
  def lookup_cache
    @lookup_cache = {} unless @lookup_cache
    @lookup_cache
  end

259 260 261 262
  # Expire only the cached branch names (the memoized branch list is kept).
  def expire_branch_names
    branch_names_key = :branch_names
    cache.expire(branch_names_key)
  end

263
  # Forward unknown methods to the raw repository.
  #
  # `lookup` calls made without a block are memoized in lookup_cache, keyed
  # by the arguments joined with ":".
  def method_missing(m, *args, &block)
    if m == :lookup && !block_given?
      lookup_cache[m] ||= {}
      lookup_cache[m][args.join(":")] ||= raw_repository.send(m, *args, &block)
    else
      raw_repository.send(m, *args, &block)
    end
  end

272 273
  # Report methods the raw repository responds to, matching the delegation
  # done in method_missing.
  def respond_to_missing?(method, include_private = false)
    raw_repository.respond_to?(method, include_private) || super
  end
275 276

  # Blob at `path` in commit `sha`; nil when `sha` is a blank ref.
  def blob_at(sha, path)
    return if Gitlab::Git.blank_ref?(sha)

    Gitlab::Git::Blob.find(self, sha, path)
  end
281

282 283 284 285
  # Raw blob identified by `oid`.
  def blob_by_oid(oid)
    blob_source = Gitlab::Git::Blob
    blob_source.raw(self, oid)
  end

286
  # Readme of the head tree, read through the repository cache.
  def readme
    cache.fetch(:readme) { tree(:head).readme }
  end
289

290
  # Top-level blob of the head tree named "version" (case-insensitive),
  # read through the repository cache. nil when there is none.
  def version
    cache.fetch(:version) do
      tree(:head).blobs.find { |file| file.name.downcase == 'version' }
    end
  end

298
  # First blob of the head tree that answers true to `contributing?`,
  # read through the repository cache. nil when there is none.
  def contribution_guide
    cache.fetch(:contribution_guide) do
      tree(:head).blobs.find { |file| file.contributing? }
    end
  end
305 306 307 308

  # First blob of the head tree whose name starts with "changelog" or
  # "history" (case-insensitive), read through the repository cache.
  def changelog
    cache.fetch(:changelog) do
      tree(:head).blobs.find { |file| file.name =~ /\A(changelog|history)/i }
    end
  end

314 315
  # Pick the most likely license blob from the head tree, read through the
  # repository cache.
  #
  # Candidates are blobs whose name starts with copying/license/licence.
  # The first pattern in `preferences` that matches a candidate wins.
  # Returns nil when no candidate matches.
  def license
    cache.fetch(:license) do
      licenses = tree(:head).blobs.select do |file|
        file.name =~ /\A(copying|license|licence)/i
      end

      preferences = [
        /\Alicen[sc]e\z/i,        # LICENSE, LICENCE
        /\Alicen[sc]e\./i,        # LICENSE.md, LICENSE.txt
        /\Acopying\z/i,           # COPYING
        /\Acopying\.(?!lesser)/i, # COPYING.txt
        /\Acopying\.lesser/i      # COPYING.LESSER
      ]

      license = nil
      preferences.each do |pattern|
        license = licenses.find { |blob| blob.name =~ pattern }
        break if license
      end

      license
    end
  end

338
  # Commit at the root ref (memoized).
  def head_commit
    @head_commit ||= commit(root_ref)
  end

  # Root tree of the head commit (memoized).
  def head_tree
    @head_tree ||= Tree.new(self, head_commit.sha, nil)
  end

  # Tree at `path` in commit `sha`.
  #
  # With sha == :head the head commit is used; when no path is given either,
  # the memoized head_tree is returned.
  def tree(sha = :head, path = nil)
    if sha == :head
      return head_tree if path.nil?

      sha = head_commit.sha
    end

    Tree.new(self, sha, path)
  end
357 358

  # Blob at `path` in the commit `branch_name` resolves to; nil when the
  # branch does not resolve to a commit.
  def blob_at_branch(branch_name, path)
    last_commit = commit(branch_name)

    blob_at(last_commit.sha, path) if last_commit
  end
367 368 369 370 371 372 373 374

  # Returns url for submodule, or nil when `ref` has no submodule at `path`
  #
  # Ex.
  #   @repository.submodule_url_for('master', 'rack')
  #   # => git@localhost:rack.git
  #
  def submodule_url_for(ref, path)
    # Resolve the submodules once instead of once per access
    modules = submodules(ref)
    return unless modules.any?

    submodule = modules[path]
    submodule['url'] if submodule
  end
383 384

  # Most recent commit reachable from `sha` that touched `path`, found with
  # `git rev-list --max-count=1`.
  def last_commit_for_path(sha, path)
    args = %W(#{Gitlab.config.git.bin_path} rev-list --max-count=1 #{sha} -- #{path})
    last_sha = Gitlab::Popen.popen(args, path_to_repo).first.strip
    commit(last_sha)
  end
389

390 391 392 393 394 395 396 397 398 399 400
  # Name for the next "patch-N" branch: one above the highest N already used
  # by a branch named exactly "patch-<digits>", or "patch-1" when none exist.
  def next_patch_branch
    highest_id = 0

    self.branch_names.each do |name|
      matched = name.match(/\Apatch-([0-9]+)\z/)
      next unless matched

      id = matched[1].to_i
      highest_id = id if id > highest_id
    end

    "patch-#{highest_id + 1}"
  end

401
  # Branches ordered by the committed date of their tip commit.
  #
  # value - 'recently_updated' (newest first), 'last_updated' (oldest
  #         first); any other value returns the branches unsorted.
  def branches_sorted_by(value)
    # Look up each tip commit once per call instead of on every comparison.
    committed_dates = Hash.new do |dates, target|
      dates[target] = commit(target).committed_date
    end

    case value
    when 'recently_updated'
      branches.sort { |a, b| committed_dates[b.target] <=> committed_dates[a.target] }
    when 'last_updated'
      branches.sort { |a, b| committed_dates[a.target] <=> committed_dates[b.target] }
    else
      branches
    end
  end
416 417

  # Contributors derived from up to 2000 commits, grouped by author email.
  #
  # Each Gitlab::Contributor gets the email, the first non-blank author name
  # seen for that email, and the number of commits in the group.
  def contributors
    recent_commits = commits(nil, nil, 2000, 0, true)

    recent_commits.group_by(&:author_email).map do |email, authored|
      contributor = Gitlab::Contributor.new
      contributor.email = email

      authored.each do |authored_commit|
        contributor.name = authored_commit.author_name if contributor.name.blank?
        contributor.commits += 1
      end

      contributor
    end
  end
435 436

  # Blob of the diffed file as of `commit`.
  def blob_for_diff(commit, diff)
    blob_at(commit.id, diff.file_path)
  end

  # Blob of the diffed file (at its old path) as of the commit's parent;
  # nil when the commit has no parent id.
  def prev_blob_for_diff(commit, diff)
    return unless commit.parent_id

    blob_at(commit.parent_id, diff.old_path)
  end
445

446 447
  # Names of refs of `ref_type` ('branch' or 'tag' in this file) that
  # contain `sha`, as printed by `git <ref_type> --contains <sha>`.
  #
  # Returns an empty array when the command output cannot be split.
  def refs_contains_sha(ref_type, sha)
    args = %W(#{Gitlab.config.git.bin_path} #{ref_type} --contains #{sha})
    names = Gitlab::Popen.popen(args, path_to_repo).first

    return [] unless names.respond_to?(:split)

    names.split("\n").map do |line|
      name = line.strip
      # Drop the "* " marker that appears in this command's output
      name.slice!('* ')
      name
    end
  end
462

463 464 465
  # Names of the branches that contain `sha`.
  def branch_names_contains(sha)
    ref_type = 'branch'
    refs_contains_sha(ref_type, sha)
  end
466

467 468
  # Names of the tags that contain `sha`.
  def tag_names_contains(sha)
    refs_contains_sha('tag', sha)
  end
470

471 472 473 474 475 476 477 478 479 480 481 482
  # Raw repository branches (memoized until expire_branches_cache).
  def branches
    return @branches if @branches

    @branches = raw_repository.branches
  end

  # Raw repository tags (memoized until expire_tags_cache).
  def tags
    return @tags if @tags

    @tags = raw_repository.tags
  end

  # Root ref reported by the raw repository (memoized).
  def root_ref
    return @root_ref if @root_ref

    @root_ref = raw_repository.root_ref
  end

Stan Hu committed
483
  # Create directory `path` on `branch` in a commit authored and committed
  # by `user`, going through commit_with_hooks.
  def commit_dir(user, path, message, branch)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        }
      }

      raw_repository.mkdir(path, options)
    end
  end
498

Stan Hu committed
499 500 501
  # Commit `content` at `path` on `branch`, authored and committed by
  # `user`, going through commit_with_hooks. `update` is passed through to
  # Gitlab::Git::Blob.commit as the file's :update option.
  def commit_file(user, path, content, message, branch, update)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        },
        file: {
          content: content,
          path: path,
          update: update
        }
      }

      Gitlab::Git::Blob.commit(raw_repository, options)
    end
  end

520
  # Remove the file at `path` on `branch` in a commit authored and
  # committed by `user`, going through commit_with_hooks.
  def remove_file(user, path, message, branch)
    commit_with_hooks(user, branch) do |ref|
      committer = user_to_committer(user)
      options = {
        committer: committer,
        author: committer,
        commit: {
          message: message,
          branch: ref
        },
        file: {
          path: path
        }
      }

      Gitlab::Git::Blob.remove(raw_repository, options)
    end
  end

Stan Hu committed
539
  # Committer/author hash for `user`: email, name and the current time.
  def user_to_committer(user)
    {
      email: user.email,
      name: user.name,
      time: Time.now
    }
  end

  # Whether `source_sha` merges into `target_branch` without conflicts.
  #
  # Returns false when the target branch does not exist or either side
  # cannot be resolved.
  def can_be_merged?(source_sha, target_branch)
    # A missing branch yields nil here; guard before asking for its target
    # so the nil check below is actually reachable.
    branch = rugged.branches[target_branch]
    our_commit = branch && branch.target
    their_commit = rugged.lookup(source_sha)

    if our_commit && their_commit
      !rugged.merge_commits(our_commit, their_commit).conflicts?
    else
      false
    end
  end

558
  # Merge `source_sha` into `target_branch` with a merge commit created
  # through commit_with_hooks.
  #
  # options - extra options merged into the Rugged::Commit.create options
  #
  # Returns false when the merge has conflicts.
  # Raises RuntimeError when the target branch or source cannot be resolved.
  def merge(user, source_sha, target_branch, options = {})
    # A missing branch yields nil here; guard before asking for its target
    # so "Invalid merge target" is raised instead of NoMethodError.
    branch = rugged.branches[target_branch]
    our_commit = branch && branch.target
    their_commit = rugged.lookup(source_sha)

    raise "Invalid merge target" if our_commit.nil?
    raise "Invalid merge source" if their_commit.nil?

    merge_index = rugged.merge_commits(our_commit, their_commit)
    return false if merge_index.conflicts?

    commit_with_hooks(user, target_branch) do |ref|
      actual_options = options.merge(
        parents: [our_commit, their_commit],
        tree: merge_index.write_tree(rugged),
        update_ref: ref
      )

      Rugged::Commit.create(rugged, actual_options)
    end
  end

579 580 581 582 583
  # Whether the tip of `branch_name` is an ancestor of the root ref's tip.
  # Returns nil when the branch does not resolve to a commit.
  def merged_to_root_ref?(branch_name)
    branch_commit = commit(branch_name)
    root_ref_commit = commit(root_ref)

    is_ancestor?(branch_commit.id, root_ref_commit.id) if branch_commit
  end

590 591 592 593
  # Merge base of the two commits, as computed by Rugged.
  def merge_base(first_commit_id, second_commit_id)
    commit_ids = [first_commit_id, second_commit_id]
    rugged.merge_base(*commit_ids)
  end

594 595 596 597 598
  # True when the merge base of the two commits is `ancestor_id` itself.
  def is_ancestor?(ancestor_id, descendant_id)
    common_ancestor = merge_base(ancestor_id, descendant_id)
    common_ancestor == ancestor_id
  end


599 600
  # Case-insensitive `git grep` for `query` in `ref` (root_ref when nil),
  # with two lines of context before and after each match.
  #
  # Returns the scrubbed output split on the "--" separator lines.
  def search_files(query, ref)
    context_lines = 2
    args = %W(#{Gitlab.config.git.bin_path} grep -i -n --before-context #{context_lines} --after-context #{context_lines} -e #{query} #{ref || root_ref})
    Gitlab::Popen.popen(args, path_to_repo).first.scrub.split(/^--$/)
  end

605
  # Parse one chunk produced by search_files.
  #
  # The first "ref:filename:line:" line supplies the ref and filename, and
  # the start line of the chunk (match line minus its index in the chunk).
  # `data` is the chunk with those prefixes stripped from each line.
  #
  # Returns an OpenStruct with filename, ref, startline and data. When no
  # match line is present, filename and ref are nil, startline is 0 and the
  # ref/filename prefixes are not stripped.
  def parse_search_result(result)
    ref = nil
    filename = nil
    startline = 0

    result.each_line.each_with_index do |line, index|
      next unless line =~ /^.*:.*:\d+:/

      ref, filename, startline = line.split(':')
      startline = startline.to_i - index
      break
    end

    # `to_s` keeps `sub` from raising TypeError when no match line was found
    ref_prefix = ref.to_s
    file_prefix = filename.to_s

    data = ""
    result.each_line do |line|
      data << line.sub(ref_prefix, '').sub(file_prefix, '').sub(/^:-\d+-/, '').sub(/^::\d+:/, '')
    end

    OpenStruct.new(
      filename: filename,
      ref: ref,
      startline: startline,
      data: data
    )
  end

632
  # Force-fetch `source_ref` from the repository at `source_path` into
  # `target_ref` of this repository. Returns whatever Popen returns.
  def fetch_ref(source_path, source_ref, target_ref)
    args = %W(#{Gitlab.config.git.bin_path} fetch -f #{source_path} #{source_ref}:#{target_ref})
    Gitlab::Popen.popen(args, path_to_repo)
  end

637
  # Yield a random temporary ref ("refs/tmp/<hex>/head") and delete it
  # afterwards, whether or not the block raised.
  #
  # When `oldrev` is given and is not a blank ref, the temporary ref is
  # first created pointing at it. Returns the block's value.
  def with_tmp_ref(oldrev = nil)
    random_string = SecureRandom.hex
    tmp_ref = "refs/tmp/#{random_string}/head"

    if oldrev && !Gitlab::Git.blank_ref?(oldrev)
      rugged.references.create(tmp_ref, oldrev)
    end

    # Make commit in tmp ref
    yield(tmp_ref)
  ensure
    begin
      rugged.references.delete(tmp_ref)
    rescue StandardError
      # Best-effort cleanup: a failed delete must not mask the block's
      # result or exception.
      nil
    end
  end

  # Run the given block to create a commit on a temporary ref, then move
  # `branch` to that commit inside GitHooksService#execute.
  #
  # The block receives the temporary ref and must return the new revision.
  # On an empty repository the branch is created; otherwise it is updated,
  # but only if its head is still the revision seen before the commit.
  #
  # Raises CommitError when the block returns no revision or when the
  # branch head changed in the meantime.
  #
  # NOTE(review): on a non-empty repository find_branch may return nil for
  # an unknown branch, which raises NoMethodError here - confirm callers
  # only pass existing branches.
  def commit_with_hooks(current_user, branch)
    oldrev = Gitlab::Git::BLANK_SHA
    ref = Gitlab::Git::BRANCH_REF_PREFIX + branch
    was_empty = empty?

    oldrev = find_branch(branch).target unless was_empty

    with_tmp_ref(oldrev) do |tmp_ref|
      # Make commit in tmp ref
      newrev = yield(tmp_ref)

      raise CommitError, 'Failed to create commit' unless newrev

      GitHooksService.new.execute(current_user, path_to_repo, oldrev, newrev, ref) do
        if was_empty
          # Create branch
          rugged.references.create(ref, newrev)
        else
          # Update head
          current_head = find_branch(branch).target

          # Make sure target branch was not changed during pre-receive hook
          if current_head == oldrev
            rugged.references.update(ref, newrev)
          else
            raise CommitError, 'Commit was rejected because branch received new push'
          end
        end
      end
    end
  end

687 688 689 690 691
  # Files listed by the raw repository at `ref` (root_ref when nil).
  def ls_files(ref)
    raw_repository.ls_files(ref || root_ref)
  end

692 693
  private

694 695 696
  # RepositoryCache for this repository's path (memoized).
  def cache
    return @cache if @cache

    @cache = RepositoryCache.new(path_with_namespace)
  end
697
end