gitlab-org--gitlab-foss/lib/gitlab/git/diff_collection.rb

169 lines
4.2 KiB
Ruby
Raw Normal View History

# frozen_string_literal: true
# Gitaly note: JV: no RPC's here.
2017-01-04 13:43:06 -05:00
module Gitlab
module Git
class DiffCollection
include Enumerable
DEFAULT_LIMITS = { max_files: 100, max_lines: 5000 }.freeze
attr_reader :limits
delegate :max_files, :max_lines, :max_bytes, :safe_max_files, :safe_max_lines, :safe_max_bytes, to: :limits
def self.limits(options = {})
limits = {}
limits[:max_files] = options.fetch(:max_files, DEFAULT_LIMITS[:max_files])
limits[:max_lines] = options.fetch(:max_lines, DEFAULT_LIMITS[:max_lines])
limits[:max_bytes] = limits[:max_files] * 5.kilobytes # Average 5 KB per file
limits[:safe_max_files] = [limits[:max_files], DEFAULT_LIMITS[:max_files]].min
limits[:safe_max_lines] = [limits[:max_lines], DEFAULT_LIMITS[:max_lines]].min
limits[:safe_max_bytes] = limits[:safe_max_files] * 5.kilobytes # Average 5 KB per file
limits[:max_patch_bytes] = Gitlab::Git::Diff.patch_hard_limit_bytes
OpenStruct.new(limits)
end
2017-01-04 13:43:06 -05:00
def initialize(iterator, options = {})
@iterator = iterator
@limits = self.class.limits(options)
2017-05-31 15:41:25 -04:00
@enforce_limits = !!options.fetch(:limits, true)
@expanded = !!options.fetch(:expanded, true)
@offset_index = options.fetch(:offset_index, 0)
2017-01-04 13:43:06 -05:00
@line_count = 0
@byte_count = 0
@overflow = false
@empty = true
2017-01-04 13:43:06 -05:00
@array = Array.new
end
def each(&block)
@array.each(&block)
return if @overflow
return if @iterator.nil?
2018-07-06 06:01:15 -04:00
if @iterator.is_a?(Gitlab::GitalyClient::DiffStitcher)
each_gitaly_patch(&block)
else
each_serialized_patch(&block)
2017-01-04 13:43:06 -05:00
end
@populated = true
# Allow iterator to be garbage-collected. It cannot be reused anyway.
@iterator = nil
2017-01-04 13:43:06 -05:00
end
def empty?
any? # Make sure the iterator has been exercised
@empty
2017-01-04 13:43:06 -05:00
end
def overflow?
populate!
!!@overflow
end
def size
@size ||= count # forces a loop using each method
end
def real_size
populate!
if @overflow
"#{size}+"
else
size.to_s
end
end
def line_count
populate!
@line_count
end
2017-01-04 13:43:06 -05:00
def decorate!
collection = each_with_index do |element, i|
@array[i] = yield(element)
end
collection
end
2017-05-15 13:18:19 -04:00
alias_method :to_ary, :to_a
2017-01-04 13:43:06 -05:00
private
def populate!
return if @populated
each {} # force a loop through all diffs
2017-01-04 13:43:06 -05:00
nil
end
def over_safe_limits?(files)
files >= safe_max_files || @line_count > safe_max_lines || @byte_count >= safe_max_bytes
2017-01-04 13:43:06 -05:00
end
def each_gitaly_patch
i = @array.length
@iterator.each do |raw|
diff = Gitlab::Git::Diff.new(raw, expanded: !@enforce_limits || @expanded)
if raw.overflow_marker
@overflow = true
break
end
yield @array[i] = diff
i += 1
end
end
2018-07-06 06:01:15 -04:00
def each_serialized_patch
i = @array.length
2017-01-04 13:43:06 -05:00
@iterator.each_with_index do |raw, iterator_index|
@empty = false
2017-01-04 13:43:06 -05:00
if @enforce_limits && i >= max_files
2017-01-04 13:43:06 -05:00
@overflow = true
break
end
2017-05-31 15:41:25 -04:00
expanded = !@enforce_limits || @expanded
2017-01-04 13:43:06 -05:00
diff = Gitlab::Git::Diff.new(raw, expanded: expanded)
2017-01-04 13:43:06 -05:00
2017-06-06 17:28:06 -04:00
if !expanded && over_safe_limits?(i) && diff.line_count > 0
diff.collapse!
2017-01-04 13:43:06 -05:00
end
@line_count += diff.line_count
@byte_count += diff.diff.bytesize
if @enforce_limits && (@line_count >= max_lines || @byte_count >= max_bytes)
2017-01-04 13:43:06 -05:00
# This last Diff instance pushes us over the lines limit. We stop and
# discard it.
@overflow = true
break
end
# We should not yield / memoize diffs before the offset index. Though,
# we still consider the limit buffers for diffs before it.
if iterator_index >= @offset_index
yield @array[i] = diff
i += 1
end
2017-01-04 13:43:06 -05:00
end
end
end
end
end