summaryrefslogtreecommitdiff
path: root/lib/gitlab/file_finder.rb
blob: af8270c8db830a7ea21e9cca0d1465282a1af99a (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
# This class finds files in a repository by name and content
# the result is joined and sorted by file name
module Gitlab
  class FileFinder
    BATCH_SIZE = 100

    attr_reader :project, :ref

    delegate :repository, to: :project

    def initialize(project, ref)
      @project = project
      @ref = ref
    end

    def find(query)
      query = Gitlab::Search::Query.new(query) do
        filter :filename, matcher: ->(filter, blob) { blob.filename =~ /#{filter[:regex_value]}$/i }
        filter :path, matcher: ->(filter, blob) { blob.filename =~ /#{filter[:regex_value]}/i }
        filter :extension, matcher: ->(filter, blob) { blob.filename =~ /\.#{filter[:regex_value]}$/i }
      end

      by_content = find_by_content(query.term)

      already_found = Set.new(by_content.map(&:filename))
      by_filename = find_by_filename(query.term, except: already_found)

      files = (by_content + by_filename)
              .sort_by(&:filename)

      query.filter_results(files).map { |blob| [blob.filename, blob] }
    end

    private

    def find_by_content(query)
      results = repository.search_files_by_content(query, ref).first(BATCH_SIZE)
      results.map { |result| Gitlab::ProjectSearchResults.parse_search_result(result, project) }
    end

    def find_by_filename(query, except: [])
      filenames = search_filenames(query, except)

      blobs(filenames).map do |blob|
        Gitlab::SearchResults::FoundBlob.new(
          id: blob.id,
          filename: blob.path,
          basename: File.basename(blob.path, File.extname(blob.path)),
          ref: ref,
          startline: 1,
          data: blob.data,
          project: project
        )
      end
    end

    def search_filenames(query, except)
      filenames = repository.search_files_by_name(query, ref).first(BATCH_SIZE)

      filenames.delete_if { |filename| except.include?(filename) } unless except.empty?

      filenames
    end

    def blob_refs(filenames)
      filenames.map { |filename| [ref, filename] }
    end

    def blobs(filenames)
      Gitlab::Git::Blob.batch(repository, blob_refs(filenames), blob_size_limit: 1024)
    end
  end
end