summaryrefslogtreecommitdiff
path: root/lib/banzai/filter/external_link_filter.rb
blob: d67d466bce85edc83c5cbd237f01984b2fb28ed8 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
module Banzai
  module Filter
    # HTML Filter to modify the attributes of external links
    class ExternalLinkFilter < HTML::Pipeline::Filter
      def call
        links.each do |node|
          href = href_to_lowercase_scheme(node["href"].to_s)

          unless node["href"].to_s == href
            node.set_attribute('href', href)
          end

          if href =~ %r{\A(https?:)?//[^/]} && external_url?(href)
            node.set_attribute('rel', 'nofollow noreferrer')
            node.set_attribute('target', '_blank')
          end
        end

        doc
      end

      private

      def links
        query = 'descendant-or-self::a[@href and not(@href = "")]'
        doc.xpath(query)
      end

      def href_to_lowercase_scheme(href)
        scheme_match = href.match(/\A(\w+):\/\//)

        if scheme_match
          scheme_match.to_s.downcase + scheme_match.post_match
        else
          href
        end
      end

      def external_url?(url)
        !url.start_with?(internal_url)
      end

      def internal_url
        @internal_url ||= Gitlab.config.gitlab.url
      end
    end
  end
end