# Source: danger/commit_messages/Dangerfile (blob 241462234c576991177de98047773f8aff08a537)
# frozen_string_literal: true

require 'json'

# Guide on writing good Git commit messages.
URL_GIT_COMMIT = 'https://chris.beams.io/posts/git-commit/'
# Section of the same guide about keeping the subject within 50 characters.
URL_LIMIT_SUBJECT = "#{URL_GIT_COMMIT}#limit-50".freeze

# rubocop: disable Style/SignalException
# rubocop: disable Metrics/CyclomaticComplexity
# rubocop: disable Metrics/PerceivedComplexity

# Perform various checks against commits. We're not using
# https://github.com/jonallured/danger-commit_lint because its output is not
# very helpful, and it doesn't offer the means of ignoring merge commits.

# Detects Markdown-style emoji codes (such as `:+1:`) in a piece of text, based
# on the emoji names and aliases listed in two JSON fixture files.
class EmojiChecker
  DIGESTS = File.expand_path('../../fixtures/emojis/digests.json', __dir__)
  ALIASES = File.expand_path('../../fixtures/emojis/aliases.json', __dir__)

  # Cheap pre-filter for text that _might_ contain an emoji code. A match is
  # not proof (`:foo:bar:baz` matches too); it only lets us skip the scan over
  # every known emoji name when the text cannot possibly contain one.
  LIKELY_EMOJI = /:[\+a-z0-9_\-]+:/

  # Reads the top-level keys of both fixture files (digests first, then
  # aliases) and stores each one wrapped in colons, e.g. `:smile:`.
  def initialize
    @emoji = [DIGESTS, ALIASES].flat_map do |path|
      JSON.parse(File.read(path)).keys.map { |name| ":#{name}:" }
    end
  end

  # Returns true when +text+ contains at least one known emoji code, and false
  # otherwise.
  def includes_emoji?(text)
    text.match?(LIKELY_EMOJI) && @emoji.any? { |code| text.include?(code) }
  end
end

# Reports a failure for +commit+, prefixing +message+ with the commit's SHA so
# the reader can tell which commit it applies to.
#
# NOTE(review): `fail` is presumably Danger's failure reporter rather than
# Kernel#fail (the file disables Style/SignalException) - confirm.
def fail_commit(commit, message)
  sha = commit.sha
  fail("#{sha}: #{message}")
end

# Emits a warning for +commit+, prefixing +message+ with the commit's SHA so
# the reader can tell which commit it applies to.
def warn_commit(commit, message)
  sha = commit.sha
  warn("#{sha}: #{message}")
end

# Returns the total number of changed lines reported by the statistics of the
# diff between +commit+ and its parent.
def lines_changed_in_commit(commit)
  totals = commit.diff_parent.stats[:total]
  totals[:lines]
end

# Returns true when the first character of +subject+ is unchanged by upcasing.
#
# Characters without a case (digits, punctuation) are therefore accepted; only
# a leading lowercase letter is rejected. An empty or nil subject has no first
# character and returns false instead of raising NoMethodError.
def subject_starts_with_capital?(subject)
  first_char = subject.to_s[0]
  return false unless first_char

  first_char.upcase == first_char
end

# Returns true when the merge request's labels include "CE upstream".
def ce_upstream?
  gitlab.mr_labels.include?('CE upstream')
end

# Returns true when +commit+ touches more than 3 files and changes 30 or more
# lines in total, according to the statistics of the diff against its parent.
#
# The diff statistics are fetched once and reused for both thresholds, so the
# parent diff is not requested a second time for the line count.
#
# NOTE(review): the failure message in lint_commits says "at least three
# files", while this check requires more than three - confirm which threshold
# is intended.
def too_many_changed_lines?(commit)
  totals = commit.diff_parent.stats[:total]

  totals[:files] > 3 && totals[:lines] >= 30
end

# Lints the message of every commit in +commits+ and reports the problems.
#
# Commits whose message starts with "Merge branch" or 'Revert "' are skipped.
# For every other commit the subject, the separator line and the body are
# checked; violations are reported with fail_commit, except the soft
# 50-character subject limit, which is reported with warn_commit. When at least
# one failure was reported, a Markdown explanation of the commit message
# standards is emitted once after all commits were processed.
#
# commits - a collection of commit objects responding to `message` and `sha`;
#           `diff_parent` is additionally used for commits without a body.
def lint_commits(commits)
  failures = false
  emoji_checker = EmojiChecker.new

  unicode_emoji_regex = %r((
    [\u{1F300}-\u{1F5FF}] |
    [\u{1F1E6}-\u{1F1FF}] |
    [\u{2700}-\u{27BF}] |
    [\u{1F900}-\u{1F9FF}] |
    [\u{1F600}-\u{1F64F}] |
    [\u{1F680}-\u{1F6FF}] |
    [\u{2600}-\u{26FF}]
  ))x

  commits.each do |commit|
    # For now we'll ignore merge commits, as getting rid of those is a problem
    # separate from enforcing good commit messages.
    next if commit.message.start_with?('Merge branch')

    # We ignore revert commits as they are well structured by Git already
    next if commit.message.start_with?('Revert "')

    # Line 1 is the subject, line 2 must be blank, everything else is the body.
    subject, separator, details = commit.message.split("\n", 3)

    # Splitting an empty message yields no parts at all. Fall back to an empty
    # subject so such a commit is reported as a failure below instead of
    # aborting the whole run with a NoMethodError.
    subject ||= ''

    if subject.split.length < 3
      fail_commit(
        commit,
        'The commit subject must contain at least three words'
      )

      failures = true
    end

    if subject.length > 72
      fail_commit(
        commit,
        'The commit subject may not be longer than 72 characters'
      )

      failures = true
    elsif subject.length > 50
      # Between 51 and 72 characters is tolerated, so this is only a warning
      # and does not count as a failure.
      warn_commit(
        commit,
        "This commit's subject line is acceptable, but please try to [reduce it to 50 characters](#{URL_LIMIT_SUBJECT})."
      )
    end

    # An empty subject has no first character to inspect, and it has already
    # been reported by the word-count check above.
    if !subject.empty? && !subject_starts_with_capital?(subject)
      fail_commit(commit, 'The commit subject must start with a capital letter')
      failures = true
    end

    if subject.end_with?('.')
      fail_commit(commit, 'The commit subject must not end with a period')
      failures = true
    end

    if separator && !separator.empty?
      fail_commit(
        commit,
        'The commit subject and body must be separated by a blank line'
      )

      failures = true
    end

    details&.each_line do |line|
      line = line.strip

      next if line.length <= 72

      url_size = line.scan(%r((https?://\S+))).sum { |(url)| url.length }

      # If the line includes a URL, we'll allow it to exceed 72 characters, but
      # only if the line _without_ the URL does not exceed this limit.
      next if line.length - url_size <= 72

      fail_commit(
        commit,
        'The commit body should not contain more than 72 characters per line'
      )

      failures = true
    end

    # NOTE(review): too_many_changed_lines? requires more than three files,
    # while the message below says "at least three" - confirm which threshold
    # is intended.
    if !details && too_many_changed_lines?(commit)
      fail_commit(
        commit,
        'Commits that change 30 or more lines across at least three files ' \
          'must describe these changes in the commit body'
      )

      failures = true
    end

    if emoji_checker.includes_emoji?(commit.message)
      fail_commit(
        commit,
        'Avoid the use of Markdown Emoji such as `:+1:`. ' \
          'These add no value to the commit message, ' \
          'and are displayed as plain text outside of GitLab'
      )

      failures = true
    end

    if commit.message.match?(unicode_emoji_regex)
      fail_commit(
        commit,
        'Avoid the use of Unicode Emoji. ' \
          'These add no value to the commit message, ' \
          'and may not be displayed properly everywhere'
      )

      failures = true
    end

    # Matches short references: an optional path-like prefix followed by one
    # of `#`, `!`, `&` or `%` and a number.
    if commit.message.match?(%r(([\w\-\/]+)?(#|!|&|%)\d+\b))
      fail_commit(
        commit,
        'Use full URLs instead of short references ' \
          '(`gitlab-org/gitlab-ce#123` or `!123`), as short references are ' \
          'displayed as plain text outside of GitLab'
      )

      failures = true
    end
  end

  if failures
    markdown(<<~MARKDOWN)
      ## Commit message standards

      One or more commit messages do not meet our Git commit message standards.
      For more information on how to write a good commit message, take a look at
      [How to Write a Git Commit Message](#{URL_GIT_COMMIT}).

      Here is an example of a good commit message:

          Reject ruby interpolation in externalized strings

          When using ruby interpolation in externalized strings, they can't be
          detected. Which means they will never be presented to be translated.

          To mix variables into translations we need to use `sprintf`
          instead.

          Instead of:

              _("Hello \#{subject}")

          Use:

              _("Hello %{subject}") % { subject: 'world' }

      This is an example of a bad commit message:

          updated README.md

      This commit message is bad because although it tells us that README.md is
      updated, it doesn't tell us why or how it was updated.
    MARKDOWN
  end
end

# Lint each commit individually unless the merge request has more than 10
# commits and lacks the "CE upstream" label; in that case only ask for the
# commits to be rebased into a smaller number.
if git.commits.length <= 10 || ce_upstream?
  lint_commits(git.commits)
else
  warn(
    'This merge request includes more than 10 commits. ' \
      'Please rebase these commits into a smaller number of commits.'
  )
end