# This module takes care of updating cache columns for Markdown-containing # fields. Use like this in the body of your class: # # include CacheMarkdownField # cache_markdown_field :foo # cache_markdown_field :bar # cache_markdown_field :baz, pipeline: :single_line # # Corresponding foo_html, bar_html and baz_html fields should exist. module CacheMarkdownField extend ActiveSupport::Concern # Increment this number every time the renderer changes its output CACHE_VERSION = 2 # changes to these attributes cause the cache to be invalidates INVALIDATED_BY = %w[author project].freeze # Knows about the relationship between markdown and html field names, and # stores the rendering contexts for the latter class FieldData def initialize @data = {} end delegate :[], :[]=, to: :@data def markdown_fields @data.keys end def html_field(markdown_field) "#{markdown_field}_html" end def html_fields markdown_fields.map {|field| html_field(field) } end end def skip_project_check? false end # Returns the default Banzai render context for the cached markdown field. def banzai_render_context(field) raise ArgumentError.new("Unknown field: #{field.inspect}") unless cached_markdown_fields.markdown_fields.include?(field) # Always include a project key, or Banzai complains project = self.project if self.respond_to?(:project) group = self.group if self.respond_to?(:group) context = cached_markdown_fields[field].merge(project: project, group: group) # Banzai is less strict about authors, so don't always have an author key context[:author] = self.author if self.respond_to?(:author) context end # Update every column in a row if any one is invalidated, as we only store # one version per row def refresh_markdown_cache options = { skip_project_check: skip_project_check? } updates = cached_markdown_fields.markdown_fields.map do |markdown_field| [ cached_markdown_fields.html_field(markdown_field), Banzai::Renderer.cacheless_render_field(self, markdown_field, options) ] end.to_h updates['cached_markdown_version'] = CacheMarkdownField::CACHE_VERSION updates.each {|html_field, data| write_attribute(html_field, data) } end def refresh_markdown_cache! updates = refresh_markdown_cache return unless persisted? && Gitlab::Database.read_write? update_columns(updates) end def cached_html_up_to_date?(markdown_field) html_field = cached_markdown_fields.html_field(markdown_field) cached = cached_html_for(markdown_field).present? && __send__(markdown_field).present? # rubocop:disable GitlabSecurity/PublicSend return false unless cached markdown_changed = attribute_changed?(markdown_field) || false html_changed = attribute_changed?(html_field) || false CacheMarkdownField::CACHE_VERSION == cached_markdown_version && (html_changed || markdown_changed == html_changed) end def invalidated_markdown_cache? cached_markdown_fields.html_fields.any? {|html_field| attribute_invalidated?(html_field) } end def attribute_invalidated?(attr) __send__("#{attr}_invalidated?") # rubocop:disable GitlabSecurity/PublicSend end def cached_html_for(markdown_field) raise ArgumentError.new("Unknown field: #{field}") unless cached_markdown_fields.markdown_fields.include?(markdown_field) __send__(cached_markdown_fields.html_field(markdown_field)) # rubocop:disable GitlabSecurity/PublicSend end included do cattr_reader :cached_markdown_fields do FieldData.new end # Always exclude _html fields from attributes (including serialization). # They contain unredacted HTML, which would be a security issue alias_method :attributes_before_markdown_cache, :attributes def attributes attrs = attributes_before_markdown_cache attrs.delete('cached_markdown_version') cached_markdown_fields.html_fields.each do |field| attrs.delete(field) end attrs end # Using before_update here conflicts with elasticsearch-model somehow before_create :refresh_markdown_cache, if: :invalidated_markdown_cache? before_update :refresh_markdown_cache, if: :invalidated_markdown_cache? end class_methods do private # Specify that a field is markdown. Its rendered output will be cached in # a corresponding _html field. Any custom rendering options may be provided # as a context. def cache_markdown_field(markdown_field, context = {}) cached_markdown_fields[markdown_field] = context html_field = cached_markdown_fields.html_field(markdown_field) invalidation_method = "#{html_field}_invalidated?".to_sym # The HTML becomes invalid if any dependent fields change. For now, assume # author and project invalidate the cache in all circumstances. define_method(invalidation_method) do changed_fields = changed_attributes.keys invalidations = changed_fields & [markdown_field.to_s, *INVALIDATED_BY] !invalidations.empty? || !cached_html_up_to_date?(markdown_field) end end end end