discourse/lib/cooked_post_processor.rb

# frozen_string_literal: true

# Post processing that we can do after a post has already been cooked.
# For example, inserting the onebox content, or image sizes/thumbnails.

class CookedPostProcessor
  LIGHTBOX_WRAPPER_CSS_CLASS = "lightbox-wrapper"
  LOADING_SIZE = 10
  LOADING_COLORS = 32

  attr_reader :cooking_options, :doc

  # Builds a processor for +post+.
  #
  # post - the post to process; it is re-cooked from its raw content here.
  # opts - options hash; :cooking_options, :disable_loading_image and (later,
  #        in other methods) :image_sizes, :invalidate_oneboxes and
  #        :skip_pull_hotlinked_images are read from it.
  def initialize(post, opts = {})
    @post = post
    @opts = opts
    @dirty = false
    @size_cache = {}

    # keep a copy of the cooked HTML as it was before processing (see #dirty?)
    @previous_cooked = (@post.cooked || "").dup

    # NOTE: we re-cook the post here in order to prevent timing issues with edits
    # cf. https://meta.discourse.org/t/edit-of-rebaked-post-doesnt-show-in-html-only-in-raw/33815/6
    # NOTE(review): the topic id is written into whichever hash was picked
    # (possibly the post's own or the caller's) before it is symbolized.
    options = post.cooking_options || opts[:cooking_options] || {}
    options[:topic_id] = post.topic_id
    @cooking_options = options.symbolize_keys

    @doc = Nokogiri::HTML5::fragment(post.cook(post.raw, @cooking_options))
    @has_oneboxes = post.post_analyzer.found_oneboxes?

    @disable_loading_image = !!opts[:disable_loading_image]
    @omit_nofollow = post.omit_nofollow?
  end

  # Runs every post-processing step, in order, against the re-cooked document.
  #
  # The whole pipeline runs inside a DistributedMutex keyed on the post id
  # (validity: 10 minutes). The :before_post_process_cooked and
  # :post_process_cooked events are triggered with the document and the post
  # before and after the steps.
  #
  # new_post - when true, remove_full_quote_on_direct_reply is run first.
  #
  # The block handed to the mutex evaluates to nil.
  def post_process(new_post: false)
    DistributedMutex.synchronize("post_process_#{@post.id}", validity: 10.minutes) do
      DiscourseEvent.trigger(:before_post_process_cooked, @doc, @post)
      remove_full_quote_on_direct_reply if new_post
      post_process_oneboxes
      post_process_images
      post_process_quotes
      optimize_urls
      remove_user_ids
      update_post_image
      enforce_nofollow
      pull_hotlinked_images
      grant_badges
      @post.link_post_uploads(fragments: @doc)
      DiscourseEvent.trigger(:post_process_cooked, @doc, @post)
      nil
    end
  end

  # True when the document contains at least one emoji image that is not
  # also matched by the ".quote img" selector.
  def has_emoji?
    all_emojis = @doc.css("img.emoji")
    quoted_images = @doc.css(".quote img")
    !(all_emojis - quoted_images).size.zero?
  end

  # Grants the FirstEmoji, FirstOnebox and FirstReplyByEmail badges to the
  # post's author when the matching condition holds.
  #
  # Nothing is granted when the post has no user or when a Guardian built
  # without a user cannot see the post.
  def grant_badges
    return if @post.user.blank?
    return unless Guardian.new.can_see?(@post)

    award = ->(badge_id) { BadgeGranter.grant(Badge.find(badge_id), @post.user, post_id: @post.id) }

    award.(Badge::FirstEmoji) if has_emoji?
    award.(Badge::FirstOnebox) if @has_oneboxes
    award.(Badge::FirstReplyByEmail) if @post.is_reply_by_email?
  end

  # Adds the "quote-modified" class to every aside.quote whose blockquote text
  # is reported as modified by QuoteComparer. Quotes missing either the
  # data-post or the data-topic attribute are left alone.
  def post_process_quotes
    @doc.css("aside.quote").each do |quote|
      post_number = quote['data-post']
      topic_id = quote['data-topic']
      next unless topic_id && post_number

      quoted_text = quote.css('blockquote').text
      comparer = QuoteComparer.new(topic_id.to_i, post_number.to_i, quoted_text)
      next unless comparer.modified?

      quote['class'] = "#{quote['class']} quote-modified".strip
    end
  end

  # Strips a leading full quote from the post's raw when the quote reproduces
  # the whole text of the previous regular, non-hidden post in the topic.
  #
  # Does nothing when the remove_full_quote site setting is off, when this is
  # post number 1, or when the document does not contain exactly one
  # top-level quote aside. When the raw changes, the post is revised as the
  # system user with validations skipped and without bumping.
  def remove_full_quote_on_direct_reply
    return if !SiteSetting.remove_full_quote
    return if @post.post_number == 1
    return if @doc.xpath("aside[contains(@class, 'quote')]").size != 1

    # cooked HTML of the closest earlier regular, visible post in the topic
    previous = Post
      .where("post_number < ? AND topic_id = ? AND post_type = ? AND NOT hidden", @post.post_number, @post.topic_id, Post.types[:regular])
      .order("post_number DESC")
      .limit(1)
      .pluck(:cooked)
      .first

    return if previous.blank?

    previous_text = Nokogiri::HTML5::fragment(previous).text.strip
    quoted_text = @doc.css("aside.quote:first-child blockquote").first&.text&.strip || ""

    # compare both texts with runs of whitespace collapsed to a single character
    return if previous_text.gsub(/(\s){2,}/, '\1') != quoted_text.gsub(/(\s){2,}/, '\1')

    # drop the leading [quote]...[/quote] block from the raw
    quote_regexp = /\A\s*\[quote.+\[\/quote\]/im
    quoteless_raw = @post.raw.sub(quote_regexp, "").strip

    # nothing was removed, so there is nothing to revise
    return if @post.raw.strip == quoteless_raw

    PostRevisor.new(@post).revise!(
      Discourse.system_user,
      {
        raw: quoteless_raw,
        edit_reason: I18n.t(:removed_direct_reply_full_quotes)
      },
      skip_validations: true,
      bypass_bump: true
    )
  end

  # Replaces +img+ with a placeholder when its src (with any leading http: or
  # https: removed) is listed among the large or the broken images.
  #
  # Returns the result of the placeholder helper that was used, or false when
  # the image is in neither list.
  def add_image_placeholder!(img)
    schemeless_src = img["src"].sub(/^https?:/i, "")

    return add_large_image_placeholder!(img) if large_images.include?(schemeless_src)
    return add_broken_image_placeholder!(img) if broken_images.include?(schemeless_src)

    false
  end

  # Replaces +img+ with a "large-image-placeholder" div holding an external
  # link to the image URL, an icon and a "too large" help text.
  #
  # When the image sits inside a link, the placeholder is moved out of its
  # former parent; if that parent is an <a> with an href, it is either removed
  # (same URL as the image) or kept as an extra "link" entry inside the
  # placeholder.
  #
  # Always returns true.
  def add_large_image_placeholder!(img)
    url = img["src"]

    # must be computed before the image is re-parented below
    is_hyperlinked = is_a_hyperlink?(img)

    # wrap the image in the placeholder div
    placeholder = create_node("div", "large-image-placeholder")
    img.add_next_sibling(placeholder)
    placeholder.add_child(img)

    # external link to the original image, placed after the image
    a = create_link_node(nil, url, true)
    img.add_next_sibling(a)

    # link content: icon, url, help text
    span = create_span_node("url", url)
    a.add_child(span)
    span.add_previous_sibling(create_icon_node("far-image"))
    span.add_next_sibling(create_span_node("help", I18n.t("upload.placeholders.too_large", max_size_kb: SiteSetting.max_image_size_kb)))

    # Only if the image is already linked
    if is_hyperlinked
      # move the placeholder out of its current parent
      parent = placeholder.parent
      parent.add_next_sibling(placeholder)

      if parent.name == 'a' && parent["href"].present?
        if url == parent["href"]
          # the link pointed at the image itself, it is redundant now
          parent.remove
        else
          # keep the original link as a separate entry before the image link
          parent["class"] = "link"
          a.add_previous_sibling(parent)

          lspan = create_span_node("url", parent["href"])
          parent.add_child(lspan)
          lspan.add_previous_sibling(create_icon_node("link"))
        end
      end
    end

    img.remove
    true
  end

  # Turns +img+ into a <span class="broken-image"> carrying a translated title
  # and an "unlink" icon, and drops its src, width and height attributes.
  #
  # Always returns true.
  def add_broken_image_placeholder!(img)
    img.name = "span"

    replacement_attributes = {
      "class" => "broken-image",
      "title" => I18n.t("post.image_placeholder.broken")
    }
    replacement_attributes.each { |attribute, value| img.set_attribute(attribute, value) }

    img << "<svg class=\"fa d-icon d-icon-unlink svg-icon\" aria-hidden=\"true\"><use xlink:href=\"#unlink\"></use></svg>"

    %w[src width height].each { |attribute| img.remove_attribute(attribute) }

    true
  end

  # Memoized value of the post's Post::LARGE_IMAGES custom field, or an empty
  # array when that field is blank.
  def large_images
    return @large_images if @large_images

    @large_images = @post.custom_fields[Post::LARGE_IMAGES].presence || []
  end

  # Memoized value of the post's Post::BROKEN_IMAGES custom field, or an empty
  # array when that field is blank.
  def broken_images
    return @broken_images if @broken_images

    @broken_images = @post.custom_fields[Post::BROKEN_IMAGES].presence || []
  end

  # Memoized result of @post.downloaded_images.
  def downloaded_images
    return @downloaded_images if @downloaded_images

    @downloaded_images = @post.downloaded_images
  end

  # All images with a src attribute, minus data images and minus emojis.
  def extract_images
    excluded_selectors = [
      "img[src^='data']", # data images
      "img.emoji"         # emojis
    ]

    excluded_selectors.reduce(@doc.css("img[src]")) do |remaining, selector|
      remaining - @doc.css(selector)
    end
  end

  # All images with a src attribute that may represent the post: emojis,
  # images inside quotes, onebox site icons, onebox avatars and small onebox
  # images are excluded.
  def extract_images_for_post
    excluded_selectors = [
      "img.emoji",                # emojis
      ".quote img",               # images inside quotes
      "img.site-icon",            # onebox site icons
      "img.onebox-avatar",        # onebox avatars
      ".onebox .aspect-image img" # small onebox images (large images are .aspect-image-full-size)
    ]

    excluded_selectors.reduce(@doc.css("img[src]")) do |remaining, selector|
      remaining - @doc.css(selector)
    end
  end

  # Images found inside a onebox, or carrying the "onebox" class themselves.
  def oneboxed_images
    selectors = [".onebox-body img", ".onebox img", "img.onebox"]
    @doc.css(selectors.join(", "))
  end

  # Sets the width/height attributes of +img+ to the result of
  # ImageSizer.resize. The size fed to the resizer is the first one available
  # from:
  #  1) the width/height attributes
  #  2) the dimension from the preview (image_sizes)
  #  3) the dimension of the original image (HTTP request)
  def limit_size!(img)
    dimensions = get_size_from_attributes(img)
    dimensions ||= get_size_from_image_sizes(img["src"], @opts[:image_sizes])
    dimensions ||= get_size(img["src"])
    w, h = dimensions

    # limit the size of the thumbnail
    img["width"], img["height"] = ImageSizer.resize(w, h)
  end

  # Derives [width, height] from the width/height attributes of +img+.
  #
  # When both are positive they are returned as is. When only one is positive
  # the other is scaled from the original image size (get_size) using the
  # same ratio. Returns nil when neither is positive or when the original
  # size cannot be obtained.
  def get_size_from_attributes(img)
    width = img["width"].to_i
    height = img["height"].to_i

    return [width, height] if width > 0 && height > 0
    return nil if width <= 0 && height <= 0

    # if only width or height are specified attempt to scale image
    original_image_size = get_size(img["src"])
    return unless original_image_size

    original_width, original_height = original_image_size.map(&:to_f)

    if width > 0
      scale = width.to_f / original_width
      [width, (original_height * scale).floor]
    else
      scale = height.to_f / original_height
      [(original_width * scale).floor, height]
    end
  end

  # Looks +src+ up in +image_sizes+, a collection of [url, size] entries.
  #
  # Returns [width, height] from the first entry whose url contains +src+ and
  # whose size has a positive "width" and "height"; nil when there is none or
  # when +image_sizes+ is blank.
  def get_size_from_image_sizes(src, image_sizes)
    return unless image_sizes.present?

    image_sizes.each do |entry|
      url = entry[0]
      next unless url && url.include?(src)

      size = entry[1]
      next unless size

      width, height = size["width"], size["height"]
      return [width, height] if width.to_i > 0 && height.to_i > 0
    end

    nil
  end

  # Records [w, h] as the known size of +url+, so get_size returns it
  # without looking the image up.
  def add_to_size_cache(url, w, h)
    @size_cache.store(url, [w, h])
  end

  # Returns the size of the image at +url+ as reported by FastImage.size,
  # caching the result per url.
  #
  # Returns nil when url is nil, when the resolved URL is not http(s), when
  # crawling is disabled and the image has not been uploaded to the store, or
  # when one of the rescued errors is raised (in which case nothing is cached).
  def get_size(url)
    return @size_cache[url] if @size_cache.has_key?(url)

    # a path starting with a single slash gets the site's base url prepended
    absolute_url = url
    absolute_url = Discourse.base_url_no_prefix + absolute_url if absolute_url =~ /^\/[^\/]/

    return unless absolute_url

    # FastImage fails when there's no scheme
    absolute_url = SiteSetting.scheme + ":" + absolute_url if absolute_url.start_with?("//")

    # we can't direct FastImage to our secure-media-uploads url because it bounces
    # anonymous requests with a 404 error
    if url && Upload.secure_media_url?(url)
      absolute_url = Upload.signed_url_from_secure_media_url(absolute_url)
    end

    return unless is_valid_image_url?(absolute_url)

    # we can *always* crawl our own images
    return unless SiteSetting.crawl_images? || Discourse.store.has_been_uploaded?(url)

    # cached under the original url, not the resolved one
    @size_cache[url] = FastImage.size(absolute_url)
  rescue Zlib::BufError, URI::Error, OpenSSL::SSL::SSLError
    # FastImage.size raises BufError for some gifs, leave it.
  end

  # True when +url+ parses as a URI with an http or https scheme, false for
  # any other (or missing) scheme, and nil when it cannot be parsed.
  def is_valid_image_url?(url)
    scheme = URI.parse(url).scheme
    scheme == "http" || scheme == "https"
  rescue URI::Error
    nil
  end

  # Resizes +img+ and, when the original image is larger than the configured
  # maximum dimensions, generates thumbnails for it and wraps it in a lightbox.
  #
  # Nothing beyond the initial limit_size! happens when the image has no src,
  # is already inside a link, is an SVG, has an unknown original size, or fits
  # within max_image_width x max_image_height.
  def convert_to_link!(img)
    # size requested by the user, captured before limit_size! rewrites the attributes
    w, h = img["width"].to_i, img["height"].to_i
    user_width, user_height = (w > 0 && h > 0 && [w, h]) ||
                              get_size_from_attributes(img) ||
                              get_size_from_image_sizes(img["src"], @opts[:image_sizes])

    limit_size!(img)

    src = img["src"]
    return if src.blank? || is_a_hyperlink?(img) || is_svg?(img)

    original_width, original_height = (get_size(src) || [0, 0]).map(&:to_i)
    if original_width == 0 || original_height == 0
      Rails.logger.info "Can't reach '#{src}' to get its dimension."
      return
    end

    # small enough already, no thumbnail or lightbox needed
    return if original_width <= SiteSetting.max_image_width && original_height <= SiteSetting.max_image_height

    # fall back to the original size when the user did not provide one
    user_width, user_height = [original_width, original_height] if user_width.to_i <= 0 && user_height.to_i <= 0
    width, height = user_width, user_height

    # crop when the width/height ratio is below the configured minimum
    crop = SiteSetting.min_ratio_to_crop > 0 && width.to_f / height.to_f < SiteSetting.min_ratio_to_crop

    if crop
      width, height = ImageSizer.crop(width, height)
      img["width"], img["height"] = width, height
    else
      width, height = ImageSizer.resize(width, height)
    end

    upload = Upload.get_from_url(src)
    if upload.present?
      upload.create_thumbnail!(width, height, crop: crop)

      # one extra thumbnail per responsive ratio, as long as it does not
      # exceed the width of the upload
      each_responsive_ratio do |ratio|
        resized_w = (width * ratio).to_i
        resized_h = (height * ratio).to_i

        if upload.width && resized_w <= upload.width
          upload.create_thumbnail!(resized_w, resized_h, crop: crop)
        end
      end

      # tiny thumbnail fetched back by loading_image
      unless @disable_loading_image
        upload.create_thumbnail!(LOADING_SIZE, LOADING_SIZE, format: 'png', colors: LOADING_COLORS)
      end
    end

    # no lightbox for images inside oneboxes or quotes
    if img.ancestors('.onebox, .onebox-body, .quote').blank? && !img.classes.include?("onebox")
      add_lightbox!(img, original_width, original_height, upload, cropped: crop)
    end

    if upload.present?
      optimize_image!(img, upload, cropped: crop)
    end
  end

  # The LOADING_SIZE x LOADING_SIZE thumbnail of +upload+, as returned by
  # upload.thumbnail.
  def loading_image(upload)
    side = LOADING_SIZE
    upload.thumbnail(side, side)
  end

  # True when any ancestor of +img+ is an <a> element.
  #
  # The walk stops at the first ancestor that has no parent, or that does not
  # expose #parent at all (e.g. a tree root of a different type). Without that
  # second stop condition the loop would keep re-testing the same node forever.
  def is_a_hyperlink?(img)
    node = img.parent
    while node
      return true if node.name == "a"
      break unless node.respond_to?(:parent)

      node = node.parent
    end
    false
  end

  # Yields, in ascending order, every ratio greater than 1 found in the
  # pipe-separated responsive_post_image_sizes site setting.
  def each_responsive_ratio
    ratios = SiteSetting.responsive_post_image_sizes.split('|').map(&:to_f).sort

    ratios.each do |ratio|
      yield ratio if ratio > 1
    end
  end

  # Points +img+ at the best available rendition of +upload+.
  #
  # When the upload is not animated and has a thumbnail at the image's
  # width/height that is smaller (in file size) than the upload, the image
  # uses that thumbnail and gets a srcset with one entry per responsive ratio;
  # otherwise it uses the upload itself. In both cases data-small-upload is
  # set when a loading thumbnail exists.
  #
  # img     - the image node; its width/height attributes are read.
  # upload  - the upload behind the image.
  # cropped - when true, the full-size upload is never used as a srcset entry.
  def optimize_image!(img, upload, cropped: false)
    w, h = img["width"].to_i, img["height"].to_i

    # note: optimize_urls cooks the src and data-small-upload further after this
    thumbnail = !upload.animated && upload.thumbnail(w, h)
    if thumbnail && thumbnail.filesize.to_i < upload.filesize
      img["src"] = thumbnail.url

      srcset = +""

      each_responsive_ratio do |ratio|
        resized_w = (w * ratio).to_i
        resized_h = (h * ratio).to_i
        # "2.0" is written as "2x", "1.5" stays "1.5x"
        descriptor = "#{ratio.to_s.sub(/\.0$/, "")}x"

        if !cropped && upload.width && resized_w > upload.width
          # the requested size exceeds the upload: use the upload itself
          cooked_url = UrlHelper.cook_url(upload.url, secure: @post.with_secure_media?)
          srcset << ", #{cooked_url} #{descriptor}"
        elsif t = upload.thumbnail(resized_w, resized_h)
          cooked_url = UrlHelper.cook_url(t.url, secure: @post.with_secure_media?)
          srcset << ", #{cooked_url} #{descriptor}"
        end
      end

      # written once, after all candidates are collected; src does not change
      # while the ratios are visited, so the value is the same as when it was
      # rebuilt on every iteration
      if srcset.present?
        img["srcset"] = "#{UrlHelper.cook_url(img["src"], secure: @post.with_secure_media?)}#{srcset}"
      end
    else
      img["src"] = upload.url
    end

    if small_upload = loading_image(upload)
      img["data-small-upload"] = small_upload.url
    end
  end

  # Wraps +img+ in the lightbox markup: a wrapper div containing a "lightbox"
  # link to the image, which in turn contains the image and a "meta" div
  # (icon, filename, dimensions and file size, expand icon).
  #
  # img             - the image node to wrap.
  # original_width,
  # original_height - shown in the "informations" span.
  # upload          - optional upload; provides the download href, the
  #                   filename and the human readable file size.
  # cropped         - accepted but not read in this method.
  def add_lightbox!(img, original_width, original_height, upload, cropped: false)
    # first, create a div to hold our lightbox
    lightbox = create_node("div", LIGHTBOX_WRAPPER_CSS_CLASS)
    img.add_next_sibling(lightbox)
    lightbox.add_child(img)

    # then, the link to our larger image
    src = UrlHelper.cook_url(img["src"], secure: @post.with_secure_media?)
    a = create_link_node("lightbox", src)
    img.add_next_sibling(a)

    if upload
      a["data-download-href"] = Discourse.store.download_url(upload)
    end

    # move the image inside the link
    a.add_child(img)

    # then, some overlay informations
    meta = create_node("div", "meta")
    img.add_next_sibling(meta)

    filename = get_filename(upload, img["src"])
    informations = +"#{original_width}×#{original_height}"
    informations << " #{upload.human_filesize}" if upload

    # title falls back from the image title, to its alt text, to the filename
    a["title"] = CGI.escapeHTML(img["title"] || img["alt"] || filename)

    meta.add_child create_icon_node("far-image")
    meta.add_child create_span_node("filename", a["title"])
    meta.add_child create_span_node("informations", informations)
    meta.add_child create_icon_node("discourse-expand")
  end

  # Display name for an image: the basename of +src+ when there is no upload,
  # the translated "pasted image" label when the upload's original filename
  # is "blob" or "blob.png" (case-insensitive), and the original filename
  # otherwise.
  def get_filename(upload, src)
    return File.basename(src) if !upload

    original_name = upload.original_filename
    if original_name =~ /^blob(\.png)?$/i
      I18n.t("upload.pasted_image_filename")
    else
      original_name
    end
  end

  # Creates a new +tag_name+ node attached to the current document, with its
  # class attribute set to +klass+ unless +klass+ is blank.
  def create_node(tag_name, klass)
    Nokogiri::XML::Node.new(tag_name, @doc).tap do |node|
      node["class"] = klass if klass.present?
    end
  end

  # Creates a <span> with the given class; its content is set only when
  # +content+ is given.
  def create_span_node(klass, content = nil)
    create_node("span", klass).tap do |span|
      span.content = content if content
    end
  end

  # Creates the <svg> icon node for the icon named +klass+: aria-hidden, with
  # a <use> child referencing "#<klass>".
  #
  # Returns whatever appending the <use> markup to the icon returns.
  def create_icon_node(klass)
    css_classes = "fa d-icon d-icon-#{klass} svg-icon"
    use_markup = "<use xlink:href=\"##{klass}\"></use>"

    icon = create_node("svg", css_classes)
    icon.set_attribute("aria-hidden", "true")
    icon << use_markup
  end

  # Creates an <a> with the given class and href. External links additionally
  # get target="_blank" and rel="nofollow noopener".
  def create_link_node(klass, url, external = false)
    link = create_node("a", klass)
    link["href"] = url
    return link unless external

    link["target"] = "_blank"
    link["rel"] = "nofollow noopener"
    link
  end

  # Stores, on the post (and on the topic when this is the first post), the id
  # of the first eligible image that has an Upload record, or clears the
  # stored id when there is none.
  #
  # For a first post with an image, topic thumbnails are also generated with
  # the extra sizes requested by the user-selectable themes.
  def update_post_image
    found_upload = nil
    eligible_image_fragments = extract_images_for_post

    # Loop through those fragments until we find one with an upload record
    @post.each_upload_url(fragments: eligible_image_fragments) do |_src, _path, sha1|
      found_upload = Upload.find_by(sha1: sha1)
      break if found_upload
    end

    unless found_upload.present?
      @post.update_column(:image_upload_id, nil) if @post.image_upload_id
      if @post.topic.image_upload_id && @post.is_first_post?
        @post.topic.update_column(:image_upload_id, nil)
      end
      return nil
    end

    @post.update_column(:image_upload_id, found_upload.id) # post
    return unless @post.is_first_post?

    # topic
    @post.topic.update_column(:image_upload_id, found_upload.id)
    selectable_theme_ids = Theme.user_selectable.pluck(:id)
    extra_sizes = ThemeModifierHelper.new(theme_ids: selectable_theme_ids).topic_thumbnail_sizes
    @post.topic.generate_thumbnails!(extra_sizes: extra_sizes)
  end

  # Expands oneboxes and inline oneboxes in the document, then normalizes the
  # images they contain and, when nofollow must not be applied, strips
  # "nofollow"/"ugc" from the rel attribute of onebox links.
  #
  # At most SiteSetting.max_oneboxes_per_post distinct URLs are expanded;
  # a URL that was already expanded (per kind) is still processed once the
  # limit is reached.
  def post_process_oneboxes
    limit = SiteSetting.max_oneboxes_per_post
    # urls already handled, tracked separately for full and inline oneboxes
    oneboxes = {}
    inlineOneboxes = {}

    Oneboxer.apply(@doc, extra_paths: [".inline-onebox-loading"]) do |url, element|
      is_onebox = element["class"] == Oneboxer::ONEBOX_CSS_CLASS
      map = is_onebox ? oneboxes : inlineOneboxes
      skip_onebox = limit <= 0 && !map[url]

      if skip_onebox
        # over the limit: leave a plain link behind
        if is_onebox
          element.remove_class('onebox')
        else
          remove_inline_onebox_loading_class(element)
        end

        next
      end

      limit -= 1
      map[url] = true

      if is_onebox
        onebox = Oneboxer.onebox(url,
          invalidate_oneboxes: !!@opts[:invalidate_oneboxes],
          user_id: @post&.user_id,
          category_id: @post&.topic&.category_id
        )

        @has_oneboxes = true if onebox.present?
        onebox
      else
        # inline oneboxes are updated in place, the block yields false
        process_inline_onebox(element)
        false
      end
    end

    oneboxed_images.each do |img|
      next if img["src"].blank?

      src = img["src"].sub(/^https?:/i, "")
      parent = img.parent
      img_classes = (img["class"] || "").split(" ")
      link_classes = ((parent&.name == "a" && parent["class"]) || "").split(" ")

      # image oneboxes get a placeholder when too large or broken,
      # images inside other oneboxes are simply removed
      if img_classes.include?("onebox") || link_classes.include?("onebox")
        next if add_image_placeholder!(img)
      elsif large_images.include?(src) || broken_images.include?(src)
        img.remove
        next
      end

      # use the locally downloaded copy of the image when there is one
      upload_id = downloaded_images[src]
      upload = Upload.find_by_id(upload_id) if upload_id

      if upload.present?
        img["src"] = UrlHelper.cook_url(upload.url, secure: @post.with_secure_media?)
      end

      # make sure we grab dimensions for oneboxed images
      # and wrap in a div
      limit_size!(img)

      next if img["class"]&.include?('onebox-avatar')

      # look past a wrapping link to find the container of the image
      parent = parent&.parent if parent&.name == "a"
      parent_class = parent && parent["class"]
      width = img["width"].to_i
      height = img["height"].to_i

      if parent_class&.include?("onebox-body") && width > 0 && height > 0
        # special instruction for width == height, assume we are dealing with an avatar
        if (img["width"].to_i == img["height"].to_i)
          # only applies inside an "allowlistedgeneric" ancestor
          found = false
          parent = img
          while parent = parent.parent
            if parent["class"] && parent["class"].include?("allowlistedgeneric")
              found = true
              break
            end
          end

          if found
            img["class"] = img["class"].to_s + " onebox-avatar"
            next
          end
        end

        if width < 64 && height < 64
          img["class"] = img["class"].to_s + " onebox-full-image"
        else
          # wrap the image in a div that carries its aspect ratio
          img.delete('width')
          img.delete('height')
          new_parent = img.add_next_sibling("<div class='aspect-image' style='--aspect-ratio:#{width}/#{height};'/>")
          new_parent.first.add_child(img)
        end
      elsif (parent_class&.include?("instagram-images") || parent_class&.include?("tweet-images") || parent_class&.include?("scale-images")) && width > 0 && height > 0
        # the existing container carries the aspect ratio
        img.remove_attribute("width")
        img.remove_attribute("height")
        parent["class"] = "aspect-image-full-size"
        parent["style"] = "--aspect-ratio:#{width}/#{height};"
      end
    end

    # drop nofollow/ugc from onebox links when nofollow does not apply
    if @omit_nofollow || !SiteSetting.add_rel_nofollow_to_user_content
      @doc.css(".onebox-body a[rel], .onebox a[rel]").each do |a|
        rel_values = a['rel'].split(' ').map(&:downcase)
        rel_values.delete('nofollow')
        rel_values.delete('ugc')
        if rel_values.blank?
          a.remove_attribute("rel")
        else
          a["rel"] = rel_values.join(' ')
        end
      end
    end
  end

  # Passes the href and data-download-href of every link, and the src and
  # data-small-upload of every image, through UrlHelper.cook_url. Image URLs
  # are cooked with the post's secure media flag.
  def optimize_urls
    link_attributes = %w{href data-download-href}
    link_attributes.each do |attribute|
      @doc.css("a[#{attribute}]").each do |link|
        link[attribute] = UrlHelper.cook_url(link[attribute].to_s)
      end
    end

    image_attributes = %w{src data-small-upload}
    image_attributes.each do |attribute|
      @doc.css("img[#{attribute}]").each do |image|
        image[attribute] = UrlHelper.cook_url(image[attribute].to_s, secure: @post.with_secure_media?)
      end
    end
  end

  # Removes the "u" query parameter from every link that points at this site
  # (same hostname as Discourse.current_hostname).
  #
  # Links whose href cannot be parsed, that point elsewhere, or that carry no
  # truthy "u" parameter are left untouched. The remaining parameters are
  # re-serialized with Rack::Utils.build_nested_query so that keys and values
  # are escaped again and nested parameters keep their structure; joining the
  # decoded pairs by hand would corrupt values containing "&", "=" or "#".
  def remove_user_ids
    @doc.css("a[href]").each do |a|
      uri = begin
        URI(a["href"])
      rescue URI::Error
        next
      end
      next if uri.hostname != Discourse.current_hostname

      query = Rack::Utils.parse_nested_query(uri.query)
      next if !query.delete("u")

      # an empty query string becomes nil so that no trailing "?" is left
      uri.query = Rack::Utils.build_nested_query(query).presence
      a["href"] = uri.to_s
    end
  end

  # Delegates to PrettyText.add_rel_attributes_to_user_content, asking for
  # nofollow only when it is not omitted for this post and the
  # add_rel_nofollow_to_user_content site setting is on.
  def enforce_nofollow
    add_nofollow = @omit_nofollow ? false : SiteSetting.add_rel_nofollow_to_user_content
    PrettyText.add_rel_attributes_to_user_content(@doc, add_nofollow)
  end

  # (Re)schedules the :pull_hotlinked_images job for this post, to run one
  # second after the editing grace period, unless the
  # :skip_pull_hotlinked_images option is set.
  def pull_hotlinked_images
    return if @opts[:skip_pull_hotlinked_images]

    # have we enough disk space?
    disable_if_low_on_disk_space # But still enqueue the job

    job_name = :pull_hotlinked_images

    # make sure no other job is scheduled
    Jobs.cancel_scheduled_job(job_name, post_id: @post.id)

    # schedule the job
    delay_in_seconds = (SiteSetting.editing_grace_period + 1).seconds.to_i
    Jobs.enqueue_in(delay_in_seconds, job_name, post_id: @post.id)
  end

  # Turns the download_remote_images_to_local site setting off when
  # available_disk_space is below download_remote_images_threshold, logs the
  # change as a staff action by the system user and notifies the site contact.
  #
  # Does nothing when the store is external or when the setting is already off.
  def disable_if_low_on_disk_space
    return if Discourse.store.external? || !SiteSetting.download_remote_images_to_local
    return if available_disk_space >= SiteSetting.download_remote_images_threshold

    SiteSetting.download_remote_images_to_local = false

    # log the site setting change
    reason = I18n.t("disable_remote_images_download_reason")
    StaffActionLogger
      .new(Discourse.system_user)
      .log_site_setting_change("download_remote_images_to_local", true, false, details: reason)

    # also send a private message to the site contact user
    notify_about_low_disk_space
  end

  # Sends the :download_remote_images_disabled system message to the site
  # contact user.
  def notify_about_low_disk_space
    recipient = Discourse.site_contact_user
    SystemMessage.create_from_system_user(recipient, :download_remote_images_disabled)
  end

  # 100 minus the value DiskSpace.percent_free reports for the public/uploads
  # directory under Rails.root.
  def available_disk_space
    uploads_path = "#{Rails.root}/public/uploads"
    100 - DiskSpace.percent_free(uploads_path)
  end

  # True when the processed HTML differs from the cooked HTML the post had
  # when this processor was created.
  def dirty?
    current_html = html
    @previous_cooked != current_html
  end

  # The current document serialized with to_html. `try` is used so that a
  # missing document yields nil instead of raising.
  def html
    @doc.try(:to_html)
  end

  private

  # For every extracted image: put a placeholder in its place when it is a
  # known large/broken image, otherwise convert it (resize, thumbnails,
  # lightbox).
  def post_process_images
    extract_images.each do |img|
      next if add_image_placeholder!(img)

      convert_to_link!(img)
    end
  end

  # Resolves the inline onebox for the link +element+. When a title is found,
  # the link's children are replaced by the HTML-escaped title and the
  # "inline-onebox" class is added. The loading class is removed in all cases.
  def process_inline_onebox(element)
    href = element.attributes["href"].value

    inline_onebox = InlineOneboxer.lookup(
      href,
      invalidate: !!@opts[:invalidate_oneboxes],
      user_id: @post&.user_id,
      category_id: @post&.topic&.category_id
    )

    title = inline_onebox&.dig(:title)
    if title
      element.children = CGI.escapeHTML(title)
      element.add_class("inline-onebox")
    end

    remove_inline_onebox_loading_class(element)
  end

  # Removes the "inline-onebox-loading" class from +element+.
  def remove_inline_onebox_loading_class(element)
    loading_class = "inline-onebox-loading"
    element.remove_class(loading_class)
  end

  # True when the path of the image's src ends with the ".svg" extension,
  # false for any other path, and nil when the src cannot be parsed as a URI
  # or has no path.
  def is_svg?(img)
    path = URI(img["src"]).path
    return nil unless path

    File.extname(path) == '.svg'
  rescue URI::Error
    nil
  end

end
-												DEV: enable frozen string literal on all files

This reduces chances of errors where consumers of strings mutate inputs
and reduces memory usage of the app.

Test suite passes now, but there may be some stuff left, so we will run
a few sites on a branch prior to merging

											
										
										
											2019-05-02 18:17:27 -04:00
+								# frozen_string_literal: true
-												removed auto_link_images_wider_than setting

											
										
										
											2013-07-06 13:10:53 -04:00
+								# Post processing that we can do after a post has already been cooked.
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								# For example, inserting the onebox content, or image sizes/thumbnails.
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
 								class CookedPostProcessor
-												PERF: Improve quality of `PostSearchData#raw_data`. (#7275)

This commit fixes the follow quality issue with `PostSearchData#raw_data`:

1. URLs are being tokenized and links with similar href and characters
are being duplicated in the raw data.

`Post#cooked`:

```
<p><a href=\"https://meta.discourse.org/some.png\" class=\"onebox\" target=\"_blank\" rel=\"nofollow noopener\">https://meta.discourse.org/some.png</a></p>
```

`PostSearchData#raw_data` Before:

```
This is a test topic 0 Uncategorized https://meta.discourse.org/some.png discourse org/some png https://meta.discourse.org/some.png discourse org/some png
```

`PostSearchData#raw_data` After:

```
This is a test topic 0 Uncategorized https://meta.discourse.org/some.png meta discourse org
```

2. Lightbox content being included in search pollutes the
`PostSearchData#raw_data` unnecessarily.

From 28 March 2018 to 28 March 2019, searches for the term `image` on
`meta.discourse.org` had a click through rate of 2.1%. Non-lightboxed images are not included in indexing for search yet we were indexing content within a lightbox. Also, search for terms like `image` was affected because we were using `Pasted image` as the filename for
uploads that were pasted.

`Post#cooked`

```
<p>Let me see how I can fix this image<br>\n<div class=\"lightbox-wrapper\"><a class=\"lightbox\" href=\"https://meta.discourse.org/some.png\" title=\"some.png\" rel=\"nofollow noopener\"><img src=\"https://meta.discourse.org/some.png\" width=\"275\" height=\"299\"><div class=\"meta\">\n<svg class=\"fa d-icon d-icon-far-image svg-icon\" aria-hidden=\"true\"><use xlink:href=\"#far-image\"></use></svg><span class=\"filename\">some.png</span><span class=\"informations\">1750×2000</span><svg class=\"fa d-icon d-icon-discourse-expand svg-icon\" aria-hidden=\"true\"><use xlink:href=\"#discourse-expand\"></use></svg>\n</div></a></div></p>
```

`PostSearchData#raw_data` Before:

```
This is a test topic 0 Uncategorized Let me see how I can fix this image some.png png https://meta.discourse.org/some.png discourse org/some png some.png png 1750×2000
```

`PostSearchData#raw_data` After:

```
This is a test topic 0 Uncategorized Let me see how I can fix this image
```

In terms of indexing performance, we now have to parse the given HTML
through nokogiri twice. However performance is not a huge worry here since a string length of 194170 takes only 30ms
to scrub plus the indexing takes place in a background job.
											
										
										
											2019-03-31 22:14:29 -04:00
+								  LIGHTBOX_WRAPPER_CSS_CLASS = "lightbox-wrapper"
-												FEATURE: Show a blurry preview when lazy loading images

This generates a 10x10 PNG thumbnail for each lightboxed image.
If Image Lazy Loading is enabled (IntersectionObserver API) then
we'll load the low res version when offscreen. As the image scrolls
in we'll swap it for the high res version.

We use a WeakMap to track the old image attributes. It's much less
memory than storing them as `data-*` attributes and swapping them
back and forth all the time.

											
										
										
											2018-12-14 17:44:38 -05:00
+								  LOADING_SIZE = 10
 								  LOADING_COLORS = 32
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the limit had been reached, none of the oneboxes were
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
-												UX: generic onebox treats all square images as avatars and renders them smaller

											
										
										
											2017-11-12 19:19:06 -05:00
+								  attr_reader :cooking_options, :doc
-												FIX: `nofollow` was being added during post processing when it shouldn't

											
										
										
											2016-08-12 15:28:54 -04:00
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
+								  def initialize(post, opts = {})
 								    @dirty = false
 								    @opts = opts
 								    @post = post
-												make sure assets always use schemaless absolute uris

											
										
										
											2013-12-06 05:16:13 -05:00
+								    @previous_cooked = (@post.cooked || "").dup
-												FIX: timing issue with edits and cook post processing

											
										
										
											2015-09-29 12:51:26 -04:00
+								    # NOTE: we re-cook the post here in order to prevent timing issues with edits
 								    # cf. https://meta.discourse.org/t/edit-of-rebaked-post-doesnt-show-in-html-only-in-raw/33815/6
-												FIX: onebox links should respect nofollow settings

											
										
										
											2015-12-03 15:01:18 -05:00
+								    @cooking_options = post.cooking_options || opts[:cooking_options] || {}
-												Re-add option that was removed by mistake in https://github.com/discourse/discourse/commit/482013a1d4060e69cf78773892f13ef2d8220742.

											
										
										
											2018-11-26 01:23:56 -05:00
+								    @cooking_options[:topic_id] = post.topic_id
-												FIX: onebox links should respect nofollow settings

											
										
										
											2015-12-03 15:01:18 -05:00
+								    @cooking_options = @cooking_options.symbolize_keys
-												FEATURE: New "First Onebox" badge

											
										
										
											2016-04-12 14:09:59 -04:00
-												FIX: blank cooked markdown could raise an exception in logs

Previously if somehow a user created a blank markdown document using tag
tricks (eg `<p></p><p></p><p></p><p></p><p></p><p></p>`) and so on, we would
completely strip the document down to blank on post process due to onebox
hack.

Needs a followup cause I am still unclear about the reason for empty p stripping
and it can cause some unclear cases when we re-cook posts.

											
										
										
											2020-01-28 19:37:04 -05:00
+								    cooked = post.cook(post.raw, @cooking_options)
-												FEATURE: Nokogumbo (#9577)

* FEATURE: Nokogumbo

Use Nokogumbo HTML parser.
											
										
										
											2020-05-04 23:46:57 -04:00
+								    @doc = Nokogiri::HTML5::fragment(cooked)
-												FIX: Improve Onebox detection (#8019)

Follow-up to 7c83d2eeb261ac676a8320e6a704752c56fd242e.
											
										
										
											2019-09-10 06:59:48 -04:00
+								    @has_oneboxes = post.post_analyzer.found_oneboxes?
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
+								    @size_cache = {}
-												FEATURE: Show a blurry preview when lazy loading images

This generates a 10x10 PNG thumbnail for each lightboxed image.
If Image Lazy Loading is enabled (IntersectionObserver API) then
we'll load the low res version when offscreen. As the image scrolls
in we'll swap it for the high res version.

We use a WeakMap to track the old image attributes. It's much less
memory than storing them as `data-*` attributes and swapping them
back and forth all the time.

											
										
										
											2018-12-14 17:44:38 -05:00
 								    @disable_loading_image = !!opts[:disable_loading_image]
-												FIX: respect `tl3 links no follow` setting (#8232)


											
										
										
											2019-10-22 13:11:04 -04:00
+								    @omit_nofollow = post.omit_nofollow?
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
+								  end
-												DEV: Remove `bypass_bump` from CookedPostProcessor (#9468)

It was only passing it along to `PullHotlinkedImages` and that class have not used that arg since April 2014 (https://github.com/discourse/discourse/commit/c52ee665b45241a89b4de8b916860f380ecf0141)
											
										
										
											2020-04-20 21:48:19 -04:00
+								  def post_process(new_post: false)
-												FEATURE: allow post process mutex to be held longer

Previously we would only hold the post process mutex for 1 minute, that is
not enough when processing a post with lots of images. This raises the bar
to 10 minutes.

It also cleans up error reporting around distributed mutexes expiring. We
used to double report.

											
										
										
											2019-08-04 21:57:35 -04:00
+								    DistributedMutex.synchronize("post_process_#{@post.id}", validity: 10.minutes) do
-												FEATURE: add :before_post_process_cooked hook

Also reduce amount of image downloading

											
										
										
											2017-10-16 23:17:00 -04:00
+								      DiscourseEvent.trigger(:before_post_process_cooked, @doc, @post)
-												FIX: remove full quote on direct replies when "typographed"

Use the cooked version of the post and the quote to compare their content in
order to take into account the "typographer" option of the markdown pipeline.

											
										
										
											2019-05-15 11:49:29 -04:00
+								      remove_full_quote_on_direct_reply if new_post
-												FIX: serialize post processing

This avoids all sorts of nasty race conditions in the job scheduler

											
										
										
											2015-08-13 23:05:13 -04:00
+								      post_process_oneboxes
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								      post_process_images
-												FEATURE: Add `quote-modified` class if a quote has been modified

											
										
										
											2018-03-13 13:07:51 -04:00
+								      post_process_quotes
-												FIX: serialize post processing

This avoids all sorts of nasty race conditions in the job scheduler

											
										
										
											2015-08-13 23:05:13 -04:00
+								      optimize_urls
-												FEATURE: Remove user IDs from internal URLs. (#7406)


											
										
										
											2019-04-22 22:45:41 -04:00
+								      remove_user_ids
-												Small re-organization of CookedPostProcessor workflow

- only 'limit_size!' of oneboxed images once
- update post image at the end
- move 'enforce_nofollow' in its own method
											
										
										
											2017-10-23 12:15:51 -04:00
+								      update_post_image
-												fix the build
											
										
										
											2017-10-23 13:09:38 -04:00
+								      enforce_nofollow
-												DEV: Remove `bypass_bump` from CookedPostProcessor (#9468)

It was only passing it along to `PullHotlinkedImages` and that class has not used that arg since April 2014 (https://github.com/discourse/discourse/commit/c52ee665b45241a89b4de8b916860f380ecf0141)
											
										
										
											2020-04-20 21:48:19 -04:00
+								      pull_hotlinked_images
-												Remove `UserFirst` table and grant Emoji badge directly

											
										
										
											2016-04-07 12:27:26 -04:00
+								      grant_badges
-												Always link post to uploads in post process.

The operation is cheap anyway so no point skipping.

											
										
										
											2018-09-06 02:08:03 -04:00
+								      @post.link_post_uploads(fragments: @doc)
-												FEATURE: post_process_cooked event

											
										
										
											2017-06-23 14:35:10 -04:00
+								      DiscourseEvent.trigger(:post_process_cooked, @doc, @post)
 								      nil
-												FEATURE: Two new badges - First Emoji and First Mention

											
										
										
											2016-04-05 15:12:02 -04:00
+								    end
 								  end
-												FIX: Don't count emojis within quotes

											
										
										
											2016-04-06 12:02:18 -04:00
+								  def has_emoji?
 								    (@doc.css("img.emoji") - @doc.css(".quote img")).size > 0
 								  end
-												Remove `UserFirst` table and grant Emoji badge directly

											
										
										
											2016-04-07 12:27:26 -04:00
+								  def grant_badges
-												FIX: Various fixes to support posts with no user (#8877)

* Do not grant badges for posts with no user
* Ensure instructions are correct in Change Owner modal
* Hide user-dependent actions from posts with no user
* Make PostRevisor work with posts with no user
* Ensure posts with no user can be deleted
* discourse-narrative-bot should ignore posts with no user
* Skip TopicLink creation for posts with no user
											
										
										
											2020-03-11 08:03:20 -04:00
+								    return if @post.user.blank? || !Guardian.new.can_see?(@post)
-												FIX: Don't create user first records on private posts

											
										
										
											2016-04-05 16:13:10 -04:00
-												FIX: New badges were missing post link

											
										
										
											2016-04-13 16:38:24 -04:00
+								    BadgeGranter.grant(Badge.find(Badge::FirstEmoji), @post.user, post_id: @post.id) if has_emoji?
 								    BadgeGranter.grant(Badge.find(Badge::FirstOnebox), @post.user, post_id: @post.id) if @has_oneboxes
-												FIX: FirstReplyByEmail badge wasn't granted

DEPRECATED: PostProcess badge trigger

											
										
										
											2016-08-10 13:24:01 -04:00
+								    BadgeGranter.grant(Badge.find(Badge::FirstReplyByEmail), @post.user, post_id: @post.id) if @post.is_reply_by_email?
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
+								  end
-												FEATURE: Add `quote-modified` class if a quote has been modified

											
										
										
											2018-03-13 13:07:51 -04:00
+								  def post_process_quotes
 								    @doc.css("aside.quote").each do |q|
 								      post_number = q['data-post']
 								      topic_id = q['data-topic']
 								      if topic_id && post_number
 								        comparer = QuoteComparer.new(
 								          topic_id.to_i,
 								          post_number.to_i,
 								          q.css('blockquote').text
 								        )
 								        if comparer.modified?
 								          q['class'] = ((q['class'] || '') + " quote-modified").strip
 								        end
 								      end
 								    end
 								  end
-												FIX: remove full quote on direct replies when "typographed"

Use the cooked version of the post and the quote to compare their content in
order to take into account the "typographer" option of the markdown pipeline.

											
										
										
											2019-05-15 11:49:29 -04:00
+								  def remove_full_quote_on_direct_reply
 								    return if !SiteSetting.remove_full_quote
 								    return if @post.post_number == 1
-												FIX: Remove full nested quotes on direct reply (#8581)

It used to check how many quotes were inside a post, without
considering that some quotes can contain other quotes. This commit
selects only top level quotes.

I had to use XPath because I could not find an equivalent CSS
selector.
											
										
										
											2019-12-20 03:24:34 -05:00
+								    return if @doc.xpath("aside[contains(@class, 'quote')]").size != 1
-												FEATURE: Remove full quotes of direct replies. (#6729)


											
										
										
											2018-12-07 07:07:11 -05:00
-												FIX: remove full quote on direct replies when "typographed"

Use the cooked version of the post and the quote to compare their content in
order to take into account the "typographer" option of the markdown pipeline.

											
										
										
											2019-05-15 11:49:29 -04:00
+								    previous = Post
 								      .where("post_number < ? AND topic_id = ? AND post_type = ? AND NOT hidden", @post.post_number, @post.topic_id, Post.types[:regular])
 								      .order("post_number DESC")
 								      .limit(1)
 								      .pluck(:cooked)
 								      .first
-												FEATURE: Remove full quotes of direct replies. (#6729)


											
										
										
											2018-12-07 07:07:11 -05:00
-												FIX: remove full quote on direct replies when "typographed"

Use the cooked version of the post and the quote to compare their content in
order to take into account the "typographer" option of the markdown pipeline.

											
										
										
											2019-05-15 11:49:29 -04:00
+								    return if previous.blank?
-												FEATURE: Remove full quotes of direct replies. (#6729)


											
										
										
											2018-12-07 07:07:11 -05:00
-												FEATURE: Nokogumbo (#9577)

* FEATURE: Nokogumbo

Use Nokogumbo HTML parser.
											
										
										
											2020-05-04 23:46:57 -04:00
+								    previous_text = Nokogiri::HTML5::fragment(previous).text.strip
-												FIX: handle clicks counters in full quotes

											
										
										
											2019-05-17 08:17:29 -04:00
+								    quoted_text = @doc.css("aside.quote:first-child blockquote").first&.text&.strip || ""
 								    return if previous_text.gsub(/(\s){2,}/, '\1') != quoted_text.gsub(/(\s){2,}/, '\1')
-												FIX: remove full quote on direct replies when "typographed"

Use the cooked version of the post and the quote to compare their content in
order to take into account the "typographer" option of the markdown pipeline.

											
										
										
											2019-05-15 11:49:29 -04:00
-												FIX: Remove full nested quotes on direct reply (#8581)

It used to check how many quotes were inside a post, without
considering that some quotes can contain other quotes. This commit
selects only top level quotes.

I had to use XPath because I could not find an equivalent CSS
selector.
											
										
										
											2019-12-20 03:24:34 -05:00
+								    quote_regexp = /\A\s*\[quote.+\[\/quote\]/im
-												FIX: remove full quote on direct replies when "typographed"

Use the cooked version of the post and the quote to compare their content in
order to take into account the "typographer" option of the markdown pipeline.

											
										
										
											2019-05-15 11:49:29 -04:00
+								    quoteless_raw = @post.raw.sub(quote_regexp, "").strip
 								    return if @post.raw.strip == quoteless_raw
-												FEATURE: Remove full quotes of direct replies. (#6729)


											
										
										
											2018-12-07 07:07:11 -05:00
 								    PostRevisor.new(@post).revise!(
 								      Discourse.system_user,
 								      {
-												FIX: remove full quote on direct replies when "typographed"

Use the cooked version of the post and the quote to compare their content in
order to take into account the "typographer" option of the markdown pipeline.

											
										
										
											2019-05-15 11:49:29 -04:00
+								        raw: quoteless_raw,
-												FEATURE: Remove full quotes of direct replies. (#6729)


											
										
										
											2018-12-07 07:07:11 -05:00
+								        edit_reason: I18n.t(:removed_direct_reply_full_quotes)
 								      },
-												* FEATURE: Adds site setting to let quotes on direct replies.

* DEV: Added test.
* FIX: Do not bump topic when removing full quotes.

											
										
										
											2018-12-12 09:42:53 -05:00
+								      skip_validations: true,
 								      bypass_bump: true
-												FEATURE: Remove full quotes of direct replies. (#6729)


											
										
										
											2018-12-07 07:07:11 -05:00
+								    )
 								  end
-												FIX: Do not add lightbox to onebox images (#6479)


											
										
										
											2018-10-10 17:57:21 -04:00
+								  def add_image_placeholder!(img)
 								    src = img["src"].sub(/^https?:/i, "")
 								    if large_images.include?(src)
 								      return add_large_image_placeholder!(img)
 								    elsif broken_images.include?(src)
 								      return add_broken_image_placeholder!(img)
 								    end
 								    false
 								  end
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								  def add_large_image_placeholder!(img)
 								    url = img["src"]
 								    is_hyperlinked = is_a_hyperlink?(img)
 								    placeholder = create_node("div", "large-image-placeholder")
 								    img.add_next_sibling(placeholder)
 								    placeholder.add_child(img)
 								    a = create_link_node(nil, url, true)
 								    img.add_next_sibling(a)
 								    span = create_span_node("url", url)
 								    a.add_child(span)
-												Upgrade to FontAwesome 5 (take two) (#6673)

* Add missing icons to set

* Revert FA5 revert

 This reverts commit 42572ff

* use new SVG syntax in locales

* Noscript page changes (remove login button, center "powered by" footer text)

* Cast wider net for SVG icons in settings

- include any _icon setting for SVG registry (offers better support for plugin settings)

- let themes store multiple pipe-delimited icons in a setting

- also replaces broken onebox image icon with SVG reference in cooked post processor

* interpolate icons in locales

* Fix composer whisper icon alignment

* Add support for stacked icons

* SECURITY: enforce hostname to match discourse hostname

This ensures that the hostname rails uses for various helpers always matches
the Discourse hostname

* load SVG sprite with pre-initializers

* FIX: enable caching on SVG sprites

* PERF: use JSONP for SVG sprites so they are served from CDN

This avoids needing to deal with CORS for loading of the SVG

Note, added the svg- prefix to the filename so we can quickly tell in
dev tools what the file is

* Add missing SVG sprite JSONP script to CSP

* Upgrade to FA 5.5.0

* Add support for all FA4.7 icons

- adds complete frontend and backend for renamed FA4.7 icons

- improves performance of SvgSprite.bundle and SvgSprite.all_icons

* Fix group avatar flair preview

- adds an endpoint at /svg-sprites/search/:keyword

- adds frontend ajax call that pulls icon in avatar flair preview even when it is not in subset

* Remove FA 4.7 font files

											
										
										
											2018-11-26 16:49:57 -05:00
+								    span.add_previous_sibling(create_icon_node("far-image"))
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								    span.add_next_sibling(create_span_node("help", I18n.t("upload.placeholders.too_large", max_size_kb: SiteSetting.max_image_size_kb)))
 								    # Only if the image is already linked
 								    if is_hyperlinked
 								      parent = placeholder.parent
 								      parent.add_next_sibling(placeholder)
-												FIX: Duplicate a tag if image url is same to href

											
										
										
											2017-11-15 07:06:48 -05:00
+								      if parent.name == 'a' && parent["href"].present?
 								        if url == parent["href"]
 								          parent.remove
 								        else
 								          parent["class"] = "link"
 								          a.add_previous_sibling(parent)
 								          lspan = create_span_node("url", parent["href"])
 								          parent.add_child(lspan)
 								          lspan.add_previous_sibling(create_icon_node("link"))
 								        end
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								      end
 								    end
 								    img.remove
-												FIX: Do not add lightbox to onebox images (#6479)


											
										
										
											2018-10-10 17:57:21 -04:00
+								    true
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								  end
 								  def add_broken_image_placeholder!(img)
 								    img.name = "span"
-												Upgrade to FontAwesome 5 (take two) (#6673)

* Add missing icons to set

* Revert FA5 revert

 This reverts commit 42572ff

* use new SVG syntax in locales

* Noscript page changes (remove login button, center "powered by" footer text)

* Cast wider net for SVG icons in settings

- include any _icon setting for SVG registry (offers better support for plugin settings)

- let themes store multiple pipe-delimited icons in a setting

- also replaces broken onebox image icon with SVG reference in cooked post processor

* interpolate icons in locales

* Fix composer whisper icon alignment

* Add support for stacked icons

* SECURITY: enforce hostname to match discourse hostname

This ensures that the hostname rails uses for various helpers always matches
the Discourse hostname

* load SVG sprite with pre-initializers

* FIX: enable caching on SVG sprites

* PERF: use JSONP for SVG sprites so they are served from CDN

This avoids needing to deal with CORS for loading of the SVG

Note, added the svg- prefix to the filename so we can quickly tell in
dev tools what the file is

* Add missing SVG sprite JSONP script to CSP

* Upgrade to FA 5.5.0

* Add support for all FA4.7 icons

- adds complete frontend and backend for renamed FA4.7 icons

- improves performance of SvgSprite.bundle and SvgSprite.all_icons

* Fix group avatar flair preview

- adds an endpoint at /svg-sprites/search/:keyword

- adds frontend ajax call that pulls icon in avatar flair preview even when it is not in subset

* Remove FA 4.7 font files

											
										
										
											2018-11-26 16:49:57 -05:00
+								    img.set_attribute("class", "broken-image")
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								    img.set_attribute("title", I18n.t("post.image_placeholder.broken"))
-												Upgrade to FontAwesome 5 (take two) (#6673)

* Add missing icons to set

* Revert FA5 revert

 This reverts commit 42572ff

* use new SVG syntax in locales

* Noscript page changes (remove login button, center "powered by" footer text)

* Cast wider net for SVG icons in settings

- include any _icon setting for SVG registry (offers better support for plugin settings)

- let themes store multiple pipe-delimited icons in a setting

- also replaces broken onebox image icon with SVG reference in cooked post processor

* interpolate icons in locales

* Fix composer whisper icon alignment

* Add support for stacked icons

* SECURITY: enforce hostname to match discourse hostname

This ensures that the hostname rails uses for various helpers always matches
the Discourse hostname

* load SVG sprite with pre-initializers

* FIX: enable caching on SVG sprites

* PERF: use JSONP for SVG sprites so they are served from CDN

This avoids needing to deal with CORS for loading of the SVG

Note, added the svg- prefix to the filename so we can quickly tell in
dev tools what the file is

* Add missing SVG sprite JSONP script to CSP

* Upgrade to FA 5.5.0

* Add support for all FA4.7 icons

- adds complete frontend and backend for renamed FA4.7 icons

- improves performance of SvgSprite.bundle and SvgSprite.all_icons

* Fix group avatar flair preview

- adds an endpoint at /svg-sprites/search/:keyword

- adds frontend ajax call that pulls icon in avatar flair preview even when it is not in subset

* Remove FA 4.7 font files

											
										
										
											2018-11-26 16:49:57 -05:00
+								    img << "<svg class=\"fa d-icon d-icon-unlink svg-icon\" aria-hidden=\"true\"><use xlink:href=\"#unlink\"></use></svg>"
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								    img.remove_attribute("src")
 								    img.remove_attribute("width")
 								    img.remove_attribute("height")
-												FIX: Do not add lightbox to onebox images (#6479)


											
										
										
											2018-10-10 17:57:21 -04:00
+								    true
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								  end
 								  def large_images
-												REFACTOR: Refactor pull_hotlinked_images job

This commit should cause no functional change
- Split into functions to avoid deep nesting
- Register custom field type, and remove manual json parse/serialize
- Recover from deleted upload records

Also adds a test to ensure pull_hotlinked_images redownloads secure images only once
											
										
										
											2020-08-05 07:14:59 -04:00
+								    @large_images ||= @post.custom_fields[Post::LARGE_IMAGES].presence || []
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								  end
 								  def broken_images
-												REFACTOR: Refactor pull_hotlinked_images job

This commit should cause no functional change
- Split into functions to avoid deep nesting
- Register custom field type, and remove manual json parse/serialize
- Recover from deleted upload records

Also adds a test to ensure pull_hotlinked_images redownloads secure images only once
											
										
										
											2020-08-05 07:14:59 -04:00
+								    @broken_images ||= @post.custom_fields[Post::BROKEN_IMAGES].presence || []
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								  end
 								  def downloaded_images
-												FIX: Link post to uploads in `PostCreator`.

* This ensures that uploads are linked to their post on creation
  instead of a background job which may be delayed if Sidekiq
  is facing difficulties.

											
										
										
											2018-09-05 21:58:01 -04:00
+								    @downloaded_images ||= @post.downloaded_images
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								  end
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								  def extract_images
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								    # all images with a src attribute
-												BUGFIX: errors when post-processing 'data images'

											
										
										
											2014-07-18 11:54:18 -04:00
+								    @doc.css("img[src]") -
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								    # minus data images
-												BUGFIX: errors when post-processing 'data images'

											
										
										
											2014-07-18 11:54:18 -04:00
+								    @doc.css("img[src^='data']") -
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								    # minus emojis
-												FIX: Optimize images in Onebox (#8471)

This commit ensures that images in Onebox are being optimized, but not
converted to lightbox too.
											
										
										
											2019-12-09 08:39:25 -05:00
+								    @doc.css("img.emoji")
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								  end
-												FEATURE: include post image in OpenGraph image tag

											
										
										
											2016-10-31 05:41:33 -04:00
+								  def extract_images_for_post
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								    # all images with a src attribute
-												FIX: use the first image in the first post in the topic as opengraph image
FEATURE: new 'default_opengraph_image_url' setting

											
										
										
											2015-10-15 05:00:47 -04:00
+								    @doc.css("img[src]") -
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								    # minus emojis
-												FIX: use the first image in the first post in the topic as opengraph image
FEATURE: new 'default_opengraph_image_url' setting

											
										
										
											2015-10-15 05:00:47 -04:00
+								    @doc.css("img.emoji") -
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								    # minus images inside quotes
-												FIX: Remove post/topic image_url on post edits

- resets image_url when image is removed from first post on edit
- excludes onebox icons from being featured as topic/post images

											
										
										
											2020-02-06 11:19:40 -05:00
+								    @doc.css(".quote img") -
 								    # minus onebox site icons
-												UX: Do not use small onebox images as post/topic images

											
										
										
											2020-05-14 13:01:43 -04:00
+								    @doc.css("img.site-icon") -
 								    # minus onebox avatars
 								    @doc.css("img.onebox-avatar") -
 								    # minus small onebox images (large images are .aspect-image-full-size)
 								    @doc.css(".onebox .aspect-image img")
-												FIX: use the first image in the first post in the topic as opengraph image
FEATURE: new 'default_opengraph_image_url' setting

											
										
										
											2015-10-15 05:00:47 -04:00
+								  end
-												FEATURE: grab oneboxed image dimensions to prevent 'jiggles' while loading

											
										
										
											2014-07-21 09:59:34 -04:00
+								  def oneboxed_images
-												FIX: Onebox images are not downloaded locally without css class

											
										
										
											2018-07-31 17:21:02 -04:00
+								    @doc.css(".onebox-body img, .onebox img, img.onebox")
-												FEATURE: pull onebox images

											
										
										
											2017-06-02 05:39:06 -04:00
+								  end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								  def limit_size!(img)
-												FIX stretched thumbnails

											
										
										
											2013-11-25 12:36:13 -05:00
+								    # retrieve the size from
 								    #  1) the width/height attributes
 								    #  2) the dimension from the preview (image_sizes)
 								    #  3) the dimension of the original image (HTTP request)
 								    w, h = get_size_from_attributes(img) ||
 								           get_size_from_image_sizes(img["src"], @opts[:image_sizes]) ||
 								           get_size(img["src"])
-												REFACTOR: Migrate markdown functionality in ES6

											
										
										
											2016-06-14 14:31:51 -04:00
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    # limit the size of the thumbnail
 								    img["width"], img["height"] = ImageSizer.resize(w, h)
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								  end
-												FIX stretched thumbnails

											
										
										
											2013-11-25 12:36:13 -05:00
+								  def get_size_from_attributes(img)
 								    w, h = img["width"].to_i, img["height"].to_i
-												FIX: rescale image during cooked_post_processor when only img height or width is specified

											
										
										
											2015-08-29 17:56:25 -04:00
+								    return [w, h] unless w <= 0 || h <= 0
 								    # if only width or height are specified attempt to scale image
 								    if w > 0 || h > 0
 								      w = w.to_f
 								      h = h.to_f
-												FIX: `FastImage#size` returns `nil` if it can't fetch the image size.

											
										
										
											2016-03-07 22:29:18 -05:00
 								      return unless original_image_size = get_size(img["src"])
 								      original_width, original_height = original_image_size.map(&:to_f)
-												FIX: rescale image during cooked_post_processor when only img height or width is specified

											
										
										
											2015-08-29 17:56:25 -04:00
+								      if w > 0
 								        ratio = w / original_width
-												FIX: `FastImage#size` returns `nil` if it can't fetch the image size.

											
										
										
											2016-03-07 22:29:18 -05:00
+								        [w.floor, (original_height * ratio).floor]
-												FIX: rescale image during cooked_post_processor when only img height or width is specified

											
										
										
											2015-08-29 17:56:25 -04:00
+								      else
 								        ratio = h / original_height
-												FIX: `FastImage#size` returns `nil` if it can't fetch the image size.

											
										
										
											2016-03-07 22:29:18 -05:00
+								        [(original_width * ratio).floor, h.floor]
-												FIX: rescale image during cooked_post_processor when only img height or width is specified

											
										
										
											2015-08-29 17:56:25 -04:00
+								      end
 								    end
-												FIX stretched thumbnails

											
										
										
											2013-11-25 12:36:13 -05:00
+								  end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								  def get_size_from_image_sizes(src, image_sizes)
 								    return unless image_sizes.present?
 								    image_sizes.each do |image_size|
 								      url, size = image_size[0], image_size[1]
-												FIX: picture would be hidden when [details] block was closed in the composer

											
										
										
											2015-03-16 13:57:15 -04:00
+								      if url && url.include?(src) &&
 								         size && size["width"].to_i > 0 && size["height"].to_i > 0
 								        return [size["width"], size["height"]]
 								      end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    end
-												FIX: get_size_from_image_sizes should return [width, height] or nil (#9298)


											
										
										
											2020-03-28 14:20:51 -04:00
+								    nil
-												cleaned up CookedPostProcessor and improved specs

											
										
										
											2013-06-15 06:29:20 -04:00
+								  end
-												post processor

											
										
										
											2013-02-20 20:07:36 -05:00
-												FEATURE: add support for responsive images in posts

When creating lightboxes we will attempt to create 1.5x and 2x thumbnails
for retina screens, this can be controlled with a new hidden site setting
called responsive_post_image_sizes; if you wish to create 3x images, run

SiteSetting.responsive_post_image_sizes = "1|1.5|2|3"


The default should be good for most of the setups as it balances filesize
with quality. 3x thumbs can get big.

											
										
										
											2018-10-02 23:44:53 -04:00
+								  def add_to_size_cache(url, w, h)
 								    @size_cache[url] = [w, h]
 								  end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								  def get_size(url)
-												Log an error when we can't reach an image to get its dimensions

											
										
										
											2015-08-07 13:31:15 -04:00
+								    return @size_cache[url] if @size_cache.has_key?(url)
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    absolute_url = url
 								    absolute_url = Discourse.base_url_no_prefix + absolute_url if absolute_url =~ /^\/[^\/]/
-												FIX: Don't raise an error when the img attribute cannot be found

											
										
										
											2017-05-08 15:35:31 -04:00
 								    return unless absolute_url
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    # FastImage fails when there's no scheme
-												FIX: S3 upload when using dots in bucket name

											
										
										
											2013-12-16 05:44:59 -05:00
+								    absolute_url = SiteSetting.scheme + ":" + absolute_url if absolute_url.start_with?("//")
-												FIX: Use presigned URL to avoid 403 when pulling hotlinked images for secure media (#8764)

When we were pulling hotlinked images for oneboxes in the CookedPostProcessor, we were using the direct S3 URL, which returned a 403 error and thus did not set widths and heights of the images. We now cook the URL first based on whether the upload is secure before handing off to FastImage.
											
										
										
											2020-01-22 18:31:46 -05:00
 								    # we can't direct FastImage to our secure-media-uploads url because it bounces
 								    # anonymous requests with a 404 error
-												FIX: Resolve pull hotlinked image and broken link issues for secure media URLs (#8777)

When pull_hotlinked_images tried to run on posts with secure media (which had already been downloaded from external sources) we were getting a 404 when trying to download the image because the secure endpoint doesn't allow anon downloads.

Also, we were getting into an infinite loop of pull_hotlinked_images because the job didn't consider the secure media URLs as "downloaded" already so it kept trying to download them over and over.

In this PR I have also refactored secure-media-upload URL checks and mutations into single source of truth in Upload, adding a SECURE_MEDIA_ROUTE constant to check URLs against too.
											
										
										
											2020-01-23 20:59:30 -05:00
+								    if url && Upload.secure_media_url?(url)
 								      absolute_url = Upload.signed_url_from_secure_media_url(absolute_url)
-												FIX: Use presigned URL to avoid 403 when pulling hotlinked images for secure media (#8764)

When we were pulling hotlinked images for oneboxes in the CookedPostProcessor, we were using the direct S3 URL, which returned a 403 error and thus did not set widths and heights of the images. We now cook the URL first based on whether the upload is secure before handing off to FastImage.
											
										
										
											2020-01-22 18:31:46 -05:00
+								    end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    return unless is_valid_image_url?(absolute_url)
-												Log an error when we can't reach an image to get its dimensions

											
										
										
											2015-08-07 13:31:15 -04:00
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    # we can *always* crawl our own images
-												Fix the build.

											
										
										
											2016-03-07 22:38:26 -05:00
+								    return unless SiteSetting.crawl_images? || Discourse.store.has_been_uploaded?(url)
-												Log an error when we can't reach an image to get its dimensions

											
										
										
											2015-08-07 13:31:15 -04:00
-												FIX: images aren't lightboxed anymore (partially reverts 646c6eb7cd781b47663d104de4f37cdd99b465bf)

											
										
										
											2017-10-18 17:54:36 -04:00
+								    @size_cache[url] = FastImage.size(absolute_url)
-												FIX: store the topic links using the cooked upload url

											
										
										
											2018-08-14 06:23:32 -04:00
+								  rescue Zlib::BufError, URI::Error, OpenSSL::SSL::SSLError
-												FIX: rescue login required / broken images

											
										
										
											2018-01-11 11:47:06 -05:00
+								    # FastImage.size raises BufError for some gifs, leave it.
-												keep uploads reverse index up to date

											
										
										
											2013-06-17 16:46:48 -04:00
+								  end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								  def is_valid_image_url?(url)
 								    uri = URI.parse(url)
 								    %w(http https).include? uri.scheme
-												FIX: store the topic links using the cooked upload url

											
										
										
											2018-08-14 06:23:32 -04:00
+								  rescue URI::Error
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
+								  end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								  def convert_to_link!(img)
-												FIX: Perform crop using user-specified image sizes (#9224)

* FIX: Perform crop using user-specified image sizes

It used to resize the images to max width and height first and then
perform the crop operation. This is wrong because it ignored the user
specified image sizes from the Markdown.

* DEV: Use real images in test
											
										
										
											2020-03-26 10:40:00 -04:00
+								    w, h = img["width"].to_i, img["height"].to_i
 								    user_width, user_height = (w > 0 && h > 0 && [w, h]) ||
 								                              get_size_from_attributes(img) ||
 								                              get_size_from_image_sizes(img["src"], @opts[:image_sizes])
 								    limit_size!(img)
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
+								    src = img["src"]
-												UX: Don't add light box for SVG images.

											
										
										
											2018-06-18 05:10:23 -04:00
+								    return if src.blank? || is_a_hyperlink?(img) || is_svg?(img)
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
-												FIX: images aren't lightboxed anymore (partially reverts 646c6eb7cd781b47663d104de4f37cdd99b465bf)

											
										
										
											2017-10-18 17:54:36 -04:00
+								    original_width, original_height = (get_size(src) || [0, 0]).map(&:to_i)
 								    if original_width == 0 || original_height == 0
-												reduce log level when we can't reach an image while cooking a post

											
										
										
											2015-08-12 10:10:42 -04:00
+								      Rails.logger.info "Can't reach '#{src}' to get its dimension."
-												Log an error when we can't reach an image to get its dimensions

											
										
										
											2015-08-07 13:31:15 -04:00
+								      return
 								    end
-												FIX: images aren't lightboxed anymore (partially reverts 646c6eb7cd781b47663d104de4f37cdd99b465bf)

											
										
										
											2017-10-18 17:54:36 -04:00
+								    return if original_width <= SiteSetting.max_image_width && original_height <= SiteSetting.max_image_height
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
-												FIX: Perform crop using user-specified image sizes (#9224)

* FIX: Perform crop using user-specified image sizes

It used to resize the images to max width and height first and then
perform the crop operation. This is wrong because it ignored the user
specified image sizes from the Markdown.

* DEV: Use real images in test
											
										
										
											2020-03-26 10:40:00 -04:00
+								    user_width, user_height = [original_width, original_height] if user_width.to_i <= 0 && user_height.to_i <= 0
 								    width, height = user_width, user_height
 								    crop = SiteSetting.min_ratio_to_crop > 0 && width.to_f / height.to_f < SiteSetting.min_ratio_to_crop
-												FEATURE: new 'min ratio to crop' site setting

											
										
										
											2018-06-05 11:13:00 -04:00
 								    if crop
-												FIX: Perform crop using user-specified image sizes (#9224)

* FIX: Perform crop using user-specified image sizes

It used to resize the images to max width and height first and then
perform the crop operation. This is wrong because it ignored the user
specified image sizes from the Markdown.

* DEV: Use real images in test
											
										
										
											2020-03-26 10:40:00 -04:00
+								      width, height = ImageSizer.crop(width, height)
 								      img["width"], img["height"] = width, height
 								    else
 								      width, height = ImageSizer.resize(width, height)
-												FEATURE: new 'crop_tall_images' site setting

											
										
										
											2016-05-23 10:18:30 -04:00
+								    end
-												FIX: Copying image markdown for secure media loading full image (#9488)

* When copying the markdown for an image between posts, we were not adding the srcset and data-small-image attributes which are done by calling optimize_image! in cooked post processor
* Refactored the code which was confusing in its current state (the consider_for_reuse method was super confusing) and fixed the issue
											
										
										
											2020-04-23 20:29:02 -04:00
+								    upload = Upload.get_from_url(src)
-												FIX: Mitigate issue where legacy pre-secure hotlinked media would not be redownloaded (#8802)

Basically, say you had already downloaded a certain image from a certain URL
using pull_hotlinked_images and the onebox. The upload would be stored
by its sha as an upload record. Whenever you linked to the same URL again
in a post (e.g. in our case an og:image on review.discourse) we would
reuse the original upload record because of the sha1.

However when you turned on secure media this could cause problems as
the first post that uses that upload after secure media is enabled
will set the access control post for the upload to the new post.
Then if the post is deleted every single onebox/link to that same image
URL will fail forever with 403 as the secure-media-uploads URL fails
if the access control post has been deleted.

To fix this when cooking posts and pulling hotlinked images, we only
allow using an original upload by URL if its access control post
matches the current post, and if the original_sha1 is filled in,
meaning it was uploaded AFTER secure media was enabled. otherwise
we just redownload the media again to be safe, as the URL will always
be new then.
											
										
										
											2020-01-28 19:11:38 -05:00
+								    if upload.present?
-												Use an options hash instead of boolean parameters

											
										
										
											2018-12-14 16:50:28 -05:00
+								      upload.create_thumbnail!(width, height, crop: crop)
-												FEATURE: add support for responsive images in posts

When creating lightboxes we will attempt to create 1.5x and 2x thumbnails
for retina screens, this can be controlled with a new hidden site setting
called responsive_post_image_sizes, if you wish to create 3x images run

SiteSetting.responsive_post_image_sizes = "1|1.5|2|3"


The default should be good for most of the setups as it balances filesize
with quality. 3x thumbs can get big.

											
										
										
											2018-10-02 23:44:53 -04:00
 								      each_responsive_ratio do |ratio|
 								        resized_w = (width * ratio).to_i
 								        resized_h = (height * ratio).to_i
 								        if upload.width && resized_w <= upload.width
-												Use an options hash instead of boolean parameters

											
										
										
											2018-12-14 16:50:28 -05:00
+								          upload.create_thumbnail!(resized_w, resized_h, crop: crop)
-												FEATURE: add support for responsive images in posts

When creating lightboxes we will attempt to create 1.5x and 2x thumbnails
for retina screens, this can be controlled with a new hidden site setting
called responsive_post_image_sizes, if you wish to create 3x images run

SiteSetting.responsive_post_image_sizes = "1|1.5|2|3"


The default should be good for most of the setups as it balances filesize
with quality. 3x thumbs can get big.

											
										
										
											2018-10-02 23:44:53 -04:00
+								        end
 								      end
-												FEATURE: Show a blurry preview when lazy loading images

This generates a 10x10 PNG thumbnail for each lightboxed image.
If Image Lazy Loading is enabled (IntersectionObserver API) then
we'll load the low res version when offscreen. As the image scrolls
in we'll swap it for the high res version.

We use a WeakMap to track the old image attributes. It's much less
memory than storing them as `data-*` attributes and swapping them
back and forth all the time.

											
										
										
											2018-12-14 17:44:38 -05:00
 								      unless @disable_loading_image
 								        upload.create_thumbnail!(LOADING_SIZE, LOADING_SIZE, format: 'png', colors: LOADING_COLORS)
 								      end
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								    end
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
-												FIX: Optimize images in Onebox (#8471)

This commit ensures that images in Onebox are being optimized, but not
converted to lightbox too.
											
										
										
											2019-12-09 08:39:25 -05:00
+								    if img.ancestors('.onebox, .onebox-body, .quote').blank? && !img.classes.include?("onebox")
 								      add_lightbox!(img, original_width, original_height, upload, cropped: crop)
 								    end
-												FIX: Mitigate issue where legacy pre-secure hotlinked media would not be redownloaded (#8802)

Basically, say you had already downloaded a certain image from a certain URL
using pull_hotlinked_images and the onebox. The upload would be stored
by its sha as an upload record. Whenever you linked to the same URL again
in a post (e.g. in our case an og:image on review.discourse) we would
reuse the original upload record because of the sha1.

However when you turned on secure media this could cause problems as
the first post that uses that upload after secure media is enabled
will set the access control post for the upload to the new post.
Then if the post is deleted every single onebox/link to that same image
URL will fail forever with 403 as the secure-media-uploads URL fails
if the access control post has been deleted.

To fix this when cooking posts and pulling hotlinked images, we only
allow using an original upload by URL if its access control post
matches the current post, and if the original_sha1 is filled in,
meaning it was uploaded AFTER secure media was enabled. otherwise
we just redownload the media again to be safe, as the URL will always
be new then.
											
										
										
											2020-01-28 19:11:38 -05:00
+								    if upload.present?
 								      optimize_image!(img, upload, cropped: crop)
 								    end
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								  end
-												FEATURE: Show a blurry preview when lazy loading images

This generates a 10x10 PNG thumbnail for each lightboxed image.
If Image Lazy Loading is enabled (IntersectionObserver API) then
we'll load the low res version when offscreen. As the image scrolls
in we'll swap it for the high res version.

We use a WeakMap to track the old image attributes. It's much less
memory than storing them as `data-*` attributes and swapping them
back and forth all the time.

											
										
										
											2018-12-14 17:44:38 -05:00
+								  def loading_image(upload)
 								    # Looks up the LOADING_SIZE x LOADING_SIZE thumbnail of `upload`, i.e.
 								    # the low-res placeholder that convert_to_link! creates unless
 								    # @disable_loading_image is set. Callers treat a falsy result as
 								    # "no placeholder available".
 								    upload.thumbnail(LOADING_SIZE, LOADING_SIZE)
 								  end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								  def is_a_hyperlink?(img)
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
+								    parent = img.parent
 								    while parent
-												FIX markdown hotlinked images were not properly pulled

											
										
										
											2013-11-20 07:10:08 -05:00
+								      return true if parent.name == "a"
-												Exit early when the 'img' is already inside an 'a' tag
											
										
										
											2017-10-23 11:43:53 -04:00
+								      parent = parent.parent if parent.respond_to?(:parent)
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
+								    end
-												FIX markdown hotlinked images were not properly pulled

											
										
										
											2013-11-20 07:10:08 -05:00
+								    false
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								  end
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
-												FEATURE: add support for responsive images in posts

When creating lightboxes we will attempt to create 1.5x and 2x thumbnails
for retina screens, this can be controlled with a new hidden site setting
called responsive_post_image_sizes, if you wish to create 3x images run

SiteSetting.responsive_post_image_sizes = "1|1.5|2|3"


The default should be good for most of the setups as it balances filesize
with quality. 3x thumbs can get big.

											
										
										
											2018-10-02 23:44:53 -04:00
+								  def each_responsive_ratio
 								    # Yields each ratio from the pipe-separated
 								    # SiteSetting.responsive_post_image_sizes value (e.g. "1|1.5|2|3")
 								    # as a Float, in ascending order. Ratios <= 1 are skipped, so only
 								    # the larger-than-1x variants reach the block.
 								    SiteSetting
 								      .responsive_post_image_sizes
 								      .split('|')
 								      .map(&:to_f)
 								      .sort
 								      .each { |r| yield r if r > 1 }
 								  end
-												FIX: Optimize quoted images (#8427)

Only images that were part of a lightbox used to be optimized. This
patch ensures that quoted images are also optimized.
											
										
										
											2019-11-29 08:18:42 -05:00
+								  def optimize_image!(img, upload, cropped: false)
 								    w, h = img["width"].to_i, img["height"].to_i
-												FIX: Secure Upload URLs in lightbox (#8451)

This fixes the following issues:

* The link element on the lightbox which pops open the lightbox was linking to the S3 URL with a private ACL instead of the secure media URL for the image
* Change to use `@post.with_secure_media?` in `CookedPostProcessor` for URL cooking, as in some cases, like when a post is edited and an upload is added, `upload.secure?` can be false which resulted in `srcset` URLs not being cooked correctly to secure media upload urls.

											
										
										
											2019-12-04 18:13:09 -05:00
+								    # note: optimize_urls cooks the src and data-small-upload further after this
-												FIX: Do not optimize animated images in cooked posts (#11214)

CookedPostProcessor replaces all large images with their optimized
versions, but for GIF images the optimized version is limited to first
frame only. This caused animations in cooked posts to require a click
to show up the lightbox and start playing.
											
										
										
											2020-11-12 14:47:30 -05:00
+								    thumbnail = !upload.animated && upload.thumbnail(w, h)
-												FIX: Optimize quoted images (#8427)

Only images that were part of a lightbox used to be optimized. This
patch ensures that quoted images are also optimized.
											
										
										
											2019-11-29 08:18:42 -05:00
+								    if thumbnail && thumbnail.filesize.to_i < upload.filesize
 								      img["src"] = thumbnail.url
 								      srcset = +""
 								      each_responsive_ratio do |ratio|
 								        resized_w = (w * ratio).to_i
 								        resized_h = (h * ratio).to_i
 								        if !cropped && upload.width && resized_w > upload.width
-												FIX: Secure Upload URLs in lightbox (#8451)

This fixes the following issues:

* The link element on the lightbox which pops open the lightbox was linking to the S3 URL with a private ACL instead of the secure media URL for the image
* Change to use `@post.with_secure_media?` in `CookedPostProcessor` for URL cooking, as in some cases, like when a post is edited and an upload is added, `upload.secure?` can be false which resulted in `srcset` URLs not being cooked correctly to secure media upload urls.

											
										
										
											2019-12-04 18:13:09 -05:00
+								          cooked_url = UrlHelper.cook_url(upload.url, secure: @post.with_secure_media?)
-												FIX: Optimize quoted images (#8427)

Only images that were part of a lightbox used to be optimized. This
patch ensures that quoted images are also optimized.
											
										
										
											2019-11-29 08:18:42 -05:00
+								          srcset << ", #{cooked_url} #{ratio.to_s.sub(/\.0$/, "")}x"
 								        elsif t = upload.thumbnail(resized_w, resized_h)
-												FIX: Secure Upload URLs in lightbox (#8451)

This fixes the following issues:

* The link element on the lightbox which pops open the lightbox was linking to the S3 URL with a private ACL instead of the secure media URL for the image
* Change to use `@post.with_secure_media?` in `CookedPostProcessor` for URL cooking, as in some cases, like when a post is edited and an upload is added, `upload.secure?` can be false which resulted in `srcset` URLs not being cooked correctly to secure media upload urls.

											
										
										
											2019-12-04 18:13:09 -05:00
+								          cooked_url = UrlHelper.cook_url(t.url, secure: @post.with_secure_media?)
-												FIX: Optimize quoted images (#8427)

Only images that were part of a lightbox used to be optimized. This
patch ensures that quoted images are also optimized.
											
										
										
											2019-11-29 08:18:42 -05:00
+								          srcset << ", #{cooked_url} #{ratio.to_s.sub(/\.0$/, "")}x"
 								        end
-												FIX: Secure Upload URLs in lightbox (#8451)

This fixes the following issues:

* The link element on the lightbox which pops open the lightbox was linking to the S3 URL with a private ACL instead of the secure media URL for the image
* Change to use `@post.with_secure_media?` in `CookedPostProcessor` for URL cooking, as in some cases, like when a post is edited and an upload is added, `upload.secure?` can be false which resulted in `srcset` URLs not being cooked correctly to secure media upload urls.

											
										
										
											2019-12-04 18:13:09 -05:00
+								        img["srcset"] = "#{UrlHelper.cook_url(img["src"], secure: @post.with_secure_media?)}#{srcset}" if srcset.present?
-												FIX: Optimize quoted images (#8427)

Only images that were part of a lightbox used to be optimized. This
patch ensures that quoted images are also optimized.
											
										
										
											2019-11-29 08:18:42 -05:00
+								      end
 								    else
 								      img["src"] = upload.url
 								    end
 								    if small_upload = loading_image(upload)
 								      img["data-small-upload"] = small_upload.url
 								    end
 								  end
-												FIX: don't use srcset on cropped thumbnails

											
										
										
											2018-10-25 10:08:10 -04:00
+								  def add_lightbox!(img, original_width, original_height, upload, cropped: false)
-												soften the lightbox overlay

											
										
										
											2013-06-25 20:44:20 -04:00
+								    # first, create a div to hold our lightbox
-												PERF: Improve quality of `PostSearchData#raw_data`. (#7275)

This commit fixes the following quality issues with `PostSearchData#raw_data`:

1. URLs are being tokenized and links with similar href and characters
are being duplicated in the raw data.

`Post#cooked`:

```
<p><a href=\"https://meta.discourse.org/some.png\" class=\"onebox\" target=\"_blank\" rel=\"nofollow noopener\">https://meta.discourse.org/some.png</a></p>
```

`PostSearchData#raw_data` Before:

```
This is a test topic 0 Uncategorized https://meta.discourse.org/some.png discourse org/some png https://meta.discourse.org/some.png discourse org/some png
```

`PostSearchData#raw_data` After:

```
This is a test topic 0 Uncategorized https://meta.discourse.org/some.png meta discourse org
```

2. Lightbox being included in search pollutes the
`PostSearchData#raw_data` unnecessarily.

From 28 March 2018 to 28 March 2019, searches for the term `image` on
`meta.discourse.org` had a click through rate of 2.1%. Non-lightboxed images are not included in indexing for search yet we were indexing content within a lightbox. Also, search for terms like `image` was affected because we were using `Pasted image` as the filename for
uploads that were pasted.

`Post#cooked`

```
<p>Let me see how I can fix this image<br>\n<div class=\"lightbox-wrapper\"><a class=\"lightbox\" href=\"https://meta.discourse.org/some.png\" title=\"some.png\" rel=\"nofollow noopener\"><img src=\"https://meta.discourse.org/some.png\" width=\"275\" height=\"299\"><div class=\"meta\">\n<svg class=\"fa d-icon d-icon-far-image svg-icon\" aria-hidden=\"true\"><use xlink:href=\"#far-image\"></use></svg><span class=\"filename\">some.png</span><span class=\"informations\">1750×2000</span><svg class=\"fa d-icon d-icon-discourse-expand svg-icon\" aria-hidden=\"true\"><use xlink:href=\"#discourse-expand\"></use></svg>\n</div></a></div></p>
```

`PostSearchData#raw_data` Before:

```
This is a test topic 0 Uncategorized Let me see how I can fix this image some.png png https://meta.discourse.org/some.png discourse org/some png some.png png 1750×2000
```

`PostSearchData#raw_data` After:

```
This is a test topic 0 Uncategorized Let me see how I can fix this image
```

In terms of indexing performance, we now have to parse the given HTML
through nokogiri twice. However performance is not a huge worry here since a string length of 194170 takes only 30ms
to scrub plus the indexing takes place in a background job.
											
										
										
											2019-03-31 22:14:29 -04:00
+								    lightbox = create_node("div", LIGHTBOX_WRAPPER_CSS_CLASS)
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								    img.add_next_sibling(lightbox)
 								    lightbox.add_child(img)
-												soften the lightbox overlay

											
										
										
											2013-06-25 20:44:20 -04:00
+								    # then, the link to our larger image
-												FIX: Secure Upload URLs in lightbox (#8451)

This fixes the following issues:

* The link element on the lightbox which pops open the lightbox was linking to the S3 URL with a private ACL instead of the secure media URL for the image
* Change to use `@post.with_secure_media?` in `CookedPostProcessor` for URL cooking, as in some cases, like when a post is edited and an upload is added, `upload.secure?` can be false which resulted in `srcset` URLs not being cooked correctly to secure media upload urls.

											
										
										
											2019-12-04 18:13:09 -05:00
+								    src = UrlHelper.cook_url(img["src"], secure: @post.with_secure_media?)
 								    a = create_link_node("lightbox", src)
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
+								    img.add_next_sibling(a)
-												FEATURE: use original filename when clicking the download link in the lightbox

											
										
										
											2014-10-15 13:20:04 -04:00
-												FIX: Ensure lightbox image download has correct content disposition in S3 (#7845)


											
										
										
											2019-07-04 11:32:51 -04:00
+								    if upload
-												FEATURE: use original filename when clicking the download link in the lightbox

											
										
										
											2014-10-15 13:20:04 -04:00
+								      a["data-download-href"] = Discourse.store.download_url(upload)
 								    end
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
+								    a.add_child(img)
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
-												soften the lightbox overlay

											
										
										
											2013-06-25 20:44:20 -04:00
+								    # then, some overlay informations
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								    meta = create_node("div", "meta")
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								    img.add_next_sibling(meta)
-												add lightbox overlay

											
										
										
											2013-06-21 12:29:40 -04:00
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    filename = get_filename(upload, img["src"])
-												DEV: enable frozen string literal on all files

This reduces chances of errors where consumers of strings mutate inputs
and reduces memory usage of the app.

Test suite passes now, but there may be some stuff left, so we will run
a few sites on a branch prior to merging

											
										
										
											2019-05-02 18:17:27 -04:00
+								    informations = +"#{original_width}×#{original_height}"
-												UX: Lightbox support for image uploader. (#7034)


											
										
										
											2019-02-20 21:13:37 -05:00
+								    informations << " #{upload.human_filesize}" if upload
-												add lightbox overlay

											
										
										
											2013-06-21 12:29:40 -04:00
-												FEATURE: fallback to image alt before filename if there's no title in lightboxes (#8286)

* use image alt as a fallback when there's no title

* update spec

we used to check that the overlay information is added when the image has a title. This adds 2 more scenarios. One where an image has both a title and an alt, in which case the title should be used and alt ignored.

The other is when there's only an alt, it should then be used to generate the overlay

											
										
										
											2019-11-03 18:15:14 -05:00
+								    a["title"] = CGI.escapeHTML(img["title"] || img["alt"] || filename)
-												add download link in lightbox

											
										
										
											2013-11-29 14:03:39 -05:00
-												DEV: Refactor icons used in lightbox HTML

Uses <svg> elements instead of hacky CSS pseudoelements

Adds a migration to mark posts with lightboxes as needing a rebake

											
										
										
											2019-03-22 11:52:06 -04:00
+								    meta.add_child create_icon_node("far-image")
-												SECURITY: Escape HTML in filename.

											
										
										
											2016-08-10 23:27:12 -04:00
+								    meta.add_child create_span_node("filename", a["title"])
-												soften the lightbox overlay

											
										
										
											2013-06-25 20:44:20 -04:00
+								    meta.add_child create_span_node("informations", informations)
-												DEV: Refactor icons used in lightbox HTML

Uses <svg> elements instead of hacky CSS pseudoelements

Adds a migration to mark posts with lightboxes as needing a rebake

											
										
										
											2019-03-22 11:52:06 -04:00
+								    meta.add_child create_icon_node("discourse-expand")
-												add lightbox overlay

											
										
										
											2013-06-21 12:29:40 -04:00
+								  end
-												basic lightbox support

											
										
										
											2013-02-19 01:57:14 -05:00
-												provide a way to give a default filename to pasted images in the lightbox overlay

											
										
										
											2013-06-26 15:53:31 -04:00
+								  def get_filename(upload, src)
 								    return File.basename(src) unless upload
-												FIX: can no longer paste image in Chrome post editor

											
										
										
											2013-07-03 18:39:23 -04:00
+								    return upload.original_filename unless upload.original_filename =~ /^blob(\.png)?$/i
-												DEV: Apply Rubocop redundant return style

											
										
										
											2019-11-14 15:10:51 -05:00
+								    I18n.t("upload.pasted_image_filename")
-												provide a way to give a default filename to pasted images in the lightbox overlay

											
										
										
											2013-06-26 15:53:31 -04:00
+								  end
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								  def create_node(tag_name, klass)
 								    # Builds a new <tag_name> element created against @doc. The "class"
 								    # attribute is only written when klass is not blank, so callers can
 								    # pass nil or "" to get an element without a class.
 								    Nokogiri::XML::Node.new(tag_name, @doc).tap do |element|
 								      element["class"] = klass unless klass.blank?
 								    end
 								  end
-												add lightbox overlay

											
										
										
											2013-06-21 12:29:40 -04:00
+								  def create_span_node(klass, content = nil)
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								    span = create_node("span", klass)
-												add lightbox overlay

											
										
										
											2013-06-21 12:29:40 -04:00
+								    span.content = content if content
 								    span
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
+								  end
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								  def create_icon_node(klass)
-												Upgrade to FontAwesome 5 (take two) (#6673)

* Add missing icons to set

* Revert FA5 revert

 This reverts commit 42572ff

* use new SVG syntax in locales

* Noscript page changes (remove login button, center "powered by" footer text)

* Cast wider net for SVG icons in settings

- include any _icon setting for SVG registry (offers better support for plugin settings)

- let themes store multiple pipe-delimited icons in a setting

- also replaces broken onebox image icon with SVG reference in cooked post processor

* interpolate icons in locales

* Fix composer whisper icon alignment

* Add support for stacked icons

* SECURITY: enforce hostname to match discourse hostname

This ensures that the hostname rails uses for various helpers always matches
the Discourse hostname

* load SVG sprite with pre-initializers

* FIX: enable caching on SVG sprites

* PERF: use JSONP for SVG sprites so they are served from CDN

This avoids needing to deal with CORS for loading of the SVG

Note, added the svg- prefix to the filename so we can quickly tell in
dev tools what the file is

* Add missing SVG sprite JSONP script to CSP

* Upgrade to FA 5.5.0

* Add support for all FA4.7 icons

- adds complete frontend and backend for renamed FA4.7 icons

- improves performance of SvgSprite.bundle and SvgSprite.all_icons

* Fix group avatar flair preview

- adds an endpoint at /svg-sprites/search/:keyword

- adds frontend ajax call that pulls icon in avatar flair preview even when it is not in subset

* Remove FA 4.7 font files

											
										
										
											2018-11-26 16:49:57 -05:00
+								    icon = create_node("svg", "fa d-icon d-icon-#{klass} svg-icon")
 								    icon.set_attribute("aria-hidden", "true")
 								    icon << "<use xlink:href=\"##{klass}\"></use>"
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								  end
 								  # Builds an <a> element with the given CSS class and href.
 								  # When external is truthy the link additionally gets target="_blank"
 								  # and rel="nofollow noopener". Returns the new node.
 								  def create_link_node(klass, url, external = false)
 								    link = create_node("a", klass)
 								    link["href"] = url
 								    return link unless external

 								    link["target"] = "_blank"
 								    link["rel"] = "nofollow noopener"
 								    link
 								  end
-												FEATURE: include post image in OpenGraph image tag

											
										
										
											2016-10-31 05:41:33 -04:00
+								  def update_post_image
-												FEATURE: Include optimized thumbnails for topics (#9215)

This introduces new APIs for obtaining optimized thumbnails for topics. There are a few building blocks required for this:

- Introduces new `image_upload_id` columns on the `posts` and `topics` table. This replaces the old `image_url` column, which means that thumbnails are now restricted to uploads. Hotlinked thumbnails are no longer possible. In normal use (with pull_hotlinked_images enabled), this has no noticeable impact

- A migration attempts to match existing urls to upload records. If a match cannot be found then the posts will be queued for rebake

- Optimized thumbnails are generated during post_process_cooked. If thumbnails are missing when serializing a topic list, then a sidekiq job is queued

- Topic lists and topics now include a `thumbnails` key, which includes all the available images:
   ```
   "thumbnails": [
   {
     "max_width": null,
     "max_height": null,
     "url": "//example.com/original-image.png",
     "width": 1380,
     "height": 1840
   },
   {
     "max_width": 1024,
     "max_height": 1024,
     "url": "//example.com/optimized-image.png",
     "width": 768,
     "height": 1024
   }
   ]
  ```

- Themes can request additional thumbnail sizes by using a modifier in their `about.json` file:
   ```
    "modifiers": {
      "topic_thumbnail_sizes": [
        [200, 200],
        [800, 800]
      ],
      ...
  ```
  Remember that these are generated asynchronously, so your theme should include logic to fallback to other available thumbnails if your requested size has not yet been generated

- Two new raw plugin outlets are introduced, to improve the customisability of the topic list. `topic-list-before-columns` and `topic-list-before-link`
											
										
										
											2020-05-05 04:07:50 -04:00
+								    upload = nil
 								    eligible_image_fragments = extract_images_for_post
 								    # Loop through those fragments until we find one with an upload record
 								    @post.each_upload_url(fragments: eligible_image_fragments) do |src, path, sha1|
 								      upload = Upload.find_by(sha1: sha1)
 								      break if upload
-												FIX: Remove post/topic image_url on post edits

- resets image_url when image is removed from first post on edit
- excludes onebox icons from being featured as topic/post images

											
										
										
											2020-02-06 11:19:40 -05:00
+								    end
-												Add extraction of image_url for oneboxed images. Fix search by images filter name.

											
										
										
											2017-06-09 07:16:50 -04:00
-												FEATURE: Include optimized thumbnails for topics (#9215)

This introduces new APIs for obtaining optimized thumbnails for topics. There are a few building blocks required for this:

- Introduces new `image_upload_id` columns on the `posts` and `topics` table. This replaces the old `image_url` column, which means that thumbnails are now restricted to uploads. Hotlinked thumbnails are no longer possible. In normal use (with pull_hotlinked_images enabled), this has no noticeable impact

- A migration attempts to match existing urls to upload records. If a match cannot be found then the posts will be queued for rebake

- Optimized thumbnails are generated during post_process_cooked. If thumbnails are missing when serializing a topic list, then a sidekiq job is queued

- Topic lists and topics now include a `thumbnails` key, which includes all the available images:
   ```
   "thumbnails": [
   {
     "max_width": null,
     "max_height": null,
     "url": "//example.com/original-image.png",
     "width": 1380,
     "height": 1840
   },
   {
     "max_width": 1024,
     "max_height": 1024,
     "url": "//example.com/optimized-image.png",
     "width": 768,
     "height": 1024
   }
   ]
  ```

- Themes can request additional thumbnail sizes by using a modifier in their `about.json` file:
   ```
    "modifiers": {
      "topic_thumbnail_sizes": [
        [200, 200],
        [800, 800]
      ],
      ...
  ```
  Remember that these are generated asynchronously, so your theme should include logic to fallback to other available thumbnails if your requested size has not yet been generated

- Two new raw plugin outlets are introduced, to improve the customisability of the topic list. `topic-list-before-columns` and `topic-list-before-link`
											
										
										
											2020-05-05 04:07:50 -04:00
+								    if upload.present?
 								      @post.update_column(:image_upload_id, upload.id) # post
 								      if @post.is_first_post? # topic
 								        @post.topic.update_column(:image_upload_id, upload.id)
 								        extra_sizes = ThemeModifierHelper.new(theme_ids: Theme.user_selectable.pluck(:id)).topic_thumbnail_sizes
 								        @post.topic.generate_thumbnails!(extra_sizes: extra_sizes)
 								      end
 								    else
 								      @post.update_column(:image_upload_id, nil) if @post.image_upload_id
 								      @post.topic.update_column(:image_upload_id, nil) if @post.topic.image_upload_id && @post.is_first_post?
 								      nil
-												refactor CookedPostProcessor & specs

											
										
										
											2013-07-07 19:39:08 -04:00
+								    end
 								  end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								  def post_process_oneboxes
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the site setting has been reached, all oneboxes are not
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
+								    limit = SiteSetting.max_oneboxes_per_post
 								    oneboxes = {}
 								    inlineOneboxes = {}
-												DEV: Remove INLINE_ONEBOX_* constants

There were two constants here, `INLINE_ONEBOX_LOADING_CSS_CLASS` and
`INLINE_ONEBOX_CSS_CLASS` that were both longer than the strings they
were DRYing up: `inline-onebox-loading` and `inline-onebox`

I normally appreciate constants, but in this case it meant that we had
a lot of JS imports resulting in many more lines of code (and CPU cycles
spent figuring them out.)

It also meant we had an `.erb` file and had to invoke Ruby to create the
JS file, which meant the app was harder to port to Ember CLI.

I removed the constants. It's less DRY but faster and simpler, and
arguably the loss of DRYness is not significant as you can still search
for the `inline-onebox-loading` and `inline-onebox` strings easily if
you are refactoring.

											
										
										
											2020-05-07 16:08:48 -04:00
+								    Oneboxer.apply(@doc, extra_paths: [".inline-onebox-loading"]) do |url, element|
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the site setting has been reached, all oneboxes are not
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
+								      is_onebox = element["class"] == Oneboxer::ONEBOX_CSS_CLASS
 								      map = is_onebox ? oneboxes : inlineOneboxes
 								      skip_onebox = limit <= 0 && !map[url]
 								      if skip_onebox
-												UX: Strip class when link is not oneboxed due to site setting limits.

											
										
										
											2018-11-29 01:33:01 -05:00
+								        if is_onebox
 								          element.remove_class('onebox')
 								        else
 								          remove_inline_onebox_loading_class(element)
 								        end
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the site setting has been reached, all oneboxes are not
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
+								        next
 								      end
 								      limit -= 1
 								      map[url] = true
 								      if is_onebox
-												FIX: Award 'First Onebox' badge just for Oneboxed URLs. (#7974)


											
										
										
											2019-08-08 12:45:18 -04:00
+								        onebox = Oneboxer.onebox(url,
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the site setting has been reached, all oneboxes are not
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
+								          invalidate_oneboxes: !!@opts[:invalidate_oneboxes],
 								          user_id: @post&.user_id,
 								          category_id: @post&.topic&.category_id
 								        )
-												FIX: Award 'First Onebox' badge just for Oneboxed URLs. (#7974)


											
										
										
											2019-08-08 12:45:18 -04:00
 								        @has_oneboxes = true if onebox.present?
 								        onebox
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the site setting has been reached, all oneboxes are not
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
+								      else
 								        process_inline_onebox(element)
 								        false
 								      end
-												ensure we allow self oneboxing of login required sites

											
										
										
											2016-11-03 17:48:32 -04:00
+								    end
-												fix the build
											
										
										
											2017-10-23 13:09:38 -04:00
-												FEATURE: pull onebox images

											
										
										
											2017-06-02 05:39:06 -04:00
+								    oneboxed_images.each do |img|
-												FIX: Should skip the loop if the image src is blank

											
										
										
											2017-11-27 03:11:28 -05:00
+								      next if img["src"].blank?
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								      src = img["src"].sub(/^https?:/i, "")
-												FIX: Display large/broken image placeholders for image oneboxes

											
										
										
											2018-10-07 08:10:15 -04:00
+								      parent = img.parent
 								      img_classes = (img["class"] || "").split(" ")
 								      link_classes = ((parent&.name == "a" && parent["class"]) || "").split(" ")
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
-												FIX: Do not add lightbox to onebox images (#6479)


											
										
										
											2018-10-10 17:57:21 -04:00
+								      if img_classes.include?("onebox") || link_classes.include?("onebox")
 								        next if add_image_placeholder!(img)
 								      elsif large_images.include?(src) || broken_images.include?(src)
 								        img.remove
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								        next
 								      end
-												FIX: properly handle too large & broken images in posts

											
										
										
											2017-11-16 09:45:07 -05:00
+								      upload_id = downloaded_images[src]
-												FIX: Use find_by_id method to prevent record not found exception

											
										
										
											2018-12-14 16:49:45 -05:00
+								      upload = Upload.find_by_id(upload_id) if upload_id
-												FIX: Use presigned URL to avoid 403 when pulling hotlinked images for secure media (#8764)

When we were pulling hotlinked images for oneboxes in the CookedPostProcessor, we were using the direct S3 URL, which returned a 403 error and thus did not set widths and heights of the images. We now cook the URL first based on whether the upload is secure before handing off to FastImage.
											
										
										
											2020-01-22 18:31:46 -05:00
 								      if upload.present?
 								        img["src"] = UrlHelper.cook_url(upload.url, secure: @post.with_secure_media?)
 								      end
-												fix the build
											
										
										
											2017-10-23 13:09:38 -04:00
-												NEW: large image placeholder added in cooked html (#5291)


											
										
										
											2017-11-15 05:30:47 -05:00
+								      # make sure we grab dimensions for oneboxed images
 								      # and wrap in a div
-												UX: onebox images no longer cause jiggle

This stops pages from "jiggling" while oneboxes download.

see: http://cssmojo.com/aspect-ratio-using-custom-properties-and-calc/

											
										
										
											2017-10-30 22:50:44 -04:00
+								      limit_size!(img)
-												UX: oneboxes with avatars now display consistently

Onebox avatar size is reduced to 60px

Also fixes regression with some oneboxes not cooking after post

											
										
										
											2017-11-07 19:50:01 -05:00
 								      next if img["class"]&.include?('onebox-avatar')
-												FIX: Process image onebox correctly when image is wrapped in a link

The instagram onebox sometimes surrounds the image with an `<a>` tag, which was breaking the aspect ratio logic, and therefore causing posts to change height on load.

											
										
										
											2019-05-10 05:02:15 -04:00
+								      parent = parent&.parent if parent&.name == "a"
-												FIX: Display large/broken image placeholders for image oneboxes

											
										
										
											2018-10-07 08:10:15 -04:00
+								      parent_class = parent && parent["class"]
-												UX: wrap instagram images with aspect ratio

											
										
										
											2018-03-21 16:00:05 -04:00
+								      width = img["width"].to_i
 								      height = img["height"].to_i
-												UX: generic onebox treats all square images as avatars and renders them smaller

											
										
										
											2017-11-12 19:19:06 -05:00
-												UX: wrap instagram images with aspect ratio

											
										
										
											2018-03-21 16:00:05 -04:00
+								      if parent_class&.include?("onebox-body") && width > 0 && height > 0
-												UX: generic onebox treats all square images as avatars and renders them smaller

											
										
										
											2017-11-12 19:19:06 -05:00
+								        # special instruction for width == height, assume we are dealing with an avatar
 								        if (img["width"].to_i == img["height"].to_i)
 								          found = false
 								          parent = img
 								          while parent = parent.parent
-												FIX: use allowlist and blocklist terminology (#10209)

This is a PR of the renaming whitelist to allowlist and blacklist to the blocklist.
											
										
										
											2020-07-26 20:23:54 -04:00
+								            if parent["class"] && parent["class"].include?("allowlistedgeneric")
-												UX: generic onebox treats all square images as avatars and renders them smaller

											
										
										
											2017-11-12 19:19:06 -05:00
+								              found = true
 								              break
 								            end
 								          end
 								          if found
 								            img["class"] = img["class"].to_s + " onebox-avatar"
 								            next
 								          end
 								        end
-												UX: stop warping tiny onebox images

											
										
										
											2017-11-27 20:32:35 -05:00
+								        if width < 64 && height < 64
 								          img["class"] = img["class"].to_s + " onebox-full-image"
 								        else
 								          img.delete('width')
 								          img.delete('height')
 								          new_parent = img.add_next_sibling("<div class='aspect-image' style='--aspect-ratio:#{width}/#{height};'/>")
 								          new_parent.first.add_child(img)
 								        end
-												FEATURE: bump onebox version, add styling for new reddit image onebox

											
										
										
											2019-04-04 05:24:30 -04:00
+								      elsif (parent_class&.include?("instagram-images") || parent_class&.include?("tweet-images") || parent_class&.include?("scale-images")) && width > 0 && height > 0
-												UX: wrap instagram images with aspect ratio

											
										
										
											2018-03-21 16:00:05 -04:00
+								        img.remove_attribute("width")
 								        img.remove_attribute("height")
-												FIX: Process image onebox correctly when image is wrapped in a link

The instagram onebox sometimes surrounds the image with an `<a>` tag, which was breaking the aspect ratio logic, and therefore causing posts to change height on load.

											
										
										
											2019-05-10 05:02:15 -04:00
+								        parent["class"] = "aspect-image-full-size"
 								        parent["style"] = "--aspect-ratio:#{width}/#{height};"
-												UX: onebox images no longer cause jiggle

This stops pages from "jiggling" while oneboxes download.

see: http://cssmojo.com/aspect-ratio-using-custom-properties-and-calc/

											
										
										
											2017-10-30 22:50:44 -04:00
+								      end
 								    end
-												FIX: respect nofollow settings for onebox links

											
										
										
											2018-03-26 06:24:39 -04:00
-												FIX: respect `tl3 links no follow` setting (#8232)


											
										
										
											2019-10-22 13:11:04 -04:00
+								    if @omit_nofollow || !SiteSetting.add_rel_nofollow_to_user_content
-												FIX: Don't strip `noopener` from oneboxes

											
										
										
											2020-07-13 16:54:15 -04:00
+								      @doc.css(".onebox-body a[rel], .onebox a[rel]").each do |a|
 								        rel_values = a['rel'].split(' ').map(&:downcase)
 								        rel_values.delete('nofollow')
 								        rel_values.delete('ugc')
 								        if rel_values.blank?
 								          a.remove_attribute("rel")
 								        else
 								          a["rel"] = rel_values.join(' ')
 								        end
 								      end
-												FIX: respect nofollow settings for onebox links

											
										
										
											2018-03-26 06:24:39 -04:00
+								    end
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
+								  end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								  def optimize_urls
-												FEATURE: use original filename when clicking the download link in the lightbox

											
										
										
											2014-10-15 13:20:04 -04:00
+								    %w{href data-download-href}.each do |selector|
 								      @doc.css("a[#{selector}]").each do |a|
-												FIX: store the topic links using the cooked upload url

											
										
										
											2018-08-14 06:23:32 -04:00
+								        a[selector] = UrlHelper.cook_url(a[selector].to_s)
-												FEATURE: use original filename when clicking the download link in the lightbox

											
										
										
											2014-10-15 13:20:04 -04:00
+								      end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    end
-												FIX: ensure local images use local CDN when uploads are stored on S3

When the S3 store was enabled, we were only applying the S3 CDN.
So all images stored locally, like the emojis, were never put on the local CDN.

Fixed a bunch of CookedPostProcessor test by adding a call to 'optimize_urls'
in order to get final URLs.

I also removed the unnecessary PrettyText.add_s3_cdn method since this is already
handled in the CookedPostProcessor.

											
										
										
											2019-02-20 13:24:38 -05:00
+								    %w{src data-small-upload}.each do |selector|
 								      @doc.css("img[#{selector}]").each do |img|
-												FEATURE: Add support for secure media (#7888)

This PR introduces a new secure media setting. When enabled, it prevents unauthorized access to media uploads (files of type image, video and audio). When the `login_required` setting is enabled, then all media uploads will be protected from unauthorized (anonymous) access. When `login_required` is disabled, only media in private messages will be protected from unauthorized access.

A few notes: 

- the `prevent_anons_from_downloading_files` setting no longer applies to audio and video uploads
- the `secure_media` setting can only be enabled if S3 uploads are already enabled and configured
- upload records have a new column, `secure`, which is a boolean `true/false` of the upload's secure status
- when creating a public post with an upload that has already been uploaded and is marked as secure, the post creator will raise an error
- when enabling or disabling the setting on a site with existing uploads, the rake task `uploads:ensure_correct_acl` should be used to update all uploads' secure status and their ACL on S3

											
										
										
											2019-11-17 20:25:42 -05:00
+								        img[selector] = UrlHelper.cook_url(img[selector].to_s, secure: @post.with_secure_media?)
-												FIX: ensure local images use local CDN when uploads are stored on S3

When the S3 store was enabled, we were only applying the S3 CDN.
So all images stored locally, like the emojis, were never put on the local CDN.

Fixed a bunch of CookedPostProcessor test by adding a call to 'optimize_urls'
in order to get final URLs.

I also removed the unnecessary PrettyText.add_s3_cdn method since this is already
handled in the CookedPostProcessor.

											
										
										
											2019-02-20 13:24:38 -05:00
+								      end
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    end
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
+								  end
-												fix the build
											
										
										
											2017-10-23 13:09:38 -04:00
-												FEATURE: Remove user IDs from internal URLs. (#7406)


											
										
										
											2019-04-22 22:45:41 -04:00
+								  def remove_user_ids
 								    @doc.css("a[href]").each do |a|
-												FIX: rescue InvalidURIError when removing user ids from links

											
										
										
											2019-04-25 03:06:31 -04:00
+								      uri = begin
 								        URI(a["href"])
 								      rescue URI::Error
 								        next
 								      end
-												FEATURE: Remove user IDs from internal URLs. (#7406)


											
										
										
											2019-04-22 22:45:41 -04:00
+								      next if uri.hostname != Discourse.current_hostname
 								      query = Rack::Utils.parse_nested_query(uri.query)
 								      next if !query.delete("u")
 								      uri.query = query.map { |k, v| "#{k}=#{v}" }.join("&").presence
 								      a["href"] = uri.to_s
 								    end
 								  end
-												Small re-organization of CookedPostProcessor workflow

- only 'limit_size!' of oneboxed images once
- update post image at the end
- move 'enforce_nofollow' in its own method
											
										
										
											2017-10-23 12:15:51 -04:00
+								  def enforce_nofollow
-												FIX: Make sure rel attributes are correctly set. (#10645)

We must guarantee that "rel=noopener" was set if "target=_blank" is present, which is not always the case for trusted users. Also, if the link contains the "nofollow" attribute, it has to have the "ugc" attribute as well.
											
										
										
											2020-09-10 11:59:51 -04:00
+								    add_nofollow = !@omit_nofollow && SiteSetting.add_rel_nofollow_to_user_content
 								    PrettyText.add_rel_attributes_to_user_content(@doc, add_nofollow)
-												Small re-organization of CookedPostProcessor workflow

- only 'limit_size!' of oneboxed images once
- update post image at the end
- move 'enforce_nofollow' in its own method
											
										
										
											2017-10-23 12:15:51 -04:00
+								  end
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
-												DEV: Remove `bypass_bump` from CookedPostProcessor (#9468)

It was only passing it along to `PullHotlinkedImages` and that class has not used that arg since April 2014 (https://github.com/discourse/discourse/commit/c52ee665b45241a89b4de8b916860f380ecf0141)
											
										
										
											2020-04-20 21:48:19 -04:00
+								  def pull_hotlinked_images
-												FIX: Pull hotlinked images even when edited by system users (#9890)

Previously the pull hotlinked images job was skipped after system edits. This ensured that we never had an infinite loop of system-edit/pull-hotlinked/system-edit/pull-hotlinked etc.

A side effect was that edits made by system for any other reason (e.g. API, removing full quotes) would prevent pulling hotlinked images. This commit removes the system edit check, and replaces it with another method to avoid an infinite job scheduling loop.
											
										
										
											2020-05-29 08:07:47 -04:00
+								    return if @opts[:skip_pull_hotlinked_images]
-												add disk space usage failsafe

											
										
										
											2013-11-15 10:46:41 -05:00
+								    # have we enough disk space?
-												FIX: Avoid infinite loop if disk space is low

We now continue to enqueue the pull_hotlinked_images job for optimized images, even if disk space is low

											
										
										
											2019-06-07 09:09:02 -04:00
+								    disable_if_low_on_disk_space # But still enqueue the job
-												pull hotlinked images

											
										
										
											2013-11-05 13:04:47 -05:00
+								    # make sure no other job is scheduled
 								    Jobs.cancel_scheduled_job(:pull_hotlinked_images, post_id: @post.id)
 								    # schedule the job
-												Rename `ninja_edit_window` to `editing_grace_period` :'(

											
										
										
											2015-11-24 14:28:42 -05:00
+								    delay = SiteSetting.editing_grace_period + 1
-												DEV: Remove `bypass_bump` from CookedPostProcessor (#9468)

It was only passing it along to `PullHotlinkedImages` and that class has not used that arg since April 2014 (https://github.com/discourse/discourse/commit/c52ee665b45241a89b4de8b916860f380ecf0141)
											
										
										
											2020-04-20 21:48:19 -04:00
+								    Jobs.enqueue_in(delay.seconds.to_i, :pull_hotlinked_images, post_id: @post.id)
-												post process attachments

											
										
										
											2013-07-10 16:55:37 -04:00
+								  end
-												add disk space usage failsafe

											
										
										
											2013-11-15 10:46:41 -05:00
+								  def disable_if_low_on_disk_space
-												DEV: Remove the return value of disable_if_low_on_disk_space (#9469)

It was used only in specs.
											
										
										
											2020-04-20 21:48:33 -04:00
+								    return if Discourse.store.external?
 								    return if !SiteSetting.download_remote_images_to_local
 								    return if available_disk_space >= SiteSetting.download_remote_images_threshold
-												FEATURE: use original filename when clicking the download link in the lightbox

											
										
										
											2014-10-15 13:20:04 -04:00
 								    SiteSetting.download_remote_images_to_local = false
-												DEV: Remove the return value of disable_if_low_on_disk_space (#9469)

It was used only in specs.
											
										
										
											2020-04-20 21:48:33 -04:00
-												FEATURE: use original filename when clicking the download link in the lightbox

											
										
										
											2014-10-15 13:20:04 -04:00
+								    # log the site setting change
 								    reason = I18n.t("disable_remote_images_download_reason")
 								    staff_action_logger = StaffActionLogger.new(Discourse.system_user)
 								    staff_action_logger.log_site_setting_change("download_remote_images_to_local", true, false, details: reason)
-												move notification about low disk space into its own method

											
										
										
											2015-08-14 17:46:15 -04:00
-												FEATURE: use original filename when clicking the download link in the lightbox

											
										
										
											2014-10-15 13:20:04 -04:00
+								    # also send a private message to the site contact user
-												move notification about low disk space into its own method

											
										
										
											2015-08-14 17:46:15 -04:00
+								    notify_about_low_disk_space
-												add disk space usage failsafe

											
										
										
											2013-11-15 10:46:41 -05:00
+								  end
-												move notification about low disk space into its own method

											
										
										
											2015-08-14 17:46:15 -04:00
+								  def notify_about_low_disk_space
 								    # Creates the :download_remote_images_disabled system message, from the system user, for the site contact user.
 								    SystemMessage.create_from_system_user(Discourse.site_contact_user, :download_remote_images_disabled)
 								  end
-												add disk space usage failsafe

											
										
										
											2013-11-15 10:46:41 -05:00
+								  def available_disk_space
-												DEV: use DiskSpace module for all disk space calculations

This normalizes it so we only carry one place for grabbing disk space size

It also normalizes the command made so it uses Discourse.execute_command
which splits off params in a far cleaner way.

											
										
										
											2020-02-17 23:13:09 -05:00
+								    100 - DiskSpace.percent_free("#{Rails.root}/public/uploads")
-												add disk space usage failsafe

											
										
										
											2013-11-15 10:46:41 -05:00
+								  end
-												cleaned up CookedPostProcessor and improved specs

											
										
										
											2013-06-15 06:29:20 -04:00
+								  def dirty?
-												make sure assets always use schemaless absolute uris

											
										
										
											2013-12-06 05:16:13 -05:00
+								    @previous_cooked != html
-												cleaned up CookedPostProcessor and improved specs

											
										
										
											2013-06-15 06:29:20 -04:00
+								  end
 								  def html
 								    @doc.try(:to_html)
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
+								  end
-												UX: Don't add light box for SVG images.

											
										
										
											2018-06-18 05:10:23 -04:00
+								  private
-												DEV: Make `CookedPostProcessor#post_process_images` method private.

											
										
										
											2019-05-26 23:28:37 -04:00
+								  def post_process_images
 								    extract_images.each do |img|
-												FIX: Perform crop using user-specified image sizes (#9224)

* FIX: Perform crop using user-specified image sizes

It used to resize the images to max width and height first and then
perform the crop operation. This is wrong because it ignored the user
specified image sizes from the Markdown.

* DEV: Use real images in test
											
										
										
											2020-03-26 10:40:00 -04:00
+								      convert_to_link!(img) unless add_image_placeholder!(img)
-												DEV: Make `CookedPostProcessor#post_process_images` method private.

											
										
										
											2019-05-26 23:28:37 -04:00
+								    end
 								  end
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the site setting had been reached, no oneboxes were
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
+								  def process_inline_onebox(element)
 								    inline_onebox = InlineOneboxer.lookup(
 								      element.attributes["href"].value,
-												FIX: Make inline oneboxes work with secured topics in secured contexts (#8895)


											
										
										
											2020-02-12 05:11:28 -05:00
+								      invalidate: !!@opts[:invalidate_oneboxes],
 								      user_id: @post&.user_id,
 								      category_id: @post&.topic&.category_id
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the site setting had been reached, no oneboxes were
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
+								    )
-												PERF: Move processing of inline onebox out of V8 context. (#6658)


											
										
										
											2018-11-25 20:21:38 -05:00
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the site setting was been reached, all oneboxes are not
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
+								    if title = inline_onebox&.dig(:title)
-												SECURITY: escape title HTML for inline onebox

											
										
										
											2019-01-09 20:02:05 -05:00
+								      element.children = CGI.escapeHTML(title)
-												DEV: Remove INLINE_ONEBOX_* constants

There were two constants here, `INLINE_ONEBOX_LOADING_CSS_CLASS` and
`INLINE_ONEBOX_CSS_CLASS` that were both longer than the strings they
were DRYing up: `inline-onebox-loading` and `inline-onebox`

I normally appreciate constants, but in this case it meant that we had
a lot of JS imports resulting in many more lines of code (and CPU cycles
spent figuring them out.)

It also meant we had an `.erb` file and had to invoke Ruby to create the
JS file, which meant the app was harder to port to Ember CLI.

I removed the constants. It's less DRY but faster and simpler, and
arguably the loss of DRYness is not significant as you can still search
for the `inline-onebox-loading` and `inline-onebox` strings easily if
you are refactoring.

											
										
										
											2020-05-07 16:08:48 -04:00
+								      element.add_class("inline-onebox")
-												PERF: Move processing of inline onebox out of V8 context. (#6658)


											
										
										
											2018-11-25 20:21:38 -05:00
+								    end
-												FEATURE: Reimplement `SiteSetting.max_oneboxes_per_post`. (#6668)

Previously, the site setting was only effective on the client side of
things. Once the site setting had been reached, no oneboxes were
rendered. This commit changes it such that the site setting is respected
both on the client and server side. The first N oneboxes are rendered and
once the limit has been reached, subsequent oneboxes will not be
rendered.
											
										
										
											2018-11-27 03:00:31 -05:00
 								    remove_inline_onebox_loading_class(element)
 								  end
 								  def remove_inline_onebox_loading_class(element)
-												DEV: Remove INLINE_ONEBOX_* constants

There were two constants here, `INLINE_ONEBOX_LOADING_CSS_CLASS` and
`INLINE_ONEBOX_CSS_CLASS` that were both longer than the strings they
were DRYing up: `inline-onebox-loading` and `inline-onebox`

I normally appreciate constants, but in this case it meant that we had
a lot of JS imports resulting in many more lines of code (and CPU cycles
spent figuring them out.)

It also meant we had an `.erb` file and had to invoke Ruby to create the
JS file, which meant the app was harder to port to Ember CLI.

I removed the constants. It's less DRY but faster and simpler, and
arguably the loss of DRYness is not significant as you can still search
for the `inline-onebox-loading` and `inline-onebox` strings easily if
you are refactoring.

											
										
										
											2020-05-07 16:08:48 -04:00
+								    element.remove_class("inline-onebox-loading")
-												PERF: Move processing of inline onebox out of V8 context. (#6658)


											
										
										
											2018-11-25 20:21:38 -05:00
+								  end
-												UX: Don't add light box for SVG images.

											
										
										
											2018-06-18 05:10:23 -04:00
+								  def is_svg?(img)
-												FIX: URL with params for svg images should not be light boxed.

											
										
										
											2018-06-19 22:47:14 -04:00
+								    path =
 								      begin
 								        URI(img["src"]).path
-												FIX: store the topic links using the cooked upload url

											
										
										
											2018-08-14 06:23:32 -04:00
+								      rescue URI::Error
-												FIX: URL with params for svg images should not be light boxed.

											
										
										
											2018-06-19 22:47:14 -04:00
+								        nil
 								      end
 								    File.extname(path) == '.svg' if path
-												UX: Don't add light box for SVG images.

											
										
										
											2018-06-18 05:10:23 -04:00
+								  end
-												Initial release of Discourse

											
										
										
											2013-02-05 14:16:51 -05:00
+								end