2013-02-05 14:16:51 -05:00
|
|
|
# Post processing that we can do after a post has already been cooked. For
|
|
|
|
# example, inserting the onebox content, or image sizes.
|
|
|
|
|
|
|
|
require_dependency 'oneboxer'
|
2013-04-13 10:31:20 -04:00
|
|
|
require_dependency 'image_optimizer'
|
2013-02-05 14:16:51 -05:00
|
|
|
|
|
|
|
# Runs extra processing over the already-cooked HTML of a post: fills in
# missing image dimensions, wraps large images in "lightbox" links and bakes
# onebox content into the document.
#
# Typical use: build an instance, call #post_process, then check #dirty? to
# see whether anything changed and read the result from #html.
class CookedPostProcessor

  # post - the post to process; this class reads its `cooked`, `id`,
  #        `post_number` and `topic`.
  # opts - optional Hash; the keys read here are :image_sizes and
  #        :invalidate_oneboxes.
  def initialize(post, opts = {})
    @dirty = false
    @opts = opts
    @post = post
    @doc = Nokogiri::HTML::fragment(post.cooked)
    # per-instance memoisation of remote lookups, keyed by url
    @size_cache = {}
    @has_been_uploaded_cache = {}
  end

  # Entry point: processes images first, then oneboxes. Does nothing when the
  # parsed document is blank.
  def post_process
    return unless @doc.present?
    post_process_images
    post_process_oneboxes
  end

  # Normalises every <img> in the document (absolute src, dimensions,
  # lightbox link) and, for the first post of a topic, stores the first
  # image's src as the topic's image_url.
  def post_process_images
    images = @doc.search("img")
    return unless images.present?

    images.each do |img|
      # keep track of the original src so a change can be detected below
      src = img['src']
      # make sure the src is absolute (when working with locally uploaded files);
      # a leading "//" does not match and is left untouched.
      # \A anchors at the start of the string (^ would also match after a newline).
      img['src'] = Discourse.base_url_no_prefix + src if src =~ %r{\A/[^/]}

      next unless src.present?

      # update img dimensions if at least one is missing
      update_dimensions!(img)
      # optimize image
      img['src'] = optimize_image(img)
      # lightbox treatment
      convert_to_link!(img)
      # mark the post as dirty whenever the src has changed
      @dirty |= src != img['src']
    end

    # Extract the first image from the first post and use it as the 'topic image'
    if @post.post_number == 1
      img = images.first
      @post.topic.update_column :image_url, img['src'] if img['src'].present?
    end
  end

  # Bakes onebox content into the document via Oneboxer and marks the post
  # dirty when Oneboxer reports a change.
  def post_process_oneboxes
    args = { post_id: @post.id }
    args[:invalidate_oneboxes] = true if @opts[:invalidate_oneboxes]

    # bake onebox content into the post
    result = Oneboxer.apply(@doc) do |url, _element|
      Oneboxer.onebox(url, args)
    end

    # mark the post as dirty whenever a onebox has been baked
    @dirty |= result.changed?
  end

  # Sets width/height on img when at least one of them is missing. Sizes
  # supplied through opts[:image_sizes] win over sizes looked up from the
  # image itself. Marks the post dirty when the attributes are written.
  def update_dimensions!(img)
    return if img['width'].present? && img['height'].present?

    w, h = get_size_from_image_sizes(img['src'], @opts[:image_sizes]) || image_dimensions(img['src'])

    if w && h
      img['width'] = w.to_s
      img['height'] = h.to_s
      @dirty = true
    end
  end

  # Returns the src to use for img. Currently a pass-through.
  def optimize_image(img)
    # TODO: needs some <3
    img["src"]
  end

  # Wraps img in <a class="lightbox" href="src"> when the image is displayed
  # wider than SiteSetting.auto_link_images_wider_than, the original image is
  # larger than the displayed size in both dimensions, and the image is not
  # already inside a link.
  def convert_to_link!(img)
    src = img["src"]
    width, height = img["width"].to_i, img["height"].to_i

    return unless src.present? && width > SiteSetting.auto_link_images_wider_than

    original_width, original_height = get_size(src)

    # get_size may return nil; nil.to_i is 0, so an unknown size never qualifies
    return unless original_width.to_i > width && original_height.to_i > height

    # walk up the ancestors; bail out if the image already sits inside a link
    parent = img.parent
    while parent
      return if parent.name == "a"
      break unless parent.respond_to? :parent
      parent = parent.parent
    end

    # not a hyperlink so we can apply
    a = Nokogiri::XML::Node.new "a", @doc
    img.add_next_sibling(a)
    a["href"] = src
    a["class"] = "lightbox"
    # re-parent the image under the new link
    a.add_child(img)
    @dirty = true
  end

  # Looks src up in image_sizes (entries are read via 'width' and 'height'
  # keys) and passes the stored size through ImageSizer.resize.
  # Returns nil when image_sizes is blank or has no entry for src.
  def get_size_from_image_sizes(src, image_sizes)
    return unless image_sizes.present?

    dim = image_sizes[src]
    ImageSizer.resize(dim['width'], dim['height']) if dim
  end

  # Retrieve the image dimensions for a url, passed through ImageSizer.resize.
  # Returns nil for urls that are not valid http(s) or whose size is unknown.
  def image_dimensions(url)
    return unless get_image_uri(url)

    w, h = get_size(url)
    ImageSizer.resize(w, h) if w && h
  end

  # Returns what FastImage.size reports for url, memoised per url.
  # Returns nil when crawling is not allowed for this url or the size could
  # not be determined.
  def get_size(url)
    # we can always crawl our own images
    return unless SiteSetting.crawl_images? || has_been_uploaded?(url)

    # key? (rather than ||=) so that failed lookups are remembered too and the
    # same broken url is not fetched again by a later caller
    return @size_cache[url] if @size_cache.key?(url)

    @size_cache[url] = begin
      FastImage.size(url)
    rescue Zlib::BufError # FastImage.size raises BufError for some gifs
      nil
    end
  end

  # Returns the parsed URI when url is a well-formed http or https URL,
  # nil otherwise (including urls that URI.parse rejects).
  def get_image_uri(url)
    uri = URI.parse(url)
    uri if %w(http https).include?(uri.scheme)
  rescue URI::InvalidURIError
    # image srcs come from post content; a malformed one must not abort processing
    nil
  end

  # True when url starts with #base_url. Memoised per url.
  def has_been_uploaded?(url)
    # fetch with a block memoises false results as well, which ||= would not
    @has_been_uploaded_cache.fetch(url) do
      @has_been_uploaded_cache[url] = url.start_with?(base_url)
    end
  end

  # The asset host when one is configured, otherwise
  # Discourse.base_url_no_prefix.
  def base_url
    asset_host.present? ? asset_host : Discourse.base_url_no_prefix
  end

  # Reads ActionController::Base.asset_host.
  def asset_host
    ActionController::Base.asset_host
  end

  # Whether processing changed the document.
  def dirty?
    @dirty
  end

  # The processed document serialised as HTML (nil when there is no document).
  def html
    @doc.try(:to_html)
  end

end
|