2014-04-22 17:11:06 +02:00
|
|
|
require "open-uri"
|
|
|
|
|
2014-04-14 22:55:57 +02:00
|
|
|
class FileHelper
|
|
|
|
|
|
|
|
def self.is_image?(filename)
|
|
|
|
filename =~ images_regexp
|
|
|
|
end
|
|
|
|
|
2014-07-27 17:21:47 +02:00
|
|
|
def self.download(url, max_file_size, tmp_file_name, follow_redirect=false)
|
2014-05-12 16:57:52 +02:00
|
|
|
raise Discourse::InvalidParameters.new(:url) unless url =~ /^https?:\/\//
|
2014-04-14 22:55:57 +02:00
|
|
|
|
2014-11-12 18:15:50 +01:00
|
|
|
uri = parse_url(url)
|
2014-04-22 17:11:06 +02:00
|
|
|
extension = File.extname(uri.path)
|
2014-04-14 22:55:57 +02:00
|
|
|
tmp = Tempfile.new([tmp_file_name, extension])
|
|
|
|
|
|
|
|
File.open(tmp.path, "wb") do |f|
|
2015-08-17 19:21:30 +02:00
|
|
|
downloaded = uri.open("rb", read_timeout: 5, redirect: follow_redirect, allow_redirections: :all)
|
2015-05-19 12:39:46 +02:00
|
|
|
while f.size <= max_file_size && data = downloaded.read(512.kilobytes)
|
2014-04-14 22:55:57 +02:00
|
|
|
f.write(data)
|
|
|
|
end
|
2014-05-22 17:37:20 +10:00
|
|
|
# tiny files are StringIO, no close! on them
|
2015-05-19 12:39:46 +02:00
|
|
|
downloaded.try(:close!) rescue nil
|
2014-04-14 22:55:57 +02:00
|
|
|
end
|
|
|
|
|
|
|
|
tmp
|
|
|
|
end
|
|
|
|
|
|
|
|
private
|
|
|
|
|
|
|
|
def self.images
|
2014-10-13 12:43:36 -07:00
|
|
|
@@images ||= Set.new ["jpg", "jpeg", "png", "gif", "tif", "tiff", "bmp", "svg", "webp"]
|
2014-04-14 22:55:57 +02:00
|
|
|
end
|
|
|
|
|
|
|
|
def self.images_regexp
|
2014-04-29 19:12:35 +02:00
|
|
|
@@images_regexp ||= /\.(#{images.to_a.join("|")})$/i
|
2014-04-14 22:55:57 +02:00
|
|
|
end
|
|
|
|
|
2014-11-12 18:15:50 +01:00
|
|
|
# HACK to support underscores in URLs
|
|
|
|
# cf. http://stackoverflow.com/a/18938253/11983
|
|
|
|
def self.parse_url(url)
|
|
|
|
URI.parse(url)
|
|
|
|
rescue URI::InvalidURIError
|
|
|
|
host = url.match(".+\:\/\/([^\/]+)")[1]
|
|
|
|
uri = URI.parse(url.sub(host, 'valid-host'))
|
|
|
|
uri.instance_variable_set("@host", host)
|
|
|
|
uri
|
|
|
|
end
|
|
|
|
|
2014-04-14 22:55:57 +02:00
|
|
|
end
|