2019-05-02 18:17:27 -04:00
|
|
|
# frozen_string_literal: true
|
|
|
|
|
2013-02-05 14:16:51 -05:00
|
|
|
require "ipaddr"
|
2015-02-22 14:47:18 -05:00
|
|
|
require "url_helper"
|
|
|
|
|
2013-02-05 14:16:51 -05:00
|
|
|
# Records clicks on topic links and decides which URL a click may be redirected to.
class TopicLinkClick < ActiveRecord::Base
  belongs_to :topic_link, counter_cache: :clicks
  belongs_to :user

  validates_presence_of :topic_link_id

  # Hostnames that may be redirected to even when no matching TopicLink exists.
  ALLOWED_REDIRECT_HOSTNAMES = Set.new(%w[www.youtube.com youtu.be])

  # Create a click from a URL and post_id
  #
  # Builds a set of candidate spellings of the clicked URL (scheme variants,
  # schemaless, without CDN, without query string, without trailing "&..."
  # parameters, CDN-relative paths) and looks for a TopicLink matching any of
  # them, preferring the candidate that was generated first.
  #
  # @param args [Hash] options read by this method:
  #   :url      - the clicked URL (truncated to TopicLink.max_url_length)
  #   :post_id  - optional, restricts the TopicLink lookup to this post
  #   :topic_id - optional, restricts the TopicLink lookup to this topic
  #   :user_id  - optional, id of the clicking user
  #   :ip       - optional, stored on the click only when :user_id is absent
  # @return [String, nil] the URL to redirect to, or nil when the URL is blank
  #   or is not considered a safe redirect target.
  def self.create_from(args = {})
    # `to_s` lets a missing :url fall through to the blank check instead of
    # raising NoMethodError on nil.
    url = args[:url].to_s[0...TopicLink.max_url_length]
    return nil if url.blank?

    uri = UrlHelper.relaxed_parse(url)
    is_cdn_link = false

    # Insertion order matters: it is the priority order used when several
    # candidates match (see the array_position ordering below).
    urls = Set.new
    urls << url
    if url =~ /\Ahttp/
      urls << url.sub(/\Ahttps/, "http")
      urls << url.sub(/\Ahttp:/, "https:")
      urls << UrlHelper.schemaless(url)
    end
    urls << UrlHelper.absolute_without_cdn(url)
    urls << uri.path if uri.try(:host) == Discourse.current_hostname

    # Candidate without the query string (the fragment, if any, is kept).
    # A "?" that appears after "#" belongs to the fragment and is not a query.
    fragment_start = url.index("#") || url.size
    query_start = url.index("?")
    if query_start && query_start < fragment_start
      urls << url[0...query_start] + url[fragment_start..-1]
    end

    # link can have query params, and analytics can add more to the end:
    # try every prefix that ends just before an "&", longest first.
    # The `i > 0` guard is required: once "&" is found at index 0 the next
    # search offset would be -1, which String#rindex counts from the end of
    # the string, so the same "&" would be found forever.
    i = url.length
    while i > 0 && (i = url.rindex("&", i - 1))
      urls << url[0...i]
    end

    # add a cdn link
    if uri
      if Discourse.asset_host.present?
        path = path_relative_to_cdn(uri, Discourse.asset_host)
        if path
          is_cdn_link = true
          urls << path
        end
      end

      if SiteSetting.Upload.s3_cdn_url.present?
        path = path_relative_to_cdn(uri, SiteSetting.Upload.s3_cdn_url)
        if path
          is_cdn_link = true
          urls << path
          urls << "#{Discourse.store.absolute_base_url}#{path}"
        end
      end
    end

    # test for all possible URLs
    link = TopicLink.where(url: urls)

    # Find the forum topic link
    link = link.where(post_id: args[:post_id]) if args[:post_id].present?

    # If we don't have a post, just find the first occurrence of the link
    link = link.where(topic_id: args[:topic_id]) if args[:topic_id].present?

    # select the TopicLink associated to first url
    # (every candidate is escaped with the connection's `quote` before being
    # interpolated into the ORDER BY expression)
    quoted_urls = urls.map { |candidate| ActiveRecord::Base.connection.quote(candidate) }.join(",")
    link = link.order("array_position(ARRAY[#{quoted_urls}], url::text)").first

    # If no link is found...
    unless link.present?
      # ... return the url for relative links or when using the same host
      return url if url =~ %r{\A/[^/]} || uri.try(:host) == Discourse.current_hostname

      # If we have it somewhere else on the site, just allow the redirect.
      # This is likely due to a onebox of another topic.
      link = TopicLink.find_by(url: url)
      return link.url if link.present?

      return nil unless uri

      # Only redirect to allowlisted hostnames
      return url if ALLOWED_REDIRECT_HOSTNAMES.include?(uri.hostname) || is_cdn_link

      return nil
    end

    # A click by the user recorded on the link itself is not counted.
    return url if args[:user_id] && link.user_id == args[:user_id]

    # Rate limit the click counts to once in 24 hours
    rate_key = "link-clicks:#{link.id}:#{args[:user_id] || args[:ip]}"
    # NOTE(review): setnx followed by expire is two separate commands; if the
    # second one never runs the key has no TTL. Consider a single atomic
    # SET with NX and EX if the redis wrapper supports it.
    if Discourse.redis.setnx(rate_key, "1")
      Discourse.redis.expire(rate_key, 1.day.to_i)
      # The IP address is only stored for clicks without a user id.
      args[:ip] = nil if args[:user_id]
      create!(topic_link_id: link.id, user_id: args[:user_id], ip_address: args[:ip])
    end

    url
  end

  # Returns the part of +uri+'s path that follows the CDN's own path when +uri+
  # has the same hostname as +cdn_url+ and its path starts with the CDN path.
  # Returns nil otherwise, including when +cdn_url+ cannot be parsed.
  def self.path_relative_to_cdn(uri, cdn_url)
    cdn_uri =
      begin
        URI.parse(cdn_url)
      rescue URI::Error
        nil
      end
    return nil unless cdn_uri
    return nil unless cdn_uri.hostname == uri.hostname && uri.path.starts_with?(cdn_uri.path)

    uri.path[cdn_uri.path.length..-1]
  end
  private_class_method :path_relative_to_cdn
end
|
2013-05-23 22:48:32 -04:00
|
|
|
|
|
|
|
# == Schema Information
|
|
|
|
#
|
|
|
|
# Table name: topic_link_clicks
|
|
|
|
#
|
|
|
|
# id :integer not null, primary key
|
|
|
|
# topic_link_id :integer not null
|
|
|
|
# user_id :integer
|
2014-08-27 01:19:25 -04:00
|
|
|
# created_at :datetime not null
|
|
|
|
# updated_at :datetime not null
|
2018-05-21 15:04:55 -04:00
|
|
|
# ip_address :inet
|
2013-05-23 22:48:32 -04:00
|
|
|
#
|
|
|
|
# Indexes
|
|
|
|
#
|
2021-07-05 18:14:15 -04:00
|
|
|
# by_link (topic_link_id)
|
2013-05-23 22:48:32 -04:00
|
|
|
#
|