From ea9f93dcc5a95048a1cda2b420a94a1ca082cd13 Mon Sep 17 00:00:00 2001 From: Robin Ward Date: Fri, 19 May 2017 16:57:19 -0400 Subject: [PATCH] FIX: Don't crawl non-http/s links --- app/jobs/regular/crawl_topic_link.rb | 2 ++ 1 file changed, 2 insertions(+) diff --git a/app/jobs/regular/crawl_topic_link.rb b/app/jobs/regular/crawl_topic_link.rb index e77fedfab63..4f6e600ab1e 100644 --- a/app/jobs/regular/crawl_topic_link.rb +++ b/app/jobs/regular/crawl_topic_link.rb @@ -27,6 +27,8 @@ module Jobs uri = URI(url) return if uri.blank? || uri.host.blank? + return unless ['https', 'http'].include?(uri.scheme) + headers = CrawlTopicLink.request_headers(uri) head = Excon.head(url, read_timeout: 20, headers: headers)