FIX: Regression where api_key is not filtered properly.
This commit is contained in:
parent
0c4e4406a1
commit
4895723f7b
|
@ -0,0 +1,157 @@
|
|||
require 'date'

# Reads nginx access logs written in the `log_discourse` format (see the
# comment in LineParser) and accumulates request statistics keyed by IP
# address, username, route and URL.
class LogAnalyzer

  # Holds the fields extracted from a single access-log line.
  class LineParser

    # log_format log_discourse '[$time_local] $remote_addr "$request" "$http_user_agent" "$sent_http_x_discourse_route" $status $bytes_sent "$http_referer" $upstream_response_time $request_time "$sent_http_x_discourse_username"';

    attr_accessor :time, :ip_address, :url, :route, :user_agent, :rails_duration, :total_duration,
                  :username, :status, :bytes_sent, :referer

    PATTERN = /\[(.*)\] (\S+) \"(.*)\" \"(.*)\" \"(.*)\" ([0-9]+) ([0-9]+) \"(.*)\" ([0-9.]+) ([0-9.]+) "(.*)"/

    TIME_FORMAT = "%d/%b/%Y:%H:%M:%S %Z"

    # Request verbs that get appended to the route name, e.g. "topics/update (PUT)".
    ANNOTATED_VERBS = %w[POST PUT].freeze

    # Builds a LineParser from one raw log line.
    #
    # When the line does not match PATTERN every string field stays nil and
    # both durations are 0.0; callers can detect that case through `time`.
    #
    # @param line [String] a raw access-log line
    # @return [LineParser]
    def self.parse(line)
      result = new
      _, result.time, result.ip_address, result.url, result.user_agent,
        result.route, result.status, result.bytes_sent, result.referer,
        result.rails_duration, result.total_duration, result.username = line.match(PATTERN).to_a

      # nil.to_f is 0.0, so unmatched lines end up with zero durations.
      result.rails_duration = result.rails_duration.to_f
      result.total_duration = result.total_duration.to_f

      if result.url
        # `url` holds the whole request line ("VERB /path HTTP/x"). Take the
        # first token as the verb; slicing a fixed four characters would give
        # "PUT " for PUT requests and never equal "PUT".
        verb = result.url[/\A\S+/]
        result.route += " (#{verb})" if ANNOTATED_VERBS.include?(verb)

        result.url = sanitize_url(result.url)
      end

      result
    end

    # Truthy when the user agent contains Mobile, Android or webOS and does
    # not contain iPad, "Nexus 7" or "Nexus 10".
    def is_mobile?
      user_agent =~ /Mobile|Android|webOS/ && !(user_agent =~ /iPad|Nexus (7|10)/)
    end

    # @return [DateTime, nil] `time` parsed with TIME_FORMAT, or nil when the
    #   line had no time
    def parsed_time
      DateTime.strptime(time, TIME_FORMAT) if time
    end

    # Replaces the value of every `api_key=` parameter with "[FILTERED]".
    #
    # This is a singleton method, so a bare `private` keyword would not hide
    # it; it is intentionally left callable as before.
    #
    # @param url [String]
    # @return [String] a new string with the key values masked
    def self.sanitize_url(url)
      url.gsub(/api_key=([\w.\-]+)/, 'api_key=[FILTERED]')
    end
  end

  attr_reader :total_requests, :message_bus_requests, :filenames,
              :ip_to_rails_duration, :username_to_rails_duration,
              :route_to_rails_duration, :url_to_rails_duration,
              :status_404_to_count, :from_time, :to_time

  # Convenience wrapper: builds an analyzer and runs it.
  #
  # @param filenames [Array<String>] paths of the log files to read
  # @param args [Hash] options; only :limit is read (see #analyze)
  # @return [LogAnalyzer] the analyzer after processing all files
  def self.analyze(filenames, args = {})
    new(filenames, args).analyze
  end

  # Accumulates, per id, a running total, a hit count and optionally a
  # breakdown of that id by a secondary "aggregate" key.
  class Aggeregator

    # :duration (default) sums durations per aggregate key, :count counts hits.
    attr_accessor :aggregate_type

    def initialize
      @data = {}
      @aggregate_type = :duration
    end

    # Records one observation.
    #
    # @param id [Object] key to accumulate under
    # @param duration [Numeric] amount added to the running total for `id`
    # @param aggregate [Object, nil] optional secondary key for the breakdown
    def add(id, duration, aggregate = nil)
      # Layout of each entry: [total, hits, optional breakdown hash].
      ary = (@data[id] ||= [0, 0])
      ary[0] += duration
      ary[1] += 1

      return if aggregate.nil?

      ary[2] ||= Hash.new(0)
      if @aggregate_type == :duration
        ary[2][aggregate] += duration
      elsif @aggregate_type == :count
        ary[2][aggregate] += 1
      end
    end

    # Returns the `n` entries with the largest totals, largest first.
    #
    # Each row is [id_as_string, total, hits] plus, when a breakdown exists, a
    # fourth element: the return value of `aggregator_formatter` (called with
    # the breakdown hash, total and hits) or, without a formatter, the five
    # largest breakdown entries rendered as "key(value)" joined by spaces.
    #
    # @param n [Integer]
    # @param aggregator_formatter [#call, nil]
    # @return [Array<Array>]
    def top(n, aggregator_formatter = nil)
      @data.sort { |a, b| b[1][0] <=> a[1][0] }.first(n).map do |metric, ary|
        metric = metric.to_s
        metric = "[empty]" if metric.length == 0
        result = [metric, ary[0], ary[1]]

        # handle aggregate
        if ary[2]
          if aggregator_formatter
            result.push aggregator_formatter.call(ary[2], ary[0], ary[1])
          else
            breakdown = ary[2].sort { |a, b| b[1] <=> a[1] }.first(5).map do |k, v|
              v = "%.2f" % v if Float === v
              "#{k}(#{v})"
            end
            result.push breakdown.join(" ")
          end
        end

        result
      end
    end
  end

  # @param filenames [Array<String>] paths of the log files to read
  # @param args [Hash] options; :limit is stored and used by #analyze
  def initialize(filenames, args = {})
    @filenames = filenames
    @ip_to_rails_duration = Aggeregator.new
    @username_to_rails_duration = Aggeregator.new

    @route_to_rails_duration = Aggeregator.new
    @route_to_rails_duration.aggregate_type = :count

    @url_to_rails_duration = Aggeregator.new
    @status_404_to_count = Aggeregator.new

    @total_requests = 0
    @message_bus_requests = 0
    @limit = args[:limit]
  end

  # Reads every file line by line and fills the aggregators.
  #
  # Every line counts towards `total_requests`, including lines that fail to
  # parse. Lines without a time are skipped, as are lines older than `@limit`
  # minutes when a limit was given. Message-bus requests are counted
  # separately and excluded from the aggregators.
  #
  # @return [LogAnalyzer] self
  def analyze
    now = DateTime.now

    @filenames.each do |filename|
      # File.foreach closes the file once iteration ends.
      File.foreach(filename) do |line|
        @total_requests += 1
        parsed = LineParser.parse(line)

        next unless parsed.time
        # DateTime subtraction yields days; * 24 * 60 converts to minutes.
        next if @limit && ((now - parsed.parsed_time) * 24 * 60).to_i > @limit

        # Raw time strings of the first and last accepted line.
        @from_time ||= parsed.time
        @to_time = parsed.time

        if parsed.url =~ /(POST|GET) \/message-bus/
          @message_bus_requests += 1
          next
        end

        @ip_to_rails_duration.add(parsed.ip_address, parsed.rails_duration)

        username = parsed.username == "-" ? "[Anonymous]" : parsed.username
        @username_to_rails_duration.add(username, parsed.rails_duration, parsed.route)

        @route_to_rails_duration.add(parsed.route, parsed.rails_duration, parsed.is_mobile? ? "mobile" : "desktop")

        @url_to_rails_duration.add(parsed.url, parsed.rails_duration)

        # A "duration" of 1 makes the running total a plain 404 count.
        @status_404_to_count.add(parsed.url, 1) if parsed.status == "404"
      end
    end

    self
  end

end
|
|
@ -1,162 +1,5 @@
|
|||
require 'date'
|
||||
|
||||
# Reads nginx access logs written in the `log_discourse` format (see the
# comment in LineParser) and accumulates request statistics keyed by IP
# address, username, route and URL.
class LogAnalyzer

  # Holds the fields extracted from a single access-log line.
  class LineParser

    # log_format log_discourse '[$time_local] $remote_addr "$request" "$http_user_agent" "$sent_http_x_discourse_route" $status $bytes_sent "$http_referer" $upstream_response_time $request_time "$sent_http_x_discourse_username"';

    attr_accessor :time, :ip_address, :url, :route, :user_agent, :rails_duration, :total_duration,
                  :username, :status, :bytes_sent, :referer

    PATTERN = /\[(.*)\] (\S+) \"(.*)\" \"(.*)\" \"(.*)\" ([0-9]+) ([0-9]+) \"(.*)\" ([0-9.]+) ([0-9.]+) "(.*)"/

    TIME_FORMAT = "%d/%b/%Y:%H:%M:%S %Z"

    # Request verbs that get appended to the route name, e.g. "topics/update (PUT)".
    ANNOTATED_VERBS = %w[POST PUT].freeze

    # Builds a LineParser from one raw log line.
    #
    # When the line does not match PATTERN every string field stays nil and
    # both durations are 0.0; callers can detect that case through `time`.
    #
    # @param line [String] a raw access-log line
    # @return [LineParser]
    def self.parse(line)
      result = new
      _, result.time, result.ip_address, result.url, result.user_agent,
        result.route, result.status, result.bytes_sent, result.referer,
        result.rails_duration, result.total_duration, result.username = line.match(PATTERN).to_a

      # nil.to_f is 0.0, so unmatched lines end up with zero durations.
      result.rails_duration = result.rails_duration.to_f
      result.total_duration = result.total_duration.to_f

      if result.url
        # `url` holds the whole request line ("VERB /path HTTP/x"). Take the
        # first token as the verb; slicing a fixed four characters would give
        # "PUT " for PUT requests and never equal "PUT".
        verb = result.url[/\A\S+/]
        result.route += " (#{verb})" if ANNOTATED_VERBS.include?(verb)

        result.url = sanitize_url(result.url)
      end

      result
    end

    # Truthy when the user agent contains Mobile, Android or webOS and does
    # not contain iPad, "Nexus 7" or "Nexus 10".
    def is_mobile?
      user_agent =~ /Mobile|Android|webOS/ && !(user_agent =~ /iPad|Nexus (7|10)/)
    end

    # @return [DateTime, nil] `time` parsed with TIME_FORMAT, or nil when the
    #   line had no time
    def parsed_time
      DateTime.strptime(time, TIME_FORMAT) if time
    end

    # Replaces the value of every `api_key=` parameter with "[FILTERED]".
    #
    # The replacement must be a literal: a `\1` back-reference would write the
    # captured key value back into the URL and leak the secret.
    #
    # This is a singleton method, so a bare `private` keyword would not hide
    # it; it is intentionally left callable as before.
    #
    # @param url [String]
    # @return [String] a new string with the key values masked
    def self.sanitize_url(url)
      url.gsub(/api_key=([\w.\-]+)/, 'api_key=[FILTERED]')
    end
  end

  attr_reader :total_requests, :message_bus_requests, :filenames,
              :ip_to_rails_duration, :username_to_rails_duration,
              :route_to_rails_duration, :url_to_rails_duration,
              :status_404_to_count, :from_time, :to_time

  # Convenience wrapper: builds an analyzer and runs it.
  #
  # @param filenames [Array<String>] paths of the log files to read
  # @param args [Hash] options; only :limit is read (see #analyze)
  # @return [LogAnalyzer] the analyzer after processing all files
  def self.analyze(filenames, args = {})
    new(filenames, args).analyze
  end

  # Accumulates, per id, a running total, a hit count and optionally a
  # breakdown of that id by a secondary "aggregate" key.
  class Aggeregator

    # :duration (default) sums durations per aggregate key, :count counts hits.
    attr_accessor :aggregate_type

    def initialize
      @data = {}
      @aggregate_type = :duration
    end

    # Records one observation.
    #
    # @param id [Object] key to accumulate under
    # @param duration [Numeric] amount added to the running total for `id`
    # @param aggregate [Object, nil] optional secondary key for the breakdown
    def add(id, duration, aggregate = nil)
      # Layout of each entry: [total, hits, optional breakdown hash].
      ary = (@data[id] ||= [0, 0])
      ary[0] += duration
      ary[1] += 1

      return if aggregate.nil?

      ary[2] ||= Hash.new(0)
      if @aggregate_type == :duration
        ary[2][aggregate] += duration
      elsif @aggregate_type == :count
        ary[2][aggregate] += 1
      end
    end

    # Returns the `n` entries with the largest totals, largest first.
    #
    # Each row is [id_as_string, total, hits] plus, when a breakdown exists, a
    # fourth element: the return value of `aggregator_formatter` (called with
    # the breakdown hash, total and hits) or, without a formatter, the five
    # largest breakdown entries rendered as "key(value)" joined by spaces.
    #
    # @param n [Integer]
    # @param aggregator_formatter [#call, nil]
    # @return [Array<Array>]
    def top(n, aggregator_formatter = nil)
      @data.sort { |a, b| b[1][0] <=> a[1][0] }.first(n).map do |metric, ary|
        metric = metric.to_s
        metric = "[empty]" if metric.length == 0
        result = [metric, ary[0], ary[1]]

        # handle aggregate
        if ary[2]
          if aggregator_formatter
            result.push aggregator_formatter.call(ary[2], ary[0], ary[1])
          else
            breakdown = ary[2].sort { |a, b| b[1] <=> a[1] }.first(5).map do |k, v|
              v = "%.2f" % v if Float === v
              "#{k}(#{v})"
            end
            result.push breakdown.join(" ")
          end
        end

        result
      end
    end
  end

  # @param filenames [Array<String>] paths of the log files to read
  # @param args [Hash] options; :limit is stored and used by #analyze
  def initialize(filenames, args = {})
    @filenames = filenames
    @ip_to_rails_duration = Aggeregator.new
    @username_to_rails_duration = Aggeregator.new

    @route_to_rails_duration = Aggeregator.new
    @route_to_rails_duration.aggregate_type = :count

    @url_to_rails_duration = Aggeregator.new
    @status_404_to_count = Aggeregator.new

    @total_requests = 0
    @message_bus_requests = 0
    @limit = args[:limit]
  end

  # Reads every file line by line and fills the aggregators.
  #
  # Every line counts towards `total_requests`, including lines that fail to
  # parse. Lines without a time are skipped, as are lines older than `@limit`
  # minutes when a limit was given. Message-bus requests are counted
  # separately and excluded from the aggregators.
  #
  # @return [LogAnalyzer] self
  def analyze
    now = DateTime.now

    @filenames.each do |filename|
      # File.foreach closes the file once iteration ends.
      File.foreach(filename) do |line|
        @total_requests += 1
        parsed = LineParser.parse(line)

        next unless parsed.time
        # DateTime subtraction yields days; * 24 * 60 converts to minutes.
        next if @limit && ((now - parsed.parsed_time) * 24 * 60).to_i > @limit

        # Raw time strings of the first and last accepted line.
        @from_time ||= parsed.time
        @to_time = parsed.time

        if parsed.url =~ /(POST|GET) \/message-bus/
          @message_bus_requests += 1
          next
        end

        @ip_to_rails_duration.add(parsed.ip_address, parsed.rails_duration)

        username = parsed.username == "-" ? "[Anonymous]" : parsed.username
        @username_to_rails_duration.add(username, parsed.rails_duration, parsed.route)

        @route_to_rails_duration.add(parsed.route, parsed.rails_duration, parsed.is_mobile? ? "mobile" : "desktop")

        @url_to_rails_duration.add(parsed.url, parsed.rails_duration)

        # A "duration" of 1 makes the running total a plain 404 count.
        @status_404_to_count.add(parsed.url, 1) if parsed.status == "404"
      end
    end

    self
  end

end
|
||||
require_relative '../lib/log_analyzer'
|
||||
|
||||
args = ARGV.dup
|
||||
|
||||
|
|
|
@ -0,0 +1,13 @@
|
|||
require 'rails_helper'
|
||||
require_relative '../lib/log_analyzer'
|
||||
|
||||
# Checks that LineParser.parse masks the api_key query parameter in the
# request line it stores in `url`.
describe LogAnalyzer::LineParser do
  describe '.parse' do
    # The parsed form of `line`, evaluated lazily per example.
    subject(:parsed_line) { described_class.parse(line) }

    let(:line) { '[22/Sep/2016:07:32:00 +0000] 172.0.0.1 "GET /about.json?api_username=system&api_key=1234567 HTTP/1.1" "Some usename" "about/index" 200 1641 "-" 0.014 0.014 "system"' }

    it "should filter out the api_key" do
      expect(parsed_line.url).to eq('GET /about.json?api_username=system&api_key=[FILTERED] HTTP/1.1')
    end
  end
end
|
Loading…
Reference in New Issue