Search Refactor: Remove some manual SQL, make search data tables more idomatic Rails/AR

This commit is contained in:
Robin Ward 2013-05-22 15:33:33 -04:00
parent b9a310f4b1
commit 7a31630837
10 changed files with 72 additions and 30 deletions

View File

@ -27,6 +27,8 @@ class Category < ActiveRecord::Base
after_destroy :invalidate_site_cache after_destroy :invalidate_site_cache
after_destroy :publish_categories_list after_destroy :publish_categories_list
has_one :category_search_data
scope :latest, ->{ order('topic_count desc') } scope :latest, ->{ order('topic_count desc') }
scope :secured, ->(guardian = nil) { scope :secured, ->(guardian = nil) {

View File

@ -0,0 +1,5 @@
class CategorySearchData < ActiveRecord::Base
belongs_to :category
validates_presence_of :search_data
end

View File

@ -25,6 +25,8 @@ class Post < ActiveRecord::Base
has_many :replies, through: :post_replies has_many :replies, through: :post_replies
has_many :post_actions has_many :post_actions
has_one :post_search_data
validates_presence_of :raw, :user_id, :topic_id validates_presence_of :raw, :user_id, :topic_id
validates :raw, stripped_length: { in: -> { SiteSetting.post_length } } validates :raw, stripped_length: { in: -> { SiteSetting.post_length } }
validate :raw_quality validate :raw_quality

View File

@ -0,0 +1,5 @@
class PostSearchData < ActiveRecord::Base
belongs_to :post
validates_presence_of :search_data
end

View File

@ -5,32 +5,33 @@ class SearchObserver < ActiveRecord::Observer
HtmlScrubber.scrub(html) HtmlScrubber.scrub(html)
end end
def self.update_index(table, id, idx) def self.update_index(table, id, search_data)
Post.exec_sql("delete from #{table} where id = ?", id) table_name = "#{table}_search_data"
sql = "insert into #{table} (id, search_data) values (?, to_tsvector('english', ?))" foreign_key = "#{table}_id"
begin
Post.exec_sql(sql, id, idx) # Would be nice to use AR here but not sure how to execut Postgres functions
# when inserting data like this.
rows = Post.exec_sql_row_count("UPDATE #{table_name} SET search_data = TO_TSVECTOR('english', ?) WHERE #{foreign_key} = ?", search_data, id)
if rows == 0
Post.exec_sql("INSERT INTO #{table_name} (#{foreign_key}, search_data) VALUES (?, TO_TSVECTOR('english', ?))", id, search_data)
end
rescue rescue
# don't allow concurrency to mess up saving a post # don't allow concurrency to mess up saving a post
end end
end
def self.update_posts_index(post_id, cooked, title, category) def self.update_posts_index(post_id, cooked, title, category)
idx = scrub_html_for_search(cooked) search_data = scrub_html_for_search(cooked) << " " << title
idx << " " << title search_data << " " << category if category
idx << " " << category if category update_index('post', post_id, search_data)
update_index('posts_search', post_id, idx)
end end
def self.update_users_index(user_id, username, name) def self.update_users_index(user_id, username, name)
idx = username.dup search_data = username.dup << " " << (name || "")
idx << " " << (name || "") update_index('user', user_id, search_data)
update_index('users_search', user_id, idx)
end end
def self.update_categories_index(category_id, name) def self.update_categories_index(category_id, name)
update_index('categories_search', category_id, name) update_index('category', category_id, name)
end end
def after_save(obj) def after_save(obj)

View File

@ -33,6 +33,8 @@ class User < ActiveRecord::Base
has_many :groups, through: :group_users has_many :groups, through: :group_users
has_many :secure_categories, through: :groups, source: :categories has_many :secure_categories, through: :groups, source: :categories
has_one :user_search_data
validates_presence_of :username validates_presence_of :username
validates_presence_of :email validates_presence_of :email
validates_uniqueness_of :email validates_uniqueness_of :email

View File

@ -0,0 +1,4 @@
class UserSearchData < ActiveRecord::Base
belongs_to :user
validates_presence_of :search_data
end

View File

@ -0,0 +1,19 @@
class RenameSearchTables < ActiveRecord::Migration
def up
rename_table :users_search, :user_search_data
rename_column :user_search_data, :id, :user_id
rename_table :categories_search, :category_search_data
rename_column :category_search_data, :id, :category_id
rename_table :posts_search, :post_search_data
rename_column :post_search_data, :id, :post_id
end
def down
rename_table :user_search_data, :users_search
rename_column :users_search, :user_id, :id
rename_table :category_search_data, :categories_search
rename_column :categories_search, :category_id, :id
rename_table :post_search_data, :posts_search
rename_column :posts_search, :post_id, :id
end
end

View File

@ -150,7 +150,7 @@ class Search
c.color, c.color,
c.text_color c.text_color
FROM categories AS c FROM categories AS c
JOIN categories_search s on s.id = c.id JOIN category_search_data s on s.category_id = c.id
/*where*/ /*where*/
ORDER BY topics_month desc ORDER BY topics_month desc
LIMIT :limit LIMIT :limit
@ -171,7 +171,7 @@ SQL
NULL AS color, NULL AS color,
NULL AS text_color NULL AS text_color
FROM users AS u FROM users AS u
JOIN users_search s on s.id = u.id JOIN user_search_data s on s.user_id = u.id
WHERE s.search_data @@ TO_TSQUERY(:locale, :query) WHERE s.search_data @@ TO_TSQUERY(:locale, :query)
ORDER BY CASE WHEN u.username_lower = lower(:orig) then 0 else 1 end, last_posted_at desc ORDER BY CASE WHEN u.username_lower = lower(:orig) then 0 else 1 end, last_posted_at desc
LIMIT :limit" LIMIT :limit"
@ -183,7 +183,7 @@ SQL
/*select*/ /*select*/
FROM topics AS ft FROM topics AS ft
/*join*/ /*join*/
JOIN posts_search s on s.id = p.id JOIN post_search_data s on s.post_id = p.id
LEFT JOIN categories c ON c.id = ft.category_id LEFT JOIN categories c ON c.id = ft.category_id
/*where*/ /*where*/
ORDER BY ORDER BY
@ -234,18 +234,18 @@ SQL
new_slug = Slug.for(row['title']) new_slug = Slug.for(row['title'])
new_slug = "topic" if new_slug.blank? new_slug = "topic" if new_slug.blank?
row['url'].gsub!('slug', new_slug) row['url'].gsub!('slug', new_slug)
elsif type == 'user'
row['avatar_template'] = User.avatar_template(row['email'])
end end
# Add avatars for users
row['avatar_template'] = User.avatar_template(row['email']) if type == 'user'
# Remove attributes when we know they don't matter # Remove attributes when we know they don't matter
row.delete('email') row.delete('email')
row.delete('color') unless type == 'category' unless type == 'category'
row.delete('text_color') unless type == 'category' row.delete('color')
row.delete('text_color')
end
grouped[type] ||= [] grouped[type] = (grouped[type] || []) << row
grouped[type] << row
end end
grouped.map do |type, results| grouped.map do |type, results|

View File

@ -22,7 +22,7 @@ describe Search do
@category = Fabricate(:category, name: 'america') @category = Fabricate(:category, name: 'america')
@topic = Fabricate(:topic, title: 'sam saffron test topic', category: @category) @topic = Fabricate(:topic, title: 'sam saffron test topic', category: @category)
@post = Fabricate(:post, topic: @topic, raw: 'this <b>fun test</b> <img src="bla" title="my image">') @post = Fabricate(:post, topic: @topic, raw: 'this <b>fun test</b> <img src="bla" title="my image">')
@indexed = Topic.exec_sql("select search_data from posts_search where id = #{@post.id}").first["search_data"] @indexed = @post.post_search_data.search_data
end end
it "should include body in index" do it "should include body in index" do
@indexed.should =~ /fun/ @indexed.should =~ /fun/
@ -37,7 +37,9 @@ describe Search do
it "should pick up on title updates" do it "should pick up on title updates" do
@topic.title = "harpi is the new title" @topic.title = "harpi is the new title"
@topic.save! @topic.save!
@indexed = Topic.exec_sql("select search_data from posts_search where id = #{@post.id}").first["search_data"] @post.post_search_data.reload
@indexed = @post.post_search_data.search_data
@indexed.should =~ /harpi/ @indexed.should =~ /harpi/
end end
@ -46,7 +48,7 @@ describe Search do
context 'user indexing observer' do context 'user indexing observer' do
before do before do
@user = Fabricate(:user, username: 'fred', name: 'bob jones') @user = Fabricate(:user, username: 'fred', name: 'bob jones')
@indexed = User.exec_sql("select search_data from users_search where id = #{@user.id}").first["search_data"] @indexed = @user.user_search_data.search_data
end end
it "should pick up on username" do it "should pick up on username" do
@ -61,7 +63,7 @@ describe Search do
context 'category indexing observer' do context 'category indexing observer' do
before do before do
@category = Fabricate(:category, name: 'america') @category = Fabricate(:category, name: 'america')
@indexed = Topic.exec_sql("select search_data from categories_search where id = #{@category.id}").first["search_data"] @indexed = @category.category_search_data.search_data
end end
it "should pick up on name" do it "should pick up on name" do