require 'rails_helper' describe SearchIndexer do let(:post_id) { 99 } def scrub(html, strip_diacritics: false) SearchIndexer.scrub_html_for_search(html, strip_diacritics: strip_diacritics) end it 'correctly indexes chinese' do SiteSetting.default_locale = 'zh_CN' data = "你好世界" expect(data.split(" ").length).to eq(1) SearchIndexer.update_posts_index(post_id, "你好世界", "", "", nil) raw_data = PostSearchData.where(post_id: post_id).pluck(:raw_data)[0] expect(raw_data.split(' ').length).to eq(2) end it 'extract youtube title' do html = "
" scrubbed = scrub(html) expect(scrubbed).to eq("Metallica Mixer Explains Missing Bass on 'And Justice for All' [Exclusive]") end it 'extract a link' do html = "link" scrubbed = scrub(html) expect(scrubbed).to eq("http://meta.discourse.org/ link") end it 'uses ignore_accent setting to strip diacritics' do html = "

HELLO Hétérogénéité Здравствуйте هتاف للترحيب 你好

" SiteSetting.search_ignore_accents = true scrubbed = SearchIndexer.scrub_html_for_search(html) expect(scrubbed).to eq("HELLO Heterogeneite Здравствуите هتاف للترحيب 你好") SiteSetting.search_ignore_accents = false scrubbed = SearchIndexer.scrub_html_for_search(html) expect(scrubbed).to eq("HELLO Hétérogénéité Здравствуйте هتاف للترحيب 你好") end it "doesn't index local files" do html = <<~HTML

Discourse

51%20PM

HTML scrubbed = scrub(html) expect(scrubbed).to eq("Discourse 51%20PM Untitled design (21).jpg Untitled%20design%20(21) Untitled design (21).jpg 1280x1136 472 KB") end it 'correctly indexes a post according to version' do # Preparing so that they can be indexed to right version SearchIndexer.update_posts_index(post_id, "dummy", "", nil, nil) PostSearchData.find_by(post_id: post_id).update_attributes!(version: -1) data = "This is a test" SearchIndexer.update_posts_index(post_id, "", "", nil, data) raw_data, locale, version = PostSearchData.where(post_id: post_id).pluck(:raw_data, :locale, :version)[0] expect(raw_data).to eq("This is a test") expect(locale).to eq("en") expect(version).to eq(Search::INDEX_VERSION) SearchIndexer.update_posts_index(post_id, "tester", "", nil, nil) raw_data = PostSearchData.where(post_id: post_id).pluck(:raw_data)[0] expect(raw_data).to eq("tester") end end