require 'rails_helper' describe SearchIndexer do let(:post_id) { 99 } it 'correctly indexes chinese' do SiteSetting.default_locale = 'zh_CN' data = "你好世界" expect(data.split(" ").length).to eq(1) SearchIndexer.update_posts_index(post_id, "你好世界", "", "", nil) raw_data = PostSearchData.where(post_id: post_id).pluck(:raw_data)[0] expect(raw_data.split(' ').length).to eq(2) end it 'extract youtube title' do html = "
" scrubbed = SearchIndexer::HtmlScrubber.scrub(html) expect(scrubbed).to eq(" Metallica Mixer Explains Missing Bass on 'And Justice for All' [Exclusive] ") end it 'extract a link' do html = "link" scrubbed = SearchIndexer::HtmlScrubber.scrub(html) expect(scrubbed).to eq(" http://meta.discourse.org/ link ") end it 'removes diacritics' do html = "HELLO Hétérogénéité Здравствуйте هتاف للترحيب 你好
" scrubbed = SearchIndexer::HtmlScrubber.scrub(html, strip_diacritics: true) expect(scrubbed).to eq(" HELLO Heterogeneite Здравствуите هتاف للترحيب 你好 ") end it "doesn't index local files" do html = <<~HTML