2015-10-11 17:41:23 +08:00
|
|
|
require 'rails_helper'
|
2014-06-24 15:10:56 +08:00
|
|
|
|
2016-12-22 10:13:14 +08:00
|
|
|
describe SearchIndexer do
|
2017-08-16 19:38:34 +08:00
|
|
|
let(:post_id) { 99 }
|
2014-06-24 15:10:56 +08:00
|
|
|
it 'correctly indexes chinese' do
|
|
|
|
SiteSetting.default_locale = 'zh_CN'
|
|
|
|
data = "你好世界"
|
2015-01-06 00:04:23 +08:00
|
|
|
expect(data.split(" ").length).to eq(1)
|
2014-06-24 15:10:56 +08:00
|
|
|
|
2018-02-20 11:41:00 +08:00
|
|
|
SearchIndexer.update_posts_index(post_id, "你好世界", "", "", nil)
|
2014-06-24 15:10:56 +08:00
|
|
|
|
2017-08-16 19:38:34 +08:00
|
|
|
raw_data = PostSearchData.where(post_id: post_id).pluck(:raw_data)[0]
|
2016-08-11 03:40:58 +08:00
|
|
|
expect(raw_data.split(' ').length).to eq(2)
|
2014-06-24 15:10:56 +08:00
|
|
|
end
|
|
|
|
|
2018-04-26 13:46:52 +08:00
|
|
|
it 'extract youtube title' do
|
|
|
|
html = "<div class=\"lazyYT\" data-youtube-id=\"lmFgeFh2nlw\" data-youtube-title=\"Metallica Mixer Explains Missing Bass on 'And Justice for All' [Exclusive]\" data-width=\"480\" data-height=\"270\" data-parameters=\"feature=oembed&wmode=opaque\"></div>"
|
|
|
|
|
|
|
|
scrubbed = SearchIndexer::HtmlScrubber.scrub(html)
|
|
|
|
|
|
|
|
expect(scrubbed).to eq(" Metallica Mixer Explains Missing Bass on 'And Justice for All' [Exclusive] ")
|
|
|
|
end
|
|
|
|
|
2018-08-20 08:39:19 +08:00
|
|
|
it 'extract a link' do
|
|
|
|
html = "<a href='http://meta.discourse.org/'>link</a>"
|
|
|
|
|
|
|
|
scrubbed = SearchIndexer::HtmlScrubber.scrub(html)
|
|
|
|
|
|
|
|
expect(scrubbed).to eq(" http://meta.discourse.org/ link ")
|
|
|
|
end
|
|
|
|
|
2018-08-23 23:13:52 +08:00
|
|
|
it 'removes diacritics' do
|
2018-08-24 06:38:44 +08:00
|
|
|
html = "<p>HELLO Hétérogénéité Здравствуйте هتاف للترحيب 你好</p>"
|
2018-08-23 23:13:52 +08:00
|
|
|
|
2018-08-31 09:46:55 +08:00
|
|
|
scrubbed = SearchIndexer::HtmlScrubber.scrub(html, strip_diacritics: true)
|
2018-08-23 23:13:52 +08:00
|
|
|
|
2018-08-24 06:38:44 +08:00
|
|
|
expect(scrubbed).to eq(" HELLO Heterogeneite Здравствуите هتاف للترحيب 你好 ")
|
2018-08-23 23:13:52 +08:00
|
|
|
end
|
|
|
|
|
2017-08-16 19:38:34 +08:00
|
|
|
it 'correctly indexes a post according to version' do
|
|
|
|
# Preparing so that they can be indexed to right version
|
2018-02-20 11:41:00 +08:00
|
|
|
SearchIndexer.update_posts_index(post_id, "dummy", "", nil, nil)
|
2017-08-16 19:38:34 +08:00
|
|
|
PostSearchData.find_by(post_id: post_id).update_attributes!(version: -1)
|
2014-06-24 15:10:56 +08:00
|
|
|
|
2017-08-16 19:38:34 +08:00
|
|
|
data = "<a>This</a> is a test"
|
2018-02-20 11:41:00 +08:00
|
|
|
SearchIndexer.update_posts_index(post_id, "", "", nil, data)
|
2014-06-24 15:10:56 +08:00
|
|
|
|
2017-08-16 19:38:34 +08:00
|
|
|
raw_data, locale, version = PostSearchData.where(post_id: post_id).pluck(:raw_data, :locale, :version)[0]
|
2016-08-11 03:40:58 +08:00
|
|
|
expect(raw_data).to eq("This is a test")
|
|
|
|
expect(locale).to eq("en")
|
2017-08-16 19:38:34 +08:00
|
|
|
expect(version).to eq(Search::INDEX_VERSION)
|
2014-06-24 15:10:56 +08:00
|
|
|
|
2018-02-20 11:41:00 +08:00
|
|
|
SearchIndexer.update_posts_index(post_id, "tester", "", nil, nil)
|
2014-06-24 15:10:56 +08:00
|
|
|
|
2017-08-16 19:38:34 +08:00
|
|
|
raw_data = PostSearchData.where(post_id: post_id).pluck(:raw_data)[0]
|
2016-08-11 03:40:58 +08:00
|
|
|
expect(raw_data).to eq("tester")
|
2014-06-24 15:10:56 +08:00
|
|
|
end
|
|
|
|
end
|