mirror of
https://github.com/discourse/discourse.git
synced 2024-11-30 13:05:17 +08:00
9199c52e5e
Add categories to the serialized search results together with the topics when lazy load categories is enabled. This is necessary in order for the results to be rendered correctly and display the category information.
1525 lines
44 KiB
Ruby
1525 lines
44 KiB
Ruby
# frozen_string_literal: true
|
||
|
||
class Search
|
||
DIACRITICS ||= /([\u0300-\u036f]|[\u1AB0-\u1AFF]|[\u1DC0-\u1DFF]|[\u20D0-\u20FF])/
|
||
HIGHLIGHT_CSS_CLASS = "search-highlight"
|
||
|
||
cattr_accessor :preloaded_topic_custom_fields
|
||
self.preloaded_topic_custom_fields = Set.new
|
||
|
||
def self.on_preload(&blk)
|
||
(@preload ||= Set.new) << blk
|
||
end
|
||
|
||
def self.preload(results, object)
|
||
@preload.each { |preload| preload.call(results, object) } if @preload
|
||
end
|
||
|
||
def self.per_facet
|
||
5
|
||
end
|
||
|
||
def self.per_filter
|
||
SiteSetting.search_page_size
|
||
end
|
||
|
||
def self.facets
|
||
%w[topic category user private_messages tags all_topics exclude_topics]
|
||
end
|
||
|
||
def self.ts_config(locale = SiteSetting.default_locale)
|
||
# if adding a text search configuration, you should check PG beforehand:
|
||
# SELECT cfgname FROM pg_ts_config;
|
||
# As an aside, dictionaries can be listed by `\dFd`, the
|
||
# physical locations are in /usr/share/postgresql/<version>/tsearch_data.
|
||
# But it may not appear there based on pg extension configuration.
|
||
# base docker config
|
||
#
|
||
case locale.split("_")[0].to_sym
|
||
when :da
|
||
"danish"
|
||
when :nl
|
||
"dutch"
|
||
when :en
|
||
"english"
|
||
when :fi
|
||
"finnish"
|
||
when :fr
|
||
"french"
|
||
when :de
|
||
"german"
|
||
when :hu
|
||
"hungarian"
|
||
when :it
|
||
"italian"
|
||
when :nb
|
||
"norwegian"
|
||
when :pt
|
||
"portuguese"
|
||
when :ro
|
||
"romanian"
|
||
when :ru
|
||
"russian"
|
||
when :es
|
||
"spanish"
|
||
when :sv
|
||
"swedish"
|
||
when :tr
|
||
"turkish"
|
||
else
|
||
"simple" # use the 'simple' stemmer for other languages
|
||
end
|
||
end
|
||
|
||
def self.wrap_unaccent(str)
|
||
SiteSetting.search_ignore_accents ? "unaccent(#{str})" : str
|
||
end
|
||
|
||
def self.segment_chinese?
|
||
%w[zh_TW zh_CN].include?(SiteSetting.default_locale) || SiteSetting.search_tokenize_chinese
|
||
end
|
||
|
||
def self.segment_japanese?
|
||
SiteSetting.default_locale == "ja" || SiteSetting.search_tokenize_japanese
|
||
end
|
||
|
||
def self.japanese_punctuation_regexp
|
||
# Regexp adapted from https://github.com/6/tiny_segmenter/blob/15a5b825993dfd2c662df3766f232051716bef5b/lib/tiny_segmenter.rb#L7
|
||
@japanese_punctuation_regexp ||=
|
||
Regexp.compile("[-–—―.。・()()[]{}{}【】⟨⟩、、,,،…‥〽「」『』〜~!!::??\"'|__“”‘’;/⁄/«»]")
|
||
end
|
||
|
||
def self.clean_term(term)
|
||
term = term.to_s.dup
|
||
|
||
# Removes any zero-width characters from search terms
|
||
term.gsub!(/[\u200B-\u200D\uFEFF]/, "")
|
||
|
||
# Replace curly quotes to regular quotes
|
||
term.gsub!(/[\u201c\u201d]/, '"')
|
||
|
||
# Replace fancy apostophes to regular apostophes
|
||
term.gsub!(/[\u02b9\u02bb\u02bc\u02bd\u02c8\u2018\u2019\u201b\u2032\uff07]/, "'")
|
||
|
||
term
|
||
end
|
||
|
||
def self.prepare_data(search_data, purpose = nil)
|
||
data = search_data.dup
|
||
data.force_encoding("UTF-8")
|
||
data = clean_term(data)
|
||
|
||
if purpose != :topic
|
||
if segment_chinese?
|
||
require "cppjieba_rb" unless defined?(CppjiebaRb)
|
||
|
||
segmented_data = []
|
||
|
||
# We need to split up the string here because Cppjieba has a bug where text starting with numeric chars will
|
||
# be split into two segments. For example, '123abc' becomes '123' and 'abc' after segmentation.
|
||
data.scan(/(?<chinese>[\p{Han}。,、“”《》…\.:?!;()]+)|([^\p{Han}]+)/) do
|
||
match_data = $LAST_MATCH_INFO
|
||
|
||
if match_data[:chinese]
|
||
segments = CppjiebaRb.segment(match_data.to_s, mode: :mix)
|
||
|
||
segments = CppjiebaRb.filter_stop_word(segments) if ts_config != "english"
|
||
|
||
segments = segments.filter { |s| s.present? }
|
||
segmented_data << segments.join(" ")
|
||
else
|
||
segmented_data << match_data.to_s.squish
|
||
end
|
||
end
|
||
|
||
data = segmented_data.join(" ")
|
||
elsif segment_japanese?
|
||
data.gsub!(japanese_punctuation_regexp, " ")
|
||
data = TinyJapaneseSegmenter.segment(data)
|
||
data = data.filter { |s| s.present? }
|
||
data = data.join(" ")
|
||
else
|
||
data.squish!
|
||
end
|
||
end
|
||
|
||
data.gsub!(/\S+/) do |str|
|
||
if str =~ %r{\A["]?((https?://)[\S]+)["]?\z}
|
||
begin
|
||
uri = URI.parse(Regexp.last_match[1])
|
||
uri.query = nil
|
||
str = uri.to_s
|
||
rescue URI::Error
|
||
# don't fail if uri does not parse
|
||
end
|
||
end
|
||
|
||
str
|
||
end
|
||
|
||
data
|
||
end
|
||
|
||
def self.word_to_date(str)
|
||
return Time.zone.now.beginning_of_day.days_ago(str.to_i) if str =~ /\A[0-9]{1,3}\z/
|
||
|
||
if str =~ /\A([12][0-9]{3})(-([0-1]?[0-9]))?(-([0-3]?[0-9]))?\z/
|
||
year = $1.to_i
|
||
month = $2 ? $3.to_i : 1
|
||
day = $4 ? $5.to_i : 1
|
||
|
||
return if day == 0 || month == 0 || day > 31 || month > 12
|
||
|
||
return(
|
||
begin
|
||
Time.zone.parse("#{year}-#{month}-#{day}")
|
||
rescue ArgumentError
|
||
end
|
||
)
|
||
end
|
||
|
||
return Time.zone.now.beginning_of_day.yesterday if str.downcase == "yesterday"
|
||
|
||
titlecase = str.downcase.titlecase
|
||
|
||
if Date::DAYNAMES.include?(titlecase)
|
||
return Time.zone.now.beginning_of_week(str.downcase.to_sym)
|
||
end
|
||
|
||
if idx = (Date::MONTHNAMES.find_index(titlecase) || Date::ABBR_MONTHNAMES.find_index(titlecase))
|
||
delta = Time.zone.now.month - idx
|
||
delta += 12 if delta < 0
|
||
Time.zone.now.beginning_of_month.months_ago(delta)
|
||
end
|
||
end
|
||
|
||
def self.min_post_id_no_cache
|
||
return 0 unless SiteSetting.search_prefer_recent_posts?
|
||
|
||
offset, has_more =
|
||
Post
|
||
.unscoped
|
||
.order("id desc")
|
||
.offset(SiteSetting.search_recent_posts_size - 1)
|
||
.limit(2)
|
||
.pluck(:id)
|
||
|
||
has_more ? offset : 0
|
||
end
|
||
|
||
def self.min_post_id(opts = nil)
|
||
return 0 unless SiteSetting.search_prefer_recent_posts?
|
||
|
||
# It can be quite slow to count all the posts so let's cache it
|
||
Discourse
|
||
.cache
|
||
.fetch("search-min-post-id:#{SiteSetting.search_recent_posts_size}", expires_in: 1.week) do
|
||
min_post_id_no_cache
|
||
end
|
||
end
|
||
|
||
attr_accessor :term
|
||
attr_reader :clean_term, :guardian
|
||
|
||
def initialize(term, opts = nil)
|
||
@opts = opts || {}
|
||
@guardian = @opts[:guardian] || Guardian.new
|
||
@search_context = @opts[:search_context]
|
||
@blurb_length = @opts[:blurb_length]
|
||
@valid = true
|
||
@page = @opts[:page]
|
||
@search_all_pms = false
|
||
|
||
term = Search.clean_term(term)
|
||
|
||
@clean_term = term
|
||
@in_title = false
|
||
|
||
term = process_advanced_search!(term)
|
||
if !@order &&
|
||
SiteSetting.search_default_sort_order !=
|
||
SearchSortOrderSiteSetting.value_from_id(:relevance)
|
||
@order = SearchSortOrderSiteSetting.id_from_value(SiteSetting.search_default_sort_order)
|
||
end
|
||
|
||
if term.present?
|
||
@term = Search.prepare_data(term, Topic === @search_context ? :topic : nil)
|
||
@original_term = Search.escape_string(@term)
|
||
end
|
||
|
||
if @search_pms || @search_all_pms || @opts[:type_filter] == "private_messages"
|
||
@opts[:type_filter] = "private_messages"
|
||
@search_context ||= @guardian.user
|
||
|
||
unless @search_context.present? && @guardian.can_see_private_messages?(@search_context.id)
|
||
raise Discourse::InvalidAccess.new
|
||
end
|
||
end
|
||
|
||
@opts[:type_filter] = "all_topics" if @search_all_topics && @guardian.user
|
||
|
||
@results =
|
||
GroupedSearchResults.new(
|
||
type_filter: @opts[:type_filter],
|
||
term: clean_term,
|
||
blurb_term: term,
|
||
search_context: @search_context,
|
||
blurb_length: @blurb_length,
|
||
is_header_search: !use_full_page_limit,
|
||
can_lazy_load_categories: @guardian.can_lazy_load_categories?,
|
||
)
|
||
end
|
||
|
||
def limit
|
||
if use_full_page_limit
|
||
Search.per_filter + 1
|
||
else
|
||
Search.per_facet + 1
|
||
end
|
||
end
|
||
|
||
def offset
|
||
if @page && @opts[:type_filter].present?
|
||
(@page - 1) * Search.per_filter
|
||
else
|
||
0
|
||
end
|
||
end
|
||
|
||
def valid?
|
||
@valid
|
||
end
|
||
|
||
def use_full_page_limit
|
||
@opts[:search_type] == :full_page || Topic === @search_context
|
||
end
|
||
|
||
def self.execute(term, opts = nil)
|
||
self.new(term, opts).execute
|
||
end
|
||
|
||
# Query a term
|
||
def execute(readonly_mode: Discourse.readonly_mode?)
|
||
if log_query?(readonly_mode)
|
||
status, search_log_id =
|
||
SearchLog.log(
|
||
term: @clean_term,
|
||
search_type: @opts[:search_type],
|
||
ip_address: @opts[:ip_address],
|
||
user_id: @opts[:user_id],
|
||
)
|
||
@results.search_log_id = search_log_id unless status == :error
|
||
end
|
||
|
||
unless @filters.present? || @opts[:search_for_id]
|
||
min_length = min_search_term_length
|
||
terms = (@term || "").split(/\s(?=(?:[^"]|"[^"]*")*$)/).reject { |t| t.length < min_length }
|
||
|
||
if terms.blank?
|
||
@term = ""
|
||
@valid = false
|
||
return
|
||
end
|
||
end
|
||
|
||
# If the term is a number or url to a topic, just include that topic
|
||
if @opts[:search_for_id] && %w[topic private_messages all_topics].include?(@results.type_filter)
|
||
if @term =~ /\A\d+\z/
|
||
single_topic(@term.to_i)
|
||
else
|
||
if route = Discourse.route_for(@term)
|
||
if route[:controller] == "topics" && route[:action] == "show"
|
||
topic_id = (route[:id] || route[:topic_id]).to_i
|
||
single_topic(topic_id) if topic_id > 0
|
||
end
|
||
end
|
||
end
|
||
end
|
||
|
||
find_grouped_results if @results.posts.blank?
|
||
|
||
if preloaded_topic_custom_fields.present? && @results.posts.present?
|
||
topics = @results.posts.map(&:topic)
|
||
Topic.preload_custom_fields(topics, preloaded_topic_custom_fields)
|
||
end
|
||
|
||
Search.preload(@results, self)
|
||
|
||
@results
|
||
end
|
||
|
||
def self.advanced_order(trigger, &block)
|
||
(@advanced_orders ||= {})[trigger] = block
|
||
end
|
||
|
||
def self.advanced_orders
|
||
@advanced_orders
|
||
end
|
||
|
||
def self.advanced_filter(trigger, &block)
|
||
(@advanced_filters ||= {})[trigger] = block
|
||
end
|
||
|
||
def self.advanced_filters
|
||
@advanced_filters
|
||
end
|
||
|
||
def self.custom_topic_eager_load(tables = nil, &block)
|
||
(@custom_topic_eager_loads ||= []) << (tables || block)
|
||
end
|
||
|
||
def self.custom_topic_eager_loads
|
||
Array.wrap(@custom_topic_eager_loads)
|
||
end
|
||
|
||
advanced_filter(/\Ain:personal-direct\z/i) do |posts|
|
||
if @guardian.user
|
||
posts.joins("LEFT JOIN topic_allowed_groups tg ON posts.topic_id = tg.topic_id").where(
|
||
<<~SQL,
|
||
tg.id IS NULL
|
||
AND posts.topic_id IN (
|
||
SELECT tau.topic_id
|
||
FROM topic_allowed_users tau
|
||
JOIN topic_allowed_users tau2
|
||
ON tau2.topic_id = tau.topic_id
|
||
AND tau2.id != tau.id
|
||
WHERE tau.user_id = :user_id
|
||
GROUP BY tau.topic_id
|
||
HAVING COUNT(*) = 1
|
||
)
|
||
SQL
|
||
user_id: @guardian.user.id,
|
||
)
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Ain:all-pms\z/i) { |posts| posts.private_posts if @guardian.is_admin? }
|
||
|
||
advanced_filter(/\Ain:tagged\z/i) do |posts|
|
||
posts.where("EXISTS (SELECT 1 FROM topic_tags WHERE topic_tags.topic_id = posts.topic_id)")
|
||
end
|
||
|
||
advanced_filter(/\Ain:untagged\z/i) do |posts|
|
||
posts.joins(
|
||
"LEFT JOIN topic_tags ON
|
||
topic_tags.topic_id = posts.topic_id",
|
||
).where("topic_tags.id IS NULL")
|
||
end
|
||
|
||
advanced_filter(/\Astatus:open\z/i) do |posts|
|
||
posts.where("NOT topics.closed AND NOT topics.archived")
|
||
end
|
||
|
||
advanced_filter(/\Astatus:closed\z/i) { |posts| posts.where("topics.closed") }
|
||
|
||
advanced_filter(/\Astatus:public\z/i) do |posts|
|
||
category_ids = Category.where(read_restricted: false).pluck(:id)
|
||
|
||
posts.where("topics.category_id in (?)", category_ids)
|
||
end
|
||
|
||
advanced_filter(/\Astatus:archived\z/i) { |posts| posts.where("topics.archived") }
|
||
|
||
advanced_filter(/\Astatus:noreplies\z/i) { |posts| posts.where("topics.posts_count = 1") }
|
||
|
||
advanced_filter(/\Astatus:single_user\z/i) { |posts| posts.where("topics.participant_count = 1") }
|
||
|
||
advanced_filter(/\Aposts_count:(\d+)\z/i) do |posts, match|
|
||
posts.where("topics.posts_count = ?", match.to_i)
|
||
end
|
||
|
||
advanced_filter(/\Amin_post_count:(\d+)\z/i) do |posts, match|
|
||
posts.where("topics.posts_count >= ?", match.to_i)
|
||
end
|
||
|
||
advanced_filter(/\Amin_posts:(\d+)\z/i) do |posts, match|
|
||
posts.where("topics.posts_count >= ?", match.to_i)
|
||
end
|
||
|
||
advanced_filter(/\Amax_posts:(\d+)\z/i) do |posts, match|
|
||
posts.where("topics.posts_count <= ?", match.to_i)
|
||
end
|
||
|
||
advanced_filter(/\Ain:first|^f\z/i) { |posts| posts.where("posts.post_number = 1") }
|
||
|
||
advanced_filter(/\Ain:pinned\z/i) { |posts| posts.where("topics.pinned_at IS NOT NULL") }
|
||
|
||
advanced_filter(/\Ain:wiki\z/i) { |posts, match| posts.where(wiki: true) }
|
||
|
||
advanced_filter(/\Abadge:(.*)\z/i) do |posts, match|
|
||
badge_id = Badge.where("name ilike ? OR id = ?", match, match.to_i).pick(:id)
|
||
if badge_id
|
||
posts.where(
|
||
"posts.user_id IN (SELECT ub.user_id FROM user_badges ub WHERE ub.badge_id = ?)",
|
||
badge_id,
|
||
)
|
||
else
|
||
posts.where("1 = 0")
|
||
end
|
||
end
|
||
|
||
def post_action_type_filter(posts, post_action_type)
|
||
posts.where(
|
||
"posts.id IN (
|
||
SELECT pa.post_id FROM post_actions pa
|
||
WHERE pa.user_id = ? AND
|
||
pa.post_action_type_id = ? AND
|
||
deleted_at IS NULL
|
||
)",
|
||
@guardian.user.id,
|
||
post_action_type,
|
||
)
|
||
end
|
||
|
||
advanced_filter(/\Ain:(likes)\z/i) do |posts, match|
|
||
post_action_type_filter(posts, PostActionType.types[:like]) if @guardian.user
|
||
end
|
||
|
||
# NOTE: With polymorphic bookmarks it may make sense to possibly expand
|
||
# this at some point, as it only acts on posts at the moment. On the other
|
||
# hand, this may not be necessary, as the user bookmark list has advanced
|
||
# search based on a RegisteredBookmarkable's #search_query method.
|
||
advanced_filter(/\Ain:(bookmarks)\z/i) do |posts, match|
|
||
posts.where(<<~SQL, @guardian.user.id) if @guardian.user
|
||
posts.id IN (
|
||
SELECT bookmarkable_id FROM bookmarks
|
||
WHERE bookmarks.user_id = ? AND bookmarks.bookmarkable_type = 'Post'
|
||
)
|
||
SQL
|
||
end
|
||
|
||
advanced_filter(/\Ain:posted\z/i) do |posts|
|
||
posts.where("posts.user_id = ?", @guardian.user.id) if @guardian.user
|
||
end
|
||
|
||
advanced_filter(/\Ain:(created|mine)\z/i) do |posts|
|
||
posts.where(user_id: @guardian.user.id, post_number: 1) if @guardian.user
|
||
end
|
||
|
||
advanced_filter(/\Acreated:@(.*)\z/i) do |posts, match|
|
||
user_id = User.where(username_lower: match.downcase).pick(:id)
|
||
posts.where(user_id: user_id, post_number: 1)
|
||
end
|
||
|
||
advanced_filter(/\Ain:(watching|tracking)\z/i) do |posts, match|
|
||
if @guardian.user
|
||
level = TopicUser.notification_levels[match.downcase.to_sym]
|
||
posts.where(
|
||
"posts.topic_id IN (
|
||
SELECT tu.topic_id FROM topic_users tu
|
||
WHERE tu.user_id = :user_id AND
|
||
tu.notification_level >= :level
|
||
)",
|
||
user_id: @guardian.user.id,
|
||
level: level,
|
||
)
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Ain:seen\z/i) do |posts|
|
||
if @guardian.user
|
||
posts.joins(
|
||
"INNER JOIN post_timings ON
|
||
post_timings.topic_id = posts.topic_id
|
||
AND post_timings.post_number = posts.post_number
|
||
AND post_timings.user_id = #{ActiveRecord::Base.connection.quote(@guardian.user.id)}
|
||
",
|
||
)
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Ain:unseen\z/i) do |posts|
|
||
if @guardian.user
|
||
posts.joins(
|
||
"LEFT JOIN post_timings ON
|
||
post_timings.topic_id = posts.topic_id
|
||
AND post_timings.post_number = posts.post_number
|
||
AND post_timings.user_id = #{ActiveRecord::Base.connection.quote(@guardian.user.id)}
|
||
",
|
||
).where("post_timings.user_id IS NULL")
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Awith:images\z/i) { |posts| posts.where("posts.image_upload_id IS NOT NULL") }
|
||
|
||
advanced_filter(/\Acategory:(.+)\z/i) do |posts, match|
|
||
exact = false
|
||
|
||
if match[0] == "="
|
||
exact = true
|
||
match = match[1..-1]
|
||
end
|
||
|
||
category_ids =
|
||
Category.where("slug ilike ? OR name ilike ? OR id = ?", match, match, match.to_i).pluck(:id)
|
||
if category_ids.present?
|
||
category_ids += Category.subcategory_ids(category_ids.first) unless exact
|
||
@category_filter_matched ||= true
|
||
posts.where("topics.category_id IN (?)", category_ids)
|
||
else
|
||
posts.where("1 = 0")
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\A\#([\p{L}\p{M}0-9\-:=]+)\z/i) do |posts, match|
|
||
category_slug, subcategory_slug = match.to_s.split(":")
|
||
next unless category_slug
|
||
|
||
exact = true
|
||
if category_slug[0] == "="
|
||
category_slug = category_slug[1..-1]
|
||
else
|
||
exact = false
|
||
end
|
||
|
||
category_id =
|
||
if subcategory_slug
|
||
Category
|
||
.where("lower(slug) = ?", subcategory_slug.downcase)
|
||
.where(
|
||
parent_category_id:
|
||
Category.where("lower(slug) = ?", category_slug.downcase).select(:id),
|
||
)
|
||
.pick(:id)
|
||
else
|
||
Category
|
||
.where("lower(slug) = ?", category_slug.downcase)
|
||
.order("case when parent_category_id is null then 0 else 1 end")
|
||
.pick(:id)
|
||
end
|
||
|
||
if category_id
|
||
category_ids = [category_id]
|
||
category_ids += Category.subcategory_ids(category_id) if !exact
|
||
|
||
@category_filter_matched ||= true
|
||
posts.where("topics.category_id IN (?)", category_ids)
|
||
else
|
||
# try a possible tag match
|
||
tag_id = Tag.where_name(category_slug).pick(:id)
|
||
if (tag_id)
|
||
posts.where(<<~SQL, tag_id)
|
||
topics.id IN (
|
||
SELECT DISTINCT(tt.topic_id)
|
||
FROM topic_tags tt
|
||
WHERE tt.tag_id = ?
|
||
)
|
||
SQL
|
||
else
|
||
if tag_group_id = TagGroup.find_id_by_slug(category_slug)
|
||
posts.where(<<~SQL, tag_group_id)
|
||
topics.id IN (
|
||
SELECT DISTINCT(tt.topic_id)
|
||
FROM topic_tags tt
|
||
WHERE tt.tag_id in (
|
||
SELECT tag_id
|
||
FROM tag_group_memberships
|
||
WHERE tag_group_id = ?
|
||
)
|
||
)
|
||
SQL
|
||
|
||
# a bit yucky but we got to add the term back in
|
||
elsif match.to_s.length >= min_search_term_length
|
||
posts.where <<~SQL
|
||
posts.id IN (
|
||
SELECT post_id FROM post_search_data pd1
|
||
WHERE pd1.search_data @@ #{Search.ts_query(term: "##{match}")})
|
||
SQL
|
||
end
|
||
end
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Agroup:(.+)\z/i) do |posts, match|
|
||
group_query =
|
||
Group
|
||
.visible_groups(@guardian.user)
|
||
.members_visible_groups(@guardian.user)
|
||
.where("groups.name ILIKE ? OR (groups.id = ? AND groups.id > 0)", match, match.to_i)
|
||
|
||
DiscoursePluginRegistry.search_groups_set_query_callbacks.each do |cb|
|
||
group_query = cb.call(group_query, @term, @guardian)
|
||
end
|
||
|
||
group_id = group_query.pick(:id)
|
||
|
||
if group_id
|
||
posts.where(
|
||
"posts.user_id IN (select gu.user_id from group_users gu where gu.group_id = ?)",
|
||
group_id,
|
||
)
|
||
else
|
||
posts.where("1 = 0")
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Agroup_messages:(.+)\z/i) do |posts, match|
|
||
group_id =
|
||
Group
|
||
.visible_groups(@guardian.user)
|
||
.members_visible_groups(@guardian.user)
|
||
.where(has_messages: true)
|
||
.where("name ilike ? OR (id = ? AND id > 0)", match, match.to_i)
|
||
.pick(:id)
|
||
|
||
if group_id
|
||
posts.where(
|
||
"posts.topic_id IN (SELECT topic_id FROM topic_allowed_groups WHERE group_id = ?)",
|
||
group_id,
|
||
)
|
||
else
|
||
posts.where("1 = 0")
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Auser:(.+)\z/i) do |posts, match|
|
||
user_id =
|
||
User
|
||
.where(staged: false)
|
||
.where("username_lower = ? OR id = ?", match.downcase, match.to_i)
|
||
.pick(:id)
|
||
if user_id
|
||
posts.where("posts.user_id = ?", user_id)
|
||
else
|
||
posts.where("1 = 0")
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\A\@(\S+)\z/i) do |posts, match|
|
||
username = User.normalize_username(match)
|
||
|
||
user_id = User.not_staged.where(username_lower: username).pick(:id)
|
||
|
||
user_id = @guardian.user&.id if !user_id && username == "me"
|
||
|
||
if user_id
|
||
posts.where("posts.user_id = ?", user_id)
|
||
else
|
||
posts.where("1 = 0")
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Abefore:(.*)\z/i) do |posts, match|
|
||
if date = Search.word_to_date(match)
|
||
posts.where("posts.created_at < ?", date)
|
||
else
|
||
posts
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Aafter:(.*)\z/i) do |posts, match|
|
||
if date = Search.word_to_date(match)
|
||
posts.where("posts.created_at > ?", date)
|
||
else
|
||
posts
|
||
end
|
||
end
|
||
|
||
advanced_filter(/\Atags?:([\p{L}\p{M}0-9,\-_+]+)\z/i) do |posts, match|
|
||
search_tags(posts, match, positive: true)
|
||
end
|
||
|
||
advanced_filter(/\A\-tags?:([\p{L}\p{M}0-9,\-_+]+)\z/i) do |posts, match|
|
||
search_tags(posts, match, positive: false)
|
||
end
|
||
|
||
advanced_filter(/\Afiletypes?:([a-zA-Z0-9,\-_]+)\z/i) do |posts, match|
|
||
file_extensions = match.split(",").map(&:downcase)
|
||
posts.where(
|
||
"posts.id IN (
|
||
SELECT post_id
|
||
FROM topic_links
|
||
WHERE extension IN (:file_extensions)
|
||
|
||
UNION
|
||
|
||
SELECT upload_references.target_id
|
||
FROM uploads
|
||
JOIN upload_references ON upload_references.target_type = 'Post' AND upload_references.upload_id = uploads.id
|
||
WHERE lower(uploads.extension) IN (:file_extensions)
|
||
)",
|
||
file_extensions: file_extensions,
|
||
)
|
||
end
|
||
|
||
advanced_filter(/\Amin_views:(\d+)\z/i) do |posts, match|
|
||
posts.where("topics.views >= ?", match.to_i)
|
||
end
|
||
|
||
advanced_filter(/\Amax_views:(\d+)\z/i) do |posts, match|
|
||
posts.where("topics.views <= ?", match.to_i)
|
||
end
|
||
|
||
def apply_filters(posts)
|
||
@filters.each do |block, match|
|
||
if block.arity == 1
|
||
posts = instance_exec(posts, &block) || posts
|
||
else
|
||
posts = instance_exec(posts, match, &block) || posts
|
||
end
|
||
end if @filters
|
||
posts
|
||
end
|
||
|
||
def apply_order(
|
||
posts,
|
||
aggregate_search: false,
|
||
allow_relevance_search: true,
|
||
type_filter: "all_topics"
|
||
)
|
||
if @order == :latest
|
||
if aggregate_search
|
||
posts = posts.order("MAX(posts.created_at) DESC")
|
||
else
|
||
posts = posts.reorder("posts.created_at DESC")
|
||
end
|
||
elsif @order == :oldest
|
||
if aggregate_search
|
||
posts = posts.order("MAX(posts.created_at) ASC")
|
||
else
|
||
posts = posts.reorder("posts.created_at ASC")
|
||
end
|
||
elsif @order == :latest_topic
|
||
if aggregate_search
|
||
posts = posts.order("MAX(topics.created_at) DESC")
|
||
else
|
||
posts = posts.order("topics.created_at DESC")
|
||
end
|
||
elsif @order == :oldest_topic
|
||
if aggregate_search
|
||
posts = posts.order("MAX(topics.created_at) ASC")
|
||
else
|
||
posts = posts.order("topics.created_at ASC")
|
||
end
|
||
elsif @order == :views
|
||
if aggregate_search
|
||
posts = posts.order("MAX(topics.views) DESC")
|
||
else
|
||
posts = posts.order("topics.views DESC")
|
||
end
|
||
elsif @order == :likes
|
||
if aggregate_search
|
||
posts = posts.order("MAX(posts.like_count) DESC")
|
||
else
|
||
posts = posts.order("posts.like_count DESC")
|
||
end
|
||
elsif allow_relevance_search
|
||
posts = sort_by_relevance(posts, type_filter: type_filter, aggregate_search: aggregate_search)
|
||
end
|
||
|
||
if @order
|
||
advanced_order = Search.advanced_orders&.fetch(@order, nil)
|
||
posts = advanced_order.call(posts) if advanced_order
|
||
end
|
||
|
||
posts
|
||
end
|
||
|
||
private
|
||
|
||
def search_tags(posts, match, positive:)
|
||
return if match.nil?
|
||
match.downcase!
|
||
modifier = positive ? "" : "NOT"
|
||
|
||
if match.include?("+")
|
||
tags = match.split("+")
|
||
|
||
posts.where(
|
||
"topics.id #{modifier} IN (
|
||
SELECT tt.topic_id
|
||
FROM topic_tags tt, tags
|
||
WHERE tt.tag_id = tags.id
|
||
GROUP BY tt.topic_id
|
||
HAVING to_tsvector(#{default_ts_config}, #{Search.wrap_unaccent("array_to_string(array_agg(lower(tags.name)), ' ')")}) @@ to_tsquery(#{default_ts_config}, #{Search.wrap_unaccent("?")})
|
||
)",
|
||
tags.join("&"),
|
||
)
|
||
else
|
||
tags = match.split(",")
|
||
|
||
posts.where(
|
||
"topics.id #{modifier} IN (
|
||
SELECT DISTINCT(tt.topic_id)
|
||
FROM topic_tags tt, tags
|
||
WHERE tt.tag_id = tags.id AND lower(tags.name) IN (?)
|
||
)",
|
||
tags,
|
||
)
|
||
end
|
||
end
|
||
|
||
def process_advanced_search!(term)
|
||
term
|
||
.to_s
|
||
.scan(/(([^" \t\n\x0B\f\r]+)?(("[^"]+")?))/)
|
||
.to_a
|
||
.map do |(word, _)|
|
||
next if word.blank?
|
||
|
||
found = false
|
||
|
||
Search.advanced_filters.each do |matcher, block|
|
||
cleaned = word.gsub(/["']/, "")
|
||
if cleaned =~ matcher
|
||
(@filters ||= []) << [block, $1]
|
||
found = true
|
||
end
|
||
end
|
||
|
||
if word == "l"
|
||
@order = :latest
|
||
nil
|
||
elsif word =~ /\Aorder:\w+\z/i
|
||
@order = word.downcase.gsub("order:", "").to_sym
|
||
nil
|
||
elsif word =~ /\Ain:title\z/i || word == "t"
|
||
@in_title = true
|
||
nil
|
||
elsif word =~ /\Atopic:(\d+)\z/i
|
||
topic_id = $1.to_i
|
||
if topic_id > 1
|
||
topic = Topic.find_by(id: topic_id)
|
||
@search_context = topic if @guardian.can_see?(topic)
|
||
end
|
||
nil
|
||
elsif word =~ /\Ain:all\z/i
|
||
@search_all_topics = true
|
||
nil
|
||
elsif word =~ /\Ain:personal\z/i
|
||
@search_pms = true
|
||
nil
|
||
elsif word =~ /\Ain:messages\z/i
|
||
@search_pms = true
|
||
nil
|
||
elsif word =~ /\Ain:personal-direct\z/i
|
||
@search_pms = true
|
||
nil
|
||
elsif word =~ /\Ain:all-pms\z/i
|
||
@search_all_pms = true
|
||
nil
|
||
elsif word =~ /\Agroup_messages:(.+)\z/i
|
||
@search_pms = true
|
||
nil
|
||
elsif word =~ /\Apersonal_messages:(.+)\z/i
|
||
if user = User.find_by_username($1)
|
||
@search_pms = true
|
||
@search_context = user
|
||
end
|
||
|
||
nil
|
||
else
|
||
found ? nil : word
|
||
end
|
||
end
|
||
.compact
|
||
.join(" ")
|
||
end
|
||
|
||
def find_grouped_results
|
||
if @results.type_filter.present?
|
||
unless Search.facets.include?(@results.type_filter)
|
||
raise Discourse::InvalidAccess.new("invalid type filter")
|
||
end
|
||
# calling protected methods
|
||
send("#{@results.type_filter}_search")
|
||
else
|
||
if @term.present? && !@search_context
|
||
user_search
|
||
category_search
|
||
tags_search
|
||
groups_search
|
||
end
|
||
topic_search
|
||
end
|
||
|
||
@results
|
||
rescue ActiveRecord::StatementInvalid
|
||
# In the event of a PG:Error return nothing, it is likely they used a foreign language whose
|
||
# locale is not supported by postgres
|
||
end
|
||
|
||
# If we're searching for a single topic
|
||
def single_topic(id)
|
||
if @opts[:restrict_to_archetype].present?
|
||
archetype =
|
||
(
|
||
if @opts[:restrict_to_archetype] == Archetype.default
|
||
Archetype.default
|
||
else
|
||
Archetype.private_message
|
||
end
|
||
)
|
||
|
||
post =
|
||
posts_scope.joins(:topic).find_by(
|
||
"topics.id = :id AND topics.archetype = :archetype AND posts.post_number = 1",
|
||
id: id,
|
||
archetype: archetype,
|
||
)
|
||
else
|
||
post = posts_scope.find_by(topic_id: id, post_number: 1)
|
||
end
|
||
|
||
return nil unless @guardian.can_see?(post)
|
||
|
||
@results.add(post)
|
||
@results
|
||
end
|
||
|
||
def secure_category_ids
|
||
return @secure_category_ids unless @secure_category_ids.nil?
|
||
@secure_category_ids = @guardian.secure_category_ids
|
||
end
|
||
|
||
def category_search
|
||
# scope is leaking onto Category, this is not good and probably a bug in Rails
|
||
# the secure_category_ids will invoke the same method on User, it calls Category.where
|
||
# however the scope from the query below is leaking in to Category, this works around
|
||
# the issue while we figure out what is up in Rails
|
||
secure_category_ids
|
||
|
||
categories =
|
||
Category
|
||
.includes(:category_search_data)
|
||
.where("category_search_data.search_data @@ #{ts_query}")
|
||
.references(:category_search_data)
|
||
.order("topics_month DESC")
|
||
.secured(@guardian)
|
||
.limit(limit)
|
||
|
||
categories.each { |category| @results.add(category) }
|
||
end
|
||
|
||
def user_search
|
||
return if SiteSetting.hide_user_profiles_from_public && !@guardian.user
|
||
|
||
users =
|
||
User
|
||
.includes(:user_search_data)
|
||
.references(:user_search_data)
|
||
.where(active: true)
|
||
.where(staged: false)
|
||
.where("user_search_data.search_data @@ #{ts_query("simple")}")
|
||
.order("CASE WHEN username_lower = '#{@original_term.downcase}' THEN 0 ELSE 1 END")
|
||
.order("last_posted_at DESC")
|
||
.limit(limit)
|
||
|
||
if !SiteSetting.enable_listing_suspended_users_on_search && !@guardian.user&.admin
|
||
users = users.where(suspended_at: nil)
|
||
end
|
||
|
||
users = DiscoursePluginRegistry.apply_modifier(:search_user_search, users)
|
||
|
||
users_custom_data_query =
|
||
DB.query(<<~SQL, user_ids: users.pluck(:id), term: "%#{@original_term.downcase}%")
|
||
SELECT user_custom_fields.user_id, user_fields.name, user_custom_fields.value FROM user_custom_fields
|
||
INNER JOIN user_fields ON user_fields.id = REPLACE(user_custom_fields.name, 'user_field_', '')::INTEGER AND user_fields.searchable IS TRUE
|
||
WHERE user_id IN (:user_ids)
|
||
AND user_custom_fields.name LIKE 'user_field_%'
|
||
AND user_custom_fields.value ILIKE :term
|
||
SQL
|
||
users_custom_data =
|
||
users_custom_data_query.reduce({}) do |acc, row|
|
||
acc[row.user_id] = Array.wrap(acc[row.user_id]) << { name: row.name, value: row.value }
|
||
acc
|
||
end
|
||
|
||
users.each do |user|
|
||
user.custom_data = users_custom_data[user.id] || []
|
||
@results.add(user)
|
||
end
|
||
end
|
||
|
||
def groups_search
|
||
group_query =
|
||
Group.visible_groups(@guardian.user, "groups.name ASC", include_everyone: false).where(
|
||
"groups.name ILIKE :term OR groups.full_name ILIKE :term",
|
||
term: "%#{@term}%",
|
||
)
|
||
|
||
DiscoursePluginRegistry.search_groups_set_query_callbacks.each do |cb|
|
||
group_query = cb.call(group_query, @term, @guardian)
|
||
end
|
||
|
||
groups = group_query.limit(limit)
|
||
|
||
groups.each { |group| @results.add(group) }
|
||
end
|
||
|
||
def tags_search
|
||
return unless SiteSetting.tagging_enabled
|
||
tags =
|
||
Tag
|
||
.includes(:tag_search_data)
|
||
.where("tag_search_data.search_data @@ #{ts_query}")
|
||
.references(:tag_search_data)
|
||
.order("name asc")
|
||
.limit(limit)
|
||
|
||
hidden_tag_names = DiscourseTagging.hidden_tag_names(@guardian)
|
||
|
||
tags.each { |tag| @results.add(tag) if !hidden_tag_names.include?(tag.name) }
|
||
end
|
||
|
||
def exclude_topics_search
|
||
if @term.present?
|
||
user_search
|
||
category_search
|
||
tags_search
|
||
groups_search
|
||
end
|
||
end
|
||
|
||
PHRASE_MATCH_REGEXP_PATTERN = '"([^"]+)"'
|
||
|
||
def posts_query(limit, type_filter: nil, aggregate_search: false)
|
||
posts =
|
||
Post.where(post_type: Topic.visible_post_types(@guardian.user)).joins(
|
||
:post_search_data,
|
||
:topic,
|
||
)
|
||
|
||
if type_filter != "private_messages"
|
||
posts = posts.joins("LEFT JOIN categories ON categories.id = topics.category_id")
|
||
end
|
||
|
||
is_topic_search = @search_context.present? && @search_context.is_a?(Topic)
|
||
posts = posts.where("topics.visible") unless is_topic_search
|
||
|
||
if type_filter == "private_messages" || (is_topic_search && @search_context.private_message?)
|
||
posts =
|
||
posts.where(
|
||
"topics.archetype = ? AND post_search_data.private_message",
|
||
Archetype.private_message,
|
||
)
|
||
|
||
posts = posts.private_posts_for_user(@guardian.user) unless @guardian.is_admin?
|
||
elsif type_filter == "all_topics"
|
||
private_posts =
|
||
posts.where(
|
||
"topics.archetype = ? AND post_search_data.private_message",
|
||
Archetype.private_message,
|
||
).private_posts_for_user(@guardian.user)
|
||
|
||
posts =
|
||
posts.where(
|
||
"topics.archetype <> ? AND NOT post_search_data.private_message",
|
||
Archetype.private_message,
|
||
).or(private_posts)
|
||
else
|
||
posts =
|
||
posts.where(
|
||
"topics.archetype <> ? AND NOT post_search_data.private_message",
|
||
Archetype.private_message,
|
||
)
|
||
end
|
||
|
||
if @term.present?
|
||
if is_topic_search
|
||
term_without_quote = @term
|
||
term_without_quote = $1 if @term =~ /"(.+)"/
|
||
|
||
term_without_quote = $1 if @term =~ /'(.+)'/
|
||
|
||
posts = posts.joins("JOIN users u ON u.id = posts.user_id")
|
||
posts =
|
||
posts.where(
|
||
"posts.raw || ' ' || u.username || ' ' || COALESCE(u.name, '') ilike ?",
|
||
"%#{term_without_quote}%",
|
||
)
|
||
else
|
||
posts = posts.where(post_number: 1) if @in_title
|
||
posts = posts.where("post_search_data.search_data @@ #{ts_query(weight_filter: weights)}")
|
||
exact_terms = @term.scan(Regexp.new(PHRASE_MATCH_REGEXP_PATTERN)).flatten
|
||
|
||
exact_terms.each do |exact|
|
||
posts =
|
||
posts.where("posts.raw ilike :exact OR topics.title ilike :exact", exact: "%#{exact}%")
|
||
end
|
||
end
|
||
end
|
||
|
||
posts = apply_filters(posts)
|
||
|
||
# If we have a search context, prioritize those posts first
|
||
posts =
|
||
if @search_context.present?
|
||
if @search_context.is_a?(User)
|
||
if type_filter == "private_messages"
|
||
if @guardian.is_admin? && !@search_all_pms
|
||
posts.private_posts_for_user(@search_context)
|
||
else
|
||
posts
|
||
end
|
||
else
|
||
posts.where("posts.user_id = #{@search_context.id}")
|
||
end
|
||
elsif @search_context.is_a?(Category)
|
||
category_ids =
|
||
Category
|
||
.where(parent_category_id: @search_context.id)
|
||
.pluck(:id)
|
||
.push(@search_context.id)
|
||
|
||
posts.where("topics.category_id in (?)", category_ids)
|
||
elsif is_topic_search
|
||
posts.where("topics.id = ?", @search_context.id).order(
|
||
"posts.post_number #{@order == :latest ? "DESC" : ""}",
|
||
)
|
||
elsif @search_context.is_a?(Tag)
|
||
posts =
|
||
posts.joins("LEFT JOIN topic_tags ON topic_tags.topic_id = topics.id").joins(
|
||
"LEFT JOIN tags ON tags.id = topic_tags.tag_id",
|
||
)
|
||
posts.where("tags.id = ?", @search_context.id)
|
||
end
|
||
else
|
||
posts = categories_ignored(posts) unless @category_filter_matched
|
||
posts
|
||
end
|
||
|
||
if type_filter != "private_messages"
|
||
posts =
|
||
if secure_category_ids.present?
|
||
posts.where(
|
||
"(categories.id IS NULL) OR (NOT categories.read_restricted) OR (categories.id IN (?))",
|
||
secure_category_ids,
|
||
).references(:categories)
|
||
else
|
||
posts.where("(categories.id IS NULL) OR (NOT categories.read_restricted)").references(
|
||
:categories,
|
||
)
|
||
end
|
||
end
|
||
|
||
posts =
|
||
apply_order(
|
||
posts,
|
||
aggregate_search: aggregate_search,
|
||
allow_relevance_search: !is_topic_search,
|
||
type_filter: type_filter,
|
||
)
|
||
|
||
posts = posts.offset(offset)
|
||
posts.limit(limit)
|
||
end
|
||
|
||
def weights
|
||
# A is for title
|
||
# B is for category
|
||
# C is for tags
|
||
# D is for cooked
|
||
@in_title ? "A" : (SiteSetting.tagging_enabled ? "ABCD" : "ABD")
|
||
end
|
||
|
||
def sort_by_relevance(posts, type_filter:, aggregate_search:)
|
||
exact_rank = nil
|
||
|
||
if SiteSetting.prioritize_exact_search_title_match
|
||
exact_rank = ts_rank_cd(weight_filter: "A", prefix_match: false)
|
||
end
|
||
|
||
rank = ts_rank_cd(weight_filter: weights)
|
||
|
||
if type_filter != "private_messages"
|
||
category_search_priority = <<~SQL
|
||
(
|
||
CASE categories.search_priority
|
||
WHEN #{Searchable::PRIORITIES[:very_high]}
|
||
THEN 3
|
||
WHEN #{Searchable::PRIORITIES[:very_low]}
|
||
THEN 1
|
||
ELSE 2
|
||
END
|
||
)
|
||
SQL
|
||
|
||
rank_sort_priorities = [["topics.archived", 0.85], ["topics.closed", 0.9]]
|
||
|
||
rank_sort_priorities =
|
||
DiscoursePluginRegistry.apply_modifier(
|
||
:search_rank_sort_priorities,
|
||
rank_sort_priorities,
|
||
self,
|
||
)
|
||
|
||
category_priority_weights = <<~SQL
|
||
(
|
||
CASE categories.search_priority
|
||
WHEN #{Searchable::PRIORITIES[:low]}
|
||
THEN #{SiteSetting.category_search_priority_low_weight.to_f}
|
||
WHEN #{Searchable::PRIORITIES[:high]}
|
||
THEN #{SiteSetting.category_search_priority_high_weight.to_f}
|
||
ELSE 1.0
|
||
END
|
||
*
|
||
CASE
|
||
#{rank_sort_priorities.sort_by { |_, pri| -pri }.map { |k, v| "WHEN #{k} THEN #{v}" }.join("\n")}
|
||
ELSE 1.0
|
||
END
|
||
)
|
||
SQL
|
||
|
||
posts =
|
||
if aggregate_search
|
||
posts.order("MAX(#{category_search_priority}) DESC")
|
||
else
|
||
posts.order("#{category_search_priority} DESC")
|
||
end
|
||
|
||
if @term.present? && exact_rank
|
||
posts =
|
||
if aggregate_search
|
||
posts.order("MAX(#{exact_rank} * #{category_priority_weights}) DESC")
|
||
else
|
||
posts.order("#{exact_rank} * #{category_priority_weights} DESC")
|
||
end
|
||
end
|
||
|
||
data_ranking =
|
||
if @term.blank?
|
||
"(#{category_priority_weights})"
|
||
else
|
||
"(#{rank} * #{category_priority_weights})"
|
||
end
|
||
|
||
posts =
|
||
if aggregate_search
|
||
posts.order("MAX(#{data_ranking}) DESC")
|
||
else
|
||
posts.order("#{data_ranking} DESC")
|
||
end
|
||
end
|
||
|
||
posts.order("topics.bumped_at DESC")
|
||
end
|
||
|
||
def ts_rank_cd(weight_filter:, prefix_match: true)
|
||
<<~SQL
|
||
TS_RANK_CD(
|
||
#{SiteSetting.search_ranking_weights.present? ? "'#{SiteSetting.search_ranking_weights}'," : ""}
|
||
post_search_data.search_data,
|
||
#{@term.blank? ? "" : ts_query(weight_filter: weight_filter, prefix_match: prefix_match)},
|
||
#{SiteSetting.search_ranking_normalization}|32
|
||
)
|
||
SQL
|
||
end
|
||
|
||
def categories_ignored(posts)
|
||
posts.where(<<~SQL, Searchable::PRIORITIES[:ignore])
|
||
(categories.search_priority IS NULL OR categories.search_priority IS NOT NULL AND categories.search_priority <> ?)
|
||
SQL
|
||
end
|
||
|
||
def self.default_ts_config
|
||
"'#{Search.ts_config}'"
|
||
end
|
||
|
||
def default_ts_config
|
||
self.class.default_ts_config
|
||
end
|
||
|
||
def self.ts_query(term:, ts_config: nil, joiner: nil, weight_filter: nil, prefix_match: true)
|
||
to_tsquery(
|
||
ts_config: ts_config,
|
||
term: set_tsquery_weight_filter(term, weight_filter, prefix_match: prefix_match),
|
||
)
|
||
end
|
||
|
||
def self.to_tsquery(ts_config: nil, term:, joiner: nil)
|
||
ts_config = ActiveRecord::Base.connection.quote(ts_config) if ts_config
|
||
escaped_term = wrap_unaccent("'#{escape_string(term)}'")
|
||
tsquery = "TO_TSQUERY(#{ts_config || default_ts_config}, #{escaped_term})"
|
||
# PG 14 and up default to using the followed by operator
|
||
# this restores the old behavior
|
||
tsquery = "REGEXP_REPLACE(#{tsquery}::text, '<->|<\\d+>', '&', 'g')::tsquery"
|
||
tsquery = "REPLACE(#{tsquery}::text, '&', '#{escape_string(joiner)}')::tsquery" if joiner
|
||
tsquery
|
||
end
|
||
|
||
def self.set_tsquery_weight_filter(term, weight_filter, prefix_match: true)
|
||
"'#{self.escape_string(term)}':#{prefix_match ? "*" : ""}#{weight_filter}"
|
||
end
|
||
|
||
def self.escape_string(term)
|
||
PG::Connection.escape_string(term).gsub('\\', '\\\\\\')
|
||
end
|
||
|
||
def ts_query(ts_config = nil, weight_filter: nil, prefix_match: true)
|
||
@ts_query_cache ||= {}
|
||
@ts_query_cache[
|
||
"#{ts_config || default_ts_config} #{@term} #{weight_filter} #{prefix_match}"
|
||
] ||= Search.ts_query(
|
||
term: @term,
|
||
ts_config: ts_config,
|
||
weight_filter: weight_filter,
|
||
prefix_match: prefix_match,
|
||
)
|
||
end
|
||
|
||
def wrap_rows(query)
|
||
"SELECT *, row_number() over() row_number FROM (#{query.to_sql}) xxx"
|
||
end
|
||
|
||
def aggregate_post_sql(opts)
|
||
min_id =
|
||
if SiteSetting.search_recent_regular_posts_offset_post_id > 0
|
||
if %w[all_topics private_message].include?(opts[:type_filter])
|
||
0
|
||
else
|
||
SiteSetting.search_recent_regular_posts_offset_post_id
|
||
end
|
||
else
|
||
# This is kept around for backwards compatibility.
|
||
# TODO: Drop this code path after Discourse 2.7 has been released.
|
||
Search.min_post_id
|
||
end
|
||
|
||
min_or_max = @order == :latest ? "max" : "min"
|
||
|
||
query =
|
||
if @order == :likes
|
||
# likes are a pain to aggregate so skip
|
||
posts_query(limit, type_filter: opts[:type_filter]).select("topics.id", "posts.post_number")
|
||
else
|
||
posts_query(limit, aggregate_search: true, type_filter: opts[:type_filter]).select(
|
||
"topics.id",
|
||
"#{min_or_max}(posts.post_number) post_number",
|
||
).group("topics.id")
|
||
end
|
||
|
||
if min_id > 0
|
||
low_set = query.dup.where("post_search_data.post_id < ?", min_id)
|
||
high_set = query.where("post_search_data.post_id >= ?", min_id)
|
||
|
||
return { default: wrap_rows(high_set), remaining: wrap_rows(low_set) }
|
||
end
|
||
|
||
# double wrapping so we get correct row numbers
|
||
{ default: wrap_rows(query) }
|
||
end
|
||
|
||
def aggregate_posts(post_sql)
|
||
return [] unless post_sql
|
||
|
||
posts_scope(posts_eager_loads(Post)).joins(
|
||
"JOIN (#{post_sql}) x ON x.id = posts.topic_id AND x.post_number = posts.post_number",
|
||
).order("row_number")
|
||
end
|
||
|
||
def aggregate_search(opts = {})
|
||
post_sql = aggregate_post_sql(opts)
|
||
|
||
added = 0
|
||
|
||
aggregate_posts(post_sql[:default]).each do |p|
|
||
@results.add(p)
|
||
added += 1
|
||
end
|
||
|
||
aggregate_posts(post_sql[:remaining]).each { |p| @results.add(p) } if added < limit
|
||
end
|
||
|
||
def private_messages_search
|
||
raise Discourse::InvalidAccess.new("anonymous can not search PMs") unless @guardian.user
|
||
|
||
aggregate_search(type_filter: "private_messages")
|
||
end
|
||
|
||
def all_topics_search
|
||
aggregate_search(type_filter: "all_topics")
|
||
end
|
||
|
||
def topic_search
|
||
if @search_context.is_a?(Topic)
|
||
posts =
|
||
posts_scope(posts_eager_loads(posts_query(limit))).where(
|
||
"posts.topic_id = ?",
|
||
@search_context.id,
|
||
)
|
||
|
||
posts.each { |post| @results.add(post) }
|
||
else
|
||
aggregate_search
|
||
end
|
||
end
|
||
|
||
def posts_eager_loads(query)
|
||
query = query.includes(:user, :post_search_data)
|
||
topic_eager_loads = [{ category: :parent_category }]
|
||
|
||
topic_eager_loads << :tags if SiteSetting.tagging_enabled
|
||
|
||
Search.custom_topic_eager_loads.each do |custom_loads|
|
||
topic_eager_loads.concat(
|
||
custom_loads.is_a?(Array) ? custom_loads : custom_loads.call(search_pms: @search_pms).to_a,
|
||
)
|
||
end
|
||
|
||
query.includes(topic: topic_eager_loads)
|
||
end
|
||
|
||
# Limited for performance reasons since `TS_HEADLINE` is slow when the text
|
||
# document is too long.
|
||
MAX_LENGTH_FOR_HEADLINE = 2500
|
||
|
||
def posts_scope(default_scope = Post.all)
|
||
if SiteSetting.use_pg_headlines_for_excerpt
|
||
search_term = @term.present? ? Search.escape_string(@term) : nil
|
||
ts_config = default_ts_config
|
||
|
||
default_scope
|
||
.joins("INNER JOIN post_search_data pd ON pd.post_id = posts.id")
|
||
.joins("INNER JOIN topics t1 ON t1.id = posts.topic_id")
|
||
.select(
|
||
"TS_HEADLINE(
|
||
#{ts_config},
|
||
t1.fancy_title,
|
||
PLAINTO_TSQUERY(#{ts_config}, '#{search_term}'),
|
||
'StartSel=''<span class=\"#{HIGHLIGHT_CSS_CLASS}\">'', StopSel=''</span>'', HighlightAll=true'
|
||
) AS topic_title_headline",
|
||
"TS_HEADLINE(
|
||
#{ts_config},
|
||
LEFT(
|
||
TS_HEADLINE(
|
||
#{ts_config},
|
||
LEFT(pd.raw_data, #{MAX_LENGTH_FOR_HEADLINE}),
|
||
PLAINTO_TSQUERY(#{ts_config}, '#{search_term}'),
|
||
'ShortWord=0, MaxFragments=1, MinWords=50, MaxWords=51, StartSel='''', StopSel='''''
|
||
),
|
||
#{Search::GroupedSearchResults::BLURB_LENGTH}
|
||
),
|
||
PLAINTO_TSQUERY(#{ts_config}, '#{search_term}'),
|
||
'HighlightAll=true, StartSel=''<span class=\"#{HIGHLIGHT_CSS_CLASS}\">'', StopSel=''</span>'''
|
||
) AS headline",
|
||
"LEFT(pd.raw_data, 50) AS leading_raw_data",
|
||
"RIGHT(pd.raw_data, 50) AS trailing_raw_data",
|
||
default_scope.arel.projections,
|
||
)
|
||
else
|
||
default_scope
|
||
end
|
||
end
|
||
|
||
def log_query?(readonly_mode)
|
||
SiteSetting.log_search_queries? && @opts[:search_type].present? && !readonly_mode &&
|
||
@opts[:type_filter] != "exclude_topics"
|
||
end
|
||
|
||
def min_search_term_length
|
||
return @opts[:min_search_term_length] if @opts[:min_search_term_length]
|
||
|
||
if SiteSetting.search_tokenize_chinese
|
||
return SiteSetting.defaults.get("min_search_term_length", "zh_CN")
|
||
end
|
||
|
||
if SiteSetting.search_tokenize_japanese
|
||
return SiteSetting.defaults.get("min_search_term_length", "ja")
|
||
end
|
||
|
||
SiteSetting.min_search_term_length
|
||
end
|
||
end
|