discourse

mirror of https://github.com/discourse/discourse.git synced 2024-11-24 13:18:33 +08:00

Author	SHA1	Message	Date
Guo Xiang Tan	5c31216aea	FIX: Search for whole URLs wasn't working.	2020-07-14 15:31:48 +08:00
Guo Xiang Tan	d8c796bc44	FIX: Ensure that aggregating search shows the post with the highest rank. Previously, we would only take either the `MIN` or `MAX` for `post_number` during aggregation meaning that the ranking is not considered. ``` require 'benchmark/ips' Benchmark.ips do \|x\| x.config(time: 10, warmup: 2) x.report("current aggregate search query") do DB.exec <<~SQL SELECT "posts"."id", "posts"."user_id", "posts"."topic_id", "posts"."post_number", "posts"."raw", "posts"."cooked", "posts"."created_at", "posts"."updated_at", "posts"."reply_to_post_number", "posts"."reply_count", "posts"."quote_count", "posts"."deleted_at", "posts"."off_topic_count", "posts"."like_count", "posts"."incoming_link_count", "posts"."bookmark_count", "posts"."score", "posts"."reads", "posts"."post_type", "posts"."sort_order", "posts"."last_editor_id", "posts"."hidden", "posts"."hidden_reason_id", "posts"."notify_moderators_count", "posts"."spam_count", "posts"."illegal_count", "posts"."inappropriate_count", "posts"."last_version_at", "posts"."user_deleted", "posts"."reply_to_user_id", "posts"."percent_rank", "posts"."notify_user_count", "posts"."like_score", "posts"."deleted_by_id", "posts"."edit_reason", "posts"."word_count", "posts"."version", "posts"."cook_method", "posts"."wiki", "posts"."baked_at", "posts"."baked_version", "posts"."hidden_at", "posts"."self_edits", "posts"."reply_quoted", "posts"."via_email", "posts"."raw_email", "posts"."public_version", "posts"."action_code", "posts"."locked_by_id", "posts"."image_upload_id" FROM "posts" JOIN (SELECT *, row_number() over() row_number FROM (SELECT topics.id, min(posts.post_number) post_number FROM "posts" INNER JOIN "post_search_data" ON "post_search_data"."post_id" = "posts"."id" INNER JOIN "topics" ON "topics"."id" = "posts"."topic_id" AND ("topics"."deleted_at" IS NULL) LEFT JOIN categories ON categories.id = topics.category_id WHERE ("posts"."deleted_at" IS NULL) AND "posts"."post_type" IN (1, 2, 3, 4) AND (topics.visible) 
AND (topics.archetype <> 'private_message') AND (post_search_data.search_data @@ TO_TSQUERY('english', '''postgres'':*ABCD')) AND (categories.id NOT IN ( SELECT categories.id WHERE categories.search_priority = 1 ) ) AND ((categories.id IS NULL) OR (NOT categories.read_restricted)) GROUP BY topics.id ORDER BY MAX(( TS_RANK_CD( post_search_data.search_data, TO_TSQUERY('english', '''postgres'':*ABCD'), 1\|32 ) * ( CASE categories.search_priority WHEN 2 THEN 0.6 WHEN 3 THEN 0.8 WHEN 4 THEN 1.2 WHEN 5 THEN 1.4 ELSE CASE WHEN topics.closed THEN 0.9 ELSE 1 END END ) ) ) DESC, topics.bumped_at DESC LIMIT 51 OFFSET 0) xxx) x ON x.id = posts.topic_id AND x.post_number = posts.post_number WHERE ("posts"."deleted_at" IS NULL) ORDER BY row_number; SQL end x.report("current aggregate search query with proper ranking") do DB.exec <<~SQL SELECT "posts"."id", "posts"."user_id", "posts"."topic_id", "posts"."post_number", "posts"."raw", "posts"."cooked", "posts"."created_at", "posts"."updated_at", "posts"."reply_to_post_number", "posts"."reply_count", "posts"."quote_count", "posts"."deleted_at", "posts"."off_topic_count", "posts"."like_count", "posts"."incoming_link_count", "posts"."bookmark_count", "posts"."score", "posts"."reads", "posts"."post_type", "posts"."sort_order", "posts"."last_editor_id", "posts"."hidden", "posts"."hidden_reason_id", "posts"."notify_moderators_count", "posts"."spam_count", "posts"."illegal_count", "posts"."inappropriate_count", "posts"."last_version_at", "posts"."user_deleted", "posts"."reply_to_user_id", "posts"."percent_rank", "posts"."notify_user_count", "posts"."like_score", "posts"."deleted_by_id", "posts"."edit_reason", "posts"."word_count", "posts"."version", "posts"."cook_method", "posts"."wiki", "posts"."baked_at", "posts"."baked_version", "posts"."hidden_at", "posts"."self_edits", "posts"."reply_quoted", "posts"."via_email", "posts"."raw_email", "posts"."public_version", "posts"."action_code", "posts"."locked_by_id", "posts"."image_upload_id" FROM 
"posts" JOIN (SELECT *, row_number() over() row_number FROM (SELECT subquery.topic_id id, (ARRAY_AGG(subquery.post_number))[1] post_number, MAX(subquery.rank) rank, MAX(subquery.bumped_at) bumped_at FROM (SELECT "posts"."id", "posts"."user_id", "posts"."topic_id", "posts"."post_number", "posts"."raw", "posts"."cooked", "posts"."created_at", "posts"."updated_at", "posts"."reply_to_post_number", "posts"."reply_count", "posts"."quote_count", "posts"."deleted_at", "posts"."off_topic_count", "posts"."like_count", "posts"."incoming_link_count", "posts"."bookmark_count", "posts"."score", "posts"."reads", "posts"."post_type", "posts"."sort_order", "posts"."last_editor_id", "posts"."hidden", "posts"."hidden_reason_id", "posts"."notify_moderators_count", "posts"."spam_count", "posts"."illegal_count", "posts"."inappropriate_count", "posts"."last_version_at", "posts"."user_deleted", "posts"."reply_to_user_id", "posts"."percent_rank", "posts"."notify_user_count", "posts"."like_score", "posts"."deleted_by_id", "posts"."edit_reason", "posts"."word_count", "posts"."version", "posts"."cook_method", "posts"."wiki", "posts"."baked_at", "posts"."baked_version", "posts"."hidden_at", "posts"."self_edits", "posts"."reply_quoted", "posts"."via_email", "posts"."raw_email", "posts"."public_version", "posts"."action_code", "posts"."locked_by_id", "posts"."image_upload_id", ( TS_RANK_CD( post_search_data.search_data, TO_TSQUERY('english', '''postgres'':*ABCD'), 1\|32 ) * ( CASE categories.search_priority WHEN 2 THEN 0.6 WHEN 3 THEN 0.8 WHEN 4 THEN 1.2 WHEN 5 THEN 1.4 ELSE CASE WHEN topics.closed THEN 0.9 ELSE 1 END END ) ) rank, topics.bumped_at bumped_at FROM "posts" INNER JOIN "post_search_data" ON "post_search_data"."post_id" = "posts"."id" INNER JOIN "topics" ON "topics"."id" = "posts"."topic_id" AND ("topics"."deleted_at" IS NULL) LEFT JOIN categories ON categories.id = topics.category_id WHERE ("posts"."deleted_at" IS NULL) AND "posts"."post_type" IN (1, 2, 3, 4) AND (topics.visible) AND 
(topics.archetype <> 'private_message') AND (post_search_data.search_data @@ TO_TSQUERY('english', '''postgres'':*ABCD')) AND (categories.id NOT IN ( SELECT categories.id WHERE categories.search_priority = 1 ) ) AND ((categories.id IS NULL) OR (NOT categories.read_restricted))) subquery GROUP BY subquery.topic_id ORDER BY rank DESC, bumped_at DESC LIMIT 51 OFFSET 0) xxx) x ON x.id = posts.topic_id AND x.post_number = posts.post_number WHERE ("posts"."deleted_at" IS NULL) ORDER BY row_number; SQL end x.compare! end ``` ``` Warming up -------------------------------------- current aggregate search query 1.000 i/100ms current aggregate search query with proper ranking 1.000 i/100ms Calculating ------------------------------------- current aggregate search query 17.726 (± 0.0%) i/s - 178.000 in 10.045107s current aggregate search query with proper ranking 17.802 (± 0.0%) i/s - 178.000 in 10.002230s Comparison: current aggregate search query with proper ranking: 17.8 i/s current aggregate search query: 17.7 i/s - 1.00x (± 0.00) slower ```	2020-07-14 13:39:13 +08:00
Guo Xiang Tan	4009c9f711	DEV: Fix search specs to take note of order in assertions. `contain_exactly` does not care about the order which isn't what we want.	2020-07-14 13:37:44 +08:00
Guo Xiang Tan	ce39733b1a	FIX: Incorrect search blurb when advanced search filters are used take2 Also remove include_blurbs attribute which isn't used.	2020-07-14 11:50:40 +08:00
Guo Xiang Tan	0c742dd022	DEV: Simple formatting fix.	2020-07-07 15:46:14 +08:00
Vinoth Kannan	ce1491e830	UX: remove `in:unpinned` filter from advanced search page. (#9911 )	2020-05-29 00:47:28 +05:30
Michael Brown	d9a02d1336	Revert "Revert "Merge branch 'master' of https://github.com/discourse/discourse "" This reverts commit `20780a1eee`. * SECURITY: re-adds accidentally reverted commit: 03d26cd6: ensure embed_url contains valid http(s) uri * when the merge commit `e62a85cf` was reverted, git chose the `2660c2e2` parent to land on instead of the `03d26cd6` parent (which contains security fixes)	2020-05-23 00:56:13 -04:00
Jeff Atwood	20780a1eee	Revert "Merge branch 'master' of https://github.com/discourse/discourse " This reverts commit `e62a85cf6f`, reversing changes made to `2660c2e21d`.	2020-05-22 20:25:56 -07:00
Martin Brennan	df68d11c38	FEATURE: Add topic excerpt max length site setting (#9847 ) Adds a new topic_excerpt_maxlength site setting. * When topic excerpt is requested for a post, use the new topic_excerpt_maxlength site setting to limit the size of the excerpt * Remove code for getting/setting Post.excerpt_size as it is not used anywhere	2020-05-21 13:19:48 +10:00
David Taylor	03818e642a	FEATURE: Include optimized thumbnails for topics (#9215 ) This introduces new APIs for obtaining optimized thumbnails for topics. There are a few building blocks required for this: - Introduces new `image_upload_id` columns on the `posts` and `topics` table. This replaces the old `image_url` column, which means that thumbnails are now restricted to uploads. Hotlinked thumbnails are no longer possible. In normal use (with pull_hotlinked_images enabled), this has no noticeable impact - A migration attempts to match existing urls to upload records. If a match cannot be found then the posts will be queued for rebake - Optimized thumbnails are generated during post_process_cooked. If thumbnails are missing when serializing a topic list, then a sidekiq job is queued - Topic lists and topics now include a `thumbnails` key, which includes all the available images: ``` "thumbnails": [ { "max_width": null, "max_height": null, "url": "//example.com/original-image.png", "width": 1380, "height": 1840 }, { "max_width": 1024, "max_height": 1024, "url": "//example.com/optimized-image.png", "width": 768, "height": 1024 } ] ``` - Themes can request additional thumbnail sizes by using a modifier in their `about.json` file: ``` "modifiers": { "topic_thumbnail_sizes": [ [200, 200], [800, 800] ], ... ``` Remember that these are generated asynchronously, so your theme should include logic to fallback to other available thumbnails if your requested size has not yet been generated - Two new raw plugin outlets are introduced, to improve the customisability of the topic list. `topic-list-before-columns` and `topic-list-before-link`	2020-05-05 09:07:50 +01:00
Sam Saffron	10b37e1e36	FIX: add support for sub-sub category slugs in search Previous to this change slugs for leaves in 3 level nestings would not work. Our UX picks only the last two levels. This also makes the results consistent for slugs as it enforces order.	2020-03-20 15:36:50 +11:00
Jarek Radosz	29b35aa64c	DEV: Improve flaky time-sensitive specs (#9141 )	2020-03-10 22:13:17 +01:00
David Taylor	5b3630dba3	FIX: Do not raise an error when in:all search is performed by anon (#9113 ) Also improve in:all specs to catch similar failures	2020-03-05 17:50:29 +00:00
David Taylor	c344f43211	UX: Admins should only see their own PMs when searching in:all Admins are technically allowed to access all PMs, but it can be confusing to include them all in search. Follow-up to `e0605029dc`	2020-01-28 11:26:42 +00:00
adam j hartz	e0605029dc	FEATURE: allow searching public topics and personal messages simultaneously (#8784 ) The new search modifier `in:all` can be used to include both public and personal messages in the same search. Co-authored-by: adam j hartz <hz@mit.edu>	2020-01-28 10:11:33 +00:00
Mark VanLandingham	c5eec19368	FIX: Featuring topic on other users profile shows their topics (#8769 )	2020-01-22 14:16:17 -06:00
Mark VanLandingham	8c4ffaea1b	FEATURE: Modal for profile featured topic & admin wrench refactor (#8545 )	2019-12-16 08:41:34 -08:00
Neil Lalonde	875f0d8fd8	FEATURE: Tag synonyms This feature adds the ability to define synonyms for tags, and the ability to merge one tag into another while keeping it as a synonym. For example, tags named "js" and "java-script" can be synonyms of "javascript". When searching and creating topics using synonyms, they will be mapped to the base tag. Along with this change is a new UI found on each tag's page (for example, `/tags/javascript`) where more information about the tag can be shown. It will list the synonyms, which categories it's restricted to (if any), and which tag groups it belongs to (if tag group names are public on the `/tags` page by enabling the "tags listed by group" setting). Staff users will be able to manage tags in this UI, merge tags, and add/remove synonyms.	2019-12-04 13:33:51 -05:00
Martin Brennan	e7226a8c84	FEATURE: Allow scoping search to tag (#8345 ) * When viewing a tag, the search widget will now show a checkbox to scope the search by tag, which will limit search results to that tag on desktop and mobile	2019-11-14 10:40:26 +10:00
Krzysztof Kotlarek	427d54b2b0	DEV: Upgrading Discourse to Zeitwerk (#8098 ) Zeitwerk simplifies working with dependencies in dev and makes it easier reloading class chains. We no longer need to use Rails "require_dependency" anywhere and instead can just use standard Ruby patterns to require files. This is a far reaching change and we expect some followups here.	2019-10-02 14:01:53 +10:00
Daniel Waterworth	4ae8065f2c	DEV: Default to skipping creating a topic when fabricating categories (#7976 ) This speeds up the test suite by 9%	2019-08-06 11:26:54 +01:00
Osama Sayegh	5fc5a7f5ae	FEATURE: Add search operator to see all direct messages from a user (#7913 ) * FEATURE: Add search operator to see all direct messages from a user * Only show message if related messages >= 5 * Make "all messages" the hyperlink * Review	2019-07-22 10:55:49 -04:00
Josh Moore	6c5689984f	FEATURE: in:tagged search (srv side) (#7822 ) * FEATURE: in:tagged and in:untagged advanced search filters Similar to in:solved or in:unsolved, the filters check for an existence of the topic_id in the topic_tags table. see: https://meta.discourse.org/t/how-to-search-filter-untagged-topics/119641/2	2019-06-28 18:19:57 +10:00
Sam Saffron	8f7a387aa7	FEATURE: add support for tag group search The behaviour of #TERM in search has been amended 1. We try category or subcategory slugs 2. We try tags 3. We try tag-groups The term `hello #my-group` will search for all posts tagged with any of the tags in the tag group `My Group` Future work may be introducing a slug cache here or caching it in the table but the assumption is that the number of tag groups will not be huge	2019-06-27 17:53:26 +10:00
Penar Musaraj	f51f37eddf	FEATURE: apply a small penalty to closed topics when searching (#7782 )	2019-06-21 12:03:45 +10:00
Daniel Waterworth	90c226949c	prefabricate admin in search_spec.rb	2019-05-10 08:34:04 -04:00
Vinoth Kannan	7869a10d18	Revert "FEATURE: Added unlisted topics option to advanced search (#7447 )" This reverts commit `539723f8ff` since it is failing the build.	2019-05-01 21:06:20 +05:30
Tim Lange	539723f8ff	FEATURE: Added unlisted topics option to advanced search (#7447 )	2019-05-01 12:31:13 +10:00
Sam Saffron	4ea21fa2d0	DEV: use #frozen_string_literal: true on all spec This change both speeds up specs (less strings to allocate) and helps catch cases where methods in Discourse are mutating inputs. Overall we will be migrating everything to use #frozen_string_literal: true it will take a while, but this is the first and safest move in this direction	2019-04-30 10:27:42 +10:00
Sam Saffron	45285f1477	DEV: remove update_attributes which is deprecated in Rails 6 See: https://github.com/rails/rails/pull/31998 update_attributes is a relic of the past, it should no longer be used.	2019-04-29 17:32:25 +10:00
Guo Xiang Tan	c10861da2f	DEV: Fix randomly failing search spec.	2019-04-03 16:42:14 +08:00
Guo Xiang Tan	e87ca59401	FIX: Relevance search will now consider document length in ranking. The default ranking options ranks by the number of matches which is highly problematic when posts are stuffed with a keyword. The ranking will now be divided by the document length which is a much fairer way to rank.	2019-04-01 14:37:45 +08:00
Guo Xiang Tan	dae0bb4c67	FIX: Post blurb incorrect when search contains a phrase match. If the blurb generated is not around the search term, we will not be able to highlight it on the client side.	2019-03-26 17:01:52 +08:00
Guo Xiang Tan	1799820256	DEV: Improve search phrase spec to show that it actually works.	2019-03-26 16:31:15 +08:00
Guo Xiang Tan	bf57f39353	DEV: Remove code that is not used.	2019-03-26 15:36:26 +08:00
Guo Xiang Tan	ac661e856a	FEATURE: Allow categories to be prioritized/deprioritized in search. (#7209 )	2019-03-25 10:59:55 +08:00
Guo Xiang Tan	64f20e7e7a	FIX: Don't ignore category in search when using category filters.	2019-03-19 11:23:14 +08:00
Guo Xiang Tan	5e410dc5e0	FEATURE: Ability to exclude category from search results. (#7194 ) This commit also adds `Category#search_priority` which sets the ground work to enable prioritizing of posts for certain categories when searching.	2019-03-18 15:25:45 +08:00
Guo Xiang Tan	da941840d4	FIX: Advanced search category term should be case insensitive.	2019-03-12 14:11:21 +08:00
Joffrey JAFFEUX	dc4001370c	FEATURE: displays groups in menu search (#7090 )	2019-03-04 10:30:09 +01:00
Sam	0a357299b7	FEATURE: add `f` and `t` search shortcuts for first post / title Previously we had `in:title` and `in:first` search shortcuts for searching in first post or title only. They are a bit of a handful to type. This adds 2 shortcuts (t and f) for searching titles or first posts. This commit also cleans up all advanced filters, they were not properly regex terminated allowing for weird clauses like `in:firstinator` acting the same as `in:first`	2019-02-25 10:55:24 +11:00
Bianca Nenciu	4f3ee86bbd	FIX: in:title should work irrespective of the order. (#6968 )	2019-02-05 10:54:52 +01:00
Arpit Jalan	a121d40771	FIX: do not show PM topics when moving posts to an existing public topic (#6876 )	2019-01-14 15:00:45 +05:30
Gerhard Schlager	c376670bd2	FIX: a search term containing '& could lead to errors This also makes sure that the search term in front or after special characters isn't ignored.	2018-11-21 22:07:56 +01:00
Sam	06b9d8223a	FIX: search within topic not working correctly in CJK We were splitting the term prior to search causing everything to miss	2018-11-07 09:41:55 +11:00
Daniel Hollas	cee51672c9	FIX: Strip accents from search query `4481836` introduced accent stripping in search_indexer, but we need to strip it from the query itself as well. TODO in search with diacritics: - Still need to fix excerpts on search page - need to support accent stripping in in_topic search - need to make sure that in:title works correctly - need to fix "word boldening" in titles	2018-10-23 12:10:33 +11:00
David Taylor	9bf522f227	FEATURE: Mixed case tagging (#6454 ) - By default, behaviour is not changed: tags are made lowercase upon creation and edit. - If force_lowercase_tags is disabled, then mixed case tags are allowed. - Tags must remain case-insensitively unique. This is enforced by ActiveRecord and Postgres. - A migration is added to provide a `UNIQUE` index on `lower(name)`. Migration includes a safety to correct any current tags that do not meet the criteria. - A `where_name` scope is added to `models/tag.rb`, to allow easy case-insensitive lookups. This is used instead of `Tag.where(name: "blah")`. - URLs remain lowercase. Mixed case URLs are functional, but have the lowercase equivalent as the canonical.	2018-10-05 10:23:52 +01:00
Penar Musaraj	70d74f8fc1	FIX: advanced search ordering broken when using tags	2018-09-28 17:27:08 +08:00
Sam	9b7cab589a	FIX: revert diacritic stripping See more details in test case and at: https://meta.discourse.org/t/discourse-should-ignore-if-a-character-is-accented-when-doing-a-search/90198/16?u=sam	2018-08-31 11:46:55 +10:00
Maja Komel	020eba4623	FIX: find tags with non-latin names (#6312 )	2018-08-27 11:05:28 +10:00

1 2 3 4

183 Commits