discourse/spec/components/text_cleaner_spec.rb

# frozen_string_literal: true

require 'rails_helper'
require 'text_cleaner'

# Specs for TextCleaner.
#
# The first group of contexts exercises TextCleaner.clean one option at a
# time: each context first asserts that the input comes back unchanged when
# no option is passed, then asserts the effect of turning a single option on.
# The "title" context covers TextCleaner.clean_title, and the remaining groups
# cover TextCleaner.normalize_whitespaces and invalid byte handling.
describe TextCleaner do

  context "exclamation marks" do

    let(:duplicated_string) { "my precious!!!!" }
    let(:deduplicated_string) { "my precious!" }

    it "ignores multiple ! by default" do
      expect(TextCleaner.clean(duplicated_string)).to eq(duplicated_string)
    end

    it "deduplicates ! when enabled" do
      expect(TextCleaner.clean(duplicated_string, deduplicate_exclamation_marks: true)).to eq(deduplicated_string)
    end

  end

  context "question marks" do

    let(:duplicated_string) { "please help me????" }
    let(:deduplicated_string) { "please help me?" }

    it "ignores multiple ? by default" do
      expect(TextCleaner.clean(duplicated_string)).to eq(duplicated_string)
    end

    it "deduplicates ? when enabled" do
      expect(TextCleaner.clean(duplicated_string, deduplicate_question_marks: true)).to eq(deduplicated_string)
    end

  end

  context "all upper case text" do

    let(:all_caps) { "ENTIRE TEXT IS ALL CAPS" }
    # A single lower case letter ("i") must be enough to leave the text alone.
    let(:almost_all_caps) { "ENTIRE TEXT iS ALL CAPS" }
    let(:regular_case) { "entire text is all caps" }

    it "ignores all upper case text by default" do
      expect(TextCleaner.clean(all_caps)).to eq(all_caps)
    end

    it "replaces all upper case text with regular case letters when enabled" do
      expect(TextCleaner.clean(all_caps, replace_all_upper_case: true)).to eq(regular_case)
    end

    it "ignores almost all upper case text when enabled" do
      expect(TextCleaner.clean(almost_all_caps, replace_all_upper_case: true)).to eq(almost_all_caps)
    end

  end

  context "first letter" do

    let(:lowercased) { "this is awesome" }
    let(:capitalized) { "This is awesome" }
    # Special case: a lower case first letter followed by an upper case one
    # (e.g. a brand name) is expected to be left untouched.
    let(:iletter) { "iLetter" }

    it "ignores first letter case by default" do
      expect(TextCleaner.clean(lowercased)).to eq(lowercased)
      expect(TextCleaner.clean(capitalized)).to eq(capitalized)
      expect(TextCleaner.clean(iletter)).to eq(iletter)
    end

    it "capitalizes first letter when enabled" do
      expect(TextCleaner.clean(lowercased, capitalize_first_letter: true)).to eq(capitalized)
      expect(TextCleaner.clean(capitalized, capitalize_first_letter: true)).to eq(capitalized)
      expect(TextCleaner.clean(iletter, capitalize_first_letter: true)).to eq(iletter)
    end

  end

  context "periods at the end" do

    let(:with_one_period) { "oops." }
    let(:with_several_periods) { "oops..." }
    let(:without_period) { "oops" }

    it "ignores unnecessary periods at the end by default" do
      expect(TextCleaner.clean(with_one_period)).to eq(with_one_period)
      expect(TextCleaner.clean(with_several_periods)).to eq(with_several_periods)
    end

    it "removes unnecessary periods at the end when enabled" do
      expect(TextCleaner.clean(with_one_period, remove_all_periods_from_the_end: true)).to eq(without_period)
      expect(TextCleaner.clean(with_several_periods, remove_all_periods_from_the_end: true)).to eq(without_period)
    end

    # Only the periods go away; whitespace after them is a separate concern
    # (see the strip_whitespaces option below).
    it "keeps trailing whitespaces when enabled" do
      expect(TextCleaner.clean(with_several_periods + " ", remove_all_periods_from_the_end: true)).to eq(without_period + " ")
    end

  end

  context "extraneous space" do

    let(:with_space_exclamation) { "oops !" }
    let(:without_space_exclamation) { "oops!" }
    let(:with_space_question) { "oops ?" }
    let(:without_space_question) { "oops?" }

    it "ignores extraneous space before the end punctuation by default" do
      expect(TextCleaner.clean(with_space_exclamation)).to eq(with_space_exclamation)
      expect(TextCleaner.clean(with_space_question)).to eq(with_space_question)
    end

    it "removes extraneous space before the end punctuation when enabled" do
      expect(TextCleaner.clean(with_space_exclamation, remove_extraneous_space: true)).to eq(without_space_exclamation)
      expect(TextCleaner.clean(with_space_question, remove_extraneous_space: true)).to eq(without_space_question)
    end

    # The space before the punctuation is removed, the one after it is kept.
    it "keep trailing whitespaces when enabled" do
      expect(TextCleaner.clean(with_space_exclamation + " ", remove_extraneous_space: true)).to eq(without_space_exclamation + " ")
      expect(TextCleaner.clean(with_space_question + " ", remove_extraneous_space: true)).to eq(without_space_question + " ")
    end

  end

  context "interior spaces" do

    let(:spacey_string) { "hello     there's weird     spaces here." }
    let(:unspacey_string) { "hello there's weird spaces here." }

    it "ignores interior spaces by default" do
      expect(TextCleaner.clean(spacey_string)).to eq(spacey_string)
    end

    it "fixes interior spaces when enabled" do
      expect(TextCleaner.clean(spacey_string, fixes_interior_spaces: true)).to eq(unspacey_string)
    end

  end

  context "leading and trailing whitespaces" do

    # Mixes spaces, a tab and a newline around the payload.
    let(:spacey_string) { "   \t  test \n  " }
    let(:unspacey_string) { "test" }

    it "ignores leading and trailing whitespaces by default" do
      expect(TextCleaner.clean(spacey_string)).to eq(spacey_string)
    end

    it "strips leading and trailing whitespaces when enabled" do
      expect(TextCleaner.clean(spacey_string, strip_whitespaces: true)).to eq(unspacey_string)
    end

  end

  # TextCleaner.clean_title: the first three examples run without touching any
  # site setting; the nested context turns SiteSetting.title_prettify on.
  context "title" do

    it "fixes interior spaces" do
      expect(TextCleaner.clean_title("Hello   there")).to eq("Hello there")
    end

    it "strips leading and trailing whitespaces" do
      expect(TextCleaner.clean_title(" \t Hello there \n ")).to eq("Hello there")
    end

    it "strips zero width spaces" do
      # The zero width spaces are spelled as explicit \u200B escapes so that
      # they are visible in the source and cannot be silently lost by an
      # editor or a copy/paste, which would make this example pass vacuously.
      # "Hello there" is 11 characters once both U+200B are removed.
      expect(TextCleaner.clean_title("Hello\u200B \u200Bthere")).to eq("Hello there")
      expect(TextCleaner.clean_title("Hello\u200B \u200Bthere").length).to eq(11)
    end

    context "title_prettify site setting is enabled" do

      before { SiteSetting.title_prettify = true }

      it "deduplicates !" do
        expect(TextCleaner.clean_title("Hello there!!!!")).to eq("Hello there!")
      end

      it "deduplicates ?" do
        expect(TextCleaner.clean_title("Hello there????")).to eq("Hello there?")
      end

      it "replaces all upper case text with regular case letters" do
        expect(TextCleaner.clean_title("HELLO THERE")).to eq("Hello there")
      end

      it "doesn't replace all upper case text when uppercase posts are allowed" do
        SiteSetting.allow_uppercase_posts = true
        expect(TextCleaner.clean_title("HELLO THERE")).to eq("HELLO THERE")
      end

      it "capitalizes first letter" do
        expect(TextCleaner.clean_title("hello there")).to eq("Hello there")
      end

      it "removes unnecessary period at the end" do
        expect(TextCleaner.clean_title("Hello there.")).to eq("Hello there")
      end

      it "removes extraneous space before the end punctuation" do
        # The behaviour is driven by its own site setting, so both states are
        # checked explicitly rather than relying on the default.
        SiteSetting.title_remove_extraneous_space = true
        expect(TextCleaner.clean_title("Hello there ?")).to eq("Hello there?")

        SiteSetting.title_remove_extraneous_space = false
        expect(TextCleaner.clean_title("Hello there ?")).to eq("Hello there ?")
      end

      it "replaces all upper case unicode text with regular unicode case letters" do
        expect(TextCleaner.clean_title("INVESTIGAÇÃO POLÍTICA NA CÂMARA")).to eq("Investigação política na câmara")
      end

      it "doesn't downcase text if only one word is upcase in a non-ascii alphabet" do
        expect(TextCleaner.clean_title("«Эта неделя в EVE»")).to eq("«Эта неделя в EVE»")
      end

      it "capitalizes first unicode letter" do
        expect(TextCleaner.clean_title("épico encontro")).to eq("Épico encontro")
      end

      it "correctly cleans Turkish characters" do
        # Before the locale is switched, I/i are mapped to their ASCII
        # counterparts.
        expect(TextCleaner.clean_title("GIDA")).to eq("Gida")
        expect(TextCleaner.clean_title("istanbul")).to eq("Istanbul")

        # With the Turkish locale, dotless ı and dotted İ are expected instead.
        SiteSetting.default_locale = "tr_TR"
        expect(TextCleaner.clean_title("GIDA")).to eq("Gıda")
        expect(TextCleaner.clean_title("istanbul")).to eq("İstanbul")
      end
    end

  end

  # NOTE(review): normalize_whitespaces is invoked on TextCleaner itself below;
  # the "#" prefix in the description is kept as-is so example names stay stable.
  describe "#normalize_whitespaces" do
    it "normalize whitespaces" do
      # A run of Unicode space-like code points, written as escapes so each
      # one is identifiable in the source.
      whitespaces = "\u0020\u00A0\u1680\u180E\u2000\u2001\u2002\u2003\u2004\u2005\u2006\u2007\u2008\u2009\u200A\u2028\u2029\u202F\u205F\u3000"
      # Sanity check: String#strip alone does not empty this string ...
      expect(whitespaces.strip).not_to eq("")
      # ... but it does once the whitespaces have been normalized.
      expect(TextCleaner.normalize_whitespaces(whitespaces).strip).to eq("")
      expect(TextCleaner.normalize_whitespaces(nil)).to be_nil
    end

    it "does not muck with zero width white space" do
      # this is used for khmer, dont mess with it
      expect(TextCleaner.normalize_whitespaces("hello\u200Bworld").strip).to eq("hello\u200Bworld")
      expect(TextCleaner.normalize_whitespaces("hello\uFEFFworld").strip).to eq("hello\uFEFFworld")
    end
  end

  context "invalid byte sequence" do
    # "\x81" appended after a valid multi-byte character is the invalid byte
    # this example expects to be dropped.
    let(:with_invalid_bytes) { "abc\u3042\x81" }
    let(:without_invalid_bytes) { "abc\u3042" }

    it "removes invalid bytes" do
      expect(TextCleaner.clean(with_invalid_bytes)).to eq(without_invalid_bytes)
    end
  end
end
-												DEV: use #frozen_string_literal: true on all spec

This change both speeds up specs (fewer strings to allocate) and helps catch
cases where methods in Discourse mutate their inputs.

Overall, we will be migrating everything to use #frozen_string_literal: true.
It will take a while, but this is the first and safest move in this direction.

											
										
										
											2019-04-30 08:27:42 +08:00
+								# frozen_string_literal: true
-												Prepare for separation of RSpec helper files

Since rspec-rails 3, the default installation creates two helper files:
* `spec_helper.rb`
* `rails_helper.rb`

`spec_helper.rb` is intended as a way of running specs that do not
require Rails, whereas `rails_helper.rb` loads Rails (as Discourse's
current `spec_helper.rb` does).

For more information:

https://www.relishapp.com/rspec/rspec-rails/docs/upgrade#default-helper-files

In this commit, I've simply replaced all instances of `spec_helper` with
`rails_helper`, and renamed the original `spec_helper.rb`.

This brings the Discourse project closer to the standard usage of RSpec
in a Rails app.

At present, every spec relies on loading Rails, but there are likely
many that don't need to. In a future pull request, I hope to introduce a
separate, minimal `spec_helper.rb` which can be used in tests which
don't rely on Rails.

											
										
										
											2015-10-11 17:41:23 +08:00
+								require 'rails_helper'
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								require 'text_cleaner'
 								describe TextCleaner do
 								  context "exclamation marks" do
 								    let(:duplicated_string) { "my precious!!!!" }
 								    let(:deduplicated_string) { "my precious!" }
 								    it "ignores multiple ! by default" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(duplicated_string)).to eq(duplicated_string)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "deduplicates ! when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(duplicated_string, deduplicate_exclamation_marks: true)).to eq(deduplicated_string)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								  end
 								  context "question marks" do
 								    let(:duplicated_string) { "please help me????" }
 								    let(:deduplicated_string) { "please help me?" }
 								    it "ignores multiple ? by default" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(duplicated_string)).to eq(duplicated_string)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "deduplicates ? when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(duplicated_string, deduplicate_question_marks: true)).to eq(deduplicated_string)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								  end
 								  context "all upper case text" do
 								    let(:all_caps) { "ENTIRE TEXT IS ALL CAPS" }
 								    let(:almost_all_caps) { "ENTIRE TEXT iS ALL CAPS" }
 								    let(:regular_case) { "entire text is all caps" }
 								    it "ignores all upper case text by default" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(all_caps)).to eq(all_caps)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "replaces all upper case text with regular case letters when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(all_caps, replace_all_upper_case: true)).to eq(regular_case)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "ignores almost all upper case text when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(almost_all_caps, replace_all_upper_case: true)).to eq(almost_all_caps)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								  end
 								  context "first letter" do
 								    let(:lowercased) { "this is awesome" }
 								    let(:capitalized) { "This is awesome" }
-												Thread title fixer should ignore special cases like iLetter

											
										
										
											2013-05-24 03:31:08 +08:00
+								    let(:iletter) { "iLetter" }
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
 								    it "ignores first letter case by default" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(lowercased)).to eq(lowercased)
 								      expect(TextCleaner.clean(capitalized)).to eq(capitalized)
 								      expect(TextCleaner.clean(iletter)).to eq(iletter)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "capitalizes first letter when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(lowercased, capitalize_first_letter: true)).to eq(capitalized)
 								      expect(TextCleaner.clean(capitalized, capitalize_first_letter: true)).to eq(capitalized)
 								      expect(TextCleaner.clean(iletter, capitalize_first_letter: true)).to eq(iletter)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								  end
-												Text Cleaner now removes all periods from the end of the title

											
										
										
											2013-04-18 06:19:42 +08:00
+								  context "periods at the end" do
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
-												Text Cleaner now removes all periods from the end of the title

											
										
										
											2013-04-18 06:19:42 +08:00
+								    let(:with_one_period) { "oops." }
 								    let(:with_several_periods) { "oops..." }
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    let(:without_period) { "oops" }
-												Text Cleaner now removes all periods from the end of the title

											
										
										
											2013-04-18 06:19:42 +08:00
+								    it "ignores unnecessary periods at the end by default" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(with_one_period)).to eq(with_one_period)
 								      expect(TextCleaner.clean(with_several_periods)).to eq(with_several_periods)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
-												Text Cleaner now removes all periods from the end of the title

											
										
										
											2013-04-18 06:19:42 +08:00
+								    it "removes unnecessary periods at the end when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(with_one_period, remove_all_periods_from_the_end: true)).to eq(without_period)
 								      expect(TextCleaner.clean(with_several_periods, remove_all_periods_from_the_end: true)).to eq(without_period)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "keeps trailing whitespaces when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(with_several_periods + " ", remove_all_periods_from_the_end: true)).to eq(without_period + " ")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								  end
 								  context "extraneous space" do
 								    let(:with_space_exclamation) { "oops !" }
 								    let(:without_space_exclamation) { "oops!" }
 								    let(:with_space_question) { "oops ?" }
 								    let(:without_space_question) { "oops?" }
 								    it "ignores extraneous space before the end punctuation by default" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(with_space_exclamation)).to eq(with_space_exclamation)
 								      expect(TextCleaner.clean(with_space_question)).to eq(with_space_question)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "removes extraneous space before the end punctuation when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(with_space_exclamation, remove_extraneous_space: true)).to eq(without_space_exclamation)
 								      expect(TextCleaner.clean(with_space_question, remove_extraneous_space: true)).to eq(without_space_question)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "keep trailing whitespaces when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(with_space_exclamation + " ", remove_extraneous_space: true)).to eq(without_space_exclamation + " ")
 								      expect(TextCleaner.clean(with_space_question + " ", remove_extraneous_space: true)).to eq(without_space_question + " ")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								  end
 								  context "interior spaces" do
 								    let(:spacey_string) { "hello     there's weird     spaces here." }
 								    let(:unspacey_string) { "hello there's weird spaces here." }
 								    it "ignores interior spaces by default" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(spacey_string)).to eq(spacey_string)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "fixes interior spaces when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(spacey_string, fixes_interior_spaces: true)).to eq(unspacey_string)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								  end
 								  context "leading and trailing whitespaces" do
 								    let(:spacey_string) { "   \t  test \n  " }
 								    let(:unspacey_string) { "test" }
 								    it "ignores leading and trailing whitespaces by default" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(spacey_string)).to eq(spacey_string)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "strips leading and trailing whitespaces when enabled" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean(spacey_string, strip_whitespaces: true)).to eq(unspacey_string)
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								  end
 								  context "title" do
 								    it "fixes interior spaces" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean_title("Hello   there")).to eq("Hello there")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								    it "strips leading and trailing whitespaces" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(TextCleaner.clean_title(" \t Hello there \n ")).to eq("Hello there")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
-												FIX: strip zero width spaces from topic title

											
										
										
											2018-02-21 02:22:36 +08:00
+								    it "strips zero width spaces" do
 								      expect(TextCleaner.clean_title("Hello there")).to eq("Hello there")
 								      expect(TextCleaner.clean_title("Hello there").length).to eq(11)
 								    end
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    context "title_prettify site setting is enabled" do
 								      before { SiteSetting.title_prettify = true }
 								      it "deduplicates !" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								        expect(TextCleaner.clean_title("Hello there!!!!")).to eq("Hello there!")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								      end
 								      it "deduplicates ?" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								        expect(TextCleaner.clean_title("Hello there????")).to eq("Hello there?")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								      end
 								      it "replaces all upper case text with regular case letters" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								        expect(TextCleaner.clean_title("HELLO THERE")).to eq("Hello there")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								      end
-												FIX: allow_uppercase_posts didn't work for topic titles

											
										
										
											2018-10-09 05:50:06 +08:00
+								      it "doesn't replace all upper case text when uppercase posts are allowed" do
 								        SiteSetting.allow_uppercase_posts = true
 								        expect(TextCleaner.clean_title("HELLO THERE")).to eq("HELLO THERE")
 								      end
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								      it "capitalizes first letter" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								        expect(TextCleaner.clean_title("hello there")).to eq("Hello there")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								      end
 								      it "removes unnecessary period at the end" do
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								        expect(TextCleaner.clean_title("Hello there.")).to eq("Hello there")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								      end
 								      it "removes extraneous space before the end punctuation" do
-												FEATURE: English locale with international date formats

Makes en_US the new default locale

											
										
										
											2019-05-16 05:43:00 +08:00
+								        SiteSetting.title_remove_extraneous_space = true
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								        expect(TextCleaner.clean_title("Hello there ?")).to eq("Hello there?")
-												FEATURE: English locale with international date formats

Makes en_US the new default locale

											
										
										
											2019-05-16 05:43:00 +08:00
 								        SiteSetting.title_remove_extraneous_space = false
 								        expect(TextCleaner.clean_title("Hello there ?")).to eq("Hello there ?")
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								      end
-												Add spec to unicode upcase and downcase
											
										
										
											2016-03-08 09:10:49 +08:00
+								      it "replaces all upper case unicode text with regular unicode case letters" do
 								        expect(TextCleaner.clean_title("INVESTIGAÇÃO POLÍTICA NA CÂMARA")).to eq("Investigação política na câmara")
 								      end
-												FIX: Title prettify shouldn't downcase all non-ascii titles

											
										
										
											2017-08-09 01:03:24 +08:00
+								      it "doesn't downcase text if only one word is upcase in a non-ascii alphabet" do
 								        expect(TextCleaner.clean_title("«Эта неделя в EVE»")).to eq("«Эта неделя в EVE»")
 								      end
-												Add spec to unicode upcase and downcase
											
										
										
											2016-03-08 09:10:49 +08:00
+								      it "capitalizes first unicode letter" do
 								        expect(TextCleaner.clean_title("épico encontro")).to eq("Épico encontro")
 								      end
-												Rewrite capitalize for readability

Makes capitalize logic more clear with @sam suggestion

											
										
										
											2016-03-20 20:35:48 +08:00
-												FEATURE: Correctly convert topic title to uppercase and lowercase for Turkish default locale (#13115)


											
										
										
											2021-05-24 16:13:30 +08:00
+								      it "correctly cleans Turkish characters" do
 								        expect(TextCleaner.clean_title("GIDA")).to eq("Gida")
 								        expect(TextCleaner.clean_title("istanbul")).to eq("Istanbul")
 								        SiteSetting.default_locale = "tr_TR"
 								        expect(TextCleaner.clean_title("GIDA")).to eq("Gıda")
 								        expect(TextCleaner.clean_title("istanbul")).to eq("İstanbul")
 								      end
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								    end
 								  end
-												FEATURE: normalize whitespaces in topic title/post content

											
										
										
											2014-08-12 06:01:58 +08:00
+								  describe "#normalize_whitespaces" do
 								    it "normalize whitespaces" do
-												FIX: stop stripping zero-width-whitespace

This char is used for formatting khmer words

											
										
										
											2015-03-27 10:01:31 +08:00
+								      whitespaces = "\u0020\u00A0\u1680\u180E\u2000\u2001\u2002\u2003\u2004\u2005\u2006\u2007\u2008\u2009\u200A\u2028\u2029\u202F\u205F\u3000"
-												few components with rspec3 syntax

											
										
										
											2015-01-10 00:34:37 +08:00
+								      expect(whitespaces.strip).not_to eq("")
 								      expect(TextCleaner.normalize_whitespaces(whitespaces).strip).to eq("")
-												FIX: Skip gsub for normalizing whitespaces when text is nil (#6631)


											
										
										
											2018-11-20 16:12:32 +08:00
+								      expect(TextCleaner.normalize_whitespaces(nil)).to be_nil
-												FEATURE: normalize whitespaces in topic title/post content

											
										
										
											2014-08-12 06:01:58 +08:00
+								    end
-												FIX: stop stripping zero-width-whitespace

This char is used for formatting khmer words

											
										
										
											2015-03-27 10:01:31 +08:00
 								    it "does not muck with zero width white space" do
 								      # this is used for khmer, dont mess with it
 								      expect(TextCleaner.normalize_whitespaces("hello\u200Bworld").strip).to eq("hello\u200Bworld")
 								      expect(TextCleaner.normalize_whitespaces("hello\uFEFFworld").strip).to eq("hello\uFEFFworld")
 								    end
-												FEATURE: normalize whitespaces in topic title/post content

											
										
										
											2014-08-12 06:01:58 +08:00
+								  end
-												FIX: strip invalid byte sequences

											
										
										
											2019-02-26 07:12:34 +08:00
+								  context "invalid byte sequence" do
 								    let(:with_invalid_bytes) { "abc\u3042\x81" }
 								    let(:without_invalid_bytes) { "abc\u3042" }
 								    it "removes invalid bytes" do
 								      expect(TextCleaner.clean(with_invalid_bytes)).to eq(without_invalid_bytes)
 								    end
 								  end
-												auto replace rules in titles

											
										
										
											2013-04-10 17:00:50 +08:00
+								end