discourse/lib/encodings.rb
Sam Saffron 30990006a9 DEV: enable frozen string literal on all files
This reduces chances of errors where consumers of strings mutate inputs
and reduces memory usage of the app.

Test suite passes now, but there may be some stuff left, so we will run
a few sites on a branch prior to merging
2019-05-13 09:31:32 +08:00

36 lines
999 B
Ruby

# frozen_string_literal: true
require 'rchardet'
module Encodings
def self.to_utf8(string)
result = CharDet.detect(string)
encoded_string = try_utf8(string, result['encoding']) if result && result['encoding']
encoded_string = force_utf8(string) if encoded_string.nil?
encoded_string
end
def self.try_utf8(string, source_encoding)
encoded = string.encode(Encoding::UTF_8, source_encoding)
encoded&.valid_encoding? ? delete_bom!(encoded) : nil
rescue Encoding::InvalidByteSequenceError,
Encoding::UndefinedConversionError,
Encoding::ConverterNotFoundError
nil
end
def self.force_utf8(string)
encoded_string = string.encode(Encoding::UTF_8,
undef: :replace,
invalid: :replace,
replace: '')
delete_bom!(encoded_string)
end
def self.delete_bom!(string)
string.sub!(/\A\xEF\xBB\xBF/, '') unless string.blank?
string
end
end