# frozen_string_literal: true

require "active_support/multibyte"

class String
  # == Multibyte proxy
  #
  # +mb_chars+ is a multibyte safe proxy for string methods.
  #
  # It creates and returns an instance of the class configured as
  # ActiveSupport::Multibyte.proxy_class (ActiveSupport::Multibyte::Chars by default), which
  # encapsulates the original string. Unicode safe versions of all the String methods are defined on this proxy
  # class. If the proxy class doesn't respond to a certain method, it's forwarded to the encapsulated string.
  #
  #   >> "lj".upcase
  #   => "LJ"
  #   >> "lj".mb_chars.upcase.to_s
  #   => "LJ"
  #
  # == Method chaining
  #
  # All the methods on the Chars proxy which normally return a string will return a Chars object. This allows
  # method chaining on the result of any of these methods.
  #
  #   name.mb_chars.reverse.length # => 12
  #
  # == Interoperability and configuration
  #
  # The Chars object tries to be as interchangeable with String objects as possible: sorting and comparing between
  # String and Chars work as expected. The bang! methods change the internal string representation in the Chars
  # object. Interoperability problems can be resolved easily with a +to_s+ call.
  #
  # For more information about the methods defined on the Chars proxy see ActiveSupport::Multibyte::Chars. For
  # information about how to change the default Multibyte behavior see ActiveSupport::Multibyte.
  def mb_chars
    ActiveSupport::Multibyte.proxy_class.new(self)
  end

  # Returns +true+ if the string's bytes form valid UTF-8.
  #
  # * A string tagged as UTF-8 is checked for validity directly.
  # * A string tagged as binary (ASCII-8BIT) or US-ASCII is checked by
  #   reinterpreting a copy of it as UTF-8; the receiver itself is not modified.
  # * A string in any other encoding always returns +false+.
  #
  #   utf_8_str = "some string".encode "UTF-8"
  #   iso_str = "some string".encode "ISO-8859-1"
  #
  #   utf_8_str.is_utf8? # => true
  #   iso_str.is_utf8?   # => false
  def is_utf8?
    case encoding
    when Encoding::UTF_8
      valid_encoding?
    when Encoding::ASCII_8BIT, Encoding::US_ASCII
      # force_encoding mutates its receiver, so work on a duplicate.
      dup.force_encoding(Encoding::UTF_8).valid_encoding?
    else
      false
    end
  end
end