Module XSD::Charset
In: xsd/charset.rb

Methods

Classes and Modules

Class XSD::Charset::CharsetConversionError
Class XSD::Charset::CharsetError
Class XSD::Charset::UnknownCharsetError
Class XSD::Charset::XSDError

Constants

EncodingConvertMap = {}   Maps [source encoding, target encoding] pairs to converter callables; populated by Charset.init
CharsetMap = { 'NONE' => 'us-ascii', 'EUC' => 'euc-jp', 'SJIS' => 'shift_jis', 'UTF8' => 'utf-8', 'X_ISO_8859_1' => 'iso-8859-1', 'X_UNKNOWN' => nil, }
USASCIIRegexp = Regexp.new("\\A#{us_ascii}*\\z", nil, "NONE")
EUCRegexp = Regexp.new("\\A#{character_euc}*\\z", nil, "NONE")
SJISRegexp = Regexp.new("\\A#{character_sjis}*\\z", nil, "NONE")
UTF8Regexp = Regexp.new("\\A#{character_utf8}*\\z", nil, "NONE")

Public Class methods

[Source]

# File xsd/charset.rb, line 116
  # Translates an internal encoding name into its charset label by looking
  # it up in CharsetMap. The name is upcased first, so the lookup ignores
  # case. Returns whatever CharsetMap holds for that key (nil for
  # 'X_UNKNOWN' and for names that are not keys of the map).
  def Charset.charset_label(encoding)
    map_key = encoding.upcase
    CharsetMap[map_key]
  end

[Source]

# File xsd/charset.rb, line 120
  # Reverse of charset_label: finds the CharsetMap key whose value equals
  # the downcased +label+. Returns 'X_UNKNOWN' when no entry matches.
  def Charset.charset_str(label)
    # Use Hash#key where the running Ruby provides it, Hash#index otherwise.
    reverse_lookup = CharsetMap.respond_to?(:key) ? :key : :index
    CharsetMap.__send__(reverse_lookup, label.downcase) || 'X_UNKNOWN'
  end

handlers

[Source]

# File xsd/charset.rb, line 84
  # Reader for the module-level internal encoding (@internal_encoding).
  def Charset.encoding
    current = @internal_encoding
    current
  end

[Source]

# File xsd/charset.rb, line 88
  # Writer for the module-level internal encoding. When $DEBUG is set, the
  # new value is reported through Kernel#warn before it is stored.
  def Charset.encoding=(encoding)
    if $DEBUG
      warn("xsd charset is set to #{encoding}")
    end
    @internal_encoding = encoding
  end

[Source]

# File xsd/charset.rb, line 105
  # Converts +str+ from +enc_from+ to +enc_to+ using the converter
  # registered in EncodingConvertMap under the key [enc_from, enc_to].
  #
  # Returns +str+ itself, unconverted, when both encodings are equal or when
  # either one is 'NONE'. Raises CharsetConversionError when no converter is
  # registered for the pair.
  def Charset.encoding_conv(str, enc_from, enc_to)
    # Nothing to do: identical encodings, or one side is 'NONE'.
    return str if enc_from == enc_to || enc_from == 'NONE' || enc_to == 'NONE'

    converter = EncodingConvertMap[[enc_from, enc_to]]
    unless converter
      raise CharsetConversionError.new(
        "Converter not found: #{enc_from} -> #{enc_to}")
    end
    converter.call(str)
  end

[Source]

# File xsd/charset.rb, line 101
  # Converts +str+ from the encoding named by the charset label +charset+
  # into the module's internal encoding. The label is mapped to an encoding
  # name with charset_str; the conversion is delegated to encoding_conv.
  def Charset.encoding_from_xml(str, charset)
    source_encoding = charset_str(charset)
    encoding_conv(str, source_encoding, @internal_encoding)
  end

[Source]

# File xsd/charset.rb, line 97
  # Converts +str+ from the module's internal encoding into the encoding
  # named by the charset label +charset+. The label is mapped to an encoding
  # name with charset_str; the conversion is delegated to encoding_conv.
  def Charset.encoding_to_xml(str, charset)
    target_encoding = charset_str(charset)
    encoding_conv(str, @internal_encoding, target_encoding)
  end

[Source]

# File xsd/charset.rb, line 26
  # Fills EncodingConvertMap with every converter that can be provided in
  # the running environment. Keys are [source, target] encoding-name pairs,
  # values are callables taking the string to convert.
  #
  # * UTF8 <-> ISO-8859-1 is always registered (pure Ruby, pack/unpack).
  # * If 'xsd/iconvcharset' loads, the UTF8/EUC/SJIS converters are backed
  #   by IconvCharset.safe_iconv and the internal encoding becomes 'UTF8'.
  # * Otherwise 'nkf' (EUC <-> SJIS) and 'uconv' (UTF8 <-> EUC/SJIS) are
  #   each tried independently; a library that fails to load is skipped and
  #   its converters are simply not registered. Loading 'uconv' also sets
  #   the internal encoding to 'UTF8'.
  def Charset.init
    utf8_to_latin1 = Proc.new { |str| str.unpack('U*').pack('C*') }
    latin1_to_utf8 = Proc.new { |str| str.unpack('C*').pack('U*') }
    # charset_str returns CharsetMap's key, which is spelled 'X_ISO_8859_1'.
    # The converters used to be registered only as 'X_ISO8859_1', so
    # encoding_conv never found them for the 'iso-8859-1' label. Register
    # the CharsetMap spelling, and keep the old one for code that passes it
    # to encoding_conv directly.
    ['X_ISO_8859_1', 'X_ISO8859_1'].each do |latin1|
      EncodingConvertMap[['UTF8', latin1]] = utf8_to_latin1
      EncodingConvertMap[[latin1, 'UTF8']] = latin1_to_utf8
    end
    begin
      require 'xsd/iconvcharset'
      @internal_encoding = 'UTF8'
      # On Windows-like platforms the Shift_JIS converters use 'cp932'.
      sjtag = (/(mswin|bccwin|mingw|cygwin|emx)/ =~ RUBY_PLATFORM) ? 'cp932' :
        'shift_jis'
      # NOTE(review): safe_iconv appears to take (to, from, str), judging by
      # how the arguments line up with the map keys - confirm in iconvcharset.
      EncodingConvertMap[['UTF8', 'EUC' ]] =
        Proc.new { |str| IconvCharset.safe_iconv("euc-jp", "utf-8", str) }
      EncodingConvertMap[['EUC' , 'UTF8']] =
        Proc.new { |str| IconvCharset.safe_iconv("utf-8", "euc-jp", str) }
      EncodingConvertMap[['EUC' , 'SJIS']] =
        Proc.new { |str| IconvCharset.safe_iconv(sjtag, "euc-jp", str) }
      EncodingConvertMap[['UTF8', 'SJIS']] =
        Proc.new { |str| IconvCharset.safe_iconv(sjtag, "utf-8", str) }
      EncodingConvertMap[['SJIS', 'UTF8']] =
        Proc.new { |str| IconvCharset.safe_iconv("utf-8", sjtag, str) }
      EncodingConvertMap[['SJIS', 'EUC' ]] =
        Proc.new { |str| IconvCharset.safe_iconv("euc-jp", sjtag, str) }
    rescue LoadError
      # No iconv wrapper available: fall back to the optional libraries.
      begin
        require 'nkf'
        EncodingConvertMap[['EUC' , 'SJIS']] =
          Proc.new { |str| NKF.nkf('-sXm0', str) }
        EncodingConvertMap[['SJIS', 'EUC' ]] =
          Proc.new { |str| NKF.nkf('-eXm0', str) }
      rescue LoadError
        # nkf is optional; EUC <-> SJIS stays unregistered without it.
      end

      begin
        require 'uconv'
        @internal_encoding = 'UTF8'
        EncodingConvertMap[['UTF8', 'EUC' ]] = Uconv.method(:u8toeuc)
        EncodingConvertMap[['UTF8', 'SJIS']] = Uconv.method(:u8tosjis)
        EncodingConvertMap[['EUC' , 'UTF8']] = Uconv.method(:euctou8)
        EncodingConvertMap[['SJIS', 'UTF8']] = Uconv.method(:sjistou8)
      rescue LoadError
        # uconv is optional; the UTF8 <-> EUC/SJIS pairs stay unregistered.
      end
    end
  end

[Source]

# File xsd/charset.rb, line 170
  # Checks +str+ against the character-encoding test selected by +code+
  # ('NONE', 'UTF8', 'EUC' or 'SJIS') and returns that test's result.
  # Raises UnknownCharsetError for any other +code+.
  #
  # NOTE(review): +code+ defaults to $KCODE; on Rubies where $KCODE is no
  # longer effective the default would land in the error branch - confirm
  # that callers pass +code+ explicitly there.
  def Charset.is_ces(str, code = $KCODE)
    case code
    when 'NONE' then is_us_ascii(str)
    when 'UTF8' then is_utf8(str)
    when 'EUC'  then is_euc(str)
    when 'SJIS' then is_sjis(str)
    else
      raise UnknownCharsetError.new("Unknown charset: #{code}")
    end
  end

[Source]

# File xsd/charset.rb, line 162
  # Matches +str+ against EUCRegexp and returns the result of Regexp#=~
  # (the match offset on success, nil otherwise).
  def Charset.is_euc(str)
    match_offset = (EUCRegexp =~ str)
    match_offset
  end

[Source]

# File xsd/charset.rb, line 166
  # Matches +str+ against SJISRegexp and returns the result of Regexp#=~
  # (the match offset on success, nil otherwise).
  def Charset.is_sjis(str)
    match_offset = (SJISRegexp =~ str)
    match_offset
  end

[Source]

# File xsd/charset.rb, line 154
  # Matches +str+ against USASCIIRegexp and returns the result of Regexp#=~
  # (the match offset on success, nil otherwise).
  def Charset.is_us_ascii(str)
    match_offset = (USASCIIRegexp =~ str)
    match_offset
  end

[Source]

# File xsd/charset.rb, line 158
  # Matches +str+ against UTF8Regexp and returns the result of Regexp#=~
  # (the match offset on success, nil otherwise).
  def Charset.is_utf8(str)
    match_offset = (UTF8Regexp =~ str)
    match_offset
  end

[Source]

# File xsd/charset.rb, line 93
  # Returns the charset label (as produced by charset_label) for the
  # module's current internal encoding.
  def Charset.xml_encoding_label
    internal = @internal_encoding
    charset_label(internal)
  end

[Validate]