# File xsd/charset.rb, line 116
# Returns the CharsetMap entry stored under the upper-cased +encoding+.
# The result for an unregistered encoding is whatever CharsetMap#[] yields
# for a missing key.
def Charset.charset_label(encoding)
  normalized = encoding.upcase
  CharsetMap[normalized]
end
# File xsd/charset.rb, line 120
# Reverse lookup in CharsetMap: returns the key whose value equals the
# down-cased +label+, or 'X_UNKNOWN' when the lookup yields nothing.
def Charset.charset_str(label)
  # Prefer #key when CharsetMap responds to it; otherwise fall back to #index.
  finder = CharsetMap.respond_to?(:key) ? :key : :index
  found = CharsetMap.send(finder, label.downcase)
  found || 'X_UNKNOWN'
end
handlers
# File xsd/charset.rb, line 84
# Reader for the module-level @internal_encoding value (the encoding name
# used as the "internal" side by encoding_from_xml / encoding_to_xml).
def Charset.encoding
  @internal_encoding
end
# File xsd/charset.rb, line 88
# Writer for @internal_encoding. When $DEBUG is set, a warning naming the
# new value is emitted before the assignment.
def Charset.encoding=(encoding)
  if $DEBUG
    warn("xsd charset is set to #{encoding}")
  end
  @internal_encoding = encoding
end
# File xsd/charset.rb, line 105
# Converts +str+ from +enc_from+ to +enc_to+ using the converter registered
# in EncodingConvertMap under the [enc_from, enc_to] pair.
#
# Returns +str+ itself, unconverted, when both encodings are equal or when
# either one is 'NONE'. Raises CharsetConversionError when no converter is
# registered for the pair.
def Charset.encoding_conv(str, enc_from, enc_to)
  # Nothing to convert: identical encodings, or one side is 'NONE'.
  return str if enc_from == enc_to || enc_from == 'NONE' || enc_to == 'NONE'

  pair = [enc_from, enc_to]
  handler = EncodingConvertMap[pair]
  unless handler
    raise CharsetConversionError.new(
      "Converter not found: #{enc_from} -> #{enc_to}")
  end
  handler.call(str)
end
# File xsd/charset.rb, line 101
# Converts +str+ from the encoding named by the label +charset+ (resolved
# through charset_str) into @internal_encoding, via encoding_conv.
def Charset.encoding_from_xml(str, charset)
  source_enc = charset_str(charset)
  encoding_conv(str, source_enc, @internal_encoding)
end
# File xsd/charset.rb, line 97
# Converts +str+ from @internal_encoding into the encoding named by the
# label +charset+ (resolved through charset_str), via encoding_conv.
def Charset.encoding_to_xml(str, charset)
  target_enc = charset_str(charset)
  encoding_conv(str, @internal_encoding, target_enc)
end
# File xsd/charset.rb, line 26
# Populates EncodingConvertMap with the converters available in this
# environment and, when a UTF-8 capable backend loads, sets
# @internal_encoding to 'UTF8'.
#
# * UTF8 <-> X_ISO8859_1 converters are always registered (pure
#   unpack/pack, no library needed).
# * If 'xsd/iconvcharset' can be required, all UTF8/EUC/SJIS converters
#   delegate to IconvCharset.safe_iconv.
# * Otherwise 'nkf' (EUC <-> SJIS) and 'uconv' (UTF8 <-> EUC/SJIS) are each
#   tried independently; a library that fails to load is silently skipped.
def Charset.init
  EncodingConvertMap[['UTF8', 'X_ISO8859_1']] =
    Proc.new { |text| text.unpack('U*').pack('C*') }
  EncodingConvertMap[['X_ISO8859_1', 'UTF8']] =
    Proc.new { |text| text.unpack('C*').pack('U*') }

  # Probe for the iconv-backed helper first; everything else is a fallback.
  have_iconv =
    begin
      require 'xsd/iconvcharset'
      true
    rescue LoadError
      false
    end

  if have_iconv
    @internal_encoding = 'UTF8'
    # The Shift_JIS codec name passed to iconv depends on the platform.
    if /(mswin|bccwin|mingw|cygwin|emx)/ =~ RUBY_PLATFORM
      sjis_name = 'cp932'
    else
      sjis_name = 'shift_jis'
    end
    EncodingConvertMap[['UTF8', 'EUC']] =
      Proc.new { |text| IconvCharset.safe_iconv("euc-jp", "utf-8", text) }
    EncodingConvertMap[['EUC', 'UTF8']] =
      Proc.new { |text| IconvCharset.safe_iconv("utf-8", "euc-jp", text) }
    EncodingConvertMap[['EUC', 'SJIS']] =
      Proc.new { |text| IconvCharset.safe_iconv(sjis_name, "euc-jp", text) }
    EncodingConvertMap[['UTF8', 'SJIS']] =
      Proc.new { |text| IconvCharset.safe_iconv(sjis_name, "utf-8", text) }
    EncodingConvertMap[['SJIS', 'UTF8']] =
      Proc.new { |text| IconvCharset.safe_iconv("utf-8", sjis_name, text) }
    EncodingConvertMap[['SJIS', 'EUC']] =
      Proc.new { |text| IconvCharset.safe_iconv("euc-jp", sjis_name, text) }
  else
    # NKF covers only the EUC <-> SJIS pair.
    begin
      require 'nkf'
      EncodingConvertMap[['EUC', 'SJIS']] =
        Proc.new { |text| NKF.nkf('-sXm0', text) }
      EncodingConvertMap[['SJIS', 'EUC']] =
        Proc.new { |text| NKF.nkf('-eXm0', text) }
    rescue LoadError
    end
    # Uconv supplies the UTF-8 conversions and makes UTF8 the internal encoding.
    begin
      require 'uconv'
      @internal_encoding = 'UTF8'
      EncodingConvertMap[['UTF8', 'EUC']] = Uconv.method(:u8toeuc)
      EncodingConvertMap[['UTF8', 'SJIS']] = Uconv.method(:u8tosjis)
      EncodingConvertMap[['EUC', 'UTF8']] = Uconv.method(:euctou8)
      EncodingConvertMap[['SJIS', 'UTF8']] = Uconv.method(:sjistou8)
    rescue LoadError
    end
  end
end
# File xsd/charset.rb, line 170
# Dispatches to the checker matching +code+ and returns its result:
# 'NONE' -> is_us_ascii, 'UTF8' -> is_utf8, 'EUC' -> is_euc,
# 'SJIS' -> is_sjis. +code+ defaults to the value of $KCODE.
#
# Raises UnknownCharsetError for any other +code+.
def Charset.is_ces(str, code = $KCODE)
  return is_us_ascii(str) if 'NONE' == code
  return is_utf8(str) if 'UTF8' == code
  return is_euc(str) if 'EUC' == code
  return is_sjis(str) if 'SJIS' == code

  raise UnknownCharsetError.new("Unknown charset: #{code}")
end
# File xsd/charset.rb, line 162
# Tests +str+ against EUCRegexp and returns the result of the =~ match
# (nil when there is no match).
def Charset.is_euc(str)
  EUCRegexp =~ str
end
# File xsd/charset.rb, line 166
# Tests +str+ against SJISRegexp and returns the result of the =~ match
# (nil when there is no match).
def Charset.is_sjis(str)
  SJISRegexp =~ str
end
# File xsd/charset.rb, line 154
# Tests +str+ against USASCIIRegexp and returns the result of the =~ match
# (nil when there is no match).
def Charset.is_us_ascii(str)
  USASCIIRegexp =~ str
end
Commenting is here to help enhance the documentation, for example with code samples or clarifications of the documentation.
If you have questions about Ruby or the documentation, please post to one of the Ruby mailing lists. You will get better, faster help that way.
If you wish to post a correction of the docs, please do so, but also file a bug report so that it can be corrected for the next release. Thank you.
If you want to help improve the Ruby documentation, please see Improve the docs, or visit Documenting-ruby.org.