PHP 8.2.31
Preview: kconv.rb Size: 8.12 KB
//proc/thread-self/root/opt/alt/ruby18/lib64/ruby/1.8/kconv.rb

#
# kconv.rb - Kanji Converter.
#
# $Id: kconv.rb 11708 2007-02-12 23:01:19Z shyouhei $
#
# ----
#
# kconv.rb implements the Kconv class for Kanji Converter.  Additionally,
# some methods in String classes are added to allow easy conversion.
#

require 'nkf'

#
# Kanji Converter for Ruby.
#
module Kconv
  #
  # Public Constants
  #
  
  #Constant of Encoding
  
  # Auto-Detect
  AUTO = NKF::AUTO
  # ISO-2022-JP
  JIS = NKF::JIS
  # EUC-JP
  EUC = NKF::EUC
  # Shift_JIS
  SJIS = NKF::SJIS
  # BINARY
  BINARY = NKF::BINARY
  # NOCONV
  NOCONV = NKF::NOCONV
  # ASCII
  ASCII = NKF::ASCII
  # UTF-8
  UTF8 = NKF::UTF8
  # UTF-16
  UTF16 = NKF::UTF16
  # UTF-32
  UTF32 = NKF::UTF32
  # UNKNOWN
  UNKNOWN = NKF::UNKNOWN

  #
  # Private Constants
  #
  
  # Revision of kconv.rb
  REVISION = %q$Revision: 11708 $
  
  #Regexp of Encoding
  
  # Regexp of Shift_JIS string (private constant)
  RegexpShiftjis = /\A(?:
		       [\x00-\x7f\xa1-\xdf] |
		       [\x81-\x9f\xe0-\xfc][\x40-\x7e\x80-\xfc] 
		      )*\z/nx

  # Regexp of EUC-JP string (private constant)
  RegexpEucjp = /\A(?:
		    [\x00-\x7f]                         |
		    \x8e        [\xa1-\xdf]             |
		    \x8f        [\xa1-\xfe] [\xa1-\xfe] |
		    [\xa1-\xfe] [\xa1-\xfe]
		   )*\z/nx

  # Regexp of UTF-8 string (private constant)
  RegexpUtf8  = /\A(?:
		    [\x00-\x7f]                                     |
		    [\xc2-\xdf] [\x80-\xbf]                         |
		    \xe0        [\xa0-\xbf] [\x80-\xbf]             |
		    [\xe1-\xef] [\x80-\xbf] [\x80-\xbf]             |
		    \xf0        [\x90-\xbf] [\x80-\xbf] [\x80-\xbf] |
		    [\xf1-\xf3] [\x80-\xbf] [\x80-\xbf] [\x80-\xbf] |
		    \xf4        [\x80-\x8f] [\x80-\xbf] [\x80-\xbf]
		   )*\z/nx

  #
  # Public Methods
  #
  
  # call-seq:
  #    Kconv.kconv(str, out_code, in_code = Kconv::AUTO)
  #
  # Convert <code>str</code> to out_code.
  # <code>out_code</code> and <code>in_code</code> are given as constants of Kconv.
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want to decode them, use NKF.nkf.
  def kconv(str, out_code, in_code = AUTO)
    opt = '-'
    case in_code
    when ::NKF::JIS
      opt << 'J'
    when ::NKF::EUC
      opt << 'E'
    when ::NKF::SJIS
      opt << 'S'
    when ::NKF::UTF8
      opt << 'W'
    when ::NKF::UTF16
      opt << 'W16'
    end

    case out_code
    when ::NKF::JIS
      opt << 'j'
    when ::NKF::EUC
      opt << 'e'
    when ::NKF::SJIS
      opt << 's'
    when ::NKF::UTF8
      opt << 'w'
    when ::NKF::UTF16
      opt << 'w16'
    when ::NKF::NOCONV
      return str
    end

    opt = '' if opt == '-'

    ::NKF::nkf(opt, str)
  end
  module_function :kconv

  #
  # Encode to
  #

  # call-seq:
  #    Kconv.tojis(str)   -> string
  #
  # Convert <code>str</code> to ISO-2022-JP
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-jxm0', str).
  def tojis(str)
    ::NKF::nkf('-jm', str)
  end
  module_function :tojis

  # call-seq:
  #    Kconv.toeuc(str)   -> string
  #
  # Convert <code>str</code> to EUC-JP
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-exm0', str).
  def toeuc(str)
    ::NKF::nkf('-em', str)
  end
  module_function :toeuc

  # call-seq:
  #    Kconv.tosjis(str)   -> string
  #
  # Convert <code>str</code> to Shift_JIS
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-sxm0', str).
  def tosjis(str)
    ::NKF::nkf('-sm', str)
  end
  module_function :tosjis

  # call-seq:
  #    Kconv.toutf8(str)   -> string
  #
  # Convert <code>str</code> to UTF-8
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-wxm0', str).
  def toutf8(str)
    ::NKF::nkf('-wm', str)
  end
  module_function :toutf8

  # call-seq:
  #    Kconv.toutf16(str)   -> string
  #
  # Convert <code>str</code> to UTF-16
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-w16xm0', str).
  def toutf16(str)
    ::NKF::nkf('-w16m', str)
  end
  module_function :toutf16

  #
  # guess
  #

  # call-seq:
  #    Kconv.guess(str)   -> integer
  #
  # Guess input encoding by NKF.guess2
  def guess(str)
    ::NKF::guess(str)
  end
  module_function :guess

  # call-seq:
  #    Kconv.guess_old(str)   -> integer
  #
  # Guess input encoding by NKF.guess1
  def guess_old(str)
    ::NKF::guess1(str)
  end
  module_function :guess_old

  #
  # isEncoding
  #

  # call-seq:
  #    Kconv.iseuc(str)   -> obj or nil
  #
  # Returns whether input encoding is EUC-JP or not.
  #
  # *Note* don't expect this return value is MatchData.
  def iseuc(str)
    RegexpEucjp.match( str )
  end
  module_function :iseuc

  # call-seq:
  #    Kconv.issjis(str)   -> obj or nil
  #
  # Returns whether input encoding is Shift_JIS or not.
  #
  # *Note* don't expect this return value is MatchData.
  def issjis(str)
    RegexpShiftjis.match( str )
  end
  module_function :issjis

  # call-seq:
  #    Kconv.isutf8(str)   -> obj or nil
  #
  # Returns whether input encoding is UTF-8 or not.
  #
  # *Note* don't expect this return value is MatchData.
  def isutf8(str)
    RegexpUtf8.match( str )
  end
  module_function :isutf8

end

class String
  # call-seq:
  #    String#kconv(out_code, in_code = Kconv::AUTO)
  #
  # Convert <code>self</code> to out_code.
  # <code>out_code</code> and <code>in_code</code> are given as constants of Kconv.
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want to decode them, use NKF.nkf.
  def kconv(out_code, in_code=Kconv::AUTO)
    Kconv::kconv(self, out_code, in_code)
  end
  
  #
  # to Encoding
  #
  
  # call-seq:
  #    String#tojis   -> string
  #
  # Convert <code>self</code> to ISO-2022-JP
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-jxm0', str).
  def tojis; Kconv.tojis(self) end

  # call-seq:
  #    String#toeuc   -> string
  #
  # Convert <code>self</code> to EUC-JP
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-exm0', str).
  def toeuc; Kconv.toeuc(self) end

  # call-seq:
  #    String#tosjis   -> string
  #
  # Convert <code>self</code> to Shift_JIS
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-sxm0', str).
  def tosjis; Kconv.tosjis(self) end

  # call-seq:
  #    String#toutf8   -> string
  #
  # Convert <code>self</code> to UTF-8
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-wxm0', str).
  def toutf8; Kconv.toutf8(self) end

  # call-seq:
  #    String#toutf16   -> string
  #
  # Convert <code>self</code> to UTF-16
  #
  # *Note*
  # This method decode MIME encoded string and
  # convert halfwidth katakana to fullwidth katakana.
  # If you don't want it, use NKF.nkf('-w16xm0', str).
  def toutf16; Kconv.toutf16(self) end

  #
  # is Encoding
  #

  # call-seq:
  #    String#iseuc   -> obj or nil
  #
  # Returns whether <code>self</code>'s encoding is EUC-JP or not.
  #
  # *Note* don't expect this return value is MatchData.
  def iseuc;	Kconv.iseuc(self) end

  # call-seq:
  #    String#issjis   -> obj or nil
  #
  # Returns whether <code>self</code>'s encoding is Shift_JIS or not.
  #
  # *Note* don't expect this return value is MatchData.
  def issjis;	Kconv.issjis(self) end

  # call-seq:
  #    String#isutf8   -> obj or nil
  #
  # Returns whether <code>self</code>'s encoding is UTF-8 or not.
  #
  # *Note* don't expect this return value is MatchData.
  def isutf8;	Kconv.isutf8(self) end
end

Directory Contents

Dirs: 27 × Files: 83

Name Size Perms Modified Actions
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
cgi DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
date DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
digest DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
dl DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
drb DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
io DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
irb DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
net DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
openssl DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
optparse DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
racc DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
rdoc DIR
- drwxr-xr-x 2024-03-03 22:48:17
Edit Download
rexml DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
rinda DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
rss DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
runit DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
shell DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
soap DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
test DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
uri DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
webrick DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
wsdl DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
- drwxr-xr-x 2024-03-03 22:50:34
Edit Download
xmlrpc DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
xsd DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
yaml DIR
- drwxr-xr-x 2024-03-03 22:48:14
Edit Download
2.50 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
3.37 KB lrw-r--r-- 2007-07-16 15:47:16
Edit Download
17.73 KB lrw-r--r-- 2008-02-10 15:24:56
Edit Download
6.89 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
73.74 KB lrw-r--r-- 2009-12-14 02:40:07
Edit Download
12.84 KB lrw-r--r-- 2009-08-03 05:59:38
Edit Download
24.46 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
53.02 KB lrw-r--r-- 2010-06-08 04:45:42
Edit Download
128 B lrw-r--r-- 2007-02-12 23:01:19
Edit Download
20.61 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
8.81 KB lrw-r--r-- 2009-07-16 00:35:14
Edit Download
1.12 KB lrw-r--r-- 2007-07-28 00:40:58
Edit Download
19 B lrw-r--r-- 2007-02-12 23:01:19
Edit Download
4.04 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
5.60 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
274 B lrw-r--r-- 2007-02-12 23:01:19
Edit Download
21.38 KB lrw-r--r-- 2009-02-23 17:44:50
Edit Download
487 B lrw-r--r-- 2007-02-12 23:01:19
Edit Download
633 B lrw-r--r-- 2008-02-18 01:17:44
Edit Download
42.23 KB lrw-r--r-- 2011-05-20 22:29:13
Edit Download
5.38 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
1.84 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
6.16 KB lrw-r--r-- 2008-06-06 08:05:24
Edit Download
6.17 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
8.10 KB lrw-r--r-- 2008-04-10 10:52:50
Edit Download
14.88 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
2.25 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
6.43 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
590 B lrw-r--r-- 2007-02-12 23:01:19
Edit Download
21.96 KB lrw-r--r-- 2008-07-12 15:08:29
Edit Download
7.43 KB lrw-r--r-- 2009-08-09 08:44:15
Edit Download
4.30 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
8.12 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
17.59 KB lrw-r--r-- 2011-05-30 02:08:57
Edit Download
1.28 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
5.42 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
27.21 KB lrw-r--r-- 2009-01-24 15:02:50
Edit Download
411 B lrw-r--r-- 2007-03-06 10:09:51
Edit Download
50.65 KB lrw-r--r-- 2010-12-04 06:34:10
Edit Download
7.93 KB lrw-r--r-- 2009-11-25 07:45:29
Edit Download
2.07 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
5.15 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
20.49 KB lrw-r--r-- 2007-10-08 11:16:54
Edit Download
2.10 KB lrw-r--r-- 2009-12-14 04:28:06
Edit Download
575 B lrw-r--r-- 2010-11-22 07:21:45
Edit Download
47.12 KB lrw-r--r-- 2009-02-20 11:43:35
Edit Download
3.35 KB lrw-r--r-- 2009-05-26 12:06:21
Edit Download
1.55 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
1.33 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
29.39 KB lrw-r--r-- 2010-11-23 08:21:08
Edit Download
1.48 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
15.97 KB lrw-r--r-- 2007-06-07 10:06:41
Edit Download
18.33 KB lrw-r--r-- 2007-02-16 19:53:09
Edit Download
90 B lrw-r--r-- 2007-02-12 23:01:19
Edit Download
1.59 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
11.15 KB lrw-r--r-- 2008-06-06 08:05:24
Edit Download
12.05 KB lrw-r--r-- 2010-06-08 05:02:31
Edit Download
835 B lrw-r--r-- 2007-02-12 23:01:19
Edit Download
1.55 KB lrw-r--r-- 2008-08-08 01:58:40
Edit Download
56.83 KB lrw-r--r-- 2010-12-23 03:22:57
Edit Download
504 B lrw-r--r-- 2007-10-21 12:19:43
Edit Download
180 B lrw-r--r-- 2007-02-12 23:01:19
Edit Download
20.63 KB lrw-r--r-- 2009-01-20 03:23:46
Edit Download
4.27 KB lrw-r--r-- 2011-12-10 12:17:33
Edit Download
27.08 KB lrw-r--r-- 2008-06-09 09:20:43
Edit Download
418 B lrw-r--r-- 2007-03-06 10:09:51
Edit Download
4.66 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
3.99 KB lrw-r--r-- 2008-03-21 12:16:15
Edit Download
8.08 KB lrw-r--r-- 2008-07-03 11:14:50
Edit Download
6.09 KB lrw-r--r-- 2009-02-19 16:41:12
Edit Download
4.86 KB lrw-r--r-- 2008-04-21 09:43:44
Edit Download
104 B lrw-r--r-- 2007-02-13 19:39:32
Edit Download
4.32 KB lrw-r--r-- 2010-06-08 07:08:15
Edit Download
31.58 KB lrw-r--r-- 2008-06-06 08:05:24
Edit Download
3.00 KB lrw-r--r-- 2010-06-08 06:24:25
Edit Download
3.69 KB lrw-r--r-- 2009-01-26 02:12:10
Edit Download
2.73 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
7.99 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
4.54 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
710 B lrw-r--r-- 2008-04-15 09:41:47
Edit Download
2.68 KB lrw-r--r-- 2007-02-12 23:01:19
Edit Download
811 B lrw-r--r-- 2007-02-12 23:01:19
Edit Download
12.36 KB lrw-r--r-- 2008-04-19 11:45:39
Edit Download

If ZipArchive is unavailable, a .tar will be created (no compression).