* encoding.c: provide basic features for M17N.
* parse.y: encoding aware parsing.
* parse.y (pragma_encoding): encoding specification pragma.
* parse.y (rb_intern3): encoding specified symbols.
* string.c (rb_str_length): length based on characters.
for older behavior, bytesize method added.
* string.c (rb_str_index_m): index based on characters. rindex as
well.
* string.c (succ_char): encoding aware succeeding string.
* string.c (rb_str_reverse): reverse based on characters.
* string.c (rb_str_inspect): encoding aware string description.
* string.c (rb_str_upcase_bang): encoding aware case conversion.
downcase, capitalize, swapcase as well.
* string.c (rb_str_tr_bang): tr based on characters. delete,
squeeze, tr_s, count as well.
* string.c (rb_str_split_m): split based on characters.
* string.c (rb_str_each_line): encoding aware each_line.
* string.c (rb_str_each_char): added. iteration based on
characters.
* string.c (rb_str_strip_bang): encoding aware whitespace
stripping. lstrip, rstrip as well.
* string.c (rb_str_justify): encoding aware justifying (ljust,
rjust, center).
* string.c (str_encoding): get encoding attribute from a string.
* re.c (rb_reg_initialize): encoding aware regular expression
* sprintf.c (rb_str_format): formatting (i.e. length count) based
on characters.
* io.c (rb_io_getc): getc to return one-character string.
for older behavior, getbyte method added.
* ext/stringio/stringio.c (strio_getc): ditto.
* io.c (rb_io_ungetc): allow pushing arbitrary string at the
current reading point.
* ext/stringio/stringio.c (strio_ungetc): ditto.
* ext/strscan/strscan.c: encoding support.
git-svn-id: svn+ssh://ci.ruby-lang.org/ruby/trunk@13261 b2dd03c8-39d4-4d8f-98ff-823fe69b080e
2007-08-24 23:29:39 -04:00
|
|
|
|
# -*- coding: euc-jp -*-
|
|
|
|
|
#
|
2003-10-16 03:45:51 -04:00
|
|
|
|
# unicodeout.rb --
|
|
|
|
|
#
|
|
|
|
|
# This demonstration script shows how you can produce output (in label
|
|
|
|
|
# widgets) using many different alphabets.
|
|
|
|
|
#
|
|
|
|
|
# based on Tcl/Tk8.4.4 widget demos
|
|
|
|
|
|
|
|
|
|
if defined?($unicodeout_demo) && $unicodeout_demo
|
|
|
|
|
$unicodeout_demo.destroy
|
|
|
|
|
$unicodeout_demo = nil
|
|
|
|
|
end
|
|
|
|
|
|
|
|
|
|
$unicodeout_demo = TkToplevel.new {|w|
|
|
|
|
|
title("Unicode Label Demonstration")
|
|
|
|
|
iconname("unicodeout")
|
|
|
|
|
positionWindow(w)
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
TkLabel.new($unicodeout_demo,
|
2004-10-11 00:51:21 -04:00
|
|
|
|
:font=>$font, :wraplength=>'5.4i', :justify=>:left,
|
|
|
|
|
:text=><<EOL).pack(:side=>:top)
|
2003-10-16 03:45:51 -04:00
|
|
|
|
<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ϡ<EFBFBD>Tk<EFBFBD>ˤ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ʸ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ѥ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ф<EFBFBD><EFBFBD>륵<EFBFBD>ݡ<EFBFBD><EFBFBD>ȤˤĤ<EFBFBD><EFBFBD>Ƥ<EFBFBD>\
|
|
|
|
|
<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ץ<EFBFBD><EFBFBD>Ǥ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ɽ<EFBFBD><EFBFBD><EFBFBD>ˤ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ƥ<EFBFBD><EFBFBD>ʤ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>ºݤˤɤΤ褦<EFBFBD><EFBFBD>ɽ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>\
|
|
|
|
|
<EFBFBD>ܤˤ<EFBFBD><EFBFBD>뤫<EFBFBD>ϡ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>ʤ<EFBFBD><EFBFBD>δĶ<EFBFBD><EFBFBD>ˤɤΤ褦<EFBFBD><EFBFBD>ʸ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>礬<EFBFBD><EFBFBD><EFBFBD>ȡ<EFBFBD><EFBFBD>뤵<EFBFBD><EFBFBD><EFBFBD>Ƥ<EFBFBD><EFBFBD>뤫<EFBFBD><EFBFBD>\
|
|
|
|
|
<EFBFBD>礭<EFBFBD><EFBFBD><EFBFBD><EFBFBD>¸<EFBFBD><EFBFBD><EFBFBD>ޤ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>ޤ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>оݤȤʤ<EFBFBD>ʸ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>礬<EFBFBD><EFBFBD><EFBFBD>ȡ<EFBFBD><EFBFBD>뤵<EFBFBD><EFBFBD><EFBFBD>Ƥ<EFBFBD><EFBFBD>ʤ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>\
|
|
|
|
|
<EFBFBD>ɤΤ褦<EFBFBD><EFBFBD>ɽ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ʤ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>뤫<EFBFBD>⤢<EFBFBD>ʤ<EFBFBD><EFBFBD>δĶ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ǥ<EFBFBD><EFBFBD><EFBFBD>\
|
2003-10-17 18:36:40 -04:00
|
|
|
|
<EFBFBD>֥<EFBFBD><EFBFBD><EFBFBD><EFBFBD>ɻ<EFBFBD><EFBFBD>ȡץܥ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ƥ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ɽ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>\
|
|
|
|
|
Unicodeout_SampleFrame<EFBFBD><EFBFBD><EFBFBD>饹<EFBFBD><EFBFBD>@@font<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>\
|
|
|
|
|
(<EFBFBD>ե<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ƥ<EFBFBD><EFBFBD>ѹ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ޤ<EFBFBD><EFBFBD><EFBFBD>)\
|
|
|
|
|
<EFBFBD>ֺƼ¹ԡץܥ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>Υ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>å<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ƤߤƤ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>
|
2003-10-16 03:45:51 -04:00
|
|
|
|
<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ץȤ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ĥ褦<EFBFBD>ˡ<EFBFBD>ʸ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>\\uXXXX<EFBFBD>Ȥ<EFBFBD><EFBFBD><EFBFBD>\
|
2003-10-17 18:36:40 -04:00
|
|
|
|
Tcl<EFBFBD>Υ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ɽ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ѥ<EFBFBD><EFBFBD><EFBFBD>UNICODEʸ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ǽ<EFBFBD><EFBFBD>Ƥ<EFBFBD><EFBFBD>ޤ<EFBFBD><EFBFBD><EFBFBD>\
|
|
|
|
|
ʸ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ϡ<EFBFBD>Tk::UTF8_String<EFBFBD><EFBFBD>åɤˤ<EFBFBD><EFBFBD>äơ<EFBFBD>\
|
|
|
|
|
<EFBFBD><EFBFBD>UTF8<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ʸ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ǥ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>פȤ<EFBFBD><EFBFBD><EFBFBD>\
|
2003-10-16 03:45:51 -04:00
|
|
|
|
<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ɾ<EFBFBD><EFBFBD><EFBFBD><EFBFBD>դ<EFBFBD><EFBFBD><EFBFBD>ʸ<EFBFBD><EFBFBD><EFBFBD>֥<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>\
|
|
|
|
|
(Tcl<EFBFBD>Υ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ɽ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>Ѵ<EFBFBD><EFBFBD>Ѥ<EFBFBD>)<EFBFBD><EFBFBD><EFBFBD>Ѵ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>\
|
|
|
|
|
<EFBFBD><EFBFBD><EFBFBD>٥륦<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>åȤ<EFBFBD><EFBFBD>Ϥ<EFBFBD><EFBFBD>Ƥ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>դ<EFBFBD><EFBFBD>Ƥ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>
|
|
|
|
|
EOL
|
|
|
|
|
#'
|
|
|
|
|
|
|
|
|
|
TkFrame.new($unicodeout_demo){|f|
|
|
|
|
|
pack(:side=>:bottom, :fill=>:x, :pady=>'2m')
|
|
|
|
|
|
2004-05-01 12:09:54 -04:00
|
|
|
|
TkButton.new(f, :text=>'<27>Ĥ<EFBFBD><C4A4><EFBFBD>', :width=>15, :command=>proc{
|
2004-10-11 00:51:21 -04:00
|
|
|
|
$unicodeout_demo.destroy
|
|
|
|
|
$unicodeout_demo = nil
|
|
|
|
|
}).pack(:side=>:left, :expand=>true)
|
2003-10-16 03:45:51 -04:00
|
|
|
|
|
|
|
|
|
TkButton.new(f, :text=>'<27><><EFBFBD><EFBFBD><EFBFBD>ɻ<EFBFBD><C9BB><EFBFBD>', :width=>15, :command=>proc{
|
2004-10-11 00:51:21 -04:00
|
|
|
|
showCode 'unicodeout'
|
|
|
|
|
}).pack(:side=>:left, :expand=>true)
|
2003-10-16 03:45:51 -04:00
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
wait_msg = TkLabel.new($unicodeout_demo,
|
2004-10-11 00:51:21 -04:00
|
|
|
|
:text=>"<EFBFBD>ե<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>ɤ߹<EFBFBD><EFBFBD>ߤδ<EFBFBD>λ<EFBFBD>ޤ<EFBFBD>" +
|
|
|
|
|
"<EFBFBD><EFBFBD><EFBFBD>Ф餯<EFBFBD><EFBFBD><EFBFBD>Ԥ<EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD><EFBFBD>",
|
|
|
|
|
:font=>"Helvetica 12 italic").pack
|
2003-10-16 03:45:51 -04:00
|
|
|
|
|
|
|
|
|
class Unicodeout_SampleFrame < TkFrame
|
|
|
|
|
@@font = $font
|
2003-10-17 18:36:40 -04:00
|
|
|
|
# @@font = 'Helvetica 14'
|
|
|
|
|
# @@font = 'Courier 12'
|
|
|
|
|
# @@font = 'clearlyu 16'
|
|
|
|
|
# @@font = 'fixed 12'
|
|
|
|
|
# @@font = 'Times 12'
|
|
|
|
|
# @@font = 'Newspaper 12'
|
|
|
|
|
# @@font = '{New century schoolbook} 12'
|
2003-10-16 03:45:51 -04:00
|
|
|
|
|
|
|
|
|
def initialize()
|
|
|
|
|
super($unicodeout_demo)
|
|
|
|
|
grid_columnconfig(1, :weight=>1)
|
|
|
|
|
end
|
|
|
|
|
|
|
|
|
|
def add_sample(lang, *args)
|
|
|
|
|
sample_txt = Tk::UTF8_String(args.join(''))
|
|
|
|
|
l = TkLabel.new(self, :font=>@@font, :text=>lang+':',
|
2004-10-11 00:51:21 -04:00
|
|
|
|
:anchor=>:nw, :pady=>0)
|
2003-10-17 18:36:40 -04:00
|
|
|
|
#s = TkLabel.new(self, :font=>@@font, :text=>sample_txt,
|
2003-10-16 03:45:51 -04:00
|
|
|
|
s = TkLabel.new(self, :font=>TkFont.new(@@font), :text=>sample_txt,
|
2004-10-11 00:51:21 -04:00
|
|
|
|
:anchor=>:nw, :width=>30, :pady=>0)
|
2003-10-16 03:45:51 -04:00
|
|
|
|
Tk.grid(l, s, :sticky=>:ew, :pady=>0)
|
|
|
|
|
l.grid_config(:padx, '1m')
|
|
|
|
|
end
|
|
|
|
|
end
|
|
|
|
|
f = Unicodeout_SampleFrame.new
|
|
|
|
|
f.pack(:expand=>true, :fill=>:both, :padx=>'2m', :pady=>'1m')
|
|
|
|
|
|
|
|
|
|
# Processing when some characters are missing might take a while, so make
|
|
|
|
|
# sure we're displaying something in the meantime...
|
|
|
|
|
|
|
|
|
|
oldCursor = $unicodeout_demo.cursor
|
|
|
|
|
$unicodeout_demo.cursor('watch')
|
|
|
|
|
Tk.update
|
|
|
|
|
|
|
|
|
|
f.add_sample('Arabic',
|
2004-10-11 00:51:21 -04:00
|
|
|
|
'\uFE94\uFEF4\uFE91\uFEAE\uFECC\uFEDF\uFE8D\uFE94',
|
|
|
|
|
'\uFEE4\uFEE0\uFEDC\uFEDF\uFE8D')
|
2003-10-16 03:45:51 -04:00
|
|
|
|
f.add_sample('Trad. Chinese', '\u4E2D\u570B\u7684\u6F22\u5B57')
|
|
|
|
|
f.add_sample('Simpl. Chinese', '\u6C49\u8BED')
|
|
|
|
|
f.add_sample('Greek',
|
2004-10-11 00:51:21 -04:00
|
|
|
|
'\u0395\u03BB\u03BB\u03B7\u03BD\u03B9\u03BA\u03AE ',
|
|
|
|
|
'\u03B3\u03BB\u03CE\u03C3\u03C3\u03B1')
|
2003-10-16 03:45:51 -04:00
|
|
|
|
f.add_sample('Hebrew',
|
2004-10-11 00:51:21 -04:00
|
|
|
|
'\u05DD\u05D9\u05DC\u05E9\u05D5\u05E8\u05D9 ',
|
|
|
|
|
'\u05DC\u05D9\u05D0\u05E8\u05E9\u05D9')
|
2003-10-16 03:45:51 -04:00
|
|
|
|
f.add_sample('Japanese',
|
2004-10-11 00:51:21 -04:00
|
|
|
|
'\u65E5\u672C\u8A9E\u306E\u3072\u3089\u304C\u306A, ',
|
|
|
|
|
'\u6F22\u5B57\u3068\u30AB\u30BF\u30AB\u30CA')
|
2003-10-16 03:45:51 -04:00
|
|
|
|
f.add_sample('Korean', '\uB300\uD55C\uBBFC\uAD6D\uC758 \uD55C\uAE00')
|
|
|
|
|
f.add_sample('Russian',
|
2004-10-11 00:51:21 -04:00
|
|
|
|
'\u0420\u0443\u0441\u0441\u043A\u0438\u0439 ',
|
|
|
|
|
'\u044F\u0437\u044B\u043A')
|
2003-10-16 03:45:51 -04:00
|
|
|
|
|
|
|
|
|
wait_msg.destroy
|
|
|
|
|
$unicodeout_demo.cursor(oldCursor)
|