mirror of
https://github.com/ruby/ruby.git
synced 2022-11-09 12:17:21 -05:00
| Add encoding conversion (transcoding) from UTF-8 to CESU-8 and back. CESU-8 is an encoding similar to UTF-8, but encodes codepoints above U+FFFF as two surrogates, these surrogates again being encoded as if they were UTF-8 codepoints. This preserves the same binary sorting order as in UTF-16. It is also somewhat similar (although not exactly identical) to an encoding used internally by Java. This completes issue #15995. enc/trans/cesu_8.trans: Add encoding conversion from/to CESU-8; test/ruby/test_transcode.rb: Add tests for above | | |
|---|---|---|
| .. | ||
| CP | ||
| EMOJI | ||
| GB | ||
| JIS | ||
| ucm | ||
| big5-hkscs-tbl.rb | ||
| big5-uao-tbl.rb | ||
| big5.trans | ||
| cesu_8.trans | ||
| chinese.trans | ||
| cp850-tbl.rb | ||
| cp852-tbl.rb | ||
| cp855-tbl.rb | ||
| cp949-tbl.rb | ||
| ebcdic.trans | ||
| emoji-exchange-tbl.rb | ||
| emoji.trans | ||
| emoji_iso2022_kddi.trans | ||
| emoji_sjis_docomo.trans | ||
| emoji_sjis_kddi.trans | ||
| emoji_sjis_softbank.trans | ||
| escape.trans | ||
| euckr-tbl.rb | ||
| gb18030-tbl.rb | ||
| gb18030.trans | ||
| gbk-tbl.rb | ||
| gbk.trans | ||
| ibm437-tbl.rb | ||
| ibm737-tbl.rb | ||
| ibm775-tbl.rb | ||
| ibm852-tbl.rb | ||
| ibm855-tbl.rb | ||
| ibm857-tbl.rb | ||
| ibm860-tbl.rb | ||
| ibm861-tbl.rb | ||
| ibm862-tbl.rb | ||
| ibm863-tbl.rb | ||
| ibm865-tbl.rb | ||
| ibm866-tbl.rb | ||
| ibm869-tbl.rb | ||
| iso-8859-1-tbl.rb | ||
| iso-8859-2-tbl.rb | ||
| iso-8859-3-tbl.rb | ||
| iso-8859-4-tbl.rb | ||
| iso-8859-5-tbl.rb | ||
| iso-8859-6-tbl.rb | ||
| iso-8859-7-tbl.rb | ||
| iso-8859-8-tbl.rb | ||
| iso-8859-9-tbl.rb | ||
| iso-8859-10-tbl.rb | ||
| iso-8859-11-tbl.rb | ||
| iso-8859-13-tbl.rb | ||
| iso-8859-14-tbl.rb | ||
| iso-8859-15-tbl.rb | ||
| iso-8859-16-tbl.rb | ||
| iso2022.trans | ||
| japanese.trans | ||
| japanese_euc.trans | ||
| japanese_sjis.trans | ||
| koi8-r-tbl.rb | ||
| koi8-u-tbl.rb | ||
| korean.trans | ||
| maccroatian-tbl.rb | ||
| maccyrillic-tbl.rb | ||
| macgreek-tbl.rb | ||
| maciceland-tbl.rb | ||
| macroman-tbl.rb | ||
| macromania-tbl.rb | ||
| macturkish-tbl.rb | ||
| macukraine-tbl.rb | ||
| newline.trans | ||
| single_byte.trans | ||
| tis-620-tbl.rb | ||
| transdb.c | ||
| utf8_mac-tbl.rb | ||
| utf8_mac.trans | ||
| utf_16_32.trans | ||
| windows-874-tbl.rb | ||
| windows-1250-tbl.rb | ||
| windows-1251-tbl.rb | ||
| windows-1252-tbl.rb | ||
| windows-1253-tbl.rb | ||
| windows-1254-tbl.rb | ||
| windows-1255-tbl.rb | ||
| windows-1256-tbl.rb | ||
| windows-1257-tbl.rb | ||