1140 lines
27 KiB
Perl
1140 lines
27 KiB
Perl
#! /bin/false
|
|
# vim: set autoindent shiftwidth=4 tabstop=4:
|
|
|
|
# Conversion routines for KOI8-RU.
|
|
# Copyright (C) 2002-2017 Guido Flohr <guido.flohr@cantanea.com>,
|
|
# all rights reserved.
|
|
|
|
# This program is free software: you can redistribute it and/or modify
|
|
# it under the terms of the GNU General Public License as published by
|
|
# the Free Software Foundation; either version 3 of the License, or
|
|
# (at your option) any later version.
|
|
|
|
# This program is distributed in the hope that it will be useful,
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
# GNU General Public License for more details.
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
# along with this program. If not, see <http://www.gnu.org/licenses/>.
|
|
|
|
package Locale::RecodeData::KOI8_RU;
|
|
|
|
use strict;
|
|
|
|
require Locale::RecodeData;
|
|
use base qw(Locale::RecodeData);
|
|
|
|
my @to_ucs4 = (
|
|
0x0000,
|
|
0x0001,
|
|
0x0002,
|
|
0x0003,
|
|
0x0004,
|
|
0x0005,
|
|
0x0006,
|
|
0x0007,
|
|
0x0008,
|
|
0x0009,
|
|
0x000a,
|
|
0x000b,
|
|
0x000c,
|
|
0x000d,
|
|
0x000e,
|
|
0x000f,
|
|
0x0010,
|
|
0x0011,
|
|
0x0012,
|
|
0x0013,
|
|
0x0014,
|
|
0x0015,
|
|
0x0016,
|
|
0x0017,
|
|
0x0018,
|
|
0x0019,
|
|
0x001a,
|
|
0x001b,
|
|
0x001c,
|
|
0x001d,
|
|
0x001e,
|
|
0x001f,
|
|
0x0020,
|
|
0x0021,
|
|
0x0022,
|
|
0x0023,
|
|
0x0024,
|
|
0x0025,
|
|
0x0026,
|
|
0x0027,
|
|
0x0028,
|
|
0x0029,
|
|
0x002a,
|
|
0x002b,
|
|
0x002c,
|
|
0x002d,
|
|
0x002e,
|
|
0x002f,
|
|
0x0030,
|
|
0x0031,
|
|
0x0032,
|
|
0x0033,
|
|
0x0034,
|
|
0x0035,
|
|
0x0036,
|
|
0x0037,
|
|
0x0038,
|
|
0x0039,
|
|
0x003a,
|
|
0x003b,
|
|
0x003c,
|
|
0x003d,
|
|
0x003e,
|
|
0x003f,
|
|
0x0040,
|
|
0x0041,
|
|
0x0042,
|
|
0x0043,
|
|
0x0044,
|
|
0x0045,
|
|
0x0046,
|
|
0x0047,
|
|
0x0048,
|
|
0x0049,
|
|
0x004a,
|
|
0x004b,
|
|
0x004c,
|
|
0x004d,
|
|
0x004e,
|
|
0x004f,
|
|
0x0050,
|
|
0x0051,
|
|
0x0052,
|
|
0x0053,
|
|
0x0054,
|
|
0x0055,
|
|
0x0056,
|
|
0x0057,
|
|
0x0058,
|
|
0x0059,
|
|
0x005a,
|
|
0x005b,
|
|
0x005c,
|
|
0x005d,
|
|
0x005e,
|
|
0x005f,
|
|
0x0060,
|
|
0x0061,
|
|
0x0062,
|
|
0x0063,
|
|
0x0064,
|
|
0x0065,
|
|
0x0066,
|
|
0x0067,
|
|
0x0068,
|
|
0x0069,
|
|
0x006a,
|
|
0x006b,
|
|
0x006c,
|
|
0x006d,
|
|
0x006e,
|
|
0x006f,
|
|
0x0070,
|
|
0x0071,
|
|
0x0072,
|
|
0x0073,
|
|
0x0074,
|
|
0x0075,
|
|
0x0076,
|
|
0x0077,
|
|
0x0078,
|
|
0x0079,
|
|
0x007a,
|
|
0x007b,
|
|
0x007c,
|
|
0x007d,
|
|
0x007e,
|
|
0x007f,
|
|
0x2500,
|
|
0x2502,
|
|
0x250c,
|
|
0x2510,
|
|
0x2514,
|
|
0x2518,
|
|
0x251c,
|
|
0x2524,
|
|
0x252c,
|
|
0x2534,
|
|
0x253c,
|
|
0x2580,
|
|
0x2584,
|
|
0x2588,
|
|
0x258c,
|
|
0x2590,
|
|
0x2591,
|
|
0x2592,
|
|
0x2593,
|
|
0x2320,
|
|
0x25a0,
|
|
0x2219,
|
|
0x221a,
|
|
0x2248,
|
|
0x2264,
|
|
0x2265,
|
|
0x00a0,
|
|
0x2321,
|
|
0x00b0,
|
|
0x00b2,
|
|
0x00b7,
|
|
0x00f7,
|
|
0x2550,
|
|
0x2551,
|
|
0x2552,
|
|
0x0451,
|
|
0x0454,
|
|
0x2554,
|
|
0x0456,
|
|
0x0457,
|
|
0x2557,
|
|
0x2558,
|
|
0x2559,
|
|
0x255a,
|
|
0x255b,
|
|
0x0491,
|
|
0x045e,
|
|
0x255e,
|
|
0x255f,
|
|
0x2560,
|
|
0x2561,
|
|
0x0401,
|
|
0x0404,
|
|
0x2563,
|
|
0x0406,
|
|
0x0407,
|
|
0x2566,
|
|
0x2567,
|
|
0x2568,
|
|
0x2569,
|
|
0x256a,
|
|
0x0490,
|
|
0x040e,
|
|
0x00a9,
|
|
0x044e,
|
|
0x0430,
|
|
0x0431,
|
|
0x0446,
|
|
0x0434,
|
|
0x0435,
|
|
0x0444,
|
|
0x0433,
|
|
0x0445,
|
|
0x0438,
|
|
0x0439,
|
|
0x043a,
|
|
0x043b,
|
|
0x043c,
|
|
0x043d,
|
|
0x043e,
|
|
0x043f,
|
|
0x044f,
|
|
0x0440,
|
|
0x0441,
|
|
0x0442,
|
|
0x0443,
|
|
0x0436,
|
|
0x0432,
|
|
0x044c,
|
|
0x044b,
|
|
0x0437,
|
|
0x0448,
|
|
0x044d,
|
|
0x0449,
|
|
0x0447,
|
|
0x044a,
|
|
0x042e,
|
|
0x0410,
|
|
0x0411,
|
|
0x0426,
|
|
0x0414,
|
|
0x0415,
|
|
0x0424,
|
|
0x0413,
|
|
0x0425,
|
|
0x0418,
|
|
0x0419,
|
|
0x041a,
|
|
0x041b,
|
|
0x041c,
|
|
0x041d,
|
|
0x041e,
|
|
0x041f,
|
|
0x042f,
|
|
0x0420,
|
|
0x0421,
|
|
0x0422,
|
|
0x0423,
|
|
0x0416,
|
|
0x0412,
|
|
0x042c,
|
|
0x042b,
|
|
0x0417,
|
|
0x0428,
|
|
0x042d,
|
|
0x0429,
|
|
0x0427,
|
|
0x042a,
|
|
);
|
|
|
|
my @to_utf8 = (
|
|
"\x00",
|
|
"\x01",
|
|
"\x02",
|
|
"\x03",
|
|
"\x04",
|
|
"\x05",
|
|
"\x06",
|
|
"\x07",
|
|
"\x08",
|
|
"\x09",
|
|
"\x0a",
|
|
"\x0b",
|
|
"\x0c",
|
|
"\x0d",
|
|
"\x0e",
|
|
"\x0f",
|
|
"\x10",
|
|
"\x11",
|
|
"\x12",
|
|
"\x13",
|
|
"\x14",
|
|
"\x15",
|
|
"\x16",
|
|
"\x17",
|
|
"\x18",
|
|
"\x19",
|
|
"\x1a",
|
|
"\x1b",
|
|
"\x1c",
|
|
"\x1d",
|
|
"\x1e",
|
|
"\x1f",
|
|
"\x20",
|
|
"\x21",
|
|
"\x22",
|
|
"\x23",
|
|
"\x24",
|
|
"\x25",
|
|
"\x26",
|
|
"\x27",
|
|
"\x28",
|
|
"\x29",
|
|
"\x2a",
|
|
"\x2b",
|
|
"\x2c",
|
|
"\x2d",
|
|
"\x2e",
|
|
"\x2f",
|
|
"\x30",
|
|
"\x31",
|
|
"\x32",
|
|
"\x33",
|
|
"\x34",
|
|
"\x35",
|
|
"\x36",
|
|
"\x37",
|
|
"\x38",
|
|
"\x39",
|
|
"\x3a",
|
|
"\x3b",
|
|
"\x3c",
|
|
"\x3d",
|
|
"\x3e",
|
|
"\x3f",
|
|
"\x40",
|
|
"\x41",
|
|
"\x42",
|
|
"\x43",
|
|
"\x44",
|
|
"\x45",
|
|
"\x46",
|
|
"\x47",
|
|
"\x48",
|
|
"\x49",
|
|
"\x4a",
|
|
"\x4b",
|
|
"\x4c",
|
|
"\x4d",
|
|
"\x4e",
|
|
"\x4f",
|
|
"\x50",
|
|
"\x51",
|
|
"\x52",
|
|
"\x53",
|
|
"\x54",
|
|
"\x55",
|
|
"\x56",
|
|
"\x57",
|
|
"\x58",
|
|
"\x59",
|
|
"\x5a",
|
|
"\x5b",
|
|
"\x5c",
|
|
"\x5d",
|
|
"\x5e",
|
|
"\x5f",
|
|
"\x60",
|
|
"\x61",
|
|
"\x62",
|
|
"\x63",
|
|
"\x64",
|
|
"\x65",
|
|
"\x66",
|
|
"\x67",
|
|
"\x68",
|
|
"\x69",
|
|
"\x6a",
|
|
"\x6b",
|
|
"\x6c",
|
|
"\x6d",
|
|
"\x6e",
|
|
"\x6f",
|
|
"\x70",
|
|
"\x71",
|
|
"\x72",
|
|
"\x73",
|
|
"\x74",
|
|
"\x75",
|
|
"\x76",
|
|
"\x77",
|
|
"\x78",
|
|
"\x79",
|
|
"\x7a",
|
|
"\x7b",
|
|
"\x7c",
|
|
"\x7d",
|
|
"\x7e",
|
|
"\x7f",
|
|
"\xe2\x94\x80",
|
|
"\xe2\x94\x82",
|
|
"\xe2\x94\x8c",
|
|
"\xe2\x94\x90",
|
|
"\xe2\x94\x94",
|
|
"\xe2\x94\x98",
|
|
"\xe2\x94\x9c",
|
|
"\xe2\x94\xa4",
|
|
"\xe2\x94\xac",
|
|
"\xe2\x94\xb4",
|
|
"\xe2\x94\xbc",
|
|
"\xe2\x96\x80",
|
|
"\xe2\x96\x84",
|
|
"\xe2\x96\x88",
|
|
"\xe2\x96\x8c",
|
|
"\xe2\x96\x90",
|
|
"\xe2\x96\x91",
|
|
"\xe2\x96\x92",
|
|
"\xe2\x96\x93",
|
|
"\xe2\x8c\xa0",
|
|
"\xe2\x96\xa0",
|
|
"\xe2\x88\x99",
|
|
"\xe2\x88\x9a",
|
|
"\xe2\x89\x88",
|
|
"\xe2\x89\xa4",
|
|
"\xe2\x89\xa5",
|
|
"\xc2\xa0",
|
|
"\xe2\x8c\xa1",
|
|
"\xc2\xb0",
|
|
"\xc2\xb2",
|
|
"\xc2\xb7",
|
|
"\xc3\xb7",
|
|
"\xe2\x95\x90",
|
|
"\xe2\x95\x91",
|
|
"\xe2\x95\x92",
|
|
"\xd1\x91",
|
|
"\xd1\x94",
|
|
"\xe2\x95\x94",
|
|
"\xd1\x96",
|
|
"\xd1\x97",
|
|
"\xe2\x95\x97",
|
|
"\xe2\x95\x98",
|
|
"\xe2\x95\x99",
|
|
"\xe2\x95\x9a",
|
|
"\xe2\x95\x9b",
|
|
"\xd2\x91",
|
|
"\xd1\x9e",
|
|
"\xe2\x95\x9e",
|
|
"\xe2\x95\x9f",
|
|
"\xe2\x95\xa0",
|
|
"\xe2\x95\xa1",
|
|
"\xd0\x81",
|
|
"\xd0\x84",
|
|
"\xe2\x95\xa3",
|
|
"\xd0\x86",
|
|
"\xd0\x87",
|
|
"\xe2\x95\xa6",
|
|
"\xe2\x95\xa7",
|
|
"\xe2\x95\xa8",
|
|
"\xe2\x95\xa9",
|
|
"\xe2\x95\xaa",
|
|
"\xd2\x90",
|
|
"\xd0\x8e",
|
|
"\xc2\xa9",
|
|
"\xd1\x8e",
|
|
"\xd0\xb0",
|
|
"\xd0\xb1",
|
|
"\xd1\x86",
|
|
"\xd0\xb4",
|
|
"\xd0\xb5",
|
|
"\xd1\x84",
|
|
"\xd0\xb3",
|
|
"\xd1\x85",
|
|
"\xd0\xb8",
|
|
"\xd0\xb9",
|
|
"\xd0\xba",
|
|
"\xd0\xbb",
|
|
"\xd0\xbc",
|
|
"\xd0\xbd",
|
|
"\xd0\xbe",
|
|
"\xd0\xbf",
|
|
"\xd1\x8f",
|
|
"\xd1\x80",
|
|
"\xd1\x81",
|
|
"\xd1\x82",
|
|
"\xd1\x83",
|
|
"\xd0\xb6",
|
|
"\xd0\xb2",
|
|
"\xd1\x8c",
|
|
"\xd1\x8b",
|
|
"\xd0\xb7",
|
|
"\xd1\x88",
|
|
"\xd1\x8d",
|
|
"\xd1\x89",
|
|
"\xd1\x87",
|
|
"\xd1\x8a",
|
|
"\xd0\xae",
|
|
"\xd0\x90",
|
|
"\xd0\x91",
|
|
"\xd0\xa6",
|
|
"\xd0\x94",
|
|
"\xd0\x95",
|
|
"\xd0\xa4",
|
|
"\xd0\x93",
|
|
"\xd0\xa5",
|
|
"\xd0\x98",
|
|
"\xd0\x99",
|
|
"\xd0\x9a",
|
|
"\xd0\x9b",
|
|
"\xd0\x9c",
|
|
"\xd0\x9d",
|
|
"\xd0\x9e",
|
|
"\xd0\x9f",
|
|
"\xd0\xaf",
|
|
"\xd0\xa0",
|
|
"\xd0\xa1",
|
|
"\xd0\xa2",
|
|
"\xd0\xa3",
|
|
"\xd0\x96",
|
|
"\xd0\x92",
|
|
"\xd0\xac",
|
|
"\xd0\xab",
|
|
"\xd0\x97",
|
|
"\xd0\xa8",
|
|
"\xd0\xad",
|
|
"\xd0\xa9",
|
|
"\xd0\xa7",
|
|
"\xd0\xaa",
|
|
);
|
|
|
|
my %from_ucs4 = (
|
|
0x00000000 => "\x00",
|
|
0x00000001 => "\x01",
|
|
0x00000002 => "\x02",
|
|
0x00000003 => "\x03",
|
|
0x00000004 => "\x04",
|
|
0x00000005 => "\x05",
|
|
0x00000006 => "\x06",
|
|
0x00000007 => "\x07",
|
|
0x00000008 => "\x08",
|
|
0x00000009 => "\x09",
|
|
0x0000000a => "\x0a",
|
|
0x0000000b => "\x0b",
|
|
0x0000000c => "\x0c",
|
|
0x0000000d => "\x0d",
|
|
0x0000000e => "\x0e",
|
|
0x0000000f => "\x0f",
|
|
0x00000010 => "\x10",
|
|
0x00000011 => "\x11",
|
|
0x00000012 => "\x12",
|
|
0x00000013 => "\x13",
|
|
0x00000014 => "\x14",
|
|
0x00000015 => "\x15",
|
|
0x00000016 => "\x16",
|
|
0x00000017 => "\x17",
|
|
0x00000018 => "\x18",
|
|
0x00000019 => "\x19",
|
|
0x0000001a => "\x1a",
|
|
0x0000001b => "\x1b",
|
|
0x0000001c => "\x1c",
|
|
0x0000001d => "\x1d",
|
|
0x0000001e => "\x1e",
|
|
0x0000001f => "\x1f",
|
|
0x00000020 => "\x20",
|
|
0x00000021 => "\x21",
|
|
0x00000022 => "\x22",
|
|
0x00000023 => "\x23",
|
|
0x00000024 => "\x24",
|
|
0x00000025 => "\x25",
|
|
0x00000026 => "\x26",
|
|
0x00000027 => "\x27",
|
|
0x00000028 => "\x28",
|
|
0x00000029 => "\x29",
|
|
0x0000002a => "\x2a",
|
|
0x0000002b => "\x2b",
|
|
0x0000002c => "\x2c",
|
|
0x0000002d => "\x2d",
|
|
0x0000002e => "\x2e",
|
|
0x0000002f => "\x2f",
|
|
0x00000030 => "\x30",
|
|
0x00000031 => "\x31",
|
|
0x00000032 => "\x32",
|
|
0x00000033 => "\x33",
|
|
0x00000034 => "\x34",
|
|
0x00000035 => "\x35",
|
|
0x00000036 => "\x36",
|
|
0x00000037 => "\x37",
|
|
0x00000038 => "\x38",
|
|
0x00000039 => "\x39",
|
|
0x0000003a => "\x3a",
|
|
0x0000003b => "\x3b",
|
|
0x0000003c => "\x3c",
|
|
0x0000003d => "\x3d",
|
|
0x0000003e => "\x3e",
|
|
0x0000003f => "\x3f",
|
|
0x00000040 => "\x40",
|
|
0x00000041 => "\x41",
|
|
0x00000042 => "\x42",
|
|
0x00000043 => "\x43",
|
|
0x00000044 => "\x44",
|
|
0x00000045 => "\x45",
|
|
0x00000046 => "\x46",
|
|
0x00000047 => "\x47",
|
|
0x00000048 => "\x48",
|
|
0x00000049 => "\x49",
|
|
0x0000004a => "\x4a",
|
|
0x0000004b => "\x4b",
|
|
0x0000004c => "\x4c",
|
|
0x0000004d => "\x4d",
|
|
0x0000004e => "\x4e",
|
|
0x0000004f => "\x4f",
|
|
0x00000050 => "\x50",
|
|
0x00000051 => "\x51",
|
|
0x00000052 => "\x52",
|
|
0x00000053 => "\x53",
|
|
0x00000054 => "\x54",
|
|
0x00000055 => "\x55",
|
|
0x00000056 => "\x56",
|
|
0x00000057 => "\x57",
|
|
0x00000058 => "\x58",
|
|
0x00000059 => "\x59",
|
|
0x0000005a => "\x5a",
|
|
0x0000005b => "\x5b",
|
|
0x0000005c => "\x5c",
|
|
0x0000005d => "\x5d",
|
|
0x0000005e => "\x5e",
|
|
0x0000005f => "\x5f",
|
|
0x00000060 => "\x60",
|
|
0x00000061 => "\x61",
|
|
0x00000062 => "\x62",
|
|
0x00000063 => "\x63",
|
|
0x00000064 => "\x64",
|
|
0x00000065 => "\x65",
|
|
0x00000066 => "\x66",
|
|
0x00000067 => "\x67",
|
|
0x00000068 => "\x68",
|
|
0x00000069 => "\x69",
|
|
0x0000006a => "\x6a",
|
|
0x0000006b => "\x6b",
|
|
0x0000006c => "\x6c",
|
|
0x0000006d => "\x6d",
|
|
0x0000006e => "\x6e",
|
|
0x0000006f => "\x6f",
|
|
0x00000070 => "\x70",
|
|
0x00000071 => "\x71",
|
|
0x00000072 => "\x72",
|
|
0x00000073 => "\x73",
|
|
0x00000074 => "\x74",
|
|
0x00000075 => "\x75",
|
|
0x00000076 => "\x76",
|
|
0x00000077 => "\x77",
|
|
0x00000078 => "\x78",
|
|
0x00000079 => "\x79",
|
|
0x0000007a => "\x7a",
|
|
0x0000007b => "\x7b",
|
|
0x0000007c => "\x7c",
|
|
0x0000007d => "\x7d",
|
|
0x0000007e => "\x7e",
|
|
0x0000007f => "\x7f",
|
|
0x000000a0 => "\x9a",
|
|
0x000000a9 => "\xbf",
|
|
0x000000b0 => "\x9c",
|
|
0x000000b2 => "\x9d",
|
|
0x000000b7 => "\x9e",
|
|
0x000000f7 => "\x9f",
|
|
0x00000401 => "\xb3",
|
|
0x00000404 => "\xb4",
|
|
0x00000406 => "\xb6",
|
|
0x00000407 => "\xb7",
|
|
0x0000040e => "\xbe",
|
|
0x00000410 => "\xe1",
|
|
0x00000411 => "\xe2",
|
|
0x00000412 => "\xf7",
|
|
0x00000413 => "\xe7",
|
|
0x00000414 => "\xe4",
|
|
0x00000415 => "\xe5",
|
|
0x00000416 => "\xf6",
|
|
0x00000417 => "\xfa",
|
|
0x00000418 => "\xe9",
|
|
0x00000419 => "\xea",
|
|
0x0000041a => "\xeb",
|
|
0x0000041b => "\xec",
|
|
0x0000041c => "\xed",
|
|
0x0000041d => "\xee",
|
|
0x0000041e => "\xef",
|
|
0x0000041f => "\xf0",
|
|
0x00000420 => "\xf2",
|
|
0x00000421 => "\xf3",
|
|
0x00000422 => "\xf4",
|
|
0x00000423 => "\xf5",
|
|
0x00000424 => "\xe6",
|
|
0x00000425 => "\xe8",
|
|
0x00000426 => "\xe3",
|
|
0x00000427 => "\xfe",
|
|
0x00000428 => "\xfb",
|
|
0x00000429 => "\xfd",
|
|
0x0000042a => "\xff",
|
|
0x0000042b => "\xf9",
|
|
0x0000042c => "\xf8",
|
|
0x0000042d => "\xfc",
|
|
0x0000042e => "\xe0",
|
|
0x0000042f => "\xf1",
|
|
0x00000430 => "\xc1",
|
|
0x00000431 => "\xc2",
|
|
0x00000432 => "\xd7",
|
|
0x00000433 => "\xc7",
|
|
0x00000434 => "\xc4",
|
|
0x00000435 => "\xc5",
|
|
0x00000436 => "\xd6",
|
|
0x00000437 => "\xda",
|
|
0x00000438 => "\xc9",
|
|
0x00000439 => "\xca",
|
|
0x0000043a => "\xcb",
|
|
0x0000043b => "\xcc",
|
|
0x0000043c => "\xcd",
|
|
0x0000043d => "\xce",
|
|
0x0000043e => "\xcf",
|
|
0x0000043f => "\xd0",
|
|
0x00000440 => "\xd2",
|
|
0x00000441 => "\xd3",
|
|
0x00000442 => "\xd4",
|
|
0x00000443 => "\xd5",
|
|
0x00000444 => "\xc6",
|
|
0x00000445 => "\xc8",
|
|
0x00000446 => "\xc3",
|
|
0x00000447 => "\xde",
|
|
0x00000448 => "\xdb",
|
|
0x00000449 => "\xdd",
|
|
0x0000044a => "\xdf",
|
|
0x0000044b => "\xd9",
|
|
0x0000044c => "\xd8",
|
|
0x0000044d => "\xdc",
|
|
0x0000044e => "\xc0",
|
|
0x0000044f => "\xd1",
|
|
0x00000451 => "\xa3",
|
|
0x00000454 => "\xa4",
|
|
0x00000456 => "\xa6",
|
|
0x00000457 => "\xa7",
|
|
0x0000045e => "\xae",
|
|
0x00000490 => "\xbd",
|
|
0x00000491 => "\xad",
|
|
0x00002219 => "\x95",
|
|
0x0000221a => "\x96",
|
|
0x00002248 => "\x97",
|
|
0x00002264 => "\x98",
|
|
0x00002265 => "\x99",
|
|
0x00002320 => "\x93",
|
|
0x00002321 => "\x9b",
|
|
0x00002500 => "\x80",
|
|
0x00002502 => "\x81",
|
|
0x0000250c => "\x82",
|
|
0x00002510 => "\x83",
|
|
0x00002514 => "\x84",
|
|
0x00002518 => "\x85",
|
|
0x0000251c => "\x86",
|
|
0x00002524 => "\x87",
|
|
0x0000252c => "\x88",
|
|
0x00002534 => "\x89",
|
|
0x0000253c => "\x8a",
|
|
0x00002550 => "\xa0",
|
|
0x00002551 => "\xa1",
|
|
0x00002552 => "\xa2",
|
|
0x00002554 => "\xa5",
|
|
0x00002557 => "\xa8",
|
|
0x00002558 => "\xa9",
|
|
0x00002559 => "\xaa",
|
|
0x0000255a => "\xab",
|
|
0x0000255b => "\xac",
|
|
0x0000255e => "\xaf",
|
|
0x0000255f => "\xb0",
|
|
0x00002560 => "\xb1",
|
|
0x00002561 => "\xb2",
|
|
0x00002563 => "\xb5",
|
|
0x00002566 => "\xb8",
|
|
0x00002567 => "\xb9",
|
|
0x00002568 => "\xba",
|
|
0x00002569 => "\xbb",
|
|
0x0000256a => "\xbc",
|
|
0x00002580 => "\x8b",
|
|
0x00002584 => "\x8c",
|
|
0x00002588 => "\x8d",
|
|
0x0000258c => "\x8e",
|
|
0x00002590 => "\x8f",
|
|
0x00002591 => "\x90",
|
|
0x00002592 => "\x91",
|
|
0x00002593 => "\x92",
|
|
0x000025a0 => "\x94",
|
|
);
|
|
|
|
sub _recode
|
|
{
|
|
if ($_[0]->{_from} eq 'INTERNAL') {
|
|
$_[1] = join '',
|
|
map $from_ucs4{$_}
|
|
|| (defined $from_ucs4{$_} ? $from_ucs4{$_} : "\x3f"),
|
|
@{$_[1]};
|
|
} elsif ($_[0]->{_to} eq 'UTF-8',) {
|
|
$_[1] = join '', map $to_utf8[$_], unpack 'C*', $_[1];
|
|
} else {
|
|
$_[1] = [ map
|
|
$to_ucs4[$_],
|
|
unpack 'C*', $_[1]
|
|
];
|
|
}
|
|
|
|
return 1;
|
|
}
|
|
|
|
1;
|
|
|
|
__END__
|
|
|
|
=head1 NAME
|
|
|
|
Locale::RecodeData::KOI8_RU - Conversion routines for KOI8-RU
|
|
|
|
=head1 SYNOPSIS
|
|
|
|
This module is internal to libintl. Do not use directly!
|
|
|
|
=head1 DESCRIPTION
|
|
|
|
This module is generated and contains the conversion tables and
|
|
routines for KOI8-RU.
|
|
|
|
=head1 COMMENTS
|
|
|
|
The following comments have been extracted from the original charmap:
|
|
|
|
|
|
This charmap has been generated automatically from GNU libiconv
|
|
conversions.
|
|
|
|
Please note that aliases listed above are not necessarily valid!
|
|
|
|
=head1 CHARACTER TABLE
|
|
|
|
The following table is sorted in the same order as the original charmap.
|
|
All character codes are in hexadecimal. Please read 'ISO-10646' as
|
|
'ISO-10646-UCS4'.
|
|
|
|
Local | ISO-10646 | Description
|
|
-------+-----------+-------------------------------------------------
|
|
00 | 00000000 | NULL (NUL)
|
|
01 | 00000001 | START OF HEADING (SOH)
|
|
02 | 00000002 | START OF TEXT (STX)
|
|
03 | 00000003 | END OF TEXT (ETX)
|
|
04 | 00000004 | END OF TRANSMISSION (EOT)
|
|
05 | 00000005 | ENQUIRY (ENQ)
|
|
06 | 00000006 | ACKNOWLEDGE (ACK)
|
|
07 | 00000007 | BELL (BEL)
|
|
08 | 00000008 | BACKSPACE (BS)
|
|
09 | 00000009 | CHARACTER TABULATION (HT)
|
|
0A | 0000000A | LINE FEED (LF)
|
|
0B | 0000000B | LINE TABULATION (VT)
|
|
0C | 0000000C | FORM FEED (FF)
|
|
0D | 0000000D | CARRIAGE RETURN (CR)
|
|
0E | 0000000E | SHIFT OUT (SO)
|
|
0F | 0000000F | SHIFT IN (SI)
|
|
10 | 00000010 | DATALINK ESCAPE (DLE)
|
|
11 | 00000011 | DEVICE CONTROL ONE (DC1)
|
|
12 | 00000012 | DEVICE CONTROL TWO (DC2)
|
|
13 | 00000013 | DEVICE CONTROL THREE (DC3)
|
|
14 | 00000014 | DEVICE CONTROL FOUR (DC4)
|
|
15 | 00000015 | NEGATIVE ACKNOWLEDGE (NAK)
|
|
16 | 00000016 | SYNCHRONOUS IDLE (SYN)
|
|
17 | 00000017 | END OF TRANSMISSION BLOCK (ETB)
|
|
18 | 00000018 | CANCEL (CAN)
|
|
19 | 00000019 | END OF MEDIUM (EM)
|
|
1A | 0000001A | SUBSTITUTE (SUB)
|
|
1B | 0000001B | ESCAPE (ESC)
|
|
1C | 0000001C | FILE SEPARATOR (IS4)
|
|
1D | 0000001D | GROUP SEPARATOR (IS3)
|
|
1E | 0000001E | RECORD SEPARATOR (IS2)
|
|
1F | 0000001F | UNIT SEPARATOR (IS1)
|
|
20 | 00000020 | SPACE
|
|
21 | 00000021 | EXCLAMATION MARK
|
|
22 | 00000022 | QUOTATION MARK
|
|
23 | 00000023 | NUMBER SIGN
|
|
24 | 00000024 | DOLLAR SIGN
|
|
25 | 00000025 | PERCENT SIGN
|
|
26 | 00000026 | AMPERSAND
|
|
27 | 00000027 | APOSTROPHE
|
|
28 | 00000028 | LEFT PARENTHESIS
|
|
29 | 00000029 | RIGHT PARENTHESIS
|
|
2A | 0000002A | ASTERISK
|
|
2B | 0000002B | PLUS SIGN
|
|
2C | 0000002C | COMMA
|
|
2D | 0000002D | HYPHEN-MINUS
|
|
2E | 0000002E | FULL STOP
|
|
2F | 0000002F | SOLIDUS
|
|
30 | 00000030 | DIGIT ZERO
|
|
31 | 00000031 | DIGIT ONE
|
|
32 | 00000032 | DIGIT TWO
|
|
33 | 00000033 | DIGIT THREE
|
|
34 | 00000034 | DIGIT FOUR
|
|
35 | 00000035 | DIGIT FIVE
|
|
36 | 00000036 | DIGIT SIX
|
|
37 | 00000037 | DIGIT SEVEN
|
|
38 | 00000038 | DIGIT EIGHT
|
|
39 | 00000039 | DIGIT NINE
|
|
3A | 0000003A | COLON
|
|
3B | 0000003B | SEMICOLON
|
|
3C | 0000003C | LESS-THAN SIGN
|
|
3D | 0000003D | EQUALS SIGN
|
|
3E | 0000003E | GREATER-THAN SIGN
|
|
3F | 0000003F | QUESTION MARK
|
|
40 | 00000040 | COMMERCIAL AT
|
|
41 | 00000041 | LATIN CAPITAL LETTER A
|
|
42 | 00000042 | LATIN CAPITAL LETTER B
|
|
43 | 00000043 | LATIN CAPITAL LETTER C
|
|
44 | 00000044 | LATIN CAPITAL LETTER D
|
|
45 | 00000045 | LATIN CAPITAL LETTER E
|
|
46 | 00000046 | LATIN CAPITAL LETTER F
|
|
47 | 00000047 | LATIN CAPITAL LETTER G
|
|
48 | 00000048 | LATIN CAPITAL LETTER H
|
|
49 | 00000049 | LATIN CAPITAL LETTER I
|
|
4A | 0000004A | LATIN CAPITAL LETTER J
|
|
4B | 0000004B | LATIN CAPITAL LETTER K
|
|
4C | 0000004C | LATIN CAPITAL LETTER L
|
|
4D | 0000004D | LATIN CAPITAL LETTER M
|
|
4E | 0000004E | LATIN CAPITAL LETTER N
|
|
4F | 0000004F | LATIN CAPITAL LETTER O
|
|
50 | 00000050 | LATIN CAPITAL LETTER P
|
|
51 | 00000051 | LATIN CAPITAL LETTER Q
|
|
52 | 00000052 | LATIN CAPITAL LETTER R
|
|
53 | 00000053 | LATIN CAPITAL LETTER S
|
|
54 | 00000054 | LATIN CAPITAL LETTER T
|
|
55 | 00000055 | LATIN CAPITAL LETTER U
|
|
56 | 00000056 | LATIN CAPITAL LETTER V
|
|
57 | 00000057 | LATIN CAPITAL LETTER W
|
|
58 | 00000058 | LATIN CAPITAL LETTER X
|
|
59 | 00000059 | LATIN CAPITAL LETTER Y
|
|
5A | 0000005A | LATIN CAPITAL LETTER Z
|
|
5B | 0000005B | LEFT SQUARE BRACKET
|
|
5C | 0000005C | REVERSE SOLIDUS
|
|
5D | 0000005D | RIGHT SQUARE BRACKET
|
|
5E | 0000005E | CIRCUMFLEX ACCENT
|
|
5F | 0000005F | LOW LINE
|
|
60 | 00000060 | GRAVE ACCENT
|
|
61 | 00000061 | LATIN SMALL LETTER A
|
|
62 | 00000062 | LATIN SMALL LETTER B
|
|
63 | 00000063 | LATIN SMALL LETTER C
|
|
64 | 00000064 | LATIN SMALL LETTER D
|
|
65 | 00000065 | LATIN SMALL LETTER E
|
|
66 | 00000066 | LATIN SMALL LETTER F
|
|
67 | 00000067 | LATIN SMALL LETTER G
|
|
68 | 00000068 | LATIN SMALL LETTER H
|
|
69 | 00000069 | LATIN SMALL LETTER I
|
|
6A | 0000006A | LATIN SMALL LETTER J
|
|
6B | 0000006B | LATIN SMALL LETTER K
|
|
6C | 0000006C | LATIN SMALL LETTER L
|
|
6D | 0000006D | LATIN SMALL LETTER M
|
|
6E | 0000006E | LATIN SMALL LETTER N
|
|
6F | 0000006F | LATIN SMALL LETTER O
|
|
70 | 00000070 | LATIN SMALL LETTER P
|
|
71 | 00000071 | LATIN SMALL LETTER Q
|
|
72 | 00000072 | LATIN SMALL LETTER R
|
|
73 | 00000073 | LATIN SMALL LETTER S
|
|
74 | 00000074 | LATIN SMALL LETTER T
|
|
75 | 00000075 | LATIN SMALL LETTER U
|
|
76 | 00000076 | LATIN SMALL LETTER V
|
|
77 | 00000077 | LATIN SMALL LETTER W
|
|
78 | 00000078 | LATIN SMALL LETTER X
|
|
79 | 00000079 | LATIN SMALL LETTER Y
|
|
7A | 0000007A | LATIN SMALL LETTER Z
|
|
7B | 0000007B | LEFT CURLY BRACKET
|
|
7C | 0000007C | VERTICAL LINE
|
|
7D | 0000007D | RIGHT CURLY BRACKET
|
|
7E | 0000007E | TILDE
|
|
7F | 0000007F | DELETE (DEL)
|
|
80 | 00002500 | BOX DRAWINGS LIGHT HORIZONTAL
|
|
81 | 00002502 | BOX DRAWINGS LIGHT VERTICAL
|
|
82 | 0000250C | BOX DRAWINGS LIGHT DOWN AND RIGHT
|
|
83 | 00002510 | BOX DRAWINGS LIGHT DOWN AND LEFT
|
|
84 | 00002514 | BOX DRAWINGS LIGHT UP AND RIGHT
|
|
85 | 00002518 | BOX DRAWINGS LIGHT UP AND LEFT
|
|
86 | 0000251C | BOX DRAWINGS LIGHT VERTICAL AND RIGHT
|
|
87 | 00002524 | BOX DRAWINGS LIGHT VERTICAL AND LEFT
|
|
88 | 0000252C | BOX DRAWINGS LIGHT DOWN AND HORIZONTAL
|
|
89 | 00002534 | BOX DRAWINGS LIGHT UP AND HORIZONTAL
|
|
8A | 0000253C | BOX DRAWINGS LIGHT VERTICAL AND HORIZONTAL
|
|
8B | 00002580 | UPPER HALF BLOCK
|
|
8C | 00002584 | LOWER HALF BLOCK
|
|
8D | 00002588 | FULL BLOCK
|
|
8E | 0000258C | LEFT HALF BLOCK
|
|
8F | 00002590 | RIGHT HALF BLOCK
|
|
90 | 00002591 | LIGHT SHADE
|
|
91 | 00002592 | MEDIUM SHADE
|
|
92 | 00002593 | DARK SHADE
|
|
93 | 00002320 | TOP HALF INTEGRAL
|
|
94 | 000025A0 | BLACK SQUARE
|
|
95 | 00002219 | BULLET OPERATOR
|
|
96 | 0000221A | SQUARE ROOT
|
|
97 | 00002248 | ALMOST EQUAL TO
|
|
98 | 00002264 | LESS-THAN OR EQUAL TO
|
|
99 | 00002265 | GREATER-THAN OR EQUAL TO
|
|
9A | 000000A0 | NO-BREAK SPACE
|
|
9B | 00002321 | BOTTOM HALF INTEGRAL
|
|
9C | 000000B0 | DEGREE SIGN
|
|
9D | 000000B2 | SUPERSCRIPT TWO
|
|
9E | 000000B7 | MIDDLE DOT
|
|
9F | 000000F7 | DIVISION SIGN
|
|
A0 | 00002550 | BOX DRAWINGS DOUBLE HORIZONTAL
|
|
A1 | 00002551 | BOX DRAWINGS DOUBLE VERTICAL
|
|
A2 | 00002552 | BOX DRAWINGS DOWN SINGLE AND RIGHT DOUBLE
|
|
A3 | 00000451 | CYRILLIC SMALL LETTER IO
|
|
A4 | 00000454 | CYRILLIC SMALL LETTER UKRAINIAN IE
|
|
A5 | 00002554 | BOX DRAWINGS DOUBLE DOWN AND RIGHT
|
|
A6 | 00000456 | CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
|
|
A7 | 00000457 | CYRILLIC SMALL LETTER YI
|
|
A8 | 00002557 | BOX DRAWINGS DOUBLE DOWN AND LEFT
|
|
A9 | 00002558 | BOX DRAWINGS UP SINGLE AND RIGHT DOUBLE
|
|
AA | 00002559 | BOX DRAWINGS UP DOUBLE AND RIGHT SINGLE
|
|
AB | 0000255A | BOX DRAWINGS DOUBLE UP AND RIGHT
|
|
AC | 0000255B | BOX DRAWINGS UP SINGLE AND LEFT DOUBLE
|
|
AD | 00000491 | CYRILLIC SMALL LETTER GHE WITH UPTURN
|
|
AE | 0000045E | CYRILLIC SMALL LETTER SHORT U
|
|
AF | 0000255E | BOX DRAWINGS VERTICAL SINGLE AND RIGHT DOUBLE
|
|
B0 | 0000255F | BOX DRAWINGS VERTICAL DOUBLE AND RIGHT SINGLE
|
|
B1 | 00002560 | BOX DRAWINGS DOUBLE VERTICAL AND RIGHT
|
|
B2 | 00002561 | BOX DRAWINGS VERTICAL SINGLE AND LEFT DOUBLE
|
|
B3 | 00000401 | CYRILLIC CAPITAL LETTER IO
|
|
B4 | 00000404 | CYRILLIC CAPITAL LETTER UKRAINIAN IE
|
|
B5 | 00002563 | BOX DRAWINGS DOUBLE VERTICAL AND LEFT
|
|
B6 | 00000406 | CYRILLIC CAPITAL LETTER BYELORUSSIAN-UKRAINIAN I
|
|
B7 | 00000407 | CYRILLIC CAPITAL LETTER YI
|
|
B8 | 00002566 | BOX DRAWINGS DOUBLE DOWN AND HORIZONTAL
|
|
B9 | 00002567 | BOX DRAWINGS UP SINGLE AND HORIZONTAL DOUBLE
|
|
BA | 00002568 | BOX DRAWINGS UP DOUBLE AND HORIZONTAL SINGLE
|
|
BB | 00002569 | BOX DRAWINGS DOUBLE UP AND HORIZONTAL
|
|
BC | 0000256A | BOX DRAWINGS VERTICAL SINGLE AND HORIZONTAL DOUBLE
|
|
BD | 00000490 | CYRILLIC CAPITAL LETTER GHE WITH UPTURN
|
|
BE | 0000040E | CYRILLIC CAPITAL LETTER SHORT U
|
|
BF | 000000A9 | COPYRIGHT SIGN
|
|
C0 | 0000044E | CYRILLIC SMALL LETTER YU
|
|
C1 | 00000430 | CYRILLIC SMALL LETTER A
|
|
C2 | 00000431 | CYRILLIC SMALL LETTER BE
|
|
C3 | 00000446 | CYRILLIC SMALL LETTER TSE
|
|
C4 | 00000434 | CYRILLIC SMALL LETTER DE
|
|
C5 | 00000435 | CYRILLIC SMALL LETTER IE
|
|
C6 | 00000444 | CYRILLIC SMALL LETTER EF
|
|
C7 | 00000433 | CYRILLIC SMALL LETTER GHE
|
|
C8 | 00000445 | CYRILLIC SMALL LETTER HA
|
|
C9 | 00000438 | CYRILLIC SMALL LETTER I
|
|
CA | 00000439 | CYRILLIC SMALL LETTER SHORT I
|
|
CB | 0000043A | CYRILLIC SMALL LETTER KA
|
|
CC | 0000043B | CYRILLIC SMALL LETTER EL
|
|
CD | 0000043C | CYRILLIC SMALL LETTER EM
|
|
CE | 0000043D | CYRILLIC SMALL LETTER EN
|
|
CF | 0000043E | CYRILLIC SMALL LETTER O
|
|
D0 | 0000043F | CYRILLIC SMALL LETTER PE
|
|
D1 | 0000044F | CYRILLIC SMALL LETTER YA
|
|
D2 | 00000440 | CYRILLIC SMALL LETTER ER
|
|
D3 | 00000441 | CYRILLIC SMALL LETTER ES
|
|
D4 | 00000442 | CYRILLIC SMALL LETTER TE
|
|
D5 | 00000443 | CYRILLIC SMALL LETTER U
|
|
D6 | 00000436 | CYRILLIC SMALL LETTER ZHE
|
|
D7 | 00000432 | CYRILLIC SMALL LETTER VE
|
|
D8 | 0000044C | CYRILLIC SMALL LETTER SOFT SIGN
|
|
D9 | 0000044B | CYRILLIC SMALL LETTER YERU
|
|
DA | 00000437 | CYRILLIC SMALL LETTER ZE
|
|
DB | 00000448 | CYRILLIC SMALL LETTER SHA
|
|
DC | 0000044D | CYRILLIC SMALL LETTER E
|
|
DD | 00000449 | CYRILLIC SMALL LETTER SHCHA
|
|
DE | 00000447 | CYRILLIC SMALL LETTER CHE
|
|
DF | 0000044A | CYRILLIC SMALL LETTER HARD SIGN
|
|
E0 | 0000042E | CYRILLIC CAPITAL LETTER YU
|
|
E1 | 00000410 | CYRILLIC CAPITAL LETTER A
|
|
E2 | 00000411 | CYRILLIC CAPITAL LETTER BE
|
|
E3 | 00000426 | CYRILLIC CAPITAL LETTER TSE
|
|
E4 | 00000414 | CYRILLIC CAPITAL LETTER DE
|
|
E5 | 00000415 | CYRILLIC CAPITAL LETTER IE
|
|
E6 | 00000424 | CYRILLIC CAPITAL LETTER EF
|
|
E7 | 00000413 | CYRILLIC CAPITAL LETTER GHE
|
|
E8 | 00000425 | CYRILLIC CAPITAL LETTER HA
|
|
E9 | 00000418 | CYRILLIC CAPITAL LETTER I
|
|
EA | 00000419 | CYRILLIC CAPITAL LETTER SHORT I
|
|
EB | 0000041A | CYRILLIC CAPITAL LETTER KA
|
|
EC | 0000041B | CYRILLIC CAPITAL LETTER EL
|
|
ED | 0000041C | CYRILLIC CAPITAL LETTER EM
|
|
EE | 0000041D | CYRILLIC CAPITAL LETTER EN
|
|
EF | 0000041E | CYRILLIC CAPITAL LETTER O
|
|
F0 | 0000041F | CYRILLIC CAPITAL LETTER PE
|
|
F1 | 0000042F | CYRILLIC CAPITAL LETTER YA
|
|
F2 | 00000420 | CYRILLIC CAPITAL LETTER ER
|
|
F3 | 00000421 | CYRILLIC CAPITAL LETTER ES
|
|
F4 | 00000422 | CYRILLIC CAPITAL LETTER TE
|
|
F5 | 00000423 | CYRILLIC CAPITAL LETTER U
|
|
F6 | 00000416 | CYRILLIC CAPITAL LETTER ZHE
|
|
F7 | 00000412 | CYRILLIC CAPITAL LETTER VE
|
|
F8 | 0000042C | CYRILLIC CAPITAL LETTER SOFT SIGN
|
|
F9 | 0000042B | CYRILLIC CAPITAL LETTER YERU
|
|
FA | 00000417 | CYRILLIC CAPITAL LETTER ZE
|
|
FB | 00000428 | CYRILLIC CAPITAL LETTER SHA
|
|
FC | 0000042D | CYRILLIC CAPITAL LETTER E
|
|
FD | 00000429 | CYRILLIC CAPITAL LETTER SHCHA
|
|
FE | 00000427 | CYRILLIC CAPITAL LETTER CHE
|
|
FF | 0000042A | CYRILLIC CAPITAL LETTER HARD SIGN
|
|
|
|
|
|
=head1 AUTHOR
|
|
|
|
Copyright (C) 2002-2017 L<Guido Flohr|http://www.guido-flohr.net/>
|
|
(L<mailto:guido.flohr@cantanea.com>), all rights reserved. See the source
|
|
code for details!code for details!
|
|
|
|
=head1 SEE ALSO
|
|
|
|
Locale::RecodeData(3), Locale::Recode(3), perl(1)
|
|
|
|
=cut
|
|
Local Variables:
|
|
mode: perl
|
|
perl-indent-level: 4
|
|
perl-continued-statement-offset: 4
|
|
perl-continued-brace-offset: 0
|
|
perl-brace-offset: -4
|
|
perl-brace-imaginary-offset: 0
|
|
perl-label-offset: -4
|
|
cperl-indent-level: 4
|
|
cperl-continued-statement-offset: 2
|
|
tab-width: 4
|
|
End:
|