xref: /webtrees/app/Encodings/Windows1251.php (revision e873f434551745f888937263ff89e80db3b0f785)
11c6adce8SGreg Roach<?php
21c6adce8SGreg Roach
31c6adce8SGreg Roach/**
41c6adce8SGreg Roach * webtrees: online genealogy
5d11be702SGreg Roach * Copyright (C) 2023 webtrees development team
61c6adce8SGreg Roach * This program is free software: you can redistribute it and/or modify
71c6adce8SGreg Roach * it under the terms of the GNU General Public License as published by
81c6adce8SGreg Roach * the Free Software Foundation, either version 3 of the License, or
91c6adce8SGreg Roach * (at your option) any later version.
101c6adce8SGreg Roach * This program is distributed in the hope that it will be useful,
111c6adce8SGreg Roach * but WITHOUT ANY WARRANTY; without even the implied warranty of
121c6adce8SGreg Roach * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
131c6adce8SGreg Roach * GNU General Public License for more details.
141c6adce8SGreg Roach * You should have received a copy of the GNU General Public License
151c6adce8SGreg Roach * along with this program. If not, see <https://www.gnu.org/licenses/>.
161c6adce8SGreg Roach */
171c6adce8SGreg Roach
181c6adce8SGreg Roachdeclare(strict_types=1);
191c6adce8SGreg Roach
201c6adce8SGreg Roachnamespace Fisharebest\Webtrees\Encodings;
211c6adce8SGreg Roach
221c6adce8SGreg Roach/**
231c6adce8SGreg Roach * Convert between Windows Code Page 1251 and UTF-8.
241c6adce8SGreg Roach *
251c6adce8SGreg Roach * @link https://en.wikipedia.org/wiki/Windows-1251
261c6adce8SGreg Roach */
271c6adce8SGreg Roachclass Windows1251 extends AbstractEncoding
281c6adce8SGreg Roach{
29*e873f434SGreg Roach    public const string NAME = 'CP1251';
301c6adce8SGreg Roach
31*e873f434SGreg Roach    protected const array TO_UTF8 = [
321c6adce8SGreg Roach        "\x80" => UTF8::CYRILLIC_CAPITAL_LETTER_DJE,
331c6adce8SGreg Roach        "\x81" => UTF8::CYRILLIC_CAPITAL_LETTER_GJE,
341c6adce8SGreg Roach        "\x82" => UTF8::SINGLE_LOW_9_QUOTATION_MARK,
351c6adce8SGreg Roach        "\x83" => UTF8::CYRILLIC_SMALL_LETTER_GJE,
361c6adce8SGreg Roach        "\x84" => UTF8::DOUBLE_LOW_9_QUOTATION_MARK,
371c6adce8SGreg Roach        "\x85" => UTF8::HORIZONTAL_ELLIPSIS,
381c6adce8SGreg Roach        "\x86" => UTF8::DAGGER,
391c6adce8SGreg Roach        "\x87" => UTF8::DOUBLE_DAGGER,
401c6adce8SGreg Roach        "\x88" => UTF8::EURO_SIGN,
411c6adce8SGreg Roach        "\x89" => UTF8::PER_MILLE_SIGN,
421c6adce8SGreg Roach        "\x8A" => UTF8::CYRILLIC_CAPITAL_LETTER_LJE,
431c6adce8SGreg Roach        "\x8B" => UTF8::SINGLE_LEFT_POINTING_ANGLE_QUOTATION_MARK,
441c6adce8SGreg Roach        "\x8C" => UTF8::CYRILLIC_CAPITAL_LETTER_NJE,
451c6adce8SGreg Roach        "\x8D" => UTF8::CYRILLIC_CAPITAL_LETTER_KJE,
461c6adce8SGreg Roach        "\x8E" => UTF8::CYRILLIC_CAPITAL_LETTER_TSHE,
471c6adce8SGreg Roach        "\x8F" => UTF8::CYRILLIC_CAPITAL_LETTER_DZHE,
481c6adce8SGreg Roach        "\x90" => UTF8::CYRILLIC_SMALL_LETTER_DJE,
491c6adce8SGreg Roach        "\x91" => UTF8::LEFT_SINGLE_QUOTATION_MARK,
501c6adce8SGreg Roach        "\x92" => UTF8::RIGHT_SINGLE_QUOTATION_MARK,
511c6adce8SGreg Roach        "\x93" => UTF8::LEFT_DOUBLE_QUOTATION_MARK,
521c6adce8SGreg Roach        "\x94" => UTF8::RIGHT_DOUBLE_QUOTATION_MARK,
531c6adce8SGreg Roach        "\x95" => UTF8::BULLET,
541c6adce8SGreg Roach        "\x96" => UTF8::EN_DASH,
551c6adce8SGreg Roach        "\x97" => UTF8::EM_DASH,
561c6adce8SGreg Roach        "\x98" => UTF8::REPLACEMENT_CHARACTER,
571c6adce8SGreg Roach        "\x99" => UTF8::TRADE_MARK_SIGN,
581c6adce8SGreg Roach        "\x9A" => UTF8::CYRILLIC_SMALL_LETTER_LJE,
591c6adce8SGreg Roach        "\x9B" => UTF8::SINGLE_RIGHT_POINTING_ANGLE_QUOTATION_MARK,
601c6adce8SGreg Roach        "\x9C" => UTF8::CYRILLIC_SMALL_LETTER_NJE,
611c6adce8SGreg Roach        "\x9D" => UTF8::CYRILLIC_SMALL_LETTER_KJE,
621c6adce8SGreg Roach        "\x9E" => UTF8::CYRILLIC_SMALL_LETTER_TSHE,
631c6adce8SGreg Roach        "\x9F" => UTF8::CYRILLIC_SMALL_LETTER_DZHE,
641c6adce8SGreg Roach        "\xA0" => UTF8::NO_BREAK_SPACE,
651c6adce8SGreg Roach        "\xA1" => UTF8::CYRILLIC_CAPITAL_LETTER_SHORT_U,
661c6adce8SGreg Roach        "\xA2" => UTF8::CYRILLIC_SMALL_LETTER_SHORT_U,
671c6adce8SGreg Roach        "\xA3" => UTF8::CYRILLIC_CAPITAL_LETTER_JE,
681c6adce8SGreg Roach        "\xA4" => UTF8::CURRENCY_SIGN,
691c6adce8SGreg Roach        "\xA5" => UTF8::CYRILLIC_CAPITAL_LETTER_GHE_WITH_UPTURN,
701c6adce8SGreg Roach        "\xA6" => UTF8::BROKEN_BAR,
711c6adce8SGreg Roach        "\xA7" => UTF8::SECTION_SIGN,
721c6adce8SGreg Roach        "\xA8" => UTF8::CYRILLIC_CAPITAL_LETTER_IO,
731c6adce8SGreg Roach        "\xA9" => UTF8::COPYRIGHT_SIGN,
741c6adce8SGreg Roach        "\xAA" => UTF8::CYRILLIC_CAPITAL_LETTER_UKRANIAN_IE,
751c6adce8SGreg Roach        "\xAB" => UTF8::LEFT_POINTING_DOUBLE_ANGLE_QUOTATION_MARK,
761c6adce8SGreg Roach        "\xAC" => UTF8::NOT_SIGN,
771c6adce8SGreg Roach        "\xAD" => UTF8::SOFT_HYPHEN,
781c6adce8SGreg Roach        "\xAE" => UTF8::REGISTERED_SIGN,
791c6adce8SGreg Roach        "\xAF" => UTF8::CYRILLIC_CAPITAL_LETTER_YI,
801c6adce8SGreg Roach        "\xB0" => UTF8::DEGREE_SIGN,
811c6adce8SGreg Roach        "\xB1" => UTF8::PLUS_MINUS_SIGN,
821c6adce8SGreg Roach        "\xB2" => UTF8::CYRILLIC_CAPITAL_LETTER_BYELORUSSIAN_UKRAINIAN_I,
831c6adce8SGreg Roach        "\xB3" => UTF8::CYRILLIC_SMALL_LETTER_BYELORUSSIAN_UKRAINIAN_I,
841c6adce8SGreg Roach        "\xB4" => UTF8::CYRILLIC_SMALL_LETTER_GHE_WITH_UPTURN,
851c6adce8SGreg Roach        "\xB5" => UTF8::MICRO_SIGN,
861c6adce8SGreg Roach        "\xB6" => UTF8::PILCROW_SIGN,
871c6adce8SGreg Roach        "\xB7" => UTF8::MIDDLE_DOT,
881c6adce8SGreg Roach        "\xB8" => UTF8::CYRILLIC_SMALL_LETTER_IO,
891c6adce8SGreg Roach        "\xB9" => UTF8::NUMERO_SIGN,
901c6adce8SGreg Roach        "\xBA" => UTF8::CYRILLIC_SMALL_LETTER_UKRANIAN_IE,
911c6adce8SGreg Roach        "\xBB" => UTF8::RIGHT_POINTING_DOUBLE_ANGLE_QUOTATION_MARK,
921c6adce8SGreg Roach        "\xBC" => UTF8::CYRILLIC_SMALL_LETTER_JE,
931c6adce8SGreg Roach        "\xBD" => UTF8::CYRILLIC_CAPITAL_LETTER_DZE,
941c6adce8SGreg Roach        "\xBE" => UTF8::CYRILLIC_SMALL_LETTER_DZE,
951c6adce8SGreg Roach        "\xBF" => UTF8::CYRILLIC_SMALL_LETTER_YI,
961c6adce8SGreg Roach        "\xC0" => UTF8::CYRILLIC_CAPITAL_LETTER_A,
971c6adce8SGreg Roach        "\xC1" => UTF8::CYRILLIC_CAPITAL_LETTER_BE,
981c6adce8SGreg Roach        "\xC2" => UTF8::CYRILLIC_CAPITAL_LETTER_VE,
991c6adce8SGreg Roach        "\xC3" => UTF8::CYRILLIC_CAPITAL_LETTER_GHE,
1001c6adce8SGreg Roach        "\xC4" => UTF8::CYRILLIC_CAPITAL_LETTER_DE,
1011c6adce8SGreg Roach        "\xC5" => UTF8::CYRILLIC_CAPITAL_LETTER_IE,
1021c6adce8SGreg Roach        "\xC6" => UTF8::CYRILLIC_CAPITAL_LETTER_ZHE,
1031c6adce8SGreg Roach        "\xC7" => UTF8::CYRILLIC_CAPITAL_LETTER_ZE,
1041c6adce8SGreg Roach        "\xC8" => UTF8::CYRILLIC_CAPITAL_LETTER_I,
1051c6adce8SGreg Roach        "\xC9" => UTF8::CYRILLIC_CAPITAL_LETTER_SHORT_I,
1061c6adce8SGreg Roach        "\xCA" => UTF8::CYRILLIC_CAPITAL_LETTER_KA,
1071c6adce8SGreg Roach        "\xCB" => UTF8::CYRILLIC_CAPITAL_LETTER_EL,
1081c6adce8SGreg Roach        "\xCC" => UTF8::CYRILLIC_CAPITAL_LETTER_EM,
1091c6adce8SGreg Roach        "\xCD" => UTF8::CYRILLIC_CAPITAL_LETTER_EN,
1101c6adce8SGreg Roach        "\xCE" => UTF8::CYRILLIC_CAPITAL_LETTER_O,
1111c6adce8SGreg Roach        "\xCF" => UTF8::CYRILLIC_CAPITAL_LETTER_PE,
1121c6adce8SGreg Roach        "\xD0" => UTF8::CYRILLIC_CAPITAL_LETTER_ER,
1131c6adce8SGreg Roach        "\xD1" => UTF8::CYRILLIC_CAPITAL_LETTER_ES,
1141c6adce8SGreg Roach        "\xD2" => UTF8::CYRILLIC_CAPITAL_LETTER_TE,
1151c6adce8SGreg Roach        "\xD3" => UTF8::CYRILLIC_CAPITAL_LETTER_U,
1161c6adce8SGreg Roach        "\xD4" => UTF8::CYRILLIC_CAPITAL_LETTER_EF,
1171c6adce8SGreg Roach        "\xD5" => UTF8::CYRILLIC_CAPITAL_LETTER_HA,
1181c6adce8SGreg Roach        "\xD6" => UTF8::CYRILLIC_CAPITAL_LETTER_TSE,
1191c6adce8SGreg Roach        "\xD7" => UTF8::CYRILLIC_CAPITAL_LETTER_CHE,
1201c6adce8SGreg Roach        "\xD8" => UTF8::CYRILLIC_CAPITAL_LETTER_SHA,
1211c6adce8SGreg Roach        "\xD9" => UTF8::CYRILLIC_CAPITAL_LETTER_SHCHA,
1221c6adce8SGreg Roach        "\xDA" => UTF8::CYRILLIC_CAPITAL_LETTER_HARD_SIGN,
1231c6adce8SGreg Roach        "\xDB" => UTF8::CYRILLIC_CAPITAL_LETTER_YERU,
1241c6adce8SGreg Roach        "\xDC" => UTF8::CYRILLIC_CAPITAL_LETTER_SOFT_SIGN,
1251c6adce8SGreg Roach        "\xDD" => UTF8::CYRILLIC_CAPITAL_LETTER_E,
1261c6adce8SGreg Roach        "\xDE" => UTF8::CYRILLIC_CAPITAL_LETTER_YU,
1271c6adce8SGreg Roach        "\xDF" => UTF8::CYRILLIC_CAPITAL_LETTER_YA,
1281c6adce8SGreg Roach        "\xE0" => UTF8::CYRILLIC_SMALL_LETTER_A,
1291c6adce8SGreg Roach        "\xE1" => UTF8::CYRILLIC_SMALL_LETTER_BE,
1301c6adce8SGreg Roach        "\xE2" => UTF8::CYRILLIC_SMALL_LETTER_VE,
1311c6adce8SGreg Roach        "\xE3" => UTF8::CYRILLIC_SMALL_LETTER_GHE,
1321c6adce8SGreg Roach        "\xE4" => UTF8::CYRILLIC_SMALL_LETTER_DE,
1331c6adce8SGreg Roach        "\xE5" => UTF8::CYRILLIC_SMALL_LETTER_IE,
1341c6adce8SGreg Roach        "\xE6" => UTF8::CYRILLIC_SMALL_LETTER_ZHE,
1351c6adce8SGreg Roach        "\xE7" => UTF8::CYRILLIC_SMALL_LETTER_ZE,
1361c6adce8SGreg Roach        "\xE8" => UTF8::CYRILLIC_SMALL_LETTER_I,
1371c6adce8SGreg Roach        "\xE9" => UTF8::CYRILLIC_SMALL_LETTER_SHORT_I,
1381c6adce8SGreg Roach        "\xEA" => UTF8::CYRILLIC_SMALL_LETTER_KA,
1391c6adce8SGreg Roach        "\xEB" => UTF8::CYRILLIC_SMALL_LETTER_EL,
1401c6adce8SGreg Roach        "\xEC" => UTF8::CYRILLIC_SMALL_LETTER_EM,
1411c6adce8SGreg Roach        "\xED" => UTF8::CYRILLIC_SMALL_LETTER_EN,
1421c6adce8SGreg Roach        "\xEE" => UTF8::CYRILLIC_SMALL_LETTER_O,
1431c6adce8SGreg Roach        "\xEF" => UTF8::CYRILLIC_SMALL_LETTER_PE,
1441c6adce8SGreg Roach        "\xF0" => UTF8::CYRILLIC_SMALL_LETTER_ER,
1451c6adce8SGreg Roach        "\xF1" => UTF8::CYRILLIC_SMALL_LETTER_ES,
1461c6adce8SGreg Roach        "\xF2" => UTF8::CYRILLIC_SMALL_LETTER_TE,
1471c6adce8SGreg Roach        "\xF3" => UTF8::CYRILLIC_SMALL_LETTER_U,
1481c6adce8SGreg Roach        "\xF4" => UTF8::CYRILLIC_SMALL_LETTER_EF,
1491c6adce8SGreg Roach        "\xF5" => UTF8::CYRILLIC_SMALL_LETTER_HA,
1501c6adce8SGreg Roach        "\xF6" => UTF8::CYRILLIC_SMALL_LETTER_TSE,
1511c6adce8SGreg Roach        "\xF7" => UTF8::CYRILLIC_SMALL_LETTER_CHE,
1521c6adce8SGreg Roach        "\xF8" => UTF8::CYRILLIC_SMALL_LETTER_SHA,
1531c6adce8SGreg Roach        "\xF9" => UTF8::CYRILLIC_SMALL_LETTER_SHCHA,
1541c6adce8SGreg Roach        "\xFA" => UTF8::CYRILLIC_SMALL_LETTER_HARD_SIGN,
1551c6adce8SGreg Roach        "\xFB" => UTF8::CYRILLIC_SMALL_LETTER_YERU,
1561c6adce8SGreg Roach        "\xFC" => UTF8::CYRILLIC_SMALL_LETTER_SOFT_SIGN,
1571c6adce8SGreg Roach        "\xFD" => UTF8::CYRILLIC_SMALL_LETTER_E,
1581c6adce8SGreg Roach        "\xFE" => UTF8::CYRILLIC_SMALL_LETTER_YU,
1591c6adce8SGreg Roach        "\xFF" => UTF8::CYRILLIC_SMALL_LETTER_YA,
1601c6adce8SGreg Roach    ];
1611c6adce8SGreg Roach}
162