[ruby/prism] feat: Adds macCroatian encoding
(https://github.com/ruby/prism/pull/1880) * feat: Adds macCroatian encoding - Based on: https://en.wikipedia.org/wiki/Mac_OS_Croatian_encoding https://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/CROATIAN.TXT Co-authored-by: Josefine Rost <nijrost@gmail.com> * Use output from bin/encodings and adds to docs/encoding.md --------- https://github.com/ruby/prism/commit/019a82d8f3 Co-authored-by: Josefine Rost <nijrost@gmail.com>
This commit is contained in:
parent
f2ed7eaba0
commit
f9fb05f9d0
@ -196,6 +196,7 @@ extern pm_encoding_t pm_encoding_iso_8859_15;
|
|||||||
extern pm_encoding_t pm_encoding_iso_8859_16;
|
extern pm_encoding_t pm_encoding_iso_8859_16;
|
||||||
extern pm_encoding_t pm_encoding_koi8_r;
|
extern pm_encoding_t pm_encoding_koi8_r;
|
||||||
extern pm_encoding_t pm_encoding_mac_cent_euro;
|
extern pm_encoding_t pm_encoding_mac_cent_euro;
|
||||||
|
extern pm_encoding_t pm_encoding_mac_croatian;
|
||||||
extern pm_encoding_t pm_encoding_mac_cyrillic;
|
extern pm_encoding_t pm_encoding_mac_cyrillic;
|
||||||
extern pm_encoding_t pm_encoding_mac_greek;
|
extern pm_encoding_t pm_encoding_mac_greek;
|
||||||
extern pm_encoding_t pm_encoding_mac_iceland;
|
extern pm_encoding_t pm_encoding_mac_iceland;
|
||||||
|
@ -841,6 +841,30 @@ static uint8_t pm_encoding_mac_cent_euro_table[256] = {
|
|||||||
};
|
};
|
||||||
|
|
||||||
/**
|
/**
|
||||||
|
* Each element of the following table contains a bitfield that indicates a
|
||||||
|
* piece of information about the corresponding macCroatian character.
|
||||||
|
*/
|
||||||
|
static uint8_t pm_encoding_mac_croatian_table[256] = {
|
||||||
|
// 0 1 2 3 4 5 6 7 8 9 A B C D E F
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 0x
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 1x
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 2x
|
||||||
|
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 0, 0, 0, 0, 0, 0, // 3x
|
||||||
|
0, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, // 4x
|
||||||
|
7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 0, 0, 0, 0, 0, // 5x
|
||||||
|
0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, // 6x
|
||||||
|
3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 0, 0, 0, 0, // 7x
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 8x
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 9x
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Ax
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Bx
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Cx
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Dx
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Ex
|
||||||
|
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Fx
|
||||||
|
};
|
||||||
|
|
||||||
|
/**
|
||||||
* Each element of the following table contains a bitfield that indicates a
|
* Each element of the following table contains a bitfield that indicates a
|
||||||
* piece of information about the corresponding macCyrillic character.
|
* piece of information about the corresponding macCyrillic character.
|
||||||
*/
|
*/
|
||||||
@ -1371,6 +1395,7 @@ PRISM_ENCODING_TABLE(iso_8859_15)
|
|||||||
PRISM_ENCODING_TABLE(iso_8859_16)
|
PRISM_ENCODING_TABLE(iso_8859_16)
|
||||||
PRISM_ENCODING_TABLE(koi8_r)
|
PRISM_ENCODING_TABLE(koi8_r)
|
||||||
PRISM_ENCODING_TABLE(mac_cent_euro)
|
PRISM_ENCODING_TABLE(mac_cent_euro)
|
||||||
|
PRISM_ENCODING_TABLE(mac_croatian)
|
||||||
PRISM_ENCODING_TABLE(mac_cyrillic)
|
PRISM_ENCODING_TABLE(mac_cyrillic)
|
||||||
PRISM_ENCODING_TABLE(mac_greek)
|
PRISM_ENCODING_TABLE(mac_greek)
|
||||||
PRISM_ENCODING_TABLE(mac_iceland)
|
PRISM_ENCODING_TABLE(mac_iceland)
|
||||||
@ -1752,6 +1777,16 @@ pm_encoding_t pm_encoding_mac_cent_euro = {
|
|||||||
.multibyte = false
|
.multibyte = false
|
||||||
};
|
};
|
||||||
|
|
||||||
|
/** macCroatian */
|
||||||
|
pm_encoding_t pm_encoding_mac_croatian = {
|
||||||
|
.name = "macCroatian",
|
||||||
|
.char_width = pm_encoding_single_char_width,
|
||||||
|
.alnum_char = pm_encoding_mac_croatian_alnum_char,
|
||||||
|
.alpha_char = pm_encoding_mac_croatian_alpha_char,
|
||||||
|
.isupper_char = pm_encoding_mac_croatian_isupper_char,
|
||||||
|
.multibyte = false
|
||||||
|
};
|
||||||
|
|
||||||
/** macCyrillic */
|
/** macCyrillic */
|
||||||
pm_encoding_t pm_encoding_mac_cyrillic = {
|
pm_encoding_t pm_encoding_mac_cyrillic = {
|
||||||
.name = "macCyrillic",
|
.name = "macCyrillic",
|
||||||
|
@ -6145,6 +6145,7 @@ parser_lex_magic_comment_encoding_value(pm_parser_t *parser, const uint8_t *star
|
|||||||
break;
|
break;
|
||||||
case 'M': case 'm':
|
case 'M': case 'm':
|
||||||
ENCODING1("macCentEuro", pm_encoding_mac_cent_euro);
|
ENCODING1("macCentEuro", pm_encoding_mac_cent_euro);
|
||||||
|
ENCODING1("macCroatian", pm_encoding_mac_croatian);
|
||||||
ENCODING1("macCyrillic", pm_encoding_mac_cyrillic);
|
ENCODING1("macCyrillic", pm_encoding_mac_cyrillic);
|
||||||
ENCODING1("macGreek", pm_encoding_mac_greek);
|
ENCODING1("macGreek", pm_encoding_mac_greek);
|
||||||
ENCODING1("macIceland", pm_encoding_mac_iceland);
|
ENCODING1("macIceland", pm_encoding_mac_iceland);
|
||||||
|
@ -43,6 +43,7 @@ module Prism
|
|||||||
Encoding::ISO_8859_16 => 0x00...0x100,
|
Encoding::ISO_8859_16 => 0x00...0x100,
|
||||||
Encoding::KOI8_R => 0x00...0x100,
|
Encoding::KOI8_R => 0x00...0x100,
|
||||||
Encoding::MACCENTEURO => 0x00...0x100,
|
Encoding::MACCENTEURO => 0x00...0x100,
|
||||||
|
Encoding::MACCROATIAN => 0x00...0x100,
|
||||||
Encoding::MACCYRILLIC => 0x00...0x100,
|
Encoding::MACCYRILLIC => 0x00...0x100,
|
||||||
Encoding::MACGREEK => 0x00...0x100,
|
Encoding::MACGREEK => 0x00...0x100,
|
||||||
Encoding::MACICELAND => 0x00...0x100,
|
Encoding::MACICELAND => 0x00...0x100,
|
||||||
|
Loading…
x
Reference in New Issue
Block a user