[ruby/prism] IBM857 encoding

8c9b580f84
This commit is contained in:
Kevin Newton 2023-11-12 00:11:14 -05:00 committed by git
parent 076d0957b9
commit a7df025c3f
4 changed files with 39 additions and 0 deletions

View file

@ -170,6 +170,7 @@ extern pm_encoding_t pm_encoding_ibm737;
extern pm_encoding_t pm_encoding_ibm775; extern pm_encoding_t pm_encoding_ibm775;
extern pm_encoding_t pm_encoding_ibm852; extern pm_encoding_t pm_encoding_ibm852;
extern pm_encoding_t pm_encoding_ibm855; extern pm_encoding_t pm_encoding_ibm855;
extern pm_encoding_t pm_encoding_ibm857;
extern pm_encoding_t pm_encoding_iso_8859_1; extern pm_encoding_t pm_encoding_iso_8859_1;
extern pm_encoding_t pm_encoding_iso_8859_2; extern pm_encoding_t pm_encoding_iso_8859_2;
extern pm_encoding_t pm_encoding_iso_8859_3; extern pm_encoding_t pm_encoding_iso_8859_3;

View file

@ -240,6 +240,30 @@ static uint8_t pm_encoding_ibm855_table[256] = {
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Fx 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Fx
}; };
/**
* Each element of the following table contains a bitfield that indicates a
* piece of information about the corresponding IBM857 character.
*/
static uint8_t pm_encoding_ibm857_table[256] = {
// 0 1 2 3 4 5 6 7 8 9 A B C D E F
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 0x
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 1x
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 2x
2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 0, 0, 0, 0, 0, 0, // 3x
0, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, // 4x
7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 0, 0, 0, 0, 0, // 5x
0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, // 6x
3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 0, 0, 0, 0, // 7x
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 8x
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 9x
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Ax
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Bx
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Cx
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Dx
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Ex
0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Fx
};
/** /**
* Each element of the following table contains a bitfield that indicates a * Each element of the following table contains a bitfield that indicates a
* piece of information about the corresponding ISO-8859-1 character. * piece of information about the corresponding ISO-8859-1 character.
@ -914,6 +938,7 @@ PRISM_ENCODING_TABLE(ibm737)
PRISM_ENCODING_TABLE(ibm775) PRISM_ENCODING_TABLE(ibm775)
PRISM_ENCODING_TABLE(ibm852) PRISM_ENCODING_TABLE(ibm852)
PRISM_ENCODING_TABLE(ibm855) PRISM_ENCODING_TABLE(ibm855)
PRISM_ENCODING_TABLE(ibm857)
PRISM_ENCODING_TABLE(iso_8859_1) PRISM_ENCODING_TABLE(iso_8859_1)
PRISM_ENCODING_TABLE(iso_8859_2) PRISM_ENCODING_TABLE(iso_8859_2)
PRISM_ENCODING_TABLE(iso_8859_3) PRISM_ENCODING_TABLE(iso_8859_3)
@ -1052,6 +1077,16 @@ pm_encoding_t pm_encoding_ibm855 = {
.multibyte = false .multibyte = false
}; };
/** IBM857 */
pm_encoding_t pm_encoding_ibm857 = {
.name = "IBM857",
.char_width = pm_encoding_single_char_width,
.alnum_char = pm_encoding_ibm857_alnum_char,
.alpha_char = pm_encoding_ibm857_alpha_char,
.isupper_char = pm_encoding_ibm857_isupper_char,
.multibyte = false
};
/** ISO-8859-1 */ /** ISO-8859-1 */
pm_encoding_t pm_encoding_iso_8859_1 = { pm_encoding_t pm_encoding_iso_8859_1 = {
.name = "ISO-8859-1", .name = "ISO-8859-1",

View file

@ -6071,6 +6071,7 @@ parser_lex_magic_comment_encoding_value(pm_parser_t *parser, const uint8_t *star
ENCODING1("CP850", pm_encoding_cp850); ENCODING1("CP850", pm_encoding_cp850);
ENCODING1("CP852", pm_encoding_cp852); ENCODING1("CP852", pm_encoding_cp852);
ENCODING1("CP855", pm_encoding_cp855); ENCODING1("CP855", pm_encoding_cp855);
ENCODING1("CP857", pm_encoding_ibm857);
ENCODING1("CP878", pm_encoding_koi8_r); ENCODING1("CP878", pm_encoding_koi8_r);
ENCODING2("CP932", "csWindows31J", pm_encoding_windows_31j); ENCODING2("CP932", "csWindows31J", pm_encoding_windows_31j);
ENCODING1("CP936", pm_encoding_gbk); ENCODING1("CP936", pm_encoding_gbk);
@ -6104,6 +6105,7 @@ parser_lex_magic_comment_encoding_value(pm_parser_t *parser, const uint8_t *star
ENCODING1("IBM850", pm_encoding_cp850); ENCODING1("IBM850", pm_encoding_cp850);
ENCODING1("IBM852", pm_encoding_ibm852); ENCODING1("IBM852", pm_encoding_ibm852);
ENCODING1("IBM855", pm_encoding_ibm855); ENCODING1("IBM855", pm_encoding_ibm855);
ENCODING1("IBM857", pm_encoding_ibm857);
ENCODING2("ISO-8859-1", "ISO8859-1", pm_encoding_iso_8859_1); ENCODING2("ISO-8859-1", "ISO8859-1", pm_encoding_iso_8859_1);
ENCODING2("ISO-8859-2", "ISO8859-2", pm_encoding_iso_8859_2); ENCODING2("ISO-8859-2", "ISO8859-2", pm_encoding_iso_8859_2);
ENCODING2("ISO-8859-3", "ISO8859-3", pm_encoding_iso_8859_3); ENCODING2("ISO-8859-3", "ISO8859-3", pm_encoding_iso_8859_3);

View file

@ -20,6 +20,7 @@ module Prism
Encoding::IBM775, Encoding::IBM775,
Encoding::IBM852, Encoding::IBM852,
Encoding::IBM855, Encoding::IBM855,
Encoding::IBM857,
Encoding::ISO_8859_1, Encoding::ISO_8859_1,
Encoding::ISO_8859_2, Encoding::ISO_8859_2,
Encoding::ISO_8859_3, Encoding::ISO_8859_3,