aboutsummaryrefslogtreecommitdiffstats
path: root/prism
diff options
context:
space:
mode:
authorLynne Ashminov <47822041+lynne-ashminov@users.noreply.github.com>2023-11-20 15:06:10 -0500
committergit <svn-admin@ruby-lang.org>2023-11-20 20:06:14 +0000
commit307a5cb20b3e34f6a3bd240e70ddc26bd268ace3 (patch)
treed6a811d8429d861125ba380a5ba7683238c37b4f /prism
parent9fbdb26f06822305781a7fa12db1ee7249dbd0a8 (diff)
downloadruby-307a5cb20b3e34f6a3bd240e70ddc26bd268ace3.tar.gz
[ruby/prism] adds encodings for ibm869
(https://github.com/ruby/prism/pull/1886) https://github.com/ruby/prism/commit/41462400b7
Diffstat (limited to 'prism')
-rw-r--r--prism/enc/pm_encoding.h1
-rw-r--r--prism/enc/pm_tables.c35
-rw-r--r--prism/prism.c2
3 files changed, 38 insertions, 0 deletions
diff --git a/prism/enc/pm_encoding.h b/prism/enc/pm_encoding.h
index 0cccd5a58d..1785a842cc 100644
--- a/prism/enc/pm_encoding.h
+++ b/prism/enc/pm_encoding.h
@@ -180,6 +180,7 @@ extern pm_encoding_t pm_encoding_ibm863;
extern pm_encoding_t pm_encoding_ibm864;
extern pm_encoding_t pm_encoding_ibm865;
extern pm_encoding_t pm_encoding_ibm866;
+extern pm_encoding_t pm_encoding_ibm869;
extern pm_encoding_t pm_encoding_iso_8859_1;
extern pm_encoding_t pm_encoding_iso_8859_2;
extern pm_encoding_t pm_encoding_iso_8859_3;
diff --git a/prism/enc/pm_tables.c b/prism/enc/pm_tables.c
index c726b99887..70a44720ca 100644
--- a/prism/enc/pm_tables.c
+++ b/prism/enc/pm_tables.c
@@ -458,6 +458,30 @@ static uint8_t pm_encoding_ibm866_table[256] = {
/**
* Each element of the following table contains a bitfield that indicates a
+ * piece of information about the corresponding IBM869 character.
+ */
+static uint8_t pm_encoding_ibm869_table[256] = {
+// 0 1 2 3 4 5 6 7 8 9 A B C D E F
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 0x
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 1x
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 2x
+ 2, 2, 2, 2, 2, 2, 2, 2, 2, 2, 0, 0, 0, 0, 0, 0, // 3x
+ 0, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, // 4x
+ 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 7, 0, 0, 0, 0, 0, // 5x
+ 0, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, // 6x
+ 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 3, 0, 0, 0, 0, 0, // 7x
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 8x
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // 9x
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Ax
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Bx
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Cx
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Dx
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Ex
+ 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, // Fx
+};
+
+/**
+ * Each element of the following table contains a bitfield that indicates a
* piece of information about the corresponding ISO-8859-1 character.
*/
static uint8_t pm_encoding_iso_8859_1_table[256] = {
@@ -1403,6 +1427,7 @@ PRISM_ENCODING_TABLE(ibm863)
PRISM_ENCODING_TABLE(ibm864)
PRISM_ENCODING_TABLE(ibm865)
PRISM_ENCODING_TABLE(ibm866)
+PRISM_ENCODING_TABLE(ibm869)
PRISM_ENCODING_TABLE(iso_8859_1)
PRISM_ENCODING_TABLE(iso_8859_2)
PRISM_ENCODING_TABLE(iso_8859_3)
@@ -1642,6 +1667,16 @@ pm_encoding_t pm_encoding_ibm866 = {
.multibyte = false
};
+/** IBM869 */
+pm_encoding_t pm_encoding_ibm869 = {
+ .name = "IBM869",
+ .char_width = pm_encoding_single_char_width,
+ .alnum_char = pm_encoding_ibm869_alnum_char,
+ .alpha_char = pm_encoding_ibm869_alpha_char,
+ .isupper_char = pm_encoding_ibm869_isupper_char,
+ .multibyte = false
+};
+
/** ISO-8859-1 */
pm_encoding_t pm_encoding_iso_8859_1 = {
.name = "ISO-8859-1",
diff --git a/prism/prism.c b/prism/prism.c
index 4935bdc4bf..f041fb5167 100644
--- a/prism/prism.c
+++ b/prism/prism.c
@@ -6089,6 +6089,7 @@ parser_lex_magic_comment_encoding_value(pm_parser_t *parser, const uint8_t *star
ENCODING1("CP864", pm_encoding_ibm864);
ENCODING1("CP865", pm_encoding_ibm865);
ENCODING1("CP866", pm_encoding_ibm866);
+ ENCODING1("CP869", pm_encoding_ibm869);
ENCODING1("CP874", pm_encoding_windows_874);
ENCODING1("CP878", pm_encoding_koi8_r);
ENCODING1("CP863", pm_encoding_ibm863);
@@ -6133,6 +6134,7 @@ parser_lex_magic_comment_encoding_value(pm_parser_t *parser, const uint8_t *star
ENCODING1("IBM864", pm_encoding_ibm864);
ENCODING1("IBM865", pm_encoding_ibm865);
ENCODING1("IBM866", pm_encoding_ibm866);
+ ENCODING1("IBM869", pm_encoding_ibm869);
ENCODING2("ISO-8859-1", "ISO8859-1", pm_encoding_iso_8859_1);
ENCODING2("ISO-8859-2", "ISO8859-2", pm_encoding_iso_8859_2);
ENCODING2("ISO-8859-3", "ISO8859-3", pm_encoding_iso_8859_3);