summaryrefslogtreecommitdiff
path: root/src/charset.c
diff options
context:
space:
mode:
authorKenichi Handa <handa@m17n.org>2008-11-27 08:00:16 +0000
committerKenichi Handa <handa@m17n.org>2008-11-27 08:00:16 +0000
commitecca2aad92d1b528fffbebba5867183b110a6fa9 (patch)
tree94b74a250554307f1cd86aa617eb6962bc50d688 /src/charset.c
parent55870ffc30547ff5dacd37db45fed4b38a0dd7e6 (diff)
downloademacs-ecca2aad92d1b528fffbebba5867183b110a6fa9.tar.gz
(Vchar_unified_charset_table): Delete it.
(inhibit_load_charset_map): New variable. (temp_charset_work): New variable. (SET_TEMP_CHARSET_WORK_ENCODER, GET_TEMP_CHARSET_WORK_ENCODER) (SET_TEMP_CHARSET_WORK_DECODER, GET_TEMP_CHARSET_WORK_DECODER): New macros. (load_charset_map): Meaning of control_flag changed. If inhibit_load_charset_map is nonzero, setup a table in temp_charset_work. (load_charset): New argument control_flag. (map_charset_for_dump): New function. (map_charset_chars): If inhibit_load_charset_map is nonzero, use map_charset_for_dump. (Fdefine_charset_internal): If the charset method is MAP, load mapping tables by calling load_charset. (Funify_charset): Don't load a mapping table but directly set Vchar_unify_table. (maybe_unify_char): New function. (decode_char): Don't handle the deleted method MAP_DEFERRED. Handle the case of inhibit_load_charset_map being nonzero. (encode_char): Don't handle the deleted method MAP_DEFERRED. Handle the case of inhibit_load_charset_map being nonzero. (Fclear_charset_maps): Just free temp_charset_work. (syms_of_charset): Make `inhibit-load-charset-map' a Lisp variable.
Diffstat (limited to 'src/charset.c')
-rw-r--r--src/charset.c563
1 files changed, 385 insertions, 178 deletions
diff --git a/src/charset.c b/src/charset.c
index 43155d2cc65..3c52d1f333f 100644
--- a/src/charset.c
+++ b/src/charset.c
@@ -120,7 +120,8 @@ int iso_charset_table[ISO_MAX_DIMENSION][ISO_MAX_CHARS][ISO_MAX_FINAL];
Lisp_Object Vcharset_map_path;
-Lisp_Object Vchar_unified_charset_table;
+/* If nonzero, don't load charset maps. */
+int inhibit_load_charset_map;
Lisp_Object Vcurrent_iso639_language;
@@ -166,7 +167,63 @@ map_char_table_for_charset P_ ((void (*c_function) (Lisp_Object, Lisp_Object),
| (((charset)->code_space[12] + ((idx) / (charset)->code_space[11])) \
<< 24))))
+/* Structure to hold mapping tables for a charset. Used by temacs
+ invoked for dumping. */
+static struct
+{
+ /* The current charset for which the following tables are setup. */
+ struct charset *current;
+
+ /* 1 iff the following table is used for encoder. */
+ short for_encoder;
+
+ /* When the following table is used for encoding, mininum and
+ maxinum character of the current charset. */
+ int min_char, max_char;
+
+ /* A Unicode character correspoinding to the code indice 0 (i.e. the
+ minimum code-point) of the current charset, or -1 if the code
+ indice 0 is not a Unicode character. This is checked when
+ table.encoder[CHAR] is zero. */
+ int zero_index_char;
+
+ union {
+ /* Table mapping code-indices (not code-points) of the current
+ charset to Unicode characters. If decoder[CHAR] is -1, CHAR
+ doesn't belong to the current charset. */
+ int decoder[0x10000];
+ /* Table mapping Unicode characters to code-indices of the current
+ charset. The first 0x10000 elements are for BMP (0..0xFFFF),
+ and the last 0x10000 are for SMP (0x10000..0x1FFFF) or SIP
+ (0x20000..0x2FFFF). Note that there is no charset map that
+ uses both SMP and SIP. */
+ unsigned short encoder[0x20000];
+ } table;
+} *temp_charset_work;
+
+#define SET_TEMP_CHARSET_WORK_ENCODER(C, CODE) \
+ do { \
+ if ((CODE) == 0) \
+ temp_charset_work->zero_index_char = (C); \
+ else if ((C) < 0x20000) \
+ temp_charset_work->table.encoder[(C)] = (CODE); \
+ else \
+ temp_charset_work->table.encoder[(C) - 0x10000] = (CODE); \
+ } while (0)
+
+#define GET_TEMP_CHARSET_WORK_ENCODER(C) \
+ ((C) == temp_charset_work->zero_index_char ? 0 \
+ : (C) < 0x20000 ? (temp_charset_work->table.encoder[(C)] \
+ ? (int) temp_charset_work->table.encoder[(C)] : -1) \
+ : temp_charset_work->table.encoder[(C) - 0x10000] \
+ ? temp_charset_work->table.encoder[(C) - 0x10000] : -1)
+
+#define SET_TEMP_CHARSET_WORK_DECODER(C, CODE) \
+ (temp_charset_work->table.decoder[(CODE)] = (C))
+
+#define GET_TEMP_CHARSET_WORK_DECODER(CODE) \
+ (temp_charset_work->table.decoder[(CODE)])
/* Set to 1 to warn that a charset map is loaded and thus a buffer
@@ -182,16 +239,30 @@ struct charset_map_entries
struct charset_map_entries *next;
};
-/* Load the mapping information for CHARSET from ENTRIES.
+/* Load the mapping information of CHARSET from ENTRIES for
+ initializing (CONTROL_FLAG == 0), decoding (CONTROL_FLAG == 1), and
+ encoding (CONTROL_FLAG == 2).
+
+ If CONTROL_FLAG is 0, setup CHARSET->min_char, CHARSET->max_char,
+ and CHARSET->fast_map.
+
+ If CONTROL_FLAG is 1, setup the following tables according to
+ CHARSET->method and inhibit_load_charset_map.
- If CONTROL_FLAG is 0, setup CHARSET->min_char and CHARSET->max_char.
+ CHARSET->method | inhibit_lcm == 0 | inhibit_lcm == 1
+ ----------------------+--------------------+---------------------------
+ CHARSET_METHOD_MAP | CHARSET->decoder | temp_charset_work->decoder
+ ----------------------+--------------------+---------------------------
+ CHARSET_METHOD_OFFSET | Vchar_unify_table | temp_charset_work->decoder
- If CONTROL_FLAG is 1, setup CHARSET->min_char, CHARSET->max_char,
- CHARSET->decoder, and CHARSET->encoder.
+ If CONTROL_FLAG is 2, setup the following tables.
- If CONTROL_FLAG is 2, setup CHARSET->deunifier and
- Vchar_unify_table. If Vchar_unified_charset_table is non-nil,
- setup it too. */
+ CHARSET->method | inhibit_lcm == 0 | inhibit_lcm == 1
+ ----------------------+--------------------+---------------------------
+ CHARSET_METHOD_MAP | CHARSET->encoder | temp_charset_work->encoder
+ ----------------------+--------------------+--------------------------
+ CHARSET_METHOD_OFFSET | CHARSET->deunifier | temp_charset_work->encoder
+*/
static void
load_charset_map (charset, entries, n_entries, control_flag)
@@ -210,16 +281,55 @@ load_charset_map (charset, entries, n_entries, control_flag)
if (n_entries <= 0)
return;
- if (control_flag > 0)
+ if (control_flag)
{
- int n = CODE_POINT_TO_INDEX (charset, max_code) + 1;
-
- table = Fmake_char_table (Qnil, Qnil);
- if (control_flag == 1)
- vec = Fmake_vector (make_number (n), make_number (-1));
- else if (! CHAR_TABLE_P (Vchar_unify_table))
- Vchar_unify_table = Fmake_char_table (Qnil, Qnil);
+ if (! inhibit_load_charset_map)
+ {
+ if (control_flag == 1)
+ {
+ if (charset->method == CHARSET_METHOD_MAP)
+ {
+ int n = CODE_POINT_TO_INDEX (charset, max_code) + 1;
+ vec = CHARSET_DECODER (charset)
+ = Fmake_vector (make_number (n), make_number (-1));
+ }
+ else
+ {
+ char_table_set_range (Vchar_unify_table,
+ charset->min_char, charset->max_char,
+ Qnil);
+ }
+ }
+ else
+ {
+ table = Fmake_char_table (Qnil, Qnil);
+ if (charset->method == CHARSET_METHOD_MAP)
+ CHARSET_ENCODER (charset) = table;
+ else
+ CHARSET_DEUNIFIER (charset) = table;
+ }
+ }
+ else
+ {
+ if (! temp_charset_work)
+ temp_charset_work = malloc (sizeof (*temp_charset_work));
+ if (control_flag == 1)
+ {
+ memset (temp_charset_work->table.decoder, -1,
+ sizeof (int) * 0x10000);
+ temp_charset_work->for_encoder = 0;
+ }
+ else
+ {
+ memset (temp_charset_work->table.encoder, 0,
+ sizeof (unsigned short) * 0x20000);
+ temp_charset_work->zero_index_char = -1;
+ }
+ temp_charset_work->current = charset;
+ temp_charset_work->for_encoder = (control_flag == 2);
+ control_flag += 2;
+ }
charset_map_loaded = 1;
}
@@ -251,14 +361,48 @@ load_charset_map (charset, entries, n_entries, control_flag)
if (from_index < 0 || to_index < 0)
continue;
- if (control_flag < 2)
- {
- int c;
+ if (to_c > max_char)
+ max_char = to_c;
+ else if (from_c < min_char)
+ min_char = from_c;
- if (to_c > max_char)
- max_char = to_c;
- else if (from_c < min_char)
- min_char = from_c;
+ if (control_flag == 1)
+ {
+ if (charset->method == CHARSET_METHOD_MAP)
+ for (; from_index <= to_index; from_index++, from_c++)
+ ASET (vec, from_index, make_number (from_c));
+ else
+ for (; from_index <= to_index; from_index++, from_c++)
+ CHAR_TABLE_SET (Vchar_unify_table,
+ CHARSET_CODE_OFFSET (charset) + from_index,
+ make_number (from_c));
+ }
+ else if (control_flag == 2)
+ {
+ if (charset->method == CHARSET_METHOD_MAP
+ && CHARSET_COMPACT_CODES_P (charset))
+ for (; from_index <= to_index; from_index++, from_c++)
+ {
+ unsigned code = INDEX_TO_CODE_POINT (charset, from_index);
+
+ if (NILP (CHAR_TABLE_REF (table, from_c)))
+ CHAR_TABLE_SET (table, from_c, make_number (code));
+ }
+ else
+ for (; from_index <= to_index; from_index++, from_c++)
+ {
+ if (NILP (CHAR_TABLE_REF (table, from_c)))
+ CHAR_TABLE_SET (table, from_c, make_number (from_index));
+ }
+ }
+ else if (control_flag == 3)
+ for (; from_index <= to_index; from_index++, from_c++)
+ SET_TEMP_CHARSET_WORK_DECODER (from_c, from_index);
+ else if (control_flag == 4)
+ for (; from_index <= to_index; from_index++, from_c++)
+ SET_TEMP_CHARSET_WORK_ENCODER (from_c, from_index);
+ else /* control_flag == 0 */
+ {
if (ascii_compatible_p)
{
if (! ASCII_BYTE_P (from_c))
@@ -272,70 +416,22 @@ load_charset_map (charset, entries, n_entries, control_flag)
}
}
- for (c = from_c; c <= to_c; c++)
- CHARSET_FAST_MAP_SET (c, fast_map);
-
- if (control_flag == 1)
- {
- unsigned code = from;
-
- if (CHARSET_COMPACT_CODES_P (charset))
- while (1)
- {
- ASET (vec, from_index, make_number (from_c));
- if (NILP (CHAR_TABLE_REF (table, from_c)))
- CHAR_TABLE_SET (table, from_c, make_number (code));
- if (from_index == to_index)
- break;
- from_index++, from_c++;
- code = INDEX_TO_CODE_POINT (charset, from_index);
- }
- else
- for (; from_index <= to_index; from_index++, from_c++)
- {
- ASET (vec, from_index, make_number (from_c));
- if (NILP (CHAR_TABLE_REF (table, from_c)))
- CHAR_TABLE_SET (table, from_c, make_number (from_index));
- }
- }
- }
- else
- {
- unsigned code = from;
-
- while (1)
- {
- int c1 = DECODE_CHAR (charset, code);
-
- if (c1 >= 0)
- {
- CHAR_TABLE_SET (table, from_c, make_number (c1));
- CHAR_TABLE_SET (Vchar_unify_table, c1, make_number (from_c));
- if (CHAR_TABLE_P (Vchar_unified_charset_table))
- CHAR_TABLE_SET (Vchar_unified_charset_table, c1,
- CHARSET_NAME (charset));
- }
- if (from_index == to_index)
- break;
- from_index++, from_c++;
- code = INDEX_TO_CODE_POINT (charset, from_index);
- }
+ for (; from_c <= to_c; from_c++)
+ CHARSET_FAST_MAP_SET (from_c, fast_map);
}
}
- if (control_flag < 2)
+ if (control_flag == 0)
{
CHARSET_MIN_CHAR (charset) = (ascii_compatible_p
? nonascii_min_char : min_char);
CHARSET_MAX_CHAR (charset) = max_char;
- if (control_flag == 1)
- {
- CHARSET_DECODER (charset) = vec;
- CHARSET_ENCODER (charset) = table;
- }
}
- else
- CHARSET_DEUNIFIER (charset) = table;
+ else if (control_flag == 4)
+ {
+ temp_charset_work->min_char = min_char;
+ temp_charset_work->max_char = max_char;
+ }
}
@@ -531,21 +627,31 @@ load_charset_map_from_vector (charset, vec, control_flag)
load_charset_map (charset, head, n_entries, control_flag);
}
+
+/* Load a mapping table for CHARSET. CONTROL-FLAG tells what kind of
+ map it is (see the comment of load_charset_map for the detail). */
+
static void
-load_charset (charset)
+load_charset (charset, control_flag)
struct charset *charset;
+ int control_flag;
{
- if (CHARSET_METHOD (charset) == CHARSET_METHOD_MAP_DEFERRED)
- {
- Lisp_Object map;
+ Lisp_Object map;
- map = CHARSET_MAP (charset);
- if (STRINGP (map))
- load_charset_map_from_file (charset, map, 1);
- else
- load_charset_map_from_vector (charset, map, 1);
- CHARSET_METHOD (charset) = CHARSET_METHOD_MAP;
- }
+ if (inhibit_load_charset_map
+ && temp_charset_work
+ && charset == temp_charset_work->current
+ && (control_flag == 2 == temp_charset_work->for_encoder))
+ return;
+
+ if (CHARSET_METHOD (charset) == CHARSET_METHOD_MAP)
+ map = CHARSET_MAP (charset);
+ else if (CHARSET_UNIFIED_P (charset))
+ map = CHARSET_UNIFY_MAP (charset);
+ if (STRINGP (map))
+ load_charset_map_from_file (charset, map, control_flag);
+ else
+ load_charset_map_from_vector (charset, map, control_flag);
}
@@ -558,6 +664,68 @@ DEFUN ("charsetp", Fcharsetp, Scharsetp, 1, 1, 0,
}
+void map_charset_for_dump P_ ((void (*c_function) (Lisp_Object, Lisp_Object),
+ Lisp_Object function, Lisp_Object arg,
+ unsigned from, unsigned to));
+
+void
+map_charset_for_dump (c_function, function, arg, from, to)
+ void (*c_function) (Lisp_Object, Lisp_Object);
+ Lisp_Object function, arg;
+ unsigned from, to;
+{
+ int from_idx = CODE_POINT_TO_INDEX (temp_charset_work->current, from);
+ int to_idx = CODE_POINT_TO_INDEX (temp_charset_work->current, to);
+ Lisp_Object range;
+ int c, stop;
+ struct gcpro gcpro1;
+
+ range = Fcons (Qnil, Qnil);
+ GCPRO1 (range);
+
+ c = temp_charset_work->min_char;
+ stop = (temp_charset_work->max_char < 0x20000
+ ? temp_charset_work->max_char : 0xFFFF);
+
+ while (1)
+ {
+ int index = GET_TEMP_CHARSET_WORK_ENCODER (c);
+
+ if (index >= from_idx && index <= to_idx)
+ {
+ if (NILP (XCAR (range)))
+ XSETCAR (range, make_number (c));
+ }
+ else if (! NILP (XCAR (range)))
+ {
+ XSETCDR (range, make_number (c - 1));
+ if (c_function)
+ (*c_function) (arg, range);
+ else
+ call2 (function, range, arg);
+ XSETCAR (range, Qnil);
+ }
+ if (c == stop)
+ {
+ if (c == temp_charset_work->max_char)
+ {
+ if (! NILP (XCAR (range)))
+ {
+ XSETCDR (range, make_number (c));
+ if (c_function)
+ (*c_function) (arg, range);
+ else
+ call2 (function, range, arg);
+ }
+ break;
+ }
+ c = 0x1FFFF;
+ stop = temp_charset_work->max_char;
+ }
+ c++;
+ }
+}
+
void
map_charset_chars (c_function, function, arg,
charset, from, to)
@@ -569,20 +737,9 @@ map_charset_chars (c_function, function, arg,
Lisp_Object range;
int partial;
- if (CHARSET_METHOD (charset) == CHARSET_METHOD_MAP_DEFERRED)
- load_charset (charset);
-
partial = (from > CHARSET_MIN_CODE (charset)
|| to < CHARSET_MAX_CODE (charset));
- if (CHARSET_UNIFIED_P (charset)
- && CHAR_TABLE_P (CHARSET_DEUNIFIER (charset)))
- {
- map_char_table_for_charset (c_function, function,
- CHARSET_DEUNIFIER (charset), arg,
- partial ? charset : NULL, from, to);
- }
-
if (CHARSET_METHOD (charset) == CHARSET_METHOD_OFFSET)
{
int from_idx = CODE_POINT_TO_INDEX (charset, from);
@@ -590,6 +747,18 @@ map_charset_chars (c_function, function, arg,
int from_c = from_idx + CHARSET_CODE_OFFSET (charset);
int to_c = to_idx + CHARSET_CODE_OFFSET (charset);
+ if (CHARSET_UNIFIED_P (charset))
+ {
+ if (! CHAR_TABLE_P (CHARSET_DEUNIFIER (charset)))
+ load_charset (charset, 2);
+ if (CHAR_TABLE_P (CHARSET_DEUNIFIER (charset)))
+ map_char_table_for_charset (c_function, function,
+ CHARSET_DEUNIFIER (charset), arg,
+ partial ? charset : NULL, from, to);
+ else
+ map_charset_for_dump (c_function, function, arg, from, to);
+ }
+
range = Fcons (make_number (from_c), make_number (to_c));
if (NILP (function))
(*c_function) (arg, range);
@@ -599,10 +768,13 @@ map_charset_chars (c_function, function, arg,
else if (CHARSET_METHOD (charset) == CHARSET_METHOD_MAP)
{
if (! CHAR_TABLE_P (CHARSET_ENCODER (charset)))
- return;
- map_char_table_for_charset (c_function, function,
- CHARSET_ENCODER (charset), arg,
- partial ? charset : NULL, from, to);
+ load_charset (charset, 2);
+ if (CHAR_TABLE_P (CHARSET_ENCODER (charset)))
+ map_char_table_for_charset (c_function, function,
+ CHARSET_ENCODER (charset), arg,
+ partial ? charset : NULL, from, to);
+ else
+ map_charset_for_dump (c_function, function, arg, from, to);
}
else if (CHARSET_METHOD (charset) == CHARSET_METHOD_SUBSET)
{
@@ -821,7 +993,7 @@ usage: (define-charset-internal ...) */)
charset.max_code = code;
}
- charset.compact_codes_p = charset.max_code < 0x1000000;
+ charset.compact_codes_p = charset.max_code < 0x10000;
val = args[charset_arg_invalid_code];
if (NILP (val))
@@ -910,11 +1082,7 @@ usage: (define-charset-internal ...) */)
{
val = args[charset_arg_map];
ASET (attrs, charset_map, val);
- if (STRINGP (val))
- load_charset_map_from_file (&charset, val, 0);
- else
- load_charset_map_from_vector (&charset, val, 0);
- charset.method = CHARSET_METHOD_MAP_DEFERRED;
+ charset.method = CHARSET_METHOD_MAP;
}
else if (! NILP (args[charset_arg_subset]))
{
@@ -1030,6 +1198,9 @@ usage: (define-charset-internal ...) */)
charset.id = id;
charset_table[id] = charset;
+ if (charset.method == CHARSET_METHOD_MAP)
+ load_charset (&charset, 0);
+
if (charset.iso_final >= 0)
{
ISO_CHARSET_TABLE (charset.dimension, charset.iso_chars_96,
@@ -1219,8 +1390,6 @@ Optional third argument DEUNIFY, if non-nil, means to de-unify CHARSET. */)
CHECK_CHARSET_GET_ID (charset, id);
cs = CHARSET_FROM_ID (id);
- if (CHARSET_METHOD (cs) == CHARSET_METHOD_MAP_DEFERRED)
- load_charset (cs);
if (NILP (deunify)
? CHARSET_UNIFIED_P (cs) && ! NILP (CHARSET_DEUNIFIER (cs))
: ! CHARSET_UNIFIED_P (cs))
@@ -1229,18 +1398,21 @@ Optional third argument DEUNIFY, if non-nil, means to de-unify CHARSET. */)
CHARSET_UNIFIED_P (cs) = 0;
if (NILP (deunify))
{
- if (CHARSET_METHOD (cs) != CHARSET_METHOD_OFFSET)
+ if (CHARSET_METHOD (cs) != CHARSET_METHOD_OFFSET
+ || CHARSET_CODE_OFFSET (cs) < 0x110000)
error ("Can't unify charset: %s", SDATA (SYMBOL_NAME (charset)));
if (NILP (unify_map))
unify_map = CHARSET_UNIFY_MAP (cs);
- if (STRINGP (unify_map))
- load_charset_map_from_file (cs, unify_map, 2);
- else if (VECTORP (unify_map))
- load_charset_map_from_vector (cs, unify_map, 2);
- else if (NILP (unify_map))
- error ("No unify-map for charset");
else
- error ("Bad unify-map arg");
+ {
+ if (! STRINGP (unify_map) && ! VECTORP (unify_map))
+ signal_error ("Bad unify-map", unify_map);
+ CHARSET_UNIFY_MAP (cs) = unify_map;
+ }
+ if (NILP (Vchar_unify_table))
+ Vchar_unify_table = Fmake_char_table (Qnil, Qnil);
+ char_table_set_range (Vchar_unify_table,
+ cs->min_char, cs->max_char, charset);
CHARSET_UNIFIED_P (cs) = 1;
}
else if (CHAR_TABLE_P (Vchar_unify_table))
@@ -1485,6 +1657,41 @@ only `ascii', `eight-bit-control', and `eight-bit-graphic'. */)
+/* Return a unified character code for C (>= 0x110000). VAL is a
+ value of Vchar_unify_table for C; i.e. it is nil, an integer, or a
+ charset symbol. */
+int
+maybe_unify_char (c, val)
+ int c;
+ Lisp_Object val;
+{
+ struct charset *charset;
+
+ if (INTEGERP (val))
+ return XINT (val);
+ if (NILP (val))
+ return c;
+
+ CHECK_CHARSET_GET_CHARSET (val, charset);
+ load_charset (charset, 1);
+ if (! inhibit_load_charset_map)
+ {
+ val = CHAR_TABLE_REF (Vchar_unify_table, c);
+ if (! NILP (val))
+ c = XINT (val);
+ }
+ else
+ {
+ int code_index = c - CHARSET_CODE_OFFSET (charset);
+ int unified = GET_TEMP_CHARSET_WORK_DECODER (code_index);
+
+ if (unified > 0)
+ c = unified;
+ }
+ return c;
+}
+
+
/* Return a character correponding to the code-point CODE of
CHARSET. */
@@ -1499,12 +1706,6 @@ decode_char (charset, code)
if (code < CHARSET_MIN_CODE (charset) || code > CHARSET_MAX_CODE (charset))
return -1;
- if (method == CHARSET_METHOD_MAP_DEFERRED)
- {
- load_charset (charset);
- method = CHARSET_METHOD (charset);
- }
-
if (method == CHARSET_METHOD_SUBSET)
{
Lisp_Object subset_info;
@@ -1547,21 +1748,24 @@ decode_char (charset, code)
decoder = CHARSET_DECODER (charset);
if (! VECTORP (decoder))
- return -1;
- c = XINT (AREF (decoder, char_index));
+ {
+ load_charset (charset, 1);
+ decoder = CHARSET_DECODER (charset);
+ }
+ if (VECTORP (decoder))
+ c = XINT (AREF (decoder, char_index));
+ else
+ c = GET_TEMP_CHARSET_WORK_DECODER (char_index);
}
- else
+ else /* method == CHARSET_METHOD_OFFSET */
{
c = char_index + CHARSET_CODE_OFFSET (charset);
+ if (CHARSET_UNIFIED_P (charset)
+ && c > MAX_UNICODE_CHAR)
+ MAYBE_UNIFY_CHAR (c);
}
}
- if (CHARSET_UNIFIED_P (charset)
- && c >= 0)
- {
- MAYBE_UNIFY_CHAR (c);
- }
-
return c;
}
@@ -1583,16 +1787,27 @@ encode_char (charset, c)
if (CHARSET_UNIFIED_P (charset))
{
Lisp_Object deunifier, deunified;
+ int code_index = -1;
deunifier = CHARSET_DEUNIFIER (charset);
if (! CHAR_TABLE_P (deunifier))
{
- Funify_charset (CHARSET_NAME (charset), Qnil, Qnil);
+ load_charset (charset, 2);
deunifier = CHARSET_DEUNIFIER (charset);
}
- deunified = CHAR_TABLE_REF (deunifier, c);
- if (! NILP (deunified))
- c = XINT (deunified);
+ if (CHAR_TABLE_P (deunifier))
+ {
+ Lisp_Object deunified = CHAR_TABLE_REF (deunifier, c);
+
+ if (INTEGERP (deunified))
+ code_index = XINT (deunified);
+ }
+ else
+ {
+ code_index = GET_TEMP_CHARSET_WORK_ENCODER (c);
+ }
+ if (code_index >= 0)
+ c = CHARSET_CODE_OFFSET (charset) + code_index;
}
if (method == CHARSET_METHOD_SUBSET)
@@ -1633,12 +1848,6 @@ encode_char (charset, c)
|| c < CHARSET_MIN_CHAR (charset) || c > CHARSET_MAX_CHAR (charset))
return CHARSET_INVALID_CODE (charset);
- if (method == CHARSET_METHOD_MAP_DEFERRED)
- {
- load_charset (charset);
- method = CHARSET_METHOD (charset);
- }
-
if (method == CHARSET_METHOD_MAP)
{
Lisp_Object encoder;
@@ -1646,18 +1855,27 @@ encode_char (charset, c)
encoder = CHARSET_ENCODER (charset);
if (! CHAR_TABLE_P (CHARSET_ENCODER (charset)))
- return CHARSET_INVALID_CODE (charset);
- val = CHAR_TABLE_REF (encoder, c);
- if (NILP (val))
- return CHARSET_INVALID_CODE (charset);
- code = XINT (val);
- if (! CHARSET_COMPACT_CODES_P (charset))
- code = INDEX_TO_CODE_POINT (charset, code);
+ load_charset (charset);
+ if (CHAR_TABLE_P (CHARSET_ENCODER (charset)))
+ {
+ val = CHAR_TABLE_REF (encoder, c);
+ if (NILP (val))
+ return CHARSET_INVALID_CODE (charset);
+ code = XINT (val);
+ if (! CHARSET_COMPACT_CODES_P (charset))
+ code = INDEX_TO_CODE_POINT (charset, code);
+ }
+ else
+ {
+ code = GET_TEMP_CHARSET_WORK_ENCODER (c);
+ code = INDEX_TO_CODE_POINT (charset, code);
+ }
}
else /* method == CHARSET_METHOD_OFFSET */
{
- code = c - CHARSET_CODE_OFFSET (charset);
- code = INDEX_TO_CODE_POINT (charset, code);
+ int code_index = c - CHARSET_CODE_OFFSET (charset);
+
+ code = INDEX_TO_CODE_POINT (charset, code_index);
}
return code;
@@ -1932,35 +2150,23 @@ DIMENSION, CHARS, and FINAL-CHAR. */)
DEFUN ("clear-charset-maps", Fclear_charset_maps, Sclear_charset_maps,
0, 0, 0,
doc: /*
-Clear encoder and decoder of charsets that are loaded from mapfiles. */)
+Internal use only.
+Clear temporary charset mapping tables.
+It should be called only from temacs invoked for dumping. */)
()
{
int i;
struct charset *charset;
Lisp_Object attrs;
- for (i = 0; i < charset_table_used; i++)
+ if (temp_charset_work)
{
- charset = CHARSET_FROM_ID (i);
- attrs = CHARSET_ATTRIBUTES (charset);
-
- if (CHARSET_METHOD (charset) == CHARSET_METHOD_MAP)
- {
- CHARSET_ATTR_DECODER (attrs) = Qnil;
- CHARSET_ATTR_ENCODER (attrs) = Qnil;
- CHARSET_METHOD (charset) = CHARSET_METHOD_MAP_DEFERRED;
- }
-
- if (CHARSET_UNIFIED_P (charset))
- CHARSET_ATTR_DEUNIFIER (attrs) = Qnil;
+ free (temp_charset_work);
+ temp_charset_work = NULL;
}
- if (CHAR_TABLE_P (Vchar_unified_charset_table))
- {
- Foptimize_char_table (Vchar_unified_charset_table, Qnil);
- Vchar_unify_table = Vchar_unified_charset_table;
- Vchar_unified_charset_table = Qnil;
- }
+ if (CHAR_TABLE_P (Vchar_unify_table))
+ Foptimize_char_table (Vchar_unify_table, Qnil);
return Qnil;
}
@@ -2124,9 +2330,6 @@ syms_of_charset ()
xmalloc (sizeof (struct charset) * charset_table_size));
charset_table_used = 0;
- staticpro (&Vchar_unified_charset_table);
- Vchar_unified_charset_table = Fmake_char_table (Qnil, make_number (-1));
-
defsubr (&Scharsetp);
defsubr (&Smap_charset_chars);
defsubr (&Sdefine_charset_internal);
@@ -2154,6 +2357,10 @@ syms_of_charset ()
doc: /* *List of directories to search for charset map files. */);
Vcharset_map_path = Qnil;
+ DEFVAR_BOOL ("inhibit-load-charset-map", &inhibit_load_charset_map,
+ doc: /* Inhibit loading of charset maps. Used when dumping Emacs. */);
+ inhibit_load_charset_map = 0;
+
DEFVAR_LISP ("charset-list", &Vcharset_list,
doc: /* List of all charsets ever defined. */);
Vcharset_list = Qnil;