1 /* chartab.c -- char-table support
2 Copyright (C) 2003, 2004, 2005, 2006, 2007, 2008, 2009, 2010, 2011
3 National Institute of Advanced Industrial Science and Technology (AIST)
4 Registration Number H13PRO009
6 This file is part of GNU Emacs.
8 GNU Emacs is free software: you can redistribute it and/or modify
9 it under the terms of the GNU General Public License as published by
10 the Free Software Foundation, either version 3 of the License, or
11 (at your option) any later version.
13 GNU Emacs is distributed in the hope that it will be useful,
14 but WITHOUT ANY WARRANTY; without even the implied warranty of
15 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
16 GNU General Public License for more details.
18 You should have received a copy of the GNU General Public License
19 along with GNU Emacs. If not, see <http://www.gnu.org/licenses/>. */
24 #include "character.h"
30 /* Number of elements in Nth level char-table. */
31 const int chartab_size
[4] =
32 { (1 << CHARTAB_SIZE_BITS_0
),
33 (1 << CHARTAB_SIZE_BITS_1
),
34 (1 << CHARTAB_SIZE_BITS_2
),
35 (1 << CHARTAB_SIZE_BITS_3
) };
37 /* Number of characters each element of Nth level char-table
39 static const int chartab_chars
[4] =
40 { (1 << (CHARTAB_SIZE_BITS_1
+ CHARTAB_SIZE_BITS_2
+ CHARTAB_SIZE_BITS_3
)),
41 (1 << (CHARTAB_SIZE_BITS_2
+ CHARTAB_SIZE_BITS_3
)),
42 (1 << CHARTAB_SIZE_BITS_3
),
45 /* Number of characters (in bits) each element of Nth level char-table
47 static const int chartab_bits
[4] =
48 { (CHARTAB_SIZE_BITS_1
+ CHARTAB_SIZE_BITS_2
+ CHARTAB_SIZE_BITS_3
),
49 (CHARTAB_SIZE_BITS_2
+ CHARTAB_SIZE_BITS_3
),
/* Index of the element that covers character C in a (sub) char-table
   of depth DEPTH whose first character is MIN_CHAR.  */
#define CHARTAB_IDX(C, DEPTH, MIN_CHAR)	\
  (((C) - (MIN_CHAR)) >> chartab_bits[(DEPTH)])
57 /* Preamble for uniprop (Unicode character property) tables. See the
58 comment of "Unicode character property tables". */
60 /* Purpose of uniprop tables. */
61 static Lisp_Object Qchar_code_property_table
;
63 /* Types of decoder and encoder functions for uniprop values. */
64 typedef Lisp_Object (*uniprop_decoder_t
) (Lisp_Object
, Lisp_Object
);
65 typedef Lisp_Object (*uniprop_encoder_t
) (Lisp_Object
, Lisp_Object
);
67 static Lisp_Object
uniprop_table_uncompress (Lisp_Object
, int);
68 static uniprop_decoder_t
uniprop_get_decoder (Lisp_Object
);
/* Nonzero iff char-table TABLE is a uniprop table, i.e. its purpose
   is `char-code-property-table' and it has exactly 5 extra slots.
   TABLE is evaluated twice.  */
#define UNIPROP_TABLE_P(TABLE)						\
  (EQ (XCHAR_TABLE (TABLE)->purpose, Qchar_code_property_table)	\
   && CHAR_TABLE_EXTRA_SLOTS (XCHAR_TABLE (TABLE)) == 5)
/* Return the decoder for values stored in TABLE, or NULL when TABLE is
   not a uniprop table.  */
#define UNIPROP_GET_DECODER(TABLE)	\
  (! UNIPROP_TABLE_P (TABLE) ? NULL : uniprop_get_decoder (TABLE))
/* Nonzero iff OBJ is a string that represents, in a compressed
   format, the uniprop values of 128 succeeding characters (the bottom
   level of a char-table).  Such a string is non-empty and starts with
   the character '\001' or '\002'; we are sure that no property value
   is a string starting with either of them.  */
#define UNIPROP_COMPRESSED_FORM_P(OBJ)		\
  (STRINGP (OBJ)				\
   && SCHARS (OBJ) > 0				\
   && (SREF (OBJ, 0) == 1 || SREF (OBJ, 0) == 2))
88 DEFUN ("make-char-table", Fmake_char_table
, Smake_char_table
, 1, 2, 0,
89 doc
: /* Return a newly created char-table, with purpose PURPOSE.
90 Each element is initialized to INIT, which defaults to nil.
92 PURPOSE should be a symbol. If it has a `char-table-extra-slots'
93 property, the property's value should be an integer between 0 and 10
94 that specifies how many extra slots the char-table has. Otherwise,
95 the char-table has no extra slot. */)
96 (register Lisp_Object purpose
, Lisp_Object init
)
103 CHECK_SYMBOL (purpose
);
104 n
= Fget (purpose
, Qchar_table_extra_slots
);
111 args_out_of_range (n
, Qnil
);
115 size
= VECSIZE (struct Lisp_Char_Table
) - 1 + n_extras
;
116 vector
= Fmake_vector (make_number (size
), init
);
117 XSETPVECTYPE (XVECTOR (vector
), PVEC_CHAR_TABLE
);
118 set_char_table_parent (vector
, Qnil
);
119 set_char_table_purpose (vector
, purpose
);
120 XSETCHAR_TABLE (vector
, XCHAR_TABLE (vector
));
125 make_sub_char_table (int depth
, int min_char
, Lisp_Object defalt
)
128 int size
= VECSIZE (struct Lisp_Sub_Char_Table
) - 1 + chartab_size
[depth
];
130 table
= Fmake_vector (make_number (size
), defalt
);
131 XSETPVECTYPE (XVECTOR (table
), PVEC_SUB_CHAR_TABLE
);
132 XSUB_CHAR_TABLE (table
)->depth
= make_number (depth
);
133 XSUB_CHAR_TABLE (table
)->min_char
= make_number (min_char
);
139 char_table_ascii (Lisp_Object table
)
141 Lisp_Object sub
, val
;
143 sub
= XCHAR_TABLE (table
)->contents
[0];
144 if (! SUB_CHAR_TABLE_P (sub
))
146 sub
= XSUB_CHAR_TABLE (sub
)->contents
[0];
147 if (! SUB_CHAR_TABLE_P (sub
))
149 val
= XSUB_CHAR_TABLE (sub
)->contents
[0];
150 if (UNIPROP_TABLE_P (table
) && UNIPROP_COMPRESSED_FORM_P (val
))
151 val
= uniprop_table_uncompress (sub
, 0);
156 copy_sub_char_table (Lisp_Object table
)
158 int depth
= XINT (XSUB_CHAR_TABLE (table
)->depth
);
159 int min_char
= XINT (XSUB_CHAR_TABLE (table
)->min_char
);
160 Lisp_Object copy
= make_sub_char_table (depth
, min_char
, Qnil
);
163 /* Recursively copy any sub char-tables. */
164 for (i
= 0; i
< chartab_size
[depth
]; i
++)
166 Lisp_Object val
= XSUB_CHAR_TABLE (table
)->contents
[i
];
167 set_sub_char_table_contents
168 (copy
, i
, SUB_CHAR_TABLE_P (val
) ? copy_sub_char_table (val
) : val
);
176 copy_char_table (Lisp_Object table
)
179 int size
= XCHAR_TABLE (table
)->header
.size
& PSEUDOVECTOR_SIZE_MASK
;
182 copy
= Fmake_vector (make_number (size
), Qnil
);
183 XSETPVECTYPE (XVECTOR (copy
), PVEC_CHAR_TABLE
);
184 set_char_table_defalt (copy
, XCHAR_TABLE (table
)->defalt
);
185 set_char_table_parent (copy
, XCHAR_TABLE (table
)->parent
);
186 set_char_table_purpose (copy
, XCHAR_TABLE (table
)->purpose
);
187 for (i
= 0; i
< chartab_size
[0]; i
++)
188 set_char_table_contents
190 (SUB_CHAR_TABLE_P (XCHAR_TABLE (table
)->contents
[i
])
191 ? copy_sub_char_table (XCHAR_TABLE (table
)->contents
[i
])
192 : XCHAR_TABLE (table
)->contents
[i
]));
193 set_char_table_ascii (copy
, char_table_ascii (copy
));
194 size
-= VECSIZE (struct Lisp_Char_Table
) - 1;
195 for (i
= 0; i
< size
; i
++)
196 set_char_table_extras (copy
, i
, XCHAR_TABLE (table
)->extras
[i
]);
198 XSETCHAR_TABLE (copy
, XCHAR_TABLE (copy
));
203 sub_char_table_ref (Lisp_Object table
, int c
, bool is_uniprop
)
205 struct Lisp_Sub_Char_Table
*tbl
= XSUB_CHAR_TABLE (table
);
206 int depth
= XINT (tbl
->depth
);
207 int min_char
= XINT (tbl
->min_char
);
209 int idx
= CHARTAB_IDX (c
, depth
, min_char
);
211 val
= tbl
->contents
[idx
];
212 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (val
))
213 val
= uniprop_table_uncompress (table
, idx
);
214 if (SUB_CHAR_TABLE_P (val
))
215 val
= sub_char_table_ref (val
, c
, is_uniprop
);
220 char_table_ref (Lisp_Object table
, int c
)
222 struct Lisp_Char_Table
*tbl
= XCHAR_TABLE (table
);
225 if (ASCII_CHAR_P (c
))
228 if (SUB_CHAR_TABLE_P (val
))
229 val
= XSUB_CHAR_TABLE (val
)->contents
[c
];
233 val
= tbl
->contents
[CHARTAB_IDX (c
, 0, 0)];
234 if (SUB_CHAR_TABLE_P (val
))
235 val
= sub_char_table_ref (val
, c
, UNIPROP_TABLE_P (table
));
240 if (NILP (val
) && CHAR_TABLE_P (tbl
->parent
))
241 val
= char_table_ref (tbl
->parent
, c
);
247 sub_char_table_ref_and_range (Lisp_Object table
, int c
, int *from
, int *to
,
248 Lisp_Object defalt
, bool is_uniprop
)
250 struct Lisp_Sub_Char_Table
*tbl
= XSUB_CHAR_TABLE (table
);
251 int depth
= XINT (tbl
->depth
);
252 int min_char
= XINT (tbl
->min_char
);
253 int chartab_idx
= CHARTAB_IDX (c
, depth
, min_char
), idx
;
256 val
= tbl
->contents
[chartab_idx
];
257 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (val
))
258 val
= uniprop_table_uncompress (table
, chartab_idx
);
259 if (SUB_CHAR_TABLE_P (val
))
260 val
= sub_char_table_ref_and_range (val
, c
, from
, to
, defalt
, is_uniprop
);
265 while (idx
> 0 && *from
< min_char
+ idx
* chartab_chars
[depth
])
267 Lisp_Object this_val
;
269 c
= min_char
+ idx
* chartab_chars
[depth
] - 1;
271 this_val
= tbl
->contents
[idx
];
272 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (this_val
))
273 this_val
= uniprop_table_uncompress (table
, idx
);
274 if (SUB_CHAR_TABLE_P (this_val
))
275 this_val
= sub_char_table_ref_and_range (this_val
, c
, from
, to
, defalt
,
277 else if (NILP (this_val
))
280 if (! EQ (this_val
, val
))
286 while (((c
= (chartab_idx
+ 1) * chartab_chars
[depth
])
287 < chartab_chars
[depth
- 1])
288 && (c
+= min_char
) <= *to
)
290 Lisp_Object this_val
;
293 this_val
= tbl
->contents
[chartab_idx
];
294 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (this_val
))
295 this_val
= uniprop_table_uncompress (table
, chartab_idx
);
296 if (SUB_CHAR_TABLE_P (this_val
))
297 this_val
= sub_char_table_ref_and_range (this_val
, c
, from
, to
, defalt
,
299 else if (NILP (this_val
))
301 if (! EQ (this_val
, val
))
312 /* Return the value for C in char-table TABLE. Shrink the range *FROM
313 and *TO to cover characters (containing C) that have the same value
314 as C. It is not assured that the values of (*FROM - 1) and (*TO +
315 1) are different from that of C. */
318 char_table_ref_and_range (Lisp_Object table
, int c
, int *from
, int *to
)
320 struct Lisp_Char_Table
*tbl
= XCHAR_TABLE (table
);
321 int chartab_idx
= CHARTAB_IDX (c
, 0, 0), idx
;
323 bool is_uniprop
= UNIPROP_TABLE_P (table
);
325 val
= tbl
->contents
[chartab_idx
];
330 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (val
))
331 val
= uniprop_table_uncompress (table
, chartab_idx
);
332 if (SUB_CHAR_TABLE_P (val
))
333 val
= sub_char_table_ref_and_range (val
, c
, from
, to
, tbl
->defalt
,
338 while (*from
< idx
* chartab_chars
[0])
340 Lisp_Object this_val
;
342 c
= idx
* chartab_chars
[0] - 1;
344 this_val
= tbl
->contents
[idx
];
345 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (this_val
))
346 this_val
= uniprop_table_uncompress (table
, idx
);
347 if (SUB_CHAR_TABLE_P (this_val
))
348 this_val
= sub_char_table_ref_and_range (this_val
, c
, from
, to
,
349 tbl
->defalt
, is_uniprop
);
350 else if (NILP (this_val
))
351 this_val
= tbl
->defalt
;
353 if (! EQ (this_val
, val
))
359 while (*to
>= (chartab_idx
+ 1) * chartab_chars
[0])
361 Lisp_Object this_val
;
364 c
= chartab_idx
* chartab_chars
[0];
365 this_val
= tbl
->contents
[chartab_idx
];
366 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (this_val
))
367 this_val
= uniprop_table_uncompress (table
, chartab_idx
);
368 if (SUB_CHAR_TABLE_P (this_val
))
369 this_val
= sub_char_table_ref_and_range (this_val
, c
, from
, to
,
370 tbl
->defalt
, is_uniprop
);
371 else if (NILP (this_val
))
372 this_val
= tbl
->defalt
;
373 if (! EQ (this_val
, val
))
385 sub_char_table_set (Lisp_Object table
, int c
, Lisp_Object val
, bool is_uniprop
)
387 struct Lisp_Sub_Char_Table
*tbl
= XSUB_CHAR_TABLE (table
);
388 int depth
= XINT ((tbl
)->depth
);
389 int min_char
= XINT ((tbl
)->min_char
);
390 int i
= CHARTAB_IDX (c
, depth
, min_char
);
394 set_sub_char_table_contents (table
, i
, val
);
397 sub
= tbl
->contents
[i
];
398 if (! SUB_CHAR_TABLE_P (sub
))
400 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (sub
))
401 sub
= uniprop_table_uncompress (table
, i
);
404 sub
= make_sub_char_table (depth
+ 1,
405 min_char
+ i
* chartab_chars
[depth
],
407 set_sub_char_table_contents (table
, i
, sub
);
410 sub_char_table_set (sub
, c
, val
, is_uniprop
);
415 char_table_set (Lisp_Object table
, int c
, Lisp_Object val
)
417 struct Lisp_Char_Table
*tbl
= XCHAR_TABLE (table
);
420 && SUB_CHAR_TABLE_P (tbl
->ascii
))
421 set_sub_char_table_contents (tbl
->ascii
, c
, val
);
424 int i
= CHARTAB_IDX (c
, 0, 0);
427 sub
= tbl
->contents
[i
];
428 if (! SUB_CHAR_TABLE_P (sub
))
430 sub
= make_sub_char_table (1, i
* chartab_chars
[0], sub
);
431 set_char_table_contents (table
, i
, sub
);
433 sub_char_table_set (sub
, c
, val
, UNIPROP_TABLE_P (table
));
434 if (ASCII_CHAR_P (c
))
435 set_char_table_ascii (table
, char_table_ascii (table
));
440 sub_char_table_set_range (Lisp_Object table
, int from
, int to
, Lisp_Object val
,
443 struct Lisp_Sub_Char_Table
*tbl
= XSUB_CHAR_TABLE (table
);
444 int depth
= XINT ((tbl
)->depth
);
445 int min_char
= XINT ((tbl
)->min_char
);
446 int chars_in_block
= chartab_chars
[depth
];
447 int i
, c
, lim
= chartab_size
[depth
];
451 i
= CHARTAB_IDX (from
, depth
, min_char
);
452 c
= min_char
+ chars_in_block
* i
;
453 for (; i
< lim
; i
++, c
+= chars_in_block
)
457 if (from
<= c
&& c
+ chars_in_block
- 1 <= to
)
458 set_sub_char_table_contents (table
, i
, val
);
461 Lisp_Object sub
= tbl
->contents
[i
];
462 if (! SUB_CHAR_TABLE_P (sub
))
464 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (sub
))
465 sub
= uniprop_table_uncompress (table
, i
);
468 sub
= make_sub_char_table (depth
+ 1, c
, sub
);
469 set_sub_char_table_contents (table
, i
, sub
);
472 sub_char_table_set_range (sub
, from
, to
, val
, is_uniprop
);
479 char_table_set_range (Lisp_Object table
, int from
, int to
, Lisp_Object val
)
481 struct Lisp_Char_Table
*tbl
= XCHAR_TABLE (table
);
484 char_table_set (table
, from
, val
);
487 bool is_uniprop
= UNIPROP_TABLE_P (table
);
488 int lim
= CHARTAB_IDX (to
, 0, 0);
491 for (i
= CHARTAB_IDX (from
, 0, 0), c
= 0; i
<= lim
;
492 i
++, c
+= chartab_chars
[0])
496 if (from
<= c
&& c
+ chartab_chars
[0] - 1 <= to
)
497 set_char_table_contents (table
, i
, val
);
500 Lisp_Object sub
= tbl
->contents
[i
];
501 if (! SUB_CHAR_TABLE_P (sub
))
503 sub
= make_sub_char_table (1, i
* chartab_chars
[0], sub
);
504 set_char_table_contents (table
, i
, sub
);
506 sub_char_table_set_range (sub
, from
, to
, val
, is_uniprop
);
509 if (ASCII_CHAR_P (from
))
510 set_char_table_ascii (table
, char_table_ascii (table
));
515 DEFUN ("char-table-subtype", Fchar_table_subtype
, Schar_table_subtype
,
518 Return the subtype of char-table CHAR-TABLE. The value is a symbol. */)
519 (Lisp_Object char_table
)
521 CHECK_CHAR_TABLE (char_table
);
523 return XCHAR_TABLE (char_table
)->purpose
;
526 DEFUN ("char-table-parent", Fchar_table_parent
, Schar_table_parent
,
528 doc
: /* Return the parent char-table of CHAR-TABLE.
529 The value is either nil or another char-table.
530 If CHAR-TABLE holds nil for a given character,
531 then the actual applicable value is inherited from the parent char-table
532 \(or from its parents, if necessary). */)
533 (Lisp_Object char_table
)
535 CHECK_CHAR_TABLE (char_table
);
537 return XCHAR_TABLE (char_table
)->parent
;
540 DEFUN ("set-char-table-parent", Fset_char_table_parent
, Sset_char_table_parent
,
542 doc
: /* Set the parent char-table of CHAR-TABLE to PARENT.
543 Return PARENT. PARENT must be either nil or another char-table. */)
544 (Lisp_Object char_table
, Lisp_Object parent
)
548 CHECK_CHAR_TABLE (char_table
);
552 CHECK_CHAR_TABLE (parent
);
554 for (temp
= parent
; !NILP (temp
); temp
= XCHAR_TABLE (temp
)->parent
)
555 if (EQ (temp
, char_table
))
556 error ("Attempt to make a chartable be its own parent");
559 set_char_table_parent (char_table
, parent
);
564 DEFUN ("char-table-extra-slot", Fchar_table_extra_slot
, Schar_table_extra_slot
,
566 doc
: /* Return the value of CHAR-TABLE's extra-slot number N. */)
567 (Lisp_Object char_table
, Lisp_Object n
)
569 CHECK_CHAR_TABLE (char_table
);
572 || XINT (n
) >= CHAR_TABLE_EXTRA_SLOTS (XCHAR_TABLE (char_table
)))
573 args_out_of_range (char_table
, n
);
575 return XCHAR_TABLE (char_table
)->extras
[XINT (n
)];
578 DEFUN ("set-char-table-extra-slot", Fset_char_table_extra_slot
,
579 Sset_char_table_extra_slot
,
581 doc
: /* Set CHAR-TABLE's extra-slot number N to VALUE. */)
582 (Lisp_Object char_table
, Lisp_Object n
, Lisp_Object value
)
584 CHECK_CHAR_TABLE (char_table
);
587 || XINT (n
) >= CHAR_TABLE_EXTRA_SLOTS (XCHAR_TABLE (char_table
)))
588 args_out_of_range (char_table
, n
);
590 set_char_table_extras (char_table
, XINT (n
), value
);
594 DEFUN ("char-table-range", Fchar_table_range
, Schar_table_range
,
596 doc
: /* Return the value in CHAR-TABLE for a range of characters RANGE.
597 RANGE should be nil (for the default value),
598 a cons of character codes (for characters in the range), or a character code. */)
599 (Lisp_Object char_table
, Lisp_Object range
)
602 CHECK_CHAR_TABLE (char_table
);
604 if (EQ (range
, Qnil
))
605 val
= XCHAR_TABLE (char_table
)->defalt
;
606 else if (CHARACTERP (range
))
607 val
= CHAR_TABLE_REF (char_table
, XFASTINT (range
));
608 else if (CONSP (range
))
612 CHECK_CHARACTER_CAR (range
);
613 CHECK_CHARACTER_CDR (range
);
614 from
= XFASTINT (XCAR (range
));
615 to
= XFASTINT (XCDR (range
));
616 val
= char_table_ref_and_range (char_table
, from
, &from
, &to
);
617 /* Not yet implemented. */
620 error ("Invalid RANGE argument to `char-table-range'");
624 DEFUN ("set-char-table-range", Fset_char_table_range
, Sset_char_table_range
,
626 doc
: /* Set the value in CHAR-TABLE for a range of characters RANGE to VALUE.
627 RANGE should be t (for all characters), nil (for the default value),
628 a cons of character codes (for characters in the range),
629 or a character code. Return VALUE. */)
630 (Lisp_Object char_table
, Lisp_Object range
, Lisp_Object value
)
632 CHECK_CHAR_TABLE (char_table
);
637 set_char_table_ascii (char_table
, value
);
638 for (i
= 0; i
< chartab_size
[0]; i
++)
639 set_char_table_contents (char_table
, i
, value
);
641 else if (EQ (range
, Qnil
))
642 set_char_table_defalt (char_table
, value
);
643 else if (CHARACTERP (range
))
644 char_table_set (char_table
, XINT (range
), value
);
645 else if (CONSP (range
))
647 CHECK_CHARACTER_CAR (range
);
648 CHECK_CHARACTER_CDR (range
);
649 char_table_set_range (char_table
,
650 XINT (XCAR (range
)), XINT (XCDR (range
)), value
);
653 error ("Invalid RANGE argument to `set-char-table-range'");
658 DEFUN ("set-char-table-default", Fset_char_table_default
,
659 Sset_char_table_default
, 3, 3, 0,
661 This function is obsolete and has no effect. */)
662 (Lisp_Object char_table
, Lisp_Object ch
, Lisp_Object value
)
667 /* Look up the element in TABLE at index CH, and return it as an
668 integer. If the element is not a character, return CH itself. */
671 char_table_translate (Lisp_Object table
, int ch
)
674 value
= Faref (table
, make_number (ch
));
675 if (! CHARACTERP (value
))
681 optimize_sub_char_table (Lisp_Object table
, Lisp_Object test
)
683 struct Lisp_Sub_Char_Table
*tbl
= XSUB_CHAR_TABLE (table
);
684 int depth
= XINT (tbl
->depth
);
685 Lisp_Object elt
, this;
689 elt
= XSUB_CHAR_TABLE (table
)->contents
[0];
690 if (SUB_CHAR_TABLE_P (elt
))
692 elt
= optimize_sub_char_table (elt
, test
);
693 set_sub_char_table_contents (table
, 0, elt
);
695 optimizable
= SUB_CHAR_TABLE_P (elt
) ? 0 : 1;
696 for (i
= 1; i
< chartab_size
[depth
]; i
++)
698 this = XSUB_CHAR_TABLE (table
)->contents
[i
];
699 if (SUB_CHAR_TABLE_P (this))
701 this = optimize_sub_char_table (this, test
);
702 set_sub_char_table_contents (table
, i
, this);
705 && (NILP (test
) ? NILP (Fequal (this, elt
)) /* defaults to `equal'. */
706 : EQ (test
, Qeq
) ? !EQ (this, elt
) /* Optimize `eq' case. */
707 : NILP (call2 (test
, this, elt
))))
711 return (optimizable
? elt
: table
);
714 DEFUN ("optimize-char-table", Foptimize_char_table
, Soptimize_char_table
,
716 doc
: /* Optimize CHAR-TABLE.
717 TEST is the comparison function used to decide whether two entries are
718 equivalent and can be merged. It defaults to `equal'. */)
719 (Lisp_Object char_table
, Lisp_Object test
)
724 CHECK_CHAR_TABLE (char_table
);
726 for (i
= 0; i
< chartab_size
[0]; i
++)
728 elt
= XCHAR_TABLE (char_table
)->contents
[i
];
729 if (SUB_CHAR_TABLE_P (elt
))
730 set_char_table_contents
731 (char_table
, i
, optimize_sub_char_table (elt
, test
));
733 /* Reset the `ascii' cache, in case it got optimized away. */
734 set_char_table_ascii (char_table
, char_table_ascii (char_table
));
/* Map C_FUNCTION or FUNCTION over TABLE (top or sub char-table),
   calling it for each character or group of characters that share a
   value.  RANGE is a cons (FROM . TO) specifying the range of target
   characters, VAL is a value of FROM in TABLE, TOP is the top
   char-table.

   ARG is passed to C_FUNCTION when that is called.

   It returns the value of the last character covered by TABLE (not the
   value inherited from the parent), and by side-effect, the car part
   of RANGE is updated to the minimum character C where C and all the
   following characters in TABLE have the same value.  */
754 map_sub_char_table (void (*c_function
) (Lisp_Object
, Lisp_Object
, Lisp_Object
),
755 Lisp_Object function
, Lisp_Object table
, Lisp_Object arg
, Lisp_Object val
,
756 Lisp_Object range
, Lisp_Object top
)
758 /* Depth of TABLE. */
760 /* Minimum and maximum characters covered by TABLE. */
761 int min_char
, max_char
;
762 /* Number of characters covered by one element of TABLE. */
764 int from
= XINT (XCAR (range
)), to
= XINT (XCDR (range
));
766 bool is_uniprop
= UNIPROP_TABLE_P (top
);
767 uniprop_decoder_t decoder
= UNIPROP_GET_DECODER (top
);
769 if (SUB_CHAR_TABLE_P (table
))
771 struct Lisp_Sub_Char_Table
*tbl
= XSUB_CHAR_TABLE (table
);
773 depth
= XINT (tbl
->depth
);
774 min_char
= XINT (tbl
->min_char
);
775 max_char
= min_char
+ chartab_chars
[depth
- 1] - 1;
783 chars_in_block
= chartab_chars
[depth
];
787 /* Set I to the index of the first element to check. */
788 if (from
<= min_char
)
791 i
= (from
- min_char
) / chars_in_block
;
792 for (c
= min_char
+ chars_in_block
* i
; c
<= max_char
;
793 i
++, c
+= chars_in_block
)
795 Lisp_Object
this = (SUB_CHAR_TABLE_P (table
)
796 ? XSUB_CHAR_TABLE (table
)->contents
[i
]
797 : XCHAR_TABLE (table
)->contents
[i
]);
798 int nextc
= c
+ chars_in_block
;
800 if (is_uniprop
&& UNIPROP_COMPRESSED_FORM_P (this))
801 this = uniprop_table_uncompress (table
, i
);
802 if (SUB_CHAR_TABLE_P (this))
805 XSETCDR (range
, make_number (nextc
- 1));
806 val
= map_sub_char_table (c_function
, function
, this, arg
,
812 this = XCHAR_TABLE (top
)->defalt
;
815 bool different_value
= 1;
819 if (! NILP (XCHAR_TABLE (top
)->parent
))
821 Lisp_Object parent
= XCHAR_TABLE (top
)->parent
;
822 Lisp_Object temp
= XCHAR_TABLE (parent
)->parent
;
824 /* This is to get a value of FROM in PARENT
825 without checking the parent of PARENT. */
826 set_char_table_parent (parent
, Qnil
);
827 val
= CHAR_TABLE_REF (parent
, from
);
828 set_char_table_parent (parent
, temp
);
829 XSETCDR (range
, make_number (c
- 1));
830 val
= map_sub_char_table (c_function
, function
,
831 parent
, arg
, val
, range
,
837 if (! NILP (val
) && different_value
)
839 XSETCDR (range
, make_number (c
- 1));
840 if (EQ (XCAR (range
), XCDR (range
)))
843 (*c_function
) (arg
, XCAR (range
), val
);
847 val
= decoder (top
, val
);
848 call2 (function
, XCAR (range
), val
);
854 (*c_function
) (arg
, range
, val
);
858 val
= decoder (top
, val
);
859 call2 (function
, range
, val
);
865 XSETCAR (range
, make_number (c
));
868 XSETCDR (range
, make_number (to
));
874 /* Map C_FUNCTION or FUNCTION over TABLE, calling it for each
875 character or group of characters that share a value.
877 ARG is passed to C_FUNCTION when that is called. */
880 map_char_table (void (*c_function
) (Lisp_Object
, Lisp_Object
, Lisp_Object
),
881 Lisp_Object function
, Lisp_Object table
, Lisp_Object arg
)
883 Lisp_Object range
, val
, parent
;
884 struct gcpro gcpro1
, gcpro2
, gcpro3
, gcpro4
;
885 uniprop_decoder_t decoder
= UNIPROP_GET_DECODER (table
);
887 range
= Fcons (make_number (0), make_number (MAX_CHAR
));
888 parent
= XCHAR_TABLE (table
)->parent
;
890 GCPRO4 (table
, arg
, range
, parent
);
891 val
= XCHAR_TABLE (table
)->ascii
;
892 if (SUB_CHAR_TABLE_P (val
))
893 val
= XSUB_CHAR_TABLE (val
)->contents
[0];
894 val
= map_sub_char_table (c_function
, function
, table
, arg
, val
, range
,
897 /* If VAL is nil and TABLE has a parent, we must consult the parent
899 while (NILP (val
) && ! NILP (XCHAR_TABLE (table
)->parent
))
902 int from
= XINT (XCAR (range
));
904 parent
= XCHAR_TABLE (table
)->parent
;
905 temp
= XCHAR_TABLE (parent
)->parent
;
906 /* This is to get a value of FROM in PARENT without checking the
908 set_char_table_parent (parent
, Qnil
);
909 val
= CHAR_TABLE_REF (parent
, from
);
910 set_char_table_parent (parent
, temp
);
911 val
= map_sub_char_table (c_function
, function
, parent
, arg
, val
, range
,
918 if (EQ (XCAR (range
), XCDR (range
)))
921 (*c_function
) (arg
, XCAR (range
), val
);
925 val
= decoder (table
, val
);
926 call2 (function
, XCAR (range
), val
);
932 (*c_function
) (arg
, range
, val
);
936 val
= decoder (table
, val
);
937 call2 (function
, range
, val
);
945 DEFUN ("map-char-table", Fmap_char_table
, Smap_char_table
,
947 doc
: /* Call FUNCTION for each character in CHAR-TABLE that has non-nil value.
948 FUNCTION is called with two arguments, KEY and VALUE.
949 KEY is a character code or a cons of character codes specifying a
950 range of characters that have the same value.
951 VALUE is what (char-table-range CHAR-TABLE KEY) returns. */)
952 (Lisp_Object function
, Lisp_Object char_table
)
954 CHECK_CHAR_TABLE (char_table
);
956 map_char_table (NULL
, function
, char_table
, char_table
);
962 map_sub_char_table_for_charset (void (*c_function
) (Lisp_Object
, Lisp_Object
),
963 Lisp_Object function
, Lisp_Object table
, Lisp_Object arg
,
964 Lisp_Object range
, struct charset
*charset
,
965 unsigned from
, unsigned to
)
967 struct Lisp_Sub_Char_Table
*tbl
= XSUB_CHAR_TABLE (table
);
968 int depth
= XINT (tbl
->depth
);
972 for (i
= 0, c
= XINT (tbl
->min_char
); i
< chartab_size
[depth
];
973 i
++, c
+= chartab_chars
[depth
])
977 this = tbl
->contents
[i
];
978 if (SUB_CHAR_TABLE_P (this))
979 map_sub_char_table_for_charset (c_function
, function
, this, arg
,
980 range
, charset
, from
, to
);
983 if (! NILP (XCAR (range
)))
985 XSETCDR (range
, make_number (c
- 1));
987 (*c_function
) (arg
, range
);
989 call2 (function
, range
, arg
);
991 XSETCAR (range
, Qnil
);
995 for (i
= 0, c
= XINT (tbl
->min_char
); i
< chartab_size
[depth
]; i
++, c
++)
1000 this = tbl
->contents
[i
];
1003 && (code
= ENCODE_CHAR (charset
, c
),
1004 (code
< from
|| code
> to
))))
1006 if (! NILP (XCAR (range
)))
1008 XSETCDR (range
, make_number (c
- 1));
1010 (*c_function
) (arg
, range
);
1012 call2 (function
, range
, arg
);
1013 XSETCAR (range
, Qnil
);
1018 if (NILP (XCAR (range
)))
1019 XSETCAR (range
, make_number (c
));
/* Support function for `map-charset-chars'.  Map C_FUNCTION or
   FUNCTION over TABLE, calling it for each character or a group of
   succeeding characters that have non-nil value in TABLE.  TABLE is a
   "mapping table" or a "deunifier table" of a certain charset.

   If CHARSET is not NULL (this is the case when `map-charset-chars'
   is called with non-nil FROM-CODE and TO-CODE), it is the charset
   that owns TABLE, and the function is called only on characters in
   the range FROM to TO.  FROM and TO are not character codes, but
   code points of a character in CHARSET.

   This function is called in these two cases:

   (1) A charset has a mapping file name in :map property.

   (2) A charset has an upper code space in :offset property and a
   mapping file name in :unify-map property.  In this case, this
   function is called only for characters in the Unicode code space.
   Characters in upper code space are handled directly in
   map_charset_chars.  */
1047 map_char_table_for_charset (void (*c_function
) (Lisp_Object
, Lisp_Object
),
1048 Lisp_Object function
, Lisp_Object table
, Lisp_Object arg
,
1049 struct charset
*charset
,
1050 unsigned from
, unsigned to
)
1054 struct gcpro gcpro1
;
1056 range
= Fcons (Qnil
, Qnil
);
1059 for (i
= 0, c
= 0; i
< chartab_size
[0]; i
++, c
+= chartab_chars
[0])
1063 this = XCHAR_TABLE (table
)->contents
[i
];
1064 if (SUB_CHAR_TABLE_P (this))
1065 map_sub_char_table_for_charset (c_function
, function
, this, arg
,
1066 range
, charset
, from
, to
);
1069 if (! NILP (XCAR (range
)))
1071 XSETCDR (range
, make_number (c
- 1));
1073 (*c_function
) (arg
, range
);
1075 call2 (function
, range
, arg
);
1077 XSETCAR (range
, Qnil
);
1080 if (! NILP (XCAR (range
)))
1082 XSETCDR (range
, make_number (c
- 1));
1084 (*c_function
) (arg
, range
);
1086 call2 (function
, range
, arg
);
/* Unicode character property tables.

   This section provides a convenient and efficient way to get Unicode
   character properties of characters from C code (from Lisp, you must
   use get-char-code-property).

   The typical usage is to get a char-table object for a specific
   property like this (use of the "bidi-class" property below is just
   an example):

	Lisp_Object bidi_class_table = uniprop_table (intern ("bidi-class"));

   (uniprop_table can return nil if it fails to find data for the
   named property, or if it fails to load the appropriate Lisp support
   file, so the return value should be tested to be non-nil, before it
   is used.)

   To get a property value for character CH use CHAR_TABLE_REF:

	Lisp_Object bidi_class = CHAR_TABLE_REF (bidi_class_table, CH);

   In this case, what you actually get is an index number to the
   vector of property values (symbols nil, L, R, etc).

   The full list of Unicode character properties supported by Emacs is
   documented in the ELisp manual, in the node "Character Properties".

   A table for Unicode character property has these characteristics:

   o The purpose is `char-code-property-table', which implies that the
   table has 5 extra slots.

   o The second extra slot is a Lisp function, an index (integer) to
   the array uniprop_decoder[], or nil.  If it is a Lisp function, we
   can't use such a table from C (at the moment).  If it is nil, it
   means that we don't have to decode values.

   o The third extra slot is a Lisp function, an index (integer) to
   the array uniprop_encoder[], or nil.  If it is a Lisp function, we
   can't use such a table from C (at the moment).  If it is nil, it
   means that we don't have to encode values.  */
1136 /* Uncompress the IDXth element of sub-char-table TABLE. */
1139 uniprop_table_uncompress (Lisp_Object table
, int idx
)
1141 Lisp_Object val
= XSUB_CHAR_TABLE (table
)->contents
[idx
];
1142 int min_char
= (XINT (XSUB_CHAR_TABLE (table
)->min_char
)
1143 + chartab_chars
[2] * idx
);
1144 Lisp_Object sub
= make_sub_char_table (3, min_char
, Qnil
);
1145 const unsigned char *p
, *pend
;
1147 set_sub_char_table_contents (table
, idx
, sub
);
1148 p
= SDATA (val
), pend
= p
+ SBYTES (val
);
1153 idx
= STRING_CHAR_ADVANCE (p
);
1154 while (p
< pend
&& idx
< chartab_chars
[2])
1156 int v
= STRING_CHAR_ADVANCE (p
);
1157 set_sub_char_table_contents
1158 (sub
, idx
++, v
> 0 ? make_number (v
) : Qnil
);
1163 /* RUN-LENGTH TABLE */
1165 for (idx
= 0; p
< pend
; )
1167 int v
= STRING_CHAR_ADVANCE (p
);
1173 count
= STRING_CHAR_AND_LENGTH (p
, len
);
1183 set_sub_char_table_contents (sub
, idx
++, make_number (v
));
1186 /* It seems that we don't need this function because C code won't need
1187 to get a property that is compressed in this form. */
1191 /* WORD-LIST TABLE */
1198 /* Decode VALUE as an element of char-table TABLE. */
1201 uniprop_decode_value_run_length (Lisp_Object table
, Lisp_Object value
)
1203 if (VECTORP (XCHAR_TABLE (table
)->extras
[4]))
1205 Lisp_Object valvec
= XCHAR_TABLE (table
)->extras
[4];
1207 if (XINT (value
) >= 0 && XINT (value
) < ASIZE (valvec
))
1208 value
= AREF (valvec
, XINT (value
));
1213 static uniprop_decoder_t uniprop_decoder
[] =
1214 { uniprop_decode_value_run_length
};
1216 static int uniprop_decoder_count
1217 = (sizeof uniprop_decoder
) / sizeof (uniprop_decoder
[0]);
1220 /* Return the decoder of char-table TABLE or nil if none. */
1222 static uniprop_decoder_t
1223 uniprop_get_decoder (Lisp_Object table
)
1227 if (! INTEGERP (XCHAR_TABLE (table
)->extras
[1]))
1229 i
= XINT (XCHAR_TABLE (table
)->extras
[1]);
1230 if (i
< 0 || i
>= uniprop_decoder_count
)
1232 return uniprop_decoder
[i
];
1236 /* Encode VALUE as an element of char-table TABLE which contains
1237 characters as elements. */
1240 uniprop_encode_value_character (Lisp_Object table
, Lisp_Object value
)
1242 if (! NILP (value
) && ! CHARACTERP (value
))
1243 wrong_type_argument (Qintegerp
, value
);
1248 /* Encode VALUE as an element of char-table TABLE which adopts RUN-LENGTH
1252 uniprop_encode_value_run_length (Lisp_Object table
, Lisp_Object value
)
1254 Lisp_Object
*value_table
= XVECTOR (XCHAR_TABLE (table
)->extras
[4])->contents
;
1255 int i
, size
= ASIZE (XCHAR_TABLE (table
)->extras
[4]);
1257 for (i
= 0; i
< size
; i
++)
1258 if (EQ (value
, value_table
[i
]))
1261 wrong_type_argument (build_string ("Unicode property value"), value
);
1262 return make_number (i
);
1266 /* Encode VALUE as an element of char-table TABLE which adopts RUN-LENGTH
1267 compression and contains numbers as elements . */
1270 uniprop_encode_value_numeric (Lisp_Object table
, Lisp_Object value
)
1272 Lisp_Object
*value_table
= XVECTOR (XCHAR_TABLE (table
)->extras
[4])->contents
;
1273 int i
, size
= ASIZE (XCHAR_TABLE (table
)->extras
[4]);
1275 CHECK_NUMBER (value
);
1276 for (i
= 0; i
< size
; i
++)
1277 if (EQ (value
, value_table
[i
]))
1279 value
= make_number (i
);
1282 Lisp_Object args
[2];
1284 args
[0] = XCHAR_TABLE (table
)->extras
[4];
1285 args
[1] = Fmake_vector (make_number (1), value
);
1286 set_char_table_extras (table
, 4, Fvconcat (2, args
));
1288 return make_number (i
);
1291 static uniprop_encoder_t uniprop_encoder
[] =
1292 { uniprop_encode_value_character
,
1293 uniprop_encode_value_run_length
,
1294 uniprop_encode_value_numeric
};
1296 static int uniprop_encoder_count
1297 = (sizeof uniprop_encoder
) / sizeof (uniprop_encoder
[0]);
1300 /* Return the encoder of char-table TABLE or nil if none. */
1302 static uniprop_decoder_t
1303 uniprop_get_encoder (Lisp_Object table
)
1307 if (! INTEGERP (XCHAR_TABLE (table
)->extras
[2]))
1309 i
= XINT (XCHAR_TABLE (table
)->extras
[2]);
1310 if (i
< 0 || i
>= uniprop_encoder_count
)
1312 return uniprop_encoder
[i
];
/* NOTE(review): this listing omits several original lines of the
   function below (the embedded line numbers jump, e.g. 1324 -> 1328,
   1332 -> 1339 and 1344 -> 1347).  The statement that assigns `table',
   the remaining arguments of Fload, and every return statement are
   therefore not visible here; the added comments describe only what
   is shown.  */
1315 /* Return a char-table for Unicode character property PROP. This
1316 function may load a Lisp file and thus may cause
1317 garbage-collection. */
1320 uniprop_table (Lisp_Object prop
)
1322 Lisp_Object val
, table
, result
;
/* Look PROP up in the alist of (PROP . TABLE) entries.  */
1324 val
= Fassq (prop
, Vchar_code_property_alist
);
/* A string TABLE names a file; it is loaded from under
   "international/".  */
1328 if (STRINGP (table
))
1330 struct gcpro gcpro1
;
1332 result
= Fload (concat2 (build_string ("international/"), table
),
/* TABLE is tested for being a char-table that also satisfies
   UNIPROP_TABLE_P; the action taken on failure is not shown in this
   listing.  */
1339 if (! CHAR_TABLE_P (table
)
1340 || ! UNIPROP_TABLE_P (table
))
/* Extra slot 1 is the slot uniprop_get_decoder reads; an integer
   there is range-checked against the number of known decoders.  */
1342 val
= XCHAR_TABLE (table
)->extras
[1];
1344 ? (XINT (val
) < 0 || XINT (val
) >= uniprop_decoder_count
)
1347 /* Prepare ASCII values in advance for CHAR_TABLE_REF. */
1348 set_char_table_ascii (table
, char_table_ascii (table
));
1352 DEFUN ("unicode-property-table-internal", Funicode_property_table_internal
,
1353 Sunicode_property_table_internal
, 1, 1, 0,
1354 doc
: /* Return a char-table for Unicode character property PROP.
1355 Use `get-unicode-property-internal' and
1356 `put-unicode-property-internal' instead of `aref' and `aset' to get
1357 and put an element value. */)
1360 Lisp_Object table
= uniprop_table (prop
);
1362 if (CHAR_TABLE_P (table
))
1364 return Fcdr (Fassq (prop
, Vchar_code_property_alist
));
1367 DEFUN ("get-unicode-property-internal", Fget_unicode_property_internal
,
1368 Sget_unicode_property_internal
, 2, 2, 0,
1369 doc
: /* Return an element of CHAR-TABLE for character CH.
1370 CHAR-TABLE must be what returned by `unicode-property-table-internal'. */)
1371 (Lisp_Object char_table
, Lisp_Object ch
)
1374 uniprop_decoder_t decoder
;
1376 CHECK_CHAR_TABLE (char_table
);
1377 CHECK_CHARACTER (ch
);
1378 if (! UNIPROP_TABLE_P (char_table
))
1379 error ("Invalid Unicode property table");
1380 val
= CHAR_TABLE_REF (char_table
, XINT (ch
));
1381 decoder
= uniprop_get_decoder (char_table
);
1382 return (decoder
? decoder (char_table
, val
) : val
);
/* Lisp primitive that stores VALUE for character CH in a uniprop
   char-table.  NOTE(review): this listing omits some original lines
   of the body (the embedded numbers skip 1398 and everything after
   1400), so any guard in front of the encoder call and the return
   statement are not visible here.  */
1385 DEFUN ("put-unicode-property-internal", Fput_unicode_property_internal
,
1386 Sput_unicode_property_internal
, 3, 3, 0,
1387 doc
: /* Set an element of CHAR-TABLE for character CH to VALUE.
1388 CHAR-TABLE must be what returned by `unicode-property-table-internal'. */)
1389 (Lisp_Object char_table
, Lisp_Object ch
, Lisp_Object value
)
1391 uniprop_encoder_t encoder
;
/* Argument validation: a char-table that is a uniprop table, and a
   character.  */
1393 CHECK_CHAR_TABLE (char_table
);
1394 CHECK_CHARACTER (ch
);
1395 if (! UNIPROP_TABLE_P (char_table
))
1396 error ("Invalid Unicode property table");
/* Translate VALUE into the table's stored form with the encoder
   selected by uniprop_get_encoder.  */
1397 encoder
= uniprop_get_encoder (char_table
);
1399 value
= encoder (char_table
, value
);
/* Store the (possibly encoded) VALUE as the element for CH.  */
1400 CHAR_TABLE_SET (char_table
, XINT (ch
), value
);
/* Define the symbol, the Lisp primitives and the Lisp variable that
   this file provides.  NOTE(review): the closing part of the function
   is not visible in this listing.  */
1406 syms_of_chartab (void)
1408 DEFSYM (Qchar_code_property_table
, "char-code-property-table");
/* One defsubr per DEFUN-defined primitive; the last three are the
   uniprop accessors.  */
1410 defsubr (&Smake_char_table
);
1411 defsubr (&Schar_table_parent
);
1412 defsubr (&Schar_table_subtype
);
1413 defsubr (&Sset_char_table_parent
);
1414 defsubr (&Schar_table_extra_slot
);
1415 defsubr (&Sset_char_table_extra_slot
);
1416 defsubr (&Schar_table_range
);
1417 defsubr (&Sset_char_table_range
);
1418 defsubr (&Sset_char_table_default
);
1419 defsubr (&Soptimize_char_table
);
1420 defsubr (&Smap_char_table
);
1421 defsubr (&Sunicode_property_table_internal
);
1422 defsubr (&Sget_unicode_property_internal
);
1423 defsubr (&Sput_unicode_property_internal
);
1425 /* Each element has the form (PROP . TABLE).
1426 PROP is a symbol representing a character property.
1427 TABLE is a char-table containing the property value for each character.
1428 TABLE may be a name of file to load to build a char-table.
1429 This variable should be modified only through
1430 `define-char-code-property'. */
1432 DEFVAR_LISP ("char-code-property-alist", Vchar_code_property_alist
,
1433 doc
: /* Alist of character property name vs char-table containing property values.
1434 Internal use only. */);
/* The alist starts out empty.  */
1435 Vchar_code_property_alist
= Qnil
;