1 /* Basic character support.
2 Copyright (C) 1995, 1997, 1998, 2001 Electrotechnical Laboratory, JAPAN.
3 Licensed to the Free Software Foundation.
4 Copyright (C) 2001, 2002, 2003, 2004, 2005, 2006, 2007, 2008
5 Free Software Foundation, Inc.
6 Copyright (C) 2003, 2004, 2005, 2006, 2007, 2008
7 National Institute of Advanced Industrial Science and Technology (AIST)
8 Registration Number H13PRO009
10 This file is part of GNU Emacs.
12 GNU Emacs is free software; you can redistribute it and/or modify
13 it under the terms of the GNU General Public License as published by
14 the Free Software Foundation; either version 3, or (at your option)
17 GNU Emacs is distributed in the hope that it will be useful,
18 but WITHOUT ANY WARRANTY; without even the implied warranty of
19 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
20 GNU General Public License for more details.
22 You should have received a copy of the GNU General Public License
23 along with GNU Emacs; see the file COPYING. If not, write to the
24 Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
25 Boston, MA 02110-1301, USA. */
27 /* At first, see the document in `character.h' to understand the code
38 #include <sys/types.h>
40 #include "character.h"
43 #include "composite.h"
52 Lisp_Object Qcharacterp
;
54 /* Vector of translation table ever defined.
55 ID of a translation table is used to index this vector. */
56 Lisp_Object Vtranslation_table_vector
;
58 /* A char-table for characters which may invoke auto-filling. */
59 Lisp_Object Vauto_fill_chars
;
61 Lisp_Object Qauto_fill_chars
;
63 /* Char-table of information about which character to unify to which
65 Lisp_Object Vchar_unify_table
;
67 /* A char-table. An element is non-nil iff the corresponding
68 character has a printable glyph. */
69 Lisp_Object Vprintable_chars
;
71 /* A char-table. An elemnent is a column-width of the corresponding
73 Lisp_Object Vchar_width_table
;
75 /* A char-table. An element is a symbol indicating the direction
76 property of corresponding character. */
77 Lisp_Object Vchar_direction_table
;
79 /* Variable used locally in the macro FETCH_MULTIBYTE_CHAR. */
80 unsigned char *_fetch_multibyte_char_p
;
82 /* Char table of scripts. */
83 Lisp_Object Vchar_script_table
;
85 /* Alist of scripts vs representative characters. */
86 Lisp_Object Vscript_representative_chars
;
88 static Lisp_Object Qchar_script_table
;
90 /* Mapping table from unibyte chars to multibyte chars. */
91 int unibyte_to_multibyte_table
[256];
93 /* Nth element is 1 iff unibyte char N can be mapped to a multibyte
95 char unibyte_has_multibyte_table
[256];
99 /* If character code C has modifier masks, reflect them to the
100 character code if possible. Return the resulting code. */
103 char_resolve_modifier_mask (c
)
106 /* A non-ASCII character can't reflect modifier bits to the code. */
107 if (! ASCII_CHAR_P ((c
& ~CHAR_MODIFIER_MASK
)))
110 /* For Meta, Shift, and Control modifiers, we need special care. */
113 /* Shift modifier is valid only with [A-Za-z]. */
114 if ((c
& 0377) >= 'A' && (c
& 0377) <= 'Z')
116 else if ((c
& 0377) >= 'a' && (c
& 0377) <= 'z')
117 c
= (c
& ~CHAR_SHIFT
) - ('a' - 'A');
118 /* Shift modifier for control characters and SPC is ignored. */
119 else if ((c
& ~CHAR_MODIFIER_MASK
) <= 0x20)
124 /* Simulate the code in lread.c. */
125 /* Allow `\C- ' and `\C-?'. */
126 if ((c
& 0377) == ' ')
127 c
&= ~0177 & ~ CHAR_CTL
;
128 else if ((c
& 0377) == '?')
129 c
= 0177 | (c
& ~0177 & ~CHAR_CTL
);
130 /* ASCII control chars are made from letters (both cases),
131 as well as the non-letters within 0100...0137. */
132 else if ((c
& 0137) >= 0101 && (c
& 0137) <= 0132)
133 c
&= (037 | (~0177 & ~CHAR_CTL
));
134 else if ((c
& 0177) >= 0100 && (c
& 0177) <= 0137)
135 c
&= (037 | (~0177 & ~CHAR_CTL
));
139 /* Move the meta bit to the right place for a string. */
140 c
= (c
& ~CHAR_META
) | 0x80;
147 /* Store multibyte form of character C at P. If C has modifier bits,
148 handle them appropriately. */
157 if (c
& CHAR_MODIFIER_MASK
)
159 c
= (unsigned) char_resolve_modifier_mask ((int) c
);
160 /* If C still has any modifier bits, just ignore it. */
161 c
&= ~CHAR_MODIFIER_MASK
;
164 MAYBE_UNIFY_CHAR (c
);
166 if (c
<= MAX_3_BYTE_CHAR
)
168 bytes
= CHAR_STRING (c
, p
);
170 else if (c
<= MAX_4_BYTE_CHAR
)
172 p
[0] = (0xF0 | (c
>> 18));
173 p
[1] = (0x80 | ((c
>> 12) & 0x3F));
174 p
[2] = (0x80 | ((c
>> 6) & 0x3F));
175 p
[3] = (0x80 | (c
& 0x3F));
178 else if (c
<= MAX_5_BYTE_CHAR
)
181 p
[1] = (0x80 | ((c
>> 18) & 0x0F));
182 p
[2] = (0x80 | ((c
>> 12) & 0x3F));
183 p
[3] = (0x80 | ((c
>> 6) & 0x3F));
184 p
[4] = (0x80 | (c
& 0x3F));
187 else if (c
<= MAX_CHAR
)
189 c
= CHAR_TO_BYTE8 (c
);
190 bytes
= BYTE8_STRING (c
, p
);
193 error ("Invalid character: %d", c
);
199 /* Return a character whose multibyte form is at P. Set LEN is not
200 NULL, it must be a pointer to integer. In that case, set *LEN to
201 the byte length of the multibyte form. If ADVANCED is not NULL, is
202 must be a pointer to unsigned char. In that case, set *ADVANCED to
203 the ending address (i.e. the starting address of the next
204 character) of the multibyte form. */
207 string_char (p
, advanced
, len
)
208 const unsigned char *p
;
209 const unsigned char **advanced
;
213 const unsigned char *saved_p
= p
;
215 if (*p
< 0x80 || ! (*p
& 0x20) || ! (*p
& 0x10))
217 c
= STRING_CHAR_ADVANCE (p
);
219 else if (! (*p
& 0x08))
221 c
= ((((p
)[0] & 0xF) << 18)
222 | (((p
)[1] & 0x3F) << 12)
223 | (((p
)[2] & 0x3F) << 6)
229 c
= ((((p
)[1] & 0x3F) << 18)
230 | (((p
)[2] & 0x3F) << 12)
231 | (((p
)[3] & 0x3F) << 6)
236 MAYBE_UNIFY_CHAR (c
);
246 /* Translate character C by translation table TABLE. If C is
247 negative, translate a character specified by CHARSET and CODE. If
248 no translation is found in TABLE, return the untranslated
249 character. If TABLE is a list, elements are char tables. In this
250 case, translace C by all tables. */
253 translate_char (table
, c
)
257 if (CHAR_TABLE_P (table
))
261 ch
= CHAR_TABLE_REF (table
, c
);
267 for (; CONSP (table
); table
= XCDR (table
))
268 c
= translate_char (XCAR (table
), c
);
273 /* Convert the multibyte character C to unibyte 8-bit character based
274 on the current value of charset_unibyte. If dimension of
275 charset_unibyte is more than one, return (C & 0xFF).
277 The argument REV_TBL is now ignored. It will be removed in the
281 multibyte_char_to_unibyte (c
, rev_tbl
)
285 struct charset
*charset
;
288 if (CHAR_BYTE8_P (c
))
289 return CHAR_TO_BYTE8 (c
);
290 charset
= CHARSET_FROM_ID (charset_unibyte
);
291 c1
= ENCODE_CHAR (charset
, c
);
292 return ((c1
!= CHARSET_INVALID_CODE (charset
)) ? c1
: c
& 0xFF);
295 /* Like multibyte_char_to_unibyte, but return -1 if C is not supported
296 by charset_unibyte. */
299 multibyte_char_to_unibyte_safe (c
)
302 struct charset
*charset
;
305 if (CHAR_BYTE8_P (c
))
306 return CHAR_TO_BYTE8 (c
);
307 charset
= CHARSET_FROM_ID (charset_unibyte
);
308 c1
= ENCODE_CHAR (charset
, c
);
309 return ((c1
!= CHARSET_INVALID_CODE (charset
)) ? c1
: -1);
312 DEFUN ("characterp", Fcharacterp
, Scharacterp
, 1, 2, 0,
313 doc
: /* Return non-nil if OBJECT is a character. */)
315 Lisp_Object object
, ignore
;
317 return (CHARACTERP (object
) ? Qt
: Qnil
);
320 DEFUN ("max-char", Fmax_char
, Smax_char
, 0, 0, 0,
321 doc
: /* Return the character of the maximum code. */)
324 return make_number (MAX_CHAR
);
327 DEFUN ("unibyte-char-to-multibyte", Funibyte_char_to_multibyte
,
328 Sunibyte_char_to_multibyte
, 1, 1, 0,
329 doc
: /* Convert the byte CH to multibyte character. */)
334 struct charset
*charset
;
336 CHECK_CHARACTER (ch
);
339 error ("Invalid unibyte character: %d", c
);
340 charset
= CHARSET_FROM_ID (charset_unibyte
);
341 c
= DECODE_CHAR (charset
, c
);
343 c
= BYTE8_TO_CHAR (XFASTINT (ch
));
344 return make_number (c
);
347 DEFUN ("multibyte-char-to-unibyte", Fmultibyte_char_to_unibyte
,
348 Smultibyte_char_to_unibyte
, 1, 1, 0,
349 doc
: /* Convert the multibyte character CH to a byte.
350 If the multibyte character does not represent a byte, return -1. */)
356 CHECK_CHARACTER (ch
);
359 /* Can't distinguish a byte read from a unibyte buffer from
360 a latin1 char, so let's let it slide. */
364 int cu
= CHAR_TO_BYTE8 (cm
);
365 return make_number (cu
);
369 DEFUN ("char-bytes", Fchar_bytes
, Schar_bytes
, 1, 1, 0,
370 doc
: /* Return 1 regardless of the argument CHAR.
371 This is now an obsolete function. We keep it just for backward compatibility.
372 usage: (char-bytes CHAR) */)
376 CHECK_CHARACTER (ch
);
377 return make_number (1);
380 DEFUN ("char-width", Fchar_width
, Schar_width
, 1, 1, 0,
381 doc
: /* Return width of CHAR when displayed in the current buffer.
382 The width is measured by how many columns it occupies on the screen.
383 Tab is taken to occupy `tab-width' columns.
384 usage: (char-width CHAR) */)
390 struct Lisp_Char_Table
*dp
= buffer_display_table ();
392 CHECK_CHARACTER (ch
);
395 /* Get the way the display table would display it. */
396 disp
= dp
? DISP_CHAR_VECTOR (dp
, c
) : Qnil
;
399 width
= ASIZE (disp
);
401 width
= CHAR_WIDTH (c
);
403 return make_number (width
);
406 /* Return width of string STR of length LEN when displayed in the
407 current buffer. The width is measured by how many columns it
408 occupies on the screen. If PRECISION > 0, return the width of
409 longest substring that doesn't exceed PRECISION, and set number of
410 characters and bytes of the substring in *NCHARS and *NBYTES
414 c_string_width (str
, len
, precision
, nchars
, nbytes
)
415 const unsigned char *str
;
416 int precision
, *nchars
, *nbytes
;
418 int i
= 0, i_byte
= 0;
420 struct Lisp_Char_Table
*dp
= buffer_display_table ();
424 int bytes
, thiswidth
;
426 int c
= STRING_CHAR_AND_LENGTH (str
+ i_byte
, len
- i_byte
, bytes
);
430 val
= DISP_CHAR_VECTOR (dp
, c
);
432 thiswidth
= XVECTOR (val
)->size
;
434 thiswidth
= CHAR_WIDTH (c
);
438 thiswidth
= CHAR_WIDTH (c
);
442 && (width
+ thiswidth
> precision
))
462 /* Return width of string STR of length LEN when displayed in the
463 current buffer. The width is measured by how many columns it
464 occupies on the screen. */
471 return c_string_width (str
, len
, -1, NULL
, NULL
);
474 /* Return width of Lisp string STRING when displayed in the current
475 buffer. The width is measured by how many columns it occupies on
476 the screen while paying attention to compositions. If PRECISION >
477 0, return the width of longest substring that doesn't exceed
478 PRECISION, and set number of characters and bytes of the substring
479 in *NCHARS and *NBYTES respectively. */
482 lisp_string_width (string
, precision
, nchars
, nbytes
)
484 int precision
, *nchars
, *nbytes
;
486 int len
= SCHARS (string
);
487 /* This set multibyte to 0 even if STRING is multibyte when it
488 contains only ascii and eight-bit-graphic, but that's
490 int multibyte
= len
< SBYTES (string
);
491 unsigned char *str
= SDATA (string
);
492 int i
= 0, i_byte
= 0;
494 struct Lisp_Char_Table
*dp
= buffer_display_table ();
498 int chars
, bytes
, thiswidth
;
501 EMACS_INT ignore
, end
;
503 if (find_composition (i
, -1, &ignore
, &end
, &val
, string
)
504 && ((cmp_id
= get_composition_id (i
, i_byte
, end
- i
, val
, string
))
507 thiswidth
= composition_table
[cmp_id
]->width
;
509 bytes
= string_char_to_byte (string
, end
) - i_byte
;
516 c
= STRING_CHAR_AND_LENGTH (str
+ i_byte
, len
- i_byte
, bytes
);
518 c
= str
[i_byte
], bytes
= 1;
522 val
= DISP_CHAR_VECTOR (dp
, c
);
524 thiswidth
= XVECTOR (val
)->size
;
526 thiswidth
= CHAR_WIDTH (c
);
530 thiswidth
= CHAR_WIDTH (c
);
535 && (width
+ thiswidth
> precision
))
555 DEFUN ("string-width", Fstring_width
, Sstring_width
, 1, 1, 0,
556 doc
: /* Return width of STRING when displayed in the current buffer.
557 Width is measured by how many columns it occupies on the screen.
558 When calculating width of a multibyte character in STRING,
559 only the base leading-code is considered; the validity of
560 the following bytes is not checked. Tabs in STRING are always
561 taken to occupy `tab-width' columns.
562 usage: (string-width STRING) */)
569 XSETFASTINT (val
, lisp_string_width (str
, -1, NULL
, NULL
));
573 DEFUN ("char-direction", Fchar_direction
, Schar_direction
, 1, 1, 0,
574 doc
: /* Return the direction of CHAR.
575 The returned value is 0 for left-to-right and 1 for right-to-left.
576 usage: (char-direction CHAR) */)
582 CHECK_CHARACTER (ch
);
584 return CHAR_TABLE_REF (Vchar_direction_table
, c
);
587 /* Return the number of characters in the NBYTES bytes at PTR.
588 This works by looking at the contents and checking for multibyte
589 sequences while assuming that there's no invalid sequence.
590 However, if the current buffer has enable-multibyte-characters =
591 nil, we treat each byte as a character. */
594 chars_in_text (ptr
, nbytes
)
595 const unsigned char *ptr
;
598 /* current_buffer is null at early stages of Emacs initialization. */
599 if (current_buffer
== 0
600 || NILP (current_buffer
->enable_multibyte_characters
))
603 return multibyte_chars_in_text (ptr
, nbytes
);
606 /* Return the number of characters in the NBYTES bytes at PTR.
607 This works by looking at the contents and checking for multibyte
608 sequences while assuming that there's no invalid sequence. It
609 ignores enable-multibyte-characters. */
612 multibyte_chars_in_text (ptr
, nbytes
)
613 const unsigned char *ptr
;
616 const unsigned char *endp
= ptr
+ nbytes
;
621 int len
= MULTIBYTE_LENGTH (ptr
, endp
);
632 /* Parse unibyte text at STR of LEN bytes as a multibyte text, count
633 characters and bytes in it, and store them in *NCHARS and *NBYTES
634 respectively. On counting bytes, pay attention to that 8-bit
635 characters not constructing a valid multibyte sequence are
636 represented by 2-byte in a multibyte text. */
639 parse_str_as_multibyte (str
, len
, nchars
, nbytes
)
640 const unsigned char *str
;
641 int len
, *nchars
, *nbytes
;
643 const unsigned char *endp
= str
+ len
;
644 int n
, chars
= 0, bytes
= 0;
646 if (len
>= MAX_MULTIBYTE_LENGTH
)
648 const unsigned char *adjusted_endp
= endp
- MAX_MULTIBYTE_LENGTH
;
649 while (str
< adjusted_endp
)
651 if ((n
= MULTIBYTE_LENGTH_NO_CHECK (str
)) > 0)
652 str
+= n
, bytes
+= n
;
660 if ((n
= MULTIBYTE_LENGTH (str
, endp
)) > 0)
661 str
+= n
, bytes
+= n
;
672 /* Arrange unibyte text at STR of NBYTES bytes as a multibyte text.
673 It actually converts only such 8-bit characters that don't contruct
674 a multibyte sequence to multibyte forms of Latin-1 characters. If
675 NCHARS is nonzero, set *NCHARS to the number of characters in the
676 text. It is assured that we can use LEN bytes at STR as a work
677 area and that is enough. Return the number of bytes of the
681 str_as_multibyte (str
, len
, nbytes
, nchars
)
683 int len
, nbytes
, *nchars
;
685 unsigned char *p
= str
, *endp
= str
+ nbytes
;
690 if (nbytes
>= MAX_MULTIBYTE_LENGTH
)
692 unsigned char *adjusted_endp
= endp
- MAX_MULTIBYTE_LENGTH
;
693 while (p
< adjusted_endp
694 && (n
= MULTIBYTE_LENGTH_NO_CHECK (p
)) > 0)
697 while ((n
= MULTIBYTE_LENGTH (p
, endp
)) > 0)
707 safe_bcopy ((char *) p
, (char *) (endp
- nbytes
), nbytes
);
710 if (nbytes
>= MAX_MULTIBYTE_LENGTH
)
712 unsigned char *adjusted_endp
= endp
- MAX_MULTIBYTE_LENGTH
;
713 while (p
< adjusted_endp
)
715 if ((n
= MULTIBYTE_LENGTH_NO_CHECK (p
)) > 0)
723 c
= BYTE8_TO_CHAR (c
);
724 to
+= CHAR_STRING (c
, to
);
731 if ((n
= MULTIBYTE_LENGTH (p
, endp
)) > 0)
739 c
= BYTE8_TO_CHAR (c
);
740 to
+= CHAR_STRING (c
, to
);
749 /* Parse unibyte string at STR of LEN bytes, and return the number of
750 bytes it may ocupy when converted to multibyte string by
751 `str_to_multibyte'. */
754 parse_str_to_multibyte (str
, len
)
758 unsigned char *endp
= str
+ len
;
761 for (bytes
= 0; str
< endp
; str
++)
762 bytes
+= (*str
< 0x80) ? 1 : 2;
767 /* Convert unibyte text at STR of NBYTES bytes to a multibyte text
768 that contains the same single-byte characters. It actually
769 converts all 8-bit characters to multibyte forms. It is assured
770 that we can use LEN bytes at STR as a work area and that is
774 str_to_multibyte (str
, len
, bytes
)
778 unsigned char *p
= str
, *endp
= str
+ bytes
;
781 while (p
< endp
&& *p
< 0x80) p
++;
787 safe_bcopy ((char *) p
, (char *) (endp
- bytes
), bytes
);
794 c
= BYTE8_TO_CHAR (c
);
795 to
+= CHAR_STRING (c
, to
);
800 /* Arrange multibyte text at STR of LEN bytes as a unibyte text. It
801 actually converts characters in the range 0x80..0xFF to
805 str_as_unibyte (str
, bytes
)
809 const unsigned char *p
= str
, *endp
= str
+ bytes
;
816 len
= BYTES_BY_CHAR_HEAD (c
);
817 if (CHAR_BYTE8_HEAD_P (c
))
821 to
= str
+ (p
- str
);
825 len
= BYTES_BY_CHAR_HEAD (c
);
826 if (CHAR_BYTE8_HEAD_P (c
))
828 c
= STRING_CHAR_ADVANCE (p
);
829 *to
++ = CHAR_TO_BYTE8 (c
);
833 while (len
--) *to
++ = *p
++;
840 string_count_byte8 (string
)
843 int multibyte
= STRING_MULTIBYTE (string
);
844 int nbytes
= SBYTES (string
);
845 unsigned char *p
= SDATA (string
);
846 unsigned char *pend
= p
+ nbytes
;
854 len
= BYTES_BY_CHAR_HEAD (c
);
856 if (CHAR_BYTE8_HEAD_P (c
))
871 string_escape_byte8 (string
)
874 int nchars
= SCHARS (string
);
875 int nbytes
= SBYTES (string
);
876 int multibyte
= STRING_MULTIBYTE (string
);
878 const unsigned char *src
, *src_end
;
883 if (multibyte
&& nchars
== nbytes
)
886 byte8_count
= string_count_byte8 (string
);
888 if (byte8_count
== 0)
892 /* Convert 2-byte sequence of byte8 chars to 4-byte octal. */
893 val
= make_uninit_multibyte_string (nchars
+ byte8_count
* 3,
894 nbytes
+ byte8_count
* 2);
896 /* Convert 1-byte sequence of byte8 chars to 4-byte octal. */
897 val
= make_uninit_string (nbytes
+ byte8_count
* 3);
899 src
= SDATA (string
);
900 src_end
= src
+ nbytes
;
903 while (src
< src_end
)
906 len
= BYTES_BY_CHAR_HEAD (c
);
908 if (CHAR_BYTE8_HEAD_P (c
))
910 c
= STRING_CHAR_ADVANCE (src
);
911 c
= CHAR_TO_BYTE8 (c
);
912 sprintf ((char *) dst
, "\\%03o", c
);
916 while (len
--) *dst
++ = *src
++;
919 while (src
< src_end
)
924 sprintf ((char *) dst
, "\\%03o", c
);
934 DEFUN ("string", Fstring
, Sstring
, 0, MANY
, 0,
936 Concatenate all the argument characters and make the result a string.
937 usage: (string &rest CHARACTERS) */)
943 unsigned char *buf
= (unsigned char *) alloca (MAX_MULTIBYTE_LENGTH
* n
);
944 unsigned char *p
= buf
;
947 for (i
= 0; i
< n
; i
++)
949 CHECK_CHARACTER (args
[i
]);
951 p
+= CHAR_STRING (c
, p
);
954 return make_string_from_bytes ((char *) buf
, n
, p
- buf
);
957 DEFUN ("unibyte-string", Funibyte_string
, Sunibyte_string
, 0, MANY
, 0,
958 doc
: /* Concatenate all the argument bytes and make the result a unibyte string.
959 usage: (unibyte-string &rest BYTES) */)
965 unsigned char *buf
= (unsigned char *) alloca (n
);
966 unsigned char *p
= buf
;
969 for (i
= 0; i
< n
; i
++)
971 CHECK_NATNUM (args
[i
]);
972 c
= XFASTINT (args
[i
]);
974 args_out_of_range_3 (args
[i
], make_number (0), make_number (255));
978 return make_string_from_bytes ((char *) buf
, n
, p
- buf
);
981 DEFUN ("char-resolve-modifers", Fchar_resolve_modifiers
,
982 Schar_resolve_modifiers
, 1, 1, 0,
983 doc
: /* Resolve modifiers in the character CHAR.
984 The value is a character with modifiers resolved into the character
985 code. Unresolved modifiers are kept in the value.
986 usage: (char-resolve-modifers CHAR) */)
988 Lisp_Object character
;
992 CHECK_NUMBER (character
);
993 c
= XINT (character
);
994 return make_number (char_resolve_modifier_mask (c
));
998 init_character_once ()
1005 syms_of_character ()
1007 DEFSYM (Qcharacterp
, "characterp");
1008 DEFSYM (Qauto_fill_chars
, "auto-fill-chars");
1010 staticpro (&Vchar_unify_table
);
1011 Vchar_unify_table
= Qnil
;
1013 defsubr (&Smax_char
);
1014 defsubr (&Scharacterp
);
1015 defsubr (&Sunibyte_char_to_multibyte
);
1016 defsubr (&Smultibyte_char_to_unibyte
);
1017 defsubr (&Schar_bytes
);
1018 defsubr (&Schar_width
);
1019 defsubr (&Sstring_width
);
1020 defsubr (&Schar_direction
);
1022 defsubr (&Sunibyte_string
);
1023 defsubr (&Schar_resolve_modifiers
);
1025 DEFVAR_LISP ("translation-table-vector", &Vtranslation_table_vector
,
1027 Vector recording all translation tables ever defined.
1028 Each element is a pair (SYMBOL . TABLE) relating the table to the
1029 symbol naming it. The ID of a translation table is an index into this vector. */);
1030 Vtranslation_table_vector
= Fmake_vector (make_number (16), Qnil
);
1032 DEFVAR_LISP ("auto-fill-chars", &Vauto_fill_chars
,
1034 A char-table for characters which invoke auto-filling.
1035 Such characters have value t in this table. */);
1036 Vauto_fill_chars
= Fmake_char_table (Qauto_fill_chars
, Qnil
);
1037 CHAR_TABLE_SET (Vauto_fill_chars
, ' ', Qt
);
1038 CHAR_TABLE_SET (Vauto_fill_chars
, '\n', Qt
);
1040 DEFVAR_LISP ("char-width-table", &Vchar_width_table
,
1042 A char-table for width (columns) of each character. */);
1043 Vchar_width_table
= Fmake_char_table (Qnil
, make_number (1));
1044 char_table_set_range (Vchar_width_table
, 0x80, 0x9F, make_number (4));
1045 char_table_set_range (Vchar_width_table
, MAX_5_BYTE_CHAR
+ 1, MAX_CHAR
,
1048 DEFVAR_LISP ("char-direction-table", &Vchar_direction_table
,
1049 doc
: /* A char-table for direction of each character. */);
1050 Vchar_direction_table
= Fmake_char_table (Qnil
, make_number (1));
1052 DEFVAR_LISP ("printable-chars", &Vprintable_chars
,
1053 doc
: /* A char-table for each printable character. */);
1054 Vprintable_chars
= Fmake_char_table (Qnil
, Qnil
);
1055 Fset_char_table_range (Vprintable_chars
,
1056 Fcons (make_number (32), make_number (126)), Qt
);
1057 Fset_char_table_range (Vprintable_chars
,
1058 Fcons (make_number (160),
1059 make_number (MAX_5_BYTE_CHAR
)), Qt
);
1061 DEFVAR_LISP ("char-script-table", &Vchar_script_table
,
1062 doc
: /* Char table of script symbols.
1063 It has one extra slot whose value is a list of script symbols. */);
1065 /* Intern this now in case it isn't already done.
1066 Setting this variable twice is harmless.
1067 But don't staticpro it here--that is done in alloc.c. */
1068 Qchar_table_extra_slots
= intern ("char-table-extra-slots");
1069 DEFSYM (Qchar_script_table
, "char-script-table");
1070 Fput (Qchar_script_table
, Qchar_table_extra_slots
, make_number (1));
1071 Vchar_script_table
= Fmake_char_table (Qchar_script_table
, Qnil
);
1073 DEFVAR_LISP ("script-representative-chars", &Vscript_representative_chars
,
1074 doc
: /* Alist of scripts vs the representative characters. */);
1075 Vscript_representative_chars
= Qnil
;
1080 /* arch-tag: b6665960-3c3d-4184-85cd-af4318197999
1081 (do not change this comment) */