1 /* vi:set ts=8 sts=4 sw=4:
3 * VIM - Vi IMproved by Bram Moolenaar
5 * Do ":help uganda" in Vim to read copying and usage conditions.
6 * Do ":help credits" in Vim to see a list of people who contributed.
7 * See README.txt for an overview of the Vim source code.
/*
 * Forward declarations of file-local (static) helpers that are used before
 * their definitions appear further down in this file.
 * NOTE(review): __ARGS() is not defined in this file; presumably it is the
 * project's prototype-compatibility wrapper -- confirm in the shared header.
 */
/* Cell width of the character at "p" in window "wp", with TABs expanded
 * relative to column "col". */
13 static int win_chartabsize
__ARGS((win_T
*wp
, char_u
*p
, colnr_T col
));
/* Variant used when 'linebreak' is off and 'wrap' is on; may report an extra
 * cell through "headp" (see the comment at its definition). */
17 static int win_nolbr_chartabsize
__ARGS((win_T
*wp
, char_u
*s
, colnr_T col
, int *headp
));
/* Hex-digit helper; transchar_hex() calls it once per output nibble. */
20 static unsigned nr2hex
__ARGS((unsigned c
));
/*
 * FALSE until the character table has been filled in; set to TRUE once
 * chartab[] setup has completed.  While it is FALSE, transchar() must not
 * rely on chartab[] and falls back to a plain ' ' .. '~' range test.
 */
22 static int chartab_initialized
= FALSE
;
24 /* b_chartab[] is an array of 32 bytes, each bit representing one of the
25 * characters 0-255. */
/*
 * Bit layout: the flag for character "c" is stored in byte (c >> 3),
 * bit (c & 7) of (buf)->b_chartab[].
 *   SET_CHARTAB(buf, c)    set the bit for "c"
 *   RESET_CHARTAB(buf, c)  clear the bit for "c"
 *   GET_CHARTAB(buf, c)    non-zero when the bit for "c" is set, else zero
 * Caveats:
 * - "c" is evaluated twice in each macro, so do not pass an argument with
 *   side effects (e.g. "*p++").
 * - SET_CHARTAB and RESET_CHARTAB expand to an unparenthesized compound
 *   assignment; use them as a statement, not inside a larger expression.
 * - The byte index is computed from (unsigned)(c), so "c" must be in the
 *   range 0-255 to stay inside the 32-byte array.
 */
26 #define SET_CHARTAB(buf, c) (buf)->b_chartab[(unsigned)(c) >> 3] |= (1 << ((c) & 0x7))
27 #define RESET_CHARTAB(buf, c) (buf)->b_chartab[(unsigned)(c) >> 3] &= ~(1 << ((c) & 0x7))
28 #define GET_CHARTAB(buf, c) ((buf)->b_chartab[(unsigned)(c) >> 3] & (1 << ((c) & 0x7)))
31 * Fill chartab[]. Also fills curbuf->b_chartab[] with flags for keyword
32 * characters for current buffer.
34 * Depends on the option settings 'iskeyword', 'isident', 'isfname',
35 * 'isprint' and 'encoding'.
37 * The index in chartab[] depends on 'encoding':
38 * - For non-multi-byte index with the byte (same as the character).
39 * - For DBCS index with the first byte.
40 * - For UTF-8 index with the character (when first byte is up to 0x80 it is
41 * the same as the character, if the first byte is 0x80 and above it depends
44 * The contents of chartab[]:
45 * - The lower two bits, masked by CT_CELL_MASK, give the number of display
46 * cells the character occupies (1 or 2). Not valid for UTF-8 above 0x80.
47 * - CT_PRINT_CHAR bit is set when the character is printable (no need to
48 * translate the character before displaying it). Note that only DBCS
49 * characters can have 2 display cells and still be printable.
50 * - CT_FNAME_CHAR bit is set when the character can be in a file name.
51 * - CT_ID_CHAR bit is set when the character can be in an identifier.
53 * Return FAIL if 'iskeyword', 'isident', 'isfname' or 'isprint' option has an
54 * error, OK otherwise.
59 return buf_init_chartab(curbuf
, TRUE
);
63 buf_init_chartab(buf
, global
)
65 int global
; /* FALSE: only set buf->b_chartab[] */
77 * Set the default size for printable characters:
78 * From <Space> to '~' is 1 (printable), others are 2 (not printable).
79 * This also inits all 'isident' and 'isfname' flags to FALSE.
81 * EBCDIC: all chars below ' ' are not printable, all others are
86 chartab
[c
++] = (dy_flags
& DY_UHEX
) ? 4 : 2;
92 chartab
[c
++] = 1 + CT_PRINT_CHAR
;
97 chartab
[c
++] = 1 + CT_PRINT_CHAR
;
103 /* UTF-8: bytes 0xa0 - 0xff are printable (latin1) */
104 if (enc_utf8
&& c
>= 0xa0)
105 chartab
[c
++] = CT_PRINT_CHAR
+ 1;
106 /* euc-jp characters starting with 0x8e are single width */
107 else if (enc_dbcs
== DBCS_JPNU
&& c
== 0x8e)
108 chartab
[c
++] = CT_PRINT_CHAR
+ 1;
109 /* other double-byte chars can be printable AND double-width */
110 else if (enc_dbcs
!= 0 && MB_BYTE2LEN(c
) == 2)
111 chartab
[c
++] = CT_PRINT_CHAR
+ 2;
114 /* the rest is unprintable by default */
115 chartab
[c
++] = (dy_flags
& DY_UHEX
) ? 4 : 2;
119 /* Assume that every multi-byte char is a filename character. */
120 for (c
= 1; c
< 256; ++c
)
121 if ((enc_dbcs
!= 0 && MB_BYTE2LEN(c
) > 1)
122 || (enc_dbcs
== DBCS_JPNU
&& c
== 0x8e)
123 || (enc_utf8
&& c
>= 0xa0))
124 chartab
[c
] |= CT_FNAME_CHAR
;
129 * Init word char flags all to FALSE
131 vim_memset(buf
->b_chartab
, 0, (size_t)32);
134 for (c
= 0; c
< 256; ++c
)
136 /* double-byte characters are probably word characters */
137 if (MB_BYTE2LEN(c
) == 2)
144 * In lisp mode the '-' character is included in keywords.
147 SET_CHARTAB(buf
, '-');
150 /* Walk through the 'isident', 'iskeyword', 'isfname' and 'isprint'
151 * options. Each option is a list of characters, character numbers or
152 * ranges, separated by commas, e.g.: "200-210,x,#-178,-"
154 for (i
= global
? 0 : 3; i
<= 3; ++i
)
157 p
= p_isi
; /* first round: 'isident' */
159 p
= p_isp
; /* second round: 'isprint' */
161 p
= p_isf
; /* third round: 'isfname' */
163 p
= buf
->b_p_isk
; /* fourth round: 'iskeyword' */
169 if (*p
== '^' && p
[1] != NUL
)
179 c
= mb_ptr2char_adv(&p
);
184 if (*p
== '-' && p
[1] != NUL
)
192 c2
= mb_ptr2char_adv(&p
);
197 if (c
<= 0 || c
>= 256 || (c2
< c
&& c2
!= -1) || c2
>= 256
198 || !(*p
== NUL
|| *p
== ','))
201 if (c2
== -1) /* not a range */
204 * A single '@' (not "@-@"):
205 * Decide on letters being ID/printable/keyword chars with
206 * standard function isalpha(). This takes care of locale for
207 * single-byte characters.
220 /* Use the MB_ functions here, because isalpha() doesn't
221 * work properly when 'encoding' is "latin1" and the locale is
223 if (!do_isalpha
|| MB_ISLOWER(c
) || MB_ISUPPER(c
)
225 || (p_altkeymap
&& (F_isalpha(c
) || F_isdigit(c
)))
229 if (i
== 0) /* (re)set ID flag */
232 chartab
[c
] &= ~CT_ID_CHAR
;
234 chartab
[c
] |= CT_ID_CHAR
;
236 else if (i
== 1) /* (re)set printable */
244 && (F_isalpha(c
) || F_isdigit(c
)))
248 /* For double-byte we keep the cell width, so
249 * that we can detect it from the first byte. */
250 && !(enc_dbcs
&& MB_BYTE2LEN(c
) == 2)
256 chartab
[c
] = (chartab
[c
] & ~CT_CELL_MASK
)
257 + ((dy_flags
& DY_UHEX
) ? 4 : 2);
258 chartab
[c
] &= ~CT_PRINT_CHAR
;
262 chartab
[c
] = (chartab
[c
] & ~CT_CELL_MASK
) + 1;
263 chartab
[c
] |= CT_PRINT_CHAR
;
267 else if (i
== 2) /* (re)set fname flag */
270 chartab
[c
] &= ~CT_FNAME_CHAR
;
272 chartab
[c
] |= CT_FNAME_CHAR
;
274 else /* i == 3 */ /* (re)set keyword flag */
277 RESET_CHARTAB(buf
, c
);
284 p
= skip_to_option_part(p
);
287 chartab_initialized
= TRUE
;
292 * Translate any special characters in buf[bufsize] in-place.
293 * The result is a string with only printable characters, but if there is not
294 * enough room, not all characters will be translated.
297 trans_characters(buf
, bufsize
)
301 int len
; /* length of string needing translation */
302 int room
; /* room in buffer after string */
303 char_u
*trs
; /* translated character */
304 int trs_len
; /* length of trs[] */
306 len
= (int)STRLEN(buf
);
307 room
= bufsize
- len
;
311 /* Assume a multi-byte character doesn't need translation. */
312 if (has_mbyte
&& (trs_len
= (*mb_ptr2len
)(buf
)) > 1)
317 trs
= transchar_byte(*buf
);
318 trs_len
= (int)STRLEN(trs
);
324 mch_memmove(buf
+ trs_len
, buf
+ 1, (size_t)len
);
326 mch_memmove(buf
, trs
, (size_t)trs_len
);
333 #if defined(FEAT_EVAL) || defined(FEAT_TITLE) || defined(FEAT_INS_EXPAND) \
336 * Translate a string into allocated memory, replacing special chars with
337 * printable chars. Returns NULL when out of memory.
353 /* Compute the length of the result, taking account of unprintable
354 * multi-byte characters. */
359 if ((l
= (*mb_ptr2len
)(p
)) > 1)
361 c
= (*mb_ptr2char
)(p
);
367 transchar_hex(hexbuf
, c
);
368 len
+= (int)STRLEN(hexbuf
);
373 l
= byte2cells(*p
++);
377 len
+= 4; /* illegal byte sequence */
380 res
= alloc((unsigned)(len
+ 1));
384 res
= alloc((unsigned)(vim_strsize(s
) + 1));
392 if (has_mbyte
&& (l
= (*mb_ptr2len
)(p
)) > 1)
394 c
= (*mb_ptr2char
)(p
);
396 STRNCAT(res
, p
, l
); /* append printable multi-byte char */
398 transchar_hex(res
+ STRLEN(res
), c
);
403 STRCAT(res
, transchar_byte(*p
++));
410 #if defined(FEAT_SYN_HL) || defined(FEAT_INS_EXPAND) || defined(PROTO)
412 * Convert the string "str[orglen]" to do ignore-case comparing. Uses the
414 * When "buf" is NULL returns an allocated string (NULL for out-of-memory).
415 * Otherwise puts the result in "buf[buflen]".
418 str_foldcase(str
, orglen
, buf
, buflen
)
428 #define GA_CHAR(i) ((char_u *)ga.ga_data)[i]
429 #define GA_PTR(i) ((char_u *)ga.ga_data + i)
430 #define STR_CHAR(i) (buf == NULL ? GA_CHAR(i) : buf[i])
431 #define STR_PTR(i) (buf == NULL ? GA_PTR(i) : buf + i)
433 /* Copy "str" into "buf" or allocated memory, unmodified. */
436 ga_init2(&ga
, 1, 10);
437 if (ga_grow(&ga
, len
+ 1) == FAIL
)
439 mch_memmove(ga
.ga_data
, str
, (size_t)len
);
444 if (len
>= buflen
) /* Ugly! */
446 mch_memmove(buf
, str
, (size_t)len
);
453 /* Make each character lower case. */
455 while (STR_CHAR(i
) != NUL
)
458 if (enc_utf8
|| (has_mbyte
&& MB_BYTE2LEN(STR_CHAR(i
)) > 1))
462 int c
= utf_ptr2char(STR_PTR(i
));
463 int ol
= utf_ptr2len(STR_PTR(i
));
464 int lc
= utf_tolower(c
);
466 /* Only replace the character when it is not an invalid
467 * sequence (ASCII character or more than one byte) and
468 * utf_tolower() doesn't return the original character. */
469 if ((c
< 0x80 || ol
> 1) && c
!= lc
)
471 int nl
= utf_char2len(lc
);
473 /* If the byte length changes need to shift the following
474 * characters forward or backward. */
479 if (buf
== NULL
? ga_grow(&ga
, nl
- ol
+ 1) == FAIL
480 : len
+ nl
- ol
>= buflen
)
482 /* out of memory, keep old char */
491 STRMOVE(GA_PTR(i
) + nl
, GA_PTR(i
) + ol
);
492 ga
.ga_len
+= nl
- ol
;
496 STRMOVE(buf
+ i
+ nl
, buf
+ i
+ ol
);
501 (void)utf_char2bytes(lc
, STR_PTR(i
));
504 /* skip to next multi-byte char */
505 i
+= (*mb_ptr2len
)(STR_PTR(i
));
511 GA_CHAR(i
) = TOLOWER_LOC(GA_CHAR(i
));
513 buf
[i
] = TOLOWER_LOC(buf
[i
]);
519 return (char_u
*)ga
.ga_data
;
525 * Catch 22: chartab[] can't be initialized before the options are
526 * initialized, and initializing options may cause transchar() to be called!
527 * When chartab_initialized == FALSE don't use chartab[].
528 * Does NOT work for multi-byte characters, c must be <= 255.
529 * Also doesn't work for the first byte of a multi-byte, "c" must be a
532 static char_u transchar_buf
[7];
541 if (IS_SPECIAL(c
)) /* special key code, display as ~@ char */
543 transchar_buf
[0] = '~';
544 transchar_buf
[1] = '@';
549 if ((!chartab_initialized
&& (
553 (c
>= ' ' && c
<= '~')
558 )) || (c
< 256 && vim_isprintc_strict(c
)))
560 /* printable character */
561 transchar_buf
[i
] = c
;
562 transchar_buf
[i
+ 1] = NUL
;
565 transchar_nonprint(transchar_buf
+ i
, c
);
566 return transchar_buf
;
569 #if defined(FEAT_MBYTE) || defined(PROTO)
571 * Like transchar(), but called with a byte instead of a character. Checks
572 * for an illegal UTF-8 byte.
578 if (enc_utf8
&& c
>= 0x80)
580 transchar_nonprint(transchar_buf
, c
);
581 return transchar_buf
;
588 * Convert non-printable character to two or more printable characters in
589 * "buf[]". "buf" needs to be able to hold five bytes.
590 * Does NOT work for multi-byte characters, c must be <= 255.
593 transchar_nonprint(buf
, c
)
598 c
= NUL
; /* we use newline in place of a NUL */
599 else if (c
== CAR
&& get_fileformat(curbuf
) == EOL_MAC
)
600 c
= NL
; /* we use CR in place of NL in this case */
602 if (dy_flags
& DY_UHEX
) /* 'display' has "uhex" */
603 transchar_hex(buf
, c
);
606 /* For EBCDIC only the characters 0-63 and 255 are not printable */
607 else if (CtrlChar(c
) != 0 || c
== DEL
)
609 else if (c
<= 0x7f) /* 0x00 - 0x1f and 0x7f */
615 buf
[1] = '?'; /* DEL displayed as ^? */
617 buf
[1] = CtrlChar(c
);
619 buf
[1] = c
^ 0x40; /* DEL displayed as ^? */
625 else if (enc_utf8
&& c
>= 0x80)
627 transchar_hex(buf
, c
);
631 else if (c
>= ' ' + 0x80 && c
<= '~' + 0x80) /* 0xa0 - 0xfe */
641 buf
[1] = MetaChar(c
);
645 else /* 0x80 - 0x9f and 0xff */
648 * TODO: EBCDIC: I don't know what to do with these chars, so I display
649 * them as '~?' for now
653 buf
[1] = '?'; /* 0xff displayed as ~? */
655 buf
[1] = (c
- 0x80) ^ 0x40; /* 0xff displayed as ~? */
662 transchar_hex(buf
, c
)
672 buf
[++i
] = nr2hex((unsigned)c
>> 12);
673 buf
[++i
] = nr2hex((unsigned)c
>> 8);
676 buf
[++i
] = nr2hex((unsigned)c
>> 4);
677 buf
[++i
] = nr2hex((unsigned)c
);
683 * Convert the lower 4 bits of byte "c" to its hex character.
684 * Lower case letters are used to avoid the confusion of <F1> being 0xf1 or
692 return (c
& 0xf) + '0';
693 return (c
& 0xf) - 10 + 'a';
697 * Return number of display cells occupied by byte "b".
698 * Caller must make sure 0 <= b <= 255.
699 * For multi-byte mode "b" must be the first byte of a character.
700 * A TAB is counted as two cells: "^I".
701 * For UTF-8 mode this will return 0 for bytes >= 0x80, because the number of
702 * cells depends on further bytes.
709 if (enc_utf8
&& b
>= 0x80)
712 return (chartab
[b
] & CT_CELL_MASK
);
716 * Return number of display cells occupied by character "c".
717 * "c" can be a special key (negative number) in which case 3 or 4 is returned.
718 * A TAB is counted as two cells: "^I" or four: "<09>".
725 return char2cells(K_SECOND(c
)) + 2;
729 /* UTF-8: above 0x80 need to check the value */
731 return utf_char2cells(c
);
732 /* DBCS: double-byte means double-width, except for euc-jp with first
734 if (enc_dbcs
!= 0 && c
>= 0x100)
736 if (enc_dbcs
== DBCS_JPNU
&& ((unsigned)c
>> 8) == 0x8e)
742 return (chartab
[c
& 0xff] & CT_CELL_MASK
);
746 * Return number of display cells occupied by character at "*p".
747 * A TAB is counted as two cells: "^I" or four: "<09>".
754 /* For UTF-8 we need to look at more bytes if the first byte is >= 0x80. */
755 if (enc_utf8
&& *p
>= 0x80)
756 return utf_ptr2cells(p
);
757 /* For DBCS we can tell the cell count from the first byte. */
759 return (chartab
[*p
] & CT_CELL_MASK
);
763 * Return the number of characters string "s" will take on the screen,
764 * counting TABs as two characters: "^I".
770 return vim_strnsize(s
, (int)MAXCOL
);
774 * Return the number of characters string "s[len]" will take on the screen,
775 * counting TABs as two characters: "^I".
784 while (*s
!= NUL
&& --len
>= 0)
789 int l
= (*mb_ptr2len
)(s
);
791 size
+= ptr2cells(s
);
797 size
+= byte2cells(*s
++);
803 * Return the number of characters 'c' will take on the screen, taking
804 * into account the size of a tab.
805 * Use a define to make it fast, this is used very often!!!
806 * Also see getvcol() below.
809 #define RET_WIN_BUF_CHARTABSIZE(wp, buf, p, col) \
810 if (*(p) == TAB && (!(wp)->w_p_list || lcs_tab1)) \
813 ts = (buf)->b_p_ts; \
814 return (int)(ts - (col % ts)); \
819 #if defined(FEAT_VREPLACE) || defined(FEAT_EX_EXTRA) || defined(FEAT_GUI) \
820 || defined(FEAT_VIRTUALEDIT) || defined(PROTO)
826 RET_WIN_BUF_CHARTABSIZE(curwin
, curbuf
, p
, col
)
830 #ifdef FEAT_LINEBREAK
832 win_chartabsize(wp
, p
, col
)
837 RET_WIN_BUF_CHARTABSIZE(wp
, wp
->w_buffer
, p
, col
)
842 * return the number of characters the string 's' will take on the screen,
843 * taking into account the size of a tab
852 col
+= lbr_chartabsize_adv(&s
, col
);
857 * Like linetabsize(), but for a given window instead of the current one.
860 win_linetabsize(wp
, p
, len
)
868 for (s
= p
; *s
!= NUL
&& (len
== MAXCOL
|| s
< p
+ len
); mb_ptr_adv(s
))
869 col
+= win_lbr_chartabsize(wp
, s
, col
, NULL
);
874 * Return TRUE if 'c' is a normal identifier character:
875 * Letters and characters from the 'isident' option.
881 return (c
> 0 && c
< 0x100 && (chartab
[c
] & CT_ID_CHAR
));
885 * return TRUE if 'c' is a keyword character: Letters and characters from
886 * 'iskeyword' option for current buffer.
887 * For multi-byte characters mb_get_class() is used (builtin rules).
897 return dbcs_class((unsigned)c
>> 8, (unsigned)(c
& 0xff)) >= 2;
899 return utf_class(c
) >= 2;
902 return (c
> 0 && c
< 0x100 && GET_CHARTAB(curbuf
, c
) != 0);
906 * Just like vim_iswordc() but uses a pointer to the (multi-byte) character.
913 if (has_mbyte
&& MB_BYTE2LEN(*p
) > 1)
914 return mb_get_class(p
) >= 2;
916 return GET_CHARTAB(curbuf
, *p
) != 0;
919 #if defined(FEAT_SYN_HL) || defined(PROTO)
921 vim_iswordc_buf(p
, buf
)
926 if (has_mbyte
&& MB_BYTE2LEN(*p
) > 1)
927 return mb_get_class(p
) >= 2;
929 return (GET_CHARTAB(buf
, *p
) != 0);
934 * return TRUE if 'c' is a valid file-name character
935 * Assume characters above 0x100 are valid (multi-byte).
941 return (c
>= 0x100 || (c
> 0 && (chartab
[c
] & CT_FNAME_CHAR
)));
945 * return TRUE if 'c' is a valid file-name character or a wildcard character
946 * Assume characters above 0x100 are valid (multi-byte).
947 * Explicitly interpret ']' as a wildcard character as mch_has_wildcard("]")
958 return vim_isfilec(c
) || c
== ']' || mch_has_wildcard(buf
);
962 * return TRUE if 'c' is a printable character
963 * Assume characters above 0x100 are printable (multi-byte), except for
971 if (enc_utf8
&& c
>= 0x100)
972 return utf_printable(c
);
974 return (c
>= 0x100 || (c
> 0 && (chartab
[c
] & CT_PRINT_CHAR
)));
978 * Strict version of vim_isprintc(c), don't return TRUE if "c" is the head
979 * byte of a double-byte character.
982 vim_isprintc_strict(c
)
986 if (enc_dbcs
!= 0 && c
< 0x100 && MB_BYTE2LEN(c
) > 1)
988 if (enc_utf8
&& c
>= 0x100)
989 return utf_printable(c
);
991 return (c
>= 0x100 || (c
> 0 && (chartab
[c
] & CT_PRINT_CHAR
)));
995 * like chartabsize(), but also check for line breaks on the screen
998 lbr_chartabsize(s
, col
)
1002 #ifdef FEAT_LINEBREAK
1003 if (!curwin
->w_p_lbr
&& *p_sbr
== NUL
)
1007 if (curwin
->w_p_wrap
)
1008 return win_nolbr_chartabsize(curwin
, s
, col
, NULL
);
1010 RET_WIN_BUF_CHARTABSIZE(curwin
, curbuf
, s
, col
)
1011 #ifdef FEAT_LINEBREAK
1013 return win_lbr_chartabsize(curwin
, s
, col
, NULL
);
1018 * Call lbr_chartabsize() and advance the pointer.
1021 lbr_chartabsize_adv(s
, col
)
1027 retval
= lbr_chartabsize(*s
, col
);
1033 * This function is used very often, keep it fast!!!!
1035 * If "headp" is not NULL, set *headp to the size of what we add for 'showbreak'
1036 * string at start of line. Warning: *headp is only set if it's a non-zero
1037 * value, init to 0 before calling.
1040 win_lbr_chartabsize(wp
, s
, col
, headp
)
1046 #ifdef FEAT_LINEBREAK
1059 int tab_corr
= (*s
== TAB
);
1063 * No 'linebreak' and 'showbreak': return quickly.
1065 if (!wp
->w_p_lbr
&& *p_sbr
== NUL
)
1070 return win_nolbr_chartabsize(wp
, s
, col
, headp
);
1072 RET_WIN_BUF_CHARTABSIZE(wp
, wp
->w_buffer
, s
, col
)
1075 #ifdef FEAT_LINEBREAK
1077 * First get normal size, without 'linebreak'
1079 size
= win_chartabsize(wp
, s
, col
);
1083 * If 'linebreak' set check at a blank before a non-blank if the line
1084 * needs a break here
1088 && !vim_isbreak(s
[1])
1091 # ifdef FEAT_VERTSPLIT
1097 * Count all characters from first non-blank after a blank up to next
1098 * non-blank after a blank.
1100 numberextra
= win_col_off(wp
);
1102 colmax
= (colnr_T
)(W_WIDTH(wp
) - numberextra
);
1105 n
= colmax
+ win_col_off2(wp
);
1107 colmax
+= (((col
- colmax
) / n
) + 1) * n
;
1118 && (col2
== col
|| !vim_isbreak(*ps
))))))
1121 col2
+= win_chartabsize(wp
, s
, col2
);
1122 if (col2
>= colmax
) /* doesn't fit */
1124 size
= colmax
- col
;
1131 else if (has_mbyte
&& size
== 2 && MB_BYTE2LEN(*s
) > 1
1132 && wp
->w_p_wrap
&& in_win_border(wp
, col
))
1134 ++size
; /* Count the ">" in the last column. */
1140 * May have to add something for 'showbreak' string at start of line
1141 * Set *headp to the size of what we add.
1144 if (*p_sbr
!= NUL
&& wp
->w_p_wrap
&& col
!= 0)
1146 numberextra
= win_col_off(wp
);
1147 col
+= numberextra
+ mb_added
;
1148 if (col
>= (colnr_T
)W_WIDTH(wp
))
1151 numberextra
= W_WIDTH(wp
) - (numberextra
- win_col_off2(wp
));
1152 if (numberextra
> 0)
1153 col
= col
% numberextra
;
1155 if (col
== 0 || col
+ size
> (colnr_T
)W_WIDTH(wp
))
1157 added
= vim_strsize(p_sbr
);
1159 size
+= (added
/ wp
->w_buffer
->b_p_ts
) * wp
->w_buffer
->b_p_ts
;
1167 *headp
= added
+ mb_added
;
1172 #if defined(FEAT_MBYTE) || defined(PROTO)
1174 * Like win_lbr_chartabsize(), except that we know 'linebreak' is off and
1175 * 'wrap' is on. This means we need to check for a double-byte character that
1176 * doesn't fit at the end of the screen line.
1179 win_nolbr_chartabsize(wp
, s
, col
, headp
)
1187 if (*s
== TAB
&& (!wp
->w_p_list
|| lcs_tab1
))
1189 n
= wp
->w_buffer
->b_p_ts
;
1190 return (int)(n
- (col
% n
));
1193 /* Add one cell for a double-width character in the last column of the
1194 * window, displayed with a ">". */
1195 if (n
== 2 && MB_BYTE2LEN(*s
) > 1 && in_win_border(wp
, col
))
1205 * Return TRUE if virtual column "vcol" is in the rightmost column of window
1209 in_win_border(wp
, vcol
)
1213 int width1
; /* width of first line (after line number) */
1214 int width2
; /* width of further lines */
1216 #ifdef FEAT_VERTSPLIT
1217 if (wp
->w_width
== 0) /* there is no border */
1220 width1
= W_WIDTH(wp
) - win_col_off(wp
);
1221 if ((int)vcol
< width1
- 1)
1223 if ((int)vcol
== width1
- 1)
1225 width2
= width1
+ win_col_off2(wp
);
1228 return ((vcol
- width1
) % width2
== width2
- 1);
1230 #endif /* FEAT_MBYTE */
1233 * Get virtual column number of pos.
1234 * start: on the first position of this character (TAB, ctrl)
1235 * cursor: where the cursor is on this character (first char, except for TAB)
1236 * end: on the last position of this character (TAB, ctrl)
1238 * This is used very often, keep it fast!
1241 getvcol(wp
, pos
, start
, cursor
, end
)
1249 char_u
*ptr
; /* points to current char */
1250 char_u
*posptr
; /* points to char at pos->col */
1253 int ts
= wp
->w_buffer
->b_p_ts
;
1257 ptr
= ml_get_buf(wp
->w_buffer
, pos
->lnum
, FALSE
);
1258 if (pos
->col
== MAXCOL
)
1259 posptr
= NULL
; /* continue until the NUL */
1261 posptr
= ptr
+ pos
->col
;
1264 * This function is used very often, do some speed optimizations.
1265 * When 'list', 'linebreak' and 'showbreak' are not set use a simple loop.
1266 * Also use this when 'list' is set but tabs take their normal size.
1268 if ((!wp
->w_p_list
|| lcs_tab1
!= NUL
)
1269 #ifdef FEAT_LINEBREAK
1270 && !wp
->w_p_lbr
&& *p_sbr
== NUL
1283 /* make sure we don't go past the end of the line */
1286 incr
= 1; /* NUL at end of line only takes one column */
1289 /* A tab gets expanded, depending on the current column */
1291 incr
= ts
- (vcol
% ts
);
1297 /* For utf-8, if the byte is >= 0x80, need to look at
1298 * further bytes to find the cell width. */
1299 if (enc_utf8
&& c
>= 0x80)
1300 incr
= utf_ptr2cells(ptr
);
1304 /* If a double-cell char doesn't fit at the end of a line
1305 * it wraps to the next line, it's like this char is three
1307 if (incr
== 2 && wp
->w_p_wrap
&& MB_BYTE2LEN(*ptr
) > 1
1308 && in_win_border(wp
, vcol
))
1319 if (posptr
!= NULL
&& ptr
>= posptr
) /* character at pos->col */
1330 /* A tab gets expanded, depending on the current column */
1332 incr
= win_lbr_chartabsize(wp
, ptr
, vcol
, &head
);
1333 /* make sure we don't go past the end of the line */
1336 incr
= 1; /* NUL at end of line only takes one column */
1340 if (posptr
!= NULL
&& ptr
>= posptr
) /* character at pos->col */
1348 *start
= vcol
+ head
;
1350 *end
= vcol
+ incr
- 1;
1356 && !virtual_active()
1359 && (*p_sel
== 'e' || ltoreq(*pos
, VIsual
)))
1362 *cursor
= vcol
+ incr
- 1; /* cursor at end */
1364 *cursor
= vcol
+ head
; /* cursor at start */
1369 * Get virtual cursor column in the current window, pretending 'list' is off.
1372 getvcol_nolist(posp
)
1375 int list_save
= curwin
->w_p_list
;
1378 curwin
->w_p_list
= FALSE
;
1379 getvcol(curwin
, posp
, NULL
, &vcol
, NULL
);
1380 curwin
->w_p_list
= list_save
;
1384 #if defined(FEAT_VIRTUALEDIT) || defined(PROTO)
1386 * Get virtual column in virtual mode.
1389 getvvcol(wp
, pos
, start
, cursor
, end
)
1403 if (virtual_active())
1405 /* For virtual mode, only want one value */
1406 getvcol(wp
, pos
, &col
, NULL
, NULL
);
1408 coladd
= pos
->coladd
;
1411 /* Cannot put the cursor on part of a wide character. */
1412 ptr
= ml_get_buf(wp
->w_buffer
, pos
->lnum
, FALSE
);
1413 if (pos
->col
< (colnr_T
)STRLEN(ptr
))
1415 int c
= (*mb_ptr2char
)(ptr
+ pos
->col
);
1417 if (c
!= TAB
&& vim_isprintc(c
))
1419 endadd
= (colnr_T
)(char2cells(c
) - 1);
1420 if (coladd
> endadd
) /* past end of line */
1433 *end
= col
+ endadd
;
1436 getvcol(wp
, pos
, start
, cursor
, end
);
1440 #if defined(FEAT_VISUAL) || defined(PROTO)
1442 * Get the leftmost and rightmost virtual column of pos1 and pos2.
1443 * Used for Visual block mode.
1446 getvcols(wp
, pos1
, pos2
, left
, right
)
1449 colnr_T
*left
, *right
;
1451 colnr_T from1
, from2
, to1
, to2
;
1453 if (ltp(pos1
, pos2
))
1455 getvvcol(wp
, pos1
, &from1
, NULL
, &to1
);
1456 getvvcol(wp
, pos2
, &from2
, NULL
, &to2
);
1460 getvvcol(wp
, pos2
, &from1
, NULL
, &to1
);
1461 getvvcol(wp
, pos1
, &from2
, NULL
, &to2
);
1469 if (*p_sel
== 'e' && from2
- 1 >= to1
)
1480 * skipwhite: skip over ' ' and '\t'.
1488 while (vim_iswhite(*p
)) /* skip to next non-white */
1502 while (VIM_ISDIGIT(*p
)) /* skip to next non-digit */
1507 #if defined(FEAT_SYN_HL) || defined(FEAT_SPELL) || defined(PROTO)
1509 * skip over digits and hex characters
1517 while (vim_isxdigit(*p
)) /* skip to next non-digit */
1523 #if defined(FEAT_EX_EXTRA) || defined(PROTO)
1525 * skip to digit (or NUL after the string)
1533 while (*p
!= NUL
&& !VIM_ISDIGIT(*p
)) /* skip to next digit */
1539 * skip to hex character (or NUL after the string)
1547 while (*p
!= NUL
&& !vim_isxdigit(*p
)) /* skip to next digit */
1554 * Variant of isdigit() that can handle characters > 0x100.
1555 * We don't use isdigit() here, because on some systems it also considers
1556 * superscript 1 to be a digit.
1557 * Use the VIM_ISDIGIT() macro for simple arguments.
1563 return (c
>= '0' && c
<= '9');
1567 * Variant of isxdigit() that can handle characters > 0x100.
1568 * We don't use isxdigit() here, because on some systems it also considers
1569 * superscript 1 to be a digit.
1575 return (c
>= '0' && c
<= '9')
1576 || (c
>= 'a' && c
<= 'f')
1577 || (c
>= 'A' && c
<= 'F');
1580 #if defined(FEAT_MBYTE) || defined(PROTO)
1582 * Vim's own character class functions. These exist because many library
1583 * islower()/toupper() etc. do not work properly: they crash when used with
1584 * invalid values or can't handle latin1 when the locale is C.
1585 * Speed is most important here.
1587 #define LATIN1LOWER 'l'
1588 #define LATIN1UPPER 'U'
1590 /* !"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\]%_'abcdefghijklmnopqrstuvwxyz{|}~ ¡¢£¤¥¦§¨©ª«¬®¯°±²³´µ¶·¸¹º»¼½¾¿ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ */
1591 static char_u latin1flags
[257] = " UUUUUUUUUUUUUUUUUUUUUUUUUU llllllllllllllllllllllllll UUUUUUUUUUUUUUUUUUUUUUU UUUUUUUllllllllllllllllllllllll llllllll";
1592 static char_u latin1upper
[257] = " !\"#$%&'()*+,-./0123456789:;<=>?@ABCDEFGHIJKLMNOPQRSTUVWXYZ[\\]^_`ABCDEFGHIJKLMNOPQRSTUVWXYZ{|}~\x7f€�‚ƒ„…†‡ˆ‰Š‹Œ�Ž��‘’“”•–—˜™š›œ�žŸ ¡¢£¤¥¦§¨©ª«¬®¯°±²³´µ¶·¸¹º»¼½¾¿ÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ×ØÙÚÛÜÝÞßÀÁÂÃÄÅÆÇÈÉÊËÌÍÎÏÐÑÒÓÔÕÖ÷ØÙÚÛÜÝÞÿ";
1593 static char_u latin1lower
[257] = " !\"#$%&'()*+,-./0123456789:;<=>?@abcdefghijklmnopqrstuvwxyz[\\]^_`abcdefghijklmnopqrstuvwxyz{|}~\x7f€�‚ƒ„…†‡ˆ‰Š‹Œ�Ž��‘’“”•–—˜™š›œ�žŸ ¡¢£¤¥¦§¨©ª«¬®¯°±²³´µ¶·¸¹º»¼½¾¿àáâãäåæçèéêëìíîïðñòóôõö×øùúûüýþßàáâãäåæçèéêëìíîïðñòóôõö÷øùúûüýþÿ";
1604 return utf_islower(c
);
1607 #ifdef HAVE_ISWLOWER
1611 /* islower() can't handle these chars and may crash */
1615 return (latin1flags
[c
] & LATIN1LOWER
) == LATIN1LOWER
;
1629 return utf_isupper(c
);
1632 #ifdef HAVE_ISWUPPER
1636 /* isupper() can't handle these chars and may crash */
1640 return (latin1flags
[c
] & LATIN1UPPER
) == LATIN1UPPER
;
1654 return utf_toupper(c
);
1657 #ifdef HAVE_TOWUPPER
1661 /* toupper() can't handle these chars and may crash */
1665 return latin1upper
[c
];
1667 return TOUPPER_LOC(c
);
1679 return utf_tolower(c
);
1682 #ifdef HAVE_TOWLOWER
1686 /* tolower() can't handle these chars and may crash */
1690 return latin1lower
[c
];
1692 return TOLOWER_LOC(c
);
1697 * skiptowhite: skip over text until ' ' or '\t' or NUL.
1703 while (*p
!= ' ' && *p
!= '\t' && *p
!= NUL
)
1708 #if defined(FEAT_LISTCMDS) || defined(FEAT_SIGNS) || defined(FEAT_SNIFF) \
1711 * skiptowhite_esc: Like skiptowhite(), but also skip escaped chars
1717 while (*p
!= ' ' && *p
!= '\t' && *p
!= NUL
)
1719 if ((*p
== '\\' || *p
== Ctrl_V
) && *(p
+ 1) != NUL
)
1728 * Getdigits: Get a number from a string and skip over it.
1729 * Note: the argument is a pointer to a char_u pointer!
1739 retval
= atol((char *)p
);
1740 if (*p
== '-') /* skip negative sign */
1742 p
= skipdigits(p
); /* skip to next non-digit */
1748 * Return TRUE if "lbuf" is empty or only contains blanks.
1751 vim_isblankline(lbuf
)
1756 p
= skipwhite(lbuf
);
1757 return (*p
== NUL
|| *p
== '\r' || *p
== '\n');
1761 * Convert a string into a long and/or unsigned long, taking care of
1762 * hexadecimal and octal numbers. Accepts a '-' sign.
1763 * If "hexp" is not NULL, returns a flag to indicate the type of the number:
1768 * If "len" is not NULL, the length of the number in characters is returned.
1769 * If "nptr" is not NULL, the signed result is returned in it.
1770 * If "unptr" is not NULL, the unsigned result is returned in it.
1771 * If "dooct" is non-zero recognize octal numbers, when > 1 always assume
1773 * If "dohex" is non-zero recognize hex numbers, when > 1 always assume
1777 vim_str2nr(start
, hexp
, len
, dooct
, dohex
, nptr
, unptr
)
1779 int *hexp
; /* return: type of number 0 = decimal, 'x'
1780 or 'X' is hex, '0' = octal */
1781 int *len
; /* return: detected length of number */
1782 int dooct
; /* recognize octal number */
1783 int dohex
; /* recognize hex number */
1784 long *nptr
; /* return: signed result */
1785 unsigned long *unptr
; /* return: unsigned result */
1787 char_u
*ptr
= start
;
1788 int hex
= 0; /* default is decimal */
1789 int negative
= FALSE
;
1790 unsigned long un
= 0;
1799 /* Recognize hex and octal. */
1800 if (ptr
[0] == '0' && ptr
[1] != '8' && ptr
[1] != '9')
1803 if (dohex
&& (hex
== 'X' || hex
== 'x') && vim_isxdigit(ptr
[2]))
1804 ptr
+= 2; /* hexadecimal */
1807 hex
= 0; /* default is decimal */
1810 /* Don't interpret "0", "08" or "0129" as octal. */
1811 for (n
= 1; VIM_ISDIGIT(ptr
[n
]); ++n
)
1815 hex
= 0; /* can't be octal */
1819 hex
= '0'; /* assume octal */
1826 * Do the string-to-numeric conversion "manually" to avoid sscanf quirks.
1828 if (hex
== '0' || dooct
> 1)
1831 while ('0' <= *ptr
&& *ptr
<= '7')
1833 un
= 8 * un
+ (unsigned long)(*ptr
- '0');
1837 else if (hex
!= 0 || dohex
> 1)
1840 while (vim_isxdigit(*ptr
))
1842 un
= 16 * un
+ (unsigned long)hex2nr(*ptr
);
1849 while (VIM_ISDIGIT(*ptr
))
1851 un
= 10 * un
+ (unsigned long)(*ptr
- '0');
1859 *len
= (int)(ptr
- start
);
1862 if (negative
) /* account for leading '-' for decimal numbers */
1872 * Return the value of a single hex character.
1873 * Only valid when the argument is '0' - '9', 'A' - 'F' or 'a' - 'f'.
1879 if (c
>= 'a' && c
<= 'f')
1880 return c
- 'a' + 10;
1881 if (c
>= 'A' && c
<= 'F')
1882 return c
- 'A' + 10;
1886 #if defined(FEAT_TERMRESPONSE) \
1887 || (defined(FEAT_GUI_GTK) && defined(FEAT_WINDOWS)) || defined(PROTO)
1889 * Convert two hex characters to a byte.
1890 * Return -1 if one of the characters is not hex.
1896 if (!vim_isxdigit(p
[0]) || !vim_isxdigit(p
[1]))
1898 return (hex2nr(p
[0]) << 4) + hex2nr(p
[1]);
1903 * Return TRUE if "str" starts with a backslash that should be removed.
1904 * For MS-DOS, WIN32 and OS/2 this is only done when the character after the
1905 * backslash is not a normal file name character.
1906 * '$' is a valid file name character, we don't remove the backslash before
1907 * it. This means it is not possible to use an environment variable after a
1908 * backslash. "C:\$VIM\doc" is taken literally, only "$VIM\doc" works.
1909 * Although "\ name" is valid, the backslash in "Program\ files" must be
1910 * removed. Assume a file name doesn't start with a space.
1911 * For multi-byte names, never remove a backslash before a non-ascii
1912 * character, assume that all multi-byte characters are valid file name
1919 #ifdef BACKSLASH_IN_FILENAME
1920 return (str
[0] == '\\'
1928 && !vim_isfilec(str
[1]))));
1930 return (str
[0] == '\\' && str
[1] != NUL
);
1935 * Halve the number of backslashes in a file name argument.
1936 * For MS-DOS we only do this if the character after the backslash
1937 * is not a normal file character.
1944 if (rem_backslash(p
))
1949 * backslash_halve() plus save the result in allocated memory.
1952 backslash_halve_save(p
)
1957 res
= vim_strsave(p
);
1960 backslash_halve(res
);
1964 #if (defined(EBCDIC) && defined(FEAT_POSTSCRIPT)) || defined(PROTO)
1966 * Table for EBCDIC to ASCII conversion unashamedly taken from xxd.c!
1967 * The first 64 entries have been added to map control characters defined in
1970 static char_u ebcdic2ascii_tab
[256] =
1972 0000, 0001, 0002, 0003, 0004, 0011, 0006, 0177,
1973 0010, 0011, 0012, 0013, 0014, 0015, 0016, 0017,
1974 0020, 0021, 0022, 0023, 0024, 0012, 0010, 0027,
1975 0030, 0031, 0032, 0033, 0033, 0035, 0036, 0037,
1976 0040, 0041, 0042, 0043, 0044, 0045, 0046, 0047,
1977 0050, 0051, 0052, 0053, 0054, 0055, 0056, 0057,
1978 0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,
1979 0070, 0071, 0072, 0073, 0074, 0075, 0076, 0077,
1980 0040, 0240, 0241, 0242, 0243, 0244, 0245, 0246,
1981 0247, 0250, 0325, 0056, 0074, 0050, 0053, 0174,
1982 0046, 0251, 0252, 0253, 0254, 0255, 0256, 0257,
1983 0260, 0261, 0041, 0044, 0052, 0051, 0073, 0176,
1984 0055, 0057, 0262, 0263, 0264, 0265, 0266, 0267,
1985 0270, 0271, 0313, 0054, 0045, 0137, 0076, 0077,
1986 0272, 0273, 0274, 0275, 0276, 0277, 0300, 0301,
1987 0302, 0140, 0072, 0043, 0100, 0047, 0075, 0042,
1988 0303, 0141, 0142, 0143, 0144, 0145, 0146, 0147,
1989 0150, 0151, 0304, 0305, 0306, 0307, 0310, 0311,
1990 0312, 0152, 0153, 0154, 0155, 0156, 0157, 0160,
1991 0161, 0162, 0136, 0314, 0315, 0316, 0317, 0320,
1992 0321, 0345, 0163, 0164, 0165, 0166, 0167, 0170,
1993 0171, 0172, 0322, 0323, 0324, 0133, 0326, 0327,
1994 0330, 0331, 0332, 0333, 0334, 0335, 0336, 0337,
1995 0340, 0341, 0342, 0343, 0344, 0135, 0346, 0347,
1996 0173, 0101, 0102, 0103, 0104, 0105, 0106, 0107,
1997 0110, 0111, 0350, 0351, 0352, 0353, 0354, 0355,
1998 0175, 0112, 0113, 0114, 0115, 0116, 0117, 0120,
1999 0121, 0122, 0356, 0357, 0360, 0361, 0362, 0363,
2000 0134, 0237, 0123, 0124, 0125, 0126, 0127, 0130,
2001 0131, 0132, 0364, 0365, 0366, 0367, 0370, 0371,
2002 0060, 0061, 0062, 0063, 0064, 0065, 0066, 0067,
2003 0070, 0071, 0372, 0373, 0374, 0375, 0376, 0377
2007 * Convert a buffer worth of characters from EBCDIC to ASCII. Only useful if
2008 * wanting 7-bit ASCII characters out the other end.
2011 ebcdic2ascii(buffer
, len
)
2017 for (i
= 0; i
< len
; i
++)
2018 buffer
[i
] = ebcdic2ascii_tab
[buffer
[i
]];