1 /***************************************************************************
3 * Open \______ \ ____ ____ | | _\_ |__ _______ ___
4 * Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
5 * Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
6 * Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
10 * Copyright (C) 2005 by Gadi Cohen
12 * Largely based on php_hebrev by Zeev Suraski <zeev@php.net>
13 * Heavily modified by Gadi Cohen aka Kinslayer <dragon@wastelands.net>
15 * All files in this archive are subject to the GNU General Public License.
16 * See the file COPYING in the source tree root for full license agreement.
18 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
19 * KIND, either express or implied.
21 ****************************************************************************/
27 #include "rbunicode.h"
29 #include "scroll_engine.h"
32 /* #define _HEB_BUFFER_LENGTH (MAX_PATH + LCD_WIDTH/2 + 3 + 2 + 2) * 2 */
/* Block types and text orientations.  The numeric values are deliberately
 * paired (ENG == LTR == 1, HEB == RTL == 0): the layout code compares a
 * block type directly against an orientation and flips a block type with
 * logical negation. */
#define _HEB_BLOCK_TYPE_ENG 1
#define _HEB_BLOCK_TYPE_HEB 0
#define _HEB_ORIENTATION_LTR 1
#define _HEB_ORIENTATION_RTL 0

/* 1 if code point c lies in (0x0589, 0x0700) or in [0xfb50, 0xfefc],
 * otherwise 0.  Every use of the argument is parenthesized so that an
 * expression argument such as `v & 0xffff` is compared as a whole.
 * The argument is still evaluated more than once: do not pass
 * expressions with side effects. */
#define ischar(c) ((((c) > 0x0589 && (c) < 0x0700) || \
                    ((c) >= 0xfb50 && (c) <= 0xfefc)) ? 1 : 0)

/* 1 if c is a space or a horizontal tab, otherwise 0.
 * Evaluates c up to twice. */
#define _isblank(c) ((((c) == ' ') || ((c) == '\t')) ? 1 : 0)

/* 1 if c is a line feed or a carriage return, otherwise 0.
 * Evaluates c up to twice. */
#define _isnewline(c) ((((c) == '\n') || ((c) == '\r')) ? 1 : 0)

/* Logical exclusive-or: 1 if exactly one of a and b is non-zero, else 0.
 * Each argument is normalized with `!` and evaluated exactly once. */
#define XOR(a,b) (!(a) != !(b))
/*
 * arab_lookup: map a 16-bit code unit to its entry in jointable.
 *
 * Three source ranges are packed back to back into the table:
 *   0x621..0x63a -> jointable[uchar - 0x621]
 *   0x640..0x64a -> jointable[uchar - 0x621 - 5]       (skips 0x63b..0x63f)
 *   0x671..0x6d5 -> jointable[uchar - 0x621 - 5 - 38]  (skips 0x64b..0x670)
 * 0x200D (zero-width joiner) is tested separately.
 *
 * NOTE(review): this listing is incomplete. The function's braces, the
 * statement guarded by the 0x200D test and the return for unmatched input
 * are not visible here, so the result for those two cases cannot be stated
 * from this view; confirm against the full file.
 */
44 static const arab_t
* arab_lookup(unsigned short uchar
)
46 if (uchar
>= 0x621 && uchar
<= 0x63a)
47 return &(jointable
[uchar
- 0x621]);
48 if (uchar
>= 0x640 && uchar
<= 0x64a)
49 return &(jointable
[uchar
- 0x621 - 5]);
50 if (uchar
>= 0x671 && uchar
<= 0x6d5)
51 return &(jointable
[uchar
- 0x621 - 5 - 38]);
52 if (uchar
== 0x200D) /* Support for the zero-width joiner */
/*
 * arabjoin: rewrite a buffer of 16-bit code units in place, replacing
 * characters known to arab_lookup() with one of the forms stored in their
 * table entry (isolated, initial, medial or final).
 *
 * stringprt - buffer to process; it is both the read and the write target,
 *             since the write cursor starts at the same address.
 * length    - the loop condition is `i <= length`, so length + 1 units are
 *             read.
 *
 * NOTE(review): presumably the extra iteration lets a trailing terminator
 * flush the pending `prev` glyph; confirm that callers always supply at
 * least length + 1 valid units.
 *
 * NOTE(review): this listing is incomplete. The declarations of `cur`,
 * `uchar` and `i`, the `case` labels of the switch, the `else` branches and
 * all closing braces are not visible, so the exact pairing of the
 * statements below should be confirmed against the full file.
 */
57 static void arabjoin(unsigned short * stringprt
, int length
)
59 bool connected
= false;
/* write cursor: starts on top of the read cursor (in-place rewrite) */
60 unsigned short * writeprt
= stringprt
;
/* table entry of the previous character, 0 when there is none pending */
62 const arab_t
* prev
= 0;
64 const arab_t
* ligature
= 0;
/* inclusive upper bound: the unit at index `length` is processed too */
68 for (i
= 0; i
<= length
; i
++) {
69 cur
= arab_lookup(uchar
= *stringprt
++);
71 /* Skip non-arabic chars */
74 /* Finish the last char */
76 *writeprt
++ = prev
->final
;
79 *writeprt
++ = prev
->isolated
;
88 /* nothing to do for arabic char if the previous was non-arabic */
94 /* if it's LAM, check for LAM+ALEPH ligatures */
/* 0xfedd is compared against the isolated form stored for `prev` */
95 if (prev
->isolated
== 0xfedd) {
/* selects one of four lamaleph entries; the case values are not visible */
96 switch (cur
->isolated
) {
98 ligature
= &(lamaleph
[0]);
101 ligature
= &(lamaleph
[1]);
104 ligature
= &(lamaleph
[2]);
107 ligature
= &(lamaleph
[3]);
111 if (ligature
) { /* replace the 2 glyphs by their ligature */
115 if (connected
) { /* previous char has something connected to it */
/* a zero `medial` / `final` field is treated as "form not available" */
116 if (prev
->medial
&& cur
->final
) /* Can we connect to it? */
117 *writeprt
++ = prev
->medial
;
119 *writeprt
++ = prev
->final
;
/* same availability test, this time for the initial form of `prev` */
123 if (prev
->initial
&& cur
->final
) { /* Can we connect to it? */
124 *writeprt
++ = prev
->initial
;
127 *writeprt
++ = prev
->isolated
;
134 unsigned short *bidi_l2v(const unsigned char *str
, int orientation
)
136 int length
= utf8length(str
);
137 static unsigned short utf16_buf
[SCROLL_LINE_SIZE
];
138 static unsigned short bidi_buf
[SCROLL_LINE_SIZE
];
139 unsigned short *heb_str
, *target
, *tmp
; /* *broken_str */
140 int block_start
, block_end
, block_type
, block_length
, i
;
143 int begin, end, char_count, orig_begin;
147 target
= tmp
= utf16_buf
;
149 str
= utf8decode(str
, target
++);
152 if (target
== utf16_buf
) /* empty string */
155 /* properly join any arabic chars */
156 arabjoin(utf16_buf
, length
);
158 block_start
=block_end
=block_length
=0;
164 target
= heb_str
+ length
;
170 block_type
= _HEB_BLOCK_TYPE_HEB
;
172 block_type
= _HEB_BLOCK_TYPE_ENG
;
175 while((XOR(ischar(*(tmp
+1)),block_type
)
176 || _isblank(*(tmp
+1)) || ispunct((int)*(tmp
+1))
178 && block_end
< length
-1) {
184 if (block_type
!= orientation
) {
185 while ((_isblank(*tmp
) || ispunct((int)*tmp
))
186 && *tmp
!='/' && *tmp
!='-' && block_end
>block_start
) {
192 for (i
=block_start
; i
<=block_end
; i
++) {
193 *target
= (block_type
== orientation
) ?
194 *(utf16_buf
+i
) : *(utf16_buf
+block_end
-i
+block_start
);
195 if (block_type
!=orientation
) {
207 target
+= orientation
? 1 : -1;
209 block_type
= !block_type
;
210 block_start
=block_end
+1;
211 } while(block_end
<length
-1);
215 #if 0 /* Is this code really necessary? */
216 broken_str
= utf16_buf
;
222 while ((!max_chars
|| char_count
<max_chars
) && begin
>0) {
225 if (begin
<=0 || _isnewline(heb_str
[begin
])) {
226 while(begin
>0 && _isnewline(heb_str
[begin
-1])) {
233 if (char_count
==max_chars
) { /* try to avoid breaking words */
234 int new_char_count
= char_count
;
235 int new_begin
= begin
;
237 while (new_char_count
>0) {
238 if (_isblank(heb_str
[new_begin
]) ||
239 _isnewline(heb_str
[new_begin
])) {
245 if (new_char_count
>0) {
246 char_count
=new_char_count
;
252 /* if (_isblank(heb_str[begin])) {
256 /* skip leading newlines */
257 while (begin
<=end
&& _isnewline(heb_str
[begin
])) {
262 for (i
=begin
; i
<=end
; i
++) {
263 *target
= heb_str
[i
];
267 for (i
=orig_begin
; i
<=end
&& _isnewline(heb_str
[i
]); i
++) {
268 *target
= heb_str
[i
];