1 /***************************************************************************
3 * Open \______ \ ____ ____ | | _\_ |__ _______ ___
4 * Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
5 * Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
6 * Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
10 * Copyright (C) 2005 by Gadi Cohen
12 * Largely based on php_hebrev by Zeev Suraski <zeev@php.net>
13 * Heavily modified by Gadi Cohen aka Kinslayer <dragon@wastelands.net>
15 * All files in this archive are subject to the GNU General Public License.
16 * See the file COPYING in the source tree root for full license agreement.
18 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
19 * KIND, either express or implied.
21 ****************************************************************************/
27 #include "rbunicode.h"
29 #include "scroll_engine.h"
31 /* #define _HEB_BUFFER_LENGTH (MAX_PATH + LCD_WIDTH/2 + 3 + 2 + 2) * 2 */
/*
 * Block-type and orientation codes.
 *
 * These must stay 0 and 1: the layout code below compares a block type
 * directly against an orientation value and flips the block type with `!`.
 */
#define _HEB_BLOCK_TYPE_ENG 1
#define _HEB_BLOCK_TYPE_HEB 0
#define _HEB_ORIENTATION_LTR 1
#define _HEB_ORIENTATION_RTL 0

/*
 * Character-class helpers. Each one evaluates to the int 1 or 0.
 *
 * Every parameter use is parenthesised so that an argument containing a
 * low-precedence operator (e.g. `?:` or `|`) is classified as a whole.
 * The argument is still evaluated more than once, so do not pass an
 * expression with side effects.
 */

/* 1 if c lies in the open range (0x0589, 0x0700) or in [0xfb50, 0xfefc]. */
#define ischar(c) ((((c) > 0x0589) && ((c) < 0x0700)) || \
                   (((c) >= 0xfb50) && ((c) <= 0xfefc)))

/* 1 if c is a space or a horizontal tab. */
#define _isblank(c) (((c) == ' ') || ((c) == '\t'))

/* 1 if c is a line feed or a carriage return. */
#define _isnewline(c) (((c) == '\n') || ((c) == '\r'))

/* Logical exclusive-or: 1 if exactly one of a, b is non-zero. */
#define XOR(a,b) (((a) || (b)) && !((a) && (b)))
/*
 * Map a 16-bit code unit to its entry in `jointable`.
 *
 * The table is packed: the three accepted ranges are stored back to back,
 * so the index is the offset from 0x621 minus the size of every gap that
 * has been skipped so far.
 *
 *   0x621..0x63a -> index uchar - 0x621            (entries 0..25)
 *   0x640..0x64a -> index uchar - 0x621 - 5        (skips 0x63b..0x63f)
 *   0x671..0x6d5 -> index uchar - 0x621 - 5 - 38   (skips 0x64b..0x670)
 *
 * 0x200D (zero-width joiner) is tested separately.
 *
 * NOTE(review): this listing is missing lines (the opening brace, the
 * zero-width-joiner result and the fall-through return are not shown), so
 * what is returned for the joiner and for unrecognised input cannot be
 * stated from here - confirm against the complete file.
 */
43 const arab_t
* arab_lookup(unsigned short uchar
)
/* first range: index is the plain offset from 0x621 */
45 if (uchar
>= 0x621 && uchar
<= 0x63a)
46 return &(jointable
[uchar
- 0x621]);
/* second range: subtract the 5 code points 0x63b..0x63f that have no entry */
47 if (uchar
>= 0x640 && uchar
<= 0x64a)
48 return &(jointable
[uchar
- 0x621 - 5]);
/* third range: additionally subtract the 38 code points 0x64b..0x670 */
49 if (uchar
>= 0x671 && uchar
<= 0x6d5)
50 return &(jointable
[uchar
- 0x621 - 5 - 38]);
51 if (uchar
== 0x200D) /* Support for the zero-width joiner */
/*
 * Rewrite a buffer of 16-bit code units in place, replacing each character
 * that arab_lookup() recognises with one of the forms stored in its table
 * entry (isolated, initial, medial or final).
 *
 * stringprt  buffer to process; it is both read and overwritten, because
 *            the write cursor starts at the same address as the read cursor
 * length     loop bound; the loop runs for i = 0 .. length inclusive, so
 *            length + 1 code units are read from the buffer
 *
 * The form of a character can only be chosen once the following character
 * is known, so output always refers to `prev`, the entry of the character
 * read before the current one.
 *
 * NOTE(review): this listing is missing lines (declarations of i / cur /
 * uchar, the `case` labels, `else` keywords and closing braces are not
 * shown). The comments below describe only the statements that are visible.
 */
56 void arabjoin(unsigned short * stringprt
, int length
){
58 bool connected
= false;
/* output cursor starts on top of the input: the rewrite is in place */
59 unsigned short * writeprt
= stringprt
;
61 const arab_t
* prev
= 0;
63 const arab_t
* ligature
= 0;
/*
 * Inclusive upper bound: one code unit past `length` is read as well.
 * NOTE(review): presumably this is the terminator, processed so that the
 * pending `prev` is flushed - confirm the caller's buffer holds length + 1
 * units.
 */
67 for (i
= 0; i
<= length
; i
++) {
68 cur
= arab_lookup(uchar
= *stringprt
++);
70 /* Skip non-arabic chars */
73 /* Finish the last char */
75 *writeprt
++ = prev
->final
;
78 *writeprt
++ = prev
->isolated
;
87 /* nothing to do for arabic char if the previous was non-arabic */
93 /* if it's LAM, check for LAM+ALEPH ligatures */
/* 0xfedd is compared against the isolated form stored for `prev` */
94 if (prev
->isolated
== 0xfedd) {
/* the current character's isolated form picks one of four lamaleph[] entries */
95 switch (cur
->isolated
) {
97 ligature
= &(lamaleph
[0]);
100 ligature
= &(lamaleph
[1]);
103 ligature
= &(lamaleph
[2]);
106 ligature
= &(lamaleph
[3]);
110 if (ligature
) { /* replace the 2 glyphs by their ligature */
/*
 * Form selection for `prev`. A join to the current character needs `prev`
 * to have the joining form (medial / initial) and `cur` to have a final
 * form; the visible writes are medial or final when `connected` is set,
 * and initial or isolated otherwise.
 */
114 if (connected
) { /* previous char has something connected to it */
115 if (prev
->medial
&& cur
->final
) /* Can we connect to it? */
116 *writeprt
++ = prev
->medial
;
118 *writeprt
++ = prev
->final
;
122 if (prev
->initial
&& cur
->final
) { /* Can we connect to it? */
123 *writeprt
++ = prev
->initial
;
126 *writeprt
++ = prev
->isolated
;
133 unsigned short *bidi_l2v(const unsigned char *str
, int orientation
)
135 int length
= utf8length(str
);
136 static unsigned short utf16_buf
[SCROLL_LINE_SIZE
];
137 static unsigned short bidi_buf
[SCROLL_LINE_SIZE
];
138 unsigned short *heb_str
, *target
, *tmp
; /* *broken_str */
139 int block_start
, block_end
, block_type
, block_length
, i
;
142 int begin, end, char_count, orig_begin;
146 target
= tmp
= utf16_buf
;
148 str
= utf8decode(str
, target
++);
151 if (target
== utf16_buf
) /* empty string */
154 /* properly join any arabic chars */
155 arabjoin(utf16_buf
, length
);
157 block_start
=block_end
=block_length
=0;
163 target
= heb_str
+ length
;
169 block_type
= _HEB_BLOCK_TYPE_HEB
;
171 block_type
= _HEB_BLOCK_TYPE_ENG
;
174 while((XOR(ischar(*(tmp
+1)),block_type
)
175 || _isblank(*(tmp
+1)) || ispunct((int)*(tmp
+1))
177 && block_end
< length
-1) {
183 if (block_type
!= orientation
) {
184 while ((_isblank(*tmp
) || ispunct((int)*tmp
))
185 && *tmp
!='/' && *tmp
!='-' && block_end
>block_start
) {
191 for (i
=block_start
; i
<=block_end
; i
++) {
192 *target
= (block_type
== orientation
) ?
193 *(utf16_buf
+i
) : *(utf16_buf
+block_end
-i
+block_start
);
194 if (block_type
!=orientation
) {
206 target
+= orientation
? 1 : -1;
208 block_type
= !block_type
;
209 block_start
=block_end
+1;
210 } while(block_end
<length
-1);
214 #if 0 /* Is this code really necessary? */
215 broken_str
= utf16_buf
;
221 while ((!max_chars
|| char_count
<max_chars
) && begin
>0) {
224 if (begin
<=0 || _isnewline(heb_str
[begin
])) {
225 while(begin
>0 && _isnewline(heb_str
[begin
-1])) {
232 if (char_count
==max_chars
) { /* try to avoid breaking words */
233 int new_char_count
= char_count
;
234 int new_begin
= begin
;
236 while (new_char_count
>0) {
237 if (_isblank(heb_str
[new_begin
]) ||
238 _isnewline(heb_str
[new_begin
])) {
244 if (new_char_count
>0) {
245 char_count
=new_char_count
;
251 /* if (_isblank(heb_str[begin])) {
255 /* skip leading newlines */
256 while (begin
<=end
&& _isnewline(heb_str
[begin
])) {
261 for (i
=begin
; i
<=end
; i
++) {
262 *target
= heb_str
[i
];
266 for (i
=orig_begin
; i
<=end
&& _isnewline(heb_str
[i
]); i
++) {
267 *target
= heb_str
[i
];