1 /***************************************************************************
3 * Open \______ \ ____ ____ | | _\_ |__ _______ ___
4 * Source | _// _ \_/ ___\| |/ /| __ \ / _ \ \/ /
5 * Jukebox | | ( <_> ) \___| < | \_\ ( <_> > < <
6 * Firmware |____|_ /\____/ \___ >__|_ \|___ /\____/__/\_ \
10 * Copyright (C) 2005 by Gadi Cohen
12 * Largely based on php_hebrev by Zeev Suraski <zeev@php.net>
13 * Heavily modified by Gadi Cohen aka Kinslayer <dragon@wastelands.net>
15 * All files in this archive are subject to the GNU General Public License.
16 * See the file COPYING in the source tree root for full license agreement.
18 * This software is distributed on an "AS IS" basis, WITHOUT WARRANTY OF ANY
19 * KIND, either express or implied.
21 ****************************************************************************/
27 #include "rbunicode.h"
30 //#define _HEB_BUFFER_LENGTH (MAX_PATH + LCD_WIDTH/2 + 3 + 2 + 2) * 2
/*
 * Block types and display orientations.
 *
 * The numeric values are significant: a block type is compared directly
 * against an orientation (ENG == LTR == 1, HEB == RTL == 0) and is flipped
 * with the logical-not operator, so both pairs must stay 0/1.
 */
#define _HEB_BLOCK_TYPE_ENG 1
#define _HEB_BLOCK_TYPE_HEB 0
#define _HEB_ORIENTATION_LTR 1
#define _HEB_ORIENTATION_RTL 0

/*
 * Character classification helpers.
 *
 * Each macro yields exactly 1 or 0.  Arguments are fully parenthesized so
 * that an expression such as `x & 0xff` can be passed safely.  ischar(),
 * _isblank() and _isnewline() still evaluate their argument more than
 * once, so do not pass expressions with side effects to them.
 */

/* 1 if c lies in 0x058a..0x06ff or 0xfb50..0xfefc (the right-to-left
 * ranges this file handles: presumably Hebrew/Arabic and the Arabic
 * presentation forms), 0 otherwise. */
#define ischar(c) ((((c) > 0x0589) && ((c) < 0x0700)) || \
                   (((c) >= 0xfb50) && ((c) <= 0xfefc)))

/* 1 if c is a space or a horizontal tab, 0 otherwise. */
#define _isblank(c) (((c) == ' ') || ((c) == '\t'))

/* 1 if c is a line feed or a carriage return, 0 otherwise. */
#define _isnewline(c) (((c) == '\n') || ((c) == '\r'))

/* Logical exclusive-or: 1 if exactly one of a, b is non-zero, 0 otherwise.
 * Each argument is evaluated exactly once. */
#define XOR(a,b) (!(a) != !(b))
41 const arab_t
* arab_lookup(unsigned short uchar
)
43 if (uchar
>= 0x621 && uchar
<= 0x63a)
44 return &(jointable
[uchar
- 0x621]);
45 if (uchar
>= 0x640 && uchar
<= 0x64a)
46 return &(jointable
[uchar
- 0x621 - 5]);
47 if (uchar
>= 0x671 && uchar
<= 0x6d5)
48 return &(jointable
[uchar
- 0x621 - 5 - 38]);
49 if (uchar
== 0x200D) /* Support for the zero-width joiner */
54 void arabjoin(unsigned short * stringprt
, int length
){
56 bool connected
= false;
57 unsigned short * writeprt
= stringprt
;
59 const arab_t
* prev
= 0;
61 const arab_t
* ligature
= 0;
65 for (i
= 0; i
<= length
; i
++) {
66 cur
= arab_lookup(uchar
= *stringprt
++);
68 /* Skip non-arabic chars */
71 /* Finish the last char */
73 *writeprt
++ = prev
->final
;
76 *writeprt
++ = prev
->isolated
;
85 /* nothing to do for arabic char if the previous was non-arabic */
91 /* if it's LAM, check for LAM+ALEPH ligatures */
92 if (prev
->isolated
== 0xfedd) {
93 switch (cur
->isolated
) {
95 ligature
= &(lamaleph
[0]);
98 ligature
= &(lamaleph
[1]);
101 ligature
= &(lamaleph
[2]);
104 ligature
= &(lamaleph
[3]);
108 if (ligature
) { /* replace the 2 glyphs by their ligature */
112 if (connected
) { /* previous char has something connected to it */
113 if (prev
->medial
&& cur
->final
) /* Can we connect to it? */
114 *writeprt
++ = prev
->medial
;
116 *writeprt
++ = prev
->final
;
120 if (prev
->initial
&& cur
->final
) { /* Can we connect to it? */
121 *writeprt
++ = prev
->initial
;
124 *writeprt
++ = prev
->isolated
;
131 unsigned short *bidi_l2v(const unsigned char *str
, int orientation
)
133 int length
= utf8length(str
);
134 static unsigned short utf16_buf
[SCROLL_LINE_SIZE
];
135 static unsigned short bidi_buf
[SCROLL_LINE_SIZE
];
136 unsigned short *heb_str
, *target
, *tmp
; // *broken_str
137 int block_start
, block_end
, block_type
, block_length
, i
;
139 //int begin, end, char_count, orig_begin;
142 target
= tmp
= utf16_buf
;
144 str
= utf8decode(str
, target
++);
147 if (target
== utf16_buf
) /* empty string */
150 /* properly join any arabic chars */
151 arabjoin(utf16_buf
, length
);
153 block_start
=block_end
=block_length
=0;
159 target
= heb_str
+ length
;
165 block_type
= _HEB_BLOCK_TYPE_HEB
;
167 block_type
= _HEB_BLOCK_TYPE_ENG
;
170 while((XOR(ischar(*(tmp
+1)),block_type
)
171 || _isblank(*(tmp
+1)) || ispunct((int)*(tmp
+1))
173 && block_end
< length
-1) {
179 if (block_type
!= orientation
) {
180 while ((_isblank(*tmp
) || ispunct((int)*tmp
))
181 && *tmp
!='/' && *tmp
!='-' && block_end
>block_start
) {
187 for (i
=block_start
; i
<=block_end
; i
++) {
188 *target
= (block_type
== orientation
) ? *(utf16_buf
+i
) : *(utf16_buf
+block_end
-i
+block_start
);
189 if (block_type
!=orientation
) {
201 target
+= orientation
? 1 : -1;
203 block_type
= !block_type
;
204 block_start
=block_end
+1;
205 } while(block_end
<length
-1);
209 #if 0 /* Is this code really necessary? */
210 broken_str
= utf16_buf
;
216 while ((!max_chars
|| char_count
<max_chars
) && begin
>0) {
219 if (begin
<=0 || _isnewline(heb_str
[begin
])) {
220 while(begin
>0 && _isnewline(heb_str
[begin
-1])) {
227 if (char_count
==max_chars
) { /* try to avoid breaking words */
228 int new_char_count
= char_count
;
229 int new_begin
= begin
;
231 while (new_char_count
>0) {
232 if (_isblank(heb_str
[new_begin
]) ||
233 _isnewline(heb_str
[new_begin
])) {
239 if (new_char_count
>0) {
240 char_count
=new_char_count
;
246 /* if (_isblank(heb_str[begin])) {
250 /* skip leading newlines */
251 while (begin
<=end
&& _isnewline(heb_str
[begin
])) {
256 for (i
=begin
; i
<=end
; i
++) {
257 *target
= heb_str
[i
];
261 for (i
=orig_begin
; i
<=end
&& _isnewline(heb_str
[i
]); i
++) {
262 *target
= heb_str
[i
];