2008-05-30 Vladimir Makarov <vmakarov@redhat.com>
[official-gcc.git] / gcc / ada / widechar.adb
blob861df1197398cebe89fb89815b00747f218f3ed3
1 ------------------------------------------------------------------------------
2 -- --
3 -- GNAT COMPILER COMPONENTS --
4 -- --
5 -- W I D E C H A R --
6 -- --
7 -- B o d y --
8 -- --
9 -- Copyright (C) 1992-2008, Free Software Foundation, Inc. --
10 -- --
11 -- GNAT is free software; you can redistribute it and/or modify it under --
12 -- terms of the GNU General Public License as published by the Free Soft- --
13 -- ware Foundation; either version 2, or (at your option) any later ver- --
14 -- sion. GNAT is distributed in the hope that it will be useful, but WITH- --
15 -- OUT ANY WARRANTY; without even the implied warranty of MERCHANTABILITY --
16 -- or FITNESS FOR A PARTICULAR PURPOSE. See the GNU General Public License --
17 -- for more details. You should have received a copy of the GNU General --
18 -- Public License distributed with GNAT; see file COPYING. If not, write --
19 -- to the Free Software Foundation, 51 Franklin Street, Fifth Floor, --
20 -- Boston, MA 02110-1301, USA. --
21 -- --
22 -- As a special exception, if other files instantiate generics from this --
23 -- unit, or you link this unit with other files to produce an executable, --
24 -- this unit does not by itself cause the resulting executable to be --
25 -- covered by the GNU General Public License. This exception does not --
26 -- however invalidate any other reasons why the executable file might be --
27 -- covered by the GNU Public License. --
28 -- --
29 -- GNAT was originally developed by the GNAT team at New York University. --
30 -- Extensive contributions were provided by Ada Core Technologies Inc. --
31 -- --
32 ------------------------------------------------------------------------------
34 -- Note: this package uses the generic subprograms in System.WCh_Cnv, which
35 -- completely encapsulate the set of wide character encoding methods, so no
36 -- modifications are required when adding new encoding methods.
38 with Opt; use Opt;
40 with System.WCh_Cnv; use System.WCh_Cnv;
41 with System.WCh_Con; use System.WCh_Con;
43 package body Widechar is
---------------------------
-- Is_Start_Of_Wide_Char --
---------------------------

--  Returns True if the character at S (P) begins a wide character sequence
--  under the encoding currently selected by Wide_Character_Encoding_Method.
--  The hex and upper-bit cases index S (P) directly; only the brackets case
--  looks beyond P, and it first checks that P + 2 does not exceed S'Last.

function Is_Start_Of_Wide_Char
  (S : Source_Buffer_Ptr;
   P : Source_Ptr) return Boolean
is
begin
   case Wide_Character_Encoding_Method is

      --  For Hex mode, just test for an ESC character. The ESC character
      --  cannot appear in any other context in a legal Ada program.

      when WCEM_Hex =>
         return S (P) = ASCII.ESC;

      --  For brackets, just test ["x where x is a hex character. This is
      --  a sufficient test, since this sequence cannot otherwise appear in
      --  a legal Ada program.

      when WCEM_Brackets =>
         return P <= S'Last - 2
           and then S (P) = '['
           and then S (P + 1) = '"'
           and then (S (P + 2) in '0' .. '9'
                       or else
                     S (P + 2) in 'a' .. 'f'
                       or else
                     S (P + 2) in 'A' .. 'F');

      --  All other encoding methods use the upper bit set in the first
      --  character to uniquely represent a wide character.

      when WCEM_Upper     |
           WCEM_Shift_JIS |
           WCEM_EUC       |
           WCEM_UTF8      =>
         return S (P) >= Character'Val (16#80#);
   end case;
end Is_Start_Of_Wide_Char;
-----------------
-- Length_Wide --
-----------------

--  Returns the value of WC_Longest_Sequence as a Nat

function Length_Wide return Nat is
   Longest : constant Nat := WC_Longest_Sequence;
begin
   return Longest;
end Length_Wide;
---------------
-- Scan_Wide --
---------------

--  Decodes one wide character sequence starting at S (P).
--
--  On success, C receives the character code, Err is set False, P is left
--  just past the last character consumed, and Wide_Char_Byte_Count is
--  increased by the number of characters consumed beyond the first.
--
--  If Constraint_Error is raised while decoding, C is set to zero, Err is
--  set True, P is moved back by one from wherever the scan stopped, and
--  Wide_Char_Byte_Count is left unchanged.

procedure Scan_Wide
  (S   : Source_Buffer_Ptr;
   P   : in out Source_Ptr;
   C   : out Char_Code;
   Err : out Boolean)
is
   P_Init : constant Source_Ptr := P;
   --  Value of P on entry, used to compute how many characters were read

   Chr : Character;
   --  First character of the sequence

   function In_Char return Character;
   --  Function to obtain characters of wide character escape sequence.
   --  Returns S (P) and advances P by one.

   -------------
   -- In_Char --
   -------------

   function In_Char return Character is
   begin
      P := P + 1;
      return S (P - 1);
   end In_Char;

   function WC_In is new Char_Sequence_To_UTF_32 (In_Char);

--  Start of processing for Scan_Wide

begin
   Chr := In_Char;

   --  Scan out the wide character. If the first character is a bracket,
   --  we allow brackets encoding regardless of the standard encoding
   --  method being used, but otherwise we use this standard method.

   if Chr = '[' then
      C := Char_Code (WC_In (Chr, WCEM_Brackets));
   else
      C := Char_Code (WC_In (Chr, Wide_Character_Encoding_Method));
   end if;

   Err := False;

   --  The first character is not counted, only the extra ones that make
   --  up the rest of the sequence.

   Wide_Char_Byte_Count := Wide_Char_Byte_Count + Nat (P - P_Init - 1);

exception
   when Constraint_Error =>
      C := Char_Code (0);
      P := P - 1;
      Err := True;
end Scan_Wide;
--------------
-- Set_Wide --
--------------

--  Stores the encoded form of C, using the method selected by
--  Wide_Character_Encoding_Method, into S. The first character goes to
--  S (P + 1) and on return P indexes the last character stored. No explicit
--  length check is made here, so the caller must supply enough room in S.

procedure Set_Wide
  (C : Char_Code;
   S : in out String;
   P : in out Natural)
is
   procedure Out_Char (C : Character);
   --  Procedure to store one character of wide character sequence.
   --  Advances P by one and then stores C at S (P).

   --------------
   -- Out_Char --
   --------------

   procedure Out_Char (C : Character) is
   begin
      P := P + 1;
      S (P) := C;
   end Out_Char;

   procedure WC_Out is new UTF_32_To_Char_Sequence (Out_Char);

--  Start of processing for Set_Wide

begin
   WC_Out (UTF_32_Code (C), Wide_Character_Encoding_Method);
end Set_Wide;
---------------
-- Skip_Wide --
---------------

--  Advances P past the wide character sequence that starts at S (P). The
--  decoded value is thrown away. Wide_Char_Byte_Count is increased by the
--  number of characters skipped beyond the first.

procedure Skip_Wide (S : String; P : in out Natural) is
   Start : constant Natural := P;
   --  Value of P on entry, used to work out how far the scan moved

   function Next_Char return Character;
   --  Returns S (P) and steps P on to the following position

   ---------------
   -- Next_Char --
   ---------------

   function Next_Char return Character is
   begin
      P := P + 1;
      return S (P - 1);
   end Next_Char;

   function Decode is new Char_Sequence_To_UTF_32 (Next_Char);

   Lead : Character;
   --  First character of the sequence being skipped

   Ignored : UTF_32_Code;
   pragma Warnings (Off, Ignored);
   --  Receives the decoded code, which is of no interest here

--  Start of processing for Skip_Wide

begin
   Lead    := Next_Char;
   Ignored := Decode (Lead, Wide_Character_Encoding_Method);

   Wide_Char_Byte_Count := Wide_Char_Byte_Count + Nat (P - Start - 1);
end Skip_Wide;
---------------
-- Skip_Wide --
---------------

--  Source buffer variant: advances P past the wide character sequence that
--  starts at S (P). The decoded value is thrown away. Wide_Char_Byte_Count
--  is increased by the number of characters skipped beyond the first.

procedure Skip_Wide (S : Source_Buffer_Ptr; P : in out Source_Ptr) is
   Start : constant Source_Ptr := P;
   --  Value of P on entry, used to work out how far the scan moved

   function Next_Char return Character;
   --  Returns S (P) and steps P on to the following position

   ---------------
   -- Next_Char --
   ---------------

   function Next_Char return Character is
   begin
      P := P + 1;
      return S (P - 1);
   end Next_Char;

   function Decode is new Char_Sequence_To_UTF_32 (Next_Char);

   Lead : Character;
   --  First character of the sequence being skipped

   Ignored : UTF_32_Code;
   pragma Warnings (Off, Ignored);
   --  Receives the decoded code, which is of no interest here

--  Start of processing for Skip_Wide

begin
   Lead    := Next_Char;
   Ignored := Decode (Lead, Wide_Character_Encoding_Method);

   Wide_Char_Byte_Count := Wide_Char_Byte_Count + Nat (P - Start - 1);
end Skip_Wide;
243 end Widechar;