2 * CP57002.cs - ISCII code pages 57002-57011.
4 * Atsushi Enomoto <atsushi@ximian.com> (C) 2005 Novell, Inc.
8 * Copyright (c) 2002 Southern Storm Software, Pty Ltd
10 * Permission is hereby granted, free of charge, to any person obtaining
11 * a copy of this software and associated documentation files (the "Software"),
12 * to deal in the Software without restriction, including without limitation
13 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
14 * and/or sell copies of the Software, and to permit persons to whom the
15 * Software is furnished to do so, subject to the following conditions:
17 * The above copyright notice and this permission notice shall be included
18 * in all copies or substantial portions of the Software.
20 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS
21 * OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
22 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
23 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR
24 * OTHER LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE,
25 * ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
26 * OTHER DEALINGS IN THE SOFTWARE.
36 // This class provides an abstract base for the ISCII encodings,
37 // which all have a similar pattern. Code points 0x00-0x7F are
38 // the standard ASCII character set, and code points 0x80-0xFF
39 // are a shifted version of the Unicode character set, starting
// at the "shift" offset that each subclass passes to the constructor.
43 public abstract class ISCIIEncoding
: MonoEncoding
// Constructor used by the concrete code-page subclasses.
// Stores the human-readable encoding name and the web name in the
// corresponding fields of this instance.
// NOTE(review): what happens to "codePage" and "shift" is not visible in
// this excerpt. Other members read a "shift" field, so it is presumably
// stored here and "codePage" forwarded to the base class - confirm.
51 protected ISCIIEncoding(int codePage
, int shift
,
52 String encodingName
, String webName
)
56 this.encodingName
= encodingName
;
57 this.webName
= webName
;
60 // Get the number of bytes needed to encode a character buffer.
// Parameters: "chars" is the source array, "index" the first character
// to consider and "count" the number of characters.
// Throws ArgumentNullException("chars"), and ArgumentOutOfRangeException
// when "index" is outside 0..chars.Length or "count" is outside
// 0..(chars.Length - index). Note that index == chars.Length is accepted.
// NOTE(review): the condition guarding the null throw and the value
// returned are not visible in this excerpt - confirm against the full file.
61 public override int GetByteCount(char[] chars
, int index
, int count
)
65 throw new ArgumentNullException("chars");
67 if(index
< 0 || index
> chars
.Length
)
69 throw new ArgumentOutOfRangeException
70 ("index", Strings
.GetString("ArgRange_Array"));
72 if(count
< 0 || count
> (chars
.Length
- index
))
74 throw new ArgumentOutOfRangeException
75 ("count", Strings
.GetString("ArgRange_Array"));
80 // Convenience wrappers for "GetByteCount".
// String overload: throws ArgumentNullException naming the parameter "s".
// NOTE(review): the null test and the returned value are not visible in
// this excerpt - confirm against the full file.
81 public override int GetByteCount(String s
)
85 throw new ArgumentNullException("s");
// Pointer-based byte counter: takes a pointer to the characters and the
// number of characters to examine.
// Each character "ch" is classified into one of three recognised ranges:
//   ch < 0x0080             - plain ASCII
//   first <= ch <= last     - the 128-character window starting at "shift"
//   U+FF01 <= ch <= U+FF5E  - full-width ASCII forms
// Characters outside these ranges have no fallback handling yet (see FIXME).
// NOTE(review): the loop, the statements inside each branch and the return
// statement are not visible in this excerpt - confirm against the full file.
90 public unsafe override int GetByteCountImpl (char* chars
, int count
)
// "first" and "last" bound the Unicode window that this code page covers.
96 char first
= (char)shift
;
97 char last
= (char)(shift
+ 0x7F);
101 if(ch
< (char)0x0080)
103 // Regular ASCII subset.
106 else if(ch
>= first
&& ch
<= last
)
108 // ISCII range that we need to shift.
111 else if(ch
>= '\uFF01' && ch
<= '\uFF5E')
113 // ASCII full-width characters.
118 // FIXME: implement fallback support for GetByteCountImpl().
124 // Return the final length of the output.
// Pointer-based encoder: converts "charCount" characters read from "chars"
// into bytes stored through "bytes", and returns posn - byteIndex, i.e. the
// number of bytes written.
// Visible mapping (each branch stores one byte via bytes[posn++]):
//   ch < 0x0080             -> (byte)ch
//   first <= ch <= last     -> ch - first + 0x80, where first = (char)shift
//   U+FF01 <= ch <= U+FF5E  -> ch - 0xFEE0
//   anything else           -> HandleFallback(...) and/or the byte '?'
// Throws ArgumentNullException for "chars" and for "bytes".
// NOTE(review): the declarations of "ch", "charIndex" and "byteIndex", the
// conditions guarding the two throws, and whatever selects between the
// HandleFallback call and the '?' byte are not visible in this excerpt
// (possibly conditional compilation) - confirm against the full file.
131 public unsafe override int GetBytesImpl (char* chars
, int charCount
, byte* bytes
, int byteCount
)
// Passed by reference to HandleFallback below.
134 EncoderFallbackBuffer buffer
= null;
141 throw new ArgumentNullException("chars");
145 throw new ArgumentNullException("bytes");
148 // Convert the characters into bytes.
150 int posn
= byteIndex
;
// "first" and "last" bound the Unicode window that this code page covers.
151 char first
= (char)shift
;
152 char last
= (char)(shift
+ 0x7F);
153 while(charCount
-- > 0)
155 ch
= chars
[charIndex
++];
156 if(ch
< (char)0x0080)
158 // Regular ASCII subset.
159 bytes
[posn
++] = (byte)ch
;
161 else if(ch
>= first
&& ch
<= last
)
163 // ISCII range that we need to shift.
// "first" maps to byte 0x80 and "last" to byte 0xFF.
164 bytes
[posn
++] = (byte)(ch
- first
+ 0x80);
166 else if(ch
>= '\uFF01' && ch
<= '\uFF5E')
168 // ASCII full-width characters.
// 0xFF01 - 0xFEE0 = 0x21 and 0xFF5E - 0xFEE0 = 0x7E, the plain ASCII forms.
169 bytes
[posn
++] = (byte)(ch
- 0xFEE0);
174 HandleFallback (ref buffer
, chars
, ref charIndex
, ref charCount
, bytes
, ref posn
, ref byteCount
);
177 bytes
[posn
++] = (byte)'?';
183 // Return the final length of the output.
184 return posn
- byteIndex
;
188 // Convenience wrappers for "GetBytes".
// String overload: encodes "charCount" characters of "s" starting at
// "charIndex" into "bytes" starting at "byteIndex", and returns
// posn - byteIndex, i.e. the number of bytes written.
// Throws ArgumentNullException for "s" and "bytes",
// ArgumentOutOfRangeException when charIndex, charCount or byteIndex are
// outside their buffers, and ArgumentException when fewer than "charCount"
// bytes remain after "byteIndex".
// Every visible branch stores one byte per character; unmapped characters
// become '?'.
// NOTE(review): the null tests, the parameter-name arguments of the range
// exceptions and the statement that loads "ch" from "s" are not visible in
// this excerpt - confirm against the full file.
189 public override int GetBytes(String s, int charIndex, int charCount,
190 byte[] bytes, int byteIndex)
192 // Validate the parameters.
195 throw new ArgumentNullException("s");
199 throw new ArgumentNullException("bytes");
201 if(charIndex < 0 || charIndex > s.Length)
203 throw new ArgumentOutOfRangeException
205 Strings.GetString("ArgRange_StringIndex"));
207 if(charCount < 0 || charCount > (s.Length - charIndex))
209 throw new ArgumentOutOfRangeException
211 Strings.GetString("ArgRange_StringRange"));
213 if(byteIndex < 0 || byteIndex > bytes.Length)
215 throw new ArgumentOutOfRangeException
217 Strings.GetString("ArgRange_Array"));
219 if((bytes.Length - byteIndex) < charCount)
221 throw new ArgumentException
222 (Strings.GetString("Arg_InsufficientSpace"), "bytes");
225 // Convert the characters into bytes.
227 int posn = byteIndex;
// "first" and "last" bound the Unicode window that this code page covers.
228 char first = (char)shift;
229 char last = (char)(shift + 0x7F);
230 while(charCount-- > 0)
233 if(ch < (char)0x0080)
235 // Regular ASCII subset.
236 bytes[posn++] = (byte)ch;
238 else if(ch >= first && ch <= last)
240 // ISCII range that we need to shift.
241 bytes[posn++] = (byte)(ch - first + 0x80);
243 else if(ch >= '\uFF01' && ch <= '\uFF5E')
245 // ASCII full-width characters.
// Subtracting 0xFEE0 yields 0x21-0x7E, the plain ASCII forms.
246 bytes[posn++] = (byte)(ch - 0xFEE0);
250 bytes[posn++] = (byte)'?';
254 // Return the final length of the output.
255 return posn - byteIndex;
259 // Get the number of characters needed to decode a byte buffer.
// Parameters: "bytes" is the source array, "index" the first byte to
// consider and "count" the number of bytes.
// Throws ArgumentNullException("bytes"), and ArgumentOutOfRangeException
// when "index" is outside 0..bytes.Length or "count" is outside
// 0..(bytes.Length - index).
// NOTE(review): the condition guarding the null throw and the value
// returned are not visible in this excerpt - confirm against the full file.
260 public override int GetCharCount(byte[] bytes
, int index
, int count
)
264 throw new ArgumentNullException("bytes");
266 if(index
< 0 || index
> bytes
.Length
)
268 throw new ArgumentOutOfRangeException
269 ("index", Strings
.GetString("ArgRange_Array"));
271 if(count
< 0 || count
> (bytes
.Length
- index
))
273 throw new ArgumentOutOfRangeException
274 ("count", Strings
.GetString("ArgRange_Array"));
279 // Get the characters that result from decoding a byte buffer.
// Decodes "byteCount" bytes of "bytes" starting at "byteIndex" into "chars"
// starting at "charIndex"; every byte read stores one character.
// Throws ArgumentNullException for "bytes" and "chars",
// ArgumentOutOfRangeException when byteIndex, byteCount or charIndex are
// outside their buffers, and ArgumentException when fewer than "byteCount"
// slots remain in "chars" after "charIndex".
// NOTE(review): the null tests, the loop header, the condition that chooses
// between the ASCII and ISCII branches, and the return statement are not
// visible in this excerpt - confirm against the full file.
280 public override int GetChars(byte[] bytes
, int byteIndex
, int byteCount
,
281 char[] chars
, int charIndex
)
283 // Validate the parameters.
286 throw new ArgumentNullException("bytes");
290 throw new ArgumentNullException("chars");
292 if(byteIndex
< 0 || byteIndex
> bytes
.Length
)
294 throw new ArgumentOutOfRangeException
295 ("byteIndex", Strings
.GetString("ArgRange_Array"));
297 if(byteCount
< 0 || byteCount
> (bytes
.Length
- byteIndex
))
299 throw new ArgumentOutOfRangeException
300 ("byteCount", Strings
.GetString("ArgRange_Array"));
302 if(charIndex
< 0 || charIndex
> chars
.Length
)
304 throw new ArgumentOutOfRangeException
305 ("charIndex", Strings
.GetString("ArgRange_Array"));
307 if((chars
.Length
- charIndex
) < byteCount
)
309 throw new ArgumentException
310 (Strings
.GetString("Arg_InsufficientSpace"), "chars");
313 // Convert the bytes into characters.
314 int count
= byteCount
;
// This local hides the field of the same name. Subtracting 0x80 up front
// means that adding it to a byte value of 0x80 yields exactly this.shift.
316 int shift
= this.shift
- 0x80;
319 byteval
= (int)(bytes
[byteIndex
++]);
322 // Ordinary ASCII character.
323 chars
[charIndex
++] = (char)byteval
;
327 // Shift the ISCII character into the Unicode page.
328 chars
[charIndex
++] = (char)(byteval
+ shift
);
334 // Get the maximum number of bytes needed to encode a
335 // specified number of characters.
// Throws ArgumentOutOfRangeException with the "ArgRange_NonNegative"
// message.
// NOTE(review): the guarding condition (presumably charCount < 0), the
// parameter-name argument and the returned value are not visible in this
// excerpt - confirm against the full file.
336 public override int GetMaxByteCount(int charCount
)
340 throw new ArgumentOutOfRangeException
342 Strings
.GetString("ArgRange_NonNegative"));
347 // Get the maximum number of characters needed to decode a
348 // specified number of bytes.
// Throws ArgumentOutOfRangeException with the "ArgRange_NonNegative"
// message.
// NOTE(review): the guarding condition (presumably byteCount < 0), the
// parameter-name argument and the returned value are not visible in this
// excerpt - confirm against the full file.
349 public override int GetMaxCharCount(int byteCount
)
353 throw new ArgumentOutOfRangeException
355 Strings
.GetString("ArgRange_NonNegative"));
362 // Get the mail body name for this encoding.
// NOTE(review): the accessor body is not visible in this excerpt; it
// presumably returns the web name stored by the constructor - confirm.
363 public override String BodyName
371 // Get the human-readable name for this encoding.
// NOTE(review): the accessor body is not visible in this excerpt; it
// presumably returns the encoding name stored by the constructor - confirm.
372 public override String EncodingName
380 // Get the mail agent header name for this encoding.
// NOTE(review): the accessor body is not visible in this excerpt; it
// presumably returns the web name stored by the constructor - confirm.
381 public override String HeaderName
389 // Get the IANA-preferred Web name for this encoding.
// NOTE(review): the accessor body is not visible in this excerpt; it
// presumably returns the web name stored by the constructor - confirm.
390 public override String WebName
398 #endif // !ECMA_COMPAT
400 }; // class ISCIIEncoding
402 // Define the ISCII code pages as subclasses of "ISCIIEncoding".
// Code page 57002: ISCII Devanagari, web name "x-iscii-de".
// Passes 0x0900 (start of the Unicode Devanagari block) as the shift.
public class CP57002 : ISCIIEncoding
{
    public CP57002()
        : base(57002, 0x0900, "ISCII Devanagari", "x-iscii-de")
    {
    }
}; // class CP57002
// Code page 57003: ISCII Bengali, web name "x-iscii-be".
// Passes 0x0980 (start of the Unicode Bengali block) as the shift.
public class CP57003 : ISCIIEncoding
{
    public CP57003()
        : base(57003, 0x0980, "ISCII Bengali", "x-iscii-be")
    {
    }
}; // class CP57003
// Code page 57004: ISCII Tamil, web name "x-iscii-ta".
// Passes 0x0B80 (start of the Unicode Tamil block) as the shift.
public class CP57004 : ISCIIEncoding
{
    public CP57004()
        : base(57004, 0x0B80, "ISCII Tamil", "x-iscii-ta")
    {
    }
}; // class CP57004
// Code page 57005: ISCII Telugu, web name "x-iscii-te".
// The shift must be 0x0C00, the start of the Unicode Telugu block
// (U+0C00-U+0C7F). It must not be 0x0B80: that is the Tamil block used by
// CP57004, and sharing it would make Telugu text encode and decode as
// Tamil code points.
public class CP57005 : ISCIIEncoding
{
    public CP57005() : base(57005, 0x0C00, "ISCII Telugu", "x-iscii-te") {}
}; // class CP57005
// Code page 57006: ISCII Assamese, web name "x-iscii-as".
// Note: Unicode has no separate "Assamese" page. Assamese is written in
// the Bengali script and Unicode encodes it in the Bengali block
// (U+0980-U+09FF, which includes the Assamese-specific letters U+09F0 and
// U+09F1), so the shift is 0x0980. The Sinhala block (0x0D80) belongs to
// an unrelated script and must not be used here.
public class CP57006 : ISCIIEncoding
{
    public CP57006() : base(57006, 0x0980, "ISCII Assamese", "x-iscii-as") {}
}; // class CP57006
// Code page 57007: ISCII Oriya, web name "x-iscii-or".
// Passes 0x0B00 (start of the Unicode Oriya block) as the shift.
public class CP57007 : ISCIIEncoding
{
    public CP57007()
        : base(57007, 0x0B00, "ISCII Oriya", "x-iscii-or")
    {
    }
}; // class CP57007
// Code page 57008: ISCII Kannada, web name "x-iscii-ka".
// Passes 0x0C80 (start of the Unicode Kannada block) as the shift.
public class CP57008 : ISCIIEncoding
{
    public CP57008()
        : base(57008, 0x0C80, "ISCII Kannada", "x-iscii-ka")
    {
    }
}; // class CP57008
// Code page 57009: ISCII Malayalam, web name "x-iscii-ma".
// Passes 0x0D00 (start of the Unicode Malayalam block) as the shift.
public class CP57009 : ISCIIEncoding
{
    public CP57009()
        : base(57009, 0x0D00, "ISCII Malayalam", "x-iscii-ma")
    {
    }
}; // class CP57009
// Code page 57010: ISCII Gujarati, web name "x-iscii-gu".
// Passes 0x0A80 (start of the Unicode Gujarati block) as the shift.
public class CP57010 : ISCIIEncoding
{
    public CP57010()
        : base(57010, 0x0A80, "ISCII Gujarati", "x-iscii-gu")
    {
    }
}; // class CP57010
// Code page 57011: ISCII Punjabi, web name "x-iscii-pa".
// Passes 0x0A00 (start of the Unicode Gurmukhi block) as the shift.
public class CP57011 : ISCIIEncoding
{
    // Note: Unicode names this page "Gurmukhi" and has no page called
    // "Punjabi". Other ISCII-related information on the Internet suggests
    // the two names refer to the same thing, so they are treated as
    // identical here until shown otherwise
    // - Rhys Weatherley, 16 April 2002.
    public CP57011()
        : base(57011, 0x0A00, "ISCII Punjabi", "x-iscii-pa")
    {
    }
}; // class CP57011
482 // Define the web encoding name aliases for the above code pages.
// Web-name alias for "x-iscii-de"; adds nothing to CP57002.
public class ENCx_iscii_de : CP57002
{
    public ENCx_iscii_de()
    {
        // The parameterless CP57002 constructor runs implicitly.
    }
}; // class ENCx_iscii_de
// Web-name alias for "x-iscii-be"; adds nothing to CP57003.
public class ENCx_iscii_be : CP57003
{
    public ENCx_iscii_be()
    {
        // The parameterless CP57003 constructor runs implicitly.
    }
}; // class ENCx_iscii_be
// Web-name alias for "x-iscii-ta"; adds nothing to CP57004.
public class ENCx_iscii_ta : CP57004
{
    public ENCx_iscii_ta()
    {
        // The parameterless CP57004 constructor runs implicitly.
    }
}; // class ENCx_iscii_ta
// Web-name alias for "x-iscii-te"; adds nothing to CP57005.
public class ENCx_iscii_te : CP57005
{
    public ENCx_iscii_te()
    {
        // The parameterless CP57005 constructor runs implicitly.
    }
}; // class ENCx_iscii_te
// Web-name alias for "x-iscii-as"; adds nothing to CP57006.
public class ENCx_iscii_as : CP57006
{
    public ENCx_iscii_as()
    {
        // The parameterless CP57006 constructor runs implicitly.
    }
}; // class ENCx_iscii_as
// Web-name alias for "x-iscii-or"; adds nothing to CP57007.
public class ENCx_iscii_or : CP57007
{
    public ENCx_iscii_or()
    {
        // The parameterless CP57007 constructor runs implicitly.
    }
}; // class ENCx_iscii_or
// Web-name alias for "x-iscii-ka"; adds nothing to CP57008.
public class ENCx_iscii_ka : CP57008
{
    public ENCx_iscii_ka()
    {
        // The parameterless CP57008 constructor runs implicitly.
    }
}; // class ENCx_iscii_ka
// Web-name alias for "x-iscii-ma"; adds nothing to CP57009.
public class ENCx_iscii_ma : CP57009
{
    public ENCx_iscii_ma()
    {
        // The parameterless CP57009 constructor runs implicitly.
    }
}; // class ENCx_iscii_ma
// Web-name alias for "x-iscii-gu"; adds nothing to CP57010.
public class ENCx_iscii_gu : CP57010
{
    public ENCx_iscii_gu()
    {
        // The parameterless CP57010 constructor runs implicitly.
    }
}; // class ENCx_iscii_gu
// Web-name alias for "x-iscii-pa"; adds nothing to CP57011.
public class ENCx_iscii_pa : CP57011
{
    public ENCx_iscii_pa()
    {
        // The parameterless CP57011 constructor runs implicitly.
    }
}; // class ENCx_iscii_pa
554 }; // namespace I18N.Other