1 /* Shared functions related to mangling names for the GNU compiler
2 for the Java(TM) language.
3 Copyright (C) 2001, 2002, 2003 Free Software Foundation, Inc.
5 This file is part of GCC.
7 GCC is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 2, or (at your option)
12 GCC is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with GCC; see the file COPYING. If not, write to
19 the Free Software Foundation, 59 Temple Place - Suite 330,
20 Boston, MA 02111-1307, USA.
22 Java and all Java-based marks are trademarks or registered trademarks
23 of Sun Microsystems, Inc. in the United States and other countries.
24 The Free Software Foundation is independent of Sun Microsystems, Inc. */
26 /* Written by Alexandre Petit-Bianco <apbianco@cygnus.com> */
30 #include "coretypes.h"
34 #include "java-tree.h"
38 static void append_unicode_mangled_name (const char *, int);
40 static int unicode_mangling_length (const char *, int);
43 extern struct obstack
*mangle_obstack
;
45 /* If the assembler doesn't support UTF8 in symbol names, some
46 characters might need to be escaped. */
50 /* Assuming (NAME, LEN) is a Utf8-encoding string, emit the string
51 appropriately mangled (with Unicode escapes if needed) to
52 MANGLE_OBSTACK. Note that `java', `lang' and `Object' are used so
53 frequently that they could be cached. */
56 append_gpp_mangled_name (const char *name
, int len
)
58 int encoded_len
= unicode_mangling_length (name
, len
);
59 int needs_escapes
= encoded_len
> 0;
62 sprintf (buf
, "%d", (needs_escapes
? encoded_len
: len
));
63 obstack_grow (mangle_obstack
, buf
, strlen (buf
));
66 append_unicode_mangled_name (name
, len
);
68 obstack_grow (mangle_obstack
, name
, len
);
71 /* Assuming (NAME, LEN) is a Utf8-encoded string, emit the string
72 appropriately mangled (with Unicode escapes) to MANGLE_OBSTACK.
73 Characters needing an escape are encoded `__UNN_' to `__UNNNN_', in
74 which case `__U' will be mangled `__U_'. */
77 append_unicode_mangled_name (const char *name
, int len
)
79 const unsigned char *ptr
;
80 const unsigned char *limit
= (const unsigned char *)name
+ len
;
82 for (ptr
= (const unsigned char *) name
; ptr
< limit
; )
84 int ch
= UTF8_GET(ptr
, limit
);
86 if ((ISALNUM (ch
) && ch
!= 'U') || ch
== '$')
87 obstack_1grow (mangle_obstack
, ch
);
88 /* Everything else needs encoding */
92 if (ch
== '_' || ch
== 'U')
94 /* Prepare to recognize __U */
95 if (ch
== '_' && (uuU
< 3))
98 obstack_1grow (mangle_obstack
, ch
);
100 /* We recognize __U that we wish to encode
101 __U_. Finish the encoding. */
102 else if (ch
== 'U' && (uuU
== 2))
105 obstack_grow (mangle_obstack
, "U_", 2);
107 /* Otherwise, just reset uuU and emit the character we
112 obstack_1grow (mangle_obstack
, ch
);
116 sprintf (buf
, "__U%x_", ch
);
117 obstack_grow (mangle_obstack
, buf
, strlen (buf
));
123 /* Assuming (NAME, LEN) is a Utf8-encoding string, calculate the
124 length of the string as mangled (a la g++) including Unicode
125 escapes. If no escapes are needed, return 0. */
128 unicode_mangling_length (const char *name
, int len
)
130 const unsigned char *ptr
;
131 const unsigned char *limit
= (const unsigned char *)name
+ len
;
132 int need_escapes
= 0; /* Whether we need an escape or not */
133 int num_chars
= 0; /* Number of characters in the mangled name */
134 int uuU
= 0; /* Help us to find __U. 0: '_', 1: '__' */
135 for (ptr
= (const unsigned char *) name
; ptr
< limit
; )
137 int ch
= UTF8_GET(ptr
, limit
);
140 error ("internal error - invalid Utf8 name");
141 if ((ISALNUM (ch
) && ch
!= 'U') || ch
== '$')
143 /* Everything else needs encoding */
146 int encoding_length
= 2;
148 if (ch
== '_' || ch
== 'U')
150 /* It's always at least one character. */
153 /* Prepare to recognize __U */
154 if (ch
== '_' && (uuU
< 3))
157 /* We recognize __U that we wish to encode __U_, we
158 count one more character. */
159 else if (ch
== 'U' && (uuU
== 2))
165 /* Otherwise, just reset uuU */
177 num_chars
+= (4 + encoding_length
);
190 /* The assembler supports UTF8, we don't use escapes. Mangling is
191 simply <N>NAME. <N> is the number of UTF8 encoded characters that
192 are found in NAME. Note that `java', `lang' and `Object' are used
193 so frequently that they could be cached. */
196 append_gpp_mangled_name (const char *name
, int len
)
198 const unsigned char *ptr
;
199 const unsigned char *limit
= (const unsigned char *)name
+ len
;
203 /* Compute the length of the string we wish to mangle. */
204 for (encoded_len
= 0, ptr
= (const unsigned char *) name
;
205 ptr
< limit
; encoded_len
++)
207 int ch
= UTF8_GET(ptr
, limit
);
210 error ("internal error - invalid Utf8 name");
213 sprintf (buf
, "%d", encoded_len
);
214 obstack_grow (mangle_obstack
, buf
, strlen (buf
));
215 obstack_grow (mangle_obstack
, name
, len
);
218 #endif /* HAVE_AS_UTF8 */