2 * Demangle VC++ symbols into C function prototypes
4 * Copyright 2000 Jon Griffiths
7 * This library is free software; you can redistribute it and/or
8 * modify it under the terms of the GNU Lesser General Public
9 * License as published by the Free Software Foundation; either
10 * version 2.1 of the License, or (at your option) any later version.
12 * This library is distributed in the hope that it will be useful,
13 * but WITHOUT ANY WARRANTY; without even the implied warranty of
14 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
15 * Lesser General Public License for more details.
17 * You should have received a copy of the GNU Lesser General Public
18 * License along with this library; if not, write to the Free Software
19 * Foundation, Inc., 51 Franklin St, Fifth Floor, Boston, MA 02110-1301, USA
23 #include "wine/port.h"
30 #include "wine/debug.h"
32 WINE_DEFAULT_DEBUG_CHANNEL(msvcrt
);
35 * - document a bit (grammar + functions)
36 * - back-port this new code into tools/winedump/msmangle.c
39 /* How data types modifiers are stored:
40 * M (in the following definitions) is defined for
41 * 'A', 'B', 'C' and 'D' as follows
45 * {<D>}: "const volatile "
52 * same as for arguments and also the following
59 unsigned start
; /* first valid reference in array */
60 unsigned num
; /* total number of used elts */
66 /* Structure holding a parsed symbol */
69 unsigned flags
; /* the UNDNAME_ flags used for demangling */
70 malloc_func_t mem_alloc_ptr
; /* internal allocator */
71 free_func_t mem_free_ptr
; /* internal deallocator */
73 const char* current
; /* pointer in input (mangled) string */
74 char* result
; /* demangled string */
76 struct array names
; /* array of names for back reference */
77 struct array stack
; /* stack of parsed strings */
79 void* alloc_list
; /* linked list of allocated blocks */
80 unsigned avail_in_first
; /* number of available bytes in head block */
83 /* Type for parsing mangled types */
90 static BOOL
symbol_demangle(struct parsed_symbol
* sym
);
92 /******************************************************************
95 * Internal allocator. Uses a simple linked list of large blocks
96 * where we use a poor-man allocator. It's fast, and since all
97 * allocation is pool, memory management is easy (esp. freeing).
99 static void* und_alloc(struct parsed_symbol
* sym
, unsigned int len
)
103 #define BLOCK_SIZE 1024
104 #define AVAIL_SIZE (1024 - sizeof(void*))
106 if (len
> AVAIL_SIZE
)
108 /* allocate a specific block */
109 ptr
= sym
->mem_alloc_ptr(sizeof(void*) + len
);
110 if (!ptr
) return NULL
;
111 *(void**)ptr
= sym
->alloc_list
;
112 sym
->alloc_list
= ptr
;
113 sym
->avail_in_first
= 0;
114 ptr
= (char*)sym
->alloc_list
+ sizeof(void*);
118 if (len
> sym
->avail_in_first
)
120 /* add a new block */
121 ptr
= sym
->mem_alloc_ptr(BLOCK_SIZE
);
122 if (!ptr
) return NULL
;
123 *(void**)ptr
= sym
->alloc_list
;
124 sym
->alloc_list
= ptr
;
125 sym
->avail_in_first
= AVAIL_SIZE
;
127 /* grab memory from head block */
128 ptr
= (char*)sym
->alloc_list
+ BLOCK_SIZE
- sym
->avail_in_first
;
129 sym
->avail_in_first
-= len
;
136 /******************************************************************
138 * Frees all the blocks in the list of large blocks allocated by
141 static void und_free_all(struct parsed_symbol
* sym
)
145 while (sym
->alloc_list
)
147 next
= *(void**)sym
->alloc_list
;
148 if(sym
->mem_free_ptr
) sym
->mem_free_ptr(sym
->alloc_list
);
149 sym
->alloc_list
= next
;
151 sym
->avail_in_first
= 0;
154 /******************************************************************
156 * Initialises an array of strings
158 static void str_array_init(struct array
* a
)
160 a
->start
= a
->num
= a
->max
= a
->alloc
= 0;
164 /******************************************************************
166 * Adding a new string to an array
168 static BOOL
str_array_push(struct parsed_symbol
* sym
, const char* ptr
, int len
,
178 new = und_alloc(sym
, (a
->alloc
= 32) * sizeof(a
->elts
[0]));
179 if (!new) return FALSE
;
182 else if (a
->max
>= a
->alloc
)
184 new = und_alloc(sym
, (a
->alloc
* 2) * sizeof(a
->elts
[0]));
185 if (!new) return FALSE
;
186 memcpy(new, a
->elts
, a
->alloc
* sizeof(a
->elts
[0]));
190 if (len
== -1) len
= strlen(ptr
);
191 a
->elts
[a
->num
] = und_alloc(sym
, len
+ 1);
192 assert(a
->elts
[a
->num
]);
193 memcpy(a
->elts
[a
->num
], ptr
, len
);
194 a
->elts
[a
->num
][len
] = '\0';
195 if (++a
->num
>= a
->max
) a
->max
= a
->num
;
200 for (i
= a
->max
- 1; i
>= 0; i
--)
203 if (i
< a
->start
) c
= '-';
204 else if (i
>= a
->num
) c
= '}';
205 TRACE("%p\t%d%c %s\n", a
, i
, c
, debugstr_a(a
->elts
[i
]));
212 /******************************************************************
214 * Extracts a reference from an existing array (doing proper type
217 static char* str_array_get_ref(struct array
* cref
, unsigned idx
)
220 if (cref
->start
+ idx
>= cref
->max
)
222 WARN("Out of bounds: %p %d + %d >= %d\n",
223 cref
, cref
->start
, idx
, cref
->max
);
226 TRACE("Returning %p[%d] => %s\n",
227 cref
, idx
, debugstr_a(cref
->elts
[cref
->start
+ idx
]));
228 return cref
->elts
[cref
->start
+ idx
];
231 /******************************************************************
233 * Helper for printf type of command (only %s and %c are implemented)
234 * while dynamically allocating the buffer
236 static char* str_printf(struct parsed_symbol
* sym
, const char* format
, ...)
239 unsigned int len
= 1, i
, sz
;
244 va_start(args
, format
);
245 for (i
= 0; format
[i
]; i
++)
247 if (format
[i
] == '%')
251 case 's': t
= va_arg(args
, char*); if (t
) len
+= strlen(t
); break;
252 case 'c': (void)va_arg(args
, int); len
++; break;
253 default: i
--; /* fall through */
254 case '%': len
++; break;
260 if (!(tmp
= und_alloc(sym
, len
))) return NULL
;
261 va_start(args
, format
);
262 for (p
= tmp
, i
= 0; format
[i
]; i
++)
264 if (format
[i
] == '%')
269 t
= va_arg(args
, char*);
278 *p
++ = (char)va_arg(args
, int);
280 default: i
--; /* fall through */
281 case '%': *p
++ = '%'; break;
284 else *p
++ = format
[i
];
291 /* forward declaration */
292 static BOOL
demangle_datatype(struct parsed_symbol
* sym
, struct datatype_t
* ct
,
293 struct array
* pmt
, BOOL in_args
);
295 static const char* get_number(struct parsed_symbol
* sym
)
300 if (*sym
->current
== '?')
305 if (*sym
->current
>= '0' && *sym
->current
<= '8')
307 ptr
= und_alloc(sym
, 3);
308 if (sgn
) ptr
[0] = '-';
309 ptr
[sgn
? 1 : 0] = *sym
->current
+ 1;
310 ptr
[sgn
? 2 : 1] = '\0';
313 else if (*sym
->current
== '9')
315 ptr
= und_alloc(sym
, 4);
316 if (sgn
) ptr
[0] = '-';
317 ptr
[sgn
? 1 : 0] = '1';
318 ptr
[sgn
? 2 : 1] = '0';
319 ptr
[sgn
? 3 : 2] = '\0';
322 else if (*sym
->current
>= 'A' && *sym
->current
<= 'P')
326 while (*sym
->current
>= 'A' && *sym
->current
<= 'P')
329 ret
+= *sym
->current
++ - 'A';
331 if (*sym
->current
!= '@') return NULL
;
333 ptr
= und_alloc(sym
, 17);
334 MSVCRT_sprintf(ptr
, "%s%u", sgn
? "-" : "", ret
);
341 /******************************************************************
343 * Parses a list of function/method arguments, creates a string corresponding
344 * to the arguments' list.
346 static char* get_args(struct parsed_symbol
* sym
, struct array
* pmt_ref
, BOOL z_term
,
347 char open_char
, char close_char
)
350 struct datatype_t ct
;
351 struct array arg_collect
;
352 char* args_str
= NULL
;
356 str_array_init(&arg_collect
);
358 /* Now come the function arguments */
359 while (*sym
->current
)
361 /* Decode each data type and append it to the argument list */
362 if (*sym
->current
== '@')
367 if (!demangle_datatype(sym
, &ct
, pmt_ref
, TRUE
))
369 /* 'void' terminates an argument list in a function */
370 if (z_term
&& !strcmp(ct
.left
, "void")) break;
371 if (!str_array_push(sym
, str_printf(sym
, "%s%s", ct
.left
, ct
.right
), -1,
374 if (!strcmp(ct
.left
, "...")) break;
376 /* Functions are always terminated by 'Z'. If we made it this far and
377 * don't find it, we have incorrectly identified a data type.
379 if (z_term
&& *sym
->current
++ != 'Z') return NULL
;
381 if (arg_collect
.num
== 0 ||
382 (arg_collect
.num
== 1 && !strcmp(arg_collect
.elts
[0], "void")))
383 return str_printf(sym
, "%cvoid%c", open_char
, close_char
);
384 for (i
= 1; i
< arg_collect
.num
; i
++)
386 args_str
= str_printf(sym
, "%s,%s", args_str
, arg_collect
.elts
[i
]);
389 last
= args_str
? args_str
: arg_collect
.elts
[0];
390 if (close_char
== '>' && last
[strlen(last
) - 1] == '>')
391 args_str
= str_printf(sym
, "%c%s%s %c",
392 open_char
, arg_collect
.elts
[0], args_str
, close_char
);
394 args_str
= str_printf(sym
, "%c%s%s%c",
395 open_char
, arg_collect
.elts
[0], args_str
, close_char
);
400 /******************************************************************
402 * Parses the type modifier. Always returns static strings.
404 static BOOL
get_modifier(struct parsed_symbol
*sym
, const char **ret
, const char **ptr_modif
)
407 if (*sym
->current
== 'E')
409 if (!(sym
->flags
& UNDNAME_NO_MS_KEYWORDS
))
411 *ptr_modif
= "__ptr64";
412 if (sym
->flags
& UNDNAME_NO_LEADING_UNDERSCORES
)
413 *ptr_modif
= *ptr_modif
+ 2;
417 switch (*sym
->current
++)
419 case 'A': *ret
= NULL
; break;
420 case 'B': *ret
= "const"; break;
421 case 'C': *ret
= "volatile"; break;
422 case 'D': *ret
= "const volatile"; break;
423 default: return FALSE
;
428 static BOOL
get_modified_type(struct datatype_t
*ct
, struct parsed_symbol
* sym
,
429 struct array
*pmt_ref
, char modif
, BOOL in_args
)
431 const char* modifier
;
432 const char* str_modif
;
433 const char *ptr_modif
= "";
435 if (*sym
->current
== 'E')
437 if (!(sym
->flags
& UNDNAME_NO_MS_KEYWORDS
))
439 if (sym
->flags
& UNDNAME_NO_LEADING_UNDERSCORES
)
440 ptr_modif
= " ptr64";
442 ptr_modif
= " __ptr64";
449 case 'A': str_modif
= str_printf(sym
, " &%s", ptr_modif
); break;
450 case 'B': str_modif
= str_printf(sym
, " &%s volatile", ptr_modif
); break;
451 case 'P': str_modif
= str_printf(sym
, " *%s", ptr_modif
); break;
452 case 'Q': str_modif
= str_printf(sym
, " *%s const", ptr_modif
); break;
453 case 'R': str_modif
= str_printf(sym
, " *%s volatile", ptr_modif
); break;
454 case 'S': str_modif
= str_printf(sym
, " *%s const volatile", ptr_modif
); break;
455 case '?': str_modif
= ""; break;
456 default: return FALSE
;
459 if (get_modifier(sym
, &modifier
, &ptr_modif
))
461 unsigned mark
= sym
->stack
.num
;
462 struct datatype_t sub_ct
;
464 /* multidimensional arrays */
465 if (*sym
->current
== 'Y')
471 if (!(n1
= get_number(sym
))) return FALSE
;
474 if (str_modif
[0] == ' ' && !modifier
)
479 str_modif
= str_printf(sym
, " (%s%s)", modifier
, str_modif
);
483 str_modif
= str_printf(sym
, " (%s)", str_modif
);
486 str_modif
= str_printf(sym
, "%s[%s]", str_modif
, get_number(sym
));
489 /* Recurse to get the referred-to type */
490 if (!demangle_datatype(sym
, &sub_ct
, pmt_ref
, FALSE
))
493 ct
->left
= str_printf(sym
, "%s %s%s", sub_ct
.left
, modifier
, str_modif
);
496 /* don't insert a space between duplicate '*' */
497 if (!in_args
&& str_modif
[0] && str_modif
[1] == '*' && sub_ct
.left
[strlen(sub_ct
.left
)-1] == '*')
499 ct
->left
= str_printf(sym
, "%s%s", sub_ct
.left
, str_modif
);
501 ct
->right
= sub_ct
.right
;
502 sym
->stack
.num
= mark
;
507 /******************************************************************
509 * Gets the literal name from the current position in the mangled
510 * symbol to the first '@' character. It pushes the parsed name to
511 * the symbol names stack and returns a pointer to it or NULL in
514 static char* get_literal_string(struct parsed_symbol
* sym
)
516 const char *ptr
= sym
->current
;
519 if (!((*sym
->current
>= 'A' && *sym
->current
<= 'Z') ||
520 (*sym
->current
>= 'a' && *sym
->current
<= 'z') ||
521 (*sym
->current
>= '0' && *sym
->current
<= '9') ||
522 *sym
->current
== '_' || *sym
->current
== '$')) {
523 TRACE("Failed at '%c' in %s\n", *sym
->current
, debugstr_a(ptr
));
526 } while (*++sym
->current
!= '@');
528 if (!str_array_push(sym
, ptr
, sym
->current
- 1 - ptr
, &sym
->names
))
531 return str_array_get_ref(&sym
->names
, sym
->names
.num
- sym
->names
.start
- 1);
534 /******************************************************************
536 * Parses a name with a template argument list and returns it as
538 * In a template argument list the back reference to the names
539 * table is separately created. '0' points to the class component
540 * name with the template arguments. We use the same stack array
541 * to hold the names but save/restore the stack state before/after
542 * parsing the template argument list.
544 static char* get_template_name(struct parsed_symbol
* sym
)
547 unsigned num_mark
= sym
->names
.num
;
548 unsigned start_mark
= sym
->names
.start
;
549 unsigned stack_mark
= sym
->stack
.num
;
550 struct array array_pmt
;
552 sym
->names
.start
= sym
->names
.num
;
553 if (!(name
= get_literal_string(sym
))) {
554 sym
->names
.start
= start_mark
;
557 str_array_init(&array_pmt
);
558 args
= get_args(sym
, &array_pmt
, FALSE
, '<', '>');
560 name
= str_printf(sym
, "%s%s", name
, args
);
561 sym
->names
.num
= num_mark
;
562 sym
->names
.start
= start_mark
;
563 sym
->stack
.num
= stack_mark
;
567 /******************************************************************
569 * Parses class as a list of parent-classes, terminated by '@' and stores the
570 * result in 'a' array. Each parent-classes, as well as the inner element
571 * (either field/method name or class name), are represented in the mangled
572 * name by a literal name ([a-zA-Z0-9_]+ terminated by '@') or a back reference
573 * ([0-9]) or a name with template arguments ('?$' literal name followed by the
574 * template argument list). The class name components appear in the reverse
575 * order in the mangled name, e.g aaa@bbb@ccc@@ will be demangled to
577 * For each of these class name components a string will be allocated in the
580 static BOOL
get_class(struct parsed_symbol
* sym
)
582 const char* name
= NULL
;
584 while (*sym
->current
!= '@')
586 switch (*sym
->current
)
588 case '\0': return FALSE
;
590 case '0': case '1': case '2': case '3':
591 case '4': case '5': case '6': case '7':
593 name
= str_array_get_ref(&sym
->names
, *sym
->current
++ - '0');
596 switch (*++sym
->current
)
600 if ((name
= get_template_name(sym
)) &&
601 !str_array_push(sym
, name
, -1, &sym
->names
))
606 struct array stack
= sym
->stack
;
607 unsigned int start
= sym
->names
.start
;
608 unsigned int num
= sym
->names
.num
;
610 str_array_init( &sym
->stack
);
611 if (symbol_demangle( sym
)) name
= str_printf( sym
, "`%s'", sym
->result
);
612 sym
->names
.start
= start
;
613 sym
->names
.num
= num
;
618 if (!(name
= get_number( sym
))) return FALSE
;
619 name
= str_printf( sym
, "`%s'", name
);
624 name
= get_literal_string(sym
);
627 if (!name
|| !str_array_push(sym
, name
, -1, &sym
->stack
))
634 /******************************************************************
636 * From an array collected by get_class in sym->stack, constructs the
637 * corresponding (allocated) string
639 static char* get_class_string(struct parsed_symbol
* sym
, int start
)
642 unsigned int len
, sz
;
644 struct array
*a
= &sym
->stack
;
646 for (len
= 0, i
= start
; i
< a
->num
; i
++)
649 len
+= 2 + strlen(a
->elts
[i
]);
651 if (!(ret
= und_alloc(sym
, len
- 1))) return NULL
;
652 for (len
= 0, i
= a
->num
- 1; i
>= start
; i
--)
654 sz
= strlen(a
->elts
[i
]);
655 memcpy(ret
+ len
, a
->elts
[i
], sz
);
667 /******************************************************************
669 * Wrapper around get_class and get_class_string.
671 static char* get_class_name(struct parsed_symbol
* sym
)
673 unsigned mark
= sym
->stack
.num
;
677 s
= get_class_string(sym
, mark
);
678 sym
->stack
.num
= mark
;
682 /******************************************************************
683 * get_calling_convention
684 * Returns a static string corresponding to the calling convention described
685 * by char 'ch'. Sets export to TRUE iff the calling convention is exported.
687 static BOOL
get_calling_convention(char ch
, const char** call_conv
,
688 const char** exported
, unsigned flags
)
690 *call_conv
= *exported
= NULL
;
692 if (!(flags
& (UNDNAME_NO_MS_KEYWORDS
| UNDNAME_NO_ALLOCATION_LANGUAGE
)))
694 if (flags
& UNDNAME_NO_LEADING_UNDERSCORES
)
696 if (((ch
- 'A') % 2) == 1) *exported
= "dll_export ";
699 case 'A': case 'B': *call_conv
= "cdecl"; break;
700 case 'C': case 'D': *call_conv
= "pascal"; break;
701 case 'E': case 'F': *call_conv
= "thiscall"; break;
702 case 'G': case 'H': *call_conv
= "stdcall"; break;
703 case 'I': case 'J': *call_conv
= "fastcall"; break;
704 case 'K': case 'L': break;
705 case 'M': *call_conv
= "clrcall"; break;
706 default: ERR("Unknown calling convention %c\n", ch
); return FALSE
;
711 if (((ch
- 'A') % 2) == 1) *exported
= "__dll_export ";
714 case 'A': case 'B': *call_conv
= "__cdecl"; break;
715 case 'C': case 'D': *call_conv
= "__pascal"; break;
716 case 'E': case 'F': *call_conv
= "__thiscall"; break;
717 case 'G': case 'H': *call_conv
= "__stdcall"; break;
718 case 'I': case 'J': *call_conv
= "__fastcall"; break;
719 case 'K': case 'L': break;
720 case 'M': *call_conv
= "__clrcall"; break;
721 default: ERR("Unknown calling convention %c\n", ch
); return FALSE
;
728 /*******************************************************************
730 * Return a string containing an allocated string for a simple data type
732 static const char* get_simple_type(char c
)
734 const char* type_string
;
738 case 'C': type_string
= "signed char"; break;
739 case 'D': type_string
= "char"; break;
740 case 'E': type_string
= "unsigned char"; break;
741 case 'F': type_string
= "short"; break;
742 case 'G': type_string
= "unsigned short"; break;
743 case 'H': type_string
= "int"; break;
744 case 'I': type_string
= "unsigned int"; break;
745 case 'J': type_string
= "long"; break;
746 case 'K': type_string
= "unsigned long"; break;
747 case 'M': type_string
= "float"; break;
748 case 'N': type_string
= "double"; break;
749 case 'O': type_string
= "long double"; break;
750 case 'X': type_string
= "void"; break;
751 case 'Z': type_string
= "..."; break;
752 default: type_string
= NULL
; break;
757 /*******************************************************************
759 * Return a string containing an allocated string for a simple data type
761 static const char* get_extended_type(char c
)
763 const char* type_string
;
767 case 'D': type_string
= "__int8"; break;
768 case 'E': type_string
= "unsigned __int8"; break;
769 case 'F': type_string
= "__int16"; break;
770 case 'G': type_string
= "unsigned __int16"; break;
771 case 'H': type_string
= "__int32"; break;
772 case 'I': type_string
= "unsigned __int32"; break;
773 case 'J': type_string
= "__int64"; break;
774 case 'K': type_string
= "unsigned __int64"; break;
775 case 'L': type_string
= "__int128"; break;
776 case 'M': type_string
= "unsigned __int128"; break;
777 case 'N': type_string
= "bool"; break;
778 case 'W': type_string
= "wchar_t"; break;
779 default: type_string
= NULL
; break;
784 /*******************************************************************
787 * Attempt to demangle a C++ data type, which may be datatype.
788 * a datatype type is made up of a number of simple types. e.g:
789 * char** = (pointer to (pointer to (char)))
791 static BOOL
demangle_datatype(struct parsed_symbol
* sym
, struct datatype_t
* ct
,
792 struct array
* pmt_ref
, BOOL in_args
)
798 ct
->left
= ct
->right
= NULL
;
800 switch (dt
= *sym
->current
++)
803 /* MS type: __int8,__int16 etc */
804 ct
->left
= get_extended_type(*sym
->current
++);
806 case 'C': case 'D': case 'E': case 'F': case 'G':
807 case 'H': case 'I': case 'J': case 'K': case 'M':
808 case 'N': case 'O': case 'X': case 'Z':
809 /* Simple data types */
810 ct
->left
= get_simple_type(dt
);
813 case 'T': /* union */
814 case 'U': /* struct */
815 case 'V': /* class */
816 case 'Y': /* cointerface */
817 /* Class/struct/union/cointerface */
819 const char* struct_name
= NULL
;
820 const char* type_name
= NULL
;
822 if (!(struct_name
= get_class_name(sym
)))
824 if (!(sym
->flags
& UNDNAME_NO_COMPLEX_TYPE
))
828 case 'T': type_name
= "union "; break;
829 case 'U': type_name
= "struct "; break;
830 case 'V': type_name
= "class "; break;
831 case 'Y': type_name
= "cointerface "; break;
834 ct
->left
= str_printf(sym
, "%s%s", type_name
, struct_name
);
838 /* not all the time is seems */
842 if (!(ptr
= get_number(sym
))) goto done
;
843 ct
->left
= str_printf(sym
, "`template-parameter-%s'", ptr
);
847 if (!get_modified_type(ct
, sym
, pmt_ref
, '?', in_args
)) goto done
;
850 case 'A': /* reference */
851 case 'B': /* volatile reference */
852 if (!get_modified_type(ct
, sym
, pmt_ref
, dt
, in_args
)) goto done
;
854 case 'Q': /* const pointer */
855 case 'R': /* volatile pointer */
856 case 'S': /* const volatile pointer */
857 if (!get_modified_type(ct
, sym
, pmt_ref
, in_args
? dt
: 'P', in_args
)) goto done
;
859 case 'P': /* Pointer */
860 if (isdigit(*sym
->current
))
863 * P6 = Function pointer
864 * P8 = Member function pointer
865 * others who knows.. */
866 if (*sym
->current
== '8')
869 const char* call_conv
;
870 const char* exported
;
871 struct datatype_t sub_ct
;
872 unsigned mark
= sym
->stack
.num
;
874 const char* modifier
;
875 const char* ptr_modif
;
879 if (!(class = get_class_name(sym
)))
881 if (!get_modifier(sym
, &modifier
, &ptr_modif
))
884 modifier
= str_printf(sym
, "%s %s", modifier
, ptr_modif
);
885 else if(ptr_modif
[0])
886 modifier
= str_printf(sym
, " %s", ptr_modif
);
887 if (!get_calling_convention(*sym
->current
++,
888 &call_conv
, &exported
,
889 sym
->flags
& ~UNDNAME_NO_ALLOCATION_LANGUAGE
))
891 if (!demangle_datatype(sym
, &sub_ct
, pmt_ref
, FALSE
))
894 args
= get_args(sym
, pmt_ref
, TRUE
, '(', ')');
895 if (!args
) goto done
;
896 sym
->stack
.num
= mark
;
898 ct
->left
= str_printf(sym
, "%s%s (%s %s::*",
899 sub_ct
.left
, sub_ct
.right
, call_conv
, class);
900 ct
->right
= str_printf(sym
, ")%s%s", args
, modifier
);
902 else if (*sym
->current
== '6')
905 const char* call_conv
;
906 const char* exported
;
907 struct datatype_t sub_ct
;
908 unsigned mark
= sym
->stack
.num
;
912 if (!get_calling_convention(*sym
->current
++,
913 &call_conv
, &exported
,
914 sym
->flags
& ~UNDNAME_NO_ALLOCATION_LANGUAGE
) ||
915 !demangle_datatype(sym
, &sub_ct
, pmt_ref
, FALSE
))
918 args
= get_args(sym
, pmt_ref
, TRUE
, '(', ')');
919 if (!args
) goto done
;
920 sym
->stack
.num
= mark
;
922 ct
->left
= str_printf(sym
, "%s%s (%s*",
923 sub_ct
.left
, sub_ct
.right
, call_conv
);
924 ct
->right
= str_printf(sym
, ")%s", args
);
928 else if (!get_modified_type(ct
, sym
, pmt_ref
, 'P', in_args
)) goto done
;
931 if (*sym
->current
== '4')
935 if (!(enum_name
= get_class_name(sym
)))
937 if (sym
->flags
& UNDNAME_NO_COMPLEX_TYPE
)
938 ct
->left
= enum_name
;
940 ct
->left
= str_printf(sym
, "enum %s", enum_name
);
944 case '0': case '1': case '2': case '3': case '4':
945 case '5': case '6': case '7': case '8': case '9':
946 /* Referring back to previously parsed type */
947 /* left and right are pushed as two separate strings */
948 if (!pmt_ref
) goto done
;
949 ct
->left
= str_array_get_ref(pmt_ref
, (dt
- '0') * 2);
950 ct
->right
= str_array_get_ref(pmt_ref
, (dt
- '0') * 2 + 1);
951 if (!ct
->left
) goto done
;
955 switch (*sym
->current
++)
958 if (!(ct
->left
= get_number(sym
))) goto done
;
963 if (!(ptr
= get_number(sym
))) goto done
;
964 ct
->left
= str_printf(sym
, "`template-parameter%s'", ptr
);
971 if (!(p1
= get_number(sym
))) goto done
;
972 if (!(p2
= get_number(sym
))) goto done
;
973 ct
->left
= str_printf(sym
, "{%s,%s}", p1
, p2
);
981 if (!(p1
= get_number(sym
))) goto done
;
982 if (!(p2
= get_number(sym
))) goto done
;
983 if (!(p3
= get_number(sym
))) goto done
;
984 ct
->left
= str_printf(sym
, "{%s,%s,%s}", p1
, p2
, p3
);
990 if (!(ptr
= get_number(sym
))) goto done
;
991 ct
->left
= str_printf(sym
, "`non-type-template-parameter%s'", ptr
);
995 if (*sym
->current
== 'B')
997 unsigned mark
= sym
->stack
.num
;
998 struct datatype_t sub_ct
;
999 const char* arr
= NULL
;
1002 /* multidimensional arrays */
1003 if (*sym
->current
== 'Y')
1009 if (!(n1
= get_number(sym
))) goto done
;
1013 arr
= str_printf(sym
, "%s[%s]", arr
, get_number(sym
));
1016 if (!demangle_datatype(sym
, &sub_ct
, pmt_ref
, FALSE
)) goto done
;
1019 ct
->left
= str_printf(sym
, "%s %s", sub_ct
.left
, arr
);
1021 ct
->left
= sub_ct
.left
;
1022 ct
->right
= sub_ct
.right
;
1023 sym
->stack
.num
= mark
;
1025 else if (*sym
->current
== 'C')
1027 const char *ptr
, *ptr_modif
;
1030 if (!get_modifier(sym
, &ptr
, &ptr_modif
)) goto done
;
1031 if (!demangle_datatype(sym
, ct
, pmt_ref
, in_args
)) goto done
;
1032 ct
->left
= str_printf(sym
, "%s %s", ct
->left
, ptr
);
1038 ERR("Unknown type %c\n", dt
);
1041 if (add_pmt
&& pmt_ref
&& in_args
)
1043 /* left and right are pushed as two separate strings */
1044 if (!str_array_push(sym
, ct
->left
? ct
->left
: "", -1, pmt_ref
) ||
1045 !str_array_push(sym
, ct
->right
? ct
->right
: "", -1, pmt_ref
))
1050 return ct
->left
!= NULL
;
1053 /******************************************************************
1055 * Does the final parsing and handling for a variable or a field in
1058 static BOOL
handle_data(struct parsed_symbol
* sym
)
1060 const char* access
= NULL
;
1061 const char* member_type
= NULL
;
1062 const char* modifier
= NULL
;
1063 const char* ptr_modif
;
1064 struct datatype_t ct
;
1069 * 1 protected static
1071 * 3 private non-static
1072 * 4 protected non-static
1073 * 5 public non-static
1078 if (!(sym
->flags
& UNDNAME_NO_ACCESS_SPECIFIERS
))
1080 /* we only print the access for static members */
1081 switch (*sym
->current
)
1083 case '0': access
= "private: "; break;
1084 case '1': access
= "protected: "; break;
1085 case '2': access
= "public: "; break;
1089 if (!(sym
->flags
& UNDNAME_NO_MEMBER_TYPE
))
1091 if (*sym
->current
>= '0' && *sym
->current
<= '2')
1092 member_type
= "static ";
1095 name
= get_class_string(sym
, 0);
1097 switch (*sym
->current
++)
1099 case '0': case '1': case '2':
1100 case '3': case '4': case '5':
1102 unsigned mark
= sym
->stack
.num
;
1105 str_array_init(&pmt
);
1107 if (!demangle_datatype(sym
, &ct
, &pmt
, FALSE
)) goto done
;
1108 if (!get_modifier(sym
, &modifier
, &ptr_modif
)) goto done
;
1109 if (modifier
&& ptr_modif
) modifier
= str_printf(sym
, "%s %s", modifier
, ptr_modif
);
1110 else if (!modifier
) modifier
= ptr_modif
;
1111 sym
->stack
.num
= mark
;
1114 case '6' : /* compiler generated static */
1115 case '7' : /* compiler generated static */
1116 ct
.left
= ct
.right
= NULL
;
1117 if (!get_modifier(sym
, &modifier
, &ptr_modif
)) goto done
;
1118 if (*sym
->current
!= '@')
1122 if (!(cls
= get_class_name(sym
)))
1124 ct
.right
= str_printf(sym
, "{for `%s'}", cls
);
1129 modifier
= ct
.left
= ct
.right
= NULL
;
1133 if (sym
->flags
& UNDNAME_NAME_ONLY
) ct
.left
= ct
.right
= modifier
= NULL
;
1135 sym
->result
= str_printf(sym
, "%s%s%s%s%s%s%s%s", access
,
1136 member_type
, ct
.left
,
1137 modifier
&& ct
.left
? " " : NULL
, modifier
,
1138 modifier
|| ct
.left
? " " : NULL
, name
, ct
.right
);
1144 /******************************************************************
1146 * Does the final parsing and handling for a function or a method in
1149 static BOOL
handle_method(struct parsed_symbol
* sym
, BOOL cast_op
)
1152 const char* access
= NULL
;
1154 const char* member_type
= NULL
;
1155 struct datatype_t ct_ret
;
1156 const char* call_conv
;
1157 const char* modifier
= NULL
;
1158 const char* exported
;
1159 const char* args_str
= NULL
;
1160 const char* name
= NULL
;
1161 BOOL ret
= FALSE
, has_args
= TRUE
, has_ret
= TRUE
;
1163 struct array array_pmt
;
1165 /* FIXME: why 2 possible letters for each option?
1168 * 'C' private: static
1169 * 'D' private: static
1170 * 'E' private: virtual
1171 * 'F' private: virtual
1172 * 'G' private: thunk
1173 * 'H' private: thunk
1176 * 'K' protected: static
1177 * 'L' protected: static
1178 * 'M' protected: virtual
1179 * 'N' protected: virtual
1180 * 'O' protected: thunk
1181 * 'P' protected: thunk
1184 * 'S' public: static
1185 * 'T' public: static
1186 * 'U' public: virtual
1187 * 'V' public: virtual
1192 * "$0" private: thunk vtordisp
1193 * "$1" private: thunk vtordisp
1194 * "$2" protected: thunk vtordisp
1195 * "$3" protected: thunk vtordisp
1196 * "$4" public: thunk vtordisp
1197 * "$5" public: thunk vtordisp
1199 * "$R" thunk vtordispex
1201 accmem
= *sym
->current
++;
1204 if (*sym
->current
>= '0' && *sym
->current
<= '5')
1205 access_id
= (*sym
->current
- '0') / 2;
1206 else if (*sym
->current
== 'R')
1207 access_id
= (sym
->current
[1] - '0') / 2;
1208 else if (*sym
->current
!= 'B')
1211 else if (accmem
>= 'A' && accmem
<= 'Z')
1212 access_id
= (accmem
- 'A') / 8;
1218 case 0: access
= "private: "; break;
1219 case 1: access
= "protected: "; break;
1220 case 2: access
= "public: "; break;
1222 if (accmem
== '$' || (accmem
- 'A') % 8 == 6 || (accmem
- 'A') % 8 == 7)
1223 access
= str_printf(sym
, "[thunk]:%s", access
? access
: " ");
1225 if (accmem
== '$' && *sym
->current
!= 'B')
1226 member_type
= "virtual ";
1227 else if (accmem
<= 'X')
1229 switch ((accmem
- 'A') % 8)
1231 case 2: case 3: member_type
= "static "; break;
1232 case 4: case 5: case 6: case 7: member_type
= "virtual "; break;
1236 if (sym
->flags
& UNDNAME_NO_ACCESS_SPECIFIERS
)
1238 if (sym
->flags
& UNDNAME_NO_MEMBER_TYPE
)
1241 name
= get_class_string(sym
, 0);
1243 if (accmem
== '$' && *sym
->current
== 'B') /* vcall thunk */
1248 n
= get_number(sym
);
1250 if(!n
|| *sym
->current
++ != 'A') goto done
;
1251 name
= str_printf(sym
, "%s{%s,{flat}}' }'", name
, n
);
1255 else if (accmem
== '$' && *sym
->current
== 'R') /* vtordispex thunk */
1257 const char *n1
, *n2
, *n3
, *n4
;
1260 n1
= get_number(sym
);
1261 n2
= get_number(sym
);
1262 n3
= get_number(sym
);
1263 n4
= get_number(sym
);
1265 if(!n1
|| !n2
|| !n3
|| !n4
) goto done
;
1266 name
= str_printf(sym
, "%s`vtordispex{%s,%s,%s,%s}' ", name
, n1
, n2
, n3
, n4
);
1268 else if (accmem
== '$') /* vtordisp thunk */
1270 const char *n1
, *n2
;
1273 n1
= get_number(sym
);
1274 n2
= get_number(sym
);
1276 if (!n1
|| !n2
) goto done
;
1277 name
= str_printf(sym
, "%s`vtordisp{%s,%s}' ", name
, n1
, n2
);
1279 else if ((accmem
- 'A') % 8 == 6 || (accmem
- 'A') % 8 == 7) /* a thunk */
1280 name
= str_printf(sym
, "%s`adjustor{%s}' ", name
, get_number(sym
));
1282 if (has_args
&& (accmem
== '$' ||
1283 (accmem
<= 'X' && (accmem
- 'A') % 8 != 2 && (accmem
- 'A') % 8 != 3)))
1285 const char *ptr_modif
;
1286 /* Implicit 'this' pointer */
1287 /* If there is an implicit this pointer, const modifier follows */
1288 if (!get_modifier(sym
, &modifier
, &ptr_modif
)) goto done
;
1289 if (modifier
|| ptr_modif
) modifier
= str_printf(sym
, "%s %s", modifier
, ptr_modif
);
1292 if (!get_calling_convention(*sym
->current
++, &call_conv
, &exported
,
1296 str_array_init(&array_pmt
);
1298 /* Return type, or @ if 'void' */
1299 if (has_ret
&& *sym
->current
== '@')
1301 ct_ret
.left
= "void";
1302 ct_ret
.right
= NULL
;
1307 if (!demangle_datatype(sym
, &ct_ret
, &array_pmt
, FALSE
))
1310 if (!has_ret
|| sym
->flags
& UNDNAME_NO_FUNCTION_RETURNS
)
1311 ct_ret
.left
= ct_ret
.right
= NULL
;
1314 name
= str_printf(sym
, "%s%s%s", name
, ct_ret
.left
, ct_ret
.right
);
1315 ct_ret
.left
= ct_ret
.right
= NULL
;
1318 mark
= sym
->stack
.num
;
1319 if (has_args
&& !(args_str
= get_args(sym
, &array_pmt
, TRUE
, '(', ')'))) goto done
;
1320 if (sym
->flags
& UNDNAME_NAME_ONLY
) args_str
= modifier
= NULL
;
1321 if (sym
->flags
& UNDNAME_NO_THISTYPE
) modifier
= NULL
;
1322 sym
->stack
.num
= mark
;
1324 /* Note: '()' after 'Z' means 'throws', but we don't care here
1327 sym
->result
= str_printf(sym
, "%s%s%s%s%s%s%s%s%s%s%s",
1328 access
, member_type
, ct_ret
.left
,
1329 (ct_ret
.left
&& !ct_ret
.right
) ? " " : NULL
,
1330 call_conv
, call_conv
? " " : NULL
, exported
,
1331 name
, args_str
, modifier
, ct_ret
.right
);
1337 /*******************************************************************
1339 * Demangle a C++ linker symbol
1341 static BOOL
symbol_demangle(struct parsed_symbol
* sym
)
1344 unsigned do_after
= 0;
1345 static CHAR dashed_null
[] = "--null--";
1347 /* FIXME seems wrong as name, as it demangles a simple data type */
1348 if (sym
->flags
& UNDNAME_NO_ARGUMENTS
)
1350 struct datatype_t ct
;
1352 if (demangle_datatype(sym
, &ct
, NULL
, FALSE
))
1354 sym
->result
= str_printf(sym
, "%s%s", ct
.left
, ct
.right
);
1360 /* MS mangled names always begin with '?' */
1361 if (*sym
->current
!= '?') return FALSE
;
1364 /* Then function name or operator code */
1365 if (*sym
->current
== '?' && (sym
->current
[1] != '$' || sym
->current
[2] == '?'))
1367 const char* function_name
= NULL
;
1369 if (sym
->current
[1] == '$')
1375 /* C++ operator code (one character, or two if the first is '_') */
1376 switch (*++sym
->current
)
1378 case '0': do_after
= 1; break;
1379 case '1': do_after
= 2; break;
1380 case '2': function_name
= "operator new"; break;
1381 case '3': function_name
= "operator delete"; break;
1382 case '4': function_name
= "operator="; break;
1383 case '5': function_name
= "operator>>"; break;
1384 case '6': function_name
= "operator<<"; break;
1385 case '7': function_name
= "operator!"; break;
1386 case '8': function_name
= "operator=="; break;
1387 case '9': function_name
= "operator!="; break;
1388 case 'A': function_name
= "operator[]"; break;
1389 case 'B': function_name
= "operator "; do_after
= 3; break;
1390 case 'C': function_name
= "operator->"; break;
1391 case 'D': function_name
= "operator*"; break;
1392 case 'E': function_name
= "operator++"; break;
1393 case 'F': function_name
= "operator--"; break;
1394 case 'G': function_name
= "operator-"; break;
1395 case 'H': function_name
= "operator+"; break;
1396 case 'I': function_name
= "operator&"; break;
1397 case 'J': function_name
= "operator->*"; break;
1398 case 'K': function_name
= "operator/"; break;
1399 case 'L': function_name
= "operator%"; break;
1400 case 'M': function_name
= "operator<"; break;
1401 case 'N': function_name
= "operator<="; break;
1402 case 'O': function_name
= "operator>"; break;
1403 case 'P': function_name
= "operator>="; break;
1404 case 'Q': function_name
= "operator,"; break;
1405 case 'R': function_name
= "operator()"; break;
1406 case 'S': function_name
= "operator~"; break;
1407 case 'T': function_name
= "operator^"; break;
1408 case 'U': function_name
= "operator|"; break;
1409 case 'V': function_name
= "operator&&"; break;
1410 case 'W': function_name
= "operator||"; break;
1411 case 'X': function_name
= "operator*="; break;
1412 case 'Y': function_name
= "operator+="; break;
1413 case 'Z': function_name
= "operator-="; break;
1415 switch (*++sym
->current
)
1417 case '0': function_name
= "operator/="; break;
1418 case '1': function_name
= "operator%="; break;
1419 case '2': function_name
= "operator>>="; break;
1420 case '3': function_name
= "operator<<="; break;
1421 case '4': function_name
= "operator&="; break;
1422 case '5': function_name
= "operator|="; break;
1423 case '6': function_name
= "operator^="; break;
1424 case '7': function_name
= "`vftable'"; break;
1425 case '8': function_name
= "`vbtable'"; break;
1426 case '9': function_name
= "`vcall'"; break;
1427 case 'A': function_name
= "`typeof'"; break;
1428 case 'B': function_name
= "`local static guard'"; break;
1429 case 'C': function_name
= "`string'"; do_after
= 4; break;
1430 case 'D': function_name
= "`vbase destructor'"; break;
1431 case 'E': function_name
= "`vector deleting destructor'"; break;
1432 case 'F': function_name
= "`default constructor closure'"; break;
1433 case 'G': function_name
= "`scalar deleting destructor'"; break;
1434 case 'H': function_name
= "`vector constructor iterator'"; break;
1435 case 'I': function_name
= "`vector destructor iterator'"; break;
1436 case 'J': function_name
= "`vector vbase constructor iterator'"; break;
1437 case 'K': function_name
= "`virtual displacement map'"; break;
1438 case 'L': function_name
= "`eh vector constructor iterator'"; break;
1439 case 'M': function_name
= "`eh vector destructor iterator'"; break;
1440 case 'N': function_name
= "`eh vector vbase constructor iterator'"; break;
1441 case 'O': function_name
= "`copy constructor closure'"; break;
1443 sym
->flags
|= UNDNAME_NO_FUNCTION_RETURNS
;
1444 switch (*++sym
->current
)
1448 struct datatype_t ct
;
1452 str_array_init(&pmt
);
1453 demangle_datatype(sym
, &ct
, &pmt
, FALSE
);
1454 if (!demangle_datatype(sym
, &ct
, NULL
, FALSE
))
1456 function_name
= str_printf(sym
, "%s%s `RTTI Type Descriptor'",
1463 const char* n1
, *n2
, *n3
, *n4
;
1465 n1
= get_number(sym
);
1466 n2
= get_number(sym
);
1467 n3
= get_number(sym
);
1468 n4
= get_number(sym
);
1470 function_name
= str_printf(sym
, "`RTTI Base Class Descriptor at (%s,%s,%s,%s)'",
1474 case '2': function_name
= "`RTTI Base Class Array'"; break;
1475 case '3': function_name
= "`RTTI Class Hierarchy Descriptor'"; break;
1476 case '4': function_name
= "`RTTI Complete Object Locator'"; break;
1478 ERR("Unknown RTTI operator: _R%c\n", *sym
->current
);
1482 case 'S': function_name
= "`local vftable'"; break;
1483 case 'T': function_name
= "`local vftable constructor closure'"; break;
1484 case 'U': function_name
= "operator new[]"; break;
1485 case 'V': function_name
= "operator delete[]"; break;
1486 case 'X': function_name
= "`placement delete closure'"; break;
1487 case 'Y': function_name
= "`placement delete[] closure'"; break;
1489 ERR("Unknown operator: _%c\n", *sym
->current
);
1494 /* FIXME: Other operators */
1495 ERR("Unknown operator: %c\n", *sym
->current
);
1502 if (!str_array_push(sym
, dashed_null
, -1, &sym
->stack
))
1506 sym
->result
= (char*)function_name
;
1512 struct array array_pmt
;
1514 str_array_init(&array_pmt
);
1515 args
= get_args(sym
, &array_pmt
, FALSE
, '<', '>');
1516 if (args
!= NULL
) function_name
= str_printf(sym
, "%s%s", function_name
, args
);
1521 if (!str_array_push(sym
, function_name
, -1, &sym
->stack
))
1526 else if (*sym
->current
== '$')
1528 /* Strange construct, it's a name with a template argument list
1531 ret
= (sym
->result
= get_template_name(sym
)) != NULL
;
1534 else if (*sym
->current
== '?' && sym
->current
[1] == '$')
1537 /* Either a class name, or '@' if the symbol is not a class member */
1538 switch (*sym
->current
)
1540 case '@': sym
->current
++; break;
1543 /* Class the function is associated with, terminated by '@@' */
1544 if (!get_class(sym
)) goto done
;
1550 case 0: default: break;
1552 /* it's time to set the member name for ctor & dtor */
1553 if (sym
->stack
.num
<= 1) goto done
;
1555 sym
->stack
.elts
[0] = sym
->stack
.elts
[1];
1557 sym
->stack
.elts
[0] = str_printf(sym
, "~%s", sym
->stack
.elts
[1]);
1558 /* ctors and dtors don't have return type */
1559 sym
->flags
|= UNDNAME_NO_FUNCTION_RETURNS
;
1562 sym
->flags
&= ~UNDNAME_NO_FUNCTION_RETURNS
;
1569 /* Function/Data type and access level */
1570 if (*sym
->current
>= '0' && *sym
->current
<= '9')
1571 ret
= handle_data(sym
);
1572 else if ((*sym
->current
>= 'A' && *sym
->current
<= 'Z') || *sym
->current
== '$')
1573 ret
= handle_method(sym
, do_after
== 3);
1576 if (ret
) assert(sym
->result
);
1577 else WARN("Failed at %s\n", debugstr_a(sym
->current
));
1582 /*********************************************************************
1583 * __unDNameEx (MSVCRT.@)
1585 * Demangle a C++ identifier.
1588 * buffer [O] If not NULL, the place to put the demangled string
1589 * mangled [I] Mangled name of the function
1590 * buflen [I] Length of buffer
1591 * memget [I] Function to allocate memory with
1592 * memfree [I] Function to free memory with
1593 * unknown [?] Unknown, possibly a call back
1594 * flags [I] Flags determining demangled format
1597 * Success: A string pointing to the unmangled name, allocated with memget.
1600 char* CDECL
__unDNameEx(char* buffer
, const char* mangled
, int buflen
,
1601 malloc_func_t memget
, free_func_t memfree
,
1602 void* unknown
, unsigned short int flags
)
1604 struct parsed_symbol sym
;
1607 TRACE("(%p,%s,%d,%p,%p,%p,%x)\n",
1608 buffer
, debugstr_a(mangled
), buflen
, memget
, memfree
, unknown
, flags
);
1610 /* The flags details is not documented by MS. However, it looks exactly
1611 * like the UNDNAME_ manifest constants from imagehlp.h and dbghelp.h
1612 * So, we copied those (on top of the file)
1614 memset(&sym
, 0, sizeof(struct parsed_symbol
));
1615 if (flags
& UNDNAME_NAME_ONLY
)
1616 flags
|= UNDNAME_NO_FUNCTION_RETURNS
| UNDNAME_NO_ACCESS_SPECIFIERS
|
1617 UNDNAME_NO_MEMBER_TYPE
| UNDNAME_NO_ALLOCATION_LANGUAGE
|
1618 UNDNAME_NO_COMPLEX_TYPE
;
1621 sym
.mem_alloc_ptr
= memget
;
1622 sym
.mem_free_ptr
= memfree
;
1623 sym
.current
= mangled
;
1624 str_array_init( &sym
.names
);
1625 str_array_init( &sym
.stack
);
1627 result
= symbol_demangle(&sym
) ? sym
.result
: mangled
;
1628 if (buffer
&& buflen
)
1630 lstrcpynA( buffer
, result
, buflen
);
1634 buffer
= memget(strlen(result
) + 1);
1635 if (buffer
) strcpy(buffer
, result
);
1644 /*********************************************************************
1645 * __unDName (MSVCRT.@)
1647 char* CDECL
__unDName(char* buffer
, const char* mangled
, int buflen
,
1648 malloc_func_t memget
, free_func_t memfree
,
1649 unsigned short int flags
)
1651 return __unDNameEx(buffer
, mangled
, buflen
, memget
, memfree
, NULL
, flags
);