Automatic date update in version.in
[binutils-gdb/blckswan.git] / gdb / go-lang.c
blob844f743e83dc9fb8298fc95eb9beec5a65b6a7f2
1 /* Go language support routines for GDB, the GNU debugger.
3 Copyright (C) 2012-2022 Free Software Foundation, Inc.
5 This file is part of GDB.
7 This program is free software; you can redistribute it and/or modify
8 it under the terms of the GNU General Public License as published by
9 the Free Software Foundation; either version 3 of the License, or
10 (at your option) any later version.
12 This program is distributed in the hope that it will be useful,
13 but WITHOUT ANY WARRANTY; without even the implied warranty of
14 MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
15 GNU General Public License for more details.
17 You should have received a copy of the GNU General Public License
18 along with this program. If not, see <http://www.gnu.org/licenses/>. */
20 /* TODO:
21 - split stacks
22 - printing of native types
23 - goroutines
24 - lots more
25 - gccgo mangling needs redoing
26 It's too hard, for example, to know whether one is looking at a mangled
27 Go symbol or not, and their are ambiguities, e.g., the demangler may
28 get passed *any* symbol, including symbols from other languages
29 and including symbols that are already demangled.
30 One thought is to at least add an _G prefix.
31 - 6g mangling isn't supported yet
34 #include "defs.h"
35 #include "gdbsupport/gdb_obstack.h"
36 #include "block.h"
37 #include "symtab.h"
38 #include "language.h"
39 #include "varobj.h"
40 #include "go-lang.h"
41 #include "c-lang.h"
42 #include "parser-defs.h"
43 #include "gdbarch.h"
45 #include <ctype.h>
47 /* The main function in the main package. */
48 static const char GO_MAIN_MAIN[] = "main.main";
50 /* Function returning the special symbol name used by Go for the main
51 procedure in the main program if it is found in minimal symbol list.
52 This function tries to find minimal symbols so that it finds them even
53 if the program was compiled without debugging information. */
55 const char *
56 go_main_name (void)
58 struct bound_minimal_symbol msym;
60 msym = lookup_minimal_symbol (GO_MAIN_MAIN, NULL, NULL);
61 if (msym.minsym != NULL)
62 return GO_MAIN_MAIN;
64 /* No known entry procedure found, the main program is probably not Go. */
65 return NULL;
68 /* Return non-zero if TYPE is a gccgo string.
69 We assume CHECK_TYPEDEF has already been done. */
71 static int
72 gccgo_string_p (struct type *type)
74 /* gccgo strings don't necessarily have a name we can use. */
76 if (type->num_fields () == 2)
78 struct type *type0 = type->field (0).type ();
79 struct type *type1 = type->field (1).type ();
81 type0 = check_typedef (type0);
82 type1 = check_typedef (type1);
84 if (type0->code () == TYPE_CODE_PTR
85 && strcmp (type->field (0).name (), "__data") == 0
86 && type1->code () == TYPE_CODE_INT
87 && strcmp (type->field (1).name (), "__length") == 0)
89 struct type *target_type = TYPE_TARGET_TYPE (type0);
91 target_type = check_typedef (target_type);
93 if (target_type->code () == TYPE_CODE_INT
94 && TYPE_LENGTH (target_type) == 1
95 && strcmp (target_type->name (), "uint8") == 0)
96 return 1;
100 return 0;
103 /* Return non-zero if TYPE is a 6g string.
104 We assume CHECK_TYPEDEF has already been done. */
106 static int
107 sixg_string_p (struct type *type)
109 if (type->num_fields () == 2
110 && type->name () != NULL
111 && strcmp (type->name (), "string") == 0)
112 return 1;
114 return 0;
117 /* Classify the kind of Go object that TYPE is.
118 TYPE is a TYPE_CODE_STRUCT, used to represent a Go object. */
120 enum go_type
121 go_classify_struct_type (struct type *type)
123 type = check_typedef (type);
125 /* Recognize strings as they're useful to be able to print without
126 pretty-printers. */
127 if (gccgo_string_p (type)
128 || sixg_string_p (type))
129 return GO_TYPE_STRING;
131 return GO_TYPE_NONE;
134 /* Subroutine of unpack_mangled_go_symbol to simplify it.
135 Given "[foo.]bar.baz", store "bar" in *PACKAGEP and "baz" in *OBJECTP.
136 We stomp on the last '.' to nul-terminate "bar".
137 The caller is responsible for memory management. */
139 static void
140 unpack_package_and_object (char *buf,
141 const char **packagep, const char **objectp)
143 char *last_dot;
145 last_dot = strrchr (buf, '.');
146 gdb_assert (last_dot != NULL);
147 *objectp = last_dot + 1;
148 *last_dot = '\0';
149 last_dot = strrchr (buf, '.');
150 if (last_dot != NULL)
151 *packagep = last_dot + 1;
152 else
153 *packagep = buf;
156 /* Given a mangled Go symbol, find its package name, object name, and
157 method type (if present).
158 E.g., for "libgo_net.textproto.String.N33_libgo_net.textproto.ProtocolError"
159 *PACKAGEP = "textproto"
160 *OBJECTP = "String"
161 *METHOD_TYPE_PACKAGEP = "textproto"
162 *METHOD_TYPE_OBJECTP = "ProtocolError"
164 Space for the resulting strings is malloc'd in one buffer.
165 PACKAGEP,OBJECTP,METHOD_TYPE* will (typically) point into this buffer.
166 [There are a few exceptions, but the caller is still responsible for
167 freeing the resulting pointer.]
168 A pointer to this buffer is returned, or NULL if symbol isn't a
169 mangled Go symbol.
170 The caller is responsible for freeing the result.
172 *METHOD_TYPE_IS_POINTERP is set to a boolean indicating if
173 the method type is a pointer.
175 There may be value in returning the outer container,
176 i.e., "net" in the above example, but for now it's not needed.
177 Plus it's currently not straightforward to compute,
178 it comes from -fgo-prefix, and there's no algorithm to compute it.
180 If we ever need to unpack the method type, this routine should work
181 for that too. */
183 static char *
184 unpack_mangled_go_symbol (const char *mangled_name,
185 const char **packagep,
186 const char **objectp,
187 const char **method_type_packagep,
188 const char **method_type_objectp,
189 int *method_type_is_pointerp)
191 char *buf;
192 char *p;
193 int len = strlen (mangled_name);
194 /* Pointer to last digit in "N<digit(s)>_". */
195 char *saw_digit;
196 /* Pointer to "N" if valid "N<digit(s)>_" found. */
197 char *method_type;
198 /* Pointer to the first '.'. */
199 const char *first_dot;
200 /* Pointer to the last '.'. */
201 const char *last_dot;
202 /* Non-zero if we saw a pointer indicator. */
203 int saw_pointer;
205 *packagep = *objectp = NULL;
206 *method_type_packagep = *method_type_objectp = NULL;
207 *method_type_is_pointerp = 0;
209 /* main.init is mangled specially. */
210 if (strcmp (mangled_name, "__go_init_main") == 0)
212 char *package = xstrdup ("main");
214 *packagep = package;
215 *objectp = "init";
216 return package;
219 /* main.main is mangled specially (missing prefix). */
220 if (strcmp (mangled_name, "main.main") == 0)
222 char *package = xstrdup ("main");
224 *packagep = package;
225 *objectp = "main";
226 return package;
229 /* We may get passed, e.g., "main.T.Foo", which is *not* mangled.
230 Alas it looks exactly like "prefix.package.object."
231 To cope for now we only recognize the following prefixes:
233 go: the default
234 libgo_.*: used by gccgo's runtime
236 Thus we don't support -fgo-prefix (except as used by the runtime). */
237 if (!startswith (mangled_name, "go.")
238 && !startswith (mangled_name, "libgo_"))
239 return NULL;
241 /* Quick check for whether a search may be fruitful. */
242 /* Ignore anything with @plt, etc. in it. */
243 if (strchr (mangled_name, '@') != NULL)
244 return NULL;
245 /* It must have at least two dots. */
246 first_dot = strchr (mangled_name, '.');
247 if (first_dot == NULL)
248 return NULL;
249 /* Treat "foo.bar" as unmangled. It can collide with lots of other
250 languages and it's not clear what the consequences are.
251 And except for main.main, all gccgo symbols are at least
252 prefix.package.object. */
253 last_dot = strrchr (mangled_name, '.');
254 if (last_dot == first_dot)
255 return NULL;
257 /* More quick checks. */
258 if (last_dot[1] == '\0' /* foo. */
259 || last_dot[-1] == '.') /* foo..bar */
260 return NULL;
262 /* At this point we've decided we have a mangled Go symbol. */
264 buf = xstrdup (mangled_name);
266 /* Search backwards looking for "N<digit(s)>". */
267 p = buf + len;
268 saw_digit = method_type = NULL;
269 saw_pointer = 0;
270 while (p > buf)
272 int current = *(const unsigned char *) --p;
273 int current_is_digit = isdigit (current);
275 if (saw_digit)
277 if (current_is_digit)
278 continue;
279 if (current == 'N'
280 && ((p > buf && p[-1] == '.')
281 || (p > buf + 1 && p[-1] == 'p' && p[-2] == '.')))
283 if (atoi (p + 1) == strlen (saw_digit + 2))
285 if (p[-1] == '.')
286 method_type = p - 1;
287 else
289 gdb_assert (p[-1] == 'p');
290 saw_pointer = 1;
291 method_type = p - 2;
293 break;
296 /* Not what we're looking for, reset and keep looking. */
297 saw_digit = NULL;
298 saw_pointer = 0;
299 continue;
301 if (current_is_digit && p[1] == '_')
303 /* Possible start of method "this" [sic] type. */
304 saw_digit = p;
305 continue;
309 if (method_type != NULL
310 /* Ensure not something like "..foo". */
311 && (method_type > buf && method_type[-1] != '.'))
313 unpack_package_and_object (saw_digit + 2,
314 method_type_packagep, method_type_objectp);
315 *method_type = '\0';
316 *method_type_is_pointerp = saw_pointer;
319 unpack_package_and_object (buf, packagep, objectp);
320 return buf;
323 /* Implements the la_demangle language_defn routine for language Go.
325 N.B. This may get passed *any* symbol, including symbols from other
326 languages and including symbols that are already demangled.
327 Both of these situations are kinda unfortunate, but that's how things
328 are today.
330 N.B. This currently only supports gccgo's mangling.
332 N.B. gccgo's mangling needs, I think, changing.
333 This demangler can't work in all situations,
334 thus not too much effort is currently put into it. */
336 gdb::unique_xmalloc_ptr<char>
337 go_language::demangle_symbol (const char *mangled_name, int options) const
339 const char *package_name;
340 const char *object_name;
341 const char *method_type_package_name;
342 const char *method_type_object_name;
343 int method_type_is_pointer;
345 if (mangled_name == NULL)
346 return NULL;
348 gdb::unique_xmalloc_ptr<char> name_buf
349 (unpack_mangled_go_symbol (mangled_name,
350 &package_name, &object_name,
351 &method_type_package_name,
352 &method_type_object_name,
353 &method_type_is_pointer));
354 if (name_buf == NULL)
355 return NULL;
357 auto_obstack tempbuf;
359 /* Print methods as they appear in "method expressions". */
360 if (method_type_package_name != NULL)
362 /* FIXME: Seems like we should include package_name here somewhere. */
363 if (method_type_is_pointer)
364 obstack_grow_str (&tempbuf, "(*");
365 obstack_grow_str (&tempbuf, method_type_package_name);
366 obstack_grow_str (&tempbuf, ".");
367 obstack_grow_str (&tempbuf, method_type_object_name);
368 if (method_type_is_pointer)
369 obstack_grow_str (&tempbuf, ")");
370 obstack_grow_str (&tempbuf, ".");
371 obstack_grow_str (&tempbuf, object_name);
373 else
375 obstack_grow_str (&tempbuf, package_name);
376 obstack_grow_str (&tempbuf, ".");
377 obstack_grow_str (&tempbuf, object_name);
379 obstack_grow_str0 (&tempbuf, "");
381 return make_unique_xstrdup ((const char *) obstack_finish (&tempbuf));
384 /* Given a Go symbol, return its package or NULL if unknown.
385 Space for the result is malloc'd, caller must free. */
387 char *
388 go_symbol_package_name (const struct symbol *sym)
390 const char *mangled_name = sym->linkage_name ();
391 const char *package_name;
392 const char *object_name;
393 const char *method_type_package_name;
394 const char *method_type_object_name;
395 int method_type_is_pointer;
396 char *name_buf;
397 char *result;
399 gdb_assert (sym->language () == language_go);
400 name_buf = unpack_mangled_go_symbol (mangled_name,
401 &package_name, &object_name,
402 &method_type_package_name,
403 &method_type_object_name,
404 &method_type_is_pointer);
405 /* Some Go symbols don't have mangled form we interpret (yet). */
406 if (name_buf == NULL)
407 return NULL;
408 result = xstrdup (package_name);
409 xfree (name_buf);
410 return result;
413 /* Return the package that BLOCK is in, or NULL if there isn't one.
414 Space for the result is malloc'd, caller must free. */
416 char *
417 go_block_package_name (const struct block *block)
419 while (block != NULL)
421 struct symbol *function = block->function ();
423 if (function != NULL)
425 char *package_name = go_symbol_package_name (function);
427 if (package_name != NULL)
428 return package_name;
430 /* Stop looking if we find a function without a package name.
431 We're most likely outside of Go and thus the concept of the
432 "current" package is gone. */
433 return NULL;
436 block = block->superblock ();
439 return NULL;
442 /* See language.h. */
444 void
445 go_language::language_arch_info (struct gdbarch *gdbarch,
446 struct language_arch_info *lai) const
448 const struct builtin_go_type *builtin = builtin_go_type (gdbarch);
450 /* Helper function to allow shorter lines below. */
451 auto add = [&] (struct type * t) -> struct type *
453 lai->add_primitive_type (t);
454 return t;
457 add (builtin->builtin_void);
458 add (builtin->builtin_char);
459 add (builtin->builtin_bool);
460 add (builtin->builtin_int);
461 add (builtin->builtin_uint);
462 add (builtin->builtin_uintptr);
463 add (builtin->builtin_int8);
464 add (builtin->builtin_int16);
465 add (builtin->builtin_int32);
466 add (builtin->builtin_int64);
467 add (builtin->builtin_uint8);
468 add (builtin->builtin_uint16);
469 add (builtin->builtin_uint32);
470 add (builtin->builtin_uint64);
471 add (builtin->builtin_float32);
472 add (builtin->builtin_float64);
473 add (builtin->builtin_complex64);
474 add (builtin->builtin_complex128);
476 lai->set_string_char_type (builtin->builtin_char);
477 lai->set_bool_type (builtin->builtin_bool, "bool");
480 /* Single instance of the Go language class. */
482 static go_language go_language_defn;
484 static void *
485 build_go_types (struct gdbarch *gdbarch)
487 struct builtin_go_type *builtin_go_type
488 = GDBARCH_OBSTACK_ZALLOC (gdbarch, struct builtin_go_type);
490 builtin_go_type->builtin_void
491 = arch_type (gdbarch, TYPE_CODE_VOID, TARGET_CHAR_BIT, "void");
492 builtin_go_type->builtin_char
493 = arch_character_type (gdbarch, 8, 1, "char");
494 builtin_go_type->builtin_bool
495 = arch_boolean_type (gdbarch, 8, 0, "bool");
496 builtin_go_type->builtin_int
497 = arch_integer_type (gdbarch, gdbarch_int_bit (gdbarch), 0, "int");
498 builtin_go_type->builtin_uint
499 = arch_integer_type (gdbarch, gdbarch_int_bit (gdbarch), 1, "uint");
500 builtin_go_type->builtin_uintptr
501 = arch_integer_type (gdbarch, gdbarch_ptr_bit (gdbarch), 1, "uintptr");
502 builtin_go_type->builtin_int8
503 = arch_integer_type (gdbarch, 8, 0, "int8");
504 builtin_go_type->builtin_int16
505 = arch_integer_type (gdbarch, 16, 0, "int16");
506 builtin_go_type->builtin_int32
507 = arch_integer_type (gdbarch, 32, 0, "int32");
508 builtin_go_type->builtin_int64
509 = arch_integer_type (gdbarch, 64, 0, "int64");
510 builtin_go_type->builtin_uint8
511 = arch_integer_type (gdbarch, 8, 1, "uint8");
512 builtin_go_type->builtin_uint16
513 = arch_integer_type (gdbarch, 16, 1, "uint16");
514 builtin_go_type->builtin_uint32
515 = arch_integer_type (gdbarch, 32, 1, "uint32");
516 builtin_go_type->builtin_uint64
517 = arch_integer_type (gdbarch, 64, 1, "uint64");
518 builtin_go_type->builtin_float32
519 = arch_float_type (gdbarch, 32, "float32", floatformats_ieee_single);
520 builtin_go_type->builtin_float64
521 = arch_float_type (gdbarch, 64, "float64", floatformats_ieee_double);
522 builtin_go_type->builtin_complex64
523 = init_complex_type ("complex64", builtin_go_type->builtin_float32);
524 builtin_go_type->builtin_complex128
525 = init_complex_type ("complex128", builtin_go_type->builtin_float64);
527 return builtin_go_type;
530 static struct gdbarch_data *go_type_data;
532 const struct builtin_go_type *
533 builtin_go_type (struct gdbarch *gdbarch)
535 return (const struct builtin_go_type *) gdbarch_data (gdbarch, go_type_data);
538 void _initialize_go_language ();
539 void
540 _initialize_go_language ()
542 go_type_data = gdbarch_data_register_post_init (build_go_types);