From: Sergey Kaplun via Tarantool-patches <tarantool-patches@dev.tarantool.org>
To: Sergey Bronnikov <sergeyb@tarantool.org>,
Evgeniy Temirgaleev <e.temirgaleev@tarantool.org>
Cc: tarantool-patches@dev.tarantool.org
Subject: [Tarantool-patches] [PATCH luajit 3/4] dbg: introduce lj-gco command
Date: Thu, 4 Jun 2026 12:30:51 +0300 [thread overview]
Message-ID: <20260604093052.2221827-4-skaplun@tarantool.org> (raw)
In-Reply-To: <20260604093052.2221827-1-skaplun@tarantool.org>
Our GDB extension already has dumpers for TValues. But sometimes it
may be useful to dump GC objects (GCobj) without stack context. This
patch adds additional wrappers around dumpers for GC objects to get the
corresponding GC object from a TValue. Also, the lj-gco command is
introduced. It allows dumping GC objects without stack context. The
output format is the same as for the lj-tv command.
Part of tarantool/tarantool#4808
---
src/luajit_dbg.py | 182 ++++++++++++------
.../debug-extension-tests.py | 83 ++++++--
2 files changed, 190 insertions(+), 75 deletions(-)
diff --git a/src/luajit_dbg.py b/src/luajit_dbg.py
index 300d65e9..f5868e61 100644
--- a/src/luajit_dbg.py
+++ b/src/luajit_dbg.py
@@ -882,44 +882,29 @@ def lightudV(tv):
# Dumpers.
+# GCobj dumpers.
-def dump_lj_tnil(tv):
- return 'nil'
-
-
-def dump_lj_tfalse(tv):
- return 'false'
-
-
-def dump_lj_ttrue(tv):
- return 'true'
-
-
-def dump_lj_tlightud(tv):
- return 'light userdata @ {}'.format(strx64(lightudV(tv)))
-
-
-def dump_lj_tstr(tv):
+def dump_lj_gco_str(gcobj):
return 'string {body} @ {address}'.format(
- body=strdata(gcval(tv['gcr'])),
- address=strx64(gcval(tv['gcr']))
+ body=strdata(gcobj),
+ address=strx64(gcobj)
)
-def dump_lj_tupval(tv):
- return 'upvalue @ {}'.format(strx64(gcval(tv['gcr'])))
+def dump_lj_gco_upval(gcobj):
+ return 'upvalue @ {}'.format(strx64(gcobj))
-def dump_lj_tthread(tv):
- return 'thread @ {}'.format(strx64(gcval(tv['gcr'])))
+def dump_lj_gco_thread(gcobj):
+ return 'thread @ {}'.format(strx64(gcobj))
-def dump_lj_tproto(tv):
- return 'proto @ {}'.format(strx64(gcval(tv['gcr'])))
+def dump_lj_gco_proto(gcobj):
+ return 'proto @ {}'.format(strx64(gcobj))
-def dump_lj_tfunc(tv):
- func = dbg.cast('struct GCfuncC *', gcval(tv['gcr']))
+def dump_lj_gco_func(gcobj):
+ func = dbg.cast('struct GCfuncC *', gcobj)
ffid = func['ffid']
if ffid == 0:
@@ -936,20 +921,20 @@ def dump_lj_tfunc(tv):
return 'fast function #{}'.format(int(ffid))
-def dump_lj_ttrace(tv):
- trace = dbg.cast('struct GCtrace *', gcval(tv['gcr']))
+def dump_lj_gco_trace(gcobj):
+ trace = dbg.cast('struct GCtrace *', gcobj)
return 'trace {traceno} @ {addr}'.format(
traceno=strx64(trace['traceno']),
addr=strx64(trace)
)
-def dump_lj_tcdata(tv):
- return 'cdata @ {}'.format(strx64(gcval(tv['gcr'])))
+def dump_lj_gco_cdata(gcobj):
+ return 'cdata @ {}'.format(strx64(gcobj))
-def dump_lj_ttab(tv):
- table = dbg.cast('GCtab *', gcval(tv['gcr']))
+def dump_lj_gco_tab(gcobj):
+ table = dbg.cast('GCtab *', gcobj)
return 'table @ {gcr} (asize: {asize}, hmask: {hmask})'.format(
gcr=strx64(table),
asize=table['asize'],
@@ -957,41 +942,94 @@ def dump_lj_ttab(tv):
)
-def dump_lj_tudata(tv):
- return 'userdata @ {}'.format(strx64(gcval(tv['gcr'])))
+def dump_lj_gco_udata(gcobj):
+ return 'userdata @ {}'.format(strx64(gcobj))
+
+
+def dump_lj_gco_invalid(gcobj):
+ return 'not valid type @ {}'.format(strx64(gcobj))
+
+
+# TValue dumpers
+
+def dump_lj_tv_nil(tv):
+ return 'nil'
+
+
+def dump_lj_tv_false(tv):
+ return 'false'
+
+
+def dump_lj_tv_true(tv):
+ return 'true'
+
+
+def dump_lj_tv_lightud(tv):
+ return 'light userdata @ {}'.format(strx64(lightudV(tv)))
+
+
+# Generate wrappers for TValues containing GCobj.
+gco_fn_dumpers = [
+ fn for fn in globals().keys() if fn.startswith('dump_lj_gco')
+]
+for fn_name in gco_fn_dumpers:
+ wrapped_fn_name = fn_name.replace('gco', 'tv')
+ # Lambda takes `fn_name` as a reference, so the additional
+ # lambda is needed to fixate the correct wrapper.
+ globals()[wrapped_fn_name] = (lambda f: (
+ lambda tv: globals()[f](gcval(tv['gcr']))
+ ))(fn_name)
-def dump_lj_tnumx(tv):
+def dump_lj_tv_numx(tv):
if tvisint(tv):
return 'integer {}'.format(dbg.cast('int32_t', tv['i']))
else:
return 'number {}'.format(dbg.cast('double', tv['n']))
-def dump_lj_invalid(tv):
- return 'not valid type @ {}'.format(strx64(gcval(tv['gcr'])))
-
-
-dumpers = {
- 'LJ_TNIL': dump_lj_tnil,
- 'LJ_TFALSE': dump_lj_tfalse,
- 'LJ_TTRUE': dump_lj_ttrue,
- 'LJ_TLIGHTUD': dump_lj_tlightud,
- 'LJ_TSTR': dump_lj_tstr,
- 'LJ_TUPVAL': dump_lj_tupval,
- 'LJ_TTHREAD': dump_lj_tthread,
- 'LJ_TPROTO': dump_lj_tproto,
- 'LJ_TFUNC': dump_lj_tfunc,
- 'LJ_TTRACE': dump_lj_ttrace,
- 'LJ_TCDATA': dump_lj_tcdata,
- 'LJ_TTAB': dump_lj_ttab,
- 'LJ_TUDATA': dump_lj_tudata,
- 'LJ_TNUMX': dump_lj_tnumx,
+gco_dumpers = {
+ 'LJ_TSTR': dump_lj_gco_str,
+ 'LJ_TUPVAL': dump_lj_gco_upval,
+ 'LJ_TTHREAD': dump_lj_gco_thread,
+ 'LJ_TPROTO': dump_lj_gco_proto,
+ 'LJ_TFUNC': dump_lj_gco_func,
+ 'LJ_TTRACE': dump_lj_gco_trace,
+ 'LJ_TCDATA': dump_lj_gco_cdata,
+ 'LJ_TTAB': dump_lj_gco_tab,
+ 'LJ_TUDATA': dump_lj_gco_udata,
}
+tv_dumpers = {
+ 'LJ_TNIL': dump_lj_tv_nil,
+ 'LJ_TFALSE': dump_lj_tv_false,
+ 'LJ_TTRUE': dump_lj_tv_true,
+ 'LJ_TLIGHTUD': dump_lj_tv_lightud,
+ 'LJ_TSTR': dump_lj_tv_str, # noqa: F821 # Generated.
+ 'LJ_TUPVAL': dump_lj_tv_upval, # noqa: F821 # Generated.
+ 'LJ_TTHREAD': dump_lj_tv_thread, # noqa: F821 # Generated.
+ 'LJ_TPROTO': dump_lj_tv_proto, # noqa: F821 # Generated.
+ 'LJ_TFUNC': dump_lj_tv_func, # noqa: F821 # Generated.
+ 'LJ_TTRACE': dump_lj_tv_trace, # noqa: F821 # Generated.
+ 'LJ_TCDATA': dump_lj_tv_cdata, # noqa: F821 # Generated.
+ 'LJ_TTAB': dump_lj_tv_tab, # noqa: F821 # Generated.
+ 'LJ_TUDATA': dump_lj_tv_udata, # noqa: F821 # Generated.
+ 'LJ_TNUMX': dump_lj_tv_numx,
+}
+
+
+def dump_gcobj(gcobj):
+ return gco_dumpers.get(
+ typenames(i2notu32(gcobj['gch']['gct'])), dump_lj_gco_invalid
+ )(gcobj)
+
+
def dump_tvalue(tvalue):
- return dumpers.get(typenames(itypemap(tvalue)), dump_lj_invalid)(tvalue)
+ return tv_dumpers.get(
+ typenames(itypemap(tvalue)),
+ dump_lj_tv_invalid # noqa: F821 # Generated.
+ )(tvalue)
def dump_framelink_slot_address(fr):
@@ -1011,7 +1049,7 @@ def dump_framelink(L, fr):
p='P' if frame_typep(fr) & FRAME_P else ''
),
d=dbg.cast('TValue *', fr) - dbg.cast('TValue *', frame_prev(fr)),
- f=dump_lj_tfunc(fr - LJ_FR2),
+ f=dump_lj_tv_func(fr - LJ_FR2), # noqa: F821 # Generated.
)
@@ -1141,6 +1179,35 @@ The command requires no args and dumps current GC stats:
))
+class LJDumpGCobj(dbg.LJBase):
+ '''
+lj-gco <GCobj *>
+
+The command receives a pointer to <GCobj> (GCobj address) and dumps
+the type and some info related to it.
+
+* LJ_TSTR: string <string payload> @ <gcr>
+* LJ_TUPVAL: upvalue @ <gcr>
+* LJ_TTHREAD: thread @ <gcr>
+* LJ_TPROTO: proto @ <gcr>
+* LJ_TFUNC: <LFUNC|CFUNC|FFUNC>
+ <LFUNC>: Lua function @ <gcr>, <nupvals> upvalues, <chunk:line>
+ <CFUNC>: C function <mcode address>
+ <FFUNC>: fast function #<ffid>
+* LJ_TTRACE: trace <traceno> @ <gcr>
+* LJ_TCDATA: cdata @ <gcr>
+* LJ_TTAB: table @ <gcr> (asize: <asize>, hmask: <hmask>)
+* LJ_TUDATA: userdata @ <gcr>
+
+Whether the type of the given address differs from the listed above, then
+error message occurs.
+ '''
+
+ def execute(self, arg):
+ gcobj = dbg.cast('GCobj *', dbg.eval(arg))
+ dbg.write('{}\n'.format(dump_gcobj(gcobj)))
+
+
class LJDumpStack(dbg.LJBase):
'''
lj-stack [<lua_State *>]
@@ -1302,6 +1369,7 @@ def load(event=None):
dbg.initialize_extension({
'lj-arch': LJDumpArch,
'lj-gc': LJGC,
+ 'lj-gco': LJDumpGCobj,
'lj-stack': LJDumpStack,
'lj-state': LJState,
'lj-str': LJDumpString,
diff --git a/test/tarantool-debugger-tests/debug-extension-tests.py b/test/tarantool-debugger-tests/debug-extension-tests.py
index 06a118ff..7e2b5ac4 100644
--- a/test/tarantool-debugger-tests/debug-extension-tests.py
+++ b/test/tarantool-debugger-tests/debug-extension-tests.py
@@ -138,6 +138,17 @@ class TestCaseBase(unittest.TestCase):
self.assertRegex(self.output, self.pattern.strip())
+# LLDB + Clang on macOS can't produce debug info for the C-defined
+# macros. Thus, we hardcoded its value manually.
+def gcval(arg):
+ if sys.platform == 'darwin':
+ # Assume GC64 build only.
+ LJ_GCVMASK = '(((uint64_t)1 << 47) - 1)'
+ return '(((' + arg + ')->gcr).gcptr64 & ' + LJ_GCVMASK + ')'
+ else:
+ return 'gcval(' + arg + ')'
+
+
class TestLoad(TestCaseBase):
extension_cmds = ''
location = 'lj_cf_print'
@@ -145,6 +156,7 @@ class TestLoad(TestCaseBase):
pattern = (
r'lj-arch command initialized\n'
r'lj-gc command initialized\n'
+ r'lj-gco command initialized\n'
r'lj-stack command initialized\n'
r'lj-state command initialized\n'
r'lj-str command initialized\n'
@@ -223,6 +235,31 @@ class TestLJStackFunc(TestCaseBase):
pattern = STACK_RX
+# Sorted in LJT order.
+GCO_ARGS = (
+ '"hello",\n'
+ 'coroutine.create(function() end),\n'
+ 'function() end,\n'
+ 'require,\n'
+ 'print,\n'
+ 'ffi.new("int*"),\n'
+ '{1},\n'
+ 'newproxy(),\n'
+)
+
+
+GCO_RX = (
+ r'string \"hello\" @ ' + RX_ADDR + r'\n'
+ r'thread @ ' + RX_ADDR + r'\n'
+ r'Lua function @ ' + RX_ADDR + r', [0-9]+ upvalues, .+:[0-9]+\n'
+ r'C function @ ' + RX_ADDR + r'\n'
+ r'fast function #[0-9]+\n'
+ r'cdata @ ' + RX_ADDR + r'\n'
+ r'table @ ' + RX_ADDR + r' \(asize: \d+, hmask: ' + RX_HASH + r'\)\n'
+ r'userdata @ ' + RX_ADDR + r'\n'
+)
+
+
class TestLJTV(TestCaseBase):
location = 'lj_cf_print'
extension_cmds = (
@@ -249,15 +286,8 @@ class TestLJTV(TestCaseBase):
' nil,\n'
' false,\n'
' true,\n'
- ' debug.upvalueid(print, 1), \n' # lightuserdata
- ' "hello",\n'
- ' coroutine.create(function() end),\n'
- ' function() end,\n'
- ' require,\n'
- ' print,\n'
- ' ffi.new("int*"),\n'
- ' {1},\n'
- ' newproxy(),\n'
+ ' debug.upvalueid(print, 1), \n' + # lightuserdata
+ GCO_ARGS +
' 1,\n'
' 1.1\n'
')\n'
@@ -267,15 +297,8 @@ class TestLJTV(TestCaseBase):
r'nil\n'
r'false\n'
r'true\n'
- r'light userdata @ ' + RX_ADDR + r'\n'
- r'string \"hello\" @ ' + RX_ADDR + r'\n'
- r'thread @ ' + RX_ADDR + r'\n'
- r'Lua function @ ' + RX_ADDR + r', [0-9]+ upvalues, .+:[0-9]+\n'
- r'C function @ ' + RX_ADDR + r'\n'
- r'fast function #[0-9]+\n'
- r'cdata @ ' + RX_ADDR + r'\n'
- r'table @ ' + RX_ADDR + r' \(asize: \d+, hmask: ' + RX_HASH + r'\)\n'
- r'userdata @ ' + RX_ADDR + r'\n'
+ r'light userdata @ ' + RX_ADDR + r'\n' +
+ GCO_RX +
RX_INT + r' .*1.*\n'
r'number 1.1\d+\n'
)
@@ -312,6 +335,30 @@ class TestLJTab(TestCaseBase):
)
+class TestLJGCo(TestCaseBase):
+ location = 'lj_cf_print'
+ extension_cmds = (
+ 'lj-gco ' + gcval('L->base + 0') + '\n'
+ 'lj-gco ' + gcval('L->base + 1') + '\n'
+ 'lj-gco ' + gcval('L->base + 2') + '\n'
+ 'lj-gco ' + gcval('L->base + 3') + '\n'
+ 'lj-gco ' + gcval('L->base + 4') + '\n'
+ 'lj-gco ' + gcval('L->base + 5') + '\n'
+ 'lj-gco ' + gcval('L->base + 6') + '\n'
+ 'lj-gco ' + gcval('L->base + 7') + '\n'
+ )
+
+ lua_script = (
+ 'local ffi = require("ffi")\n'
+ 'print(\n' +
+ GCO_ARGS +
+ ' 1\n' # Stub for the pattern.
+ ')\n'
+ )
+
+ pattern = GCO_RX
+
+
for test_cls in TestCaseBase.__subclasses__():
test_cls.test = lambda self: self.check()
--
2.54.0
next prev parent reply other threads:[~2026-06-04 9:33 UTC|newest]
Thread overview: 13+ messages / expand[flat|nested] mbox.gz Atom feed top
2026-06-04 9:30 [Tarantool-patches] [PATCH luajit 0/4] Introduce dumpers for bytecodes in debuggers Sergey Kaplun via Tarantool-patches
2026-06-04 9:30 ` [Tarantool-patches] [PATCH luajit 1/4] dbg: fix lj-stack command for LLDB Sergey Kaplun via Tarantool-patches
2026-06-05 14:55 ` Sergey Bronnikov via Tarantool-patches
2026-06-04 9:30 ` [Tarantool-patches] [PATCH luajit 2/4] dbg: fix DUALNUM detection " Sergey Kaplun via Tarantool-patches
2026-06-05 14:57 ` Sergey Bronnikov via Tarantool-patches
2026-06-05 16:01 ` Sergey Kaplun via Tarantool-patches
2026-06-04 9:30 ` Sergey Kaplun via Tarantool-patches [this message]
2026-06-05 15:02 ` [Tarantool-patches] [PATCH luajit 3/4] dbg: introduce lj-gco command Sergey Bronnikov via Tarantool-patches
2026-06-04 9:30 ` [Tarantool-patches] [PATCH luajit 4/4] dbg: introduce lj-bc, lj-func and lj-proto dumpers Sergey Kaplun via Tarantool-patches
2026-06-05 15:07 ` Sergey Bronnikov via Tarantool-patches
2026-06-05 16:10 ` Sergey Kaplun via Tarantool-patches
2026-06-05 14:55 ` [Tarantool-patches] [PATCH luajit 0/4] Introduce dumpers for bytecodes in debuggers Sergey Bronnikov via Tarantool-patches
2026-06-05 16:03 ` [Tarantool-patches] [PATCH luajit 3/5] dbg: update help for the lj-arch command Sergey Kaplun via Tarantool-patches
Reply instructions:
You may reply publicly to this message via plain-text email
using any one of the following methods:
* Save the following mbox file, import it into your mail client,
and reply-to-all from there: mbox
Avoid top-posting and favor interleaved quoting:
https://en.wikipedia.org/wiki/Posting_style#Interleaved_style
* Reply using the --to, --cc, and --in-reply-to
switches of git-send-email(1):
git send-email \
--in-reply-to=20260604093052.2221827-4-skaplun@tarantool.org \
--to=tarantool-patches@dev.tarantool.org \
--cc=e.temirgaleev@tarantool.org \
--cc=sergeyb@tarantool.org \
--cc=skaplun@tarantool.org \
--subject='Re: [Tarantool-patches] [PATCH luajit 3/4] dbg: introduce lj-gco command' \
/path/to/YOUR_REPLY
https://kernel.org/pub/software/scm/git/docs/git-send-email.html
* If your mail client supports setting the In-Reply-To header
via mailto: links, try the mailto: link
This is a public inbox, see mirroring instructions
for how to clone and mirror all data and code used for this inbox