mirror of
https://github.com/ElementsProject/lightning.git
synced 2025-01-03 20:44:54 +01:00
07c4d39b75
... and then dualopend returns, and we access the freed leak_detect struct. ``` lightningd: FATAL SIGNAL 6 (version 065ca1e) 0x55ecd4be8145 send_backtrace common/daemon.c:33 0x55ecd4be81f1 crashdump common/daemon.c:46 0x7f200acab51f ??? ./signal/../sysdeps/unix/sysv/linux/x86_64/libc_sigaction.c:0 0x7f200acff828 __pthread_kill_implementation ./nptl/pthread_kill.c:44 0x7f200acff828 __pthread_kill_internal ./nptl/pthread_kill.c:80 0x7f200acff828 __GI___pthread_kill ./nptl/pthread_kill.c:91 0x7f200acab475 __GI_raise ../sysdeps/posix/raise.c:26 0x7f200ac917b6 __GI_abort ./stdlib/abort.c:79 0x55ecd4c6827f call_error ccan/ccan/tal/tal.c:93 0x55ecd4c68470 check_bounds ccan/ccan/tal/tal.c:165 0x55ecd4c684c2 to_tal_hdr ccan/ccan/tal/tal.c:175 0x55ecd4c68eb8 tal_free ccan/ccan/tal/tal.c:479 0x55ecd4b8bdd0 finish_report lightningd/memdump.c:138 0x55ecd4b8c115 leak_detect_req_done lightningd/memdump.c:201 0x55ecd4c68664 notify ccan/ccan/tal/tal.c:237 0x55ecd4c68b9e del_tree ccan/ccan/tal/tal.c:402 0x55ecd4c68bf3 del_tree ccan/ccan/tal/tal.c:412 0x55ecd4c68bf3 del_tree ccan/ccan/tal/tal.c:412 0x55ecd4c68f43 tal_free ccan/ccan/tal/tal.c:486 0x55ecd4c5751f io_close ccan/ccan/io/io.c:450 0x55ecd4bbce68 subd_shutdown_remaining lightningd/subd.c:911 0x55ecd4b8724a shutdown_subdaemons lightningd/lightningd.c:541 0x55ecd4b883cc main lightningd/lightningd.c:1207 0x7f200ac92fcf __libc_start_call_main ../sysdeps/nptl/libc_start_call_main.h:58 0x7f200ac9307c __libc_start_main_impl ../csu/libc-start.c:409 0x55ecd4b5cc54 ??? ``` Signed-off-by: Rusty Russell <rusty@rustcorp.com.au>
312 lines
8.3 KiB
C
312 lines
8.3 KiB
C
/* Only possible if we're in developer mode. */
|
|
#include "config.h"
|
|
#if DEVELOPER
|
|
#include <backtrace.h>
|
|
#include <ccan/tal/str/str.h>
|
|
#include <common/json_command.h>
|
|
#include <common/memleak.h>
|
|
#include <common/param.h>
|
|
#include <common/timeout.h>
|
|
#include <connectd/connectd_wiregen.h>
|
|
#include <errno.h>
|
|
#include <gossipd/gossipd_wiregen.h>
|
|
#include <hsmd/hsmd_wiregen.h>
|
|
#include <lightningd/chaintopology.h>
|
|
#include <lightningd/jsonrpc.h>
|
|
#include <lightningd/lightningd.h>
|
|
#include <lightningd/memdump.h>
|
|
#include <lightningd/opening_common.h>
|
|
#include <lightningd/peer_control.h>
|
|
#include <lightningd/subd.h>
|
|
#include <wire/wire_sync.h>
|
|
|
|
static void json_add_ptr(struct json_stream *response, const char *name,
|
|
const void *ptr)
|
|
{
|
|
char ptrstr[STR_MAX_CHARS(void *)];
|
|
snprintf(ptrstr, sizeof(ptrstr), "%p", ptr);
|
|
json_add_string(response, name, ptrstr);
|
|
}
|
|
|
|
static size_t add_memdump(struct json_stream *response,
|
|
const char *name, const tal_t *root,
|
|
struct command *cmd)
|
|
{
|
|
const tal_t *i;
|
|
size_t cumulative_size = 0;
|
|
|
|
json_array_start(response, name);
|
|
for (i = tal_first(root); i; i = tal_next(i)) {
|
|
const char *name = tal_name(i);
|
|
size_t size = tal_bytelen(i);
|
|
|
|
/* Don't try to dump this command! */
|
|
if (i == cmd || i == cmd->jcon)
|
|
continue;
|
|
|
|
/* Don't dump logs, we know they grow. */
|
|
if (name && streq(name, "struct log_book"))
|
|
continue;
|
|
|
|
json_object_start(response, NULL);
|
|
json_add_ptr(response, "parent", tal_parent(i));
|
|
json_add_ptr(response, "value", i);
|
|
json_add_u64(response, "size", size);
|
|
if (name)
|
|
json_add_string(response, "label", name);
|
|
|
|
if (tal_first(i))
|
|
size += add_memdump(response, "children", i, cmd);
|
|
json_add_u64(response, "cumulative_size", size);
|
|
json_object_end(response);
|
|
cumulative_size += size;
|
|
}
|
|
json_array_end(response);
|
|
return cumulative_size;
|
|
}
|
|
|
|
static struct command_result *json_memdump(struct command *cmd,
|
|
const char *buffer,
|
|
const jsmntok_t *obj UNNEEDED,
|
|
const jsmntok_t *params)
|
|
{
|
|
struct json_stream *response;
|
|
|
|
if (!param(cmd, buffer, params, NULL))
|
|
return command_param_failed();
|
|
|
|
response = json_stream_success(cmd);
|
|
add_memdump(response, "memdump", NULL, cmd);
|
|
|
|
return command_success(cmd, response);
|
|
}
|
|
|
|
static const struct json_command dev_memdump_command = {
|
|
"dev-memdump",
|
|
"developer",
|
|
json_memdump,
|
|
"Show memory objects currently in use"
|
|
};
|
|
AUTODATA(json_command, &dev_memdump_command);
|
|
|
|
/* Callback handed to backtrace_pcinfo(): @data is the json_stream to
 * append to.  Adds one unnamed string "file:line (function)" per call,
 * or nothing when either @filename or @function is missing.
 * Always returns 0. */
static int json_add_syminfo(void *data, uintptr_t pc UNUSED,
			    const char *filename, int lineno,
			    const char *function)
{
	struct json_stream *stream = data;

	/* Either of these can be absent in backtraces. */
	if (filename && function) {
		char *location = tal_fmt(stream, "%s:%u (%s)",
					 filename, lineno, function);

		json_add_string(stream, NULL, location);
		tal_free(location);
	}
	return 0;
}
|
|
|
|
static void json_add_backtrace(struct json_stream *response,
|
|
const uintptr_t *bt)
|
|
{
|
|
size_t i;
|
|
|
|
if (!bt)
|
|
return;
|
|
|
|
json_array_start(response, "backtrace");
|
|
/* First one serves as counter. */
|
|
for (i = 1; i < bt[0]; i++) {
|
|
backtrace_pcinfo(backtrace_state,
|
|
bt[i], json_add_syminfo,
|
|
NULL, response);
|
|
}
|
|
json_array_end(response);
|
|
}
|
|
|
|
static void finish_report(const struct leak_detect *leaks)
|
|
{
|
|
struct htable *memtable;
|
|
const tal_t *i;
|
|
const uintptr_t *backtrace;
|
|
struct command *cmd;
|
|
struct lightningd *ld;
|
|
struct json_stream *response;
|
|
|
|
/* If it timed out, we free ourselved and exit! */
|
|
if (!leaks->cmd) {
|
|
tal_free(leaks);
|
|
return;
|
|
}
|
|
|
|
/* Convenience variables */
|
|
cmd = leaks->cmd;
|
|
ld = cmd->ld;
|
|
|
|
/* Enter everything, except this cmd and its jcon */
|
|
memtable = memleak_find_allocations(cmd, cmd, cmd->jcon);
|
|
|
|
/* First delete known false positives. */
|
|
memleak_remove_htable(memtable, &ld->topology->txwatches.raw);
|
|
memleak_remove_htable(memtable, &ld->topology->txowatches.raw);
|
|
memleak_remove_htable(memtable, &ld->htlcs_in.raw);
|
|
memleak_remove_htable(memtable, &ld->htlcs_out.raw);
|
|
memleak_remove_htable(memtable, &ld->htlc_sets.raw);
|
|
|
|
/* Now delete ld and those which it has pointers to. */
|
|
memleak_remove_region(memtable, ld, sizeof(*ld));
|
|
|
|
response = json_stream_success(cmd);
|
|
json_array_start(response, "leaks");
|
|
while ((i = memleak_get(memtable, &backtrace)) != NULL) {
|
|
const tal_t *p;
|
|
|
|
json_object_start(response, NULL);
|
|
json_add_ptr(response, "value", i);
|
|
if (tal_name(i))
|
|
json_add_string(response, "label", tal_name(i));
|
|
|
|
json_add_backtrace(response, backtrace);
|
|
json_array_start(response, "parents");
|
|
for (p = tal_parent(i); p; p = tal_parent(p)) {
|
|
json_add_string(response, NULL, tal_name(p));
|
|
p = tal_parent(p);
|
|
}
|
|
json_array_end(response);
|
|
json_object_end(response);
|
|
}
|
|
|
|
for (size_t i = 0; i < tal_count(leaks->leakers); i++) {
|
|
json_object_start(response, NULL);
|
|
json_add_string(response, "subdaemon", leaks->leakers[i]);
|
|
json_object_end(response);
|
|
}
|
|
json_array_end(response);
|
|
|
|
/* Command is now done. */
|
|
was_pending(command_success(cmd, response));
|
|
}
|
|
|
|
static void leak_detect_timeout(struct leak_detect *leak_detect)
|
|
{
|
|
/* We actually *do* leak the leak_detect, but cmd is about
|
|
* to exit. */
|
|
notleak(tal_steal(NULL, leak_detect));
|
|
finish_report(leak_detect);
|
|
leak_detect->cmd = NULL;
|
|
}
|
|
|
|
static void leak_detect_req_done(const struct subd_req *req,
|
|
struct leak_detect *leak_detect)
|
|
{
|
|
leak_detect->num_outstanding_requests--;
|
|
if (leak_detect->num_outstanding_requests == 0)
|
|
finish_report(leak_detect);
|
|
}
|
|
|
|
/* Start a leak request: decrements num_outstanding_requests when freed. */
|
|
void start_leak_request(const struct subd_req *req,
|
|
struct leak_detect *leak_detect)
|
|
{
|
|
leak_detect->num_outstanding_requests++;
|
|
/* When req is freed, request finished. */
|
|
tal_add_destructor2(req, leak_detect_req_done, leak_detect);
|
|
}
|
|
|
|
/* Yep, found a leak in this subd. */
|
|
void report_subd_memleak(struct leak_detect *leak_detect, struct subd *leaker)
|
|
{
|
|
tal_arr_expand(&leak_detect->leakers,
|
|
tal_strdup(leak_detect, leaker->name));
|
|
}
|
|
|
|
static void gossip_dev_memleak_done(struct subd *gossipd,
|
|
const u8 *reply,
|
|
const int *fds UNUSED,
|
|
struct leak_detect *leaks)
|
|
{
|
|
bool found_leak;
|
|
|
|
if (!fromwire_gossipd_dev_memleak_reply(reply, &found_leak))
|
|
fatal("Bad gossip_dev_memleak");
|
|
|
|
if (found_leak)
|
|
report_subd_memleak(leaks, gossipd);
|
|
}
|
|
|
|
static void connect_dev_memleak_done(struct subd *connectd,
|
|
const u8 *reply,
|
|
const int *fds UNUSED,
|
|
struct leak_detect *leaks)
|
|
{
|
|
bool found_leak;
|
|
|
|
if (!fromwire_connectd_dev_memleak_reply(reply, &found_leak))
|
|
fatal("Bad connect_dev_memleak");
|
|
|
|
if (found_leak)
|
|
report_subd_memleak(leaks, connectd);
|
|
}
|
|
|
|
static struct command_result *json_memleak(struct command *cmd,
|
|
const char *buffer,
|
|
const jsmntok_t *obj UNNEEDED,
|
|
const jsmntok_t *params)
|
|
{
|
|
struct lightningd *ld = cmd->ld;
|
|
u8 *msg;
|
|
bool found_leak;
|
|
struct leak_detect *leaks;
|
|
|
|
if (!param(cmd, buffer, params, NULL))
|
|
return command_param_failed();
|
|
|
|
if (!getenv("LIGHTNINGD_DEV_MEMLEAK")) {
|
|
return command_fail(cmd, LIGHTNINGD,
|
|
"Leak detection needs $LIGHTNINGD_DEV_MEMLEAK");
|
|
}
|
|
|
|
leaks = tal(cmd, struct leak_detect);
|
|
leaks->cmd = cmd;
|
|
leaks->num_outstanding_requests = 0;
|
|
leaks->leakers = tal_arr(leaks, const char *, 0);
|
|
|
|
/* hsmd is sync, so do that first. */
|
|
if (!wire_sync_write(ld->hsm_fd,
|
|
take(towire_hsmd_dev_memleak(NULL))))
|
|
fatal("Could not write to HSM: %s", strerror(errno));
|
|
msg = wire_sync_read(tmpctx, ld->hsm_fd);
|
|
if (!fromwire_hsmd_dev_memleak_reply(msg, &found_leak))
|
|
fatal("Bad HSMD_DEV_MEMLEAK_REPLY: %s", tal_hex(tmpctx, msg));
|
|
|
|
if (found_leak)
|
|
report_subd_memleak(leaks, ld->hsm);
|
|
|
|
/* Now do all the async ones. */
|
|
start_leak_request(subd_req(ld->connectd, ld->connectd,
|
|
take(towire_connectd_dev_memleak(NULL)),
|
|
-1, 0, connect_dev_memleak_done, leaks),
|
|
leaks);
|
|
start_leak_request(subd_req(ld->gossip, ld->gossip,
|
|
take(towire_gossipd_dev_memleak(NULL)),
|
|
-1, 0, gossip_dev_memleak_done, leaks),
|
|
leaks);
|
|
|
|
/* Ask all per-peer daemons */
|
|
peer_dev_memleak(ld, leaks);
|
|
|
|
/* Set timer: dualopend doesn't always listen! */
|
|
notleak(new_reltimer(ld->timers, leaks, time_from_sec(20),
|
|
leak_detect_timeout, leaks));
|
|
return command_still_pending(cmd);
|
|
}
|
|
|
|
static const struct json_command dev_memleak_command = {
|
|
"dev-memleak",
|
|
"developer",
|
|
json_memleak,
|
|
"Show unreferenced memory objects"
|
|
};
|
|
AUTODATA(json_command, &dev_memleak_command);
|
|
#endif /* DEVELOPER */
|