Files
sysprof/src/libsysprof/sysprof-proc-source.c
2021-02-25 13:44:58 -08:00

594 lines
18 KiB
C

/* sysprof-proc-source.c
*
* Copyright 2016-2019 Christian Hergert <chergert@redhat.com>
*
* This program is free software: you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation, either version 3 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program. If not, see <http://www.gnu.org/licenses/>.
*
* SPDX-License-Identifier: GPL-3.0-or-later
*/
/* Sysprof -- Sampling, systemwide CPU profiler
* Copyright 2004, Red Hat, Inc.
* Copyright 2004, 2005, Soeren Sandmann
*
* This program is free software; you can redistribute it and/or modify
* it under the terms of the GNU General Public License as published by
* the Free Software Foundation; either version 2 of the License, or
* (at your option) any later version.
*
* This program is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU General Public License for more details.
*
* You should have received a copy of the GNU General Public License
* along with this program; if not, write to the Free Software
* Foundation, Inc., 59 Temple Place - Suite 330, Boston, MA 02111-1307, USA.
*/
#include "config.h"
#include <json-glib/json-glib.h>
#include <stdio.h>
#include <stdlib.h>
#include <string.h>
#include "sysprof-helpers.h"
#include "sysprof-mountinfo.h"
#include "sysprof-proc-source.h"
struct _SysprofProcSource
{
GObject parent_instance;
SysprofCaptureWriter *writer;
GArray *pids;
SysprofMountinfo *mountinfo;
GHashTable *podman;
guint is_ready : 1;
};
typedef struct
{
char *id;
char **layers;
} PodmanInfo;
static void source_iface_init (SysprofSourceInterface *iface);
G_DEFINE_TYPE_EXTENDED (SysprofProcSource, sysprof_proc_source, G_TYPE_OBJECT, 0,
G_IMPLEMENT_INTERFACE (SYSPROF_TYPE_SOURCE, source_iface_init))
static void
sysprof_proc_source_populate_process (SysprofProcSource *self,
GPid pid,
const gchar *cmdline)
{
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_assert (pid > 0);
sysprof_capture_writer_add_process (self->writer,
SYSPROF_CAPTURE_CURRENT_TIME,
-1,
pid,
cmdline);
}
static void
sysprof_proc_source_populate_maps (SysprofProcSource *self,
GPid pid,
const gchar *mapsstr,
const gchar *mountinfostr)
{
g_auto(GStrv) maps = NULL;
guint i;
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_assert (mapsstr != NULL);
g_assert (mountinfostr != NULL);
g_assert (pid > 0);
sysprof_mountinfo_reset (self->mountinfo);
sysprof_mountinfo_parse_mountinfo (self->mountinfo, mountinfostr);
maps = g_strsplit (mapsstr, "\n", 0);
for (i = 0; maps [i] != NULL; i++)
{
g_autofree gchar *translated = NULL;
gchar file[512];
const gchar *fileptr = file;
gulong start;
gulong end;
gulong offset;
gulong inode;
gint r;
r = sscanf (maps [i],
"%lx-%lx %*15s %lx %*x:%*x %lu %512s",
&start, &end, &offset, &inode, file);
file [sizeof file - 1] = '\0';
if (r != 5)
continue;
if (strcmp ("[vdso]", file) == 0)
{
/*
* Søren Sandmann Pedersen says:
*
* For the vdso, the kernel reports 'offset' as the
* the same as the mapping addres. This doesn't make
* any sense to me, so we just zero it here. There
* is code in binfile.c (read_inode) that returns 0
* for [vdso].
*/
offset = 0;
inode = 0;
}
/* Possibly translate the path based on mounts/mountinfo data */
if ((translated = sysprof_mountinfo_translate (self->mountinfo, file)))
fileptr = translated;
sysprof_capture_writer_add_map (self->writer,
SYSPROF_CAPTURE_CURRENT_TIME,
-1,
pid,
start,
end,
offset,
inode,
fileptr);
}
}
static gboolean
pid_is_interesting (SysprofProcSource *self,
GPid pid)
{
if (self->pids == NULL || self->pids->len == 0)
return TRUE;
for (guint i = 0; i < self->pids->len; i++)
{
if (g_array_index (self->pids, GPid, i) == pid)
return TRUE;
}
return FALSE;
}
static void
podman_info_free (gpointer data)
{
PodmanInfo *info = data;
g_free (info->id);
g_strfreev (info->layers);
g_free (info);
}
static void
update_containers_json (SysprofProcSource *self)
{
g_autoptr(JsonParser) parser = NULL;
g_autofree gchar *path = NULL;
JsonNode *root;
JsonArray *ar;
guint n_items;
g_assert (SYSPROF_IS_PROC_SOURCE (self));
parser = json_parser_new ();
path = g_build_filename (g_get_user_data_dir (),
"containers",
"storage",
"overlay-containers",
"containers.json",
NULL);
if (!json_parser_load_from_file (parser, path, NULL) ||
!(root = json_parser_get_root (parser)) ||
!JSON_NODE_HOLDS_ARRAY (root) ||
!(ar = json_node_get_array (root)))
return;
n_items = json_array_get_length (ar);
for (guint i = 0; i < n_items; i++)
{
JsonObject *item = json_array_get_object_element (ar, i);
PodmanInfo *info;
const char *id;
const char *layer;
if (item == NULL)
continue;
id = json_object_get_string_member (item, "id");
layer = json_object_get_string_member (item, "layer");
if (id == NULL || layer == NULL)
continue;
info = g_new0 (PodmanInfo, 1);
info->id = g_strdup (id);
info->layers = g_new0 (char *, 2);
info->layers[0] = g_strdup (layer);
info->layers[1] = NULL;
g_hash_table_insert (self->podman, info->id, info);
}
}
static void
sysprof_proc_source_populate_pid_podman (SysprofProcSource *self,
GPid pid,
const char *container)
{
PodmanInfo *info;
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_assert (container != NULL);
if (!(info = g_hash_table_lookup (self->podman, container)))
{
update_containers_json (self);
info = g_hash_table_lookup (self->podman, container);
}
if (info != NULL)
{
for (guint i = 0; info->layers[i]; i++)
{
g_autofree char *path = g_build_filename (g_get_user_data_dir (),
"containers",
"storage",
"overlay",
info->layers[i],
"diff",
NULL);
sysprof_capture_writer_add_overlay (self->writer,
SYSPROF_CAPTURE_CURRENT_TIME,
-1, pid, i, path, "/");
}
}
}
static void
sysprof_proc_source_populate_pid_flatpak (SysprofProcSource *self,
GPid pid,
const char *app_id)
{
g_autofree gchar *info_path = NULL;
g_autoptr(GKeyFile) key_file = NULL;
g_autofree gchar *app_path = NULL;
g_autofree gchar *runtime_path = NULL;
g_autofree gchar *contents = NULL;
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_assert (app_id != NULL);
info_path = g_strdup_printf ("/proc/%d/root/.flatpak-info", pid);
key_file = g_key_file_new ();
if (!sysprof_helpers_get_proc_file (sysprof_helpers_get_default (),
info_path, NULL, &contents, NULL))
return;
if (!g_key_file_load_from_data (key_file, contents, -1, 0, NULL) ||
!g_key_file_has_group (key_file, "Instance") ||
!(app_path = g_key_file_get_string (key_file, "Instance", "app-path", NULL)) ||
!(runtime_path = g_key_file_get_string (key_file, "Instance", "runtime-path", NULL)))
return;
sysprof_capture_writer_add_overlay (self->writer,
SYSPROF_CAPTURE_CURRENT_TIME,
-1, pid, 0, runtime_path, "/usr");
sysprof_capture_writer_add_overlay (self->writer,
SYSPROF_CAPTURE_CURRENT_TIME,
-1, pid, 0, app_path, "/app");
}
static void
sysprof_proc_source_populate_pid_root (SysprofProcSource *self,
GPid pid,
const char *cgroup)
{
static GRegex *flatpak;
static GRegex *podman;
g_autoptr(GMatchInfo) podman_match = NULL;
g_autoptr(GMatchInfo) flatpak_match = NULL;
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_assert (cgroup != NULL);
/* This function tries to discover the podman container that contains the
* process identified on the host as @pid. We can only do anything with this
* if the pids are in containers that the running user controls (so that we
* can actually access the overlays).
*
* This stuff, and I want to emphasize, is a giant hack. Just like containers
* are on Linux. But if we are really careful, we can make this work for the
* one particular use case I care about, which is podman/toolbox on Fedora
* Workstation/Silverblue.
*
* -- Christian
*/
if (podman == NULL)
{
podman = g_regex_new ("libpod-([a-z0-9]{64})\\.scope", G_REGEX_OPTIMIZE, 0, NULL);
g_assert (podman != NULL);
}
/* If this looks like a cgroup associated with a Flatpak, then we can find
* information about the filesystem in /proc/$pid/root/.flatpak-info (assuming
* we can actually read that file. That is possible from the host, but not
* really if we are running in a Flatpak ourself, so we access it through
* the daemon to ensure we can access it.
*/
if (flatpak == NULL)
{
flatpak = g_regex_new ("app-flatpak-([a-zA-Z_\\-\\.]+)-[0-9]+\\.scope", G_REGEX_OPTIMIZE, 0, NULL);
g_assert (flatpak != NULL);
}
if (g_regex_match (podman, cgroup, 0, &podman_match))
{
char *word = g_match_info_fetch (podman_match, 1);
sysprof_proc_source_populate_pid_podman (self, pid, word);
g_free (word);
}
else if (g_regex_match (flatpak, cgroup, 0, &flatpak_match))
{
char *word = g_match_info_fetch (flatpak_match, 1);
sysprof_proc_source_populate_pid_flatpak (self, pid, word);
g_free (word);
}
}
static void
sysprof_proc_source_populate (SysprofProcSource *self,
GVariant *info)
{
g_autofree gchar *mounts = NULL;
SysprofHelpers *helpers;
gsize n_pids = 0;
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_assert (info != NULL);
g_assert (g_variant_is_of_type (info, G_VARIANT_TYPE ("aa{sv}")));
if (self->writer == NULL)
return;
helpers = sysprof_helpers_get_default ();
if (!sysprof_helpers_get_proc_file (helpers, "/proc/mounts", NULL, &mounts, NULL))
return;
sysprof_mountinfo_parse_mounts (self->mountinfo, mounts);
n_pids = g_variant_n_children (info);
for (gsize i = 0; i < n_pids; i++)
{
g_autoptr(GVariant) pidinfo = g_variant_get_child_value (info, i);
GVariantDict dict;
const gchar *cmdline;
const gchar *comm;
const gchar *mountinfo;
const gchar *maps;
const gchar *cgroup;
gint32 pid;
g_variant_dict_init (&dict, pidinfo);
if (!g_variant_dict_lookup (&dict, "pid", "i", &pid) ||
!pid_is_interesting (self, pid))
goto skip;
if (!g_variant_dict_lookup (&dict, "cmdline", "&s", &cmdline))
cmdline = "";
if (!g_variant_dict_lookup (&dict, "comm", "&s", &comm))
comm = "";
if (!g_variant_dict_lookup (&dict, "mountinfo", "&s", &mountinfo))
mountinfo = "";
if (!g_variant_dict_lookup (&dict, "maps", "&s", &maps))
maps = "";
if (!g_variant_dict_lookup (&dict, "cgroup", "&s", &cgroup))
cgroup = "";
sysprof_proc_source_populate_process (self, pid, *cmdline ? cmdline : comm);
sysprof_proc_source_populate_maps (self, pid, maps, mountinfo);
sysprof_proc_source_populate_pid_root (self, pid, cgroup);
skip:
g_variant_dict_clear (&dict);
}
}
static void
sysprof_proc_source_get_process_info_cb (GObject *object,
GAsyncResult *result,
gpointer user_data)
{
SysprofHelpers *helpers = (SysprofHelpers *)object;
g_autoptr(SysprofProcSource) self = user_data;
g_autoptr(GVariant) info = NULL;
g_autoptr(GError) error = NULL;
g_assert (SYSPROF_IS_HELPERS (helpers));
g_assert (G_IS_ASYNC_RESULT (result));
g_assert (SYSPROF_IS_PROC_SOURCE (self));
if (!sysprof_helpers_get_process_info_finish (helpers, result, &info, &error))
{
sysprof_source_emit_failed (SYSPROF_SOURCE (self), error);
return;
}
sysprof_proc_source_populate (self, info);
sysprof_source_emit_finished (SYSPROF_SOURCE (self));
}
static void
sysprof_proc_source_start (SysprofSource *source)
{
SysprofProcSource *self = (SysprofProcSource *)source;
SysprofHelpers *helpers = sysprof_helpers_get_default ();
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_assert (self->writer != NULL);
sysprof_helpers_get_process_info_async (helpers,
"pid,maps,mountinfo,cmdline,comm,cgroup",
NULL,
sysprof_proc_source_get_process_info_cb,
g_object_ref (self));
}
static void
sysprof_proc_source_stop (SysprofSource *source)
{
SysprofProcSource *self = (SysprofProcSource *)source;
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_clear_pointer (&self->writer, sysprof_capture_writer_unref);
}
static void
sysprof_proc_source_set_writer (SysprofSource *source,
SysprofCaptureWriter *writer)
{
SysprofProcSource *self = (SysprofProcSource *)source;
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_assert (writer != NULL);
self->writer = sysprof_capture_writer_ref (writer);
}
static void
sysprof_proc_source_add_pid (SysprofSource *source,
GPid pid)
{
SysprofProcSource *self = (SysprofProcSource *)source;
guint i;
g_assert (SYSPROF_IS_PROC_SOURCE (self));
g_assert (pid > -1);
for (i = 0; i < self->pids->len; i++)
{
GPid ele = g_array_index (self->pids, GPid, i);
if (ele == pid)
return;
}
g_array_append_val (self->pids, pid);
}
static void
sysprof_proc_source_auth_cb (GObject *object,
GAsyncResult *result,
gpointer user_data)
{
SysprofHelpers *helpers = (SysprofHelpers *)object;
g_autoptr(SysprofProcSource) self = user_data;
g_autoptr(GError) error = NULL;
g_assert (SYSPROF_IS_HELPERS (helpers));
g_assert (G_IS_ASYNC_RESULT (result));
g_assert (SYSPROF_IS_PROC_SOURCE (self));
if (!sysprof_helpers_authorize_finish (helpers, result, &error))
{
sysprof_source_emit_failed (SYSPROF_SOURCE (self), error);
}
else
{
self->is_ready = TRUE;
sysprof_source_emit_ready (SYSPROF_SOURCE (self));
}
}
static void
sysprof_proc_source_prepare (SysprofSource *source)
{
g_assert (SYSPROF_IS_PROC_SOURCE (source));
sysprof_helpers_authorize_async (sysprof_helpers_get_default (),
NULL,
sysprof_proc_source_auth_cb,
g_object_ref (source));
}
static gboolean
sysprof_proc_source_get_is_ready (SysprofSource *source)
{
return SYSPROF_PROC_SOURCE (source)->is_ready;
}
static void
source_iface_init (SysprofSourceInterface *iface)
{
iface->set_writer = sysprof_proc_source_set_writer;
iface->start = sysprof_proc_source_start;
iface->stop = sysprof_proc_source_stop;
iface->add_pid = sysprof_proc_source_add_pid;
iface->prepare = sysprof_proc_source_prepare;
iface->get_is_ready = sysprof_proc_source_get_is_ready;
}
static void
sysprof_proc_source_finalize (GObject *object)
{
SysprofProcSource *self = (SysprofProcSource *)object;
g_clear_pointer (&self->writer, sysprof_capture_writer_unref);
g_clear_pointer (&self->pids, g_array_unref);
g_clear_pointer (&self->mountinfo, sysprof_mountinfo_free);
g_clear_pointer (&self->podman, g_hash_table_unref);
G_OBJECT_CLASS (sysprof_proc_source_parent_class)->finalize (object);
}
static void
sysprof_proc_source_class_init (SysprofProcSourceClass *klass)
{
GObjectClass *object_class = G_OBJECT_CLASS (klass);
object_class->finalize = sysprof_proc_source_finalize;
}
static void
sysprof_proc_source_init (SysprofProcSource *self)
{
self->pids = g_array_new (FALSE, FALSE, sizeof (GPid));
self->mountinfo = sysprof_mountinfo_new ();
self->podman = g_hash_table_new_full (g_str_hash, g_str_equal, NULL, podman_info_free);
}
SysprofSource *
sysprof_proc_source_new (void)
{
return g_object_new (SYSPROF_TYPE_PROC_SOURCE, NULL);
}