sources/perf: Capture DRM vblank events as a mark.

This should be useful to visualize system-wide events in the CPU
timeline, especially once we add some more events.

We may want to define some modes eventually, as not all captures will
care about GPU visualization.  However, it's pretty low overhead (60Hz
* number of monitors), so maybe we can just filter it out at
visualization time.

We do a bit more setup work than necessary here (looking up the config
number for the tracepoint per CPU, rather than looking it up once at
startup), but I suspect I'll want to refactor the init anyway once we
add more tracepoint markers.
This commit is contained in:
Eric Anholt
2018-05-16 09:37:42 +01:00
committed by Christian Hergert
parent 925dadce82
commit ac11f0f941
2 changed files with 188 additions and 1 deletions

View File

@ -115,7 +115,7 @@ _perf_event_open (struct perf_event_attr *attr,
assert (attr != NULL);
/* Quick sanity check */
if (attr->sample_period < 100000)
if (attr->sample_period < 100000 && attr->type != PERF_TYPE_TRACEPOINT)
return -EINVAL;
return syscall (__NR_perf_event_open, attr, pid, cpu, group_fd, flags);

View File

@ -43,6 +43,7 @@
#include <glib/gi18n.h>
#include <errno.h>
#include <string.h>
#include <sys/ioctl.h>
#include <sys/types.h>
#include <unistd.h>
@ -53,6 +54,43 @@
#define N_WAKEUP_EVENTS 149
/* Tags for each kernel tracepoint this source may subscribe to. */
enum SpTracepoint {
  /* The DRM vblank event ("drm/drm_vblank_event"). */
  DRM_VBLANK = 0,
};
/* Describes one tracepoint that is watched only when the running kernel
 * exposes it.
 *
 * Field order matters: the optional_tracepoints table initializes entries
 * positionally.
 */
typedef struct {
  /* Identifier later used to dispatch samples for this tracepoint. */
  enum SpTracepoint tp;
  /* Event path below the tracing "events" directory, e.g.
   * "drm/drm_vblank_event".
   */
  const char *path;
} SpOptionalTracepoint;
/* Global list of the optional tracepoints we might want to watch. */
static const SpOptionalTracepoint optional_tracepoints[] = {
/* This event fires just after the vblank IRQ handler starts.
*
* Note that on many platforms when nothing is waiting for vblank
* (no pageflips have happened recently, no rendering is
* synchronizing to vblank), the vblank IRQ will get masked off and
* the event won't show up in the timeline.
*
* Also note that when we're in watch-a-single-process mode, we
* won't get the event since it comes in on an IRQ handler, not for
* our pid.
*/
{ DRM_VBLANK, "drm/drm_vblank_event" },
};
/* Struct describing tracepoint events.
 *
 * One of these is stored per perf event ID so that an incoming sample
 * can be mapped back to the tracepoint that produced it.
 *
 * This should be extended with some sort of union describing the
 * locations of the relevant fields within the _RAW section of the
 * struct perf_event, so we can pick out things like the vblank CRTC
 * number and MSC.
 */
typedef struct {
  /* Which tracepoint the sample belongs to. */
  enum SpTracepoint tp;
} SpTracepointDesc;
struct _SpPerfSource
{
GObject parent_instance;
@ -61,6 +99,9 @@ struct _SpPerfSource
SpPerfCounter *counter;
GHashTable *pids;
/* Mapping from perf sample identifiers to SpTracepointDesc. */
GHashTable *tracepoint_event_ids;
guint running : 1;
guint is_ready : 1;
};
@ -93,6 +134,7 @@ sp_perf_source_finalize (GObject *object)
g_clear_pointer (&self->writer, sp_capture_writer_unref);
g_clear_pointer (&self->counter, sp_perf_counter_unref);
g_clear_pointer (&self->pids, g_hash_table_unref);
g_clear_pointer (&self->tracepoint_event_ids, g_hash_table_unref);
G_OBJECT_CLASS (sp_perf_source_parent_class)->finalize (object);
}
@ -116,6 +158,7 @@ static void
sp_perf_source_init (SpPerfSource *self)
{
  /* Instance initializer: creates the lookup tables used by the source. */
  self->pids = g_hash_table_new (NULL, NULL);

  /* Maps perf sample identifiers to heap-allocated SpTracepointDesc
   * values.  The table owns those values, so give it g_free() as the
   * value destroy function; otherwise they leak when the table is
   * unreffed in finalize.
   */
  self->tracepoint_event_ids = g_hash_table_new_full (NULL, NULL, NULL, g_free);
}
static gboolean
@ -128,6 +171,30 @@ do_emit_exited (gpointer data)
return G_SOURCE_REMOVE;
}
/* Records a tracepoint sample in the capture.
 *
 * Only DRM_VBLANK is handled: it is written as a mark carrying the
 * sample's time and pid, the CPU it arrived on, and the strings "drm"
 * and "vblank".  Samples for any other tracepoint are ignored.
 */
static void
sp_perf_source_handle_tracepoint (SpPerfSource                   *self,
                                  gint                            cpu,
                                  const SpPerfCounterEventSample *sample,
                                  SpTracepointDesc               *tp_desc)
{
  if (tp_desc->tp != DRM_VBLANK)
    return;

  sp_capture_writer_add_mark (self->writer,
                              sample->time,
                              cpu,
                              sample->pid,
                              0,
                              "drm",
                              "vblank",
                              NULL);
}
static void
sp_perf_source_handle_sample (SpPerfSource *self,
gint cpu,
@ -136,10 +203,22 @@ sp_perf_source_handle_sample (SpPerfSource *self,
const guint64 *ips;
gint n_ips;
guint64 trace[3];
SpTracepointDesc *tp_desc;
g_assert (SP_IS_PERF_SOURCE (self));
g_assert (sample != NULL);
/* We don't capture IPs with tracepoints, and get _RAW data instead. Handle
* them separately.
*/
tp_desc = g_hash_table_lookup (self->tracepoint_event_ids,
GINT_TO_POINTER (sample->identifier));
if (tp_desc)
{
sp_perf_source_handle_tracepoint (self, cpu, sample, tp_desc);
return;
}
ips = sample->ips;
n_ips = sample->n_ips;
@ -276,6 +355,106 @@ sp_perf_source_handle_event (SpPerfCounterEvent *event,
}
}
/* Looks up the numeric ID of a kernel tracepoint.
 *
 * Reads "/sys/kernel/debug/tracing/events/<path>/id" and parses its
 * contents as an integer.
 *
 * @path:   event path below the tracing "events" directory, such as
 *          "drm/drm_vblank_event".
 * @config: receives the parsed ID on success; left untouched on failure.
 *
 * Returns TRUE if the file could be read and held a valid number that
 * fits in a gint64, FALSE otherwise.
 */
static gboolean
sp_perf_get_tracepoint_config (const char *path, gint64 *config)
{
  gchar *filename;
  gchar *contents = NULL;
  gchar *end = NULL;
  unsigned long long parsed;
  gboolean ok;

  /* g_strdup_printf() aborts on allocation failure, so no NULL check. */
  filename = g_strdup_printf ("/sys/kernel/debug/tracing/events/%s/id", path);
  ok = g_file_get_contents (filename, &contents, NULL, NULL);
  g_free (filename);

  if (!ok)
    return FALSE;

  /* Reject files that are empty, non-numeric or out of range instead of
   * silently reporting tracepoint ID 0.
   */
  errno = 0;
  parsed = strtoull (contents, &end, 0);
  ok = (end != contents &&
        errno != ERANGE &&
        parsed <= (unsigned long long) G_MAXINT64);

  if (ok)
    {
      /* Only whitespace (typically the trailing newline) may follow. */
      while (g_ascii_isspace (*end))
        end++;
      ok = (*end == '\0');
    }

  g_free (contents);

  if (ok)
    *config = (gint64) parsed;

  return ok;
}
/* Adds a perf tracepoint event, if it's available.
 *
 * These are kernel tracepoints that we want to include in our capture
 * when present, but may be kernel version or driver-specific.
 *
 * @self:                the perf source whose counter opens the event.
 * @pid:                 pid passed through to sp_perf_counter_open().
 * @cpu:                 CPU passed through to sp_perf_counter_open().
 * @optional_tracepoint: the tracepoint to try to add.
 * @error:               set if the perf event ID cannot be queried for an
 *                       opened event; an error that is already set is
 *                       left as it is.
 *
 * If the tracepoint's config cannot be looked up, or the event cannot be
 * opened, the tracepoint is skipped without reporting an error.  On
 * success the event's ID is registered in self->tracepoint_event_ids so
 * that samples can be matched back to this tracepoint.
 */
static void
sp_perf_source_add_optional_tracepoint (SpPerfSource                *self,
                                        GPid                         pid,
                                        gint                         cpu,
                                        const SpOptionalTracepoint  *optional_tracepoint,
                                        GError                     **error)
{
  struct perf_event_attr attr = { 0 };
  SpTracepointDesc *tp_desc;
  gulong flags = 0;
  /* PERF_EVENT_IOC_ID stores an unsigned 64-bit value. */
  guint64 id = 0;
  gint64 config;
  gint fd;

  if (!sp_perf_get_tracepoint_config (optional_tracepoint->path, &config))
    return;

  attr.type = PERF_TYPE_TRACEPOINT;
  attr.sample_type = PERF_SAMPLE_RAW
                   | PERF_SAMPLE_IP
                   | PERF_SAMPLE_TID
                   | PERF_SAMPLE_IDENTIFIER
                   | PERF_SAMPLE_CALLCHAIN
                   | PERF_SAMPLE_TIME;
  attr.config = config;
  /* A period of 1 delivers a sample for every tracepoint hit. */
  attr.sample_period = 1;
#ifdef HAVE_PERF_CLOCKID
  attr.clockid = sp_clock;
  attr.use_clockid = 1;
#endif
  attr.size = sizeof attr;

  fd = sp_perf_counter_open (self->counter, &attr, pid, cpu, -1, flags);

  /* The tracepoint is optional: if it could not be opened, skip it
   * rather than calling ioctl() and close() on an invalid descriptor.
   */
  if (fd < 0)
    return;

  if (ioctl (fd, PERF_EVENT_IOC_ID, &id) != 0)
    {
      /* This function runs in a loop, so keep the first reported error
       * instead of overwriting a GError that is already set.
       */
      if (error == NULL || *error == NULL)
        g_set_error (error,
                     G_IO_ERROR,
                     G_IO_ERROR_FAILED,
                     _("Sysprof failed to get perf_event ID."));

      /* NOTE(review): confirm whether the counter also tracks this fd; if
       * so it should be released through the counter instead.
       */
      close (fd);
      return;
    }

  /* g_malloc() aborts on allocation failure, so no NULL check is needed. */
  tp_desc = g_malloc (sizeof *tp_desc);
  tp_desc->tp = optional_tracepoint->tp;

  /* Here's where we should inspect the /format file to determine how
   * to pick fields out of the _RAW data.
   */

  /* We're truncating the event ID from 64b to 32 to fit in the hash.
   * The event IDs start from 0 at boot, so meh.
   */
  g_assert (id <= 0xffffffff);

  g_hash_table_insert (self->tracepoint_event_ids,
                       GINT_TO_POINTER (id), tp_desc);
}
static gboolean
sp_perf_source_start_pid (SpPerfSource *self,
GPid pid,
@ -286,6 +465,7 @@ sp_perf_source_start_pid (SpPerfSource *self,
gint ncpu = g_get_num_processors ();
gint cpu = 0;
gint fd;
gint i;
g_assert (SP_IS_PERF_SOURCE (self));
@ -359,6 +539,13 @@ sp_perf_source_start_pid (SpPerfSource *self,
return FALSE;
}
}
for (i = 0; i < G_N_ELEMENTS(optional_tracepoints); i++)
{
sp_perf_source_add_optional_tracepoint (self, pid, cpu,
&optional_tracepoints[i],
error);
}
}
return TRUE;