/* sysprof-document.c
 *
 * Copyright 2023 Christian Hergert
 *
 * This program is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * This program is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with this program.  If not, see <http://www.gnu.org/licenses/>.
 *
 * SPDX-License-Identifier: GPL-3.0-or-later
 */

#include "config.h"

#include <fcntl.h>

#include <glib/gstdio.h>

#include "sysprof-document-private.h"
#include "sysprof-document-frame-private.h"
#include "sysprof-document-symbols-private.h"
#include "sysprof-symbolizer-private.h"

struct _SysprofDocument
{
  GObject                   parent_instance;

  /* Array of SysprofDocumentFramePointer, one per frame found at load time */
  GArray                   *frames;

  /* The memory map backing the capture and a pointer to its first byte */
  GMappedFile              *mapped_file;
  const guint8             *base;

  /* Indexes (into @frames) of sample and allocation frames */
  GtkBitset                *samples;

  /* Interned ref-strings; @strings_mutex guards access to @strings */
  GMutex                    strings_mutex;
  GHashTable               *strings;

  /* Copy of the file header; time/end_time are swapped if @needs_swap */
  SysprofCaptureFileHeader  header;

  /* Set when the capture byte order differs from the host byte order */
  guint                     needs_swap : 1;
};

/* Compact (offset, length) reference to a frame within the memory map */
typedef struct _SysprofDocumentFramePointer
{
  guint64 offset : 48;
  guint64 length : 16;
} SysprofDocumentFramePointer;

/* GListModel::get_item_type: every item is a SysprofDocumentFrame */
static GType
sysprof_document_get_item_type (GListModel *model)
{
  return SYSPROF_TYPE_DOCUMENT_FRAME;
}

/* GListModel::get_n_items: the number of frames discovered while loading */
static guint
sysprof_document_get_n_items (GListModel *model)
{
  return SYSPROF_DOCUMENT (model)->frames->len;
}

/* GListModel::get_item: creates a frame object for the frame at @position,
 * or returns %NULL if @position is out of range.
 */
static gpointer
sysprof_document_get_item (GListModel *model,
                           guint       position)
{
  SysprofDocument *self = SYSPROF_DOCUMENT (model);
  SysprofDocumentFramePointer *ptr;

  if (position >= self->frames->len)
    return NULL;

  ptr = &g_array_index (self->frames, SysprofDocumentFramePointer, position);

  return _sysprof_document_frame_new (self->mapped_file,
                                      (gconstpointer)&self->base[ptr->offset],
                                      ptr->length,
                                      self->needs_swap);
}

static void
list_model_iface_init (GListModelInterface *iface)
{
  iface->get_item_type = sysprof_document_get_item_type;
  iface->get_n_items = sysprof_document_get_n_items;
  iface->get_item = sysprof_document_get_item;
}

G_DEFINE_FINAL_TYPE_WITH_CODE (SysprofDocument, sysprof_document, G_TYPE_OBJECT,
                               G_IMPLEMENT_INTERFACE (G_TYPE_LIST_MODEL, list_model_iface_init))

/* Releases everything allocated in sysprof_document_init() and
 * sysprof_document_load().
 */
static void
sysprof_document_finalize (GObject *object)
{
  SysprofDocument *self = (SysprofDocument *)object;

  g_clear_pointer (&self->mapped_file, g_mapped_file_unref);
  g_clear_pointer (&self->frames, g_array_unref);
  g_clear_pointer (&self->strings, g_hash_table_unref);
  g_clear_pointer (&self->samples, gtk_bitset_unref);

  g_mutex_clear (&self->strings_mutex);

  G_OBJECT_CLASS (sysprof_document_parent_class)->finalize (object);
}

static void
sysprof_document_class_init (SysprofDocumentClass *klass)
{
  GObjectClass *object_class = G_OBJECT_CLASS (klass);

  object_class->finalize = sysprof_document_finalize;
}

static void
sysprof_document_init (SysprofDocument *self)
{
  g_mutex_init (&self->strings_mutex);

  self->frames = g_array_new (FALSE, FALSE, sizeof (SysprofDocumentFramePointer));

  /* Key and value are the same ref-string; only the value destroy
   * notify releases it so the reference is dropped exactly once.
   */
  self->strings = g_hash_table_new_full (g_str_hash,
                                         g_str_equal,
                                         NULL,
                                         (GDestroyNotify)g_ref_string_release);

  self->samples = gtk_bitset_new_empty ();
}

/*
 * sysprof_document_load:
 * @self: a #SysprofDocument
 * @capture_fd: the file-descriptor to memory map
 * @error: a location for a #GError, or %NULL
 *
 * Maps @capture_fd, copies the file header, and walks the frames that
 * follow it, recording an (offset, length) pair for each one. Frames whose
 * type is a sample or an allocation are additionally noted in the samples
 * bitset.
 *
 * Walking stops at the first frame whose length is smaller than a frame
 * header or which would extend past the end of the file; frames before
 * that point remain usable.
 *
 * Returns: %TRUE if successful; otherwise %FALSE and @error is set.
 */
static gboolean
sysprof_document_load (SysprofDocument  *self,
                       int               capture_fd,
                       GError          **error)
{
  gsize pos;
  gsize len;

  g_assert (SYSPROF_IS_DOCUMENT (self));
  g_assert (capture_fd > -1);

  if (!(self->mapped_file = g_mapped_file_new_from_fd (capture_fd, FALSE, error)))
    return FALSE;

  self->base = (const guint8 *)g_mapped_file_get_contents (self->mapped_file);
  len = g_mapped_file_get_length (self->mapped_file);

  /* Callers are told @error is set on failure, so never fail silently */
  if (len < sizeof self->header)
    {
      g_set_error_literal (error,
                           G_IO_ERROR,
                           G_IO_ERROR_INVALID_DATA,
                           "Capture file is too small to contain a header");
      return FALSE;
    }

  /* Keep a copy of our header */
  memcpy (&self->header, self->base, sizeof self->header);

#if G_BYTE_ORDER == G_LITTLE_ENDIAN
  self->needs_swap = !self->header.little_endian;
#else
  self->needs_swap = !!self->header.little_endian;
#endif

  if (self->needs_swap)
    {
      self->header.time = GUINT64_SWAP_LE_BE (self->header.time);
      self->header.end_time = GUINT64_SWAP_LE_BE (self->header.end_time);
    }

  pos = sizeof self->header;
  while (pos < (len - sizeof (guint16)))
    {
      const SysprofCaptureFrame *tainted;
      SysprofDocumentFramePointer ptr;
      guint16 frame_len;

      /* The frame length is read with memcpy() as the data is untrusted */
      memcpy (&frame_len, &self->base[pos], sizeof frame_len);
      if (self->needs_swap)
        frame_len = GUINT16_SWAP_LE_BE (frame_len);

      if (frame_len < sizeof (SysprofCaptureFrame))
        break;

      /* A truncated or corrupt trailing frame must not be recorded,
       * otherwise later readers would access memory past the mapping.
       */
      if (frame_len > len - pos)
        break;

      ptr.offset = pos;
      ptr.length = frame_len;

      tainted = (const SysprofCaptureFrame *)(gpointer)&self->base[pos];
      if (tainted->type == SYSPROF_CAPTURE_FRAME_SAMPLE ||
          tainted->type == SYSPROF_CAPTURE_FRAME_ALLOCATION)
        gtk_bitset_add (self->samples, self->frames->len);

      pos += frame_len;

      g_array_append_val (self->frames, ptr);
    }

  return TRUE;
}

/**
 * sysprof_document_new_from_fd:
 * @capture_fd: a file-descriptor to be mapped
 * @error: a location for a #GError, or %NULL
 *
 * Creates a new memory map using @capture_fd to read the underlying
 * Sysprof capture.
 *
 * No ownership of @capture_fd is transferred, and the caller may close
 * @capture_fd after calling this function.
 *
 * Returns: A #SysprofDocument if successful; otherwise %NULL
 *   and @error is set.
 *
 * Since: 45.0
 */
SysprofDocument *
sysprof_document_new_from_fd (int      capture_fd,
                              GError **error)
{
  g_autoptr(SysprofDocument) self = NULL;

  g_return_val_if_fail (capture_fd > -1, NULL);

  self = g_object_new (SYSPROF_TYPE_DOCUMENT, NULL);

  if (!sysprof_document_load (self, capture_fd, error))
    return NULL;

  return g_steal_pointer (&self);
}

/**
 * sysprof_document_new:
 * @filename: a path to a capture file
 * @error: location for a #GError, or %NULL
 *
 * Similar to sysprof_document_new_from_fd() but opens the file found
 * at @filename as a #GMappedFile.
 *
 * Returns: a #SysprofDocument if successful; otherwise %NULL
 *   and @error is set.
 *
 * Since: 45.0
 */
SysprofDocument *
sysprof_document_new (const char  *filename,
                      GError     **error)
{
  g_autoptr(SysprofDocument) self = NULL;
  g_autofd int capture_fd = -1;

  g_return_val_if_fail (filename != NULL, NULL);

  if (-1 == (capture_fd = g_open (filename, O_RDONLY|O_CLOEXEC, 0)))
    {
      /* Save errno before any other call has a chance to clobber it */
      int errsv = errno;
      g_set_error (error,
                   G_FILE_ERROR,
                   g_file_error_from_errno (errsv),
                   "%s", g_strerror (errsv));
      return NULL;
    }

  self = g_object_new (SYSPROF_TYPE_DOCUMENT, NULL);

  if (!sysprof_document_load (self, capture_fd, error))
    return NULL;

  return g_steal_pointer (&self);
}

/*
 * _sysprof_document_ref_string:
 * @self: a #SysprofDocument
 * @name: (nullable): the string to intern
 *
 * Looks up @name in the document's string table, adding it if it is not
 * yet present, and returns a new reference to the shared ref-string.
 * The table is accessed while holding the strings mutex.
 *
 * Returns: (nullable): a ref-string which the caller should release with
 *   g_ref_string_release(), or %NULL if @name is %NULL.
 */
char *
_sysprof_document_ref_string (SysprofDocument *self,
                              const char      *name)
{
  char *ret;

  g_return_val_if_fail (SYSPROF_IS_DOCUMENT (self), NULL);

  if (name == NULL)
    return NULL;

  g_mutex_lock (&self->strings_mutex);
  if (!(ret = g_hash_table_lookup (self->strings, name)))
    {
      ret = g_ref_string_new (name);
      g_hash_table_insert (self->strings, ret, ret);
    }
  ret = g_ref_string_acquire (ret);
  g_mutex_unlock (&self->strings_mutex);

  return ret;
}

/* Second stage of sysprof_document_symbolize_async(): completes the task
 * with the #SysprofDocumentSymbols or the error from building it. Takes
 * ownership of the task reference passed as @user_data.
 */
static void
sysprof_document_symbolize_symbols_cb (GObject      *object,
                                       GAsyncResult *result,
                                       gpointer      user_data)
{
  g_autoptr(SysprofDocumentSymbols) symbols = NULL;
  g_autoptr(GTask) task = user_data;
  g_autoptr(GError) error = NULL;

  g_assert (G_IS_ASYNC_RESULT (result));
  g_assert (G_IS_TASK (task));

  if ((symbols = _sysprof_document_symbols_new_finish (result, &error)))
    g_task_return_pointer (task, g_steal_pointer (&symbols), g_object_unref);
  else
    g_task_return_error (task, g_steal_pointer (&error));
}

/* First stage of sysprof_document_symbolize_async(): once the symbolizer
 * has been prepared, start building the symbols. Takes ownership of the
 * task reference passed as @user_data and hands a new reference to the
 * next stage.
 */
static void
sysprof_document_symbolize_prepare_cb (GObject      *object,
                                       GAsyncResult *result,
                                       gpointer      user_data)
{
  SysprofSymbolizer *symbolizer = (SysprofSymbolizer *)object;
  g_autoptr(GTask) task = user_data;
  g_autoptr(GError) error = NULL;

  g_assert (SYSPROF_IS_SYMBOLIZER (symbolizer));
  g_assert (G_IS_ASYNC_RESULT (result));
  g_assert (G_IS_TASK (task));

  if (!_sysprof_symbolizer_prepare_finish (symbolizer, result, &error))
    g_task_return_error (task, g_steal_pointer (&error));
  else
    _sysprof_document_symbols_new (g_task_get_source_object (task),
                                   symbolizer,
                                   g_task_get_cancellable (task),
                                   sysprof_document_symbolize_symbols_cb,
                                   g_object_ref (task));
}

/**
 * sysprof_document_symbolize_async:
 * @self: a #SysprofDocument
 * @symbolizer: a #SysprofSymbolizer
 * @cancellable: (nullable): a #GCancellable, or %NULL
 * @callback: a callback to execute upon completion
 * @user_data: closure data for @callback
 *
 * Asynchronously prepares @symbolizer for @self and then creates the
 * #SysprofDocumentSymbols for the document using it.
 *
 * Call sysprof_document_symbolize_finish() from @callback to get the
 * result.
 */
void
sysprof_document_symbolize_async (SysprofDocument     *self,
                                  SysprofSymbolizer   *symbolizer,
                                  GCancellable        *cancellable,
                                  GAsyncReadyCallback  callback,
                                  gpointer             user_data)
{
  g_autoptr(GTask) task = NULL;

  g_return_if_fail (SYSPROF_IS_DOCUMENT (self));
  g_return_if_fail (SYSPROF_IS_SYMBOLIZER (symbolizer));
  g_return_if_fail (!cancellable || G_IS_CANCELLABLE (cancellable));

  task = g_task_new (self, cancellable, callback, user_data);
  g_task_set_source_tag (task, sysprof_document_symbolize_async);

  _sysprof_symbolizer_prepare_async (symbolizer,
                                     self,
                                     cancellable,
                                     sysprof_document_symbolize_prepare_cb,
                                     g_steal_pointer (&task));
}

/**
 * sysprof_document_symbolize_finish:
 * @self: a #SysprofDocument
 * @result: the #GAsyncResult provided to callback
 * @error: a location for a #GError, or %NULL
 *
 * Completes a request started with sysprof_document_symbolize_async().
 *
 * Returns: (transfer full): a #SysprofDocumentSymbols if successful;
 *   otherwise %NULL and @error is set.
 */
SysprofDocumentSymbols *
sysprof_document_symbolize_finish (SysprofDocument  *self,
                                   GAsyncResult     *result,
                                   GError          **error)
{
  g_return_val_if_fail (SYSPROF_IS_DOCUMENT (self), NULL);
  g_return_val_if_fail (G_IS_TASK (result), NULL);
  g_return_val_if_fail (g_task_is_valid (result, self), NULL);
  g_return_val_if_fail (g_task_get_source_tag (G_TASK (result)) == sysprof_document_symbolize_async, NULL);

  return g_task_propagate_pointer (G_TASK (result), error);
}

/*
 * _sysprof_document_is_native:
 * @self: a #SysprofDocument
 *
 * Returns: %TRUE if frame data does not need to be byte-swapped.
 */
gboolean
_sysprof_document_is_native (SysprofDocument *self)
{
  g_return_val_if_fail (SYSPROF_IS_DOCUMENT (self), FALSE);

  return self->needs_swap == FALSE;
}

/* GTask thread function for sysprof_document_lookup_file_async().
 *
 * Concatenates the data of every file-chunk frame whose path equals the
 * filename stored as task data, stopping after the chunk flagged as last.
 * The task completes with a #GBytes, or with an error if the filename is
 * too long, no data was found, or a chunk claims more data than its
 * frame contains.
 */
static void
sysprof_document_lookup_file (GTask        *task,
                              gpointer      source_object,
                              gpointer      task_data,
                              GCancellable *cancellable)
{
  SysprofDocument *self = source_object;
  g_autoptr(GByteArray) bytes = NULL;
  const char *filename = task_data;
  gboolean is_native;
  gsize filename_len;

  g_assert (G_IS_TASK (task));
  g_assert (SYSPROF_IS_DOCUMENT (source_object));
  g_assert (filename != NULL);
  g_assert (!cancellable || G_IS_CANCELLABLE (cancellable));

  bytes = g_byte_array_new ();
  is_native = self->needs_swap == FALSE;

  filename_len = strlen (filename);

  if (filename_len > 255)
    {
      g_task_return_new_error (task,
                               G_IO_ERROR,
                               G_IO_ERROR_INVALID_FILENAME,
                               "Filename too long for storage in capture file");
      return;
    }

  /* We can access capture data on a thread because the pointers to
   * frames are created during construction and then never mutated.
   *
   * But do remember that frame data may not be byte-swapped. We do
   * not need to swap frame->type because it's 1 byte.
   */

  for (guint i = 0; i < self->frames->len; i++)
    {
      const SysprofDocumentFramePointer *ptr = &g_array_index (self->frames, SysprofDocumentFramePointer, i);
      const SysprofCaptureFrame *frame = (gpointer)&self->base[ptr->offset];
      const SysprofCaptureFileChunk *chunk;
      SysprofCaptureFrameType type = frame->type;
      guint16 data_len;

      /* Ignore everything but file chunks */
      if (type != SYSPROF_CAPTURE_FRAME_FILE_CHUNK)
        continue;

      /* Ignore frames too short to hold the chunk fields preceding the
       * data, so that reading path/len stays within the frame.
       */
      if (ptr->length < G_STRUCT_OFFSET (SysprofCaptureFileChunk, data))
        continue;

      chunk = (const SysprofCaptureFileChunk *)(gpointer)frame;

      /* Check path without being certain frame->path is \0 terminated */
      if (memcmp (filename, chunk->path, filename_len) != 0 ||
          chunk->path[filename_len] != 0)
        continue;

      /* GUINT16_TO_LE()/GUINT16_TO_BE() are no-ops when the host already
       * has that byte order, so a non-native capture needs an
       * unconditional swap.
       */
      if (is_native)
        data_len = chunk->len;
      else
        data_len = GUINT16_SWAP_LE_BE (chunk->len);

      /* Check for corrupted file chunk data length */
      if (G_STRUCT_OFFSET (SysprofCaptureFileChunk, data) + data_len > ptr->length)
        {
          g_byte_array_set_size (bytes, 0);
          break;
        }

      g_byte_array_append (bytes, chunk->data, data_len);

      if (chunk->is_last)
        break;
    }

  if (bytes->len == 0)
    g_task_return_new_error (task,
                             G_IO_ERROR,
                             G_IO_ERROR_NOT_FOUND,
                             "Failed to locate file \"%s\"",
                             filename);
  else
    g_task_return_pointer (task,
                           g_byte_array_free_to_bytes (g_steal_pointer (&bytes)),
                           (GDestroyNotify)g_bytes_unref);
}

/**
 * sysprof_document_lookup_file_async:
 * @self: a #SysprofDocument
 * @filename: the path of the embedded file to look up
 * @cancellable: (nullable): a #GCancellable, or %NULL
 * @callback: a callback to execute upon completion
 * @user_data: closure data for @callback
 *
 * Asynchronously collects the contents of the file named @filename that
 * was embedded within the document. The lookup runs in a worker thread
 * using a private copy of @filename.
 *
 * Call sysprof_document_lookup_file_finish() from @callback to get the
 * result.
 */
void
sysprof_document_lookup_file_async (SysprofDocument     *self,
                                    const char          *filename,
                                    GCancellable        *cancellable,
                                    GAsyncReadyCallback  callback,
                                    gpointer             user_data)
{
  g_autoptr(GTask) task = NULL;

  g_return_if_fail (SYSPROF_IS_DOCUMENT (self));
  g_return_if_fail (filename != NULL);
  g_return_if_fail (!cancellable || G_IS_CANCELLABLE (cancellable));

  task = g_task_new (self, cancellable, callback, user_data);
  g_task_set_source_tag (task, sysprof_document_lookup_file_async);
  g_task_set_task_data (task, g_strdup (filename), g_free);
  g_task_run_in_thread (task, sysprof_document_lookup_file);
}

/**
 * sysprof_document_lookup_file_finish:
 * @self: a #SysprofDocument
 * @result: the #GAsyncResult provided to callback
 * @error: a location for a #GError, or %NULL
 *
 * Completes a request to load the contents of a file that was
 * embedded within the document.
 *
 * Returns: (transfer full): a #GBytes if successful; otherwise %NULL
 *   and @error is set.
 */
GBytes *
sysprof_document_lookup_file_finish (SysprofDocument  *self,
                                     GAsyncResult     *result,
                                     GError          **error)
{
  g_return_val_if_fail (SYSPROF_IS_DOCUMENT (self), NULL);
  g_return_val_if_fail (G_IS_TASK (result), NULL);
  g_return_val_if_fail (g_task_is_valid (result, self), NULL);

  return g_task_propagate_pointer (G_TASK (result), error);
}

/*
 * _sysprof_document_samples:
 * @self: a #SysprofDocument
 *
 * Gets the bitset of frame indexes recorded as samples or allocations
 * while loading. No new reference is added for the caller.
 *
 * Returns: (transfer none): a #GtkBitset owned by @self
 */
GtkBitset *
_sysprof_document_samples (SysprofDocument *self)
{
  g_return_val_if_fail (SYSPROF_IS_DOCUMENT (self), NULL);

  return self->samples;
}