# python-bpf/pythonbpf/vmlinux_parser/class_handler.py
# (file-viewer header: 118 lines, 5.0 KiB, Python)

import logging
from functools import lru_cache
import importlib
from .dependency_handler import DependencyHandler
from .dependency_node import DependencyNode
import ctypes
logger = logging.getLogger(__name__)
@lru_cache(maxsize=1)
def get_module_symbols(module_name: str):
    """Import *module_name* and return its attribute names with the module.

    The result is memoised by ``lru_cache(maxsize=1)``: a repeated call with
    the same name returns the cached tuple (and therefore the very same list
    object) instead of listing the module again.

    Args:
        module_name: Name handed to ``importlib.import_module``.

    Returns:
        A ``(names, module)`` tuple where ``names`` is the list produced by
        ``dir(module)`` and ``module`` is the imported module object.

    Raises:
        ImportError: Propagated from ``importlib.import_module`` when the
            module cannot be imported.
    """
    imported_module = importlib.import_module(module_name)
    # dir() already returns a fresh list, so copying it name by name is redundant.
    return dir(imported_module), imported_module
# Recursive function that gets all the dependent classes and adds them to handler
def process_vmlinux_class(node, llvm_module, handler: DependencyHandler):
    """Register a vmlinux class, and the vmlinux classes it depends on, with *handler*.

    The symbol name is taken from ``node.name``, else ``node.__name__``, else
    ``str(node)``. Its fields are read from ``_fields_`` (ctypes-like) or from
    ``__annotations__``. A new ``DependencyNode`` is added to *handler* and
    every field is classified by the ``__module__`` of its type:

    * ``ctypes``  -> added as ready.
    * ``vmlinux`` -> added as not ready, tagged via ``identify_ctypes_type``,
      then resolved recursively (through ``_type_`` when the field type has
      one) and marked ready once the recursion returns a truthy value.
    * anything else -> ``ValueError``.

    Args:
        node: Object naming the class to resolve (see name lookup above).
        llvm_module: Not used here other than being forwarded to recursive calls.
        handler: Dependency handler that collects the created nodes.

    Returns:
        ``True``, both when the node was newly added and when it was already
        present in *handler*.

    Raises:
        ImportError: The symbol is not listed in the ``vmlinux`` module, or a
            field's contained type (``_type_``) belongs to neither ``ctypes``
            nor ``vmlinux``.
        TypeError: The class exposes neither ``_fields_`` nor ``__annotations__``.
        ValueError: A field type's module is neither ``ctypes`` nor ``vmlinux``.
    """
    symbols_in_module, imported_module = get_module_symbols("vmlinux")

    # Handle both node objects and type objects
    if hasattr(node, "name"):
        current_symbol_name = node.name
    elif hasattr(node, "__name__"):
        current_symbol_name = node.__name__
    else:
        current_symbol_name = str(node)

    if current_symbol_name not in symbols_in_module:
        raise ImportError(f"{current_symbol_name} not present in module vmlinux")
    logger.info(f"Resolving vmlinux class {current_symbol_name}")
    logger.debug(
        f"Current handler state: {handler.is_ready} readiness and {handler.get_all_nodes()} all nodes"
    )

    # Get the class object from the module
    class_obj = getattr(imported_module, current_symbol_name)

    # Build the field-name -> field-type table from whichever layout the class uses.
    # NOTE(review): ``_fields_`` entries are unpacked as (name, type) pairs; ctypes
    # also permits a third bit-width item, which would raise ValueError here --
    # confirm whether the vmlinux module ever contains such entries.
    if hasattr(class_obj, "_fields_"):
        field_table = {
            field_name: field_type for field_name, field_type in class_obj._fields_
        }
    elif hasattr(class_obj, "__annotations__"):
        field_table = dict(class_obj.__annotations__.items())
    else:
        raise TypeError("Could not get required class and definition")

    logger.debug(f"Extracted fields for {current_symbol_name}: {field_table}")

    if handler.has_node(current_symbol_name):
        logger.info("Extraction pruned due to already available field")
        return True

    # The node is added before its fields are walked, so a recursive call for the
    # same symbol reaches the has_node check above (assuming has_node reflects
    # add_node -- verify against DependencyHandler).
    new_dep_node = DependencyNode(name=current_symbol_name)
    handler.add_node(new_dep_node)

    for elem_name, elem_type in field_table.items():
        module_name = getattr(elem_type, "__module__", None)

        if module_name == ctypes.__name__:
            new_dep_node.add_field(elem_name, elem_type, ready=True)
            continue

        if module_name != "vmlinux":
            raise ValueError(
                f"{elem_name} with type {elem_type} not supported in recursive resolver"
            )

        new_dep_node.add_field(elem_name, elem_type, ready=False)
        # Debug trace goes through the module logger rather than stdout.
        logger.debug(f"elem_name: {elem_name} elem_type: {elem_type}")
        # Original author's note: currently fails when a non-normal type appears
        # which is basically everytime
        identify_ctypes_type(elem_name, elem_type, new_dep_node)

        if hasattr(elem_type, "_type_"):
            # The field type wraps another type: resolve the wrapped one.
            contained_type = elem_type._type_
            contained_module = getattr(contained_type, "__module__", None)
            if contained_module == ctypes.__name__:
                new_dep_node.set_field_ready(elem_name, True)
                continue
            if contained_module != "vmlinux":
                # Previously this fell through with no symbol and surfaced as
                # "None not present in module vmlinux"; fail with a clear message.
                raise ImportError(
                    f"{elem_name} with type {elem_type}: contained type "
                    f"{contained_type} not present in module vmlinux"
                )
            symbol_name = (
                contained_type.__name__
                if hasattr(contained_type, "__name__")
                else str(contained_type)
            )
        else:
            symbol_name = (
                elem_type.__name__
                if hasattr(elem_type, "__name__")
                else str(elem_type)
            )

        vmlinux_symbol = getattr(imported_module, symbol_name)
        if process_vmlinux_class(vmlinux_symbol, llvm_module, handler):
            new_dep_node.set_field_ready(elem_name, True)

    logger.info(f"added node: {current_symbol_name}")
    return True
def identify_ctypes_type(elem_name, elem_type, new_dep_node: DependencyNode):
    """Record array/pointer metadata for field *elem_name* on *new_dep_node*.

    * ``ctypes.Array`` subclass: the field type is set to ``ctypes.Array``, the
      containing type to ``elem_type._type_`` and the size to
      ``elem_type._length_``.
    * ``ctypes._Pointer`` subclass: the field type is set to ``ctypes._Pointer``
      and the containing type to ``elem_type._type_``.
    * Any other class: nothing is recorded.

    Args:
        elem_name: Name of the field being described.
        elem_type: Class object of the field's type.
        new_dep_node: Node that receives the metadata.

    Raises:
        TypeError: *elem_type* is not a class.
    """
    if not isinstance(elem_type, type):
        raise TypeError("Instance sent instead of Class")

    is_array = issubclass(elem_type, ctypes.Array)
    if not is_array and not issubclass(elem_type, ctypes._Pointer):
        # Neither an array nor a pointer: there is nothing to tag.
        return

    category = ctypes.Array if is_array else ctypes._Pointer
    new_dep_node.set_field_type(elem_name, category)
    new_dep_node.set_field_containing_type(elem_name, elem_type._type_)
    if is_array:
        # Only arrays carry an element count.
        new_dep_node.set_field_type_size(elem_name, elem_type._length_)