try to separate out ast node from vmlinux type

one recursion issue solved
add support for single depth pointer resolution
2026-02-10 07:00:56 +00:00 · 2025-10-12 01:59:14 +05:30 · 2025-10-12 01:33:23 +05:30 · 2025-10-11 23:18:51 +05:30 · 2025-10-11 22:28:23 +05:30 · 2025-10-11 22:00:25 +05:30
8 changed files with 327 additions and 168 deletions
--- a/.pre-commit-config.yaml
+++ b/.pre-commit-config.yaml
@@ -12,7 +12,7 @@
 #
 # See https://github.com/pre-commit/pre-commit

-exclude: 'vmlinux.*\.py$'
+exclude: 'vmlinux.py'

 ci:
  autoupdate_commit_msg: "chore: update pre-commit hooks"
--- a/pythonbpf/vmlinux_parser/__init__.py
+++ b/pythonbpf/vmlinux_parser/__init__.py
@@ -1 +1,3 @@
 from .import_detector import vmlinux_proc
+
+__all__ = ["vmlinux_proc"]
--- a/pythonbpf/vmlinux_parser/class_handler.py
+++ b/pythonbpf/vmlinux_parser/class_handler.py
@@ -0,0 +1,177 @@
+import logging
+from functools import lru_cache
+import importlib
+from .dependency_handler import DependencyHandler
+from .dependency_node import DependencyNode
+import ctypes
+
+logger = logging.getLogger(__name__)
+
+
+@lru_cache(maxsize=1)
+def get_module_symbols(module_name: str):
+    imported_module = importlib.import_module(module_name)
+    return [name for name in dir(imported_module)], imported_module
+
+def process_vmlinux_class(node, llvm_module, handler: DependencyHandler):
+    symbols_in_module, imported_module = get_module_symbols("vmlinux")
+    if node.name in symbols_in_module:
+        vmlinux_type = getattr(imported_module, node.name)
+        process_vmlinux_post_ast(vmlinux_type, llvm_module, handler)
+    else:
+        raise ImportError(f"{node.name} not in vmlinux")
+
+# Recursive function that gets all the dependent classes and adds them to handler
+def process_vmlinux_post_ast(node, llvm_module, handler: DependencyHandler, processing_stack=None):
+    """
+    Recursively process vmlinux classes and their dependencies.
+
+    Args:
+        node: The class/type to process
+        llvm_module: The LLVM module context
+        handler: DependencyHandler to track all nodes
+        processing_stack: Set of currently processing nodes to detect cycles
+    """
+    # Initialize processing stack on first call
+    if processing_stack is None:
+        processing_stack = set()
+
+    symbols_in_module, imported_module = get_module_symbols("vmlinux")
+
+    # Handle both node objects and type objects
+    if hasattr(node, "name"):
+        current_symbol_name = node.name
+    elif hasattr(node, "__name__"):
+        current_symbol_name = node.__name__
+    else:
+        current_symbol_name = str(node)
+
+    if current_symbol_name not in symbols_in_module:
+        raise ImportError(f"{current_symbol_name} not present in module vmlinux")
+
+    # Check if we're already processing this node (circular dependency)
+    if current_symbol_name in processing_stack:
+        logger.debug(f"Circular dependency detected for {current_symbol_name}, skipping")
+        return True
+
+    # Check if already processed
+    if handler.has_node(current_symbol_name):
+        existing_node = handler.get_node(current_symbol_name)
+        # If the node exists and is ready, we're done
+        if existing_node and existing_node.is_ready:
+            logger.info(f"Node {current_symbol_name} already processed and ready")
+            return True
+
+    logger.info(f"Resolving vmlinux class {current_symbol_name}")
+    logger.debug(
+        f"Current handler state: {handler.is_ready} readiness and {handler.get_all_nodes()} all nodes"
+    )
+
+    # Add to processing stack to detect cycles
+    processing_stack.add(current_symbol_name)
+
+    try:
+        field_table = {}  # should contain the field and its type.
+
+        # Get the class object from the module
+        class_obj = getattr(imported_module, current_symbol_name)
+
+        # Inspect the class fields
+        if hasattr(class_obj, "_fields_"):
+            for field_name, field_type in class_obj._fields_:
+                field_table[field_name] = field_type
+        elif hasattr(class_obj, "__annotations__"):
+            for field_name, field_type in class_obj.__annotations__.items():
+                field_table[field_name] = field_type
+        else:
+            raise TypeError("Could not get required class and definition")
+
+        logger.debug(f"Extracted fields for {current_symbol_name}: {field_table}")
+
+        # Create or get the node
+        if handler.has_node(current_symbol_name):
+            new_dep_node = handler.get_node(current_symbol_name)
+        else:
+            new_dep_node = DependencyNode(name=current_symbol_name)
+            handler.add_node(new_dep_node)
+
+        # Process each field
+        for elem_name, elem_type in field_table.items():
+            module_name = getattr(elem_type, "__module__", None)
+
+            if module_name == ctypes.__name__:
+                # Simple ctypes - mark as ready immediately
+                new_dep_node.add_field(elem_name, elem_type, ready=True)
+
+            elif module_name == "vmlinux":
+                # Complex vmlinux type - needs recursive processing
+                new_dep_node.add_field(elem_name, elem_type, ready=False)
+                logger.debug(f"Processing vmlinux field: {elem_name}, type: {elem_type}")
+
+                identify_ctypes_type(elem_name, elem_type, new_dep_node)
+
+                # Determine the actual symbol to process
+                symbol_name = (
+                    elem_type.__name__
+                    if hasattr(elem_type, "__name__")
+                    else str(elem_type)
+                )
+                vmlinux_symbol = None
+
+                # Handle pointers/arrays to other types
+                if hasattr(elem_type, "_type_"):
+                    containing_module_name = getattr(
+                        (elem_type._type_), "__module__", None
+                    )
+                    if containing_module_name == ctypes.__name__:
+                        # Pointer/Array to ctypes - mark as ready
+                        new_dep_node.set_field_ready(elem_name, True)
+                        continue
+                    elif containing_module_name == "vmlinux":
+                        # Pointer/Array to vmlinux type
+                        symbol_name = (
+                            (elem_type._type_).__name__
+                            if hasattr((elem_type._type_), "__name__")
+                            else str(elem_type._type_)
+                        )
+
+                        # Self-referential check
+                        if symbol_name == current_symbol_name:
+                            logger.debug(f"Self-referential field {elem_name} in {current_symbol_name}")
+                            # For pointers to self, we can mark as ready since the type is being defined
+                            new_dep_node.set_field_ready(elem_name, True)
+                            continue
+
+                        vmlinux_symbol = getattr(imported_module, symbol_name)
+                else:
+                    # Direct vmlinux type (not pointer/array)
+                    vmlinux_symbol = getattr(imported_module, symbol_name)
+
+                # Recursively process the dependency
+                if vmlinux_symbol is not None:
+                    if process_vmlinux_post_ast(vmlinux_symbol, llvm_module, handler, processing_stack):
+                        new_dep_node.set_field_ready(elem_name, True)
+            else:
+                raise ValueError(
+                    f"{elem_name} with type {elem_type} not supported in recursive resolver"
+                )
+
+        logger.info(f"Successfully processed node: {current_symbol_name}")
+        return True
+
+    finally:
+        # Remove from processing stack when done
+        processing_stack.discard(current_symbol_name)
+
+
+def identify_ctypes_type(elem_name, elem_type, new_dep_node: DependencyNode):
+    if isinstance(elem_type, type):
+        if issubclass(elem_type, ctypes.Array):
+            new_dep_node.set_field_type(elem_name, ctypes.Array)
+            new_dep_node.set_field_containing_type(elem_name, elem_type._type_)
+            new_dep_node.set_field_type_size(elem_name, elem_type._length_)
+        elif issubclass(elem_type, ctypes._Pointer):
+            new_dep_node.set_field_type(elem_name, ctypes._Pointer)
+            new_dep_node.set_field_containing_type(elem_name, elem_type._type_)
+    else:
+        raise TypeError("Instance sent instead of Class")
--- a/pythonbpf/vmlinux_parser/dependency_node.py
+++ b/pythonbpf/vmlinux_parser/dependency_node.py
@@ -1,12 +1,15 @@
 from dataclasses import dataclass, field
 from typing import Dict, Any, Optional

-
+# TODO: Fix the type naming convention.
 @dataclass
 class Field:
    """Represents a field in a dependency node with its type and readiness state."""
+
    name: str
    type: type
+    containing_type: Optional[Any]
+    type_size: Optional[int]
    value: Any = None
    ready: bool = False

@@ -20,6 +23,26 @@ class Field:
        if mark_ready:
            self.ready = True

+    def set_type(self, given_type, mark_ready: bool = True) -> None:
+        """Set value of the type field and mark as ready"""
+        self.type = given_type
+        if mark_ready:
+            self.ready = True
+
+    def set_containing_type(
+        self, containing_type: Optional[Any], mark_ready: bool = True
+    ) -> None:
+        """Set the containing_type of this field and optionally mark it as ready."""
+        self.containing_type = containing_type
+        if mark_ready:
+            self.ready = True
+
+    def set_type_size(self, type_size: Any, mark_ready: bool = True) -> None:
+        """Set the type_size of this field and optionally mark it as ready."""
+        self.type_size = type_size
+        if mark_ready:
+            self.ready = True
+

 @dataclass
 class DependencyNode:
@@ -64,13 +87,29 @@ class DependencyNode:
        ready_fields = somestruct.get_ready_fields()
        print(f"Ready fields: {[field.name for field in ready_fields.values()]}")  # ['field_1', 'field_2']
    """
+
    name: str
    fields: Dict[str, Field] = field(default_factory=dict)
    _ready_cache: Optional[bool] = field(default=None, repr=False)

-    def add_field(self, name: str, field_type: type, initial_value: Any = None, ready: bool = False) -> None:
+    def add_field(
+        self,
+        name: str,
+        field_type: type,
+        initial_value: Any = None,
+        containing_type: Optional[Any] = None,
+        type_size: Optional[int] = None,
+        ready: bool = False,
+    ) -> None:
        """Add a field to the node with an optional initial value and readiness state."""
-        self.fields[name] = Field(name=name, type=field_type, value=initial_value, ready=ready)
+        self.fields[name] = Field(
+            name=name,
+            type=field_type,
+            value=initial_value,
+            ready=ready,
+            containing_type=containing_type,
+            type_size=type_size,
+        )
        # Invalidate readiness cache
        self._ready_cache = None

@@ -87,6 +126,37 @@ class DependencyNode:
        # Invalidate readiness cache
        self._ready_cache = None

+    def set_field_type(self, name: str, type: Any, mark_ready: bool = True) -> None:
+        """Set a field's type and optionally mark it as ready."""
+        if name not in self.fields:
+            raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
+
+        self.fields[name].set_type(type, mark_ready)
+        # Invalidate readiness cache
+        self._ready_cache = None
+
+    def set_field_containing_type(
+        self, name: str, containing_type: Any, mark_ready: bool = True
+    ) -> None:
+        """Set a field's containing_type and optionally mark it as ready."""
+        if name not in self.fields:
+            raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
+
+        self.fields[name].set_containing_type(containing_type, mark_ready)
+        # Invalidate readiness cache
+        self._ready_cache = None
+
+    def set_field_type_size(
+        self, name: str, type_size: Any, mark_ready: bool = True
+    ) -> None:
+        """Set a field's type_size and optionally mark it as ready."""
+        if name not in self.fields:
+            raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
+
+        self.fields[name].set_type_size(type_size, mark_ready)
+        # Invalidate readiness cache
+        self._ready_cache = None
+
    def set_field_ready(self, name: str, is_ready: bool = True) -> None:
        """Mark a field as ready or not ready."""
        if name not in self.fields:
--- a/pythonbpf/vmlinux_parser/import_detector.py
+++ b/pythonbpf/vmlinux_parser/import_detector.py
@@ -6,7 +6,7 @@ import inspect

 from .dependency_handler import DependencyHandler
 from .ir_generation import IRGenerator
-from .vmlinux_class_handler import process_vmlinux_class
+from .class_handler import process_vmlinux_class

 logger = logging.getLogger(__name__)

@@ -58,8 +58,8 @@ def detect_import_statement(tree: ast.AST) -> List[Tuple[str, ast.ImportFrom]]:
                # Valid single import
                for alias in node.names:
                    import_name = alias.name
-                    # Use alias if provided, otherwise use the original name
-                    as_name = alias.asname if alias.asname else alias.name
+                    # Use alias if provided, otherwise use the original name (commented)
+                    # as_name = alias.asname if alias.asname else alias.name
                    vmlinux_imports.append(("vmlinux", node))
                    logger.info(f"Found vmlinux import: {import_name}")

@@ -68,13 +68,14 @@ def detect_import_statement(tree: ast.AST) -> List[Tuple[str, ast.ImportFrom]]:
            for alias in node.names:
                if alias.name == "vmlinux" or alias.name.startswith("vmlinux."):
                    raise SyntaxError(
-                        f"Direct import of vmlinux module is not supported. "
-                        f"Use 'from vmlinux import <type>' instead."
+                        "Direct import of vmlinux module is not supported. "
+                        "Use 'from vmlinux import <type>' instead."
                    )

    logger.info(f"Total vmlinux imports detected: {len(vmlinux_imports)}")
    return vmlinux_imports

+
 def vmlinux_proc(tree: ast.AST, module):
    import_statements = detect_import_statement(tree)

@@ -107,7 +108,10 @@ def vmlinux_proc(tree: ast.AST, module):
            imported_name = alias.name
            found = False
            for mod_node in mod_ast.body:
-                if isinstance(mod_node, ast.ClassDef) and mod_node.name == imported_name:
+                if (
+                    isinstance(mod_node, ast.ClassDef)
+                    and mod_node.name == imported_name
+                ):
                    process_vmlinux_class(mod_node, module, handler)
                    found = True
                    break
@@ -120,9 +124,12 @@ def vmlinux_proc(tree: ast.AST, module):
                if found:
                    break
            if not found:
-                logger.info(f"{imported_name} not found as ClassDef or Assign in vmlinux")
+                logger.info(
+                    f"{imported_name} not found as ClassDef or Assign in vmlinux"
+                )

    IRGenerator(module, handler)

+
 def process_vmlinux_assign(node, module, assignments: Dict[str, type]):
    raise NotImplementedError("Assignment handling has not been implemented yet")
--- a/pythonbpf/vmlinux_parser/vmlinux_class_handler.py
+++ b/pythonbpf/vmlinux_parser/vmlinux_class_handler.py
@@ -1,96 +0,0 @@
-import ast
-import logging
-from functools import lru_cache
-import importlib
-from .dependency_handler import DependencyHandler
-from .dependency_node import DependencyNode
-import ctypes
-
-logger = logging.getLogger(__name__)
-
-
-@lru_cache(maxsize=1)
-def get_module_symbols(module_name: str):
-    imported_module = importlib.import_module(module_name)
-    return [name for name in dir(imported_module)], imported_module
-
-
-# Recursive function that gets all the dependent classes and adds them to handler
-def process_vmlinux_class(node, llvm_module, handler: DependencyHandler):
-    symbols_in_module, imported_module = get_module_symbols("vmlinux")
-
-    # Handle both node objects and type objects
-    if hasattr(node, 'name'):
-        current_symbol_name = node.name
-    elif hasattr(node, '__name__'):
-        current_symbol_name = node.__name__
-    else:
-        current_symbol_name = str(node)
-
-    if current_symbol_name not in symbols_in_module:
-        raise ImportError(f"{current_symbol_name} not present in module vmlinux")
-    logger.info(f"Resolving vmlinux class {current_symbol_name}")
-    logger.debug(f"Current handler state: {handler.is_ready} readiness and {handler.get_all_nodes()} all nodes")
-    field_table = {}  # should contain the field and it's type.
-
-    # Get the class object from the module
-    class_obj = getattr(imported_module, current_symbol_name)
-
-    # Below, I've written a general structure that gets class-info
-    # everytime, no matter the format in which it is present
-
-    # Inspect the class fields
-    # Assuming class_obj has fields stored in some standard way
-    # If it's a ctypes-like structure with _fields_
-    if hasattr(class_obj, '_fields_'):
-        for field_name, field_type in class_obj._fields_:
-            field_table[field_name] = field_type
-
-    # If it's using __annotations__
-    elif hasattr(class_obj, '__annotations__'):
-        for field_name, field_type in class_obj.__annotations__.items():
-            field_table[field_name] = field_type
-
-    else:
-        raise TypeError("Could not get required class and definition")
-
-    logger.debug(f"Extracted fields for {current_symbol_name}: {field_table}")
-    if handler.has_node(current_symbol_name):
-        logger.info("Extraction pruned due to already available field")
-        return True
-    else:
-        new_dep_node = DependencyNode(name=current_symbol_name)
-        for elem_name, elem_type in field_table.items():
-            module_name = getattr(elem_type, "__module__", None)
-            if module_name == ctypes.__name__:
-                new_dep_node.add_field(elem_name, elem_type, ready=True)
-            elif module_name == "vmlinux":
-                new_dep_node.add_field(elem_name, elem_type, ready=False)
-                print("elem_name:", elem_name, "elem_type:", elem_type)
-                # currently fails when a non-normal type appears which is basically everytime
-                identify_ctypes_type(elem_type)
-                symbol_name = elem_type.__name__ if hasattr(elem_type, '__name__') else str(elem_type)
-                vmlinux_symbol = getattr(imported_module, symbol_name)
-                if process_vmlinux_class(vmlinux_symbol, llvm_module, handler):
-                    new_dep_node.set_field_ready(elem_name, True)
-            else:
-                raise ValueError(f"{elem_name} with type {elem_type} not supported in recursive resolver")
-        handler.add_node(new_dep_node)
-        logger.info(f"added node: {current_symbol_name}")
-
-    return True
-
-def identify_ctypes_type(t):
-    if isinstance(t, type):  # t is a type/class
-        if issubclass(t, ctypes.Array):
-            print("Array type")
-            print("Element type:", t._type_)
-            print("Length:", t._length_)
-        elif issubclass(t, ctypes._Pointer):
-            print("Pointer type")
-            print("Points to:", t._type_)
-        elif issubclass(t, ctypes._SimpleCData):
-            print("Scalar type")
-            print("Base type:", t)
-    else:
-        raise TypeError("Instance sent instead of Class")
--- a/tests/failing_tests/xdp_pass.py
+++ b/tests/failing_tests/xdp_pass.py
@@ -1,9 +1,9 @@
 from pythonbpf import bpf, map, section, bpfglobal, compile, compile_to_ir
 from pythonbpf.maps import HashMap
 from pythonbpf.helper import XDP_PASS
-from vmlinux import struct_xdp_md
 from vmlinux import struct_ring_buffer_per_cpu  # noqa: F401
 from vmlinux import struct_xdp_buff  # noqa: F401
+from vmlinux import struct_xdp_md
 from ctypes import c_int64

 # Instructions to how to run this program
--- a/tools/vmlinux-gen.py
+++ b/tools/vmlinux-gen.py
@@ -26,8 +26,13 @@ import tempfile


 class BTFConverter:
-    def __init__(self, btf_source="/sys/kernel/btf/vmlinux", output_file="vmlinux.py",
-                 keep_intermediate=False, verbose=False):
+    def __init__(
+        self,
+        btf_source="/sys/kernel/btf/vmlinux",
+        output_file="vmlinux.py",
+        keep_intermediate=False,
+        verbose=False,
+    ):
        self.btf_source = btf_source
        self.output_file = output_file
        self.keep_intermediate = keep_intermediate
@@ -44,11 +49,7 @@ class BTFConverter:
        self.log(f"{description}...")
        try:
            result = subprocess.run(
-                cmd,
-                shell=True,
-                check=True,
-                capture_output=True,
-                text=True
+                cmd, shell=True, check=True, capture_output=True, text=True
            )
            if self.verbose and result.stdout:
                print(result.stdout)
@@ -69,51 +70,55 @@ class BTFConverter:
        """Step 1.5: Preprocess enum definitions."""
        self.log("Preprocessing enum definitions...")

-        with open(input_file, 'r') as f:
+        with open(input_file, "r") as f:
            original_code = f.read()

        # Extract anonymous enums
        enums = re.findall(
-            r'(?<!typedef\s)(enum\s*\{[^}]*\})\s*(\w+)\s*(?::\s*\d+)?\s*;',
-            original_code
+            r"(?<!typedef\s)(enum\s*\{[^}]*\})\s*(\w+)\s*(?::\s*\d+)?\s*;",
+            original_code,
        )
-        enum_defs = [enum_block + ';' for enum_block, _ in enums]
+        enum_defs = [enum_block + ";" for enum_block, _ in enums]

        # Replace anonymous enums with int declarations
        processed_code = re.sub(
-            r'(?<!typedef\s)enum\s*\{[^}]*\}\s*(\w+)\s*(?::\s*\d+)?\s*;',
-            r'int \1;',
-            original_code
+            r"(?<!typedef\s)enum\s*\{[^}]*\}\s*(\w+)\s*(?::\s*\d+)?\s*;",
+            r"int \1;",
+            original_code,
        )

        # Prepend enum definitions
        if enum_defs:
-            enum_text = '\n'.join(enum_defs) + '\n\n'
+            enum_text = "\n".join(enum_defs) + "\n\n"
            processed_code = enum_text + processed_code

        output_file = os.path.join(self.temp_dir, "vmlinux_processed.h")
-        with open(output_file, 'w') as f:
+        with open(output_file, "w") as f:
            f.write(processed_code)

        return output_file

    def step2_5_process_kioctx(self, input_file):
-        #TODO: this is a very bad bug and design decision. A single struct has an issue mostly.
+        # TODO: this is a very bad bug and design decision. A single struct has an issue mostly.
        """Step 2.5: Process struct kioctx to extract nested anonymous structs."""
        self.log("Processing struct kioctx nested structs...")

-        with open(input_file, 'r') as f:
+        with open(input_file, "r") as f:
            content = f.read()

        # Pattern to match struct kioctx with its full body (handles multiple nesting levels)
-        kioctx_pattern = r'struct\s+kioctx\s*\{(?:[^{}]|\{(?:[^{}]|\{[^{}]*\})*\})*\}\s*;'
+        kioctx_pattern = (
+            r"struct\s+kioctx\s*\{(?:[^{}]|\{(?:[^{}]|\{[^{}]*\})*\})*\}\s*;"
+        )

        def process_kioctx_replacement(match):
            full_struct = match.group(0)
            self.log(f"Found struct kioctx, length: {len(full_struct)} chars")

            # Extract the struct body (everything between outermost { and })
-            body_match = re.search(r'struct\s+kioctx\s*\{(.*)\}\s*;', full_struct, re.DOTALL)
+            body_match = re.search(
+                r"struct\s+kioctx\s*\{(.*)\}\s*;", full_struct, re.DOTALL
+            )
            if not body_match:
                return full_struct

@@ -121,7 +126,7 @@ class BTFConverter:

            # Find all anonymous structs within the body
            # Pattern: struct { ... } followed by ; (not a member name)
-            anon_struct_pattern = r'struct\s*\{[^}]*\}'
+            # anon_struct_pattern = r"struct\s*\{[^}]*\}"

            anon_structs = []
            anon_counter = 4  # Start from 4, counting down to 1
@@ -131,7 +136,9 @@ class BTFConverter:
                anon_struct_content = m.group(0)

                # Extract the body of the anonymous struct
-                anon_body_match = re.search(r'struct\s*\{(.*)\}', anon_struct_content, re.DOTALL)
+                anon_body_match = re.search(
+                    r"struct\s*\{(.*)\}", anon_struct_content, re.DOTALL
+                )
                if not anon_body_match:
                    return anon_struct_content

@@ -154,7 +161,7 @@ class BTFConverter:
            processed_body = body

            # Find all occurrences and process them
-            pattern_with_semicolon = r'struct\s*\{([^}]*)\}\s*;'
+            pattern_with_semicolon = r"struct\s*\{([^}]*)\}\s*;"
            matches = list(re.finditer(pattern_with_semicolon, body, re.DOTALL))

            if not matches:
@@ -178,14 +185,16 @@ class BTFConverter:

                # Replace in the body
                replacement = f"struct {anon_name} {member_name};"
-                processed_body = processed_body[:start_pos] + replacement + processed_body[end_pos:]
+                processed_body = (
+                    processed_body[:start_pos] + replacement + processed_body[end_pos:]
+                )

                anon_counter -= 1

            # Rebuild the complete definition
            if anon_structs:
                # Prepend the anonymous struct definitions
-                anon_definitions = '\n'.join(anon_structs) + '\n\n'
+                anon_definitions = "\n".join(anon_structs) + "\n\n"
                new_struct = f"struct kioctx {{{processed_body}}};"
                return anon_definitions + new_struct
            else:
@@ -193,14 +202,11 @@ class BTFConverter:

        # Apply the transformation
        processed_content = re.sub(
-            kioctx_pattern,
-            process_kioctx_replacement,
-            content,
-            flags=re.DOTALL
+            kioctx_pattern, process_kioctx_replacement, content, flags=re.DOTALL
        )

        output_file = os.path.join(self.temp_dir, "vmlinux_kioctx_processed.h")
-        with open(output_file, 'w') as f:
+        with open(output_file, "w") as f:
            f.write(processed_content)

        self.log(f"Saved kioctx-processed output to {output_file}")
@@ -218,7 +224,7 @@ class BTFConverter:
        output_file = os.path.join(self.temp_dir, "vmlinux_raw.py")
        cmd = (
            f"clang2py {input_file} -o {output_file} "
-            f"--clang-args=\"-fno-ms-extensions -I/usr/include -I/usr/include/linux\""
+            f'--clang-args="-fno-ms-extensions -I/usr/include -I/usr/include/linux"'
        )
        self.run_command(cmd, "Converting to Python ctypes")
        return output_file
@@ -234,25 +240,21 @@ class BTFConverter:
        data = re.sub(r"\('_[0-9]+',\s*ctypes\.[a-zA-Z0-9_]+,\s*0\),?\s*\n?", "", data)

        # Replace ('_20', ctypes.c_uint64, 64) → ('_20', ctypes.c_uint64)
-        data = re.sub(r"\('(_[0-9]+)',\s*(ctypes\.[a-zA-Z0-9_]+),\s*[0-9]+\)", r"('\1', \2)", data)
+        data = re.sub(
+            r"\('(_[0-9]+)',\s*(ctypes\.[a-zA-Z0-9_]+),\s*[0-9]+\)", r"('\1', \2)", data
+        )

        # Replace ('_20', ctypes.c_char, 8) with ('_20', ctypes.c_uint8, 8)
-        data = re.sub(
-            r"(ctypes\.c_char)(\s*,\s*\d+\))",
-            r"ctypes.c_uint8\2",
-            data
-        )
+        data = re.sub(r"(ctypes\.c_char)(\s*,\s*\d+\))", r"ctypes.c_uint8\2", data)

        # below to replace those c_bool with bitfield greater than 8
        def repl(m):
            name, bits = m.groups()
-            return f"('{name}', ctypes.c_uint32, {bits})" if int(bits) > 8 else m.group(0)
+            return (
+                f"('{name}', ctypes.c_uint32, {bits})" if int(bits) > 8 else m.group(0)
+            )

-        data = re.sub(
-            r"\('([^']+)',\s*ctypes\.c_bool,\s*(\d+)\)",
-            repl,
-            data
-        )
+        data = re.sub(r"\('([^']+)',\s*ctypes\.c_bool,\s*(\d+)\)", repl, data)

        # Remove ctypes. prefix from invalid entries
        invalid_ctypes = ["bpf_iter_state", "_cache_type", "fs_context_purpose"]
@@ -269,6 +271,7 @@ class BTFConverter:
        if not self.keep_intermediate and self.temp_dir != ".":
            self.log(f"Cleaning up temporary directory: {self.temp_dir}")
            import shutil
+
            shutil.rmtree(self.temp_dir, ignore_errors=True)

    def convert(self):
@@ -292,6 +295,7 @@ class BTFConverter:
        except Exception as e:
            print(f"\n✗ Error during conversion: {e}", file=sys.stderr)
            import traceback
+
            traceback.print_exc()
            sys.exit(1)
        finally:
@@ -304,18 +308,13 @@ class BTFConverter:
        dependencies = {
            "bpftool": "bpftool --version",
            "clang": "clang --version",
-            "clang2py": "clang2py --version"
+            "clang2py": "clang2py --version",
        }

        missing = []
        for tool, cmd in dependencies.items():
            try:
-                subprocess.run(
-                    cmd,
-                    shell=True,
-                    check=True,
-                    capture_output=True
-                )
+                subprocess.run(cmd, shell=True, check=True, capture_output=True)
            except subprocess.CalledProcessError:
                missing.append(tool)

@@ -337,31 +336,31 @@ Examples:
  %(prog)s
  %(prog)s -o kernel_types.py
  %(prog)s --btf-source /sys/kernel/btf/custom_module -k -v
-        """
+        """,
    )

    parser.add_argument(
        "--btf-source",
        default="/sys/kernel/btf/vmlinux",
-        help="Path to BTF source (default: /sys/kernel/btf/vmlinux)"
+        help="Path to BTF source (default: /sys/kernel/btf/vmlinux)",
    )

    parser.add_argument(
-        "-o", "--output",
+        "-o",
+        "--output",
        default="vmlinux.py",
-        help="Output Python file (default: vmlinux.py)"
+        help="Output Python file (default: vmlinux.py)",
    )

    parser.add_argument(
-        "-k", "--keep-intermediate",
+        "-k",
+        "--keep-intermediate",
        action="store_true",
-        help="Keep intermediate files (vmlinux.h, vmlinux_processed.h, etc.)"
+        help="Keep intermediate files (vmlinux.h, vmlinux_processed.h, etc.)",
    )

    parser.add_argument(
-        "-v", "--verbose",
-        action="store_true",
-        help="Enable verbose output"
+        "-v", "--verbose", action="store_true", help="Enable verbose output"
    )

    args = parser.parse_args()
@@ -370,7 +369,7 @@ Examples:
        btf_source=args.btf_source,
        output_file=args.output,
        keep_intermediate=args.keep_intermediate,
-        verbose=args.verbose
+        verbose=args.verbose,
    )

    converter.convert()
Author	SHA1	Message	Date
varun-r-mallya	8774277000	try to separate out ast node from vmlinux type	2025-10-12 01:59:14 +05:30
varun-r-mallya	8743ea17f3	one recursion issue solved	2025-10-12 01:33:23 +05:30
varun-r-mallya	f8844104a6	add support for single depth pointer resolution	2025-10-11 23:18:51 +05:30
varun-r-mallya	3343bedd11	add extra fields to Field datatype Signed-off-by: varun-r-mallya <varunrmallya@gmail.com>	2025-10-11 22:28:23 +05:30
varun-r-mallya	75d3ad4fe2	format chore	2025-10-11 22:00:25 +05:30