mirror of
https://github.com/varun-r-mallya/Python-BPF.git
synced 2026-02-11 15:40:56 +00:00
Compare commits
97 Commits
refactor_a
...
d4f5a9c36e
| Author | SHA1 | Date | |
|---|---|---|---|
| d4f5a9c36e | |||
| 20ec307288 | |||
| 0b4c6264a8 | |||
| e5741562f6 | |||
| 93634a4769 | |||
| 9b8462f1ed | |||
| 785182787c | |||
| 80396c78a6 | |||
| 8774277000 | |||
| 8743ea17f3 | |||
| f8844104a6 | |||
| 3343bedd11 | |||
| 75d3ad4fe2 | |||
| abbf17748d | |||
| 7c559840f0 | |||
| 06773c895f | |||
| 1e3d775865 | |||
| 168e26268e | |||
| 2cf7b28793 | |||
| d24d59c2ba | |||
| f190a33e21 | |||
| eb636ef731 | |||
| 2ae3aade60 | |||
| f227fe9310 | |||
| 7940d02bc7 | |||
| 2483ef2840 | |||
| 68e9693f9a | |||
| e4575a6b1e | |||
| 3ec3ab30fe | |||
| 7fb3ecff48 | |||
| ec59dad025 | |||
| 28b7b1620c | |||
| 9f8e240a38 | |||
| e6c05ab494 | |||
| 8aa9cf7119 | |||
| 9683e3799f | |||
| 200d293750 | |||
| ed196caebf | |||
| a049796b81 | |||
| 384fc9dd40 | |||
| 5f2df57e64 | |||
| 130d8a9edc | |||
| 40ae3d825a | |||
| 484624104e | |||
| e7c4bdb150 | |||
| 7210366e7d | |||
| 435bf27176 | |||
| 1ba27ac7cf | |||
| e4ddec3a02 | |||
| bc7b5c97d1 | |||
| fa720f8e6b | |||
| eff0f66d95 | |||
| b43c252224 | |||
| aae7aa981d | |||
| 6f9a7301af | |||
| 48923d03d4 | |||
| 019a83cf11 | |||
| 140d9e6e35 | |||
| a351b0f1b5 | |||
| 3cb73ff0c3 | |||
| 3b08c2bede | |||
| 86378d6cc4 | |||
| 00d1c583af | |||
| cfc246c80d | |||
| f3c80f9e5f | |||
| 0d3a5748dd | |||
| 079431754c | |||
| 46f5eca33d | |||
| 7081e939fb | |||
| 1e29460d6f | |||
| e180a89644 | |||
| 34a267e982 | |||
| c81aad7c67 | |||
| 2e677c2c7b | |||
| 4ea7b22b44 | |||
| b8b937bfca | |||
| 6cc29c4fa1 | |||
| 5451ba646d | |||
| 7720437ca5 | |||
| eb0a7a917d | |||
| 6f65903552 | |||
| 97e74d09be | |||
| 9c7560ed2e | |||
| 2979ceedcf | |||
| 745f59278f | |||
| 49c59b32ca | |||
| ff78140a7d | |||
| 82ff71b753 | |||
| f46e7cd846 | |||
| 9d73eb67c4 | |||
| 21ce041353 | |||
| 6402cf7be5 | |||
| 9a96e1247b | |||
| 989134f4be | |||
| b95fbd0ed0 | |||
| d84ce0c6fa | |||
| 8d07a4cd05 |
3
.gitignore
vendored
3
.gitignore
vendored
@ -7,3 +7,6 @@ __pycache__/
|
|||||||
*.ll
|
*.ll
|
||||||
*.o
|
*.o
|
||||||
.ipynb_checkpoints/
|
.ipynb_checkpoints/
|
||||||
|
vmlinux.py
|
||||||
|
~*
|
||||||
|
vmlinux.h
|
||||||
|
|||||||
@ -12,7 +12,7 @@
|
|||||||
#
|
#
|
||||||
# See https://github.com/pre-commit/pre-commit
|
# See https://github.com/pre-commit/pre-commit
|
||||||
|
|
||||||
exclude: 'vmlinux.*\.py$'
|
exclude: 'vmlinux.py'
|
||||||
|
|
||||||
ci:
|
ci:
|
||||||
autoupdate_commit_msg: "chore: update pre-commit hooks"
|
autoupdate_commit_msg: "chore: update pre-commit hooks"
|
||||||
@ -41,7 +41,7 @@ repos:
|
|||||||
- id: ruff
|
- id: ruff
|
||||||
args: ["--fix", "--show-fixes"]
|
args: ["--fix", "--show-fixes"]
|
||||||
- id: ruff-format
|
- id: ruff-format
|
||||||
exclude: ^(docs)|^(tests)|^(examples)
|
# exclude: ^(docs)|^(tests)|^(examples)
|
||||||
|
|
||||||
# Checking static types
|
# Checking static types
|
||||||
- repo: https://github.com/pre-commit/mirrors-mypy
|
- repo: https://github.com/pre-commit/mirrors-mypy
|
||||||
|
|||||||
@ -83,14 +83,14 @@ def hist() -> HashMap:
|
|||||||
def hello(ctx: c_void_p) -> c_int64:
|
def hello(ctx: c_void_p) -> c_int64:
|
||||||
process_id = pid()
|
process_id = pid()
|
||||||
one = 1
|
one = 1
|
||||||
prev = hist().lookup(process_id)
|
prev = hist.lookup(process_id)
|
||||||
if prev:
|
if prev:
|
||||||
previous_value = prev + 1
|
previous_value = prev + 1
|
||||||
print(f"count: {previous_value} with {process_id}")
|
print(f"count: {previous_value} with {process_id}")
|
||||||
hist().update(process_id, previous_value)
|
hist.update(process_id, previous_value)
|
||||||
return c_int64(0)
|
return c_int64(0)
|
||||||
else:
|
else:
|
||||||
hist().update(process_id, one)
|
hist.update(process_id, one)
|
||||||
return c_int64(0)
|
return c_int64(0)
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
13
TODO.md
13
TODO.md
@ -1,13 +0,0 @@
|
|||||||
## Short term
|
|
||||||
|
|
||||||
- Implement enough functionality to port the BCC tutorial examples in PythonBPF
|
|
||||||
- Add all maps
|
|
||||||
- XDP support in pylibbpf
|
|
||||||
- ringbuf support
|
|
||||||
- Add oneline IfExpr conditionals (wishlist)
|
|
||||||
|
|
||||||
## Long term
|
|
||||||
|
|
||||||
- Refactor the codebase to be better than a hackathon project
|
|
||||||
- Port to C++ and use actual LLVM?
|
|
||||||
- Fix struct_kioctx issue in the vmlinux transpiler
|
|
||||||
@ -308,6 +308,7 @@
|
|||||||
"def hist() -> HashMap:\n",
|
"def hist() -> HashMap:\n",
|
||||||
" return HashMap(key=c_int32, value=c_uint64, max_entries=4096)\n",
|
" return HashMap(key=c_int32, value=c_uint64, max_entries=4096)\n",
|
||||||
"\n",
|
"\n",
|
||||||
|
"\n",
|
||||||
"@bpf\n",
|
"@bpf\n",
|
||||||
"@section(\"tracepoint/syscalls/sys_enter_clone\")\n",
|
"@section(\"tracepoint/syscalls/sys_enter_clone\")\n",
|
||||||
"def hello(ctx: c_void_p) -> c_int64:\n",
|
"def hello(ctx: c_void_p) -> c_int64:\n",
|
||||||
@ -329,6 +330,7 @@
|
|||||||
"def LICENSE() -> str:\n",
|
"def LICENSE() -> str:\n",
|
||||||
" return \"GPL\"\n",
|
" return \"GPL\"\n",
|
||||||
"\n",
|
"\n",
|
||||||
|
"\n",
|
||||||
"b = BPF()"
|
"b = BPF()"
|
||||||
]
|
]
|
||||||
},
|
},
|
||||||
@ -357,7 +359,6 @@
|
|||||||
}
|
}
|
||||||
],
|
],
|
||||||
"source": [
|
"source": [
|
||||||
"\n",
|
|
||||||
"b.load_and_attach()\n",
|
"b.load_and_attach()\n",
|
||||||
"hist = BpfMap(b, hist)\n",
|
"hist = BpfMap(b, hist)\n",
|
||||||
"print(\"Recording\")\n",
|
"print(\"Recording\")\n",
|
||||||
|
|||||||
@ -8,12 +8,14 @@ def hello_world(ctx: c_void_p) -> c_int64:
|
|||||||
print("Hello, World!")
|
print("Hello, World!")
|
||||||
return c_int64(0)
|
return c_int64(0)
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
@bpf
|
||||||
@section("kprobe/do_unlinkat")
|
@section("kprobe/do_unlinkat")
|
||||||
def hello_world2(ctx: c_void_p) -> c_int64:
|
def hello_world2(ctx: c_void_p) -> c_int64:
|
||||||
print("Hello, World!")
|
print("Hello, World!")
|
||||||
return c_int64(0)
|
return c_int64(0)
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
@bpf
|
||||||
@bpfglobal
|
@bpfglobal
|
||||||
def LICENSE() -> str:
|
def LICENSE() -> str:
|
||||||
|
|||||||
@ -27,7 +27,7 @@ def hello(ctx: c_void_p) -> c_int32:
|
|||||||
dataobj.pid = pid()
|
dataobj.pid = pid()
|
||||||
dataobj.ts = ktime()
|
dataobj.ts = ktime()
|
||||||
# dataobj.comm = strobj
|
# dataobj.comm = strobj
|
||||||
print(f"clone called at {dataobj.ts} by pid" f"{dataobj.pid}, comm {strobj}")
|
print(f"clone called at {dataobj.ts} by pid{dataobj.pid}, comm {strobj}")
|
||||||
events.output(dataobj)
|
events.output(dataobj)
|
||||||
return c_int32(0)
|
return c_int32(0)
|
||||||
|
|
||||||
|
|||||||
248446
examples/vmlinux.py
248446
examples/vmlinux.py
File diff suppressed because it is too large
Load Diff
@ -1,8 +1,8 @@
|
|||||||
from pythonbpf import bpf, map, section, bpfglobal, compile
|
from pythonbpf import bpf, map, section, bpfglobal, compile, compile_to_ir
|
||||||
from pythonbpf.helper import XDP_PASS
|
from pythonbpf.helper import XDP_PASS
|
||||||
from pythonbpf.maps import HashMap
|
from pythonbpf.maps import HashMap
|
||||||
|
from ctypes import c_int64, c_void_p
|
||||||
|
|
||||||
from ctypes import c_void_p, c_int64
|
|
||||||
|
|
||||||
# Instructions to how to run this program
|
# Instructions to how to run this program
|
||||||
# 1. Install PythonBPF: pip install pythonbpf
|
# 1. Install PythonBPF: pip install pythonbpf
|
||||||
@ -41,4 +41,5 @@ def LICENSE() -> str:
|
|||||||
return "GPL"
|
return "GPL"
|
||||||
|
|
||||||
|
|
||||||
|
compile_to_ir("xdp_pass.py", "xdp_pass.ll")
|
||||||
compile()
|
compile()
|
||||||
|
|||||||
@ -1,191 +0,0 @@
|
|||||||
import ast
|
|
||||||
import logging
|
|
||||||
|
|
||||||
from llvmlite import ir
|
|
||||||
from dataclasses import dataclass
|
|
||||||
from typing import Any
|
|
||||||
from pythonbpf.helper import HelperHandlerRegistry
|
|
||||||
from pythonbpf.type_deducer import ctypes_to_ir
|
|
||||||
|
|
||||||
logger = logging.getLogger(__name__)
|
|
||||||
|
|
||||||
|
|
||||||
@dataclass
|
|
||||||
class LocalSymbol:
|
|
||||||
var: ir.AllocaInstr
|
|
||||||
ir_type: ir.Type
|
|
||||||
metadata: Any = None
|
|
||||||
|
|
||||||
def __iter__(self):
|
|
||||||
yield self.var
|
|
||||||
yield self.ir_type
|
|
||||||
yield self.metadata
|
|
||||||
|
|
||||||
|
|
||||||
def _is_helper_call(call_node):
|
|
||||||
"""Check if a call node is a BPF helper function call."""
|
|
||||||
if isinstance(call_node.func, ast.Name):
|
|
||||||
# Exclude print from requiring temps (handles f-strings differently)
|
|
||||||
func_name = call_node.func.id
|
|
||||||
return HelperHandlerRegistry.has_handler(func_name) and func_name != "print"
|
|
||||||
|
|
||||||
elif isinstance(call_node.func, ast.Attribute):
|
|
||||||
return HelperHandlerRegistry.has_handler(call_node.func.attr)
|
|
||||||
|
|
||||||
return False
|
|
||||||
|
|
||||||
|
|
||||||
def handle_assign_allocation(builder, stmt, local_sym_tab, structs_sym_tab):
|
|
||||||
"""Handle memory allocation for assignment statements."""
|
|
||||||
|
|
||||||
# Validate assignment
|
|
||||||
if len(stmt.targets) != 1:
|
|
||||||
logger.warning("Multi-target assignment not supported, skipping allocation")
|
|
||||||
return
|
|
||||||
|
|
||||||
target = stmt.targets[0]
|
|
||||||
|
|
||||||
# Skip non-name targets (e.g., struct field assignments)
|
|
||||||
if isinstance(target, ast.Attribute):
|
|
||||||
logger.debug(f"Struct field assignment to {target.attr}, no allocation needed")
|
|
||||||
return
|
|
||||||
|
|
||||||
if not isinstance(target, ast.Name):
|
|
||||||
logger.warning(f"Unsupported assignment target type: {type(target).__name__}")
|
|
||||||
return
|
|
||||||
|
|
||||||
var_name = target.id
|
|
||||||
rval = stmt.value
|
|
||||||
|
|
||||||
# Skip if already allocated
|
|
||||||
if var_name in local_sym_tab:
|
|
||||||
logger.debug(f"Variable {var_name} already allocated, skipping")
|
|
||||||
return
|
|
||||||
|
|
||||||
# Determine type and allocate based on rval
|
|
||||||
if isinstance(rval, ast.Call):
|
|
||||||
_allocate_for_call(builder, var_name, rval, local_sym_tab, structs_sym_tab)
|
|
||||||
elif isinstance(rval, ast.Constant):
|
|
||||||
_allocate_for_constant(builder, var_name, rval, local_sym_tab)
|
|
||||||
elif isinstance(rval, ast.BinOp):
|
|
||||||
_allocate_for_binop(builder, var_name, local_sym_tab)
|
|
||||||
else:
|
|
||||||
logger.warning(
|
|
||||||
f"Unsupported assignment value type for {var_name}: {type(rval).__name__}"
|
|
||||||
)
|
|
||||||
|
|
||||||
|
|
||||||
def _allocate_for_call(builder, var_name, rval, local_sym_tab, structs_sym_tab):
|
|
||||||
"""Allocate memory for variable assigned from a call."""
|
|
||||||
|
|
||||||
if isinstance(rval.func, ast.Name):
|
|
||||||
call_type = rval.func.id
|
|
||||||
|
|
||||||
# C type constructors
|
|
||||||
if call_type in ("c_int32", "c_int64", "c_uint32", "c_uint64"):
|
|
||||||
ir_type = ctypes_to_ir(call_type)
|
|
||||||
var = builder.alloca(ir_type, name=var_name)
|
|
||||||
var.align = ir_type.width // 8
|
|
||||||
local_sym_tab[var_name] = LocalSymbol(var, ir_type)
|
|
||||||
logger.info(f"Pre-allocated {var_name} as {call_type}")
|
|
||||||
|
|
||||||
# Helper functions
|
|
||||||
elif HelperHandlerRegistry.has_handler(call_type):
|
|
||||||
ir_type = ir.IntType(64) # Assume i64 return type
|
|
||||||
var = builder.alloca(ir_type, name=var_name)
|
|
||||||
var.align = 8
|
|
||||||
local_sym_tab[var_name] = LocalSymbol(var, ir_type)
|
|
||||||
logger.info(f"Pre-allocated {var_name} for helper {call_type}")
|
|
||||||
|
|
||||||
# Deref function
|
|
||||||
elif call_type == "deref":
|
|
||||||
ir_type = ir.IntType(64) # Assume i64 return type
|
|
||||||
var = builder.alloca(ir_type, name=var_name)
|
|
||||||
var.align = 8
|
|
||||||
local_sym_tab[var_name] = LocalSymbol(var, ir_type)
|
|
||||||
logger.info(f"Pre-allocated {var_name} for deref")
|
|
||||||
|
|
||||||
# Struct constructors
|
|
||||||
elif call_type in structs_sym_tab:
|
|
||||||
struct_info = structs_sym_tab[call_type]
|
|
||||||
var = builder.alloca(struct_info.ir_type, name=var_name)
|
|
||||||
local_sym_tab[var_name] = LocalSymbol(var, struct_info.ir_type, call_type)
|
|
||||||
logger.info(f"Pre-allocated {var_name} for struct {call_type}")
|
|
||||||
|
|
||||||
else:
|
|
||||||
logger.warning(f"Unknown call type for allocation: {call_type}")
|
|
||||||
|
|
||||||
elif isinstance(rval.func, ast.Attribute):
|
|
||||||
# Map method calls - need double allocation for ptr handling
|
|
||||||
_allocate_for_map_method(builder, var_name, local_sym_tab)
|
|
||||||
|
|
||||||
else:
|
|
||||||
logger.warning(f"Unsupported call function type for {var_name}")
|
|
||||||
|
|
||||||
|
|
||||||
def _allocate_for_map_method(builder, var_name, local_sym_tab):
|
|
||||||
"""Allocate memory for variable assigned from map method (double alloc)."""
|
|
||||||
|
|
||||||
# Main variable (pointer to pointer)
|
|
||||||
ir_type = ir.PointerType(ir.IntType(64))
|
|
||||||
var = builder.alloca(ir_type, name=var_name)
|
|
||||||
local_sym_tab[var_name] = LocalSymbol(var, ir_type)
|
|
||||||
|
|
||||||
# Temporary variable for computed values
|
|
||||||
tmp_ir_type = ir.IntType(64)
|
|
||||||
var_tmp = builder.alloca(tmp_ir_type, name=f"{var_name}_tmp")
|
|
||||||
local_sym_tab[f"{var_name}_tmp"] = LocalSymbol(var_tmp, tmp_ir_type)
|
|
||||||
|
|
||||||
logger.info(f"Pre-allocated {var_name} and {var_name}_tmp for map method")
|
|
||||||
|
|
||||||
|
|
||||||
def _allocate_for_constant(builder, var_name, rval, local_sym_tab):
|
|
||||||
"""Allocate memory for variable assigned from a constant."""
|
|
||||||
|
|
||||||
if isinstance(rval.value, bool):
|
|
||||||
ir_type = ir.IntType(1)
|
|
||||||
var = builder.alloca(ir_type, name=var_name)
|
|
||||||
var.align = 1
|
|
||||||
local_sym_tab[var_name] = LocalSymbol(var, ir_type)
|
|
||||||
logger.info(f"Pre-allocated {var_name} as bool")
|
|
||||||
|
|
||||||
elif isinstance(rval.value, int):
|
|
||||||
ir_type = ir.IntType(64)
|
|
||||||
var = builder.alloca(ir_type, name=var_name)
|
|
||||||
var.align = 8
|
|
||||||
local_sym_tab[var_name] = LocalSymbol(var, ir_type)
|
|
||||||
logger.info(f"Pre-allocated {var_name} as i64")
|
|
||||||
|
|
||||||
elif isinstance(rval.value, str):
|
|
||||||
ir_type = ir.PointerType(ir.IntType(8))
|
|
||||||
var = builder.alloca(ir_type, name=var_name)
|
|
||||||
var.align = 8
|
|
||||||
local_sym_tab[var_name] = LocalSymbol(var, ir_type)
|
|
||||||
logger.info(f"Pre-allocated {var_name} as string")
|
|
||||||
|
|
||||||
else:
|
|
||||||
logger.warning(
|
|
||||||
f"Unsupported constant type for {var_name}: {type(rval.value).__name__}"
|
|
||||||
)
|
|
||||||
|
|
||||||
|
|
||||||
def _allocate_for_binop(builder, var_name, local_sym_tab):
|
|
||||||
"""Allocate memory for variable assigned from a binary operation."""
|
|
||||||
ir_type = ir.IntType(64) # Assume i64 result
|
|
||||||
var = builder.alloca(ir_type, name=var_name)
|
|
||||||
var.align = 8
|
|
||||||
local_sym_tab[var_name] = LocalSymbol(var, ir_type)
|
|
||||||
logger.info(f"Pre-allocated {var_name} for binop result")
|
|
||||||
|
|
||||||
|
|
||||||
def allocate_temp_pool(builder, max_temps, local_sym_tab):
|
|
||||||
"""Allocate the temporary scratch space pool for helper arguments."""
|
|
||||||
if max_temps == 0:
|
|
||||||
return
|
|
||||||
|
|
||||||
logger.info(f"Allocating temp pool of {max_temps} variables")
|
|
||||||
for i in range(max_temps):
|
|
||||||
temp_name = f"__helper_temp_{i}"
|
|
||||||
temp_var = builder.alloca(ir.IntType(64), name=temp_name)
|
|
||||||
temp_var.align = 8
|
|
||||||
local_sym_tab[temp_name] = LocalSymbol(temp_var, ir.IntType(64))
|
|
||||||
@ -1,108 +0,0 @@
|
|||||||
import ast
|
|
||||||
import logging
|
|
||||||
from llvmlite import ir
|
|
||||||
from pythonbpf.expr import eval_expr
|
|
||||||
|
|
||||||
logger = logging.getLogger(__name__)
|
|
||||||
|
|
||||||
|
|
||||||
def handle_struct_field_assignment(
|
|
||||||
func, module, builder, target, rval, local_sym_tab, map_sym_tab, structs_sym_tab
|
|
||||||
):
|
|
||||||
"""Handle struct field assignment (obj.field = value)."""
|
|
||||||
|
|
||||||
var_name = target.value.id
|
|
||||||
field_name = target.attr
|
|
||||||
|
|
||||||
if var_name not in local_sym_tab:
|
|
||||||
logger.error(f"Variable '{var_name}' not found in symbol table")
|
|
||||||
return
|
|
||||||
|
|
||||||
struct_type = local_sym_tab[var_name].metadata
|
|
||||||
struct_info = structs_sym_tab[struct_type]
|
|
||||||
|
|
||||||
if field_name not in struct_info.fields:
|
|
||||||
logger.error(f"Field '{field_name}' not found in struct '{struct_type}'")
|
|
||||||
return
|
|
||||||
|
|
||||||
# Get field pointer and evaluate value
|
|
||||||
field_ptr = struct_info.gep(builder, local_sym_tab[var_name].var, field_name)
|
|
||||||
val = eval_expr(
|
|
||||||
func, module, builder, rval, local_sym_tab, map_sym_tab, structs_sym_tab
|
|
||||||
)
|
|
||||||
|
|
||||||
if val is None:
|
|
||||||
logger.error(f"Failed to evaluate value for {var_name}.{field_name}")
|
|
||||||
return
|
|
||||||
|
|
||||||
# TODO: Handle string assignment to char array (not a priority)
|
|
||||||
field_type = struct_info.field_type(field_name)
|
|
||||||
if isinstance(field_type, ir.ArrayType) and val[1] == ir.PointerType(ir.IntType(8)):
|
|
||||||
logger.warning(
|
|
||||||
f"String to char array assignment not implemented for {var_name}.{field_name}"
|
|
||||||
)
|
|
||||||
return
|
|
||||||
|
|
||||||
# Store the value
|
|
||||||
builder.store(val[0], field_ptr)
|
|
||||||
logger.info(f"Assigned to struct field {var_name}.{field_name}")
|
|
||||||
|
|
||||||
|
|
||||||
def handle_variable_assignment(
|
|
||||||
func, module, builder, var_name, rval, local_sym_tab, map_sym_tab, structs_sym_tab
|
|
||||||
):
|
|
||||||
"""Handle single named variable assignment."""
|
|
||||||
|
|
||||||
if var_name not in local_sym_tab:
|
|
||||||
logger.error(f"Variable {var_name} not declared.")
|
|
||||||
return False
|
|
||||||
|
|
||||||
var_ptr = local_sym_tab[var_name].var
|
|
||||||
var_type = local_sym_tab[var_name].ir_type
|
|
||||||
|
|
||||||
# NOTE: Special case for struct initialization
|
|
||||||
if isinstance(rval, ast.Call) and isinstance(rval.func, ast.Name):
|
|
||||||
struct_name = rval.func.id
|
|
||||||
if struct_name in structs_sym_tab and len(rval.args) == 0:
|
|
||||||
struct_info = structs_sym_tab[struct_name]
|
|
||||||
ir_struct = struct_info.ir_type
|
|
||||||
|
|
||||||
builder.store(ir.Constant(ir_struct, None), var_ptr)
|
|
||||||
logger.info(f"Initialized struct {struct_name} for variable {var_name}")
|
|
||||||
return True
|
|
||||||
|
|
||||||
val_result = eval_expr(
|
|
||||||
func, module, builder, rval, local_sym_tab, map_sym_tab, structs_sym_tab
|
|
||||||
)
|
|
||||||
if val_result is None:
|
|
||||||
logger.error(f"Failed to evaluate value for {var_name}")
|
|
||||||
return False
|
|
||||||
|
|
||||||
val, val_type = val_result
|
|
||||||
logger.info(f"Evaluated value for {var_name}: {val} of type {val_type}, {var_type}")
|
|
||||||
if val_type != var_type:
|
|
||||||
if isinstance(val_type, ir.IntType) and isinstance(var_type, ir.IntType):
|
|
||||||
# Allow implicit int widening
|
|
||||||
if val_type.width < var_type.width:
|
|
||||||
val = builder.sext(val, var_type)
|
|
||||||
logger.info(f"Implicitly widened int for variable {var_name}")
|
|
||||||
elif val_type.width > var_type.width:
|
|
||||||
val = builder.trunc(val, var_type)
|
|
||||||
logger.info(f"Implicitly truncated int for variable {var_name}")
|
|
||||||
elif isinstance(val_type, ir.IntType) and isinstance(var_type, ir.PointerType):
|
|
||||||
# NOTE: This is assignment to a PTR_TO_MAP_VALUE_OR_NULL
|
|
||||||
logger.info(
|
|
||||||
f"Creating temporary variable for pointer assignment to {var_name}"
|
|
||||||
)
|
|
||||||
var_ptr_tmp = local_sym_tab[f"{var_name}_tmp"].var
|
|
||||||
builder.store(val, var_ptr_tmp)
|
|
||||||
val = var_ptr_tmp
|
|
||||||
else:
|
|
||||||
logger.error(
|
|
||||||
f"Type mismatch for variable {var_name}: {val_type} vs {var_type}"
|
|
||||||
)
|
|
||||||
return False
|
|
||||||
|
|
||||||
builder.store(val, var_ptr)
|
|
||||||
logger.info(f"Assigned value to variable {var_name}")
|
|
||||||
return True
|
|
||||||
@ -3,70 +3,43 @@ from llvmlite import ir
|
|||||||
from logging import Logger
|
from logging import Logger
|
||||||
import logging
|
import logging
|
||||||
|
|
||||||
from pythonbpf.expr import get_base_type_and_depth, deref_to_depth, eval_expr
|
|
||||||
|
|
||||||
logger: Logger = logging.getLogger(__name__)
|
logger: Logger = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
|
||||||
def get_operand_value(
|
def recursive_dereferencer(var, builder):
|
||||||
func, module, operand, builder, local_sym_tab, map_sym_tab, structs_sym_tab=None
|
"""dereference until primitive type comes out"""
|
||||||
):
|
# TODO: Not worrying about stack overflow for now
|
||||||
|
logger.info(f"Dereferencing {var}, type is {var.type}")
|
||||||
|
if isinstance(var.type, ir.PointerType):
|
||||||
|
a = builder.load(var)
|
||||||
|
return recursive_dereferencer(a, builder)
|
||||||
|
elif isinstance(var.type, ir.IntType):
|
||||||
|
return var
|
||||||
|
else:
|
||||||
|
raise TypeError(f"Unsupported type for dereferencing: {var.type}")
|
||||||
|
|
||||||
|
|
||||||
|
def get_operand_value(operand, builder, local_sym_tab):
|
||||||
"""Extract the value from an operand, handling variables and constants."""
|
"""Extract the value from an operand, handling variables and constants."""
|
||||||
logger.info(f"Getting operand value for: {ast.dump(operand)}")
|
|
||||||
if isinstance(operand, ast.Name):
|
if isinstance(operand, ast.Name):
|
||||||
if operand.id in local_sym_tab:
|
if operand.id in local_sym_tab:
|
||||||
var = local_sym_tab[operand.id].var
|
return recursive_dereferencer(local_sym_tab[operand.id].var, builder)
|
||||||
var_type = var.type
|
|
||||||
base_type, depth = get_base_type_and_depth(var_type)
|
|
||||||
logger.info(f"var is {var}, base_type is {base_type}, depth is {depth}")
|
|
||||||
val = deref_to_depth(func, builder, var, depth)
|
|
||||||
return val
|
|
||||||
raise ValueError(f"Undefined variable: {operand.id}")
|
raise ValueError(f"Undefined variable: {operand.id}")
|
||||||
elif isinstance(operand, ast.Constant):
|
elif isinstance(operand, ast.Constant):
|
||||||
if isinstance(operand.value, int):
|
if isinstance(operand.value, int):
|
||||||
cst = ir.Constant(ir.IntType(64), int(operand.value))
|
return ir.Constant(ir.IntType(64), operand.value)
|
||||||
return cst
|
|
||||||
raise TypeError(f"Unsupported constant type: {type(operand.value)}")
|
raise TypeError(f"Unsupported constant type: {type(operand.value)}")
|
||||||
elif isinstance(operand, ast.BinOp):
|
elif isinstance(operand, ast.BinOp):
|
||||||
res = handle_binary_op_impl(
|
return handle_binary_op_impl(operand, builder, local_sym_tab)
|
||||||
func, module, operand, builder, local_sym_tab, map_sym_tab, structs_sym_tab
|
|
||||||
)
|
|
||||||
return res
|
|
||||||
else:
|
|
||||||
res = eval_expr(
|
|
||||||
func, module, builder, operand, local_sym_tab, map_sym_tab, structs_sym_tab
|
|
||||||
)
|
|
||||||
if res is None:
|
|
||||||
raise ValueError(f"Failed to evaluate call expression: {operand}")
|
|
||||||
val, _ = res
|
|
||||||
logger.info(f"Evaluated expr to {val} of type {val.type}")
|
|
||||||
base_type, depth = get_base_type_and_depth(val.type)
|
|
||||||
if depth > 0:
|
|
||||||
val = deref_to_depth(func, builder, val, depth)
|
|
||||||
return val
|
|
||||||
raise TypeError(f"Unsupported operand type: {type(operand)}")
|
raise TypeError(f"Unsupported operand type: {type(operand)}")
|
||||||
|
|
||||||
|
|
||||||
def handle_binary_op_impl(
|
def handle_binary_op_impl(rval, builder, local_sym_tab):
|
||||||
func, module, rval, builder, local_sym_tab, map_sym_tab, structs_sym_tab=None
|
|
||||||
):
|
|
||||||
op = rval.op
|
op = rval.op
|
||||||
left = get_operand_value(
|
left = get_operand_value(rval.left, builder, local_sym_tab)
|
||||||
func, module, rval.left, builder, local_sym_tab, map_sym_tab, structs_sym_tab
|
right = get_operand_value(rval.right, builder, local_sym_tab)
|
||||||
)
|
|
||||||
right = get_operand_value(
|
|
||||||
func, module, rval.right, builder, local_sym_tab, map_sym_tab, structs_sym_tab
|
|
||||||
)
|
|
||||||
logger.info(f"left is {left}, right is {right}, op is {op}")
|
logger.info(f"left is {left}, right is {right}, op is {op}")
|
||||||
|
|
||||||
# NOTE: Before doing the operation, if the operands are integers
|
|
||||||
# we always extend them to i64. The assignment to LHS will take
|
|
||||||
# care of truncation if needed.
|
|
||||||
if isinstance(left.type, ir.IntType) and left.type.width < 64:
|
|
||||||
left = builder.sext(left, ir.IntType(64))
|
|
||||||
if isinstance(right.type, ir.IntType) and right.type.width < 64:
|
|
||||||
right = builder.sext(right, ir.IntType(64))
|
|
||||||
|
|
||||||
# Map AST operation nodes to LLVM IR builder methods
|
# Map AST operation nodes to LLVM IR builder methods
|
||||||
op_map = {
|
op_map = {
|
||||||
ast.Add: builder.add,
|
ast.Add: builder.add,
|
||||||
@ -89,19 +62,8 @@ def handle_binary_op_impl(
|
|||||||
raise SyntaxError("Unsupported binary operation")
|
raise SyntaxError("Unsupported binary operation")
|
||||||
|
|
||||||
|
|
||||||
def handle_binary_op(
|
def handle_binary_op(rval, builder, var_name, local_sym_tab):
|
||||||
func,
|
result = handle_binary_op_impl(rval, builder, local_sym_tab)
|
||||||
module,
|
|
||||||
rval,
|
|
||||||
builder,
|
|
||||||
var_name,
|
|
||||||
local_sym_tab,
|
|
||||||
map_sym_tab,
|
|
||||||
structs_sym_tab=None,
|
|
||||||
):
|
|
||||||
result = handle_binary_op_impl(
|
|
||||||
func, module, rval, builder, local_sym_tab, map_sym_tab, structs_sym_tab
|
|
||||||
)
|
|
||||||
if var_name and var_name in local_sym_tab:
|
if var_name and var_name in local_sym_tab:
|
||||||
logger.info(
|
logger.info(
|
||||||
f"Storing result {result} into variable {local_sym_tab[var_name].var}"
|
f"Storing result {result} into variable {local_sym_tab[var_name].var}"
|
||||||
|
|||||||
@ -4,6 +4,7 @@ from .license_pass import license_processing
|
|||||||
from .functions import func_proc
|
from .functions import func_proc
|
||||||
from .maps import maps_proc
|
from .maps import maps_proc
|
||||||
from .structs import structs_proc
|
from .structs import structs_proc
|
||||||
|
from .vmlinux_parser import vmlinux_proc
|
||||||
from .globals_pass import (
|
from .globals_pass import (
|
||||||
globals_list_creation,
|
globals_list_creation,
|
||||||
globals_processing,
|
globals_processing,
|
||||||
@ -44,6 +45,7 @@ def processor(source_code, filename, module):
|
|||||||
for func_node in bpf_chunks:
|
for func_node in bpf_chunks:
|
||||||
logger.info(f"Found BPF function/struct: {func_node.name}")
|
logger.info(f"Found BPF function/struct: {func_node.name}")
|
||||||
|
|
||||||
|
vmlinux_proc(tree, module)
|
||||||
populate_global_symbol_table(tree, module)
|
populate_global_symbol_table(tree, module)
|
||||||
license_processing(tree, module)
|
license_processing(tree, module)
|
||||||
globals_processing(tree, module)
|
globals_processing(tree, module)
|
||||||
|
|||||||
@ -1,10 +1,4 @@
|
|||||||
from .expr_pass import eval_expr, handle_expr
|
from .expr_pass import eval_expr, handle_expr
|
||||||
from .type_normalization import convert_to_bool, get_base_type_and_depth, deref_to_depth
|
from .type_normalization import convert_to_bool
|
||||||
|
|
||||||
__all__ = [
|
__all__ = ["eval_expr", "handle_expr", "convert_to_bool"]
|
||||||
"eval_expr",
|
|
||||||
"handle_expr",
|
|
||||||
"convert_to_bool",
|
|
||||||
"get_base_type_and_depth",
|
|
||||||
"deref_to_depth",
|
|
||||||
]
|
|
||||||
|
|||||||
@ -26,7 +26,7 @@ def _handle_constant_expr(expr: ast.Constant):
|
|||||||
if isinstance(expr.value, int) or isinstance(expr.value, bool):
|
if isinstance(expr.value, int) or isinstance(expr.value, bool):
|
||||||
return ir.Constant(ir.IntType(64), int(expr.value)), ir.IntType(64)
|
return ir.Constant(ir.IntType(64), int(expr.value)), ir.IntType(64)
|
||||||
else:
|
else:
|
||||||
logger.error(f"Unsupported constant type {ast.dump(expr)}")
|
logger.error("Unsupported constant type")
|
||||||
return None
|
return None
|
||||||
|
|
||||||
|
|
||||||
@ -176,28 +176,21 @@ def _handle_unary_op(
|
|||||||
structs_sym_tab=None,
|
structs_sym_tab=None,
|
||||||
):
|
):
|
||||||
"""Handle ast.UnaryOp expressions."""
|
"""Handle ast.UnaryOp expressions."""
|
||||||
if not isinstance(expr.op, ast.Not) and not isinstance(expr.op, ast.USub):
|
if not isinstance(expr.op, ast.Not):
|
||||||
logger.error("Only 'not' and '-' unary operators are supported")
|
logger.error("Only 'not' unary operator is supported")
|
||||||
return None
|
return None
|
||||||
|
|
||||||
from pythonbpf.binary_ops import get_operand_value
|
operand = eval_expr(
|
||||||
|
func, module, builder, expr.operand, local_sym_tab, map_sym_tab, structs_sym_tab
|
||||||
operand = get_operand_value(
|
|
||||||
func, module, expr.operand, builder, local_sym_tab, map_sym_tab, structs_sym_tab
|
|
||||||
)
|
)
|
||||||
if operand is None:
|
if operand is None:
|
||||||
logger.error("Failed to evaluate operand for unary operation")
|
logger.error("Failed to evaluate operand for unary operation")
|
||||||
return None
|
return None
|
||||||
|
|
||||||
if isinstance(expr.op, ast.Not):
|
operand_val, operand_type = operand
|
||||||
true_const = ir.Constant(ir.IntType(1), 1)
|
true_const = ir.Constant(ir.IntType(1), 1)
|
||||||
result = builder.xor(convert_to_bool(builder, operand), true_const)
|
result = builder.xor(convert_to_bool(builder, operand_val), true_const)
|
||||||
return result, ir.IntType(1)
|
return result, ir.IntType(1)
|
||||||
elif isinstance(expr.op, ast.USub):
|
|
||||||
# Multiply by -1
|
|
||||||
neg_one = ir.Constant(ir.IntType(64), -1)
|
|
||||||
result = builder.mul(operand, neg_one)
|
|
||||||
return result, ir.IntType(64)
|
|
||||||
|
|
||||||
|
|
||||||
def _handle_and_op(func, builder, expr, local_sym_tab, map_sym_tab, structs_sym_tab):
|
def _handle_and_op(func, builder, expr, local_sym_tab, map_sym_tab, structs_sym_tab):
|
||||||
@ -409,16 +402,7 @@ def eval_expr(
|
|||||||
elif isinstance(expr, ast.BinOp):
|
elif isinstance(expr, ast.BinOp):
|
||||||
from pythonbpf.binary_ops import handle_binary_op
|
from pythonbpf.binary_ops import handle_binary_op
|
||||||
|
|
||||||
return handle_binary_op(
|
return handle_binary_op(expr, builder, None, local_sym_tab)
|
||||||
func,
|
|
||||||
module,
|
|
||||||
expr,
|
|
||||||
builder,
|
|
||||||
None,
|
|
||||||
local_sym_tab,
|
|
||||||
map_sym_tab,
|
|
||||||
structs_sym_tab,
|
|
||||||
)
|
|
||||||
elif isinstance(expr, ast.Compare):
|
elif isinstance(expr, ast.Compare):
|
||||||
return _handle_compare(
|
return _handle_compare(
|
||||||
func, module, builder, expr, local_sym_tab, map_sym_tab, structs_sym_tab
|
func, module, builder, expr, local_sym_tab, map_sym_tab, structs_sym_tab
|
||||||
|
|||||||
@ -16,7 +16,7 @@ COMPARISON_OPS = {
|
|||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
def get_base_type_and_depth(ir_type):
|
def _get_base_type_and_depth(ir_type):
|
||||||
"""Get the base type for pointer types."""
|
"""Get the base type for pointer types."""
|
||||||
cur_type = ir_type
|
cur_type = ir_type
|
||||||
depth = 0
|
depth = 0
|
||||||
@ -26,7 +26,7 @@ def get_base_type_and_depth(ir_type):
|
|||||||
return cur_type, depth
|
return cur_type, depth
|
||||||
|
|
||||||
|
|
||||||
def deref_to_depth(func, builder, val, target_depth):
|
def _deref_to_depth(func, builder, val, target_depth):
|
||||||
"""Dereference a pointer to a certain depth."""
|
"""Dereference a pointer to a certain depth."""
|
||||||
|
|
||||||
cur_val = val
|
cur_val = val
|
||||||
@ -88,13 +88,13 @@ def _normalize_types(func, builder, lhs, rhs):
|
|||||||
logger.error(f"Type mismatch: {lhs.type} vs {rhs.type}")
|
logger.error(f"Type mismatch: {lhs.type} vs {rhs.type}")
|
||||||
return None, None
|
return None, None
|
||||||
else:
|
else:
|
||||||
lhs_base, lhs_depth = get_base_type_and_depth(lhs.type)
|
lhs_base, lhs_depth = _get_base_type_and_depth(lhs.type)
|
||||||
rhs_base, rhs_depth = get_base_type_and_depth(rhs.type)
|
rhs_base, rhs_depth = _get_base_type_and_depth(rhs.type)
|
||||||
if lhs_base == rhs_base:
|
if lhs_base == rhs_base:
|
||||||
if lhs_depth < rhs_depth:
|
if lhs_depth < rhs_depth:
|
||||||
rhs = deref_to_depth(func, builder, rhs, rhs_depth - lhs_depth)
|
rhs = _deref_to_depth(func, builder, rhs, rhs_depth - lhs_depth)
|
||||||
elif rhs_depth < lhs_depth:
|
elif rhs_depth < lhs_depth:
|
||||||
lhs = deref_to_depth(func, builder, lhs, lhs_depth - rhs_depth)
|
lhs = _deref_to_depth(func, builder, lhs, lhs_depth - rhs_depth)
|
||||||
return _normalize_types(func, builder, lhs, rhs)
|
return _normalize_types(func, builder, lhs, rhs)
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
@ -1,18 +1,13 @@
|
|||||||
from llvmlite import ir
|
from llvmlite import ir
|
||||||
import ast
|
import ast
|
||||||
import logging
|
import logging
|
||||||
|
from typing import Any
|
||||||
|
from dataclasses import dataclass
|
||||||
|
|
||||||
from pythonbpf.helper import (
|
from pythonbpf.helper import HelperHandlerRegistry, handle_helper_call
|
||||||
HelperHandlerRegistry,
|
|
||||||
reset_scratch_pool,
|
|
||||||
)
|
|
||||||
from pythonbpf.type_deducer import ctypes_to_ir
|
from pythonbpf.type_deducer import ctypes_to_ir
|
||||||
|
from pythonbpf.binary_ops import handle_binary_op
|
||||||
from pythonbpf.expr import eval_expr, handle_expr, convert_to_bool
|
from pythonbpf.expr import eval_expr, handle_expr, convert_to_bool
|
||||||
from pythonbpf.assign_pass import (
|
|
||||||
handle_variable_assignment,
|
|
||||||
handle_struct_field_assignment,
|
|
||||||
)
|
|
||||||
from pythonbpf.allocation_pass import handle_assign_allocation, allocate_temp_pool
|
|
||||||
|
|
||||||
from .return_utils import _handle_none_return, _handle_xdp_return, _is_xdp_name
|
from .return_utils import _handle_none_return, _handle_xdp_return, _is_xdp_name
|
||||||
|
|
||||||
@ -20,6 +15,18 @@ from .return_utils import _handle_none_return, _handle_xdp_return, _is_xdp_name
|
|||||||
logger = logging.getLogger(__name__)
|
logger = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class LocalSymbol:
|
||||||
|
var: ir.AllocaInstr
|
||||||
|
ir_type: ir.Type
|
||||||
|
metadata: Any = None
|
||||||
|
|
||||||
|
def __iter__(self):
|
||||||
|
yield self.var
|
||||||
|
yield self.ir_type
|
||||||
|
yield self.metadata
|
||||||
|
|
||||||
|
|
||||||
def get_probe_string(func_node):
|
def get_probe_string(func_node):
|
||||||
"""Extract the probe string from the decorator of the function node."""
|
"""Extract the probe string from the decorator of the function node."""
|
||||||
# TODO: right now we have the whole string in the section decorator
|
# TODO: right now we have the whole string in the section decorator
|
||||||
@ -41,49 +48,196 @@ def handle_assign(
|
|||||||
func, module, builder, stmt, map_sym_tab, local_sym_tab, structs_sym_tab
|
func, module, builder, stmt, map_sym_tab, local_sym_tab, structs_sym_tab
|
||||||
):
|
):
|
||||||
"""Handle assignment statements in the function body."""
|
"""Handle assignment statements in the function body."""
|
||||||
|
|
||||||
# TODO: Support this later
|
|
||||||
# GH #37
|
|
||||||
if len(stmt.targets) != 1:
|
if len(stmt.targets) != 1:
|
||||||
logger.error("Multi-target assignment is not supported for now")
|
logger.info("Unsupported multiassignment")
|
||||||
return
|
return
|
||||||
|
|
||||||
|
num_types = ("c_int32", "c_int64", "c_uint32", "c_uint64")
|
||||||
|
|
||||||
target = stmt.targets[0]
|
target = stmt.targets[0]
|
||||||
|
logger.info(f"Handling assignment to {ast.dump(target)}")
|
||||||
|
if not isinstance(target, ast.Name) and not isinstance(target, ast.Attribute):
|
||||||
|
logger.info("Unsupported assignment target")
|
||||||
|
return
|
||||||
|
var_name = target.id if isinstance(target, ast.Name) else target.value.id
|
||||||
rval = stmt.value
|
rval = stmt.value
|
||||||
|
|
||||||
if isinstance(target, ast.Name):
|
|
||||||
# NOTE: Simple variable assignment case: x = 5
|
|
||||||
var_name = target.id
|
|
||||||
result = handle_variable_assignment(
|
|
||||||
func,
|
|
||||||
module,
|
|
||||||
builder,
|
|
||||||
var_name,
|
|
||||||
rval,
|
|
||||||
local_sym_tab,
|
|
||||||
map_sym_tab,
|
|
||||||
structs_sym_tab,
|
|
||||||
)
|
|
||||||
if not result:
|
|
||||||
logger.error(f"Failed to handle assignment to {var_name}")
|
|
||||||
return
|
|
||||||
|
|
||||||
if isinstance(target, ast.Attribute):
|
if isinstance(target, ast.Attribute):
|
||||||
# NOTE: Struct field assignment case: pkt.field = value
|
# struct field assignment
|
||||||
handle_struct_field_assignment(
|
field_name = target.attr
|
||||||
func,
|
if var_name in local_sym_tab:
|
||||||
module,
|
struct_type = local_sym_tab[var_name].metadata
|
||||||
builder,
|
struct_info = structs_sym_tab[struct_type]
|
||||||
target,
|
if field_name in struct_info.fields:
|
||||||
rval,
|
field_ptr = struct_info.gep(
|
||||||
local_sym_tab,
|
builder, local_sym_tab[var_name].var, field_name
|
||||||
map_sym_tab,
|
)
|
||||||
structs_sym_tab,
|
val = eval_expr(
|
||||||
)
|
func,
|
||||||
return
|
module,
|
||||||
|
builder,
|
||||||
# Unsupported target type
|
rval,
|
||||||
logger.error(f"Unsupported assignment target: {ast.dump(target)}")
|
local_sym_tab,
|
||||||
|
map_sym_tab,
|
||||||
|
structs_sym_tab,
|
||||||
|
)
|
||||||
|
if isinstance(struct_info.field_type(field_name), ir.ArrayType) and val[
|
||||||
|
1
|
||||||
|
] == ir.PointerType(ir.IntType(8)):
|
||||||
|
# TODO: Figure it out, not a priority rn
|
||||||
|
# Special case for string assignment to char array
|
||||||
|
# str_len = struct_info["field_types"][field_idx].count
|
||||||
|
# assign_string_to_array(builder, field_ptr, val[0], str_len)
|
||||||
|
# print(f"Assigned to struct field {var_name}.{field_name}")
|
||||||
|
pass
|
||||||
|
if val is None:
|
||||||
|
logger.info("Failed to evaluate struct field assignment")
|
||||||
|
return
|
||||||
|
logger.info(field_ptr)
|
||||||
|
builder.store(val[0], field_ptr)
|
||||||
|
logger.info(f"Assigned to struct field {var_name}.{field_name}")
|
||||||
|
return
|
||||||
|
elif isinstance(rval, ast.Constant):
|
||||||
|
if isinstance(rval.value, bool):
|
||||||
|
if rval.value:
|
||||||
|
builder.store(
|
||||||
|
ir.Constant(ir.IntType(1), 1), local_sym_tab[var_name].var
|
||||||
|
)
|
||||||
|
else:
|
||||||
|
builder.store(
|
||||||
|
ir.Constant(ir.IntType(1), 0), local_sym_tab[var_name].var
|
||||||
|
)
|
||||||
|
logger.info(f"Assigned constant {rval.value} to {var_name}")
|
||||||
|
elif isinstance(rval.value, int):
|
||||||
|
# Assume c_int64 for now
|
||||||
|
# var = builder.alloca(ir.IntType(64), name=var_name)
|
||||||
|
# var.align = 8
|
||||||
|
builder.store(
|
||||||
|
ir.Constant(ir.IntType(64), rval.value), local_sym_tab[var_name].var
|
||||||
|
)
|
||||||
|
logger.info(f"Assigned constant {rval.value} to {var_name}")
|
||||||
|
elif isinstance(rval.value, str):
|
||||||
|
str_val = rval.value.encode("utf-8") + b"\x00"
|
||||||
|
str_const = ir.Constant(
|
||||||
|
ir.ArrayType(ir.IntType(8), len(str_val)), bytearray(str_val)
|
||||||
|
)
|
||||||
|
global_str = ir.GlobalVariable(
|
||||||
|
module, str_const.type, name=f"{var_name}_str"
|
||||||
|
)
|
||||||
|
global_str.linkage = "internal"
|
||||||
|
global_str.global_constant = True
|
||||||
|
global_str.initializer = str_const
|
||||||
|
str_ptr = builder.bitcast(global_str, ir.PointerType(ir.IntType(8)))
|
||||||
|
builder.store(str_ptr, local_sym_tab[var_name].var)
|
||||||
|
logger.info(f"Assigned string constant '{rval.value}' to {var_name}")
|
||||||
|
else:
|
||||||
|
logger.info("Unsupported constant type")
|
||||||
|
elif isinstance(rval, ast.Call):
|
||||||
|
if isinstance(rval.func, ast.Name):
|
||||||
|
call_type = rval.func.id
|
||||||
|
logger.info(f"Assignment call type: {call_type}")
|
||||||
|
if (
|
||||||
|
call_type in num_types
|
||||||
|
and len(rval.args) == 1
|
||||||
|
and isinstance(rval.args[0], ast.Constant)
|
||||||
|
and isinstance(rval.args[0].value, int)
|
||||||
|
):
|
||||||
|
ir_type = ctypes_to_ir(call_type)
|
||||||
|
# var = builder.alloca(ir_type, name=var_name)
|
||||||
|
# var.align = ir_type.width // 8
|
||||||
|
builder.store(
|
||||||
|
ir.Constant(ir_type, rval.args[0].value),
|
||||||
|
local_sym_tab[var_name].var,
|
||||||
|
)
|
||||||
|
logger.info(
|
||||||
|
f"Assigned {call_type} constant {rval.args[0].value} to {var_name}"
|
||||||
|
)
|
||||||
|
elif HelperHandlerRegistry.has_handler(call_type):
|
||||||
|
# var = builder.alloca(ir.IntType(64), name=var_name)
|
||||||
|
# var.align = 8
|
||||||
|
val = handle_helper_call(
|
||||||
|
rval,
|
||||||
|
module,
|
||||||
|
builder,
|
||||||
|
func,
|
||||||
|
local_sym_tab,
|
||||||
|
map_sym_tab,
|
||||||
|
structs_sym_tab,
|
||||||
|
)
|
||||||
|
builder.store(val[0], local_sym_tab[var_name].var)
|
||||||
|
logger.info(f"Assigned constant {rval.func.id} to {var_name}")
|
||||||
|
elif call_type == "deref" and len(rval.args) == 1:
|
||||||
|
logger.info(f"Handling deref assignment {ast.dump(rval)}")
|
||||||
|
val = eval_expr(
|
||||||
|
func,
|
||||||
|
module,
|
||||||
|
builder,
|
||||||
|
rval,
|
||||||
|
local_sym_tab,
|
||||||
|
map_sym_tab,
|
||||||
|
structs_sym_tab,
|
||||||
|
)
|
||||||
|
if val is None:
|
||||||
|
logger.info("Failed to evaluate deref argument")
|
||||||
|
return
|
||||||
|
logger.info(f"Dereferenced value: {val}, storing in {var_name}")
|
||||||
|
builder.store(val[0], local_sym_tab[var_name].var)
|
||||||
|
logger.info(f"Dereferenced and assigned to {var_name}")
|
||||||
|
elif call_type in structs_sym_tab and len(rval.args) == 0:
|
||||||
|
struct_info = structs_sym_tab[call_type]
|
||||||
|
ir_type = struct_info.ir_type
|
||||||
|
# var = builder.alloca(ir_type, name=var_name)
|
||||||
|
# Null init
|
||||||
|
builder.store(ir.Constant(ir_type, None), local_sym_tab[var_name].var)
|
||||||
|
logger.info(f"Assigned struct {call_type} to {var_name}")
|
||||||
|
else:
|
||||||
|
logger.info(f"Unsupported assignment call type: {call_type}")
|
||||||
|
elif isinstance(rval.func, ast.Attribute):
|
||||||
|
logger.info(f"Assignment call attribute: {ast.dump(rval.func)}")
|
||||||
|
if isinstance(rval.func.value, ast.Name):
|
||||||
|
if rval.func.value.id in map_sym_tab:
|
||||||
|
map_name = rval.func.value.id
|
||||||
|
method_name = rval.func.attr
|
||||||
|
if HelperHandlerRegistry.has_handler(method_name):
|
||||||
|
val = handle_helper_call(
|
||||||
|
rval,
|
||||||
|
module,
|
||||||
|
builder,
|
||||||
|
func,
|
||||||
|
local_sym_tab,
|
||||||
|
map_sym_tab,
|
||||||
|
structs_sym_tab,
|
||||||
|
)
|
||||||
|
builder.store(val[0], local_sym_tab[var_name].var)
|
||||||
|
else:
|
||||||
|
# TODO: probably a struct access
|
||||||
|
logger.info(f"TODO STRUCT ACCESS {ast.dump(rval)}")
|
||||||
|
elif isinstance(rval.func.value, ast.Call) and isinstance(
|
||||||
|
rval.func.value.func, ast.Name
|
||||||
|
):
|
||||||
|
map_name = rval.func.value.func.id
|
||||||
|
method_name = rval.func.attr
|
||||||
|
if map_name in map_sym_tab:
|
||||||
|
if HelperHandlerRegistry.has_handler(method_name):
|
||||||
|
val = handle_helper_call(
|
||||||
|
rval,
|
||||||
|
module,
|
||||||
|
builder,
|
||||||
|
func,
|
||||||
|
local_sym_tab,
|
||||||
|
map_sym_tab,
|
||||||
|
structs_sym_tab,
|
||||||
|
)
|
||||||
|
# var = builder.alloca(ir.IntType(64), name=var_name)
|
||||||
|
# var.align = 8
|
||||||
|
builder.store(val[0], local_sym_tab[var_name].var)
|
||||||
|
else:
|
||||||
|
logger.info("Unsupported assignment call structure")
|
||||||
|
else:
|
||||||
|
logger.info("Unsupported assignment call function type")
|
||||||
|
elif isinstance(rval, ast.BinOp):
|
||||||
|
handle_binary_op(rval, builder, var_name, local_sym_tab)
|
||||||
|
else:
|
||||||
|
logger.info("Unsupported assignment value type")
|
||||||
|
|
||||||
|
|
||||||
def handle_cond(
|
def handle_cond(
|
||||||
@ -176,7 +330,6 @@ def process_stmt(
|
|||||||
ret_type=ir.IntType(64),
|
ret_type=ir.IntType(64),
|
||||||
):
|
):
|
||||||
logger.info(f"Processing statement: {ast.dump(stmt)}")
|
logger.info(f"Processing statement: {ast.dump(stmt)}")
|
||||||
reset_scratch_pool()
|
|
||||||
if isinstance(stmt, ast.Expr):
|
if isinstance(stmt, ast.Expr):
|
||||||
handle_expr(
|
handle_expr(
|
||||||
func,
|
func,
|
||||||
@ -207,107 +360,119 @@ def process_stmt(
|
|||||||
return did_return
|
return did_return
|
||||||
|
|
||||||
|
|
||||||
def handle_if_allocation(
|
|
||||||
module, builder, stmt, func, ret_type, map_sym_tab, local_sym_tab, structs_sym_tab
|
|
||||||
):
|
|
||||||
"""Recursively handle allocations in if/else branches."""
|
|
||||||
if stmt.body:
|
|
||||||
allocate_mem(
|
|
||||||
module,
|
|
||||||
builder,
|
|
||||||
stmt.body,
|
|
||||||
func,
|
|
||||||
ret_type,
|
|
||||||
map_sym_tab,
|
|
||||||
local_sym_tab,
|
|
||||||
structs_sym_tab,
|
|
||||||
)
|
|
||||||
if stmt.orelse:
|
|
||||||
allocate_mem(
|
|
||||||
module,
|
|
||||||
builder,
|
|
||||||
stmt.orelse,
|
|
||||||
func,
|
|
||||||
ret_type,
|
|
||||||
map_sym_tab,
|
|
||||||
local_sym_tab,
|
|
||||||
structs_sym_tab,
|
|
||||||
)
|
|
||||||
|
|
||||||
|
|
||||||
def count_temps_in_call(call_node, local_sym_tab):
|
|
||||||
"""Count the number of temporary variables needed for a function call."""
|
|
||||||
|
|
||||||
count = 0
|
|
||||||
is_helper = False
|
|
||||||
|
|
||||||
# NOTE: We exclude print calls for now
|
|
||||||
if isinstance(call_node.func, ast.Name):
|
|
||||||
if (
|
|
||||||
HelperHandlerRegistry.has_handler(call_node.func.id)
|
|
||||||
and call_node.func.id != "print"
|
|
||||||
):
|
|
||||||
is_helper = True
|
|
||||||
elif isinstance(call_node.func, ast.Attribute):
|
|
||||||
if HelperHandlerRegistry.has_handler(call_node.func.attr):
|
|
||||||
is_helper = True
|
|
||||||
|
|
||||||
if not is_helper:
|
|
||||||
return 0
|
|
||||||
|
|
||||||
for arg in call_node.args:
|
|
||||||
# NOTE: Count all non-name arguments
|
|
||||||
# For struct fields, if it is being passed as an argument,
|
|
||||||
# The struct object should already exist in the local_sym_tab
|
|
||||||
if not isinstance(arg, ast.Name) and not (
|
|
||||||
isinstance(arg, ast.Attribute) and arg.value.id in local_sym_tab
|
|
||||||
):
|
|
||||||
count += 1
|
|
||||||
|
|
||||||
return count
|
|
||||||
|
|
||||||
|
|
||||||
def allocate_mem(
|
def allocate_mem(
|
||||||
module, builder, body, func, ret_type, map_sym_tab, local_sym_tab, structs_sym_tab
|
module, builder, body, func, ret_type, map_sym_tab, local_sym_tab, structs_sym_tab
|
||||||
):
|
):
|
||||||
max_temps_needed = 0
|
|
||||||
|
|
||||||
def update_max_temps_for_stmt(stmt):
|
|
||||||
nonlocal max_temps_needed
|
|
||||||
temps_needed = 0
|
|
||||||
|
|
||||||
if isinstance(stmt, ast.If):
|
|
||||||
for s in stmt.body:
|
|
||||||
update_max_temps_for_stmt(s)
|
|
||||||
for s in stmt.orelse:
|
|
||||||
update_max_temps_for_stmt(s)
|
|
||||||
return
|
|
||||||
|
|
||||||
for node in ast.walk(stmt):
|
|
||||||
if isinstance(node, ast.Call):
|
|
||||||
temps_needed += count_temps_in_call(node, local_sym_tab)
|
|
||||||
max_temps_needed = max(max_temps_needed, temps_needed)
|
|
||||||
|
|
||||||
for stmt in body:
|
for stmt in body:
|
||||||
update_max_temps_for_stmt(stmt)
|
has_metadata = False
|
||||||
|
|
||||||
# Handle allocations
|
|
||||||
if isinstance(stmt, ast.If):
|
if isinstance(stmt, ast.If):
|
||||||
handle_if_allocation(
|
if stmt.body:
|
||||||
module,
|
local_sym_tab = allocate_mem(
|
||||||
builder,
|
module,
|
||||||
stmt,
|
builder,
|
||||||
func,
|
stmt.body,
|
||||||
ret_type,
|
func,
|
||||||
map_sym_tab,
|
ret_type,
|
||||||
local_sym_tab,
|
map_sym_tab,
|
||||||
structs_sym_tab,
|
local_sym_tab,
|
||||||
)
|
structs_sym_tab,
|
||||||
|
)
|
||||||
|
if stmt.orelse:
|
||||||
|
local_sym_tab = allocate_mem(
|
||||||
|
module,
|
||||||
|
builder,
|
||||||
|
stmt.orelse,
|
||||||
|
func,
|
||||||
|
ret_type,
|
||||||
|
map_sym_tab,
|
||||||
|
local_sym_tab,
|
||||||
|
structs_sym_tab,
|
||||||
|
)
|
||||||
elif isinstance(stmt, ast.Assign):
|
elif isinstance(stmt, ast.Assign):
|
||||||
handle_assign_allocation(builder, stmt, local_sym_tab, structs_sym_tab)
|
if len(stmt.targets) != 1:
|
||||||
|
logger.info("Unsupported multiassignment")
|
||||||
allocate_temp_pool(builder, max_temps_needed, local_sym_tab)
|
continue
|
||||||
|
target = stmt.targets[0]
|
||||||
|
if not isinstance(target, ast.Name):
|
||||||
|
logger.info("Unsupported assignment target")
|
||||||
|
continue
|
||||||
|
var_name = target.id
|
||||||
|
rval = stmt.value
|
||||||
|
if var_name in local_sym_tab:
|
||||||
|
logger.info(f"Variable {var_name} already allocated")
|
||||||
|
continue
|
||||||
|
if isinstance(rval, ast.Call):
|
||||||
|
if isinstance(rval.func, ast.Name):
|
||||||
|
call_type = rval.func.id
|
||||||
|
if call_type in ("c_int32", "c_int64", "c_uint32", "c_uint64"):
|
||||||
|
ir_type = ctypes_to_ir(call_type)
|
||||||
|
var = builder.alloca(ir_type, name=var_name)
|
||||||
|
var.align = ir_type.width // 8
|
||||||
|
logger.info(
|
||||||
|
f"Pre-allocated variable {var_name} of type {call_type}"
|
||||||
|
)
|
||||||
|
elif HelperHandlerRegistry.has_handler(call_type):
|
||||||
|
# Assume return type is int64 for now
|
||||||
|
ir_type = ir.IntType(64)
|
||||||
|
var = builder.alloca(ir_type, name=var_name)
|
||||||
|
var.align = ir_type.width // 8
|
||||||
|
logger.info(f"Pre-allocated variable {var_name} for helper")
|
||||||
|
elif call_type == "deref" and len(rval.args) == 1:
|
||||||
|
# Assume return type is int64 for now
|
||||||
|
ir_type = ir.IntType(64)
|
||||||
|
var = builder.alloca(ir_type, name=var_name)
|
||||||
|
var.align = ir_type.width // 8
|
||||||
|
logger.info(f"Pre-allocated variable {var_name} for deref")
|
||||||
|
elif call_type in structs_sym_tab:
|
||||||
|
struct_info = structs_sym_tab[call_type]
|
||||||
|
ir_type = struct_info.ir_type
|
||||||
|
var = builder.alloca(ir_type, name=var_name)
|
||||||
|
has_metadata = True
|
||||||
|
logger.info(
|
||||||
|
f"Pre-allocated variable {var_name} for struct {call_type}"
|
||||||
|
)
|
||||||
|
elif isinstance(rval.func, ast.Attribute):
|
||||||
|
ir_type = ir.PointerType(ir.IntType(64))
|
||||||
|
var = builder.alloca(ir_type, name=var_name)
|
||||||
|
# var.align = ir_type.width // 8
|
||||||
|
logger.info(f"Pre-allocated variable {var_name} for map")
|
||||||
|
else:
|
||||||
|
logger.info("Unsupported assignment call function type")
|
||||||
|
continue
|
||||||
|
elif isinstance(rval, ast.Constant):
|
||||||
|
if isinstance(rval.value, bool):
|
||||||
|
ir_type = ir.IntType(1)
|
||||||
|
var = builder.alloca(ir_type, name=var_name)
|
||||||
|
var.align = 1
|
||||||
|
logger.info(f"Pre-allocated variable {var_name} of type c_bool")
|
||||||
|
elif isinstance(rval.value, int):
|
||||||
|
# Assume c_int64 for now
|
||||||
|
ir_type = ir.IntType(64)
|
||||||
|
var = builder.alloca(ir_type, name=var_name)
|
||||||
|
var.align = ir_type.width // 8
|
||||||
|
logger.info(f"Pre-allocated variable {var_name} of type c_int64")
|
||||||
|
elif isinstance(rval.value, str):
|
||||||
|
ir_type = ir.PointerType(ir.IntType(8))
|
||||||
|
var = builder.alloca(ir_type, name=var_name)
|
||||||
|
var.align = 8
|
||||||
|
logger.info(f"Pre-allocated variable {var_name} of type string")
|
||||||
|
else:
|
||||||
|
logger.info("Unsupported constant type")
|
||||||
|
continue
|
||||||
|
elif isinstance(rval, ast.BinOp):
|
||||||
|
# Assume c_int64 for now
|
||||||
|
ir_type = ir.IntType(64)
|
||||||
|
var = builder.alloca(ir_type, name=var_name)
|
||||||
|
var.align = ir_type.width // 8
|
||||||
|
logger.info(f"Pre-allocated variable {var_name} of type c_int64")
|
||||||
|
else:
|
||||||
|
logger.info("Unsupported assignment value type")
|
||||||
|
continue
|
||||||
|
|
||||||
|
if has_metadata:
|
||||||
|
local_sym_tab[var_name] = LocalSymbol(var, ir_type, call_type)
|
||||||
|
else:
|
||||||
|
local_sym_tab[var_name] = LocalSymbol(var, ir_type)
|
||||||
return local_sym_tab
|
return local_sym_tab
|
||||||
|
|
||||||
|
|
||||||
|
|||||||
@ -1,10 +1,9 @@
|
|||||||
from .helper_utils import HelperHandlerRegistry, reset_scratch_pool
|
from .helper_utils import HelperHandlerRegistry
|
||||||
from .bpf_helper_handler import handle_helper_call
|
from .bpf_helper_handler import handle_helper_call
|
||||||
from .helpers import ktime, pid, deref, XDP_DROP, XDP_PASS
|
from .helpers import ktime, pid, deref, XDP_DROP, XDP_PASS
|
||||||
|
|
||||||
__all__ = [
|
__all__ = [
|
||||||
"HelperHandlerRegistry",
|
"HelperHandlerRegistry",
|
||||||
"reset_scratch_pool",
|
|
||||||
"handle_helper_call",
|
"handle_helper_call",
|
||||||
"ktime",
|
"ktime",
|
||||||
"pid",
|
"pid",
|
||||||
|
|||||||
@ -34,7 +34,6 @@ def bpf_ktime_get_ns_emitter(
|
|||||||
func,
|
func,
|
||||||
local_sym_tab=None,
|
local_sym_tab=None,
|
||||||
struct_sym_tab=None,
|
struct_sym_tab=None,
|
||||||
map_sym_tab=None,
|
|
||||||
):
|
):
|
||||||
"""
|
"""
|
||||||
Emit LLVM IR for bpf_ktime_get_ns helper function call.
|
Emit LLVM IR for bpf_ktime_get_ns helper function call.
|
||||||
@ -57,7 +56,6 @@ def bpf_map_lookup_elem_emitter(
|
|||||||
func,
|
func,
|
||||||
local_sym_tab=None,
|
local_sym_tab=None,
|
||||||
struct_sym_tab=None,
|
struct_sym_tab=None,
|
||||||
map_sym_tab=None,
|
|
||||||
):
|
):
|
||||||
"""
|
"""
|
||||||
Emit LLVM IR for bpf_map_lookup_elem helper function call.
|
Emit LLVM IR for bpf_map_lookup_elem helper function call.
|
||||||
@ -66,17 +64,11 @@ def bpf_map_lookup_elem_emitter(
|
|||||||
raise ValueError(
|
raise ValueError(
|
||||||
f"Map lookup expects exactly one argument (key), got {len(call.args)}"
|
f"Map lookup expects exactly one argument (key), got {len(call.args)}"
|
||||||
)
|
)
|
||||||
key_ptr = get_or_create_ptr_from_arg(
|
key_ptr = get_or_create_ptr_from_arg(call.args[0], builder, local_sym_tab)
|
||||||
func, module, call.args[0], builder, local_sym_tab, map_sym_tab, struct_sym_tab
|
|
||||||
)
|
|
||||||
map_void_ptr = builder.bitcast(map_ptr, ir.PointerType())
|
map_void_ptr = builder.bitcast(map_ptr, ir.PointerType())
|
||||||
|
|
||||||
# TODO: I have changed the return type to i64*, as we are
|
|
||||||
# allocating space for that type in allocate_mem. This is
|
|
||||||
# temporary, and we will honour other widths later. But this
|
|
||||||
# allows us to have cool binary ops on the returned value.
|
|
||||||
fn_type = ir.FunctionType(
|
fn_type = ir.FunctionType(
|
||||||
ir.PointerType(ir.IntType(64)), # Return type: void*
|
ir.PointerType(), # Return type: void*
|
||||||
[ir.PointerType(), ir.PointerType()], # Args: (void*, void*)
|
[ir.PointerType(), ir.PointerType()], # Args: (void*, void*)
|
||||||
var_arg=False,
|
var_arg=False,
|
||||||
)
|
)
|
||||||
@ -99,7 +91,6 @@ def bpf_printk_emitter(
|
|||||||
func,
|
func,
|
||||||
local_sym_tab=None,
|
local_sym_tab=None,
|
||||||
struct_sym_tab=None,
|
struct_sym_tab=None,
|
||||||
map_sym_tab=None,
|
|
||||||
):
|
):
|
||||||
"""Emit LLVM IR for bpf_printk helper function call."""
|
"""Emit LLVM IR for bpf_printk helper function call."""
|
||||||
if not hasattr(func, "_fmt_counter"):
|
if not hasattr(func, "_fmt_counter"):
|
||||||
@ -147,7 +138,6 @@ def bpf_map_update_elem_emitter(
|
|||||||
func,
|
func,
|
||||||
local_sym_tab=None,
|
local_sym_tab=None,
|
||||||
struct_sym_tab=None,
|
struct_sym_tab=None,
|
||||||
map_sym_tab=None,
|
|
||||||
):
|
):
|
||||||
"""
|
"""
|
||||||
Emit LLVM IR for bpf_map_update_elem helper function call.
|
Emit LLVM IR for bpf_map_update_elem helper function call.
|
||||||
@ -162,12 +152,8 @@ def bpf_map_update_elem_emitter(
|
|||||||
value_arg = call.args[1]
|
value_arg = call.args[1]
|
||||||
flags_arg = call.args[2] if len(call.args) > 2 else None
|
flags_arg = call.args[2] if len(call.args) > 2 else None
|
||||||
|
|
||||||
key_ptr = get_or_create_ptr_from_arg(
|
key_ptr = get_or_create_ptr_from_arg(key_arg, builder, local_sym_tab)
|
||||||
func, module, key_arg, builder, local_sym_tab, map_sym_tab, struct_sym_tab
|
value_ptr = get_or_create_ptr_from_arg(value_arg, builder, local_sym_tab)
|
||||||
)
|
|
||||||
value_ptr = get_or_create_ptr_from_arg(
|
|
||||||
func, module, value_arg, builder, local_sym_tab, map_sym_tab, struct_sym_tab
|
|
||||||
)
|
|
||||||
flags_val = get_flags_val(flags_arg, builder, local_sym_tab)
|
flags_val = get_flags_val(flags_arg, builder, local_sym_tab)
|
||||||
|
|
||||||
map_void_ptr = builder.bitcast(map_ptr, ir.PointerType())
|
map_void_ptr = builder.bitcast(map_ptr, ir.PointerType())
|
||||||
@ -202,7 +188,6 @@ def bpf_map_delete_elem_emitter(
|
|||||||
func,
|
func,
|
||||||
local_sym_tab=None,
|
local_sym_tab=None,
|
||||||
struct_sym_tab=None,
|
struct_sym_tab=None,
|
||||||
map_sym_tab=None,
|
|
||||||
):
|
):
|
||||||
"""
|
"""
|
||||||
Emit LLVM IR for bpf_map_delete_elem helper function call.
|
Emit LLVM IR for bpf_map_delete_elem helper function call.
|
||||||
@ -212,9 +197,7 @@ def bpf_map_delete_elem_emitter(
|
|||||||
raise ValueError(
|
raise ValueError(
|
||||||
f"Map delete expects exactly one argument (key), got {len(call.args)}"
|
f"Map delete expects exactly one argument (key), got {len(call.args)}"
|
||||||
)
|
)
|
||||||
key_ptr = get_or_create_ptr_from_arg(
|
key_ptr = get_or_create_ptr_from_arg(call.args[0], builder, local_sym_tab)
|
||||||
func, module, call.args[0], builder, local_sym_tab, map_sym_tab, struct_sym_tab
|
|
||||||
)
|
|
||||||
map_void_ptr = builder.bitcast(map_ptr, ir.PointerType())
|
map_void_ptr = builder.bitcast(map_ptr, ir.PointerType())
|
||||||
|
|
||||||
# Define function type for bpf_map_delete_elem
|
# Define function type for bpf_map_delete_elem
|
||||||
@ -242,7 +225,6 @@ def bpf_get_current_pid_tgid_emitter(
|
|||||||
func,
|
func,
|
||||||
local_sym_tab=None,
|
local_sym_tab=None,
|
||||||
struct_sym_tab=None,
|
struct_sym_tab=None,
|
||||||
map_sym_tab=None,
|
|
||||||
):
|
):
|
||||||
"""
|
"""
|
||||||
Emit LLVM IR for bpf_get_current_pid_tgid helper function call.
|
Emit LLVM IR for bpf_get_current_pid_tgid helper function call.
|
||||||
@ -269,7 +251,6 @@ def bpf_perf_event_output_handler(
|
|||||||
func,
|
func,
|
||||||
local_sym_tab=None,
|
local_sym_tab=None,
|
||||||
struct_sym_tab=None,
|
struct_sym_tab=None,
|
||||||
map_sym_tab=None,
|
|
||||||
):
|
):
|
||||||
if len(call.args) != 1:
|
if len(call.args) != 1:
|
||||||
raise ValueError(
|
raise ValueError(
|
||||||
@ -334,7 +315,6 @@ def handle_helper_call(
|
|||||||
func,
|
func,
|
||||||
local_sym_tab,
|
local_sym_tab,
|
||||||
struct_sym_tab,
|
struct_sym_tab,
|
||||||
map_sym_tab,
|
|
||||||
)
|
)
|
||||||
|
|
||||||
# Handle direct function calls (e.g., print(), ktime())
|
# Handle direct function calls (e.g., print(), ktime())
|
||||||
|
|||||||
@ -3,8 +3,7 @@ import logging
|
|||||||
from collections.abc import Callable
|
from collections.abc import Callable
|
||||||
|
|
||||||
from llvmlite import ir
|
from llvmlite import ir
|
||||||
from pythonbpf.expr import eval_expr, get_base_type_and_depth, deref_to_depth
|
from pythonbpf.expr import eval_expr
|
||||||
from pythonbpf.binary_ops import get_operand_value
|
|
||||||
|
|
||||||
logger = logging.getLogger(__name__)
|
logger = logging.getLogger(__name__)
|
||||||
|
|
||||||
@ -35,41 +34,6 @@ class HelperHandlerRegistry:
|
|||||||
return helper_name in cls._handlers
|
return helper_name in cls._handlers
|
||||||
|
|
||||||
|
|
||||||
class ScratchPoolManager:
|
|
||||||
"""Manage the temporary helper variables in local_sym_tab"""
|
|
||||||
|
|
||||||
def __init__(self):
|
|
||||||
self._counter = 0
|
|
||||||
|
|
||||||
@property
|
|
||||||
def counter(self):
|
|
||||||
return self._counter
|
|
||||||
|
|
||||||
def reset(self):
|
|
||||||
self._counter = 0
|
|
||||||
logger.debug("Scratch pool counter reset to 0")
|
|
||||||
|
|
||||||
def get_next_temp(self, local_sym_tab):
|
|
||||||
temp_name = f"__helper_temp_{self._counter}"
|
|
||||||
self._counter += 1
|
|
||||||
|
|
||||||
if temp_name not in local_sym_tab:
|
|
||||||
raise ValueError(
|
|
||||||
f"Scratch pool exhausted or inadequate: {temp_name}. "
|
|
||||||
f"Current counter: {self._counter}"
|
|
||||||
)
|
|
||||||
|
|
||||||
return local_sym_tab[temp_name].var, temp_name
|
|
||||||
|
|
||||||
|
|
||||||
_temp_pool_manager = ScratchPoolManager() # Singleton instance
|
|
||||||
|
|
||||||
|
|
||||||
def reset_scratch_pool():
|
|
||||||
"""Reset the scratch pool counter"""
|
|
||||||
_temp_pool_manager.reset()
|
|
||||||
|
|
||||||
|
|
||||||
def get_var_ptr_from_name(var_name, local_sym_tab):
|
def get_var_ptr_from_name(var_name, local_sym_tab):
|
||||||
"""Get a pointer to a variable from the symbol table."""
|
"""Get a pointer to a variable from the symbol table."""
|
||||||
if local_sym_tab and var_name in local_sym_tab:
|
if local_sym_tab and var_name in local_sym_tab:
|
||||||
@ -77,41 +41,27 @@ def get_var_ptr_from_name(var_name, local_sym_tab):
|
|||||||
raise ValueError(f"Variable '{var_name}' not found in local symbol table")
|
raise ValueError(f"Variable '{var_name}' not found in local symbol table")
|
||||||
|
|
||||||
|
|
||||||
def create_int_constant_ptr(value, builder, local_sym_tab, int_width=64):
|
def create_int_constant_ptr(value, builder, int_width=64):
|
||||||
"""Create a pointer to an integer constant."""
|
"""Create a pointer to an integer constant."""
|
||||||
|
|
||||||
# Default to 64-bit integer
|
# Default to 64-bit integer
|
||||||
ptr, temp_name = _temp_pool_manager.get_next_temp(local_sym_tab)
|
int_type = ir.IntType(int_width)
|
||||||
logger.info(f"Using temp variable '{temp_name}' for int constant {value}")
|
ptr = builder.alloca(int_type)
|
||||||
const_val = ir.Constant(ir.IntType(int_width), value)
|
ptr.align = int_type.width // 8
|
||||||
builder.store(const_val, ptr)
|
builder.store(ir.Constant(int_type, value), ptr)
|
||||||
return ptr
|
return ptr
|
||||||
|
|
||||||
|
|
||||||
def get_or_create_ptr_from_arg(
|
def get_or_create_ptr_from_arg(arg, builder, local_sym_tab):
|
||||||
func, module, arg, builder, local_sym_tab, map_sym_tab, struct_sym_tab=None
|
|
||||||
):
|
|
||||||
"""Extract or create pointer from the call arguments."""
|
"""Extract or create pointer from the call arguments."""
|
||||||
|
|
||||||
if isinstance(arg, ast.Name):
|
if isinstance(arg, ast.Name):
|
||||||
ptr = get_var_ptr_from_name(arg.id, local_sym_tab)
|
ptr = get_var_ptr_from_name(arg.id, local_sym_tab)
|
||||||
elif isinstance(arg, ast.Constant) and isinstance(arg.value, int):
|
elif isinstance(arg, ast.Constant) and isinstance(arg.value, int):
|
||||||
ptr = create_int_constant_ptr(arg.value, builder, local_sym_tab)
|
ptr = create_int_constant_ptr(arg.value, builder)
|
||||||
else:
|
else:
|
||||||
# Evaluate the expression and store the result in a temp variable
|
raise NotImplementedError(
|
||||||
val = get_operand_value(
|
"Only simple variable names are supported as args in map helpers."
|
||||||
func, module, arg, builder, local_sym_tab, map_sym_tab, struct_sym_tab
|
|
||||||
)
|
)
|
||||||
if val is None:
|
|
||||||
raise ValueError("Failed to evaluate expression for helper arg.")
|
|
||||||
|
|
||||||
# NOTE: We assume the result is an int64 for now
|
|
||||||
# if isinstance(arg, ast.Attribute):
|
|
||||||
# return val
|
|
||||||
ptr, temp_name = _temp_pool_manager.get_next_temp(local_sym_tab)
|
|
||||||
logger.info(f"Using temp variable '{temp_name}' for expression result")
|
|
||||||
builder.store(val, ptr)
|
|
||||||
|
|
||||||
return ptr
|
return ptr
|
||||||
|
|
||||||
|
|
||||||
@ -274,27 +224,10 @@ def _populate_fval(ftype, node, fmt_parts, exprs):
|
|||||||
raise NotImplementedError(
|
raise NotImplementedError(
|
||||||
f"Unsupported integer width in f-string: {ftype.width}"
|
f"Unsupported integer width in f-string: {ftype.width}"
|
||||||
)
|
)
|
||||||
elif isinstance(ftype, ir.PointerType):
|
elif ftype == ir.PointerType(ir.IntType(8)):
|
||||||
target, depth = get_base_type_and_depth(ftype)
|
# NOTE: We assume i8* is a string
|
||||||
if isinstance(target, ir.IntType):
|
fmt_parts.append("%s")
|
||||||
if target.width == 64:
|
exprs.append(node)
|
||||||
fmt_parts.append("%lld")
|
|
||||||
exprs.append(node)
|
|
||||||
elif target.width == 32:
|
|
||||||
fmt_parts.append("%d")
|
|
||||||
exprs.append(node)
|
|
||||||
elif target.width == 8 and depth == 1:
|
|
||||||
# NOTE: Assume i8* is a string
|
|
||||||
fmt_parts.append("%s")
|
|
||||||
exprs.append(node)
|
|
||||||
else:
|
|
||||||
raise NotImplementedError(
|
|
||||||
f"Unsupported pointer target type in f-string: {target}"
|
|
||||||
)
|
|
||||||
else:
|
|
||||||
raise NotImplementedError(
|
|
||||||
f"Unsupported pointer target type in f-string: {target}"
|
|
||||||
)
|
|
||||||
else:
|
else:
|
||||||
raise NotImplementedError(f"Unsupported field type in f-string: {ftype}")
|
raise NotImplementedError(f"Unsupported field type in f-string: {ftype}")
|
||||||
|
|
||||||
@ -331,20 +264,7 @@ def _prepare_expr_args(expr, func, module, builder, local_sym_tab, struct_sym_ta
|
|||||||
|
|
||||||
if val:
|
if val:
|
||||||
if isinstance(val.type, ir.PointerType):
|
if isinstance(val.type, ir.PointerType):
|
||||||
target, depth = get_base_type_and_depth(val.type)
|
val = builder.ptrtoint(val, ir.IntType(64))
|
||||||
if isinstance(target, ir.IntType):
|
|
||||||
if target.width >= 32:
|
|
||||||
val = deref_to_depth(func, builder, val, depth)
|
|
||||||
val = builder.sext(val, ir.IntType(64))
|
|
||||||
elif target.width == 8 and depth == 1:
|
|
||||||
# NOTE: i8* is string, no need to deref
|
|
||||||
pass
|
|
||||||
|
|
||||||
else:
|
|
||||||
logger.warning(
|
|
||||||
"Only int and ptr supported in bpf_printk args. Others default to 0."
|
|
||||||
)
|
|
||||||
val = ir.Constant(ir.IntType(64), 0)
|
|
||||||
elif isinstance(val.type, ir.IntType):
|
elif isinstance(val.type, ir.IntType):
|
||||||
if val.type.width < 64:
|
if val.type.width < 64:
|
||||||
val = builder.sext(val, ir.IntType(64))
|
val = builder.sext(val, ir.IntType(64))
|
||||||
|
|||||||
@ -15,5 +15,8 @@ def deref(ptr):
|
|||||||
return result if result is not None else 0
|
return result if result is not None else 0
|
||||||
|
|
||||||
|
|
||||||
|
XDP_ABORTED = ctypes.c_int64(0)
|
||||||
XDP_DROP = ctypes.c_int64(1)
|
XDP_DROP = ctypes.c_int64(1)
|
||||||
XDP_PASS = ctypes.c_int64(2)
|
XDP_PASS = ctypes.c_int64(2)
|
||||||
|
XDP_TX = ctypes.c_int64(3)
|
||||||
|
XDP_REDIRECT = ctypes.c_int64(4)
|
||||||
|
|||||||
0
pythonbpf/tbaa_gen/__init__.py
Normal file
0
pythonbpf/tbaa_gen/__init__.py
Normal file
3
pythonbpf/vmlinux_parser/__init__.py
Normal file
3
pythonbpf/vmlinux_parser/__init__.py
Normal file
@ -0,0 +1,3 @@
|
|||||||
|
from .import_detector import vmlinux_proc
|
||||||
|
|
||||||
|
__all__ = ["vmlinux_proc"]
|
||||||
167
pythonbpf/vmlinux_parser/class_handler.py
Normal file
167
pythonbpf/vmlinux_parser/class_handler.py
Normal file
@ -0,0 +1,167 @@
|
|||||||
|
import logging
|
||||||
|
from functools import lru_cache
|
||||||
|
import importlib
|
||||||
|
from .dependency_handler import DependencyHandler
|
||||||
|
from .dependency_node import DependencyNode
|
||||||
|
import ctypes
|
||||||
|
from typing import Optional, Any, Dict
|
||||||
|
|
||||||
|
logger = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
|
||||||
|
@lru_cache(maxsize=1)
|
||||||
|
def get_module_symbols(module_name: str):
|
||||||
|
imported_module = importlib.import_module(module_name)
|
||||||
|
return [name for name in dir(imported_module)], imported_module
|
||||||
|
|
||||||
|
|
||||||
|
def process_vmlinux_class(node, llvm_module, handler: DependencyHandler):
|
||||||
|
symbols_in_module, imported_module = get_module_symbols("vmlinux")
|
||||||
|
if node.name in symbols_in_module:
|
||||||
|
vmlinux_type = getattr(imported_module, node.name)
|
||||||
|
process_vmlinux_post_ast(vmlinux_type, llvm_module, handler)
|
||||||
|
else:
|
||||||
|
raise ImportError(f"{node.name} not in vmlinux")
|
||||||
|
|
||||||
|
|
||||||
|
def process_vmlinux_post_ast(
|
||||||
|
elem_type_class, llvm_handler, handler: DependencyHandler, processing_stack=None
|
||||||
|
):
|
||||||
|
# Initialize processing stack on first call
|
||||||
|
if processing_stack is None:
|
||||||
|
processing_stack = set()
|
||||||
|
symbols_in_module, imported_module = get_module_symbols("vmlinux")
|
||||||
|
|
||||||
|
current_symbol_name = elem_type_class.__name__
|
||||||
|
logger.info(f"Begin {current_symbol_name} Processing")
|
||||||
|
field_table: Dict[str, list] = {}
|
||||||
|
is_complex_type = False
|
||||||
|
containing_type: Optional[Any] = None
|
||||||
|
ctype_complex_type: Optional[Any] = None
|
||||||
|
type_length: Optional[int] = None
|
||||||
|
module_name = getattr(elem_type_class, "__module__", None)
|
||||||
|
|
||||||
|
# Check if already processed
|
||||||
|
if handler.has_node(current_symbol_name):
|
||||||
|
logger.debug(f"Node {current_symbol_name} already processed and ready")
|
||||||
|
return True
|
||||||
|
|
||||||
|
# XXX:Check it's use. It's probably not being used.
|
||||||
|
if current_symbol_name in processing_stack:
|
||||||
|
logger.debug(
|
||||||
|
f"Dependency already in processing stack for {current_symbol_name}, skipping"
|
||||||
|
)
|
||||||
|
return True
|
||||||
|
|
||||||
|
processing_stack.add(current_symbol_name)
|
||||||
|
|
||||||
|
if module_name == "vmlinux":
|
||||||
|
if hasattr(elem_type_class, "_type_"):
|
||||||
|
pass
|
||||||
|
else:
|
||||||
|
new_dep_node = DependencyNode(name=current_symbol_name)
|
||||||
|
handler.add_node(new_dep_node)
|
||||||
|
class_obj = getattr(imported_module, current_symbol_name)
|
||||||
|
# Inspect the class fields
|
||||||
|
if hasattr(class_obj, "_fields_"):
|
||||||
|
for field_elem in class_obj._fields_:
|
||||||
|
field_name: str = ""
|
||||||
|
field_type: Optional[Any] = None
|
||||||
|
bitfield_size: Optional[int] = None
|
||||||
|
if len(field_elem) == 2:
|
||||||
|
field_name, field_type = field_elem
|
||||||
|
elif len(field_elem) == 3:
|
||||||
|
field_name, field_type, bitfield_size = field_elem
|
||||||
|
field_table[field_name] = [field_type, bitfield_size]
|
||||||
|
elif hasattr(class_obj, "__annotations__"):
|
||||||
|
for field_elem in class_obj.__annotations__.items():
|
||||||
|
if len(field_elem) == 2:
|
||||||
|
field_name, field_type = field_elem
|
||||||
|
bitfield_size = None
|
||||||
|
elif len(field_elem) == 3:
|
||||||
|
field_name, field_type, bitfield_size = field_elem
|
||||||
|
else:
|
||||||
|
raise ValueError(
|
||||||
|
"Number of fields in items() of class object unexpected"
|
||||||
|
)
|
||||||
|
field_table[field_name] = [field_type, bitfield_size]
|
||||||
|
else:
|
||||||
|
raise TypeError("Could not get required class and definition")
|
||||||
|
|
||||||
|
logger.debug(f"Extracted fields for {current_symbol_name}: {field_table}")
|
||||||
|
for elem in field_table.items():
|
||||||
|
elem_name, elem_temp_list = elem
|
||||||
|
[elem_type, elem_bitfield_size] = elem_temp_list
|
||||||
|
local_module_name = getattr(elem_type, "__module__", None)
|
||||||
|
new_dep_node.add_field(elem_name, elem_type, ready=False)
|
||||||
|
if local_module_name == ctypes.__name__:
|
||||||
|
new_dep_node.set_field_bitfield_size(elem_name, elem_bitfield_size)
|
||||||
|
new_dep_node.set_field_ready(elem_name, is_ready=True)
|
||||||
|
logger.debug(
|
||||||
|
f"Field {elem_name} is direct ctypes type: {elem_type}"
|
||||||
|
)
|
||||||
|
elif local_module_name == "vmlinux":
|
||||||
|
new_dep_node.set_field_bitfield_size(elem_name, elem_bitfield_size)
|
||||||
|
logger.debug(
|
||||||
|
f"Processing vmlinux field: {elem_name}, type: {elem_type}"
|
||||||
|
)
|
||||||
|
if hasattr(elem_type, "_type_"):
|
||||||
|
is_complex_type = True
|
||||||
|
containing_type = elem_type._type_
|
||||||
|
if hasattr(elem_type, "_length_") and is_complex_type:
|
||||||
|
type_length = elem_type._length_
|
||||||
|
|
||||||
|
if containing_type.__module__ == "vmlinux":
|
||||||
|
pass
|
||||||
|
elif containing_type.__module__ == ctypes.__name__:
|
||||||
|
if isinstance(elem_type, type):
|
||||||
|
if issubclass(elem_type, ctypes.Array):
|
||||||
|
ctype_complex_type = ctypes.Array
|
||||||
|
elif issubclass(elem_type, ctypes._Pointer):
|
||||||
|
ctype_complex_type = ctypes._Pointer
|
||||||
|
else:
|
||||||
|
raise TypeError("Unsupported ctypes subclass")
|
||||||
|
else:
|
||||||
|
raise ImportError(
|
||||||
|
f"Unsupported module of {containing_type}"
|
||||||
|
)
|
||||||
|
logger.debug(
|
||||||
|
f"{containing_type} containing type of parent {elem_name} with {elem_type} and ctype {ctype_complex_type} and length {type_length}"
|
||||||
|
)
|
||||||
|
new_dep_node.set_field_containing_type(
|
||||||
|
elem_name, containing_type
|
||||||
|
)
|
||||||
|
new_dep_node.set_field_type_size(elem_name, type_length)
|
||||||
|
new_dep_node.set_field_ctype_complex_type(
|
||||||
|
elem_name, ctype_complex_type
|
||||||
|
)
|
||||||
|
new_dep_node.set_field_type(elem_name, elem_type)
|
||||||
|
if containing_type.__module__ == "vmlinux":
|
||||||
|
process_vmlinux_post_ast(
|
||||||
|
containing_type, llvm_handler, handler, processing_stack
|
||||||
|
)
|
||||||
|
new_dep_node.set_field_ready(elem_name, True)
|
||||||
|
elif containing_type.__module__ == ctypes.__name__:
|
||||||
|
logger.debug(f"Processing ctype internal{containing_type}")
|
||||||
|
new_dep_node.set_field_ready(elem_name, True)
|
||||||
|
else:
|
||||||
|
raise TypeError(
|
||||||
|
"Module not supported in recursive resolution"
|
||||||
|
)
|
||||||
|
else:
|
||||||
|
process_vmlinux_post_ast(
|
||||||
|
elem_type, llvm_handler, handler, processing_stack
|
||||||
|
)
|
||||||
|
new_dep_node.set_field_ready(elem_name, True)
|
||||||
|
else:
|
||||||
|
raise ValueError(
|
||||||
|
f"{elem_name} with type {elem_type} from module {module_name} not supported in recursive resolver"
|
||||||
|
)
|
||||||
|
|
||||||
|
else:
|
||||||
|
raise ImportError("UNSUPPORTED Module")
|
||||||
|
|
||||||
|
logging.info(
|
||||||
|
f"{current_symbol_name} processed and handler readiness {handler.is_ready}"
|
||||||
|
)
|
||||||
|
return True
|
||||||
149
pythonbpf/vmlinux_parser/dependency_handler.py
Normal file
149
pythonbpf/vmlinux_parser/dependency_handler.py
Normal file
@ -0,0 +1,149 @@
|
|||||||
|
from typing import Optional, Dict, List, Iterator
|
||||||
|
from .dependency_node import DependencyNode
|
||||||
|
|
||||||
|
|
||||||
|
class DependencyHandler:
|
||||||
|
"""
|
||||||
|
Manages a collection of DependencyNode objects with no duplicates.
|
||||||
|
|
||||||
|
Ensures that no two nodes with the same name can be added and provides
|
||||||
|
methods to check readiness and retrieve specific nodes.
|
||||||
|
|
||||||
|
Example usage:
|
||||||
|
# Create a handler
|
||||||
|
handler = DependencyHandler()
|
||||||
|
|
||||||
|
# Create some dependency nodes
|
||||||
|
node1 = DependencyNode(name="node1")
|
||||||
|
node1.add_field("field1", str)
|
||||||
|
node1.set_field_value("field1", "value1")
|
||||||
|
|
||||||
|
node2 = DependencyNode(name="node2")
|
||||||
|
node2.add_field("field1", int)
|
||||||
|
|
||||||
|
# Add nodes to the handler
|
||||||
|
handler.add_node(node1)
|
||||||
|
handler.add_node(node2)
|
||||||
|
|
||||||
|
# Check if a specific node exists
|
||||||
|
print(handler.has_node("node1")) # True
|
||||||
|
|
||||||
|
# Get a reference to a node and modify it
|
||||||
|
node = handler.get_node("node2")
|
||||||
|
node.set_field_value("field1", 42)
|
||||||
|
|
||||||
|
# Check if all nodes are ready
|
||||||
|
print(handler.is_ready) # False (node2 is ready, but node1 isn't)
|
||||||
|
"""
|
||||||
|
|
||||||
|
def __init__(self):
|
||||||
|
# Using a dictionary with node names as keys ensures name uniqueness
|
||||||
|
# and provides efficient lookups
|
||||||
|
self._nodes: Dict[str, DependencyNode] = {}
|
||||||
|
|
||||||
|
def add_node(self, node: DependencyNode) -> bool:
|
||||||
|
"""
|
||||||
|
Add a dependency node to the handler.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
node: The DependencyNode to add
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
bool: True if the node was added, False if a node with the same name already exists
|
||||||
|
|
||||||
|
Raises:
|
||||||
|
TypeError: If the provided object is not a DependencyNode
|
||||||
|
"""
|
||||||
|
if not isinstance(node, DependencyNode):
|
||||||
|
raise TypeError(f"Expected DependencyNode, got {type(node).__name__}")
|
||||||
|
|
||||||
|
# Check if a node with this name already exists
|
||||||
|
if node.name in self._nodes:
|
||||||
|
return False
|
||||||
|
|
||||||
|
self._nodes[node.name] = node
|
||||||
|
return True
|
||||||
|
|
||||||
|
@property
|
||||||
|
def is_ready(self) -> bool:
|
||||||
|
"""
|
||||||
|
Check if all nodes are ready.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
bool: True if all nodes are ready (or if there are no nodes), False otherwise
|
||||||
|
"""
|
||||||
|
if not self._nodes:
|
||||||
|
return True
|
||||||
|
|
||||||
|
return all(node.is_ready for node in self._nodes.values())
|
||||||
|
|
||||||
|
def has_node(self, name: str) -> bool:
|
||||||
|
"""
|
||||||
|
Check if a node with the given name exists.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
name: The name to check
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
bool: True if a node with the given name exists, False otherwise
|
||||||
|
"""
|
||||||
|
return name in self._nodes
|
||||||
|
|
||||||
|
def get_node(self, name: str) -> Optional[DependencyNode]:
|
||||||
|
"""
|
||||||
|
Get a node by name for manipulation.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
name: The name of the node to retrieve
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
Optional[DependencyNode]: The node with the given name, or None if not found
|
||||||
|
"""
|
||||||
|
return self._nodes.get(name)
|
||||||
|
|
||||||
|
def remove_node(self, node_or_name) -> bool:
|
||||||
|
"""
|
||||||
|
Remove a node by name or reference.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
node_or_name: The node to remove or its name
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
bool: True if the node was removed, False if not found
|
||||||
|
"""
|
||||||
|
if isinstance(node_or_name, DependencyNode):
|
||||||
|
name = node_or_name.name
|
||||||
|
else:
|
||||||
|
name = node_or_name
|
||||||
|
|
||||||
|
if name in self._nodes:
|
||||||
|
del self._nodes[name]
|
||||||
|
return True
|
||||||
|
return False
|
||||||
|
|
||||||
|
def get_all_nodes(self) -> List[DependencyNode]:
|
||||||
|
"""
|
||||||
|
Get all nodes stored in the handler.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
List[DependencyNode]: List of all nodes
|
||||||
|
"""
|
||||||
|
return list(self._nodes.values())
|
||||||
|
|
||||||
|
def __iter__(self) -> Iterator[DependencyNode]:
|
||||||
|
"""
|
||||||
|
Iterate over all nodes.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
Iterator[DependencyNode]: Iterator over all nodes
|
||||||
|
"""
|
||||||
|
return iter(self._nodes.values())
|
||||||
|
|
||||||
|
def __len__(self) -> int:
|
||||||
|
"""
|
||||||
|
Get the number of nodes in the handler.
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
int: The number of nodes
|
||||||
|
"""
|
||||||
|
return len(self._nodes)
|
||||||
237
pythonbpf/vmlinux_parser/dependency_node.py
Normal file
237
pythonbpf/vmlinux_parser/dependency_node.py
Normal file
@ -0,0 +1,237 @@
|
|||||||
|
from dataclasses import dataclass, field
|
||||||
|
from typing import Dict, Any, Optional
|
||||||
|
|
||||||
|
|
||||||
|
# TODO: FIX THE FUCKING TYPE NAME CONVENTION.
|
||||||
|
@dataclass
|
||||||
|
class Field:
|
||||||
|
"""Represents a field in a dependency node with its type and readiness state."""
|
||||||
|
|
||||||
|
name: str
|
||||||
|
type: type
|
||||||
|
ctype_complex_type: Optional[Any]
|
||||||
|
containing_type: Optional[Any]
|
||||||
|
type_size: Optional[int]
|
||||||
|
bitfield_size: Optional[int]
|
||||||
|
value: Any = None
|
||||||
|
ready: bool = False
|
||||||
|
|
||||||
|
def set_ready(self, is_ready: bool = True) -> None:
|
||||||
|
"""Set the readiness state of this field."""
|
||||||
|
self.ready = is_ready
|
||||||
|
|
||||||
|
def set_value(self, value: Any, mark_ready: bool = False) -> None:
|
||||||
|
"""Set the value of this field and optionally mark it as ready."""
|
||||||
|
self.value = value
|
||||||
|
if mark_ready:
|
||||||
|
self.ready = True
|
||||||
|
|
||||||
|
def set_type(self, given_type, mark_ready: bool = False) -> None:
|
||||||
|
"""Set value of the type field and mark as ready"""
|
||||||
|
self.type = given_type
|
||||||
|
if mark_ready:
|
||||||
|
self.ready = True
|
||||||
|
|
||||||
|
def set_containing_type(
|
||||||
|
self, containing_type: Optional[Any], mark_ready: bool = False
|
||||||
|
) -> None:
|
||||||
|
"""Set the containing_type of this field and optionally mark it as ready."""
|
||||||
|
self.containing_type = containing_type
|
||||||
|
if mark_ready:
|
||||||
|
self.ready = True
|
||||||
|
|
||||||
|
def set_type_size(self, type_size: Any, mark_ready: bool = False) -> None:
|
||||||
|
"""Set the type_size of this field and optionally mark it as ready."""
|
||||||
|
self.type_size = type_size
|
||||||
|
if mark_ready:
|
||||||
|
self.ready = True
|
||||||
|
|
||||||
|
def set_ctype_complex_type(
|
||||||
|
self, ctype_complex_type: Any, mark_ready: bool = False
|
||||||
|
) -> None:
|
||||||
|
"""Set the ctype_complex_type of this field and optionally mark it as ready."""
|
||||||
|
self.ctype_complex_type = ctype_complex_type
|
||||||
|
if mark_ready:
|
||||||
|
self.ready = True
|
||||||
|
|
||||||
|
def set_bitfield_size(self, bitfield_size: Any, mark_ready: bool = False) -> None:
|
||||||
|
"""Set the bitfield_size of this field and optionally mark it as ready."""
|
||||||
|
self.bitfield_size = bitfield_size
|
||||||
|
if mark_ready:
|
||||||
|
self.ready = True
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class DependencyNode:
|
||||||
|
"""
|
||||||
|
A node with typed fields and readiness tracking.
|
||||||
|
|
||||||
|
Example usage:
|
||||||
|
# Create a dependency node for a Person
|
||||||
|
somestruct = DependencyNode(name="struct_1")
|
||||||
|
|
||||||
|
# Add fields with their types
|
||||||
|
somestruct.add_field("field_1", str)
|
||||||
|
somestruct.add_field("field_2", int)
|
||||||
|
somestruct.add_field("field_3", str)
|
||||||
|
|
||||||
|
# Check if the node is ready (should be False initially)
|
||||||
|
print(f"Is node ready? {somestruct.is_ready}") # False
|
||||||
|
|
||||||
|
# Set some field values
|
||||||
|
somestruct.set_field_value("field_1", "someproperty")
|
||||||
|
somestruct.set_field_value("field_2", 30)
|
||||||
|
|
||||||
|
# Check if the node is ready (still False because email is not ready)
|
||||||
|
print(f"Is node ready? {somestruct.is_ready}") # False
|
||||||
|
|
||||||
|
# Set the last field and make the node ready
|
||||||
|
somestruct.set_field_value("field_3", "anotherproperty")
|
||||||
|
|
||||||
|
# Now the node should be ready
|
||||||
|
print(f"Is node ready? {somestruct.is_ready}") # True
|
||||||
|
|
||||||
|
# You can also mark a field as not ready
|
||||||
|
somestruct.set_field_ready("field_3", False)
|
||||||
|
|
||||||
|
# Now the node is not ready again
|
||||||
|
print(f"Is node ready? {somestruct.is_ready}") # False
|
||||||
|
|
||||||
|
# Get all field values
|
||||||
|
print(somestruct.get_field_values()) # {'field_1': 'someproperty', 'field_2': 30, 'field_3': 'anotherproperty'}
|
||||||
|
|
||||||
|
# Get only ready fields
|
||||||
|
ready_fields = somestruct.get_ready_fields()
|
||||||
|
print(f"Ready fields: {[field.name for field in ready_fields.values()]}") # ['field_1', 'field_2']
|
||||||
|
"""
|
||||||
|
|
||||||
|
name: str
|
||||||
|
fields: Dict[str, Field] = field(default_factory=dict)
|
||||||
|
_ready_cache: Optional[bool] = field(default=None, repr=False)
|
||||||
|
|
||||||
|
def add_field(
|
||||||
|
self,
|
||||||
|
name: str,
|
||||||
|
field_type: type,
|
||||||
|
initial_value: Any = None,
|
||||||
|
containing_type: Optional[Any] = None,
|
||||||
|
type_size: Optional[int] = None,
|
||||||
|
ctype_complex_type: Optional[int] = None,
|
||||||
|
bitfield_size: Optional[int] = None,
|
||||||
|
ready: bool = False,
|
||||||
|
) -> None:
|
||||||
|
"""Add a field to the node with an optional initial value and readiness state."""
|
||||||
|
self.fields[name] = Field(
|
||||||
|
name=name,
|
||||||
|
type=field_type,
|
||||||
|
value=initial_value,
|
||||||
|
ready=ready,
|
||||||
|
containing_type=containing_type,
|
||||||
|
type_size=type_size,
|
||||||
|
ctype_complex_type=ctype_complex_type,
|
||||||
|
bitfield_size=bitfield_size,
|
||||||
|
)
|
||||||
|
# Invalidate readiness cache
|
||||||
|
self._ready_cache = None
|
||||||
|
|
||||||
|
def get_field(self, name: str) -> Field:
|
||||||
|
"""Get a field by name."""
|
||||||
|
return self.fields[name]
|
||||||
|
|
||||||
|
def set_field_value(self, name: str, value: Any, mark_ready: bool = False) -> None:
|
||||||
|
"""Set a field's value and optionally mark it as ready."""
|
||||||
|
if name not in self.fields:
|
||||||
|
raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
|
||||||
|
|
||||||
|
self.fields[name].set_value(value, mark_ready)
|
||||||
|
# Invalidate readiness cache
|
||||||
|
self._ready_cache = None
|
||||||
|
|
||||||
|
def set_field_type(self, name: str, type: Any, mark_ready: bool = False) -> None:
|
||||||
|
"""Set a field's type and optionally mark it as ready."""
|
||||||
|
if name not in self.fields:
|
||||||
|
raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
|
||||||
|
|
||||||
|
self.fields[name].set_type(type, mark_ready)
|
||||||
|
# Invalidate readiness cache
|
||||||
|
self._ready_cache = None
|
||||||
|
|
||||||
|
def set_field_containing_type(
|
||||||
|
self, name: str, containing_type: Any, mark_ready: bool = False
|
||||||
|
) -> None:
|
||||||
|
"""Set a field's containing_type and optionally mark it as ready."""
|
||||||
|
if name not in self.fields:
|
||||||
|
raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
|
||||||
|
|
||||||
|
self.fields[name].set_containing_type(containing_type, mark_ready)
|
||||||
|
# Invalidate readiness cache
|
||||||
|
self._ready_cache = None
|
||||||
|
|
||||||
|
def set_field_type_size(
|
||||||
|
self, name: str, type_size: Any, mark_ready: bool = False
|
||||||
|
) -> None:
|
||||||
|
"""Set a field's type_size and optionally mark it as ready."""
|
||||||
|
if name not in self.fields:
|
||||||
|
raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
|
||||||
|
|
||||||
|
self.fields[name].set_type_size(type_size, mark_ready)
|
||||||
|
# Invalidate readiness cache
|
||||||
|
self._ready_cache = None
|
||||||
|
|
||||||
|
def set_field_ctype_complex_type(
|
||||||
|
self, name: str, ctype_complex_type: Any, mark_ready: bool = False
|
||||||
|
) -> None:
|
||||||
|
"""Set a field's ctype_complex_type and optionally mark it as ready."""
|
||||||
|
if name not in self.fields:
|
||||||
|
raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
|
||||||
|
|
||||||
|
self.fields[name].set_ctype_complex_type(ctype_complex_type, mark_ready)
|
||||||
|
# Invalidate readiness cache
|
||||||
|
self._ready_cache = None
|
||||||
|
|
||||||
|
def set_field_bitfield_size(
|
||||||
|
self, name: str, bitfield_size: Any, mark_ready: bool = False
|
||||||
|
) -> None:
|
||||||
|
"""Set a field's bitfield_size and optionally mark it as ready."""
|
||||||
|
if name not in self.fields:
|
||||||
|
raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
|
||||||
|
|
||||||
|
self.fields[name].set_bitfield_size(bitfield_size, mark_ready)
|
||||||
|
# Invalidate readiness cache
|
||||||
|
self._ready_cache = None
|
||||||
|
|
||||||
|
def set_field_ready(self, name: str, is_ready: bool = False) -> None:
|
||||||
|
"""Mark a field as ready or not ready."""
|
||||||
|
if name not in self.fields:
|
||||||
|
raise KeyError(f"Field '{name}' does not exist in node '{self.name}'")
|
||||||
|
|
||||||
|
self.fields[name].set_ready(is_ready)
|
||||||
|
# Invalidate readiness cache
|
||||||
|
self._ready_cache = None
|
||||||
|
|
||||||
|
@property
|
||||||
|
def is_ready(self) -> bool:
|
||||||
|
"""Check if the node is ready (all fields are ready)."""
|
||||||
|
# Use cached value if available
|
||||||
|
if self._ready_cache is not None:
|
||||||
|
return self._ready_cache
|
||||||
|
|
||||||
|
# Calculate readiness only when needed
|
||||||
|
if not self.fields:
|
||||||
|
self._ready_cache = True
|
||||||
|
return True
|
||||||
|
|
||||||
|
self._ready_cache = all(elem.ready for elem in self.fields.values())
|
||||||
|
return self._ready_cache
|
||||||
|
|
||||||
|
def get_field_values(self) -> Dict[str, Any]:
|
||||||
|
"""Get a dictionary of field names to their values."""
|
||||||
|
return {name: elem.value for name, elem in self.fields.items()}
|
||||||
|
|
||||||
|
def get_ready_fields(self) -> Dict[str, Field]:
|
||||||
|
"""Get all fields that are marked as ready."""
|
||||||
|
return {name: elem for name, elem in self.fields.items() if elem.ready}
|
||||||
|
|
||||||
|
def get_not_ready_fields(self) -> Dict[str, Field]:
|
||||||
|
"""Get all fields that are marked as not ready."""
|
||||||
|
return {name: elem for name, elem in self.fields.items() if not elem.ready}
|
||||||
135
pythonbpf/vmlinux_parser/import_detector.py
Normal file
135
pythonbpf/vmlinux_parser/import_detector.py
Normal file
@ -0,0 +1,135 @@
|
|||||||
|
import ast
|
||||||
|
import logging
|
||||||
|
from typing import List, Tuple, Dict
|
||||||
|
import importlib
|
||||||
|
import inspect
|
||||||
|
|
||||||
|
from .dependency_handler import DependencyHandler
|
||||||
|
from .ir_generation import IRGenerator
|
||||||
|
from .class_handler import process_vmlinux_class
|
||||||
|
|
||||||
|
logger = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
|
||||||
|
def detect_import_statement(tree: ast.AST) -> List[Tuple[str, ast.ImportFrom]]:
|
||||||
|
"""
|
||||||
|
Parse AST and detect import statements from vmlinux.
|
||||||
|
|
||||||
|
Returns a list of tuples (module_name, imported_item) for vmlinux imports.
|
||||||
|
Raises SyntaxError for invalid import patterns.
|
||||||
|
|
||||||
|
Args:
|
||||||
|
tree: The AST to parse
|
||||||
|
|
||||||
|
Returns:
|
||||||
|
List of tuples containing (module_name, imported_item) for each vmlinux import
|
||||||
|
|
||||||
|
Raises:
|
||||||
|
SyntaxError: If multiple imports from vmlinux are attempted or import * is used
|
||||||
|
"""
|
||||||
|
vmlinux_imports = []
|
||||||
|
|
||||||
|
for node in ast.walk(tree):
|
||||||
|
# Handle "from vmlinux import ..." statements
|
||||||
|
if isinstance(node, ast.ImportFrom):
|
||||||
|
if node.module == "vmlinux":
|
||||||
|
# Check for wildcard import: from vmlinux import *
|
||||||
|
if any(alias.name == "*" for alias in node.names):
|
||||||
|
raise SyntaxError(
|
||||||
|
"Wildcard imports from vmlinux are not supported. "
|
||||||
|
"Please import specific types explicitly."
|
||||||
|
)
|
||||||
|
|
||||||
|
# Check for multiple imports: from vmlinux import A, B, C
|
||||||
|
if len(node.names) > 1:
|
||||||
|
imported_names = [alias.name for alias in node.names]
|
||||||
|
raise SyntaxError(
|
||||||
|
f"Multiple imports from vmlinux are not supported. "
|
||||||
|
f"Found: {', '.join(imported_names)}. "
|
||||||
|
f"Please use separate import statements for each type."
|
||||||
|
)
|
||||||
|
|
||||||
|
# Check if no specific import is specified (should not happen with valid Python)
|
||||||
|
if len(node.names) == 0:
|
||||||
|
raise SyntaxError(
|
||||||
|
"Import from vmlinux must specify at least one type."
|
||||||
|
)
|
||||||
|
|
||||||
|
# Valid single import
|
||||||
|
for alias in node.names:
|
||||||
|
import_name = alias.name
|
||||||
|
# Use alias if provided, otherwise use the original name (commented)
|
||||||
|
# as_name = alias.asname if alias.asname else alias.name
|
||||||
|
vmlinux_imports.append(("vmlinux", node))
|
||||||
|
logger.info(f"Found vmlinux import: {import_name}")
|
||||||
|
|
||||||
|
# Handle "import vmlinux" statements (not typical but should be rejected)
|
||||||
|
elif isinstance(node, ast.Import):
|
||||||
|
for alias in node.names:
|
||||||
|
if alias.name == "vmlinux" or alias.name.startswith("vmlinux."):
|
||||||
|
raise SyntaxError(
|
||||||
|
"Direct import of vmlinux module is not supported. "
|
||||||
|
"Use 'from vmlinux import <type>' instead."
|
||||||
|
)
|
||||||
|
|
||||||
|
logger.info(f"Total vmlinux imports detected: {len(vmlinux_imports)}")
|
||||||
|
return vmlinux_imports
|
||||||
|
|
||||||
|
|
||||||
|
def vmlinux_proc(tree: ast.AST, module):
|
||||||
|
import_statements = detect_import_statement(tree)
|
||||||
|
|
||||||
|
# initialise dependency handler
|
||||||
|
handler = DependencyHandler()
|
||||||
|
# initialise assignment dictionary of name to type
|
||||||
|
assignments: Dict[str, type] = {}
|
||||||
|
|
||||||
|
if not import_statements:
|
||||||
|
logger.info("No vmlinux imports found")
|
||||||
|
return
|
||||||
|
|
||||||
|
# Import vmlinux module directly
|
||||||
|
try:
|
||||||
|
vmlinux_mod = importlib.import_module("vmlinux")
|
||||||
|
except ImportError:
|
||||||
|
logger.warning("Could not import vmlinux module")
|
||||||
|
return
|
||||||
|
|
||||||
|
source_file = inspect.getsourcefile(vmlinux_mod)
|
||||||
|
if source_file is None:
|
||||||
|
logger.warning("Cannot find source for vmlinux module")
|
||||||
|
return
|
||||||
|
|
||||||
|
with open(source_file, "r") as f:
|
||||||
|
mod_ast = ast.parse(f.read(), filename=source_file)
|
||||||
|
|
||||||
|
for import_mod, import_node in import_statements:
|
||||||
|
for alias in import_node.names:
|
||||||
|
imported_name = alias.name
|
||||||
|
found = False
|
||||||
|
for mod_node in mod_ast.body:
|
||||||
|
if (
|
||||||
|
isinstance(mod_node, ast.ClassDef)
|
||||||
|
and mod_node.name == imported_name
|
||||||
|
):
|
||||||
|
process_vmlinux_class(mod_node, module, handler)
|
||||||
|
found = True
|
||||||
|
break
|
||||||
|
if isinstance(mod_node, ast.Assign):
|
||||||
|
for target in mod_node.targets:
|
||||||
|
if isinstance(target, ast.Name) and target.id == imported_name:
|
||||||
|
process_vmlinux_assign(mod_node, module, assignments)
|
||||||
|
found = True
|
||||||
|
break
|
||||||
|
if found:
|
||||||
|
break
|
||||||
|
if not found:
|
||||||
|
logger.info(
|
||||||
|
f"{imported_name} not found as ClassDef or Assign in vmlinux"
|
||||||
|
)
|
||||||
|
|
||||||
|
IRGenerator(module, handler)
|
||||||
|
|
||||||
|
|
||||||
|
def process_vmlinux_assign(node, module, assignments: Dict[str, type]):
|
||||||
|
raise NotImplementedError("Assignment handling has not been implemented yet")
|
||||||
14
pythonbpf/vmlinux_parser/ir_generation.py
Normal file
14
pythonbpf/vmlinux_parser/ir_generation.py
Normal file
@ -0,0 +1,14 @@
|
|||||||
|
import logging
|
||||||
|
from .dependency_handler import DependencyHandler
|
||||||
|
|
||||||
|
logger = logging.getLogger(__name__)
|
||||||
|
|
||||||
|
|
||||||
|
class IRGenerator:
|
||||||
|
def __init__(self, module, handler: DependencyHandler):
|
||||||
|
self.module = module
|
||||||
|
self.handler: DependencyHandler = handler
|
||||||
|
if not handler.is_ready:
|
||||||
|
raise ImportError(
|
||||||
|
"Semantic analysis of vmlinux imports failed. Cannot generate IR"
|
||||||
|
)
|
||||||
@ -1,11 +1,10 @@
|
|||||||
#include <linux/bpf.h>
|
#include "vmlinux.h"
|
||||||
#include <bpf/bpf_helpers.h>
|
#include <bpf/bpf_helpers.h>
|
||||||
#define u64 unsigned long long
|
#include <bpf/bpf_endian.h>
|
||||||
#define u32 unsigned int
|
|
||||||
|
|
||||||
SEC("xdp")
|
SEC("xdp")
|
||||||
int hello(struct xdp_md *ctx) {
|
int hello(struct xdp_md *ctx) {
|
||||||
bpf_printk("Hello, World!\n");
|
bpf_printk("Hello, World! %ud \n", ctx->data);
|
||||||
return XDP_PASS;
|
return XDP_PASS;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|||||||
@ -1,39 +0,0 @@
|
|||||||
from pythonbpf import bpf, map, section, bpfglobal, compile
|
|
||||||
from ctypes import c_void_p, c_int64, c_uint64
|
|
||||||
from pythonbpf.maps import HashMap
|
|
||||||
|
|
||||||
|
|
||||||
# NOTE: This example tries to reinterpret the variable `x` to a different type.
|
|
||||||
# We do not allow this for now, as stack allocations are typed and have to be
|
|
||||||
# done in the first basic block. Allowing re-interpretation would require
|
|
||||||
# re-allocation of stack space (possibly in a new basic block), which is not
|
|
||||||
# supported in eBPF yet.
|
|
||||||
# We can allow bitcasts in cases where the width of the types is the same in
|
|
||||||
# the future. But for now, we do not allow any re-interpretation of variables.
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@map
|
|
||||||
def last() -> HashMap:
|
|
||||||
return HashMap(key=c_uint64, value=c_uint64, max_entries=3)
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@section("tracepoint/syscalls/sys_enter_execve")
|
|
||||||
def hello_world(ctx: c_void_p) -> c_int64:
|
|
||||||
last.update(0, 1)
|
|
||||||
x = last.lookup(0)
|
|
||||||
x = 20
|
|
||||||
if x == 2:
|
|
||||||
print("Hello, World!")
|
|
||||||
else:
|
|
||||||
print("Goodbye, World!")
|
|
||||||
return
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@bpfglobal
|
|
||||||
def LICENSE() -> str:
|
|
||||||
return "GPL"
|
|
||||||
|
|
||||||
|
|
||||||
compile()
|
|
||||||
@ -3,16 +3,19 @@ import logging
|
|||||||
from pythonbpf import compile, bpf, section, bpfglobal, compile_to_ir
|
from pythonbpf import compile, bpf, section, bpfglobal, compile_to_ir
|
||||||
from ctypes import c_void_p, c_int64, c_int32
|
from ctypes import c_void_p, c_int64, c_int32
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
@bpf
|
||||||
@bpfglobal
|
@bpfglobal
|
||||||
def somevalue() -> c_int32:
|
def somevalue() -> c_int32:
|
||||||
return c_int32(42)
|
return c_int32(42)
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
@bpf
|
||||||
@bpfglobal
|
@bpfglobal
|
||||||
def somevalue2() -> c_int64:
|
def somevalue2() -> c_int64:
|
||||||
return c_int64(69)
|
return c_int64(69)
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
@bpf
|
||||||
@bpfglobal
|
@bpfglobal
|
||||||
def somevalue1() -> c_int32:
|
def somevalue1() -> c_int32:
|
||||||
@ -21,12 +24,14 @@ def somevalue1() -> c_int32:
|
|||||||
|
|
||||||
# --- Passing examples ---
|
# --- Passing examples ---
|
||||||
|
|
||||||
|
|
||||||
# Simple constant return
|
# Simple constant return
|
||||||
@bpf
|
@bpf
|
||||||
@bpfglobal
|
@bpfglobal
|
||||||
def g1() -> c_int64:
|
def g1() -> c_int64:
|
||||||
return c_int64(42)
|
return c_int64(42)
|
||||||
|
|
||||||
|
|
||||||
# Constructor with one constant argument
|
# Constructor with one constant argument
|
||||||
@bpf
|
@bpf
|
||||||
@bpfglobal
|
@bpfglobal
|
||||||
@ -62,15 +67,17 @@ def g2() -> c_int64:
|
|||||||
# def g6() -> c_int64:
|
# def g6() -> c_int64:
|
||||||
# return c_int64(CONST)
|
# return c_int64(CONST)
|
||||||
|
|
||||||
|
|
||||||
# Constructor with multiple args
|
# Constructor with multiple args
|
||||||
#TODO: this is not working. should it work ?
|
# TODO: this is not working. should it work ?
|
||||||
@bpf
|
@bpf
|
||||||
@bpfglobal
|
@bpfglobal
|
||||||
def g7() -> c_int64:
|
def g7() -> c_int64:
|
||||||
return c_int64(1)
|
return c_int64(1)
|
||||||
|
|
||||||
|
|
||||||
# Dataclass call
|
# Dataclass call
|
||||||
#TODO: fails with dataclass
|
# TODO: fails with dataclass
|
||||||
# @dataclass
|
# @dataclass
|
||||||
# class Point:
|
# class Point:
|
||||||
# x: c_int64
|
# x: c_int64
|
||||||
@ -91,6 +98,7 @@ def sometag(ctx: c_void_p) -> c_int64:
|
|||||||
print(f"{somevalue}")
|
print(f"{somevalue}")
|
||||||
return c_int64(1)
|
return c_int64(1)
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
@bpf
|
||||||
@bpfglobal
|
@bpfglobal
|
||||||
def LICENSE() -> str:
|
def LICENSE() -> str:
|
||||||
|
|||||||
@ -11,6 +11,7 @@ from ctypes import c_void_p, c_int64
|
|||||||
# We cannot allocate space for the intermediate type now.
|
# We cannot allocate space for the intermediate type now.
|
||||||
# We probably need to track the ref/deref chain for each variable.
|
# We probably need to track the ref/deref chain for each variable.
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
@bpf
|
||||||
@map
|
@map
|
||||||
def count() -> HashMap:
|
def count() -> HashMap:
|
||||||
|
|||||||
@ -3,6 +3,7 @@ import logging
|
|||||||
from pythonbpf import compile, bpf, section, bpfglobal, compile_to_ir
|
from pythonbpf import compile, bpf, section, bpfglobal, compile_to_ir
|
||||||
from ctypes import c_void_p, c_int64
|
from ctypes import c_void_p, c_int64
|
||||||
|
|
||||||
|
|
||||||
# This should not pass as somevalue is not declared at all.
|
# This should not pass as somevalue is not declared at all.
|
||||||
@bpf
|
@bpf
|
||||||
@section("tracepoint/syscalls/sys_enter_execve")
|
@section("tracepoint/syscalls/sys_enter_execve")
|
||||||
@ -11,6 +12,7 @@ def sometag(ctx: c_void_p) -> c_int64:
|
|||||||
print(f"{somevalue}") # noqa: F821
|
print(f"{somevalue}") # noqa: F821
|
||||||
return c_int64(1)
|
return c_int64(1)
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
@bpf
|
||||||
@bpfglobal
|
@bpfglobal
|
||||||
def LICENSE() -> str:
|
def LICENSE() -> str:
|
||||||
|
|||||||
47
tests/failing_tests/xdp_pass.py
Normal file
47
tests/failing_tests/xdp_pass.py
Normal file
@ -0,0 +1,47 @@
|
|||||||
|
from pythonbpf import bpf, map, section, bpfglobal, compile_to_ir
|
||||||
|
from pythonbpf.maps import HashMap
|
||||||
|
from pythonbpf.helper import XDP_PASS
|
||||||
|
from vmlinux import struct_xdp_md
|
||||||
|
from vmlinux import struct_xdp_buff # noqa: F401
|
||||||
|
from vmlinux import struct_ring_buffer_per_cpu # noqa: F401
|
||||||
|
|
||||||
|
from ctypes import c_int64
|
||||||
|
|
||||||
|
# Instructions to how to run this program
|
||||||
|
# 1. Install PythonBPF: pip install pythonbpf
|
||||||
|
# 2. Run the program: python examples/xdp_pass.py
|
||||||
|
# 3. Run the program with sudo: sudo tools/check.sh run examples/xdp_pass.o
|
||||||
|
# 4. Attach object file to any network device with something like ./check.sh xdp examples/xdp_pass.o tailscale0
|
||||||
|
# 5. send traffic through the device and observe effects
|
||||||
|
|
||||||
|
|
||||||
|
@bpf
|
||||||
|
@map
|
||||||
|
def count() -> HashMap:
|
||||||
|
return HashMap(key=c_int64, value=c_int64, max_entries=1)
|
||||||
|
|
||||||
|
|
||||||
|
@bpf
|
||||||
|
@section("xdp")
|
||||||
|
def hello_world(ctx: struct_xdp_md) -> c_int64:
|
||||||
|
key = 0
|
||||||
|
one = 1
|
||||||
|
prev = count().lookup(key)
|
||||||
|
if prev:
|
||||||
|
prevval = prev + 1
|
||||||
|
print(f"count: {prevval}")
|
||||||
|
count().update(key, prevval)
|
||||||
|
return XDP_PASS
|
||||||
|
else:
|
||||||
|
count().update(key, one)
|
||||||
|
|
||||||
|
return XDP_PASS
|
||||||
|
|
||||||
|
|
||||||
|
@bpf
|
||||||
|
@bpfglobal
|
||||||
|
def LICENSE() -> str:
|
||||||
|
return "GPL"
|
||||||
|
|
||||||
|
|
||||||
|
compile_to_ir("xdp_pass.py", "xdp_pass.ll")
|
||||||
@ -1,69 +0,0 @@
|
|||||||
from pythonbpf import bpf, map, section, bpfglobal, compile, struct
|
|
||||||
from ctypes import c_void_p, c_int64, c_int32, c_uint64
|
|
||||||
from pythonbpf.maps import HashMap
|
|
||||||
from pythonbpf.helper import ktime
|
|
||||||
|
|
||||||
|
|
||||||
# NOTE: This is a comprehensive test combining struct, helper, and map features
|
|
||||||
# Please note that at line 50, though we have used an absurd expression to test
|
|
||||||
# the compiler, it is recommended to use named variables to reduce the amount of
|
|
||||||
# scratch space that needs to be allocated.
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@struct
|
|
||||||
class data_t:
|
|
||||||
pid: c_uint64
|
|
||||||
ts: c_uint64
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@map
|
|
||||||
def last() -> HashMap:
|
|
||||||
return HashMap(key=c_uint64, value=c_uint64, max_entries=3)
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@section("tracepoint/syscalls/sys_enter_execve")
|
|
||||||
def hello_world(ctx: c_void_p) -> c_int64:
|
|
||||||
dat = data_t()
|
|
||||||
dat.pid = 123
|
|
||||||
dat.pid = dat.pid + 1
|
|
||||||
print(f"pid is {dat.pid}")
|
|
||||||
tu = 9
|
|
||||||
last.update(0, tu)
|
|
||||||
last.update(1, -last.lookup(0))
|
|
||||||
x = last.lookup(0)
|
|
||||||
print(f"Map value at index 0: {x}")
|
|
||||||
x = x + c_int32(1)
|
|
||||||
print(f"x after adding 32-bit 1 is {x}")
|
|
||||||
x = ktime() - 121
|
|
||||||
print(f"ktime - 121 is {x}")
|
|
||||||
x = last.lookup(0)
|
|
||||||
x = x + 1
|
|
||||||
print(f"x is {x}")
|
|
||||||
if x == 10:
|
|
||||||
jat = data_t()
|
|
||||||
jat.ts = 456
|
|
||||||
print(f"Hello, World!, ts is {jat.ts}")
|
|
||||||
a = last.lookup(0)
|
|
||||||
print(f"a is {a}")
|
|
||||||
last.update(9, 9)
|
|
||||||
last.update(0, last.lookup(last.lookup(0)) +
|
|
||||||
last.lookup(last.lookup(0)) + last.lookup(last.lookup(0)))
|
|
||||||
z = last.lookup(0)
|
|
||||||
print(f"new map val at index 0 is {z}")
|
|
||||||
else:
|
|
||||||
a = last.lookup(0)
|
|
||||||
print("Goodbye, World!")
|
|
||||||
c = last.lookup(1 - 1)
|
|
||||||
print(f"c is {c}")
|
|
||||||
return
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@bpfglobal
|
|
||||||
def LICENSE() -> str:
|
|
||||||
return "GPL"
|
|
||||||
|
|
||||||
|
|
||||||
compile()
|
|
||||||
@ -1,27 +0,0 @@
|
|||||||
from pythonbpf import bpf, section, bpfglobal, compile
|
|
||||||
from ctypes import c_void_p, c_int64
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@section("tracepoint/syscalls/sys_enter_execve")
|
|
||||||
def hello_world(ctx: c_void_p) -> c_int64:
|
|
||||||
x = 1
|
|
||||||
print(f"Initial x: {x}")
|
|
||||||
a = 20
|
|
||||||
x = a
|
|
||||||
print(f"Updated x with a: {x}")
|
|
||||||
x = (x + x) * 3
|
|
||||||
if x == 2:
|
|
||||||
print("Hello, World!")
|
|
||||||
else:
|
|
||||||
print(f"Goodbye, World! {x}")
|
|
||||||
return
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@bpfglobal
|
|
||||||
def LICENSE() -> str:
|
|
||||||
return "GPL"
|
|
||||||
|
|
||||||
|
|
||||||
compile()
|
|
||||||
@ -1,34 +0,0 @@
|
|||||||
from pythonbpf import bpf, map, section, bpfglobal, compile
|
|
||||||
from ctypes import c_void_p, c_int64, c_uint64
|
|
||||||
from pythonbpf.maps import HashMap
|
|
||||||
|
|
||||||
# NOTE: An example of i64** assignment with binops on the RHS
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@map
|
|
||||||
def last() -> HashMap:
|
|
||||||
return HashMap(key=c_uint64, value=c_uint64, max_entries=3)
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@section("tracepoint/syscalls/sys_enter_execve")
|
|
||||||
def hello_world(ctx: c_void_p) -> c_int64:
|
|
||||||
last.update(0, 1)
|
|
||||||
x = last.lookup(0)
|
|
||||||
print(f"{x}")
|
|
||||||
x = x + 1
|
|
||||||
if x == 2:
|
|
||||||
print("Hello, World!")
|
|
||||||
else:
|
|
||||||
print("Goodbye, World!")
|
|
||||||
return
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@bpfglobal
|
|
||||||
def LICENSE() -> str:
|
|
||||||
return "GPL"
|
|
||||||
|
|
||||||
|
|
||||||
compile()
|
|
||||||
@ -1,40 +0,0 @@
|
|||||||
from pythonbpf import bpf, section, bpfglobal, compile, struct
|
|
||||||
from ctypes import c_void_p, c_int64, c_uint64
|
|
||||||
from pythonbpf.helper import ktime
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@struct
|
|
||||||
class data_t:
|
|
||||||
pid: c_uint64
|
|
||||||
ts: c_uint64
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@section("tracepoint/syscalls/sys_enter_execve")
|
|
||||||
def hello_world(ctx: c_void_p) -> c_int64:
|
|
||||||
dat = data_t()
|
|
||||||
dat.pid = 123
|
|
||||||
dat.pid = dat.pid + 1
|
|
||||||
print(f"pid is {dat.pid}")
|
|
||||||
x = ktime() - 121
|
|
||||||
print(f"ktime is {x}")
|
|
||||||
x = 1
|
|
||||||
x = x + 1
|
|
||||||
print(f"x is {x}")
|
|
||||||
if x == 2:
|
|
||||||
jat = data_t()
|
|
||||||
jat.ts = 456
|
|
||||||
print(f"Hello, World!, ts is {jat.ts}")
|
|
||||||
else:
|
|
||||||
print("Goodbye, World!")
|
|
||||||
return
|
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
|
||||||
@bpfglobal
|
|
||||||
def LICENSE() -> str:
|
|
||||||
return "GPL"
|
|
||||||
|
|
||||||
|
|
||||||
compile()
|
|
||||||
@ -6,8 +6,8 @@ from ctypes import c_void_p, c_int32
|
|||||||
@section("tracepoint/syscalls/sys_enter_execve")
|
@section("tracepoint/syscalls/sys_enter_execve")
|
||||||
def hello_world(ctx: c_void_p) -> c_int32:
|
def hello_world(ctx: c_void_p) -> c_int32:
|
||||||
print("Hello, World!")
|
print("Hello, World!")
|
||||||
a = 1 # int64
|
a = 1 # int64
|
||||||
return c_int32(a) # typecast to int32
|
return c_int32(a) # typecast to int32
|
||||||
|
|
||||||
|
|
||||||
@bpf
|
@bpf
|
||||||
|
|||||||
@ -26,8 +26,13 @@ import tempfile
|
|||||||
|
|
||||||
|
|
||||||
class BTFConverter:
|
class BTFConverter:
|
||||||
def __init__(self, btf_source="/sys/kernel/btf/vmlinux", output_file="vmlinux.py",
|
def __init__(
|
||||||
keep_intermediate=False, verbose=False):
|
self,
|
||||||
|
btf_source="/sys/kernel/btf/vmlinux",
|
||||||
|
output_file="vmlinux.py",
|
||||||
|
keep_intermediate=False,
|
||||||
|
verbose=False,
|
||||||
|
):
|
||||||
self.btf_source = btf_source
|
self.btf_source = btf_source
|
||||||
self.output_file = output_file
|
self.output_file = output_file
|
||||||
self.keep_intermediate = keep_intermediate
|
self.keep_intermediate = keep_intermediate
|
||||||
@ -44,11 +49,7 @@ class BTFConverter:
|
|||||||
self.log(f"{description}...")
|
self.log(f"{description}...")
|
||||||
try:
|
try:
|
||||||
result = subprocess.run(
|
result = subprocess.run(
|
||||||
cmd,
|
cmd, shell=True, check=True, capture_output=True, text=True
|
||||||
shell=True,
|
|
||||||
check=True,
|
|
||||||
capture_output=True,
|
|
||||||
text=True
|
|
||||||
)
|
)
|
||||||
if self.verbose and result.stdout:
|
if self.verbose and result.stdout:
|
||||||
print(result.stdout)
|
print(result.stdout)
|
||||||
@ -69,51 +70,55 @@ class BTFConverter:
|
|||||||
"""Step 1.5: Preprocess enum definitions."""
|
"""Step 1.5: Preprocess enum definitions."""
|
||||||
self.log("Preprocessing enum definitions...")
|
self.log("Preprocessing enum definitions...")
|
||||||
|
|
||||||
with open(input_file, 'r') as f:
|
with open(input_file, "r") as f:
|
||||||
original_code = f.read()
|
original_code = f.read()
|
||||||
|
|
||||||
# Extract anonymous enums
|
# Extract anonymous enums
|
||||||
enums = re.findall(
|
enums = re.findall(
|
||||||
r'(?<!typedef\s)(enum\s*\{[^}]*\})\s*(\w+)\s*(?::\s*\d+)?\s*;',
|
r"(?<!typedef\s)(enum\s*\{[^}]*\})\s*(\w+)\s*(?::\s*\d+)?\s*;",
|
||||||
original_code
|
original_code,
|
||||||
)
|
)
|
||||||
enum_defs = [enum_block + ';' for enum_block, _ in enums]
|
enum_defs = [enum_block + ";" for enum_block, _ in enums]
|
||||||
|
|
||||||
# Replace anonymous enums with int declarations
|
# Replace anonymous enums with int declarations
|
||||||
processed_code = re.sub(
|
processed_code = re.sub(
|
||||||
r'(?<!typedef\s)enum\s*\{[^}]*\}\s*(\w+)\s*(?::\s*\d+)?\s*;',
|
r"(?<!typedef\s)enum\s*\{[^}]*\}\s*(\w+)\s*(?::\s*\d+)?\s*;",
|
||||||
r'int \1;',
|
r"int \1;",
|
||||||
original_code
|
original_code,
|
||||||
)
|
)
|
||||||
|
|
||||||
# Prepend enum definitions
|
# Prepend enum definitions
|
||||||
if enum_defs:
|
if enum_defs:
|
||||||
enum_text = '\n'.join(enum_defs) + '\n\n'
|
enum_text = "\n".join(enum_defs) + "\n\n"
|
||||||
processed_code = enum_text + processed_code
|
processed_code = enum_text + processed_code
|
||||||
|
|
||||||
output_file = os.path.join(self.temp_dir, "vmlinux_processed.h")
|
output_file = os.path.join(self.temp_dir, "vmlinux_processed.h")
|
||||||
with open(output_file, 'w') as f:
|
with open(output_file, "w") as f:
|
||||||
f.write(processed_code)
|
f.write(processed_code)
|
||||||
|
|
||||||
return output_file
|
return output_file
|
||||||
|
|
||||||
def step2_5_process_kioctx(self, input_file):
|
def step2_5_process_kioctx(self, input_file):
|
||||||
#TODO: this is a very bad bug and design decision. A single struct has an issue mostly.
|
# TODO: this is a very bad bug and design decision. A single struct has an issue mostly.
|
||||||
"""Step 2.5: Process struct kioctx to extract nested anonymous structs."""
|
"""Step 2.5: Process struct kioctx to extract nested anonymous structs."""
|
||||||
self.log("Processing struct kioctx nested structs...")
|
self.log("Processing struct kioctx nested structs...")
|
||||||
|
|
||||||
with open(input_file, 'r') as f:
|
with open(input_file, "r") as f:
|
||||||
content = f.read()
|
content = f.read()
|
||||||
|
|
||||||
# Pattern to match struct kioctx with its full body (handles multiple nesting levels)
|
# Pattern to match struct kioctx with its full body (handles multiple nesting levels)
|
||||||
kioctx_pattern = r'struct\s+kioctx\s*\{(?:[^{}]|\{(?:[^{}]|\{[^{}]*\})*\})*\}\s*;'
|
kioctx_pattern = (
|
||||||
|
r"struct\s+kioctx\s*\{(?:[^{}]|\{(?:[^{}]|\{[^{}]*\})*\})*\}\s*;"
|
||||||
|
)
|
||||||
|
|
||||||
def process_kioctx_replacement(match):
|
def process_kioctx_replacement(match):
|
||||||
full_struct = match.group(0)
|
full_struct = match.group(0)
|
||||||
self.log(f"Found struct kioctx, length: {len(full_struct)} chars")
|
self.log(f"Found struct kioctx, length: {len(full_struct)} chars")
|
||||||
|
|
||||||
# Extract the struct body (everything between outermost { and })
|
# Extract the struct body (everything between outermost { and })
|
||||||
body_match = re.search(r'struct\s+kioctx\s*\{(.*)\}\s*;', full_struct, re.DOTALL)
|
body_match = re.search(
|
||||||
|
r"struct\s+kioctx\s*\{(.*)\}\s*;", full_struct, re.DOTALL
|
||||||
|
)
|
||||||
if not body_match:
|
if not body_match:
|
||||||
return full_struct
|
return full_struct
|
||||||
|
|
||||||
@ -121,7 +126,7 @@ class BTFConverter:
|
|||||||
|
|
||||||
# Find all anonymous structs within the body
|
# Find all anonymous structs within the body
|
||||||
# Pattern: struct { ... } followed by ; (not a member name)
|
# Pattern: struct { ... } followed by ; (not a member name)
|
||||||
anon_struct_pattern = r'struct\s*\{[^}]*\}'
|
# anon_struct_pattern = r"struct\s*\{[^}]*\}"
|
||||||
|
|
||||||
anon_structs = []
|
anon_structs = []
|
||||||
anon_counter = 4 # Start from 4, counting down to 1
|
anon_counter = 4 # Start from 4, counting down to 1
|
||||||
@ -131,7 +136,9 @@ class BTFConverter:
|
|||||||
anon_struct_content = m.group(0)
|
anon_struct_content = m.group(0)
|
||||||
|
|
||||||
# Extract the body of the anonymous struct
|
# Extract the body of the anonymous struct
|
||||||
anon_body_match = re.search(r'struct\s*\{(.*)\}', anon_struct_content, re.DOTALL)
|
anon_body_match = re.search(
|
||||||
|
r"struct\s*\{(.*)\}", anon_struct_content, re.DOTALL
|
||||||
|
)
|
||||||
if not anon_body_match:
|
if not anon_body_match:
|
||||||
return anon_struct_content
|
return anon_struct_content
|
||||||
|
|
||||||
@ -154,7 +161,7 @@ class BTFConverter:
|
|||||||
processed_body = body
|
processed_body = body
|
||||||
|
|
||||||
# Find all occurrences and process them
|
# Find all occurrences and process them
|
||||||
pattern_with_semicolon = r'struct\s*\{([^}]*)\}\s*;'
|
pattern_with_semicolon = r"struct\s*\{([^}]*)\}\s*;"
|
||||||
matches = list(re.finditer(pattern_with_semicolon, body, re.DOTALL))
|
matches = list(re.finditer(pattern_with_semicolon, body, re.DOTALL))
|
||||||
|
|
||||||
if not matches:
|
if not matches:
|
||||||
@ -178,14 +185,16 @@ class BTFConverter:
|
|||||||
|
|
||||||
# Replace in the body
|
# Replace in the body
|
||||||
replacement = f"struct {anon_name} {member_name};"
|
replacement = f"struct {anon_name} {member_name};"
|
||||||
processed_body = processed_body[:start_pos] + replacement + processed_body[end_pos:]
|
processed_body = (
|
||||||
|
processed_body[:start_pos] + replacement + processed_body[end_pos:]
|
||||||
|
)
|
||||||
|
|
||||||
anon_counter -= 1
|
anon_counter -= 1
|
||||||
|
|
||||||
# Rebuild the complete definition
|
# Rebuild the complete definition
|
||||||
if anon_structs:
|
if anon_structs:
|
||||||
# Prepend the anonymous struct definitions
|
# Prepend the anonymous struct definitions
|
||||||
anon_definitions = '\n'.join(anon_structs) + '\n\n'
|
anon_definitions = "\n".join(anon_structs) + "\n\n"
|
||||||
new_struct = f"struct kioctx {{{processed_body}}};"
|
new_struct = f"struct kioctx {{{processed_body}}};"
|
||||||
return anon_definitions + new_struct
|
return anon_definitions + new_struct
|
||||||
else:
|
else:
|
||||||
@ -193,14 +202,11 @@ class BTFConverter:
|
|||||||
|
|
||||||
# Apply the transformation
|
# Apply the transformation
|
||||||
processed_content = re.sub(
|
processed_content = re.sub(
|
||||||
kioctx_pattern,
|
kioctx_pattern, process_kioctx_replacement, content, flags=re.DOTALL
|
||||||
process_kioctx_replacement,
|
|
||||||
content,
|
|
||||||
flags=re.DOTALL
|
|
||||||
)
|
)
|
||||||
|
|
||||||
output_file = os.path.join(self.temp_dir, "vmlinux_kioctx_processed.h")
|
output_file = os.path.join(self.temp_dir, "vmlinux_kioctx_processed.h")
|
||||||
with open(output_file, 'w') as f:
|
with open(output_file, "w") as f:
|
||||||
f.write(processed_content)
|
f.write(processed_content)
|
||||||
|
|
||||||
self.log(f"Saved kioctx-processed output to {output_file}")
|
self.log(f"Saved kioctx-processed output to {output_file}")
|
||||||
@ -218,7 +224,7 @@ class BTFConverter:
|
|||||||
output_file = os.path.join(self.temp_dir, "vmlinux_raw.py")
|
output_file = os.path.join(self.temp_dir, "vmlinux_raw.py")
|
||||||
cmd = (
|
cmd = (
|
||||||
f"clang2py {input_file} -o {output_file} "
|
f"clang2py {input_file} -o {output_file} "
|
||||||
f"--clang-args=\"-fno-ms-extensions -I/usr/include -I/usr/include/linux\""
|
f'--clang-args="-fno-ms-extensions -I/usr/include -I/usr/include/linux"'
|
||||||
)
|
)
|
||||||
self.run_command(cmd, "Converting to Python ctypes")
|
self.run_command(cmd, "Converting to Python ctypes")
|
||||||
return output_file
|
return output_file
|
||||||
@ -234,14 +240,21 @@ class BTFConverter:
|
|||||||
data = re.sub(r"\('_[0-9]+',\s*ctypes\.[a-zA-Z0-9_]+,\s*0\),?\s*\n?", "", data)
|
data = re.sub(r"\('_[0-9]+',\s*ctypes\.[a-zA-Z0-9_]+,\s*0\),?\s*\n?", "", data)
|
||||||
|
|
||||||
# Replace ('_20', ctypes.c_uint64, 64) → ('_20', ctypes.c_uint64)
|
# Replace ('_20', ctypes.c_uint64, 64) → ('_20', ctypes.c_uint64)
|
||||||
data = re.sub(r"\('(_[0-9]+)',\s*(ctypes\.[a-zA-Z0-9_]+),\s*[0-9]+\)", r"('\1', \2)", data)
|
data = re.sub(
|
||||||
|
r"\('(_[0-9]+)',\s*(ctypes\.[a-zA-Z0-9_]+),\s*[0-9]+\)", r"('\1', \2)", data
|
||||||
|
)
|
||||||
|
|
||||||
# Replace ('_20', ctypes.c_char, 8) with ('_20', ctypes.c_uint8, 8)
|
# Replace ('_20', ctypes.c_char, 8) with ('_20', ctypes.c_uint8, 8)
|
||||||
data = re.sub(
|
data = re.sub(r"(ctypes\.c_char)(\s*,\s*\d+\))", r"ctypes.c_uint8\2", data)
|
||||||
r"(ctypes\.c_char)(\s*,\s*\d+\))",
|
|
||||||
r"ctypes.c_uint8\2",
|
# below to replace those c_bool with bitfield greater than 8
|
||||||
data
|
def repl(m):
|
||||||
)
|
name, bits = m.groups()
|
||||||
|
return (
|
||||||
|
f"('{name}', ctypes.c_uint32, {bits})" if int(bits) > 8 else m.group(0)
|
||||||
|
)
|
||||||
|
|
||||||
|
data = re.sub(r"\('([^']+)',\s*ctypes\.c_bool,\s*(\d+)\)", repl, data)
|
||||||
|
|
||||||
# Remove ctypes. prefix from invalid entries
|
# Remove ctypes. prefix from invalid entries
|
||||||
invalid_ctypes = ["bpf_iter_state", "_cache_type", "fs_context_purpose"]
|
invalid_ctypes = ["bpf_iter_state", "_cache_type", "fs_context_purpose"]
|
||||||
@ -258,6 +271,7 @@ class BTFConverter:
|
|||||||
if not self.keep_intermediate and self.temp_dir != ".":
|
if not self.keep_intermediate and self.temp_dir != ".":
|
||||||
self.log(f"Cleaning up temporary directory: {self.temp_dir}")
|
self.log(f"Cleaning up temporary directory: {self.temp_dir}")
|
||||||
import shutil
|
import shutil
|
||||||
|
|
||||||
shutil.rmtree(self.temp_dir, ignore_errors=True)
|
shutil.rmtree(self.temp_dir, ignore_errors=True)
|
||||||
|
|
||||||
def convert(self):
|
def convert(self):
|
||||||
@ -281,6 +295,7 @@ class BTFConverter:
|
|||||||
except Exception as e:
|
except Exception as e:
|
||||||
print(f"\n✗ Error during conversion: {e}", file=sys.stderr)
|
print(f"\n✗ Error during conversion: {e}", file=sys.stderr)
|
||||||
import traceback
|
import traceback
|
||||||
|
|
||||||
traceback.print_exc()
|
traceback.print_exc()
|
||||||
sys.exit(1)
|
sys.exit(1)
|
||||||
finally:
|
finally:
|
||||||
@ -293,18 +308,13 @@ class BTFConverter:
|
|||||||
dependencies = {
|
dependencies = {
|
||||||
"bpftool": "bpftool --version",
|
"bpftool": "bpftool --version",
|
||||||
"clang": "clang --version",
|
"clang": "clang --version",
|
||||||
"clang2py": "clang2py --version"
|
"clang2py": "clang2py --version",
|
||||||
}
|
}
|
||||||
|
|
||||||
missing = []
|
missing = []
|
||||||
for tool, cmd in dependencies.items():
|
for tool, cmd in dependencies.items():
|
||||||
try:
|
try:
|
||||||
subprocess.run(
|
subprocess.run(cmd, shell=True, check=True, capture_output=True)
|
||||||
cmd,
|
|
||||||
shell=True,
|
|
||||||
check=True,
|
|
||||||
capture_output=True
|
|
||||||
)
|
|
||||||
except subprocess.CalledProcessError:
|
except subprocess.CalledProcessError:
|
||||||
missing.append(tool)
|
missing.append(tool)
|
||||||
|
|
||||||
@ -326,31 +336,31 @@ Examples:
|
|||||||
%(prog)s
|
%(prog)s
|
||||||
%(prog)s -o kernel_types.py
|
%(prog)s -o kernel_types.py
|
||||||
%(prog)s --btf-source /sys/kernel/btf/custom_module -k -v
|
%(prog)s --btf-source /sys/kernel/btf/custom_module -k -v
|
||||||
"""
|
""",
|
||||||
)
|
)
|
||||||
|
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"--btf-source",
|
"--btf-source",
|
||||||
default="/sys/kernel/btf/vmlinux",
|
default="/sys/kernel/btf/vmlinux",
|
||||||
help="Path to BTF source (default: /sys/kernel/btf/vmlinux)"
|
help="Path to BTF source (default: /sys/kernel/btf/vmlinux)",
|
||||||
)
|
)
|
||||||
|
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"-o", "--output",
|
"-o",
|
||||||
|
"--output",
|
||||||
default="vmlinux.py",
|
default="vmlinux.py",
|
||||||
help="Output Python file (default: vmlinux.py)"
|
help="Output Python file (default: vmlinux.py)",
|
||||||
)
|
)
|
||||||
|
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"-k", "--keep-intermediate",
|
"-k",
|
||||||
|
"--keep-intermediate",
|
||||||
action="store_true",
|
action="store_true",
|
||||||
help="Keep intermediate files (vmlinux.h, vmlinux_processed.h, etc.)"
|
help="Keep intermediate files (vmlinux.h, vmlinux_processed.h, etc.)",
|
||||||
)
|
)
|
||||||
|
|
||||||
parser.add_argument(
|
parser.add_argument(
|
||||||
"-v", "--verbose",
|
"-v", "--verbose", action="store_true", help="Enable verbose output"
|
||||||
action="store_true",
|
|
||||||
help="Enable verbose output"
|
|
||||||
)
|
)
|
||||||
|
|
||||||
args = parser.parse_args()
|
args = parser.parse_args()
|
||||||
@ -359,7 +369,7 @@ Examples:
|
|||||||
btf_source=args.btf_source,
|
btf_source=args.btf_source,
|
||||||
output_file=args.output,
|
output_file=args.output,
|
||||||
keep_intermediate=args.keep_intermediate,
|
keep_intermediate=args.keep_intermediate,
|
||||||
verbose=args.verbose
|
verbose=args.verbose,
|
||||||
)
|
)
|
||||||
|
|
||||||
converter.convert()
|
converter.convert()
|
||||||
|
|||||||
Reference in New Issue
Block a user