Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat: adds msgspec back in as it now supports python 3.13 #77

Open
wants to merge 2 commits into
base: main
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
370 changes: 188 additions & 182 deletions evm_trace/vmtrace.py
Original file line number Diff line number Diff line change
@@ -1,186 +1,192 @@
from __future__ import annotations

import sys

# msgspec does not currently build on python 3.13 so hide it behind a version check
if sys.version_info < (3, 13):

from collections.abc import Iterator
from typing import Any

from eth.vm.memory import Memory
from eth.vm.stack import Stack
from eth_pydantic_types import Address, HexBytes
from eth_utils import to_int
from msgspec import Struct
from msgspec.json import Decoder

# opcodes grouped by the number of items they pop from the stack
# fmt: off
POP_OPCODES = {
1: ["EXTCODEHASH", "ISZERO", "NOT", "BALANCE", "CALLDATALOAD", "EXTCODESIZE", "BLOCKHASH", "POP", "MLOAD", "SLOAD", "JUMP", "SELFDESTRUCT"], # noqa: E501
2: ["SHL", "SHR", "SAR", "REVERT", "ADD", "MUL", "SUB", "DIV", "SDIV", "MOD", "SMOD", "EXP", "SIGNEXTEND", "LT", "GT", "SLT", "SGT", "EQ", "AND", "XOR", "OR", "BYTE", "SHA3", "KECCAK256", "MSTORE", "MSTORE8", "SSTORE", "JUMPI", "RETURN"], # noqa: E501
3: ["RETURNDATACOPY", "ADDMOD", "MULMOD", "CALLDATACOPY", "CODECOPY", "CREATE"],
4: ["CREATE2", "EXTCODECOPY"],
6: ["STATICCALL", "DELEGATECALL"],
7: ["CALL", "CALLCODE"]
}
# fmt: on
POPCODES = {op: n for n, opcodes in POP_OPCODES.items() for op in opcodes}
POPCODES.update({f"LOG{n}": n + 2 for n in range(0, 5)})
POPCODES.update({f"SWAP{i}": i + 1 for i in range(1, 17)})
POPCODES.update({f"DUP{i}": i for i in range(1, 17)})

class uint256(int):
pass

class VMTrace(Struct):
code: HexBytes
"""The code to be executed."""
ops: list[VMOperation]
"""The operations executed."""

class VMOperation(Struct):
pc: int
"""The program counter."""
cost: int
"""The gas cost for this instruction."""
ex: VMExecutedOperation | None
"""Information concerning the execution of the operation."""
sub: VMTrace | None
"""Subordinate trace of the CALL/CREATE if applicable."""
op: str
"""Opcode that is being called."""
idx: str
"""Index in the tree."""

class VMExecutedOperation(Struct):
used: int
"""The amount of remaining gas."""
push: list[HexBytes]
"""The stack item placed, if any."""
mem: MemoryDiff | None
"""If altered, the memory delta."""
store: StorageDiff | None
"""The altered storage value, if any."""

class MemoryDiff(Struct):
off: int
"""Offset into memory the change begins."""
data: HexBytes
"""The changed data."""

class StorageDiff(Struct):
key: uint256
"""Which key in storage is changed."""
val: uint256
"""What the value has been changed to."""

class VMTraceFrame(Struct):
"""
A synthetic trace frame representing the state at a step of execution.
"""

address: str
pc: int
op: str
depth: int
stack: list[int]
memory: bytes | memoryview
storage: dict[int, int]

def to_trace_frames(
trace: VMTrace,
depth: int = 1,
address: str = "",
copy_memory: bool = True,
) -> Iterator[VMTraceFrame]:
"""
Replays a VMTrace and yields trace frames at each step of the execution.
Can be used as a much faster drop-in replacement for Geth-style traces.

Args:
trace (VMTrace): A decoded trace from a `trace_` rpc.
depth (int): A depth of the call being processed. automatically populated.
address (str): The address of the contract being executed. auto populated
except the root call.
copy_memory (bool): Whether to copy memory when returning trace frames.
Disable for a speedup when dealing with traces using a large amount of memory.
when disabled, `VMTraceFrame.memory` becomes `memoryview` instead of `bytes`, which
works like a pointer at the memory `bytearray`. this means you must process the
frames immediately, otherwise you risk memory value mutating further into execution.

Returns:
Iterator[VMTraceFrame]: An iterator of synthetic traces which can be used as a drop-in
replacement for Geth-style traces. also contains the address of the current contract
context.
"""
memory = Memory()
stack = Stack()
storage: dict[int, int] = {}
call_address = ""
read_memory = memory.read_bytes if copy_memory else memory.read

for op in trace.ops:
if op.ex and op.ex.mem:
memory.extend(op.ex.mem.off, len(op.ex.mem.data))

# geth convention is to return after memory expansion, but before operation is applied
yield VMTraceFrame(
address=address,
pc=op.pc,
op=op.op,
depth=depth,
stack=[to_int(val) for val in stack.values],
memory=read_memory(0, len(memory)),
storage=storage.copy(),
from collections.abc import Iterator
from typing import Any

from eth.vm.memory import Memory
from eth.vm.stack import Stack
from eth_pydantic_types import Address, HexBytes
from eth_utils import to_int
from msgspec import Struct
from msgspec.json import Decoder

# opcodes grouped by the number of items they pop from the stack
# fmt: off
POP_OPCODES = {
1: ["EXTCODEHASH", "ISZERO", "NOT", "BALANCE", "CALLDATALOAD", "EXTCODESIZE", "BLOCKHASH", "POP", "MLOAD", "SLOAD", "JUMP", "SELFDESTRUCT"], # noqa: E501
2: ["SHL", "SHR", "SAR", "REVERT", "ADD", "MUL", "SUB", "DIV", "SDIV", "MOD", "SMOD", "EXP", "SIGNEXTEND", "LT", "GT", "SLT", "SGT", "EQ", "AND", "XOR", "OR", "BYTE", "SHA3", "KECCAK256", "MSTORE", "MSTORE8", "SSTORE", "JUMPI", "RETURN"], # noqa: E501
3: ["RETURNDATACOPY", "ADDMOD", "MULMOD", "CALLDATACOPY", "CODECOPY", "CREATE"],
4: ["CREATE2", "EXTCODECOPY"],
6: ["STATICCALL", "DELEGATECALL"],
7: ["CALL", "CALLCODE"]
}
# fmt: on
POPCODES = {op: n for n, opcodes in POP_OPCODES.items() for op in opcodes}
POPCODES.update({f"LOG{n}": n + 2 for n in range(0, 5)})
POPCODES.update({f"SWAP{i}": i + 1 for i in range(1, 17)})
POPCODES.update({f"DUP{i}": i for i in range(1, 17)})


class uint256(int):
pass


class VMTrace(Struct):
code: HexBytes
"""The code to be executed."""
ops: list[VMOperation]
"""The operations executed."""


class VMOperation(Struct):
pc: int
"""The program counter."""
cost: int
"""The gas cost for this instruction."""
ex: VMExecutedOperation | None
"""Information concerning the execution of the operation."""
sub: VMTrace | None
"""Subordinate trace of the CALL/CREATE if applicable."""
op: str
"""Opcode that is being called."""
idx: str
"""Index in the tree."""


class VMExecutedOperation(Struct):
used: int
"""The amount of remaining gas."""
push: list[HexBytes]
"""The stack item placed, if any."""
mem: MemoryDiff | None
"""If altered, the memory delta."""
store: StorageDiff | None
"""The altered storage value, if any."""


class MemoryDiff(Struct):
off: int
"""Offset into memory the change begins."""
data: HexBytes
"""The changed data."""


class StorageDiff(Struct):
key: uint256
"""Which key in storage is changed."""
val: uint256
"""What the value has been changed to."""


class VMTraceFrame(Struct):
"""
A synthetic trace frame representing the state at a step of execution.
"""

address: str
pc: int
op: str
depth: int
stack: list[int]
memory: bytes | memoryview
storage: dict[int, int]


def to_trace_frames(
trace: VMTrace,
depth: int = 1,
address: str = "",
copy_memory: bool = True,
) -> Iterator[VMTraceFrame]:
"""
Replays a VMTrace and yields trace frames at each step of the execution.
Can be used as a much faster drop-in replacement for Geth-style traces.

Args:
trace (VMTrace): A decoded trace from a `trace_` rpc.
depth (int): A depth of the call being processed. automatically populated.
address (str): The address of the contract being executed. auto populated
except the root call.
copy_memory (bool): Whether to copy memory when returning trace frames.
Disable for a speedup when dealing with traces using a large amount of memory.
when disabled, `VMTraceFrame.memory` becomes `memoryview` instead of `bytes`, which
works like a pointer at the memory `bytearray`. this means you must process the
frames immediately, otherwise you risk memory value mutating further into execution.

Returns:
Iterator[VMTraceFrame]: An iterator of synthetic traces which can be used as a drop-in
replacement for Geth-style traces. also contains the address of the current contract
context.
"""
memory = Memory()
stack = Stack()
storage: dict[int, int] = {}
call_address = ""
read_memory = memory.read_bytes if copy_memory else memory.read

for op in trace.ops:
if op.ex and op.ex.mem:
memory.extend(op.ex.mem.off, len(op.ex.mem.data))

# geth convention is to return after memory expansion, but before the operation is applied
yield VMTraceFrame(
address=address,
pc=op.pc,
op=op.op,
depth=depth,
stack=[to_int(val) for val in stack.values],
memory=read_memory(0, len(memory)),
storage=storage.copy(),
)

if op.op in ["CALL", "DELEGATECALL", "STATICCALL"]:
call_address = Address.__eth_pydantic_validate__(stack.values[-2])

if op.ex:
if op.ex.mem:
memory.write(op.ex.mem.off, len(op.ex.mem.data), op.ex.mem.data)

num_pop = POPCODES.get(op.op)
if num_pop:
stack.pop_any(num_pop)

for item in op.ex.push:
stack.push_bytes(item)

# erigon bug: https://github.com/ledgerwatch/erigon/pull/7970
if op.op == "PUSH0" and not op.ex.push:
stack.push_int(0)

if op.ex.store:
storage[op.ex.store.key] = op.ex.store.val

if op.sub:
yield from to_trace_frames(
op.sub, depth=depth + 1, address=call_address, copy_memory=copy_memory
)

if op.op in ["CALL", "DELEGATECALL", "STATICCALL"]:
call_address = Address.__eth_pydantic_validate__(stack.values[-2])

if op.ex:
if op.ex.mem:
memory.write(op.ex.mem.off, len(op.ex.mem.data), op.ex.mem.data)

num_pop = POPCODES.get(op.op)
if num_pop:
stack.pop_any(num_pop)

for item in op.ex.push:
stack.push_bytes(item)

# erigon bug: https://github.com/ledgerwatch/erigon/pull/7970
if op.op == "PUSH0" and not op.ex.push:
stack.push_int(0)

if op.ex.store:
storage[op.ex.store.key] = op.ex.store.val

if op.sub:
yield from to_trace_frames(
op.sub, depth=depth + 1, address=call_address, copy_memory=copy_memory
)

class RPCResponse(Struct):
result: RPCTraceResult | list[RPCTraceResult]

class RPCTraceResult(Struct):
trace: list | None
vmTrace: VMTrace
stateDiff: dict | None

def dec_hook(type: type, obj: Any) -> Any:
if type is uint256:
return uint256(obj, 16)
elif type is HexBytes:
return HexBytes(obj)

def from_rpc_response(buffer: bytes) -> VMTrace | list[VMTrace]:
"""
Decode structured data from a raw `trace_replayTransaction` or
`trace_replayBlockTransactions`.
"""
response = Decoder(RPCResponse, dec_hook=dec_hook).decode(buffer)
result: list[RPCTraceResult] | RPCTraceResult = response.result
return [i.vmTrace for i in result] if isinstance(result, list) else result.vmTrace

class RPCResponse(Struct):
result: RPCTraceResult | list[RPCTraceResult]


class RPCTraceResult(Struct):
trace: list | None
vmTrace: VMTrace
stateDiff: dict | None


def dec_hook(type: type, obj: Any) -> Any:
if type is uint256:
return uint256(obj, 16)
elif type is HexBytes:
return HexBytes(obj)


def from_rpc_response(buffer: bytes) -> VMTrace | list[VMTrace]:
"""
Decode structured data from a raw `trace_replayTransaction` or `trace_replayBlockTransactions`.
"""
response = Decoder(RPCResponse, dec_hook=dec_hook).decode(buffer)
result: list[RPCTraceResult] | RPCTraceResult = response.result
return [i.vmTrace for i in result] if isinstance(result, list) else result.vmTrace
2 changes: 1 addition & 1 deletion setup.py
Original file line number Diff line number Diff line change
Expand Up @@ -65,7 +65,7 @@
"cchecksum>=0.0.3,<1",
"eth-pydantic-types>=0.1.3,<0.2",
"eth-utils>=2.3.1,<6",
"msgspec>=0.8; python_version < '3.13'",
"msgspec>=0.8",
"pydantic>=2.5.2,<3",
"py-evm>=0.10.1b1,<0.11",
],
Expand Down
Loading