Module hebi.optimize.optimize_varlen
Expand source code
from ast import *
from copy import copy
from collections import defaultdict
from ..util import CompilingNodeTransformer, CompilingNodeVisitor
"""
Rewrites all variable names to a minimal length equivalent
"""
class NameCollector(CompilingNodeVisitor):
    """Tally how often each identifier occurs in a syntax tree.

    After a visit, ``vars`` maps every collected name to its number of
    occurrences. Counted are ``Name`` nodes, class names, function names and
    the entries of a function's ``args.args``. Class bodies and argument
    type hints are deliberately not inspected.
    """

    step = "Collecting occuring variable names"

    def __init__(self):
        # identifier -> number of occurrences seen so far
        self.vars = defaultdict(int)

    def _count(self, identifier):
        """Register one more occurrence of ``identifier``."""
        self.vars[identifier] += 1

    def visit_Name(self, node: Name) -> None:
        """Count a reference to a name."""
        self._count(node.id)

    def visit_ClassDef(self, node: ClassDef):
        """Count the class name only."""
        # the content (i.e. attribute names) of class definitions is ignored
        self._count(node.name)

    def visit_FunctionDef(self, node: FunctionDef):
        """Count the function name, its arguments, then walk its body."""
        self._count(node.name)
        # only the argument names are counted; type hints are ignored
        for argument in node.args.args:
            self._count(argument.arg)
        for statement in node.body:
            self.visit(statement)
def bs_from_int(i: int):
    """Encode an integer as a big-endian byte string via its hex digits.

    The integer is rendered in lowercase hexadecimal, left-padded with one
    zero when the digit count is odd, and decoded into ``bytes``. Zero thus
    yields a single zero byte.
    """
    digits = format(i, "x")
    # bytes.fromhex only accepts whole bytes, i.e. an even number of digits
    padding = "0" * (len(digits) % 2)
    return bytes.fromhex(padding + digits)
class OptimizeVarlen(CompilingNodeTransformer):
    """Replace identifiers with minimal-length byte-string names.

    ``visit_Module`` counts all names with ``NameCollector`` and assigns each
    one the result of ``bs_from_int`` applied to its rank by descending
    occurrence count. Rewritten nodes are shallow copies of the originals;
    the previous name is kept on the copy as ``orig_id`` / ``orig_name`` /
    ``orig_arg``.
    """

    step = "Reducing the length of variable names"

    # original name -> replacement bytes; filled in by visit_Module
    varmap = None

    def visit_Module(self, node: Module) -> Module:
        """Build the renaming table, then rewrite every top-level statement."""
        counter = NameCollector()
        counter.visit(node)
        usage = counter.vars
        # most used names come first and therefore get the shortest encodings
        by_frequency = sorted(usage, key=usage.get, reverse=True)
        self.varmap = {
            name: bs_from_int(rank) for rank, name in enumerate(by_frequency)
        }
        module = copy(node)
        module.body = [self.visit(statement) for statement in node.body]
        return module

    def visit_Name(self, node: Name) -> Name:
        """Return a copy of the name node carrying its shortened identifier."""
        original = node.id
        renamed = copy(node)
        renamed.id = self.varmap[original]
        renamed.orig_id = original
        return renamed

    def visit_ClassDef(self, node: ClassDef) -> ClassDef:
        """Return a copy of the class definition with a shortened name."""
        original = node.name
        renamed = copy(node)
        renamed.name = self.varmap[original]
        renamed.orig_name = original
        # the content of class definitions is ignored
        return renamed

    def _shortened_arg(self, argument):
        """Return a copy of a function argument with a shortened name."""
        original = argument.arg
        renamed = copy(argument)
        renamed.arg = self.varmap[original]
        renamed.orig_arg = original
        return renamed

    def visit_FunctionDef(self, node: FunctionDef) -> FunctionDef:
        """Return a copy of the function with name, arguments and body rewritten."""
        original = node.name
        renamed = copy(node)
        renamed.name = self.varmap[original]
        renamed.orig_name = original
        # copy the arguments container so the original node stays untouched
        renamed.args = copy(node.args)
        renamed.args.args = [self._shortened_arg(a) for a in node.args.args]
        renamed.body = [self.visit(statement) for statement in node.body]
        return renamed
Functions
def bs_from_int(i: int)-
Expand source code
def bs_from_int(i: int):
    """Encode an integer as a big-endian byte string via its hex digits.

    An odd number of hexadecimal digits is left-padded with one zero so the
    digits always form whole bytes.
    """
    digits = format(i, "x")
    padding = "0" * (len(digits) % 2)
    return bytes.fromhex(padding + digits)
Classes
class NameCollector-
A node visitor base class that walks the abstract syntax tree and calls a visitor function for every node found. This function may return a value which is forwarded by the `visit` method.
This class is meant to be subclassed, with the subclass adding visitor methods.
Per default the visitor functions for the nodes are `'visit_'` + class name of the node. So a `TryFinally` node visit function would be `visit_TryFinally`. This behavior can be changed by overriding the `visit` method. If no visitor function exists for a node (return value `None`) the `generic_visit` visitor is used instead.
Don't use the `NodeVisitor` if you want to apply changes to nodes during traversing. For this a special visitor exists (`NodeTransformer`) that allows modifications.
Expand source code
class NameCollector(CompilingNodeVisitor): step = "Collecting occuring variable names" def __init__(self): self.vars = defaultdict(int) def visit_Name(self, node: Name) -> None: self.vars[node.id] += 1 def visit_ClassDef(self, node: ClassDef): self.vars[node.name] += 1 # ignore the content (i.e. attribute names) of class definitions def visit_FunctionDef(self, node: FunctionDef): self.vars[node.name] += 1 for a in node.args.args: # ignore type hints self.vars[a.arg] += 1 for s in node.body: self.visit(s)Ancestors
- CompilingNodeVisitor
- TypedNodeVisitor
- ast.NodeVisitor
Class variables
var step
Methods
def visit(self, node)-
Inherited from:
CompilingNodeVisitor.visit
Visit a node.
def visit_ClassDef(self, node: _ast.ClassDef)-
Expand source code
def visit_ClassDef(self, node: ClassDef): self.vars[node.name] += 1 # ignore the content (i.e. attribute names) of class definitions def visit_FunctionDef(self, node: _ast.FunctionDef)-
Expand source code
def visit_FunctionDef(self, node: FunctionDef): self.vars[node.name] += 1 for a in node.args.args: # ignore type hints self.vars[a.arg] += 1 for s in node.body: self.visit(s) def visit_Name(self, node: _ast.Name) ‑> None-
Expand source code
def visit_Name(self, node: Name) -> None:
    """Count one occurrence of the identifier referenced by ``node``."""
    identifier = node.id
    self.vars[identifier] += 1
class OptimizeVarlen-
A :class:`NodeVisitor` subclass that walks the abstract syntax tree and allows modification of nodes.
The `NodeTransformer` will walk the AST and use the return value of the visitor methods to replace or remove the old node. If the return value of the visitor method is `None`, the node will be removed from its location, otherwise it is replaced with the return value. The return value may be the original node in which case no replacement takes place.
Here is an example transformer that rewrites all occurrences of name lookups (`foo`) to `data['foo']`::

    class RewriteName(NodeTransformer):
        def visit_Name(self, node):
            return Subscript(
                value=Name(id='data', ctx=Load()),
                slice=Index(value=Str(s=node.id)),
                ctx=node.ctx
            )

Keep in mind that if the node you're operating on has child nodes you must either transform the child nodes yourself or call the :meth:`generic_visit` method for the node first.
For nodes that were part of a collection of statements (that applies to all statement nodes), the visitor may also return a list of nodes rather than just a single node.
Usually you use the transformer like this::

    node = YourTransformer().visit(node)
Expand source code
class OptimizeVarlen(CompilingNodeTransformer): step = "Reducing the length of variable names" varmap = None def visit_Module(self, node: Module) -> Module: # collect all variable names collector = NameCollector() collector.visit(node) # sort by most used varmap = {} varnames = sorted(collector.vars.items(), key=lambda x: x[1], reverse=True) for i, (v, _) in enumerate(varnames): varmap[v] = bs_from_int(i) self.varmap = varmap node_cp = copy(node) node_cp.body = [self.visit(s) for s in node.body] return node_cp def visit_Name(self, node: Name) -> Name: nc = copy(node) nc.orig_id = node.id nc.id = self.varmap[node.id] return nc def visit_ClassDef(self, node: ClassDef) -> ClassDef: node_cp = copy(node) node_cp.orig_name = node.name node_cp.name = self.varmap[node.name] # ignore the content of class definitions return node_cp def visit_FunctionDef(self, node: FunctionDef) -> FunctionDef: node_cp = copy(node) node_cp.orig_name = node.name node_cp.name = self.varmap[node.name] node_cp.args = copy(node.args) node_cp.args.args = [] for a in node.args.args: a_cp = copy(a) a_cp.orig_arg = a.arg a_cp.arg = self.varmap[a.arg] node_cp.args.args.append(a_cp) node_cp.body = [self.visit(s) for s in node.body] return node_cpAncestors
- CompilingNodeTransformer
- TypedNodeTransformer
- ast.NodeTransformer
- ast.NodeVisitor
Class variables
var step
var varmap
Methods
def visit(self, node)-
Inherited from:
CompilingNodeTransformer.visit
Visit a node.
def visit_ClassDef(self, node: _ast.ClassDef) ‑> _ast.ClassDef-
Expand source code
def visit_ClassDef(self, node: ClassDef) -> ClassDef: node_cp = copy(node) node_cp.orig_name = node.name node_cp.name = self.varmap[node.name] # ignore the content of class definitions return node_cp def visit_FunctionDef(self, node: _ast.FunctionDef) ‑> _ast.FunctionDef-
Expand source code
def visit_FunctionDef(self, node: FunctionDef) -> FunctionDef: node_cp = copy(node) node_cp.orig_name = node.name node_cp.name = self.varmap[node.name] node_cp.args = copy(node.args) node_cp.args.args = [] for a in node.args.args: a_cp = copy(a) a_cp.orig_arg = a.arg a_cp.arg = self.varmap[a.arg] node_cp.args.args.append(a_cp) node_cp.body = [self.visit(s) for s in node.body] return node_cp def visit_Module(self, node: _ast.Module) ‑> _ast.Module-
Expand source code
def visit_Module(self, node: Module) -> Module: # collect all variable names collector = NameCollector() collector.visit(node) # sort by most used varmap = {} varnames = sorted(collector.vars.items(), key=lambda x: x[1], reverse=True) for i, (v, _) in enumerate(varnames): varmap[v] = bs_from_int(i) self.varmap = varmap node_cp = copy(node) node_cp.body = [self.visit(s) for s in node.body] return node_cp def visit_Name(self, node: _ast.Name) ‑> _ast.Name-
Expand source code
def visit_Name(self, node: Name) -> Name:
    """Return a copy of ``node`` renamed according to ``self.varmap``.

    The original identifier is preserved on the copy as ``orig_id``; the
    node passed in is left unmodified.
    """
    original = node.id
    renamed = copy(node)
    renamed.id = self.varmap[original]
    renamed.orig_id = original
    return renamed