mirror of
https://github.com/python/cpython.git
synced 2025-10-24 18:33:49 +00:00
785 lines
27 KiB
C
785 lines
27 KiB
C
/* Peephole optimizations for bytecode compiler. */
|
|
|
|
#include "Python.h"
|
|
|
|
#include "Python-ast.h"
|
|
#include "node.h"
|
|
#include "ast.h"
|
|
#include "code.h"
|
|
#include "symtable.h"
|
|
#include "opcode.h"
|
|
#include "wordcode_helpers.h"
|
|
|
|
#define UNCONDITIONAL_JUMP(op) (op==JUMP_ABSOLUTE || op==JUMP_FORWARD)
|
|
#define CONDITIONAL_JUMP(op) (op==POP_JUMP_IF_FALSE || op==POP_JUMP_IF_TRUE \
|
|
|| op==JUMP_IF_FALSE_OR_POP || op==JUMP_IF_TRUE_OR_POP)
|
|
#define ABSOLUTE_JUMP(op) (op==JUMP_ABSOLUTE || op==CONTINUE_LOOP \
|
|
|| op==POP_JUMP_IF_FALSE || op==POP_JUMP_IF_TRUE \
|
|
|| op==JUMP_IF_FALSE_OR_POP || op==JUMP_IF_TRUE_OR_POP)
|
|
#define JUMPS_ON_TRUE(op) (op==POP_JUMP_IF_TRUE || op==JUMP_IF_TRUE_OR_POP)
|
|
#define GETJUMPTGT(arr, i) (get_arg(arr, i) / sizeof(_Py_CODEUNIT) + \
|
|
(ABSOLUTE_JUMP(_Py_OPCODE(arr[i])) ? 0 : i+1))
|
|
#define ISBASICBLOCK(blocks, start, end) \
|
|
(blocks[start]==blocks[end])
|
|
|
|
|
|
#define CONST_STACK_CREATE() { \
|
|
const_stack_size = 256; \
|
|
const_stack = PyMem_New(PyObject *, const_stack_size); \
|
|
if (!const_stack) { \
|
|
PyErr_NoMemory(); \
|
|
goto exitError; \
|
|
} \
|
|
}
|
|
|
|
#define CONST_STACK_DELETE() do { \
|
|
if (const_stack) \
|
|
PyMem_Free(const_stack); \
|
|
} while(0)
|
|
|
|
#define CONST_STACK_LEN() ((unsigned)(const_stack_top + 1))
|
|
|
|
#define CONST_STACK_PUSH_OP(i) do { \
|
|
PyObject *_x; \
|
|
assert(_Py_OPCODE(codestr[i]) == LOAD_CONST); \
|
|
assert(PyList_GET_SIZE(consts) > (Py_ssize_t)get_arg(codestr, i)); \
|
|
_x = PyList_GET_ITEM(consts, get_arg(codestr, i)); \
|
|
if (++const_stack_top >= const_stack_size) { \
|
|
const_stack_size *= 2; \
|
|
PyMem_Resize(const_stack, PyObject *, const_stack_size); \
|
|
if (!const_stack) { \
|
|
PyErr_NoMemory(); \
|
|
goto exitError; \
|
|
} \
|
|
} \
|
|
const_stack[const_stack_top] = _x; \
|
|
in_consts = 1; \
|
|
} while(0)
|
|
|
|
#define CONST_STACK_RESET() do { \
|
|
const_stack_top = -1; \
|
|
} while(0)
|
|
|
|
#define CONST_STACK_LASTN(i) \
|
|
&const_stack[CONST_STACK_LEN() - i]
|
|
|
|
#define CONST_STACK_POP(i) do { \
|
|
assert(CONST_STACK_LEN() >= i); \
|
|
const_stack_top -= i; \
|
|
} while(0)
|
|
|
|
/* Scans back N consecutive LOAD_CONST instructions, skipping NOPs,
|
|
returns index of the Nth last's LOAD_CONST's EXTENDED_ARG prefix.
|
|
Callers are responsible to check CONST_STACK_LEN beforehand.
|
|
*/
|
|
static Py_ssize_t
|
|
lastn_const_start(const _Py_CODEUNIT *codestr, Py_ssize_t i, Py_ssize_t n)
|
|
{
|
|
assert(n > 0);
|
|
for (;;) {
|
|
i--;
|
|
assert(i >= 0);
|
|
if (_Py_OPCODE(codestr[i]) == LOAD_CONST) {
|
|
if (!--n) {
|
|
while (i > 0 && _Py_OPCODE(codestr[i-1]) == EXTENDED_ARG) {
|
|
i--;
|
|
}
|
|
return i;
|
|
}
|
|
}
|
|
else {
|
|
assert(_Py_OPCODE(codestr[i]) == NOP ||
|
|
_Py_OPCODE(codestr[i]) == EXTENDED_ARG);
|
|
}
|
|
}
|
|
}
|
|
|
|
/* Scans through EXTENDED ARGs, seeking the index of the effective opcode */
|
|
static Py_ssize_t
|
|
find_op(const _Py_CODEUNIT *codestr, Py_ssize_t i)
|
|
{
|
|
while (_Py_OPCODE(codestr[i]) == EXTENDED_ARG) {
|
|
i++;
|
|
}
|
|
return i;
|
|
}
|
|
|
|
/* Given the index of the effective opcode,
|
|
scan back to construct the oparg with EXTENDED_ARG */
|
|
static unsigned int
|
|
get_arg(const _Py_CODEUNIT *codestr, Py_ssize_t i)
|
|
{
|
|
_Py_CODEUNIT word;
|
|
unsigned int oparg = _Py_OPARG(codestr[i]);
|
|
if (i >= 1 && _Py_OPCODE(word = codestr[i-1]) == EXTENDED_ARG) {
|
|
oparg |= _Py_OPARG(word) << 8;
|
|
if (i >= 2 && _Py_OPCODE(word = codestr[i-2]) == EXTENDED_ARG) {
|
|
oparg |= _Py_OPARG(word) << 16;
|
|
if (i >= 3 && _Py_OPCODE(word = codestr[i-3]) == EXTENDED_ARG) {
|
|
oparg |= _Py_OPARG(word) << 24;
|
|
}
|
|
}
|
|
}
|
|
return oparg;
|
|
}
|
|
|
|
/* Fill the region with NOPs. */
|
|
static void
|
|
fill_nops(_Py_CODEUNIT *codestr, Py_ssize_t start, Py_ssize_t end)
|
|
{
|
|
memset(codestr + start, NOP, (end - start) * sizeof(_Py_CODEUNIT));
|
|
}
|
|
|
|
/* Given the index of the effective opcode,
|
|
attempt to replace the argument, taking into account EXTENDED_ARG.
|
|
Returns -1 on failure, or the new op index on success */
|
|
static Py_ssize_t
|
|
set_arg(_Py_CODEUNIT *codestr, Py_ssize_t i, unsigned int oparg)
|
|
{
|
|
unsigned int curarg = get_arg(codestr, i);
|
|
int curilen, newilen;
|
|
if (curarg == oparg)
|
|
return i;
|
|
curilen = instrsize(curarg);
|
|
newilen = instrsize(oparg);
|
|
if (curilen < newilen) {
|
|
return -1;
|
|
}
|
|
|
|
write_op_arg(codestr + i + 1 - curilen, _Py_OPCODE(codestr[i]), oparg, newilen);
|
|
fill_nops(codestr, i + 1 - curilen + newilen, i + 1);
|
|
return i-curilen+newilen;
|
|
}
|
|
|
|
/* Attempt to write op/arg at end of specified region of memory.
|
|
Preceding memory in the region is overwritten with NOPs.
|
|
Returns -1 on failure, op index on success */
|
|
static Py_ssize_t
|
|
copy_op_arg(_Py_CODEUNIT *codestr, Py_ssize_t i, unsigned char op,
|
|
unsigned int oparg, Py_ssize_t maxi)
|
|
{
|
|
int ilen = instrsize(oparg);
|
|
if (i + ilen > maxi) {
|
|
return -1;
|
|
}
|
|
write_op_arg(codestr + maxi - ilen, op, oparg, ilen);
|
|
fill_nops(codestr, i, maxi - ilen);
|
|
return maxi - 1;
|
|
}
|
|
|
|
/* Replace LOAD_CONST c1, LOAD_CONST c2 ... LOAD_CONST cn, BUILD_TUPLE n
|
|
with LOAD_CONST (c1, c2, ... cn).
|
|
The consts table must still be in list form so that the
|
|
new constant (c1, c2, ... cn) can be appended.
|
|
Called with codestr pointing to the first LOAD_CONST.
|
|
Bails out with no change if one or more of the LOAD_CONSTs is missing.
|
|
Also works for BUILD_LIST and BUILT_SET when followed by an "in" or "not in"
|
|
test; for BUILD_SET it assembles a frozenset rather than a tuple.
|
|
*/
|
|
static Py_ssize_t
|
|
fold_tuple_on_constants(_Py_CODEUNIT *codestr, Py_ssize_t c_start,
|
|
Py_ssize_t opcode_end, unsigned char opcode,
|
|
PyObject *consts, PyObject **objs, int n)
|
|
{
|
|
PyObject *newconst, *constant;
|
|
Py_ssize_t i, len_consts;
|
|
|
|
/* Pre-conditions */
|
|
assert(PyList_CheckExact(consts));
|
|
|
|
/* Buildup new tuple of constants */
|
|
newconst = PyTuple_New(n);
|
|
if (newconst == NULL) {
|
|
return -1;
|
|
}
|
|
for (i=0 ; i<n ; i++) {
|
|
constant = objs[i];
|
|
Py_INCREF(constant);
|
|
PyTuple_SET_ITEM(newconst, i, constant);
|
|
}
|
|
|
|
/* If it's a BUILD_SET, use the PyTuple we just built to create a
|
|
PyFrozenSet, and use that as the constant instead: */
|
|
if (opcode == BUILD_SET) {
|
|
Py_SETREF(newconst, PyFrozenSet_New(newconst));
|
|
if (newconst == NULL) {
|
|
return -1;
|
|
}
|
|
}
|
|
|
|
/* Append folded constant onto consts */
|
|
len_consts = PyList_GET_SIZE(consts);
|
|
if (PyList_Append(consts, newconst)) {
|
|
Py_DECREF(newconst);
|
|
return -1;
|
|
}
|
|
Py_DECREF(newconst);
|
|
|
|
return copy_op_arg(codestr, c_start, LOAD_CONST, len_consts, opcode_end);
|
|
}
|
|
|
|
/* Replace LOAD_CONST c1, LOAD_CONST c2, BINOP
|
|
with LOAD_CONST binop(c1,c2)
|
|
The consts table must still be in list form so that the
|
|
new constant can be appended.
|
|
Called with codestr pointing to the BINOP.
|
|
Abandons the transformation if the folding fails (i.e. 1+'a').
|
|
If the new constant is a sequence, only folds when the size
|
|
is below a threshold value. That keeps pyc files from
|
|
becoming large in the presence of code like: (None,)*1000.
|
|
*/
|
|
static Py_ssize_t
|
|
fold_binops_on_constants(_Py_CODEUNIT *codestr, Py_ssize_t c_start,
|
|
Py_ssize_t opcode_end, unsigned char opcode,
|
|
PyObject *consts, PyObject **objs)
|
|
{
|
|
PyObject *newconst, *v, *w;
|
|
Py_ssize_t len_consts, size;
|
|
|
|
/* Pre-conditions */
|
|
assert(PyList_CheckExact(consts));
|
|
len_consts = PyList_GET_SIZE(consts);
|
|
|
|
/* Create new constant */
|
|
v = objs[0];
|
|
w = objs[1];
|
|
switch (opcode) {
|
|
case BINARY_POWER:
|
|
newconst = PyNumber_Power(v, w, Py_None);
|
|
break;
|
|
case BINARY_MULTIPLY:
|
|
newconst = PyNumber_Multiply(v, w);
|
|
break;
|
|
case BINARY_TRUE_DIVIDE:
|
|
newconst = PyNumber_TrueDivide(v, w);
|
|
break;
|
|
case BINARY_FLOOR_DIVIDE:
|
|
newconst = PyNumber_FloorDivide(v, w);
|
|
break;
|
|
case BINARY_MODULO:
|
|
newconst = PyNumber_Remainder(v, w);
|
|
break;
|
|
case BINARY_ADD:
|
|
newconst = PyNumber_Add(v, w);
|
|
break;
|
|
case BINARY_SUBTRACT:
|
|
newconst = PyNumber_Subtract(v, w);
|
|
break;
|
|
case BINARY_SUBSCR:
|
|
newconst = PyObject_GetItem(v, w);
|
|
break;
|
|
case BINARY_LSHIFT:
|
|
newconst = PyNumber_Lshift(v, w);
|
|
break;
|
|
case BINARY_RSHIFT:
|
|
newconst = PyNumber_Rshift(v, w);
|
|
break;
|
|
case BINARY_AND:
|
|
newconst = PyNumber_And(v, w);
|
|
break;
|
|
case BINARY_XOR:
|
|
newconst = PyNumber_Xor(v, w);
|
|
break;
|
|
case BINARY_OR:
|
|
newconst = PyNumber_Or(v, w);
|
|
break;
|
|
default:
|
|
/* Called with an unknown opcode */
|
|
PyErr_Format(PyExc_SystemError,
|
|
"unexpected binary operation %d on a constant",
|
|
opcode);
|
|
return -1;
|
|
}
|
|
if (newconst == NULL) {
|
|
if(!PyErr_ExceptionMatches(PyExc_KeyboardInterrupt)) {
|
|
PyErr_Clear();
|
|
}
|
|
return -1;
|
|
}
|
|
size = PyObject_Size(newconst);
|
|
if (size == -1) {
|
|
if (PyErr_ExceptionMatches(PyExc_KeyboardInterrupt)) {
|
|
return -1;
|
|
}
|
|
PyErr_Clear();
|
|
} else if (size > 20) {
|
|
Py_DECREF(newconst);
|
|
return -1;
|
|
}
|
|
|
|
/* Append folded constant into consts table */
|
|
if (PyList_Append(consts, newconst)) {
|
|
Py_DECREF(newconst);
|
|
return -1;
|
|
}
|
|
Py_DECREF(newconst);
|
|
|
|
return copy_op_arg(codestr, c_start, LOAD_CONST, len_consts, opcode_end);
|
|
}
|
|
|
|
static Py_ssize_t
|
|
fold_unaryops_on_constants(_Py_CODEUNIT *codestr, Py_ssize_t c_start,
|
|
Py_ssize_t opcode_end, unsigned char opcode,
|
|
PyObject *consts, PyObject *v)
|
|
{
|
|
PyObject *newconst;
|
|
Py_ssize_t len_consts;
|
|
|
|
/* Pre-conditions */
|
|
assert(PyList_CheckExact(consts));
|
|
len_consts = PyList_GET_SIZE(consts);
|
|
|
|
/* Create new constant */
|
|
switch (opcode) {
|
|
case UNARY_NEGATIVE:
|
|
newconst = PyNumber_Negative(v);
|
|
break;
|
|
case UNARY_INVERT:
|
|
newconst = PyNumber_Invert(v);
|
|
break;
|
|
case UNARY_POSITIVE:
|
|
newconst = PyNumber_Positive(v);
|
|
break;
|
|
default:
|
|
/* Called with an unknown opcode */
|
|
PyErr_Format(PyExc_SystemError,
|
|
"unexpected unary operation %d on a constant",
|
|
opcode);
|
|
return -1;
|
|
}
|
|
if (newconst == NULL) {
|
|
if(!PyErr_ExceptionMatches(PyExc_KeyboardInterrupt)) {
|
|
PyErr_Clear();
|
|
}
|
|
return -1;
|
|
}
|
|
|
|
/* Append folded constant into consts table */
|
|
if (PyList_Append(consts, newconst)) {
|
|
Py_DECREF(newconst);
|
|
PyErr_Clear();
|
|
return -1;
|
|
}
|
|
Py_DECREF(newconst);
|
|
|
|
return copy_op_arg(codestr, c_start, LOAD_CONST, len_consts, opcode_end);
|
|
}
|
|
|
|
static unsigned int *
|
|
markblocks(_Py_CODEUNIT *code, Py_ssize_t len)
|
|
{
|
|
unsigned int *blocks = PyMem_New(unsigned int, len);
|
|
int i, j, opcode, blockcnt = 0;
|
|
|
|
if (blocks == NULL) {
|
|
PyErr_NoMemory();
|
|
return NULL;
|
|
}
|
|
memset(blocks, 0, len*sizeof(int));
|
|
|
|
/* Mark labels in the first pass */
|
|
for (i = 0; i < len; i++) {
|
|
opcode = _Py_OPCODE(code[i]);
|
|
switch (opcode) {
|
|
case FOR_ITER:
|
|
case JUMP_FORWARD:
|
|
case JUMP_IF_FALSE_OR_POP:
|
|
case JUMP_IF_TRUE_OR_POP:
|
|
case POP_JUMP_IF_FALSE:
|
|
case POP_JUMP_IF_TRUE:
|
|
case JUMP_ABSOLUTE:
|
|
case CONTINUE_LOOP:
|
|
case SETUP_LOOP:
|
|
case SETUP_EXCEPT:
|
|
case SETUP_FINALLY:
|
|
case SETUP_WITH:
|
|
case SETUP_ASYNC_WITH:
|
|
j = GETJUMPTGT(code, i);
|
|
assert(j < len);
|
|
blocks[j] = 1;
|
|
break;
|
|
}
|
|
}
|
|
/* Build block numbers in the second pass */
|
|
for (i = 0; i < len; i++) {
|
|
blockcnt += blocks[i]; /* increment blockcnt over labels */
|
|
blocks[i] = blockcnt;
|
|
}
|
|
return blocks;
|
|
}
|
|
|
|
/* Perform basic peephole optimizations to components of a code object.
|
|
The consts object should still be in list form to allow new constants
|
|
to be appended.
|
|
|
|
To keep the optimizer simple, it bails when the lineno table has complex
|
|
encoding for gaps >= 255.
|
|
|
|
Optimizations are restricted to simple transformations occurring within a
|
|
single basic block. All transformations keep the code size the same or
|
|
smaller. For those that reduce size, the gaps are initially filled with
|
|
NOPs. Later those NOPs are removed and the jump addresses retargeted in
|
|
a single pass. */
|
|
|
|
PyObject *
|
|
PyCode_Optimize(PyObject *code, PyObject* consts, PyObject *names,
|
|
PyObject *lnotab_obj)
|
|
{
|
|
Py_ssize_t h, i, nexti, op_start, codelen, tgt;
|
|
unsigned int j, nops;
|
|
unsigned char opcode, nextop;
|
|
_Py_CODEUNIT *codestr = NULL;
|
|
unsigned char *lnotab;
|
|
unsigned int cum_orig_offset, last_offset;
|
|
Py_ssize_t tabsiz;
|
|
PyObject **const_stack = NULL;
|
|
Py_ssize_t const_stack_top = -1;
|
|
Py_ssize_t const_stack_size = 0;
|
|
int in_consts = 0; /* whether we are in a LOAD_CONST sequence */
|
|
unsigned int *blocks = NULL;
|
|
|
|
/* Bail out if an exception is set */
|
|
if (PyErr_Occurred())
|
|
goto exitError;
|
|
|
|
/* Bypass optimization when the lnotab table is too complex */
|
|
assert(PyBytes_Check(lnotab_obj));
|
|
lnotab = (unsigned char*)PyBytes_AS_STRING(lnotab_obj);
|
|
tabsiz = PyBytes_GET_SIZE(lnotab_obj);
|
|
assert(tabsiz == 0 || Py_REFCNT(lnotab_obj) == 1);
|
|
if (memchr(lnotab, 255, tabsiz) != NULL) {
|
|
/* 255 value are used for multibyte bytecode instructions */
|
|
goto exitUnchanged;
|
|
}
|
|
/* Note: -128 and 127 special values for line number delta are ok,
|
|
the peephole optimizer doesn't modify line numbers. */
|
|
|
|
assert(PyBytes_Check(code));
|
|
codelen = PyBytes_GET_SIZE(code);
|
|
assert(codelen % sizeof(_Py_CODEUNIT) == 0);
|
|
|
|
/* Make a modifiable copy of the code string */
|
|
codestr = (_Py_CODEUNIT *)PyMem_Malloc(codelen);
|
|
if (codestr == NULL) {
|
|
PyErr_NoMemory();
|
|
goto exitError;
|
|
}
|
|
memcpy(codestr, PyBytes_AS_STRING(code), codelen);
|
|
codelen /= sizeof(_Py_CODEUNIT);
|
|
|
|
blocks = markblocks(codestr, codelen);
|
|
if (blocks == NULL)
|
|
goto exitError;
|
|
assert(PyList_Check(consts));
|
|
|
|
CONST_STACK_CREATE();
|
|
|
|
for (i=find_op(codestr, 0) ; i<codelen ; i=nexti) {
|
|
opcode = _Py_OPCODE(codestr[i]);
|
|
op_start = i;
|
|
while (op_start >= 1 && _Py_OPCODE(codestr[op_start-1]) == EXTENDED_ARG) {
|
|
op_start--;
|
|
}
|
|
|
|
nexti = i + 1;
|
|
while (nexti < codelen && _Py_OPCODE(codestr[nexti]) == EXTENDED_ARG)
|
|
nexti++;
|
|
nextop = nexti < codelen ? _Py_OPCODE(codestr[nexti]) : 0;
|
|
|
|
if (!in_consts) {
|
|
CONST_STACK_RESET();
|
|
}
|
|
in_consts = 0;
|
|
|
|
switch (opcode) {
|
|
/* not a is b --> a is not b
|
|
not a in b --> a not in b
|
|
not a is not b --> a is b
|
|
not a not in b --> a in b
|
|
*/
|
|
case COMPARE_OP:
|
|
j = get_arg(codestr, i);
|
|
if (j < 6 || j > 9 ||
|
|
nextop != UNARY_NOT ||
|
|
!ISBASICBLOCK(blocks, op_start, i + 1))
|
|
break;
|
|
codestr[i] = PACKOPARG(opcode, j^1);
|
|
fill_nops(codestr, i + 1, nexti + 1);
|
|
break;
|
|
|
|
/* Skip over LOAD_CONST trueconst
|
|
POP_JUMP_IF_FALSE xx. This improves
|
|
"while 1" performance. */
|
|
case LOAD_CONST:
|
|
CONST_STACK_PUSH_OP(i);
|
|
if (nextop != POP_JUMP_IF_FALSE ||
|
|
!ISBASICBLOCK(blocks, op_start, i + 1) ||
|
|
!PyObject_IsTrue(PyList_GET_ITEM(consts, get_arg(codestr, i))))
|
|
break;
|
|
fill_nops(codestr, op_start, nexti + 1);
|
|
CONST_STACK_POP(1);
|
|
break;
|
|
|
|
/* Try to fold tuples of constants (includes a case for lists
|
|
and sets which are only used for "in" and "not in" tests).
|
|
Skip over BUILD_SEQN 1 UNPACK_SEQN 1.
|
|
Replace BUILD_SEQN 2 UNPACK_SEQN 2 with ROT2.
|
|
Replace BUILD_SEQN 3 UNPACK_SEQN 3 with ROT3 ROT2. */
|
|
case BUILD_TUPLE:
|
|
case BUILD_LIST:
|
|
case BUILD_SET:
|
|
j = get_arg(codestr, i);
|
|
if (j > 0 && CONST_STACK_LEN() >= j) {
|
|
h = lastn_const_start(codestr, op_start, j);
|
|
if ((opcode == BUILD_TUPLE &&
|
|
ISBASICBLOCK(blocks, h, op_start)) ||
|
|
((opcode == BUILD_LIST || opcode == BUILD_SET) &&
|
|
((nextop==COMPARE_OP &&
|
|
(_Py_OPARG(codestr[nexti]) == PyCmp_IN ||
|
|
_Py_OPARG(codestr[nexti]) == PyCmp_NOT_IN)) ||
|
|
nextop == GET_ITER) && ISBASICBLOCK(blocks, h, i + 1))) {
|
|
h = fold_tuple_on_constants(codestr, h, i + 1, opcode,
|
|
consts, CONST_STACK_LASTN(j), j);
|
|
if (h >= 0) {
|
|
CONST_STACK_POP(j);
|
|
CONST_STACK_PUSH_OP(h);
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
if (nextop != UNPACK_SEQUENCE ||
|
|
!ISBASICBLOCK(blocks, op_start, i + 1) ||
|
|
j != get_arg(codestr, nexti) ||
|
|
opcode == BUILD_SET)
|
|
break;
|
|
if (j < 2) {
|
|
fill_nops(codestr, op_start, nexti + 1);
|
|
} else if (j == 2) {
|
|
codestr[op_start] = PACKOPARG(ROT_TWO, 0);
|
|
fill_nops(codestr, op_start + 1, nexti + 1);
|
|
CONST_STACK_RESET();
|
|
} else if (j == 3) {
|
|
codestr[op_start] = PACKOPARG(ROT_THREE, 0);
|
|
codestr[op_start + 1] = PACKOPARG(ROT_TWO, 0);
|
|
fill_nops(codestr, op_start + 2, nexti + 1);
|
|
CONST_STACK_RESET();
|
|
}
|
|
break;
|
|
|
|
/* Fold binary ops on constants.
|
|
LOAD_CONST c1 LOAD_CONST c2 BINOP --> LOAD_CONST binop(c1,c2) */
|
|
case BINARY_POWER:
|
|
case BINARY_MULTIPLY:
|
|
case BINARY_TRUE_DIVIDE:
|
|
case BINARY_FLOOR_DIVIDE:
|
|
case BINARY_MODULO:
|
|
case BINARY_ADD:
|
|
case BINARY_SUBTRACT:
|
|
case BINARY_SUBSCR:
|
|
case BINARY_LSHIFT:
|
|
case BINARY_RSHIFT:
|
|
case BINARY_AND:
|
|
case BINARY_XOR:
|
|
case BINARY_OR:
|
|
if (CONST_STACK_LEN() < 2)
|
|
break;
|
|
h = lastn_const_start(codestr, op_start, 2);
|
|
if (ISBASICBLOCK(blocks, h, op_start)) {
|
|
h = fold_binops_on_constants(codestr, h, i + 1, opcode,
|
|
consts, CONST_STACK_LASTN(2));
|
|
if (h >= 0) {
|
|
CONST_STACK_POP(2);
|
|
CONST_STACK_PUSH_OP(h);
|
|
}
|
|
}
|
|
break;
|
|
|
|
/* Fold unary ops on constants.
|
|
LOAD_CONST c1 UNARY_OP --> LOAD_CONST unary_op(c) */
|
|
case UNARY_NEGATIVE:
|
|
case UNARY_INVERT:
|
|
case UNARY_POSITIVE:
|
|
if (CONST_STACK_LEN() < 1)
|
|
break;
|
|
h = lastn_const_start(codestr, op_start, 1);
|
|
if (ISBASICBLOCK(blocks, h, op_start)) {
|
|
h = fold_unaryops_on_constants(codestr, h, i + 1, opcode,
|
|
consts, *CONST_STACK_LASTN(1));
|
|
if (h >= 0) {
|
|
CONST_STACK_POP(1);
|
|
CONST_STACK_PUSH_OP(h);
|
|
}
|
|
}
|
|
break;
|
|
|
|
/* Simplify conditional jump to conditional jump where the
|
|
result of the first test implies the success of a similar
|
|
test or the failure of the opposite test.
|
|
Arises in code like:
|
|
"a and b or c"
|
|
"(a and b) and c"
|
|
"(a or b) or c"
|
|
"(a or b) and c"
|
|
x:JUMP_IF_FALSE_OR_POP y y:JUMP_IF_FALSE_OR_POP z
|
|
--> x:JUMP_IF_FALSE_OR_POP z
|
|
x:JUMP_IF_FALSE_OR_POP y y:JUMP_IF_TRUE_OR_POP z
|
|
--> x:POP_JUMP_IF_FALSE y+1
|
|
where y+1 is the instruction following the second test.
|
|
*/
|
|
case JUMP_IF_FALSE_OR_POP:
|
|
case JUMP_IF_TRUE_OR_POP:
|
|
h = get_arg(codestr, i) / sizeof(_Py_CODEUNIT);
|
|
tgt = find_op(codestr, h);
|
|
|
|
j = _Py_OPCODE(codestr[tgt]);
|
|
if (CONDITIONAL_JUMP(j)) {
|
|
/* NOTE: all possible jumps here are absolute. */
|
|
if (JUMPS_ON_TRUE(j) == JUMPS_ON_TRUE(opcode)) {
|
|
/* The second jump will be taken iff the first is.
|
|
The current opcode inherits its target's
|
|
stack effect */
|
|
h = set_arg(codestr, i, get_arg(codestr, tgt));
|
|
} else {
|
|
/* The second jump is not taken if the first is (so
|
|
jump past it), and all conditional jumps pop their
|
|
argument when they're not taken (so change the
|
|
first jump to pop its argument when it's taken). */
|
|
h = set_arg(codestr, i, (tgt + 1) * sizeof(_Py_CODEUNIT));
|
|
j = opcode == JUMP_IF_TRUE_OR_POP ?
|
|
POP_JUMP_IF_TRUE : POP_JUMP_IF_FALSE;
|
|
}
|
|
|
|
if (h >= 0) {
|
|
nexti = h;
|
|
codestr[nexti] = PACKOPARG(j, _Py_OPARG(codestr[nexti]));
|
|
break;
|
|
}
|
|
}
|
|
/* Intentional fallthrough */
|
|
|
|
/* Replace jumps to unconditional jumps */
|
|
case POP_JUMP_IF_FALSE:
|
|
case POP_JUMP_IF_TRUE:
|
|
case FOR_ITER:
|
|
case JUMP_FORWARD:
|
|
case JUMP_ABSOLUTE:
|
|
case CONTINUE_LOOP:
|
|
case SETUP_LOOP:
|
|
case SETUP_EXCEPT:
|
|
case SETUP_FINALLY:
|
|
case SETUP_WITH:
|
|
case SETUP_ASYNC_WITH:
|
|
h = GETJUMPTGT(codestr, i);
|
|
tgt = find_op(codestr, h);
|
|
/* Replace JUMP_* to a RETURN into just a RETURN */
|
|
if (UNCONDITIONAL_JUMP(opcode) &&
|
|
_Py_OPCODE(codestr[tgt]) == RETURN_VALUE) {
|
|
codestr[op_start] = PACKOPARG(RETURN_VALUE, 0);
|
|
fill_nops(codestr, op_start + 1, i + 1);
|
|
} else if (UNCONDITIONAL_JUMP(_Py_OPCODE(codestr[tgt]))) {
|
|
j = GETJUMPTGT(codestr, tgt);
|
|
if (opcode == JUMP_FORWARD) { /* JMP_ABS can go backwards */
|
|
opcode = JUMP_ABSOLUTE;
|
|
} else if (!ABSOLUTE_JUMP(opcode)) {
|
|
if ((Py_ssize_t)j < i + 1) {
|
|
break; /* No backward relative jumps */
|
|
}
|
|
j -= i + 1; /* Calc relative jump addr */
|
|
}
|
|
j *= sizeof(_Py_CODEUNIT);
|
|
copy_op_arg(codestr, op_start, opcode, j, i + 1);
|
|
}
|
|
break;
|
|
|
|
/* Remove unreachable ops after RETURN */
|
|
case RETURN_VALUE:
|
|
h = i + 1;
|
|
while (h < codelen && ISBASICBLOCK(blocks, i, h)) {
|
|
h++;
|
|
}
|
|
if (h > i + 1) {
|
|
fill_nops(codestr, i + 1, h);
|
|
nexti = find_op(codestr, h);
|
|
}
|
|
break;
|
|
}
|
|
}
|
|
|
|
/* Fixup lnotab */
|
|
for (i = 0, nops = 0; i < codelen; i++) {
|
|
assert(i - nops <= INT_MAX);
|
|
/* original code offset => new code offset */
|
|
blocks[i] = i - nops;
|
|
if (_Py_OPCODE(codestr[i]) == NOP)
|
|
nops++;
|
|
}
|
|
cum_orig_offset = 0;
|
|
last_offset = 0;
|
|
for (i=0 ; i < tabsiz ; i+=2) {
|
|
unsigned int offset_delta, new_offset;
|
|
cum_orig_offset += lnotab[i];
|
|
assert(cum_orig_offset % sizeof(_Py_CODEUNIT) == 0);
|
|
new_offset = blocks[cum_orig_offset / sizeof(_Py_CODEUNIT)] *
|
|
sizeof(_Py_CODEUNIT);
|
|
offset_delta = new_offset - last_offset;
|
|
assert(offset_delta <= 255);
|
|
lnotab[i] = (unsigned char)offset_delta;
|
|
last_offset = new_offset;
|
|
}
|
|
|
|
/* Remove NOPs and fixup jump targets */
|
|
for (op_start = i = h = 0; i < codelen; i++, op_start = i) {
|
|
j = _Py_OPARG(codestr[i]);
|
|
while (_Py_OPCODE(codestr[i]) == EXTENDED_ARG) {
|
|
i++;
|
|
j = j<<8 | _Py_OPARG(codestr[i]);
|
|
}
|
|
opcode = _Py_OPCODE(codestr[i]);
|
|
switch (opcode) {
|
|
case NOP:continue;
|
|
|
|
case JUMP_ABSOLUTE:
|
|
case CONTINUE_LOOP:
|
|
case POP_JUMP_IF_FALSE:
|
|
case POP_JUMP_IF_TRUE:
|
|
case JUMP_IF_FALSE_OR_POP:
|
|
case JUMP_IF_TRUE_OR_POP:
|
|
j = blocks[j / sizeof(_Py_CODEUNIT)] * sizeof(_Py_CODEUNIT);
|
|
break;
|
|
|
|
case FOR_ITER:
|
|
case JUMP_FORWARD:
|
|
case SETUP_LOOP:
|
|
case SETUP_EXCEPT:
|
|
case SETUP_FINALLY:
|
|
case SETUP_WITH:
|
|
case SETUP_ASYNC_WITH:
|
|
j = blocks[j / sizeof(_Py_CODEUNIT) + i + 1] - blocks[i] - 1;
|
|
j *= sizeof(_Py_CODEUNIT);
|
|
break;
|
|
}
|
|
nexti = i - op_start + 1;
|
|
if (instrsize(j) > nexti)
|
|
goto exitUnchanged;
|
|
/* If instrsize(j) < nexti, we'll emit EXTENDED_ARG 0 */
|
|
write_op_arg(codestr + h, opcode, j, nexti);
|
|
h += nexti;
|
|
}
|
|
assert(h + (Py_ssize_t)nops == codelen);
|
|
|
|
CONST_STACK_DELETE();
|
|
PyMem_Free(blocks);
|
|
code = PyBytes_FromStringAndSize((char *)codestr, h * sizeof(_Py_CODEUNIT));
|
|
PyMem_Free(codestr);
|
|
return code;
|
|
|
|
exitError:
|
|
code = NULL;
|
|
|
|
exitUnchanged:
|
|
Py_XINCREF(code);
|
|
CONST_STACK_DELETE();
|
|
PyMem_Free(blocks);
|
|
PyMem_Free(codestr);
|
|
return code;
|
|
}
|