mirror of
				https://github.com/python/cpython.git
				synced 2025-11-03 23:21:29 +00:00 
			
		
		
		
	
		
			
				
	
	
		
			592 lines
		
	
	
	
		
			21 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			592 lines
		
	
	
	
		
			21 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
/* Peephole optimizations for bytecode compiler. */
 | 
						|
 | 
						|
#include "Python.h"
 | 
						|
 | 
						|
#include "Python-ast.h"
 | 
						|
#include "node.h"
 | 
						|
#include "ast.h"
 | 
						|
#include "code.h"
 | 
						|
#include "symtable.h"
 | 
						|
#include "opcode.h"
 | 
						|
#include "wordcode_helpers.h"
 | 
						|
 | 
						|
#define UNCONDITIONAL_JUMP(op)  (op==JUMP_ABSOLUTE || op==JUMP_FORWARD)
 | 
						|
#define CONDITIONAL_JUMP(op) (op==POP_JUMP_IF_FALSE || op==POP_JUMP_IF_TRUE \
 | 
						|
    || op==JUMP_IF_FALSE_OR_POP || op==JUMP_IF_TRUE_OR_POP)
 | 
						|
#define ABSOLUTE_JUMP(op) (op==JUMP_ABSOLUTE || op==CONTINUE_LOOP \
 | 
						|
    || op==POP_JUMP_IF_FALSE || op==POP_JUMP_IF_TRUE \
 | 
						|
    || op==JUMP_IF_FALSE_OR_POP || op==JUMP_IF_TRUE_OR_POP)
 | 
						|
#define JUMPS_ON_TRUE(op) (op==POP_JUMP_IF_TRUE || op==JUMP_IF_TRUE_OR_POP)
 | 
						|
#define GETJUMPTGT(arr, i) (get_arg(arr, i) / sizeof(_Py_CODEUNIT) + \
 | 
						|
        (ABSOLUTE_JUMP(_Py_OPCODE(arr[i])) ? 0 : i+1))
 | 
						|
#define ISBASICBLOCK(blocks, start, end) \
 | 
						|
    (blocks[start]==blocks[end])
 | 
						|
 | 
						|
 | 
						|
#define CONST_STACK_CREATE() { \
 | 
						|
    const_stack_size = 256; \
 | 
						|
    const_stack = PyMem_New(PyObject *, const_stack_size); \
 | 
						|
    if (!const_stack) { \
 | 
						|
        PyErr_NoMemory(); \
 | 
						|
        goto exitError; \
 | 
						|
    } \
 | 
						|
    }
 | 
						|
 | 
						|
#define CONST_STACK_DELETE() do { \
 | 
						|
    if (const_stack) \
 | 
						|
        PyMem_Free(const_stack); \
 | 
						|
    } while(0)
 | 
						|
 | 
						|
#define CONST_STACK_LEN() ((unsigned)(const_stack_top + 1))
 | 
						|
 | 
						|
#define CONST_STACK_PUSH_OP(i) do { \
 | 
						|
    PyObject *_x; \
 | 
						|
    assert(_Py_OPCODE(codestr[i]) == LOAD_CONST); \
 | 
						|
    assert(PyList_GET_SIZE(consts) > (Py_ssize_t)get_arg(codestr, i)); \
 | 
						|
    _x = PyList_GET_ITEM(consts, get_arg(codestr, i)); \
 | 
						|
    if (++const_stack_top >= const_stack_size) { \
 | 
						|
        const_stack_size *= 2; \
 | 
						|
        PyMem_Resize(const_stack, PyObject *, const_stack_size); \
 | 
						|
        if (!const_stack) { \
 | 
						|
            PyErr_NoMemory(); \
 | 
						|
            goto exitError; \
 | 
						|
        } \
 | 
						|
    } \
 | 
						|
    const_stack[const_stack_top] = _x; \
 | 
						|
    in_consts = 1; \
 | 
						|
    } while(0)
 | 
						|
 | 
						|
#define CONST_STACK_RESET() do { \
 | 
						|
    const_stack_top = -1; \
 | 
						|
    } while(0)
 | 
						|
 | 
						|
#define CONST_STACK_LASTN(i) \
 | 
						|
    &const_stack[CONST_STACK_LEN() - i]
 | 
						|
 | 
						|
#define CONST_STACK_POP(i) do { \
 | 
						|
    assert(CONST_STACK_LEN() >= i); \
 | 
						|
    const_stack_top -= i; \
 | 
						|
    } while(0)
 | 
						|
 | 
						|
/* Scans back N consecutive LOAD_CONST instructions, skipping NOPs,
 | 
						|
   returns index of the Nth last's LOAD_CONST's EXTENDED_ARG prefix.
 | 
						|
   Callers are responsible to check CONST_STACK_LEN beforehand.
 | 
						|
*/
 | 
						|
static Py_ssize_t
 | 
						|
lastn_const_start(const _Py_CODEUNIT *codestr, Py_ssize_t i, Py_ssize_t n)
 | 
						|
{
 | 
						|
    assert(n > 0);
 | 
						|
    for (;;) {
 | 
						|
        i--;
 | 
						|
        assert(i >= 0);
 | 
						|
        if (_Py_OPCODE(codestr[i]) == LOAD_CONST) {
 | 
						|
            if (!--n) {
 | 
						|
                while (i > 0 && _Py_OPCODE(codestr[i-1]) == EXTENDED_ARG) {
 | 
						|
                    i--;
 | 
						|
                }
 | 
						|
                return i;
 | 
						|
            }
 | 
						|
        }
 | 
						|
        else {
 | 
						|
            assert(_Py_OPCODE(codestr[i]) == NOP ||
 | 
						|
                   _Py_OPCODE(codestr[i]) == EXTENDED_ARG);
 | 
						|
        }
 | 
						|
    }
 | 
						|
}
 | 
						|
 | 
						|
/* Scans through EXTENDED ARGs, seeking the index of the effective opcode */
 | 
						|
static Py_ssize_t
 | 
						|
find_op(const _Py_CODEUNIT *codestr, Py_ssize_t i)
 | 
						|
{
 | 
						|
    while (_Py_OPCODE(codestr[i]) == EXTENDED_ARG) {
 | 
						|
        i++;
 | 
						|
    }
 | 
						|
    return i;
 | 
						|
}
 | 
						|
 | 
						|
/* Given the index of the effective opcode,
 | 
						|
   scan back to construct the oparg with EXTENDED_ARG */
 | 
						|
static unsigned int
 | 
						|
get_arg(const _Py_CODEUNIT *codestr, Py_ssize_t i)
 | 
						|
{
 | 
						|
    _Py_CODEUNIT word;
 | 
						|
    unsigned int oparg = _Py_OPARG(codestr[i]);
 | 
						|
    if (i >= 1 && _Py_OPCODE(word = codestr[i-1]) == EXTENDED_ARG) {
 | 
						|
        oparg |= _Py_OPARG(word) << 8;
 | 
						|
        if (i >= 2 && _Py_OPCODE(word = codestr[i-2]) == EXTENDED_ARG) {
 | 
						|
            oparg |= _Py_OPARG(word) << 16;
 | 
						|
            if (i >= 3 && _Py_OPCODE(word = codestr[i-3]) == EXTENDED_ARG) {
 | 
						|
                oparg |= _Py_OPARG(word) << 24;
 | 
						|
            }
 | 
						|
        }
 | 
						|
    }
 | 
						|
    return oparg;
 | 
						|
}
 | 
						|
 | 
						|
/* Fill the region with NOPs. */
 | 
						|
static void
 | 
						|
fill_nops(_Py_CODEUNIT *codestr, Py_ssize_t start, Py_ssize_t end)
 | 
						|
{
 | 
						|
    memset(codestr + start, NOP, (end - start) * sizeof(_Py_CODEUNIT));
 | 
						|
}
 | 
						|
 | 
						|
/* Given the index of the effective opcode,
 | 
						|
   attempt to replace the argument, taking into account EXTENDED_ARG.
 | 
						|
   Returns -1 on failure, or the new op index on success */
 | 
						|
static Py_ssize_t
 | 
						|
set_arg(_Py_CODEUNIT *codestr, Py_ssize_t i, unsigned int oparg)
 | 
						|
{
 | 
						|
    unsigned int curarg = get_arg(codestr, i);
 | 
						|
    int curilen, newilen;
 | 
						|
    if (curarg == oparg)
 | 
						|
        return i;
 | 
						|
    curilen = instrsize(curarg);
 | 
						|
    newilen = instrsize(oparg);
 | 
						|
    if (curilen < newilen) {
 | 
						|
        return -1;
 | 
						|
    }
 | 
						|
 | 
						|
    write_op_arg(codestr + i + 1 - curilen, _Py_OPCODE(codestr[i]), oparg, newilen);
 | 
						|
    fill_nops(codestr, i + 1 - curilen + newilen, i + 1);
 | 
						|
    return i-curilen+newilen;
 | 
						|
}
 | 
						|
 | 
						|
/* Attempt to write op/arg at end of specified region of memory.
 | 
						|
   Preceding memory in the region is overwritten with NOPs.
 | 
						|
   Returns -1 on failure, op index on success */
 | 
						|
static Py_ssize_t
 | 
						|
copy_op_arg(_Py_CODEUNIT *codestr, Py_ssize_t i, unsigned char op,
 | 
						|
            unsigned int oparg, Py_ssize_t maxi)
 | 
						|
{
 | 
						|
    int ilen = instrsize(oparg);
 | 
						|
    if (i + ilen > maxi) {
 | 
						|
        return -1;
 | 
						|
    }
 | 
						|
    write_op_arg(codestr + maxi - ilen, op, oparg, ilen);
 | 
						|
    fill_nops(codestr, i, maxi - ilen);
 | 
						|
    return maxi - 1;
 | 
						|
}
 | 
						|
 | 
						|
/* Replace LOAD_CONST c1, LOAD_CONST c2 ... LOAD_CONST cn, BUILD_TUPLE n
 | 
						|
   with    LOAD_CONST (c1, c2, ... cn).
 | 
						|
   The consts table must still be in list form so that the
 | 
						|
   new constant (c1, c2, ... cn) can be appended.
 | 
						|
   Called with codestr pointing to the first LOAD_CONST.
 | 
						|
   Bails out with no change if one or more of the LOAD_CONSTs is missing.
 | 
						|
   Also works for BUILD_LIST and BUILT_SET when followed by an "in" or "not in"
 | 
						|
   test; for BUILD_SET it assembles a frozenset rather than a tuple.
 | 
						|
*/
 | 
						|
static Py_ssize_t
 | 
						|
fold_tuple_on_constants(_Py_CODEUNIT *codestr, Py_ssize_t c_start,
 | 
						|
                        Py_ssize_t opcode_end, unsigned char opcode,
 | 
						|
                        PyObject *consts, PyObject **objs, int n)
 | 
						|
{
 | 
						|
    PyObject *newconst, *constant;
 | 
						|
    Py_ssize_t i, len_consts;
 | 
						|
 | 
						|
    /* Pre-conditions */
 | 
						|
    assert(PyList_CheckExact(consts));
 | 
						|
 | 
						|
    /* Buildup new tuple of constants */
 | 
						|
    newconst = PyTuple_New(n);
 | 
						|
    if (newconst == NULL) {
 | 
						|
        return -1;
 | 
						|
    }
 | 
						|
    for (i=0 ; i<n ; i++) {
 | 
						|
        constant = objs[i];
 | 
						|
        Py_INCREF(constant);
 | 
						|
        PyTuple_SET_ITEM(newconst, i, constant);
 | 
						|
    }
 | 
						|
 | 
						|
    /* If it's a BUILD_SET, use the PyTuple we just built to create a
 | 
						|
       PyFrozenSet, and use that as the constant instead: */
 | 
						|
    if (opcode == BUILD_SET) {
 | 
						|
        Py_SETREF(newconst, PyFrozenSet_New(newconst));
 | 
						|
        if (newconst == NULL) {
 | 
						|
            return -1;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    /* Append folded constant onto consts */
 | 
						|
    len_consts = PyList_GET_SIZE(consts);
 | 
						|
    if (PyList_Append(consts, newconst)) {
 | 
						|
        Py_DECREF(newconst);
 | 
						|
        return -1;
 | 
						|
    }
 | 
						|
    Py_DECREF(newconst);
 | 
						|
 | 
						|
    return copy_op_arg(codestr, c_start, LOAD_CONST, len_consts, opcode_end);
 | 
						|
}
 | 
						|
 | 
						|
static unsigned int *
 | 
						|
markblocks(_Py_CODEUNIT *code, Py_ssize_t len)
 | 
						|
{
 | 
						|
    unsigned int *blocks = PyMem_New(unsigned int, len);
 | 
						|
    int i, j, opcode, blockcnt = 0;
 | 
						|
 | 
						|
    if (blocks == NULL) {
 | 
						|
        PyErr_NoMemory();
 | 
						|
        return NULL;
 | 
						|
    }
 | 
						|
    memset(blocks, 0, len*sizeof(int));
 | 
						|
 | 
						|
    /* Mark labels in the first pass */
 | 
						|
    for (i = 0; i < len; i++) {
 | 
						|
        opcode = _Py_OPCODE(code[i]);
 | 
						|
        switch (opcode) {
 | 
						|
            case FOR_ITER:
 | 
						|
            case JUMP_FORWARD:
 | 
						|
            case JUMP_IF_FALSE_OR_POP:
 | 
						|
            case JUMP_IF_TRUE_OR_POP:
 | 
						|
            case POP_JUMP_IF_FALSE:
 | 
						|
            case POP_JUMP_IF_TRUE:
 | 
						|
            case JUMP_ABSOLUTE:
 | 
						|
            case CONTINUE_LOOP:
 | 
						|
            case SETUP_LOOP:
 | 
						|
            case SETUP_EXCEPT:
 | 
						|
            case SETUP_FINALLY:
 | 
						|
            case SETUP_WITH:
 | 
						|
            case SETUP_ASYNC_WITH:
 | 
						|
                j = GETJUMPTGT(code, i);
 | 
						|
                assert(j < len);
 | 
						|
                blocks[j] = 1;
 | 
						|
                break;
 | 
						|
        }
 | 
						|
    }
 | 
						|
    /* Build block numbers in the second pass */
 | 
						|
    for (i = 0; i < len; i++) {
 | 
						|
        blockcnt += blocks[i];          /* increment blockcnt over labels */
 | 
						|
        blocks[i] = blockcnt;
 | 
						|
    }
 | 
						|
    return blocks;
 | 
						|
}
 | 
						|
 | 
						|
/* Perform basic peephole optimizations to components of a code object.
 | 
						|
   The consts object should still be in list form to allow new constants
 | 
						|
   to be appended.
 | 
						|
 | 
						|
   To keep the optimizer simple, it bails when the lineno table has complex
 | 
						|
   encoding for gaps >= 255.
 | 
						|
 | 
						|
   Optimizations are restricted to simple transformations occurring within a
 | 
						|
   single basic block.  All transformations keep the code size the same or
 | 
						|
   smaller.  For those that reduce size, the gaps are initially filled with
 | 
						|
   NOPs.  Later those NOPs are removed and the jump addresses retargeted in
 | 
						|
   a single pass. */
 | 
						|
 | 
						|
PyObject *
 | 
						|
PyCode_Optimize(PyObject *code, PyObject* consts, PyObject *names,
 | 
						|
                PyObject *lnotab_obj)
 | 
						|
{
 | 
						|
    Py_ssize_t h, i, nexti, op_start, codelen, tgt;
 | 
						|
    unsigned int j, nops;
 | 
						|
    unsigned char opcode, nextop;
 | 
						|
    _Py_CODEUNIT *codestr = NULL;
 | 
						|
    unsigned char *lnotab;
 | 
						|
    unsigned int cum_orig_offset, last_offset;
 | 
						|
    Py_ssize_t tabsiz;
 | 
						|
    PyObject **const_stack = NULL;
 | 
						|
    Py_ssize_t const_stack_top = -1;
 | 
						|
    Py_ssize_t const_stack_size = 0;
 | 
						|
    int in_consts = 0;  /* whether we are in a LOAD_CONST sequence */
 | 
						|
    unsigned int *blocks = NULL;
 | 
						|
 | 
						|
    /* Bail out if an exception is set */
 | 
						|
    if (PyErr_Occurred())
 | 
						|
        goto exitError;
 | 
						|
 | 
						|
    /* Bypass optimization when the lnotab table is too complex */
 | 
						|
    assert(PyBytes_Check(lnotab_obj));
 | 
						|
    lnotab = (unsigned char*)PyBytes_AS_STRING(lnotab_obj);
 | 
						|
    tabsiz = PyBytes_GET_SIZE(lnotab_obj);
 | 
						|
    assert(tabsiz == 0 || Py_REFCNT(lnotab_obj) == 1);
 | 
						|
    if (memchr(lnotab, 255, tabsiz) != NULL) {
 | 
						|
        /* 255 value are used for multibyte bytecode instructions */
 | 
						|
        goto exitUnchanged;
 | 
						|
    }
 | 
						|
    /* Note: -128 and 127 special values for line number delta are ok,
 | 
						|
       the peephole optimizer doesn't modify line numbers. */
 | 
						|
 | 
						|
    assert(PyBytes_Check(code));
 | 
						|
    codelen = PyBytes_GET_SIZE(code);
 | 
						|
    assert(codelen % sizeof(_Py_CODEUNIT) == 0);
 | 
						|
 | 
						|
    /* Make a modifiable copy of the code string */
 | 
						|
    codestr = (_Py_CODEUNIT *)PyMem_Malloc(codelen);
 | 
						|
    if (codestr == NULL) {
 | 
						|
        PyErr_NoMemory();
 | 
						|
        goto exitError;
 | 
						|
    }
 | 
						|
    memcpy(codestr, PyBytes_AS_STRING(code), codelen);
 | 
						|
    codelen /= sizeof(_Py_CODEUNIT);
 | 
						|
 | 
						|
    blocks = markblocks(codestr, codelen);
 | 
						|
    if (blocks == NULL)
 | 
						|
        goto exitError;
 | 
						|
    assert(PyList_Check(consts));
 | 
						|
 | 
						|
    CONST_STACK_CREATE();
 | 
						|
 | 
						|
    for (i=find_op(codestr, 0) ; i<codelen ; i=nexti) {
 | 
						|
        opcode = _Py_OPCODE(codestr[i]);
 | 
						|
        op_start = i;
 | 
						|
        while (op_start >= 1 && _Py_OPCODE(codestr[op_start-1]) == EXTENDED_ARG) {
 | 
						|
            op_start--;
 | 
						|
        }
 | 
						|
 | 
						|
        nexti = i + 1;
 | 
						|
        while (nexti < codelen && _Py_OPCODE(codestr[nexti]) == EXTENDED_ARG)
 | 
						|
            nexti++;
 | 
						|
        nextop = nexti < codelen ? _Py_OPCODE(codestr[nexti]) : 0;
 | 
						|
 | 
						|
        if (!in_consts) {
 | 
						|
            CONST_STACK_RESET();
 | 
						|
        }
 | 
						|
        in_consts = 0;
 | 
						|
 | 
						|
        switch (opcode) {
 | 
						|
                /* not a is b -->  a is not b
 | 
						|
                   not a in b -->  a not in b
 | 
						|
                   not a is not b -->  a is b
 | 
						|
                   not a not in b -->  a in b
 | 
						|
                */
 | 
						|
            case COMPARE_OP:
 | 
						|
                j = get_arg(codestr, i);
 | 
						|
                if (j < 6 || j > 9 ||
 | 
						|
                    nextop != UNARY_NOT ||
 | 
						|
                    !ISBASICBLOCK(blocks, op_start, i + 1))
 | 
						|
                    break;
 | 
						|
                codestr[i] = PACKOPARG(opcode, j^1);
 | 
						|
                fill_nops(codestr, i + 1, nexti + 1);
 | 
						|
                break;
 | 
						|
 | 
						|
                /* Skip over LOAD_CONST trueconst
 | 
						|
                   POP_JUMP_IF_FALSE xx.  This improves
 | 
						|
                   "while 1" performance.  */
 | 
						|
            case LOAD_CONST:
 | 
						|
                CONST_STACK_PUSH_OP(i);
 | 
						|
                if (nextop != POP_JUMP_IF_FALSE  ||
 | 
						|
                    !ISBASICBLOCK(blocks, op_start, i + 1)  ||
 | 
						|
                    !PyObject_IsTrue(PyList_GET_ITEM(consts, get_arg(codestr, i))))
 | 
						|
                    break;
 | 
						|
                fill_nops(codestr, op_start, nexti + 1);
 | 
						|
                CONST_STACK_POP(1);
 | 
						|
                break;
 | 
						|
 | 
						|
                /* Try to fold tuples of constants (includes a case for lists
 | 
						|
                   and sets which are only used for "in" and "not in" tests).
 | 
						|
                   Skip over BUILD_SEQN 1 UNPACK_SEQN 1.
 | 
						|
                   Replace BUILD_SEQN 2 UNPACK_SEQN 2 with ROT2.
 | 
						|
                   Replace BUILD_SEQN 3 UNPACK_SEQN 3 with ROT3 ROT2. */
 | 
						|
            case BUILD_TUPLE:
 | 
						|
            case BUILD_LIST:
 | 
						|
            case BUILD_SET:
 | 
						|
                j = get_arg(codestr, i);
 | 
						|
                if (j > 0 && CONST_STACK_LEN() >= j) {
 | 
						|
                    h = lastn_const_start(codestr, op_start, j);
 | 
						|
                    if ((opcode == BUILD_TUPLE &&
 | 
						|
                          ISBASICBLOCK(blocks, h, op_start)) ||
 | 
						|
                         ((opcode == BUILD_LIST || opcode == BUILD_SET) &&
 | 
						|
                          ((nextop==COMPARE_OP &&
 | 
						|
                          (_Py_OPARG(codestr[nexti]) == PyCmp_IN ||
 | 
						|
                           _Py_OPARG(codestr[nexti]) == PyCmp_NOT_IN)) ||
 | 
						|
                          nextop == GET_ITER) && ISBASICBLOCK(blocks, h, i + 1))) {
 | 
						|
                        h = fold_tuple_on_constants(codestr, h, i + 1, opcode,
 | 
						|
                                                    consts, CONST_STACK_LASTN(j), j);
 | 
						|
                        if (h >= 0) {
 | 
						|
                            CONST_STACK_POP(j);
 | 
						|
                            CONST_STACK_PUSH_OP(h);
 | 
						|
                        }
 | 
						|
                        break;
 | 
						|
                    }
 | 
						|
                }
 | 
						|
                if (nextop != UNPACK_SEQUENCE  ||
 | 
						|
                    !ISBASICBLOCK(blocks, op_start, i + 1) ||
 | 
						|
                    j != get_arg(codestr, nexti) ||
 | 
						|
                    opcode == BUILD_SET)
 | 
						|
                    break;
 | 
						|
                if (j < 2) {
 | 
						|
                    fill_nops(codestr, op_start, nexti + 1);
 | 
						|
                } else if (j == 2) {
 | 
						|
                    codestr[op_start] = PACKOPARG(ROT_TWO, 0);
 | 
						|
                    fill_nops(codestr, op_start + 1, nexti + 1);
 | 
						|
                    CONST_STACK_RESET();
 | 
						|
                } else if (j == 3) {
 | 
						|
                    codestr[op_start] = PACKOPARG(ROT_THREE, 0);
 | 
						|
                    codestr[op_start + 1] = PACKOPARG(ROT_TWO, 0);
 | 
						|
                    fill_nops(codestr, op_start + 2, nexti + 1);
 | 
						|
                    CONST_STACK_RESET();
 | 
						|
                }
 | 
						|
                break;
 | 
						|
 | 
						|
                /* Simplify conditional jump to conditional jump where the
 | 
						|
                   result of the first test implies the success of a similar
 | 
						|
                   test or the failure of the opposite test.
 | 
						|
                   Arises in code like:
 | 
						|
                   "a and b or c"
 | 
						|
                   "(a and b) and c"
 | 
						|
                   "(a or b) or c"
 | 
						|
                   "(a or b) and c"
 | 
						|
                   x:JUMP_IF_FALSE_OR_POP y   y:JUMP_IF_FALSE_OR_POP z
 | 
						|
                      -->  x:JUMP_IF_FALSE_OR_POP z
 | 
						|
                   x:JUMP_IF_FALSE_OR_POP y   y:JUMP_IF_TRUE_OR_POP z
 | 
						|
                      -->  x:POP_JUMP_IF_FALSE y+1
 | 
						|
                   where y+1 is the instruction following the second test.
 | 
						|
                */
 | 
						|
            case JUMP_IF_FALSE_OR_POP:
 | 
						|
            case JUMP_IF_TRUE_OR_POP:
 | 
						|
                h = get_arg(codestr, i) / sizeof(_Py_CODEUNIT);
 | 
						|
                tgt = find_op(codestr, h);
 | 
						|
 | 
						|
                j = _Py_OPCODE(codestr[tgt]);
 | 
						|
                if (CONDITIONAL_JUMP(j)) {
 | 
						|
                    /* NOTE: all possible jumps here are absolute. */
 | 
						|
                    if (JUMPS_ON_TRUE(j) == JUMPS_ON_TRUE(opcode)) {
 | 
						|
                        /* The second jump will be taken iff the first is.
 | 
						|
                           The current opcode inherits its target's
 | 
						|
                           stack effect */
 | 
						|
                        h = set_arg(codestr, i, get_arg(codestr, tgt));
 | 
						|
                    } else {
 | 
						|
                        /* The second jump is not taken if the first is (so
 | 
						|
                           jump past it), and all conditional jumps pop their
 | 
						|
                           argument when they're not taken (so change the
 | 
						|
                           first jump to pop its argument when it's taken). */
 | 
						|
                        h = set_arg(codestr, i, (tgt + 1) * sizeof(_Py_CODEUNIT));
 | 
						|
                        j = opcode == JUMP_IF_TRUE_OR_POP ?
 | 
						|
                            POP_JUMP_IF_TRUE : POP_JUMP_IF_FALSE;
 | 
						|
                    }
 | 
						|
 | 
						|
                    if (h >= 0) {
 | 
						|
                        nexti = h;
 | 
						|
                        codestr[nexti] = PACKOPARG(j, _Py_OPARG(codestr[nexti]));
 | 
						|
                        break;
 | 
						|
                    }
 | 
						|
                }
 | 
						|
                /* Intentional fallthrough */
 | 
						|
 | 
						|
                /* Replace jumps to unconditional jumps */
 | 
						|
            case POP_JUMP_IF_FALSE:
 | 
						|
            case POP_JUMP_IF_TRUE:
 | 
						|
            case FOR_ITER:
 | 
						|
            case JUMP_FORWARD:
 | 
						|
            case JUMP_ABSOLUTE:
 | 
						|
            case CONTINUE_LOOP:
 | 
						|
            case SETUP_LOOP:
 | 
						|
            case SETUP_EXCEPT:
 | 
						|
            case SETUP_FINALLY:
 | 
						|
            case SETUP_WITH:
 | 
						|
            case SETUP_ASYNC_WITH:
 | 
						|
                h = GETJUMPTGT(codestr, i);
 | 
						|
                tgt = find_op(codestr, h);
 | 
						|
                /* Replace JUMP_* to a RETURN into just a RETURN */
 | 
						|
                if (UNCONDITIONAL_JUMP(opcode) &&
 | 
						|
                    _Py_OPCODE(codestr[tgt]) == RETURN_VALUE) {
 | 
						|
                    codestr[op_start] = PACKOPARG(RETURN_VALUE, 0);
 | 
						|
                    fill_nops(codestr, op_start + 1, i + 1);
 | 
						|
                } else if (UNCONDITIONAL_JUMP(_Py_OPCODE(codestr[tgt]))) {
 | 
						|
                    j = GETJUMPTGT(codestr, tgt);
 | 
						|
                    if (opcode == JUMP_FORWARD) { /* JMP_ABS can go backwards */
 | 
						|
                        opcode = JUMP_ABSOLUTE;
 | 
						|
                    } else if (!ABSOLUTE_JUMP(opcode)) {
 | 
						|
                        if ((Py_ssize_t)j < i + 1) {
 | 
						|
                            break;           /* No backward relative jumps */
 | 
						|
                        }
 | 
						|
                        j -= i + 1;          /* Calc relative jump addr */
 | 
						|
                    }
 | 
						|
                    j *= sizeof(_Py_CODEUNIT);
 | 
						|
                    copy_op_arg(codestr, op_start, opcode, j, i + 1);
 | 
						|
                }
 | 
						|
                break;
 | 
						|
 | 
						|
                /* Remove unreachable ops after RETURN */
 | 
						|
            case RETURN_VALUE:
 | 
						|
                h = i + 1;
 | 
						|
                while (h < codelen && ISBASICBLOCK(blocks, i, h)) {
 | 
						|
                    h++;
 | 
						|
                }
 | 
						|
                if (h > i + 1) {
 | 
						|
                    fill_nops(codestr, i + 1, h);
 | 
						|
                    nexti = find_op(codestr, h);
 | 
						|
                }
 | 
						|
                break;
 | 
						|
        }
 | 
						|
    }
 | 
						|
 | 
						|
    /* Fixup lnotab */
 | 
						|
    for (i = 0, nops = 0; i < codelen; i++) {
 | 
						|
        assert(i - nops <= INT_MAX);
 | 
						|
        /* original code offset => new code offset */
 | 
						|
        blocks[i] = i - nops;
 | 
						|
        if (_Py_OPCODE(codestr[i]) == NOP)
 | 
						|
            nops++;
 | 
						|
    }
 | 
						|
    cum_orig_offset = 0;
 | 
						|
    last_offset = 0;
 | 
						|
    for (i=0 ; i < tabsiz ; i+=2) {
 | 
						|
        unsigned int offset_delta, new_offset;
 | 
						|
        cum_orig_offset += lnotab[i];
 | 
						|
        assert(cum_orig_offset % sizeof(_Py_CODEUNIT) == 0);
 | 
						|
        new_offset = blocks[cum_orig_offset / sizeof(_Py_CODEUNIT)] *
 | 
						|
                sizeof(_Py_CODEUNIT);
 | 
						|
        offset_delta = new_offset - last_offset;
 | 
						|
        assert(offset_delta <= 255);
 | 
						|
        lnotab[i] = (unsigned char)offset_delta;
 | 
						|
        last_offset = new_offset;
 | 
						|
    }
 | 
						|
 | 
						|
    /* Remove NOPs and fixup jump targets */
 | 
						|
    for (op_start = i = h = 0; i < codelen; i++, op_start = i) {
 | 
						|
        j = _Py_OPARG(codestr[i]);
 | 
						|
        while (_Py_OPCODE(codestr[i]) == EXTENDED_ARG) {
 | 
						|
            i++;
 | 
						|
            j = j<<8 | _Py_OPARG(codestr[i]);
 | 
						|
        }
 | 
						|
        opcode = _Py_OPCODE(codestr[i]);
 | 
						|
        switch (opcode) {
 | 
						|
            case NOP:continue;
 | 
						|
 | 
						|
            case JUMP_ABSOLUTE:
 | 
						|
            case CONTINUE_LOOP:
 | 
						|
            case POP_JUMP_IF_FALSE:
 | 
						|
            case POP_JUMP_IF_TRUE:
 | 
						|
            case JUMP_IF_FALSE_OR_POP:
 | 
						|
            case JUMP_IF_TRUE_OR_POP:
 | 
						|
                j = blocks[j / sizeof(_Py_CODEUNIT)] * sizeof(_Py_CODEUNIT);
 | 
						|
                break;
 | 
						|
 | 
						|
            case FOR_ITER:
 | 
						|
            case JUMP_FORWARD:
 | 
						|
            case SETUP_LOOP:
 | 
						|
            case SETUP_EXCEPT:
 | 
						|
            case SETUP_FINALLY:
 | 
						|
            case SETUP_WITH:
 | 
						|
            case SETUP_ASYNC_WITH:
 | 
						|
                j = blocks[j / sizeof(_Py_CODEUNIT) + i + 1] - blocks[i] - 1;
 | 
						|
                j *= sizeof(_Py_CODEUNIT);
 | 
						|
                break;
 | 
						|
        }
 | 
						|
        nexti = i - op_start + 1;
 | 
						|
        if (instrsize(j) > nexti)
 | 
						|
            goto exitUnchanged;
 | 
						|
        /* If instrsize(j) < nexti, we'll emit EXTENDED_ARG 0 */
 | 
						|
        write_op_arg(codestr + h, opcode, j, nexti);
 | 
						|
        h += nexti;
 | 
						|
    }
 | 
						|
    assert(h + (Py_ssize_t)nops == codelen);
 | 
						|
 | 
						|
    CONST_STACK_DELETE();
 | 
						|
    PyMem_Free(blocks);
 | 
						|
    code = PyBytes_FromStringAndSize((char *)codestr, h * sizeof(_Py_CODEUNIT));
 | 
						|
    PyMem_Free(codestr);
 | 
						|
    return code;
 | 
						|
 | 
						|
 exitError:
 | 
						|
    code = NULL;
 | 
						|
 | 
						|
 exitUnchanged:
 | 
						|
    Py_XINCREF(code);
 | 
						|
    CONST_STACK_DELETE();
 | 
						|
    PyMem_Free(blocks);
 | 
						|
    PyMem_Free(codestr);
 | 
						|
    return code;
 | 
						|
}
 |