Commit b0e93d19 authored by Kevin Modzelewski's avatar Kevin Modzelewski

Improve tuple unpacking behavior

- Use the right unpacking protocol (ie don't check __len__, just try to iterate)
- Handle unpacking exceptions appropriately
- Expand the targets of assigns correctly (think: f().x = 1)
-- this was not just for tuples but came up here first; this also was broken:
[0 for i in xrange(5)][0] = 1
(silly but legal)
parent 1fbf29e8
......@@ -353,7 +353,7 @@ private:
ConcreteCompilerVariable* rtn = new ConcreteCompilerVariable(DICT, v, true);
for (auto& p : symbol_table) {
if (p.first[0] == '!')
if (p.first[0] == '!' || p.first[0] == '#')
continue;
ConcreteCompilerVariable* is_defined_var = static_cast<ConcreteCompilerVariable*>(
......@@ -1260,14 +1260,33 @@ private:
void _doUnpackTuple(AST_Tuple* target, CompilerVariable* val, ExcInfo exc_info) {
assert(state != PARTIAL);
int ntargets = target->elts.size();
// TODO do type recording here?
ConcreteCompilerVariable* len = val->len(emitter, getEmptyOpInfo(exc_info));
emitter.createCall2(exc_info, g.funcs.checkUnpackingLength, getConstantInt(ntargets, g.i64), len->getValue());
// TODO can do faster unpacking of non-instantiated tuples; ie for something like
// a, b = 1, 2
// We shouldn't need to do any runtime error checking or allocations
#ifndef NDEBUG
for (auto e : target->elts) {
ASSERT(e->type == AST_TYPE::Name && ast_cast<AST_Name>(e)->id[0] == '#',
"should only be unpacking tuples into cfg-generated names!");
}
#endif
ConcreteCompilerVariable* converted_val = val->makeConverted(emitter, val->getBoxType());
llvm::Value* unpacked = emitter.createCall2(exc_info, g.funcs.unpackIntoArray, converted_val->getValue(),
getConstantInt(ntargets, g.i64)).getInstruction();
assert(unpacked->getType() == g.llvm_value_type_ptr->getPointerTo());
converted_val->decvref(emitter);
for (int i = 0; i < ntargets; i++) {
CompilerVariable* unpacked = val->getitem(emitter, getEmptyOpInfo(exc_info), makeInt(i));
_doSet(target->elts[i], unpacked, exc_info);
unpacked->decvref(emitter);
llvm::Value* ptr = emitter.getBuilder()->CreateConstGEP1_32(unpacked, i);
llvm::Value* val = emitter.getBuilder()->CreateLoad(ptr);
assert(val->getType() == g.llvm_value_type_ptr);
CompilerVariable* thisval = new ConcreteCompilerVariable(UNKNOWN, val, true);
_doSet(target->elts[i], thisval, exc_info);
thisval->decvref(emitter);
}
}
......
......@@ -200,7 +200,7 @@ void initGlobalFuncs(GlobalState& g) {
GET(yield);
GET(getiter);
GET(checkUnpackingLength);
GET(unpackIntoArray);
GET(raiseAttributeError);
GET(raiseAttributeErrorStr);
GET(raiseNotIterableError);
......
......@@ -39,7 +39,7 @@ struct GlobalFuncs {
*unboxedLen, *getitem, *getclsattr, *getGlobal, *setitem, *unaryop, *import, *importFrom, *importStar, *repr,
*str, *isinstance, *yield, *getiter;
llvm::Value* checkUnpackingLength, *raiseAttributeError, *raiseAttributeErrorStr, *raiseNotIterableError,
llvm::Value* unpackIntoArray, *raiseAttributeError, *raiseAttributeErrorStr, *raiseNotIterableError,
*assertNameDefined, *assertFail;
llvm::Value* printFloat, *listAppendInternal;
llvm::Value* runtimeCall0, *runtimeCall1, *runtimeCall2, *runtimeCall3, *runtimeCall;
......
......@@ -914,6 +914,7 @@ public:
// but aren't directly *exactly* representable as normal Python.
// ClsAttribute would fall into this category, as would isinstance (which
// is not the same as the "isinstance" name since that could get redefined).
// These are basically bytecodes, framed as pseudo-AST-nodes.
class AST_LangPrimitive : public AST_expr {
public:
enum Opcodes {
......
......@@ -97,7 +97,7 @@ private:
assert(value);
CFGBlock* rtn_dest = getReturn();
if (rtn_dest != NULL) {
push_back(makeAssign("#rtnval", value));
pushAssign("#rtnval", value);
AST_Jump* j = makeJump();
j->target = rtn_dest;
......@@ -142,7 +142,7 @@ private:
template <typename ResultASTType, typename CompType> AST_expr* remapComprehension(CompType* node) {
std::string rtn_name = nodeName(node);
push_back(makeAssign(rtn_name, new ResultASTType()));
pushAssign(rtn_name, new ResultASTType());
std::vector<CFGBlock*> exit_blocks;
// Where the current level should jump to after finishing its iteration.
......@@ -159,8 +159,7 @@ private:
AST_LangPrimitive* iter_call = new AST_LangPrimitive(AST_LangPrimitive::GET_ITER);
iter_call->args.push_back(remapped_iter);
std::string iter_name = nodeName(node, "lc_iter", i);
AST_stmt* iter_assign = makeAssign(iter_name, iter_call);
push_back(iter_assign);
pushAssign(iter_name, iter_call);
// TODO bad to save these like this?
AST_expr* hasnext_attr = makeLoadAttribute(makeName(iter_name, AST_TYPE::Load), "__hasnext__", true);
......@@ -198,8 +197,8 @@ private:
push_back(br);
curblock = body_block;
push_back(makeAssign(nodeName(next_attr), makeCall(next_attr)));
push_back(makeAssign(c->target, makeName(nodeName(next_attr), AST_TYPE::Load)));
pushAssign(nodeName(next_attr), makeCall(next_attr));
pushAssign(c->target, makeName(nodeName(next_attr), AST_TYPE::Load));
for (AST_expr* if_condition : c->ifs) {
AST_expr* remapped = remapExpr(if_condition);
......@@ -340,19 +339,69 @@ private:
return call;
}
AST_stmt* makeAssign(AST_expr* target, AST_expr* val) {
void pushAssign(AST_expr* target, AST_expr* val) {
AST_Assign* assign = new AST_Assign();
assign->targets.push_back(target);
assign->value = val;
assign->col_offset = val->col_offset;
assign->lineno = val->lineno;
return assign;
if (target->type == AST_TYPE::Name) {
assign->targets.push_back(target);
push_back(assign);
} else if (target->type == AST_TYPE::Subscript) {
AST_Subscript* s = ast_cast<AST_Subscript>(target);
assert(s->ctx_type == AST_TYPE::Store);
AST_Subscript* s_target = new AST_Subscript();
s_target->value = remapExpr(s->value);
s_target->slice = remapExpr(s->slice);
s_target->ctx_type = AST_TYPE::Store;
s_target->col_offset = s->col_offset;
s_target->lineno = s->lineno;
assign->targets.push_back(s_target);
push_back(assign);
} else if (target->type == AST_TYPE::Attribute) {
AST_Attribute* a = ast_cast<AST_Attribute>(target);
assert(a->ctx_type == AST_TYPE::Store);
AST_Attribute* a_target = new AST_Attribute();
a_target->value = remapExpr(a->value);
a_target->attr = a->attr;
a_target->ctx_type = AST_TYPE::Store;
a_target->col_offset = a->col_offset;
a_target->lineno = a->lineno;
assign->targets.push_back(a_target);
push_back(assign);
} else if (target->type == AST_TYPE::Tuple) {
AST_Tuple* old_target = ast_cast<AST_Tuple>(target);
AST_Tuple* new_target = new AST_Tuple();
new_target->ctx_type = old_target->ctx_type;
new_target->lineno = old_target->lineno;
new_target->col_offset = old_target->col_offset;
// A little hackery: push the assign, even though we're not done constructing it yet,
// so that we can iteratively push more stuff after it
assign->targets.push_back(new_target);
push_back(assign);
for (int i = 0; i < old_target->elts.size(); i++) {
std::string tmp_name = nodeName(target, "", i);
new_target->elts.push_back(makeName(tmp_name, AST_TYPE::Store));
pushAssign(old_target->elts[i], makeName(tmp_name, AST_TYPE::Load));
}
} else {
RELEASE_ASSERT(0, "%d", target->type);
}
}
AST_stmt* makeAssign(const std::string& id, AST_expr* val) {
void pushAssign(const std::string& id, AST_expr* val) {
assert(val);
AST_expr* name = makeName(id, AST_TYPE::Store, val->lineno, 0);
return makeAssign(name, val);
pushAssign(name, val);
}
AST_stmt* makeExpr(AST_expr* expr) {
......@@ -371,7 +420,7 @@ private:
return std::string(buf);
}
std::string nodeName(AST_expr* node, const std::string& suffix, int idx) {
std::string nodeName(AST* node, const std::string& suffix, int idx) {
char buf[50];
snprintf(buf, 50, "#%p_%s_%d", node, suffix.c_str(), idx);
return std::string(buf);
......@@ -406,7 +455,7 @@ private:
for (int i = 0; i < node->values.size() - 1; i++) {
AST_expr* val = remapExpr(node->values[i]);
push_back(makeAssign(name, val));
pushAssign(name, val);
AST_Branch* br = new AST_Branch();
br->test = val;
......@@ -436,7 +485,7 @@ private:
}
AST_expr* final_val = remapExpr(node->values[node->values.size() - 1]);
push_back(makeAssign(name, final_val));
pushAssign(name, final_val);
AST_Jump* j = new AST_Jump();
push_back(j);
......@@ -523,7 +572,7 @@ private:
val->comparators.push_back(right);
val->ops.push_back(node->ops[i]);
push_back(makeAssign(name, val));
pushAssign(name, val);
AST_Branch* br = new AST_Branch();
br->test = makeName(name, AST_TYPE::Load);
......@@ -651,7 +700,7 @@ private:
br->iftrue = iftrue;
starting_block->connectTo(iftrue);
curblock = iftrue;
push_back(makeAssign(rtn_name, remapExpr(node->body)));
pushAssign(rtn_name, remapExpr(node->body));
AST_Jump* jtrue = new AST_Jump();
push_back(jtrue);
CFGBlock* endtrue = curblock;
......@@ -661,7 +710,7 @@ private:
br->iffalse = iffalse;
starting_block->connectTo(iffalse);
curblock = iffalse;
push_back(makeAssign(rtn_name, remapExpr(node->orelse)));
pushAssign(rtn_name, remapExpr(node->orelse));
AST_Jump* jfalse = new AST_Jump();
push_back(jfalse);
CFGBlock* endfalse = curblock;
......@@ -877,7 +926,7 @@ private:
if (wrap_with_assign && (rtn->type != AST_TYPE::Name || ast_cast<AST_Name>(rtn)->id[0] != '#')) {
std::string name = nodeName(node);
push_back(makeAssign(name, rtn));
pushAssign(name, rtn);
return makeName(name, AST_TYPE::Load);
} else {
return rtn;
......@@ -963,7 +1012,10 @@ public:
ExcBlockInfo& exc_info = exc_handlers.back();
curblock = exc_dest;
curblock->push_back(makeAssign(exc_info.exc_obj_name, new AST_LangPrimitive(AST_LangPrimitive::LANDINGPAD)));
AST_Assign* exc_asgn = new AST_Assign();
exc_asgn->targets.push_back(makeName(exc_info.exc_obj_name, AST_TYPE::Store));
exc_asgn->value = new AST_LangPrimitive(AST_LangPrimitive::LANDINGPAD);
curblock->push_back(exc_asgn);
AST_Jump* j = new AST_Jump();
j->target = exc_info.exc_dest;
......@@ -1083,12 +1135,7 @@ public:
AST_expr* remapped_value = remapExpr(node->value);
for (AST_expr* target : node->targets) {
AST_Assign* remapped = new AST_Assign();
remapped->lineno = node->lineno;
remapped->col_offset = node->col_offset;
remapped->value = remapped_value;
remapped->targets.push_back(target);
push_back(remapped);
pushAssign(target, remapped_value);
}
return true;
}
......@@ -1119,7 +1166,7 @@ public:
case AST_TYPE::Name: {
AST_Name* n = ast_cast<AST_Name>(node->target);
assert(n->ctx_type == AST_TYPE::Store);
push_back(makeAssign(nodeName(n), makeName(n->id, AST_TYPE::Load)));
pushAssign(nodeName(n), makeName(n->id, AST_TYPE::Load));
remapped_target = n;
remapped_lhs = makeName(nodeName(n), AST_TYPE::Load);
break;
......@@ -1179,8 +1226,8 @@ public:
binop->col_offset = node->col_offset;
binop->lineno = node->lineno;
push_back(makeAssign(nodeName(node), binop));
push_back(makeAssign(remapped_target, makeName(nodeName(node), AST_TYPE::Load)));
pushAssign(nodeName(node), binop);
pushAssign(remapped_target, makeName(nodeName(node), AST_TYPE::Load));
return true;
}
......@@ -1445,8 +1492,7 @@ public:
char itername_buf[80];
snprintf(itername_buf, 80, "#iter_%p", node);
AST_stmt* iter_assign = makeAssign(itername_buf, iter_call);
push_back(iter_assign);
pushAssign(itername_buf, iter_call);
AST_expr* hasnext_attr = makeLoadAttribute(makeName(itername_buf, AST_TYPE::Load), "__hasnext__", true);
AST_expr* next_attr = makeLoadAttribute(makeName(itername_buf, AST_TYPE::Load), "next", true);
......@@ -1490,8 +1536,8 @@ public:
pushLoop(test_block, end_block);
curblock = loop_block;
push_back(makeAssign(nodeName(next_attr), makeCall(next_attr)));
push_back(makeAssign(node->target, makeName(nodeName(next_attr), AST_TYPE::Load)));
pushAssign(nodeName(next_attr), makeCall(next_attr));
pushAssign(node->target, makeName(nodeName(next_attr), AST_TYPE::Load));
for (int i = 0; i < node->body.size(); i++) {
node->body[i]->accept(this);
......@@ -1627,7 +1673,7 @@ public:
}
if (exc_handler->name) {
push_back(makeAssign(exc_handler->name, exc_obj));
pushAssign(exc_handler->name, exc_obj);
}
for (AST_stmt* subnode : exc_handler->body) {
......@@ -1674,15 +1720,15 @@ public:
char exitname_buf[80];
snprintf(exitname_buf, 80, "#exit_%p", node);
push_back(makeAssign(ctxmgrname_buf, remapExpr(node->context_expr)));
pushAssign(ctxmgrname_buf, remapExpr(node->context_expr));
AST_expr* enter = makeLoadAttribute(makeName(ctxmgrname_buf, AST_TYPE::Load), "__enter__", true);
AST_expr* exit = makeLoadAttribute(makeName(ctxmgrname_buf, AST_TYPE::Load), "__exit__", true);
push_back(makeAssign(exitname_buf, exit));
pushAssign(exitname_buf, exit);
enter = makeCall(enter);
if (node->optional_vars) {
push_back(makeAssign(node->optional_vars, enter));
pushAssign(node->optional_vars, enter);
} else {
push_back(makeExpr(enter));
}
......
......@@ -92,7 +92,7 @@ void force() {
FORCE(yield);
FORCE(getiter);
FORCE(checkUnpackingLength);
FORCE(unpackIntoArray);
FORCE(raiseAttributeError);
FORCE(raiseAttributeErrorStr);
FORCE(raiseNotIterableError);
......
......@@ -368,7 +368,7 @@ extern "C" void raiseNotIterableError(const char* typeName) {
raiseExcHelper(TypeError, "'%s' object is not iterable", typeName);
}
extern "C" void checkUnpackingLength(i64 expected, i64 given) {
static void _checkUnpackingLength(i64 expected, i64 given) {
if (given == expected)
return;
......@@ -382,6 +382,32 @@ extern "C" void checkUnpackingLength(i64 expected, i64 given) {
}
}
extern "C" Box** unpackIntoArray(Box* obj, int64_t expected_size) {
assert(expected_size > 0);
if (obj->cls == tuple_cls) {
BoxedTuple* t = static_cast<BoxedTuple*>(obj);
_checkUnpackingLength(expected_size, t->elts.size());
return &t->elts[0];
}
if (obj->cls == list_cls) {
BoxedList* l = static_cast<BoxedList*>(obj);
_checkUnpackingLength(expected_size, l->size);
return &l->elts->elts[0];
}
BoxedTuple::GCVector elts;
for (auto e : obj->pyElements()) {
elts.push_back(e);
if (elts.size() > expected_size)
break;
}
_checkUnpackingLength(expected_size, elts.size());
return &elts[0];
}
BoxedClass::BoxedClass(BoxedClass* metaclass, BoxedClass* base, gcvisit_func gc_visit, int attrs_offset,
int instance_size, bool is_user_defined)
: BoxVar(metaclass, 0), tp_basicsize(instance_size), tp_dealloc(NULL), base(base), gc_visit(gc_visit),
......@@ -3216,6 +3242,12 @@ extern "C" Box* getiter(Box* o) {
raiseExcHelper(TypeError, "'%s' object is not iterable", getTypeName(o)->c_str());
}
llvm::iterator_range<BoxIterator> Box::pyElements() {
Box* iter = getiter(this);
assert(iter);
return llvm::iterator_range<BoxIterator>(++BoxIterator(iter), BoxIterator(nullptr));
}
// For use on __init__ return values
static void assertInitNone(Box* obj) {
if (obj != None) {
......
......@@ -78,7 +78,7 @@ extern "C" Box* unaryop(Box* operand, int op_type);
extern "C" Box* import(const std::string* name);
extern "C" Box* importFrom(Box* obj, const std::string* attr);
extern "C" void importStar(Box* from_module, BoxedModule* to_module);
extern "C" void checkUnpackingLength(i64 expected, i64 given);
extern "C" Box** unpackIntoArray(Box* obj, int64_t expected_size);
extern "C" void assertNameDefined(bool b, const char* name, BoxedClass* exc_cls, bool local_var_msg);
extern "C" void assertFail(BoxedModule* inModule, Box* msg);
extern "C" bool isSubclass(BoxedClass* child, BoxedClass* parent);
......
......@@ -81,17 +81,6 @@ void BoxIterator::gcHandler(GCVisitor* v) {
v->visitPotential(value);
}
llvm::iterator_range<BoxIterator> Box::pyElements() {
static std::string iter_str("__iter__");
Box* iter = callattr(const_cast<Box*>(this), &iter_str, true, ArgPassSpec(0), NULL, NULL, NULL, NULL, NULL);
if (iter) {
return llvm::iterator_range<BoxIterator>(++BoxIterator(iter), BoxIterator(nullptr));
}
raiseExcHelper(TypeError, "'%s' object is not iterable", getTypeName(this)->c_str());
}
std::string builtinStr("__builtin__");
extern "C" BoxedFunction::BoxedFunction(CLFunction* f)
......
# run_args: -n
# statcheck: stats['slowpath_unboxedlen'] < 10
d = {}
for i in xrange(1000):
d[i] = i ** 2
......
# expected: fail
# - we currently can't even compile this correctly
#
# The unpacking should be atomic: ie either all of the names get set or none of them do.
# We currently assume that unpacking can only throw an exception from the tuple being the
# wrong length, but instead we should be emulating the UNPACK_SEQUENCE bytecode.
# Test the behavior of tuple unpacking in the face of exceptions being thrown at certain points.
# - If an exception gets thrown in the "unpack to a given size" part, none of the targets get set
# - If setting a target throws an exception, then the previous targets had been set, but not the future ones
class C(object):
def __init__(self, n):
self.n = n
def __getitem__(self, i):
print "__getitem__", i
if i == 0:
return 1
if i < self.n:
return i
raise IndexError
def __len__(self):
print "len"
return 2
def f():
def f1():
print "f1"
try:
x, y = C()
except ValueError:
pass
x, y = C(1)
except ValueError, e:
print e
try:
print x
......@@ -30,5 +31,76 @@ def f():
print y
except NameError, e:
print e
f1()
def f2():
print "f2"
class D(object):
pass
d = D()
def f():
print "f"
return d
try:
f().x, f().y = C(1)
except ValueError, e:
print e
print hasattr(d, "x")
print hasattr(d, "y")
f2()
def f3():
print "f3"
class D(object):
pass
d = D()
def f(should_raise):
print "f", should_raise
if should_raise:
1/0
return d
try:
f(False).x, f(True).y, f(False).z = (1, 2, 3)
except ZeroDivisionError, e:
print e
print hasattr(d, "x")
print hasattr(d, "y")
print hasattr(d, "z")
f3()
def f4():
print "f4"
c = C(10000)
try:
x, y = c
except ValueError, e:
print e
f4()
def f5():
print "f5"
def f():
1/0
try:
x, f().x, y = (1, 2, 3)
except ZeroDivisionError, e:
print e
try:
print x
except NameError, e:
print e
f()
try:
print y
except NameError, e:
print e
f5()
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment