Commit 9407f64a authored by Kevin Modzelewski's avatar Kevin Modzelewski

Store live_outs as a bitset

We were storing and passing them as std::unordered_map (and sometimes
switching to std::vector).  But the set can only contain the integers
0 through 15, so just represent it as a bitset.
parent 896bc696
...@@ -183,14 +183,14 @@ ICSlotInfo* ICInfo::pickEntryForRewrite(const char* debug_name) { ...@@ -183,14 +183,14 @@ ICSlotInfo* ICInfo::pickEntryForRewrite(const char* debug_name) {
} }
ICInfo::ICInfo(void* start_addr, void* slowpath_rtn_addr, void* continue_addr, StackInfo stack_info, int num_slots, ICInfo::ICInfo(void* start_addr, void* slowpath_rtn_addr, void* continue_addr, StackInfo stack_info, int num_slots,
int slot_size, llvm::CallingConv::ID calling_conv, const std::unordered_set<int>& live_outs, int slot_size, llvm::CallingConv::ID calling_conv, LiveOutSet _live_outs,
assembler::GenericRegister return_register, TypeRecorder* type_recorder) assembler::GenericRegister return_register, TypeRecorder* type_recorder)
: next_slot_to_try(0), : next_slot_to_try(0),
stack_info(stack_info), stack_info(stack_info),
num_slots(num_slots), num_slots(num_slots),
slot_size(slot_size), slot_size(slot_size),
calling_conv(calling_conv), calling_conv(calling_conv),
live_outs(live_outs.begin(), live_outs.end()), live_outs(std::move(_live_outs)),
return_register(return_register), return_register(return_register),
type_recorder(type_recorder), type_recorder(type_recorder),
retry_in(0), retry_in(0),
...@@ -200,15 +200,14 @@ ICInfo::ICInfo(void* start_addr, void* slowpath_rtn_addr, void* continue_addr, S ...@@ -200,15 +200,14 @@ ICInfo::ICInfo(void* start_addr, void* slowpath_rtn_addr, void* continue_addr, S
slowpath_rtn_addr(slowpath_rtn_addr), slowpath_rtn_addr(slowpath_rtn_addr),
continue_addr(continue_addr) { continue_addr(continue_addr) {
for (int i = 0; i < num_slots; i++) { for (int i = 0; i < num_slots; i++) {
slots.push_back(ICSlotInfo(this, i)); slots.emplace_back(this, i);
} }
} }
static llvm::DenseMap<void*, ICInfo*> ics_by_return_addr; static llvm::DenseMap<void*, ICInfo*> ics_by_return_addr;
std::unique_ptr<ICInfo> registerCompiledPatchpoint(uint8_t* start_addr, uint8_t* slowpath_start_addr, std::unique_ptr<ICInfo> registerCompiledPatchpoint(uint8_t* start_addr, uint8_t* slowpath_start_addr,
uint8_t* continue_addr, uint8_t* slowpath_rtn_addr, uint8_t* continue_addr, uint8_t* slowpath_rtn_addr,
const ICSetupInfo* ic, StackInfo stack_info, const ICSetupInfo* ic, StackInfo stack_info, LiveOutSet live_outs) {
std::unordered_set<int> live_outs) {
assert(slowpath_start_addr - start_addr >= ic->num_slots * ic->slot_size); assert(slowpath_start_addr - start_addr >= ic->num_slots * ic->slot_size);
assert(slowpath_rtn_addr > slowpath_start_addr); assert(slowpath_rtn_addr > slowpath_start_addr);
assert(slowpath_rtn_addr <= start_addr + ic->totalSize()); assert(slowpath_rtn_addr <= start_addr + ic->totalSize());
...@@ -221,9 +220,7 @@ std::unique_ptr<ICInfo> registerCompiledPatchpoint(uint8_t* start_addr, uint8_t* ...@@ -221,9 +220,7 @@ std::unique_ptr<ICInfo> registerCompiledPatchpoint(uint8_t* start_addr, uint8_t*
static const int DWARF_RAX = 0; static const int DWARF_RAX = 0;
// It's possible that the return value doesn't get used, in which case // It's possible that the return value doesn't get used, in which case
// we can avoid copying back into RAX at the end // we can avoid copying back into RAX at the end
if (live_outs.count(DWARF_RAX)) { live_outs.clear(DWARF_RAX);
live_outs.erase(DWARF_RAX);
}
// TODO we only need to do this if 0 was in live_outs, since if it wasn't, that indicates // TODO we only need to do this if 0 was in live_outs, since if it wasn't, that indicates
// the return value won't be used and we can optimize based on that. // the return value won't be used and we can optimize based on that.
...@@ -247,7 +244,7 @@ std::unique_ptr<ICInfo> registerCompiledPatchpoint(uint8_t* start_addr, uint8_t* ...@@ -247,7 +244,7 @@ std::unique_ptr<ICInfo> registerCompiledPatchpoint(uint8_t* start_addr, uint8_t*
} }
ICInfo* icinfo = new ICInfo(start_addr, slowpath_rtn_addr, continue_addr, stack_info, ic->num_slots, ic->slot_size, ICInfo* icinfo = new ICInfo(start_addr, slowpath_rtn_addr, continue_addr, stack_info, ic->num_slots, ic->slot_size,
ic->getCallingConvention(), live_outs, return_register, ic->type_recorder); ic->getCallingConvention(), std::move(live_outs), return_register, ic->type_recorder);
ics_by_return_addr[slowpath_rtn_addr] = icinfo; ics_by_return_addr[slowpath_rtn_addr] = icinfo;
......
...@@ -23,6 +23,7 @@ ...@@ -23,6 +23,7 @@
#include "asm_writing/assembler.h" #include "asm_writing/assembler.h"
#include "asm_writing/types.h" #include "asm_writing/types.h"
#include "core/util.h"
namespace pyston { namespace pyston {
...@@ -91,6 +92,8 @@ public: ...@@ -91,6 +92,8 @@ public:
friend class ICInfo; friend class ICInfo;
}; };
typedef BitSet<16> LiveOutSet;
class ICInfo { class ICInfo {
private: private:
std::vector<ICSlotInfo> slots; std::vector<ICSlotInfo> slots;
...@@ -105,7 +108,7 @@ private: ...@@ -105,7 +108,7 @@ private:
const int num_slots; const int num_slots;
const int slot_size; const int slot_size;
const llvm::CallingConv::ID calling_conv; const llvm::CallingConv::ID calling_conv;
const std::vector<int> live_outs; LiveOutSet live_outs;
const assembler::GenericRegister return_register; const assembler::GenericRegister return_register;
TypeRecorder* const type_recorder; TypeRecorder* const type_recorder;
int retry_in, retry_backoff; int retry_in, retry_backoff;
...@@ -116,14 +119,14 @@ private: ...@@ -116,14 +119,14 @@ private:
public: public:
ICInfo(void* start_addr, void* slowpath_rtn_addr, void* continue_addr, StackInfo stack_info, int num_slots, ICInfo(void* start_addr, void* slowpath_rtn_addr, void* continue_addr, StackInfo stack_info, int num_slots,
int slot_size, llvm::CallingConv::ID calling_conv, const std::unordered_set<int>& live_outs, int slot_size, llvm::CallingConv::ID calling_conv, LiveOutSet live_outs,
assembler::GenericRegister return_register, TypeRecorder* type_recorder); assembler::GenericRegister return_register, TypeRecorder* type_recorder);
void* const start_addr, *const slowpath_rtn_addr, *const continue_addr; void* const start_addr, *const slowpath_rtn_addr, *const continue_addr;
int getSlotSize() { return slot_size; } int getSlotSize() { return slot_size; }
int getNumSlots() { return num_slots; } int getNumSlots() { return num_slots; }
llvm::CallingConv::ID getCallingConvention() { return calling_conv; } llvm::CallingConv::ID getCallingConvention() { return calling_conv; }
const std::vector<int>& getLiveOuts() { return live_outs; } const LiveOutSet& getLiveOuts() { return live_outs; }
std::unique_ptr<ICSlotRewrite> startRewrite(const char* debug_name); std::unique_ptr<ICSlotRewrite> startRewrite(const char* debug_name);
void clear(ICSlotInfo* entry); void clear(ICSlotInfo* entry);
...@@ -138,8 +141,7 @@ class ICSetupInfo; ...@@ -138,8 +141,7 @@ class ICSetupInfo;
struct CompiledFunction; struct CompiledFunction;
std::unique_ptr<ICInfo> registerCompiledPatchpoint(uint8_t* start_addr, uint8_t* slowpath_start_addr, std::unique_ptr<ICInfo> registerCompiledPatchpoint(uint8_t* start_addr, uint8_t* slowpath_start_addr,
uint8_t* continue_addr, uint8_t* slowpath_rtn_addr, uint8_t* continue_addr, uint8_t* slowpath_rtn_addr,
const ICSetupInfo*, StackInfo stack_info, const ICSetupInfo*, StackInfo stack_info, LiveOutSet live_outs);
std::unordered_set<int> live_outs);
void deregisterCompiledPatchpoint(ICInfo* ic); void deregisterCompiledPatchpoint(ICInfo* ic);
ICInfo* getICInfo(void* rtn_addr); ICInfo* getICInfo(void* rtn_addr);
......
...@@ -1786,7 +1786,7 @@ TypeRecorder* Rewriter::getTypeRecorder() { ...@@ -1786,7 +1786,7 @@ TypeRecorder* Rewriter::getTypeRecorder() {
return rewrite->getTypeRecorder(); return rewrite->getTypeRecorder();
} }
Rewriter::Rewriter(std::unique_ptr<ICSlotRewrite> rewrite, int num_args, const std::vector<int>& live_outs) Rewriter::Rewriter(std::unique_ptr<ICSlotRewrite> rewrite, int num_args, const LiveOutSet& live_outs)
: rewrite(std::move(rewrite)), : rewrite(std::move(rewrite)),
assembler(this->rewrite->getAssembler()), assembler(this->rewrite->getAssembler()),
picked_slot(NULL), picked_slot(NULL),
...@@ -1837,6 +1837,11 @@ Rewriter::Rewriter(std::unique_ptr<ICSlotRewrite> rewrite, int num_args, const s ...@@ -1837,6 +1837,11 @@ Rewriter::Rewriter(std::unique_ptr<ICSlotRewrite> rewrite, int num_args, const s
var->locations.push_back(l); var->locations.push_back(l);
} }
// Make sure there weren't duplicates in the live_outs list.
// Probably not a big deal if there were, but we shouldn't be generating those.
assert(std::find(this->live_out_regs.begin(), this->live_out_regs.end(), dwarf_regnum)
== this->live_out_regs.end());
this->live_outs.push_back(var); this->live_outs.push_back(var);
this->live_out_regs.push_back(dwarf_regnum); this->live_out_regs.push_back(dwarf_regnum);
} }
...@@ -2034,8 +2039,8 @@ void setSlowpathFunc(uint8_t* pp_addr, void* func) { ...@@ -2034,8 +2039,8 @@ void setSlowpathFunc(uint8_t* pp_addr, void* func) {
} }
PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t* start_addr, uint8_t* end_addr, PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t* start_addr, uint8_t* end_addr,
int scratch_offset, int scratch_size, int scratch_offset, int scratch_size, LiveOutSet live_outs,
const std::unordered_set<int>& live_outs, SpillMap& remapped) { SpillMap& remapped) {
assert(start_addr < end_addr); assert(start_addr < end_addr);
int est_slowpath_size = INITIAL_CALL_SIZE; int est_slowpath_size = INITIAL_CALL_SIZE;
...@@ -2043,8 +2048,6 @@ PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t* ...@@ -2043,8 +2048,6 @@ PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t*
std::vector<assembler::GenericRegister> regs_to_spill; std::vector<assembler::GenericRegister> regs_to_spill;
std::vector<assembler::Register> regs_to_reload; std::vector<assembler::Register> regs_to_reload;
std::unordered_set<int> live_outs_for_slot;
for (int dwarf_regnum : live_outs) { for (int dwarf_regnum : live_outs) {
assembler::GenericRegister ru = assembler::GenericRegister::fromDwarf(dwarf_regnum); assembler::GenericRegister ru = assembler::GenericRegister::fromDwarf(dwarf_regnum);
...@@ -2052,7 +2055,7 @@ PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t* ...@@ -2052,7 +2055,7 @@ PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t*
if (ru.type == assembler::GenericRegister::GP) { if (ru.type == assembler::GenericRegister::GP) {
if (ru.gp == assembler::RSP || ru.gp.isCalleeSave()) { if (ru.gp == assembler::RSP || ru.gp.isCalleeSave()) {
live_outs_for_slot.insert(dwarf_regnum); live_outs.set(dwarf_regnum);
continue; continue;
} }
} }
...@@ -2068,7 +2071,7 @@ PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t* ...@@ -2068,7 +2071,7 @@ PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t*
continue; continue;
} }
live_outs_for_slot.insert(dwarf_regnum); live_outs.set(dwarf_regnum);
regs_to_spill.push_back(ru); regs_to_spill.push_back(ru);
...@@ -2125,7 +2128,6 @@ PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t* ...@@ -2125,7 +2128,6 @@ PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t*
assem.fillWithNops(); assem.fillWithNops();
assert(!assem.hasFailed()); assert(!assem.hasFailed());
return PatchpointInitializationInfo(slowpath_start, slowpath_rtn_addr, continue_addr, return PatchpointInitializationInfo(slowpath_start, slowpath_rtn_addr, continue_addr, std::move(live_outs));
std::move(live_outs_for_slot));
} }
} }
...@@ -355,7 +355,7 @@ protected: ...@@ -355,7 +355,7 @@ protected:
llvm::SmallVector<RewriterVar*, 8> args; llvm::SmallVector<RewriterVar*, 8> args;
llvm::SmallVector<RewriterVar*, 8> live_outs; llvm::SmallVector<RewriterVar*, 8> live_outs;
Rewriter(std::unique_ptr<ICSlotRewrite> rewrite, int num_args, const std::vector<int>& live_outs); Rewriter(std::unique_ptr<ICSlotRewrite> rewrite, int num_args, const LiveOutSet& live_outs);
llvm::SmallVector<RewriterAction, 32> actions; llvm::SmallVector<RewriterAction, 32> actions;
void addAction(std::function<void()> action, llvm::ArrayRef<RewriterVar*> vars, ActionType type) { void addAction(std::function<void()> action, llvm::ArrayRef<RewriterVar*> vars, ActionType type) {
...@@ -555,10 +555,10 @@ struct PatchpointInitializationInfo { ...@@ -555,10 +555,10 @@ struct PatchpointInitializationInfo {
uint8_t* slowpath_start; uint8_t* slowpath_start;
uint8_t* slowpath_rtn_addr; uint8_t* slowpath_rtn_addr;
uint8_t* continue_addr; uint8_t* continue_addr;
std::unordered_set<int> live_outs; LiveOutSet live_outs;
PatchpointInitializationInfo(uint8_t* slowpath_start, uint8_t* slowpath_rtn_addr, uint8_t* continue_addr, PatchpointInitializationInfo(uint8_t* slowpath_start, uint8_t* slowpath_rtn_addr, uint8_t* continue_addr,
std::unordered_set<int>&& live_outs) LiveOutSet live_outs)
: slowpath_start(slowpath_start), : slowpath_start(slowpath_start),
slowpath_rtn_addr(slowpath_rtn_addr), slowpath_rtn_addr(slowpath_rtn_addr),
continue_addr(continue_addr), continue_addr(continue_addr),
...@@ -566,8 +566,8 @@ struct PatchpointInitializationInfo { ...@@ -566,8 +566,8 @@ struct PatchpointInitializationInfo {
}; };
PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t* start_addr, uint8_t* end_addr, PatchpointInitializationInfo initializePatchpoint3(void* slowpath_func, uint8_t* start_addr, uint8_t* end_addr,
int scratch_offset, int scratch_size, int scratch_offset, int scratch_size, LiveOutSet live_outs,
const std::unordered_set<int>& live_outs, SpillMap& remapped); SpillMap& remapped);
template <> inline RewriterVar* RewriterVar::getAttrCast<bool, bool>(int offset, Location loc) { template <> inline RewriterVar* RewriterVar::getAttrCast<bool, bool>(int offset, Location loc) {
return getAttr(offset, loc, assembler::MovType::ZBL); return getAttr(offset, loc, assembler::MovType::ZBL);
......
...@@ -102,7 +102,7 @@ std::unique_ptr<JitFragmentWriter> JitCodeBlock::newFragment(CFGBlock* block, in ...@@ -102,7 +102,7 @@ std::unique_ptr<JitFragmentWriter> JitCodeBlock::newFragment(CFGBlock* block, in
int scratch_offset = num_stack_args * 8; int scratch_offset = num_stack_args * 8;
StackInfo stack_info(scratch_size, scratch_offset); StackInfo stack_info(scratch_size, scratch_offset);
std::unordered_set<int> live_outs; LiveOutSet live_outs;
void* fragment_start = a.curInstPointer() - patch_jump_offset; void* fragment_start = a.curInstPointer() - patch_jump_offset;
long fragment_offset = a.bytesWritten() - patch_jump_offset; long fragment_offset = a.bytesWritten() - patch_jump_offset;
...@@ -612,13 +612,13 @@ int JitFragmentWriter::finishCompilation() { ...@@ -612,13 +612,13 @@ int JitFragmentWriter::finishCompilation() {
uint8_t* end_addr = pp_info.end_addr; uint8_t* end_addr = pp_info.end_addr;
PatchpointInitializationInfo initialization_info PatchpointInitializationInfo initialization_info
= initializePatchpoint3(pp_info.func_addr, start_addr, end_addr, 0 /* scratch_offset */, = initializePatchpoint3(pp_info.func_addr, start_addr, end_addr, 0 /* scratch_offset */,
0 /* scratch_size */, std::unordered_set<int>(), _spill_map); 0 /* scratch_size */, LiveOutSet(), _spill_map);
uint8_t* slowpath_start = initialization_info.slowpath_start; uint8_t* slowpath_start = initialization_info.slowpath_start;
uint8_t* slowpath_rtn_addr = initialization_info.slowpath_rtn_addr; uint8_t* slowpath_rtn_addr = initialization_info.slowpath_rtn_addr;
std::unique_ptr<ICInfo> pp = registerCompiledPatchpoint( std::unique_ptr<ICInfo> pp
start_addr, slowpath_start, initialization_info.continue_addr, slowpath_rtn_addr, pp_info.ic.get(), = registerCompiledPatchpoint(start_addr, slowpath_start, initialization_info.continue_addr,
pp_info.stack_info, std::unordered_set<int>()); slowpath_rtn_addr, pp_info.ic.get(), pp_info.stack_info, LiveOutSet());
pp.release(); pp.release();
} }
......
...@@ -247,7 +247,7 @@ ScopeInfo* IRGenState::getScopeInfoForNode(AST* node) { ...@@ -247,7 +247,7 @@ ScopeInfo* IRGenState::getScopeInfoForNode(AST* node) {
class IREmitterImpl : public IREmitter { class IREmitterImpl : public IREmitter {
private: private:
IRGenState* irstate; IRGenState* irstate;
IRBuilder* builder; std::unique_ptr<IRBuilder> builder;
llvm::BasicBlock*& curblock; llvm::BasicBlock*& curblock;
IRGenerator* irgenerator; IRGenerator* irgenerator;
...@@ -348,6 +348,9 @@ private: ...@@ -348,6 +348,9 @@ private:
public: public:
explicit IREmitterImpl(IRGenState* irstate, llvm::BasicBlock*& curblock, IRGenerator* irgenerator) explicit IREmitterImpl(IRGenState* irstate, llvm::BasicBlock*& curblock, IRGenerator* irgenerator)
: irstate(irstate), builder(new IRBuilder(g.context)), curblock(curblock), irgenerator(irgenerator) { : irstate(irstate), builder(new IRBuilder(g.context)), curblock(curblock), irgenerator(irgenerator) {
// Perf note: it seems to be more efficient to separately allocate the "builder" member,
// even though we could allocate it in-line; maybe it's infrequently used enough that it's better
// to not have it take up cache space.
RELEASE_ASSERT(irstate->getSourceInfo()->scoping->areGlobalsFromModule(), RELEASE_ASSERT(irstate->getSourceInfo()->scoping->areGlobalsFromModule(),
"jit doesn't support custom globals yet"); "jit doesn't support custom globals yet");
...@@ -356,7 +359,7 @@ public: ...@@ -356,7 +359,7 @@ public:
builder->SetInsertPoint(curblock); builder->SetInsertPoint(curblock);
} }
IRBuilder* getBuilder() override { return builder; } IRBuilder* getBuilder() override { return &*builder; }
GCBuilder* getGC() override { return irstate->getGC(); } GCBuilder* getGC() override { return irstate->getGC(); }
...@@ -557,8 +560,6 @@ public: ...@@ -557,8 +560,6 @@ public:
types(types), types(types),
state(RUNNING) {} state(RUNNING) {}
~IRGeneratorImpl() { delete emitter.getBuilder(); }
private: private:
OpInfo getOpInfoForNode(AST* ast, const UnwindInfo& unw_info) { OpInfo getOpInfoForNode(AST* ast, const UnwindInfo& unw_info) {
assert(ast); assert(ast);
......
...@@ -117,14 +117,14 @@ static int extractScratchOffset(PatchpointInfo* pp, StackMap::Record* r) { ...@@ -117,14 +117,14 @@ static int extractScratchOffset(PatchpointInfo* pp, StackMap::Record* r) {
return l.offset; return l.offset;
} }
static std::unordered_set<int> extractLiveOuts(StackMap::Record* r, llvm::CallingConv::ID cc) { static LiveOutSet extractLiveOuts(StackMap::Record* r, llvm::CallingConv::ID cc) {
std::unordered_set<int> live_outs; LiveOutSet live_outs;
// Using the C calling convention, there shouldn't be any non-callee-save registers in here, // Using the C calling convention, there shouldn't be any non-callee-save registers in here,
// but LLVM is conservative and will add some. So with the C cc, ignored the specified live outs // but LLVM is conservative and will add some. So with the C cc, ignored the specified live outs
if (cc != llvm::CallingConv::C) { if (cc != llvm::CallingConv::C) {
for (const auto& live_out : r->live_outs) { for (const auto& live_out : r->live_outs) {
live_outs.insert(live_out.regnum); live_outs.set(live_out.regnum);
} }
} }
...@@ -133,11 +133,11 @@ static std::unordered_set<int> extractLiveOuts(StackMap::Record* r, llvm::Callin ...@@ -133,11 +133,11 @@ static std::unordered_set<int> extractLiveOuts(StackMap::Record* r, llvm::Callin
// sense to track them as live_outs. // sense to track them as live_outs.
// Unfortunately this means we need to be conservative about it unless // Unfortunately this means we need to be conservative about it unless
// we can change llvm's behavior. // we can change llvm's behavior.
live_outs.insert(3); live_outs.set(3);
live_outs.insert(12); live_outs.set(12);
live_outs.insert(13); live_outs.set(13);
live_outs.insert(14); live_outs.set(14);
live_outs.insert(15); live_outs.set(15);
return live_outs; return live_outs;
} }
...@@ -212,12 +212,12 @@ void processStackmap(CompiledFunction* cf, StackMap* stackmap) { ...@@ -212,12 +212,12 @@ void processStackmap(CompiledFunction* cf, StackMap* stackmap) {
if (ic == NULL) { if (ic == NULL) {
// We have to be using the C calling convention here, so we don't need to check the live outs // We have to be using the C calling convention here, so we don't need to check the live outs
// or save them across the call. // or save them across the call.
initializePatchpoint3(slowpath_func, start_addr, end_addr, scratch_rbp_offset, scratch_size, initializePatchpoint3(slowpath_func, start_addr, end_addr, scratch_rbp_offset, scratch_size, LiveOutSet(),
std::unordered_set<int>(), frame_remapped); frame_remapped);
continue; continue;
} }
std::unordered_set<int> live_outs(extractLiveOuts(r, ic->getCallingConvention())); LiveOutSet live_outs(extractLiveOuts(r, ic->getCallingConvention()));
if (ic->hasReturnValue()) { if (ic->hasReturnValue()) {
assert(ic->getCallingConvention() == llvm::CallingConv::C assert(ic->getCallingConvention() == llvm::CallingConv::C
...@@ -226,14 +226,12 @@ void processStackmap(CompiledFunction* cf, StackMap* stackmap) { ...@@ -226,14 +226,12 @@ void processStackmap(CompiledFunction* cf, StackMap* stackmap) {
static const int DWARF_RAX = 0; static const int DWARF_RAX = 0;
// It's possible that the return value doesn't get used, in which case // It's possible that the return value doesn't get used, in which case
// we can avoid copying back into RAX at the end // we can avoid copying back into RAX at the end
if (live_outs.count(DWARF_RAX)) { live_outs.clear(DWARF_RAX);
live_outs.erase(DWARF_RAX);
}
} }
auto initialization_info = initializePatchpoint3(slowpath_func, start_addr, end_addr, scratch_rbp_offset, auto initialization_info = initializePatchpoint3(slowpath_func, start_addr, end_addr, scratch_rbp_offset,
scratch_size, live_outs, frame_remapped); scratch_size, std::move(live_outs), frame_remapped);
ASSERT(initialization_info.slowpath_start - start_addr >= ic->num_slots * ic->slot_size, ASSERT(initialization_info.slowpath_start - start_addr >= ic->num_slots * ic->slot_size,
"Used more slowpath space than expected; change ICSetupInfo::totalSize()?"); "Used more slowpath space than expected; change ICSetupInfo::totalSize()?");
......
...@@ -128,6 +128,62 @@ template <class T1, class T2> bool sameKeyset(T1* lhs, T2* rhs) { ...@@ -128,6 +128,62 @@ template <class T1, class T2> bool sameKeyset(T1* lhs, T2* rhs) {
} }
return good; return good;
} }
// A simple constant-width bitset.
template <int N> struct BitSet {
uint16_t bits = 0;
static_assert(N <= 8 * sizeof(bits), "");
struct iterator {
const BitSet& set;
int cur;
iterator(const BitSet& set, int cur) : set(set), cur(cur) {}
int operator*() {
assert(cur >= 0 && cur < N);
return cur;
}
bool operator==(const iterator& rhs) { return cur == rhs.cur; }
bool operator!=(const iterator& rhs) { return !(*this == rhs); }
iterator& operator++() {
// TODO: this function (and begin()) could be optimized using __builtin_ctz
assert(cur >= 0 && cur < N);
uint16_t tmp = set.bits;
tmp >>= cur + 1;
cur++;
while (cur < N) {
if (tmp & 1)
return *this;
cur++;
tmp >>= 1;
}
assert(cur == N);
return *this;
}
};
void set(int idx) {
assert(idx >= 0 && idx < N);
bits |= (1 << idx);
}
void clear(int idx) {
assert(idx >= 0 && idx < N);
bits &= ~(1 << idx);
}
iterator begin() const {
uint16_t tmp = bits;
for (int i = 0; i < N; i++) {
if (tmp & 1)
return iterator(*this, i);
}
return iterator(*this, N);
}
iterator end() const { return iterator(*this, N); }
};
} }
#endif #endif
...@@ -273,9 +273,8 @@ RuntimeIC::RuntimeIC(void* func_addr, int num_slots, int slot_size) : eh_frame(R ...@@ -273,9 +273,8 @@ RuntimeIC::RuntimeIC(void* func_addr, int num_slots, int slot_size) : eh_frame(R
SpillMap _spill_map; SpillMap _spill_map;
PatchpointInitializationInfo initialization_info PatchpointInitializationInfo initialization_info = initializePatchpoint3(
= initializePatchpoint3(func_addr, pp_start, pp_end, 0 /* scratch_offset */, 0 /* scratch_size */, func_addr, pp_start, pp_end, 0 /* scratch_offset */, 0 /* scratch_size */, LiveOutSet(), _spill_map);
std::unordered_set<int>(), _spill_map);
assert(_spill_map.size() == 0); assert(_spill_map.size() == 0);
assert(initialization_info.slowpath_start == pp_start + patchable_size); assert(initialization_info.slowpath_start == pp_start + patchable_size);
assert(initialization_info.slowpath_rtn_addr == pp_end); assert(initialization_info.slowpath_rtn_addr == pp_end);
...@@ -283,7 +282,7 @@ RuntimeIC::RuntimeIC(void* func_addr, int num_slots, int slot_size) : eh_frame(R ...@@ -283,7 +282,7 @@ RuntimeIC::RuntimeIC(void* func_addr, int num_slots, int slot_size) : eh_frame(R
StackInfo stack_info(SCRATCH_BYTES, 0); StackInfo stack_info(SCRATCH_BYTES, 0);
icinfo = registerCompiledPatchpoint(pp_start, pp_start + patchable_size, pp_end, pp_end, setup_info.get(), icinfo = registerCompiledPatchpoint(pp_start, pp_start + patchable_size, pp_end, pp_end, setup_info.get(),
stack_info, std::unordered_set<int>()); stack_info, LiveOutSet());
assembler::Assembler prologue_assem((uint8_t*)addr, PROLOGUE_SIZE); assembler::Assembler prologue_assem((uint8_t*)addr, PROLOGUE_SIZE);
#if RUNTIMEICS_OMIT_FRAME_PTR #if RUNTIMEICS_OMIT_FRAME_PTR
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment