Commit 5a0f66dd authored by Kevin Modzelewski's avatar Kevin Modzelewski

Merge pull request #729 from kmod/attr_perf

more small perf work
parents 4ba2dfed c78fdcb9
......@@ -1033,9 +1033,9 @@ $(call make_target,_gcc)
$(call make_target,_release_gcc)
nosearch_runpy_% nosearch_pyrun_%: %.py ext_python
$(VERB) PYTHONPATH=test/test_extension/build/lib.linux-x86_64-2.7 zsh -c 'time $(CPYTHON) $<'
$(VERB) PYTHONPATH=test/test_extension/build/lib.linux-x86_64-2.7:$${PYTHONPATH} zsh -c 'time $(CPYTHON) $<'
nosearch_pypyrun_%: %.py ext_python
$(VERB) PYTHONPATH=test/test_extension/build/lib.linux-x86_64-2.7 zsh -c 'time $(PYPY) $<'
$(VERB) PYTHONPATH=test/test_extension/build/lib.linux-x86_64-2.7:$${PYTHONPATH} zsh -c 'time $(PYPY) $<'
$(call make_search,runpy_%)
$(call make_search,pyrun_%)
$(call make_search,pypyrun_%)
......
import os
import sys
sys.path.append(os.path.join(os.path.dirname(__file__), "../integration/django"))
from django.template.base import Variable
for i in xrange(400000):
Variable(u"model.name")
......@@ -5,6 +5,15 @@ def f():
g = getattr
c = C()
c.o = 1
for i in xrange(10000000):
for i in xrange(1000000):
g(c, "o")
g(c, "o")
g(c, "o")
g(c, "o")
g(c, "o")
g(c, "o")
g(c, "o")
g(c, "o")
g(c, "o")
g(c, "o")
f()
......@@ -56,17 +56,15 @@ void ICSlotInfo::clear() {
ic->clear(this);
}
ICSlotRewrite::ICSlotRewrite(ICInfo* ic, const char* debug_name) : ic(ic), debug_name(debug_name) {
buf = (uint8_t*)malloc(ic->getSlotSize());
assembler = new Assembler(buf, ic->getSlotSize());
assembler->nop();
ICSlotRewrite::ICSlotRewrite(ICInfo* ic, const char* debug_name)
: ic(ic), debug_name(debug_name), buf((uint8_t*)malloc(ic->getSlotSize())), assembler(buf, ic->getSlotSize()) {
assembler.nop();
if (VERBOSITY() >= 4)
printf("starting %s icentry\n", debug_name);
}
ICSlotRewrite::~ICSlotRewrite() {
delete assembler;
free(buf);
}
......@@ -109,7 +107,7 @@ void ICSlotRewrite::commit(CommitHook* hook) {
if (!do_commit)
return;
assert(!assembler->hasFailed());
assert(!assembler.hasFailed());
for (int i = 0; i < dependencies.size(); i++) {
ICInvalidator* invalidator = dependencies[i].first;
......
......@@ -21,6 +21,7 @@
#include "llvm/IR/CallingConv.h"
#include "asm_writing/assembler.h"
#include "asm_writing/types.h"
namespace pyston {
......@@ -53,12 +54,13 @@ public:
private:
ICInfo* ic;
assembler::Assembler* assembler;
const char* debug_name;
uint8_t* buf;
std::vector<std::pair<ICInvalidator*, int64_t>> dependencies;
assembler::Assembler assembler;
llvm::SmallVector<std::pair<ICInvalidator*, int64_t>, 4> dependencies;
ICSlotInfo* ic_entry;
......@@ -66,7 +68,7 @@ public:
ICSlotRewrite(ICInfo* ic, const char* debug_name);
~ICSlotRewrite();
assembler::Assembler* getAssembler() { return assembler; }
assembler::Assembler* getAssembler() { return &assembler; }
int getSlotSize();
int getScratchRspOffset();
int getScratchSize();
......
......@@ -185,9 +185,11 @@ void Rewriter::ConstLoader::moveImmediate(uint64_t val, assembler::Register dst_
assembler::Register Rewriter::ConstLoader::findConst(uint64_t val, bool& found_value) {
assert(rewriter->phase_emitting);
auto it = constToVar.find(val);
if (it != constToVar.end()) {
RewriterVar* var = it->second;
for (auto& p : consts) {
if (p.first != val)
continue;
RewriterVar* var = p.second;
for (Location l : var->locations) {
if (l.type == Location::Register) {
found_value = true;
......@@ -216,9 +218,9 @@ assembler::Register Rewriter::ConstLoader::loadConst(uint64_t val, Location othe
assert(rewriter->phase_emitting);
bool found_value = false;
assembler::Register reg = findConst(val, found_value);
assembler::Register /*reg = findConst(val, found_value);
if (found_value)
return reg;
return reg;*/
reg = rewriter->allocReg(Location::any(), otherThan);
if (tryLea(val, reg))
......@@ -711,10 +713,15 @@ void Rewriter::_trap() {
RewriterVar* Rewriter::loadConst(int64_t val, Location dest) {
STAT_TIMER(t0, "us_timer_rewriter", 10);
RewriterVar*& const_loader_var = const_loader.constToVar[val];
if (!const_loader_var) {
const_loader_var = createNewConstantVar(val);
for (auto& p : const_loader.consts) {
if (p.first != val)
continue;
return p.second;
}
RewriterVar* const_loader_var = createNewConstantVar(val);
const_loader.consts.push_back(std::make_pair(val, const_loader_var));
return const_loader_var;
}
......@@ -1099,11 +1106,11 @@ void Rewriter::commit() {
for (int i = 0; i < live_outs.size(); i++) {
live_outs[i]->uses.push_back(actions.size());
}
for (RewriterVar* var : vars) {
for (RewriterVar& var : vars) {
// Add a use for every constant. This helps make constants available for the lea stuff
// But since "spilling" a constant has no cost, it shouldn't add register pressure.
if (var->is_constant) {
var->uses.push_back(actions.size());
if (var.is_constant) {
var.uses.push_back(actions.size());
}
}
......@@ -1176,22 +1183,22 @@ void Rewriter::commit() {
// Make sure that we have been calling bumpUse correctly.
// All uses should have been accounted for, other than the live outs
#ifndef NDEBUG
for (RewriterVar* var : vars) {
for (RewriterVar& var : vars) {
int num_as_live_out = 0;
for (RewriterVar* live_out : live_outs) {
if (live_out == var) {
if (live_out == &var) {
num_as_live_out++;
}
}
assert(var->next_use + num_as_live_out + (var->is_constant ? 1 : 0) == var->uses.size());
assert(var.next_use + num_as_live_out + (var.is_constant ? 1 : 0) == var.uses.size());
}
#endif
assert(live_out_regs.size() == live_outs.size());
for (RewriterVar* var : vars) {
if (var->is_constant) {
var->bumpUse();
for (RewriterVar& var : vars) {
if (var.is_constant) {
var.bumpUse();
}
}
......@@ -1686,9 +1693,8 @@ void Rewriter::removeLocationFromVar(RewriterVar* var, Location l) {
RewriterVar* Rewriter::createNewVar() {
assertPhaseCollecting();
RewriterVar* var = new RewriterVar(this);
vars.push_back(var);
return var;
vars.emplace_back(this);
return &vars.back();
}
RewriterVar* Rewriter::createNewConstantVar(uint64_t val) {
......
......@@ -15,6 +15,7 @@
#ifndef PYSTON_ASMWRITING_REWRITER_H
#define PYSTON_ASMWRITING_REWRITER_H
#include <deque>
#include <map>
#include <memory>
#include <tuple>
......@@ -101,6 +102,8 @@ public:
bool operator!=(const Location rhs) const { return !(*this == rhs); }
bool operator<(const Location& rhs) const { return this->asInt() < rhs.asInt(); }
uint64_t asInt() const { return (int)type + ((uint64_t)_data << 4); }
void dump() const;
......@@ -224,7 +227,7 @@ public:
private:
Rewriter* rewriter;
std::unordered_set<Location> locations;
std::set<Location> locations;
bool isInLocation(Location l);
// uses is a vector of the indices into the Rewriter::actions vector
......@@ -317,7 +320,7 @@ protected:
// Loads the constant into any register or if already in a register just return it
assembler::Register loadConst(uint64_t val, Location otherThan = Location::any());
std::unordered_map<uint64_t, RewriterVar*> constToVar;
std::vector<std::pair<uint64_t, RewriterVar*>> consts;
};
......@@ -326,7 +329,7 @@ protected:
ICSlotInfo* picked_slot;
ConstLoader const_loader;
std::vector<RewriterVar*> vars;
std::deque<RewriterVar> vars;
const Location return_location;
......@@ -346,11 +349,11 @@ protected:
void assertPhaseEmitting() {}
#endif
std::vector<int> live_out_regs;
llvm::SmallVector<int, 8> live_out_regs;
LocMap<RewriterVar*> vars_by_location;
std::vector<RewriterVar*> args;
std::vector<RewriterVar*> live_outs;
llvm::SmallVector<RewriterVar*, 8> args;
llvm::SmallVector<RewriterVar*, 8> live_outs;
Rewriter(std::unique_ptr<ICSlotRewrite> rewrite, int num_args, const std::vector<int>& live_outs);
......@@ -443,15 +446,22 @@ protected:
void assertConsistent() {
#ifndef NDEBUG
for (RewriterVar* var : vars) {
for (Location l : var->locations) {
assert(vars_by_location[l] == var);
for (RewriterVar& var : vars) {
for (Location l : var.locations) {
assert(vars_by_location[l] == &var);
}
}
for (std::pair<Location, RewriterVar*> p : vars_by_location.getAsMap()) {
assert(p.second != NULL);
if (p.second != LOCATION_PLACEHOLDER) {
assert(std::find(vars.begin(), vars.end(), p.second) != vars.end());
bool found = false;
for (auto& v : vars) {
if (&v == p.second) {
found = true;
break;
}
}
assert(found);
assert(p.second->locations.count(p.first) == 1);
}
}
......@@ -471,10 +481,6 @@ public:
if (!finished)
this->abort();
assert(finished);
for (RewriterVar* var : vars) {
delete var;
}
}
Location getReturnDestination();
......
......@@ -19,19 +19,8 @@
namespace pyston {
InternedString InternedStringPool::get(llvm::StringRef arg) {
auto it = interned.find(arg);
BoxedString* s;
if (it != interned.end()) {
s = it->second;
} else {
// HACK: should properly track this liveness:
s = internStringImmortal(arg);
// Note: make sure the key points to the value we just created, not the
// argument string:
interned[s->s()] = s;
}
BoxedString* s = internStringImmortal(arg);
#ifndef NDEBUG
return InternedString(s, this);
......
......@@ -89,12 +89,6 @@ public:
};
class InternedStringPool {
private:
// We probably don't need to pull in llvm::StringRef as the key, but it's better than std::string
// which I assume forces extra allocations.
// (We could define a custom string-pointer container but is it worth it?)
std::unordered_map<llvm::StringRef, BoxedString*> interned;
public:
void gcHandler(gc::GCVisitor* v);
InternedString get(llvm::StringRef s);
......
......@@ -43,6 +43,8 @@ static Box* setOption(Box* option, Box* value) {
else CHECK(REOPT_THRESHOLD_BASELINE);
else CHECK(OSR_THRESHOLD_BASELINE);
else CHECK(SPECULATION_THRESHOLD);
else CHECK(ENABLE_ICS);
else CHECK(ENABLE_ICGETATTRS);
else raiseExcHelper(ValueError, "unknown option name '%s", option_string->data());
return None;
......
......@@ -714,7 +714,7 @@ Box* Box::getattr(BoxedString* attr, GetattrRewriteArgs* rewrite_args) {
HCAttrs* attrs = getHCAttrsPtr();
HiddenClass* hcls = attrs->hcls;
if (hcls->type == HiddenClass::DICT_BACKED) {
if (unlikely(hcls->type == HiddenClass::DICT_BACKED)) {
if (rewrite_args)
assert(!rewrite_args->out_success);
rewrite_args = NULL;
......@@ -728,7 +728,7 @@ Box* Box::getattr(BoxedString* attr, GetattrRewriteArgs* rewrite_args) {
assert(hcls->type == HiddenClass::NORMAL || hcls->type == HiddenClass::SINGLETON);
if (rewrite_args) {
if (unlikely(rewrite_args)) {
if (!rewrite_args->obj_hcls_guarded) {
if (cls->attrs_offset < 0) {
REWRITE_ABORTED("");
......@@ -1001,9 +1001,20 @@ Box* typeLookup(BoxedClass* cls, BoxedString* attr, GetattrRewriteArgs* rewrite_
return NULL;
} else {
assert(attr->interned_state != SSTATE_NOT_INTERNED);
assert(cls->tp_mro);
assert(cls->tp_mro->cls == tuple_cls);
for (auto b : *static_cast<BoxedTuple*>(cls->tp_mro)) {
// object_cls will get checked very often, but it only
// has attributes that start with an underscore.
if (b == object_cls) {
if (attr->data()[0] != '_') {
assert(!b->getattr(attr, NULL));
continue;
}
}
val = b->getattr(attr, NULL);
if (val)
return val;
......@@ -1674,7 +1685,7 @@ Box* getattrInternalGeneric(Box* obj, BoxedString* attr, GetattrRewriteArgs* rew
}
if (!cls_only) {
if (!isSubclass(obj->cls, type_cls)) {
if (!PyType_Check(obj)) {
// Look up the val in the object's dictionary and if you find it, return it.
Box* val;
......
Markdown is supported
0%
or
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment