/* Copyright (c) 2008-2009, Avian Contributors

   Permission to use, copy, modify, and/or distribute this software
   for any purpose with or without fee is hereby granted, provided
   that the above copyright notice and this permission notice appear
   in all copies.

   There is NO WARRANTY for this software.  See license.txt for
   details. */

#include "compiler.h"
#include "assembler.h"

using namespace vm;

namespace {

namespace local {

// Compile-time diagnostic switches.  The ones used in this part of the
// file (DebugResources, DebugReads, DebugSites, DebugBuddies) each guard
// fprintf(stderr, ...) tracing.
// NOTE(review): DebugAppend, DebugCompile, DebugReads and DebugSites are
// enabled here, so the tracing they guard is emitted on every run -
// confirm that this is intended and not left over from a debugging
// session.
const bool DebugAppend = true;
const bool DebugCompile = true;
const bool DebugResources = false;
const bool DebugFrame = false;
const bool DebugControl = false;
const bool DebugReads = true;
const bool DebugSites = true;
const bool DebugMoves = false;
const bool DebugBuddies = false;

// Special SiteMask::frameIndex values: AnyFrameIndex is the wildcard used
// by a default-constructed SiteMask; NoFrameIndex means "no frame slot"
// and is also the initial value of Value::home.
const int AnyFrameIndex = -2;
const int NoFrameIndex = -1;

const unsigned StealRegisterReserveCount = 2;
const unsigned ResolveRegisterReserveCount = 2;

class Context;
class Value;
class Stack;
class Site;
class ConstantSite;
class AddressSite;
class RegisterSite;
class MemorySite;
class Event;
class PushEvent;
class Read;
class MultiRead;
class StubRead;
class Block;
class Snapshot;

void NO_RETURN abort(Context*);

// Forward declarations of the helpers that apply a unary, binary or
// ternary operation to operands described by (size, low site, high site)
// triples.
void
apply(Context* c, UnaryOperation op,
      unsigned s1Size, Site* s1Low, Site* s1High);

void
apply(Context* c, BinaryOperation op,
      unsigned s1Size, Site* s1Low, Site* s1High,
      unsigned s2Size, Site* s2Low, Site* s2High);

void
apply(Context* c, TernaryOperation op,
      unsigned s1Size, Site* s1Low, Site* s1High,
      unsigned s2Size, Site* s2Low, Site* s2High,
      unsigned s3Size, Site* s3Low, Site* s3High);

enum ConstantCompare {
  CompareNone,
  CompareLess,
  CompareGreater,
  CompareEqual
};

// Node of a singly linked list of untyped pointers.
class Cell {
 public:
  Cell(Cell* next, void* value): next(next), value(value) { }

  Cell* next;
  void* value;
};

// One local-variable slot; holds the value currently stored there.
class Local {
 public:
  Value* value;
};

// Describes which sites are acceptable for a value: typeMask holds
// (1 << OperandType) bits, registerMask holds one bit per register, and
// frameIndex is a frame slot index, AnyFrameIndex or NoFrameIndex.
class SiteMask {
 public:
  // The default mask accepts every operand type, register and frame slot.
  SiteMask(): typeMask(~0), registerMask(~0), frameIndex(AnyFrameIndex) { }

  SiteMask(uint8_t typeMask, uint32_t registerMask, int frameIndex):
    typeMask(typeMask), registerMask(registerMask), frameIndex(frameIndex)
  { }
uint8_t typeMask; uint32_t registerMask; int frameIndex; }; class Site { public: Site(): next(0) { } virtual Site* readTarget(Context*, Read*) { return this; } virtual unsigned toString(Context*, char*, unsigned) = 0; virtual unsigned copyCost(Context*, Site*) = 0; virtual bool match(Context*, const SiteMask&) = 0; virtual bool loneMatch(Context*, const SiteMask&) = 0; virtual bool matchNext(Context*, Site*, unsigned) = 0; virtual void acquire(Context*, Value*) { } virtual void release(Context*, Value*) { } virtual void freeze(Context*, Value*) { } virtual void thaw(Context*, Value*) { } virtual bool frozen(Context*) { return false; } virtual OperandType type(Context*) = 0; virtual void asAssemblerOperand(Context*, Site*, Assembler::Operand*) = 0; virtual Site* copy(Context*) = 0; virtual Site* copyLow(Context*) = 0; virtual Site* copyHigh(Context*) = 0; virtual Site* makeNext(Context*, unsigned) = 0; virtual unsigned registerSize(Context*) { return BytesPerWord; } virtual unsigned registerMask(Context*) { return 0; } Site* next; }; class Stack { public: Stack(unsigned index, Value* value, Stack* next): index(index), value(value), next(next) { } unsigned index; Value* value; Stack* next; }; class ForkElement { public: Value* value; MultiRead* read; bool local; }; class ForkState: public Compiler::State { public: ForkState(Stack* stack, Local* locals, Cell* saved, Event* predecessor, unsigned logicalIp): stack(stack), locals(locals), saved(saved), predecessor(predecessor), logicalIp(logicalIp), readCount(0) { } Stack* stack; Local* locals; Cell* saved; Event* predecessor; unsigned logicalIp; unsigned readCount; ForkElement elements[0]; }; class MySubroutine: public Compiler::Subroutine { public: MySubroutine(): forkState(0) { } ForkState* forkState; }; class LogicalInstruction { public: LogicalInstruction(int index, Stack* stack, Local* locals): firstEvent(0), lastEvent(0), immediatePredecessor(0), stack(stack), locals(locals), machineOffset(0), subroutine(0), 
index(index) { } Event* firstEvent; Event* lastEvent; LogicalInstruction* immediatePredecessor; Stack* stack; Local* locals; Promise* machineOffset; MySubroutine* subroutine; int index; }; class Resource { public: Resource(bool reserved = false): value(0), site(0), freezeCount(0), referenceCount(0), reserved(reserved) { } virtual void freeze(Context*, Value*) = 0; virtual void thaw(Context*, Value*) = 0; virtual unsigned toString(Context*, char*, unsigned) = 0; Value* value; Site* site; uint8_t freezeCount; uint8_t referenceCount; bool reserved; }; class RegisterResource: public Resource { public: RegisterResource(bool reserved): Resource(reserved) { } virtual void freeze(Context*, Value*); virtual void thaw(Context*, Value*); virtual unsigned toString(Context* c, char* buffer, unsigned bufferSize) { return vm::snprintf(buffer, bufferSize, "register %d", index(c)); } virtual unsigned index(Context*); }; class FrameResource: public Resource { public: virtual void freeze(Context*, Value*); virtual void thaw(Context*, Value*); virtual unsigned toString(Context* c, char* buffer, unsigned bufferSize) { return vm::snprintf(buffer, bufferSize, "frame %d", index(c)); } virtual unsigned index(Context*); }; class ConstantPoolNode { public: ConstantPoolNode(Promise* promise): promise(promise), next(0) { } Promise* promise; ConstantPoolNode* next; }; class Read { public: Read(): value(0), event(0), eventNext(0) { } virtual bool intersect(SiteMask* mask, unsigned depth = 0) = 0; virtual void maybeIntersectWithHighSource(Context* c) { abort(c); } virtual Value* successor() = 0; virtual bool valid() = 0; virtual void append(Context* c, Read* r) = 0; virtual Read* next(Context* c) = 0; Value* value; Event* event; Read* eventNext; }; int intersectFrameIndexes(int a, int b) { if (a == NoFrameIndex or b == NoFrameIndex) return NoFrameIndex; if (a == AnyFrameIndex) return b; if (b == AnyFrameIndex) return a; if (a == b) return a; return NoFrameIndex; } SiteMask intersect(const 
SiteMask& a, const SiteMask& b) { return SiteMask(a.typeMask & b.typeMask, a.registerMask & b.registerMask, intersectFrameIndexes(a.frameIndex, b.frameIndex)); } class Value: public Compiler::Operand { public: Value(Site* site, Site* target, ValueType type): reads(0), lastRead(0), sites(site), source(0), target(target), buddy(this), next(this), home(NoFrameIndex), type(type), index(0) { } Read* reads; Read* lastRead; Site* sites; Site* source; Site* target; Value* buddy; Value* next; int8_t home; ValueType type; uint8_t index; }; uint32_t registerMask(Assembler::Architecture* arch) { return arch->generalRegisterMask() | arch->floatRegisterMask(); } unsigned maskStart(uint32_t mask) { for (int i = 0; i <= 31; ++i) { if (mask & (1 << i)) return i; } return 32; } unsigned maskLimit(uint32_t mask) { for (int i = 31; i >= 0; --i) { if (mask & (1 << i)) return i + 1; } return 0; } class Context { public: Context(System* system, Assembler* assembler, Zone* zone, Compiler::Client* client): system(system), assembler(assembler), arch(assembler->arch()), zone(zone), client(client), stack(0), locals(0), saved(0), predecessor(0), logicalCode(0), registerStart(maskStart(registerMask(arch))), registerLimit(maskLimit(registerMask(arch))), generalRegisterStart(maskStart(arch->generalRegisterMask())), generalRegisterLimit(maskLimit(arch->generalRegisterMask())), floatRegisterStart(maskStart(arch->floatRegisterMask())), floatRegisterLimit(maskLimit(arch->floatRegisterMask())), registerResources (static_cast (zone->allocate(sizeof(RegisterResource) * registerLimit))), frameResources(0), firstConstant(0), lastConstant(0), machineCode(0), firstEvent(0), lastEvent(0), forkState(0), subroutine(0), logicalIp(-1), constantCount(0), logicalCodeLength(0), parameterFootprint(0), localFootprint(0), machineCodeSize(0), alignedFrameSize(0), availableGeneralRegisterCount(generalRegisterLimit - generalRegisterStart), constantCompare(CompareNone) { for (unsigned i = generalRegisterStart; i < 
generalRegisterLimit; ++i) { new (registerResources + i) RegisterResource(arch->reserved(i)); if (registerResources[i].reserved) { -- availableGeneralRegisterCount; } } for (unsigned i = floatRegisterStart; i < floatRegisterLimit; ++i) { new (registerResources + i) RegisterResource(arch->reserved(i)); } } System* system; Assembler* assembler; Assembler::Architecture* arch; Zone* zone; Compiler::Client* client; Stack* stack; Local* locals; Cell* saved; Event* predecessor; LogicalInstruction** logicalCode; uint8_t registerStart; uint8_t registerLimit; uint8_t generalRegisterStart; uint8_t generalRegisterLimit; uint8_t floatRegisterStart; uint8_t floatRegisterLimit; RegisterResource* registerResources; FrameResource* frameResources; ConstantPoolNode* firstConstant; ConstantPoolNode* lastConstant; uint8_t* machineCode; Event* firstEvent; Event* lastEvent; ForkState* forkState; MySubroutine* subroutine; int logicalIp; unsigned constantCount; unsigned logicalCodeLength; unsigned parameterFootprint; unsigned localFootprint; unsigned machineCodeSize; unsigned alignedFrameSize; unsigned availableGeneralRegisterCount; ConstantCompare constantCompare; }; unsigned RegisterResource::index(Context* c) { return this - c->registerResources; } unsigned FrameResource::index(Context* c) { return this - c->frameResources; } class PoolPromise: public Promise { public: PoolPromise(Context* c, int key): c(c), key(key) { } virtual int64_t value() { if (resolved()) { return reinterpret_cast (c->machineCode + pad(c->machineCodeSize) + (key * BytesPerWord)); } abort(c); } virtual bool resolved() { return c->machineCode != 0; } Context* c; int key; }; class CodePromise: public Promise { public: CodePromise(Context* c, CodePromise* next): c(c), offset(0), next(next) { } CodePromise(Context* c, Promise* offset): c(c), offset(offset), next(0) { } virtual int64_t value() { if (resolved()) { return reinterpret_cast(c->machineCode + offset->value()); } abort(c); } virtual bool resolved() { return 
c->machineCode != 0 and offset and offset->resolved(); } Context* c; Promise* offset; CodePromise* next; }; unsigned machineOffset(Context* c, int logicalIp) { return c->logicalCode[logicalIp]->machineOffset->value(); } class IpPromise: public Promise { public: IpPromise(Context* c, int logicalIp): c(c), logicalIp(logicalIp) { } virtual int64_t value() { if (resolved()) { return reinterpret_cast (c->machineCode + machineOffset(c, logicalIp)); } abort(c); } virtual bool resolved() { return c->machineCode != 0; } Context* c; int logicalIp; }; inline void NO_RETURN abort(Context* c) { abort(c->system); } #ifndef NDEBUG inline void assert(Context* c, bool v) { assert(c->system, v); } #endif // not NDEBUG inline void expect(Context* c, bool v) { expect(c->system, v); } unsigned count(Cell* c) { unsigned count = 0; while (c) { ++ count; c = c->next; } return count; } Cell* cons(Context* c, void* value, Cell* next) { return new (c->zone->allocate(sizeof(Cell))) Cell(next, value); } Cell* append(Context* c, Cell* first, Cell* second) { if (first) { if (second) { Cell* start = cons(c, first->value, second); Cell* end = start; for (Cell* cell = first->next; cell; cell = cell->next) { Cell* n = cons(c, cell->value, second); end->next = n; end = n; } return start; } else { return first; } } else { return second; } } Cell* reverseDestroy(Cell* cell) { Cell* previous = 0; while (cell) { Cell* next = cell->next; cell->next = previous; previous = cell; cell = next; } return previous; } class StubReadPair { public: Value* value; StubRead* read; }; class JunctionState { public: JunctionState(unsigned frameFootprint): frameFootprint(frameFootprint) { } unsigned frameFootprint; StubReadPair reads[0]; }; class Link { public: Link(Event* predecessor, Link* nextPredecessor, Event* successor, Link* nextSuccessor, ForkState* forkState): predecessor(predecessor), nextPredecessor(nextPredecessor), successor(successor), nextSuccessor(nextSuccessor), forkState(forkState), junctionState(0) { } 
Event* predecessor; Link* nextPredecessor; Event* successor; Link* nextSuccessor; ForkState* forkState; JunctionState* junctionState; }; Link* link(Context* c, Event* predecessor, Link* nextPredecessor, Event* successor, Link* nextSuccessor, ForkState* forkState) { return new (c->zone->allocate(sizeof(Link))) Link (predecessor, nextPredecessor, successor, nextSuccessor, forkState); } unsigned countPredecessors(Link* link) { unsigned c = 0; for (; link; link = link->nextPredecessor) ++ c; return c; } Link* lastPredecessor(Link* link) { while (link->nextPredecessor) link = link->nextPredecessor; return link; } unsigned countSuccessors(Link* link) { unsigned c = 0; for (; link; link = link->nextSuccessor) ++ c; return c; } class Event { public: Event(Context* c): next(0), stackBefore(c->stack), localsBefore(c->locals), stackAfter(0), localsAfter(0), promises(0), reads(0), junctionSites(0), snapshots(0), predecessors(0), successors(0), visitLinks(0), block(0), logicalInstruction(c->logicalCode[c->logicalIp]), readCount(0) { } virtual const char* name() = 0; virtual void compile(Context* c) = 0; virtual bool isBranch() { return false; } virtual bool allExits() { return false; } Event* next; Stack* stackBefore; Local* localsBefore; Stack* stackAfter; Local* localsAfter; CodePromise* promises; Read* reads; Site** junctionSites; Snapshot* snapshots; Link* predecessors; Link* successors; Cell* visitLinks; Block* block; LogicalInstruction* logicalInstruction; unsigned readCount; }; unsigned totalFrameSize(Context* c) { return c->alignedFrameSize + c->arch->frameHeaderSize() + c->arch->argumentFootprint(c->parameterFootprint); } int frameIndex(Context* c, int localIndex) { assert(c, localIndex >= 0); int index = c->alignedFrameSize + c->parameterFootprint - localIndex - 1; if (localIndex < static_cast(c->parameterFootprint)) { index += c->arch->frameHeaderSize(); } else { index -= c->arch->frameFooterSize(); } assert(c, index >= 0); assert(c, static_cast(index) < 
totalFrameSize(c)); return index; } unsigned frameIndexToOffset(Context* c, unsigned frameIndex) { assert(c, frameIndex < totalFrameSize(c)); return (frameIndex + c->arch->frameFooterSize()) * BytesPerWord; } unsigned offsetToFrameIndex(Context* c, unsigned offset) { assert(c, static_cast ((offset / BytesPerWord) - c->arch->frameFooterSize()) >= 0); assert(c, ((offset / BytesPerWord) - c->arch->frameFooterSize()) < totalFrameSize(c)); return (offset / BytesPerWord) - c->arch->frameFooterSize(); } unsigned frameBase(Context* c) { return c->alignedFrameSize - c->arch->frameReturnAddressSize() - c->arch->frameFooterSize() + c->arch->frameHeaderSize(); } class FrameIterator { public: class Element { public: Element(Value* value, unsigned localIndex): value(value), localIndex(localIndex) { } Value* const value; const unsigned localIndex; }; FrameIterator(Context* c, Stack* stack, Local* locals): stack(stack), locals(locals), localIndex(c->localFootprint - 1) { } bool hasMore() { while (stack and stack->value == 0) stack = stack->next; while (localIndex >= 0 and locals[localIndex].value == 0) -- localIndex; return stack != 0 or localIndex >= 0; } Element next(Context* c) { Value* v; unsigned li; if (stack) { Stack* s = stack; v = s->value; li = s->index + c->localFootprint; stack = stack->next; } else { Local* l = locals + localIndex; v = l->value; li = localIndex; -- localIndex; } return Element(v, li); } Stack* stack; Local* locals; int localIndex; }; int frameIndex(Context* c, FrameIterator::Element* element) { return frameIndex(c, element->localIndex); } class SiteIterator { public: SiteIterator(Context* c, Value* v, bool includeBuddies = true, bool includeNext = true): c(c), originalValue(v), currentValue(v), includeBuddies(includeBuddies), includeNext(includeNext), pass(0), next_(findNext(&(v->sites))), previous(0) { } Site** findNext(Site** p) { while (true) { if (*p) { if (pass == 0 or (*p)->registerSize(c) > BytesPerWord) { return p; } else { p = &((*p)->next); 
} } else { if (includeBuddies) { Value* v = currentValue->buddy; if (v != originalValue) { currentValue = v; p = &(v->sites); continue; } } if (includeNext and pass == 0) { Value* v = originalValue->next; if (v != originalValue) { pass = 1; originalValue = v; currentValue = v; p = &(v->sites); continue; } } return 0; } } } bool hasMore() { if (previous) { next_ = findNext(&((*previous)->next)); previous = 0; } return next_ != 0; } Site* next() { previous = next_; return *previous; } void remove(Context* c) { (*previous)->release(c, originalValue); *previous = (*previous)->next; next_ = findNext(previous); previous = 0; } Context* c; Value* originalValue; Value* currentValue; bool includeBuddies; bool includeNext; uint8_t pass; Site** next_; Site** previous; }; bool hasMoreThanOneSite(Context* c, Value* v) { SiteIterator it(c, v); if (it.hasMore()) { it.next(); return it.hasMore(); } else { return false; } } bool hasSite(Context* c, Value* v) { SiteIterator it(c, v); return it.hasMore(); } bool findSite(Context*, Value* v, Site* site) { for (Site* s = v->sites; s; s = s->next) { if (s == site) return true; } return false; } void addSite(Context* c, Value* v, Site* s) { if (not findSite(c, v, s)) { if (DebugSites) { char buffer[256]; s->toString(c, buffer, 256); fprintf(stderr, "add site %s to %p\n", buffer, v); } s->acquire(c, v); s->next = v->sites; v->sites = s; } } void removeSite(Context* c, Value* v, Site* s) { for (SiteIterator it(c, v); it.hasMore();) { if (s == it.next()) { if (DebugSites) { char buffer[256]; s->toString(c, buffer, 256); fprintf(stderr, "remove site %s from %p\n", buffer, v); } it.remove(c); break; } } if (DebugSites) { fprintf(stderr, "%p has more: %d\n", v, hasSite(c, v)); } assert(c, not findSite(c, v, s)); } void clearSites(Context* c, Value* v) { if (DebugSites) { fprintf(stderr, "clear sites for %p\n", v); } for (SiteIterator it(c, v); it.hasMore();) { it.next(); it.remove(c); } } bool valid(Read* r) { return r and r->valid(); } Read* 
live(Value* v) { Value* p = v; do { if (valid(p->reads)) { return p->reads; } p = p->buddy; } while (p != v); return 0; } Read* liveNext(Context* c, Value* v) { Read* r = v->reads->next(c); if (valid(r)) return r; for (Value* p = v->buddy; p != v; p = p->buddy) { if (valid(p->reads)) return p->reads; } return 0; } void deadBuddy(Context* c, Value* v, Read* r UNUSED) { assert(c, v->buddy != v); assert(c, r); if (DebugBuddies) { fprintf(stderr, "remove dead buddy %p from", v); for (Value* p = v->buddy; p != v; p = p->buddy) { fprintf(stderr, " %p", p); } fprintf(stderr, "\n"); } assert(c, v->buddy); Value* next = v->buddy; v->buddy = v; Value* p = next; while (p->buddy != v) p = p->buddy; p->buddy = next; assert(c, p->buddy); for (SiteIterator it(c, v); it.hasMore();) { Site* s = it.next(); it.remove(c); addSite(c, next, s); } } void popRead(Context* c, Event* e UNUSED, Value* v) { assert(c, e == v->reads->event); if (DebugReads) { fprintf(stderr, "pop read %p from %p next %p event %p (%s)\n", v->reads, v, v->reads->next(c), e, (e ? 
e->name() : 0)); } v->reads = v->reads->next(c); if (not valid(v->reads)) { Read* r = live(v); if (r) { deadBuddy(c, v, r); } else { clearSites(c, v); } } } bool buddies(Value* a, Value* b) { if (a == b) return true; for (Value* p = a->buddy; p != a; p = p->buddy) { if (p == b) return true; } return false; } void decrementAvailableGeneralRegisterCount(Context* c) { assert(c, c->availableGeneralRegisterCount); -- c->availableGeneralRegisterCount; if (DebugResources) { fprintf(stderr, "%d registers available\n", c->availableGeneralRegisterCount); } } void incrementAvailableGeneralRegisterCount(Context* c) { ++ c->availableGeneralRegisterCount; if (DebugResources) { fprintf(stderr, "%d registers available\n", c->availableGeneralRegisterCount); } } void increment(Context* c, RegisterResource* r) { if (not r->reserved) { if (DebugResources) { char buffer[256]; r->toString(c, buffer, 256); fprintf(stderr, "increment %s to %d\n", buffer, r->referenceCount + 1); } ++ r->referenceCount; if (r->referenceCount == 1 and ((1 << r->index(c)) & c->arch->generalRegisterMask())) { decrementAvailableGeneralRegisterCount(c); } } } void decrement(Context* c, RegisterResource* r) { if (not r->reserved) { if (DebugResources) { char buffer[256]; r->toString(c, buffer, 256); fprintf(stderr, "decrement %s to %d\n", buffer, r->referenceCount - 1); } assert(c, r->referenceCount > 0); -- r->referenceCount; if (r->referenceCount == 0 and ((1 << r->index(c)) & c->arch->generalRegisterMask())) { incrementAvailableGeneralRegisterCount(c); } } } void freezeResource(Context* c, Resource* r, Value* v) { if (DebugResources) { char buffer[256]; r->toString(c, buffer, 256); fprintf(stderr, "%p freeze %s to %d\n", v, buffer, r->freezeCount + 1); } ++ r->freezeCount; } void RegisterResource::freeze(Context* c, Value* v) { if (not reserved) { freezeResource(c, this, v); if (freezeCount == 1 and ((1 << index(c)) & c->arch->generalRegisterMask())) { decrementAvailableGeneralRegisterCount(c); } } } void 
FrameResource::freeze(Context* c, Value* v) { freezeResource(c, this, v); } void thawResource(Context* c, Resource* r, Value* v) { if (not r->reserved) { if (DebugResources) { char buffer[256]; r->toString(c, buffer, 256); fprintf(stderr, "%p thaw %s to %d\n", v, buffer, r->freezeCount - 1); } assert(c, r->freezeCount); -- r->freezeCount; } } void RegisterResource::thaw(Context* c, Value* v) { if (not reserved) { thawResource(c, this, v); if (freezeCount == 0 and ((1 << index(c)) & c->arch->generalRegisterMask())) { incrementAvailableGeneralRegisterCount(c); } } } void FrameResource::thaw(Context* c, Value* v) { thawResource(c, this, v); } class Target { public: static const unsigned MinimumRegisterCost = 0; static const unsigned MinimumFrameCost = 1; static const unsigned StealPenalty = 2; static const unsigned StealUniquePenalty = 4; static const unsigned LowRegisterPenalty = 10; static const unsigned Impossible = 20; Target(): cost(Impossible) { } Target(int index, OperandType type, unsigned cost): index(index), type(type), cost(cost) { } int16_t index; OperandType type; uint8_t cost; }; ValueType valueType(Context* c, Compiler::OperandType type) { switch (type) { case Compiler::ObjectType: case Compiler::AddressType: case Compiler::IntegerType: case Compiler::VoidType: return ValueGeneral; case Compiler::FloatType: return ValueFloat; default: abort(c); } } Target pickTarget(Context* c, Read* r, bool intersectRead, unsigned registerReserveCount); unsigned resourceCost(Context* c UNUSED, Value* v, Resource* r) { if (r->reserved or r->freezeCount or r->referenceCount) { return Target::Impossible; } else if (r->value) { assert(c, findSite(c, r->value, r->site)); if (v and buddies(r->value, v)) { return 0; } else if (hasMoreThanOneSite(c, r->value)) { return Target::StealPenalty; } else { return Target::StealUniquePenalty; } } else { return 0; } } bool pickRegisterTarget(Context* c, int i, Value* v, uint32_t mask, int* target, unsigned* cost) { if ((1 << i) & mask) 
{ RegisterResource* r = c->registerResources + i; unsigned myCost = resourceCost(c, v, r) + Target::MinimumRegisterCost; if ((static_cast(1) << i) == mask) { *cost = myCost; return true; } else if (myCost < *cost) { *cost = myCost; *target = i; } } return false; } int pickRegisterTarget(Context* c, Value* v, uint32_t mask, unsigned* cost) { int target = NoRegister; *cost = Target::Impossible; if (mask & c->arch->generalRegisterMask()) { for (int i = c->generalRegisterLimit - 1; i >= c->generalRegisterStart; --i) { if (pickRegisterTarget(c, i, v, mask, &target, cost)) { return i; } } } if (mask & c->arch->floatRegisterMask()) { for (int i = c->floatRegisterStart; i < static_cast(c->floatRegisterLimit); ++i) { if (pickRegisterTarget(c, i, v, mask, &target, cost)) { return i; } } } return target; } Target pickRegisterTarget(Context* c, Value* v, uint32_t mask) { unsigned cost; int number = pickRegisterTarget(c, v, mask, &cost); return Target(number, RegisterOperand, cost); } unsigned frameCost(Context* c, Value* v, int frameIndex) { return resourceCost(c, v, c->frameResources + frameIndex) + Target::MinimumFrameCost; } Target pickFrameTarget(Context* c, Value* v) { Target best; Value* p = v; do { if (p->home >= 0) { Target mine(p->home, MemoryOperand, frameCost(c, v, p->home)); if (mine.cost == Target::MinimumFrameCost) { return mine; } else if (mine.cost < best.cost) { best = mine; } } p = p->buddy; } while (p != v); return best; } Target pickAnyFrameTarget(Context* c, Value* v) { Target best; unsigned count = totalFrameSize(c); for (unsigned i = 0; i < count; ++i) { Target mine(i, MemoryOperand, frameCost(c, v, i)); if (mine.cost == Target::MinimumFrameCost) { return mine; } else if (mine.cost < best.cost) { best = mine; } } return best; } Target pickTarget(Context* c, Value* value, const SiteMask& mask, unsigned registerPenalty, Target best) { if (mask.typeMask & (1 << RegisterOperand)) { Target mine = pickRegisterTarget(c, value, mask.registerMask); mine.cost += 
registerPenalty; if (mine.cost == Target::MinimumRegisterCost) { return mine; } else if (mine.cost < best.cost) { best = mine; } } if (mask.typeMask & (1 << MemoryOperand)) { if (mask.frameIndex >= 0) { Target mine(mask.frameIndex, MemoryOperand, frameCost(c, value, mask.frameIndex)); if (mine.cost == Target::MinimumFrameCost) { return mine; } else if (mine.cost < best.cost) { best = mine; } } else if (mask.frameIndex == AnyFrameIndex) { Target mine = pickFrameTarget(c, value); if (mine.cost == Target::MinimumFrameCost) { return mine; } else if (mine.cost < best.cost) { best = mine; } } } return best; } Target pickTarget(Context* c, Read* read, bool intersectRead, unsigned registerReserveCount) { unsigned registerPenalty = (c->availableGeneralRegisterCount > registerReserveCount ? 0 : Target::LowRegisterPenalty); SiteMask mask; read->intersect(&mask); Target best; Value* value = read->value; Value* successor = read->successor(); if (successor) { Read* r = live(successor); if (r) { SiteMask intersection = mask; if (r->intersect(&intersection)) { best = pickTarget(c, value, intersection, registerPenalty, best); if (best.cost <= Target::MinimumFrameCost) { return best; } } } } best = pickTarget(c, value, mask, registerPenalty, best); if (best.cost <= Target::MinimumFrameCost) { return best; } if (intersectRead) { if (best.cost == Target::Impossible) { fprintf(stderr, "mask type %d reg %d frame %d\n", mask.typeMask, mask.registerMask, mask.frameIndex); asm("int3"); } return best; } { Target mine = pickRegisterTarget(c, value, ~0); mine.cost += registerPenalty; if (mine.cost == Target::MinimumRegisterCost) { return mine; } else if (mine.cost < best.cost) { best = mine; } } { Target mine = pickFrameTarget(c, value); if (mine.cost == Target::MinimumFrameCost) { return mine; } else if (mine.cost < best.cost) { best = mine; } } if (best.cost >= Target::StealUniquePenalty and c->availableGeneralRegisterCount == 0) { // there are no free registers left, so moving from memory 
to // memory isn't an option - try harder to find an available frame // site: best = pickAnyFrameTarget(c, value); assert(c, best.cost <= 3); } if (best.cost == Target::Impossible) asm("int3"); return best; } void acquire(Context* c, Resource* resource, Value* value, Site* site); void release(Context* c, Resource* resource, Value* value, Site* site); ConstantSite* constantSite(Context* c, Promise* value); ShiftMaskPromise* shiftMaskPromise(Context* c, Promise* base, unsigned shift, int64_t mask) { return new (c->zone->allocate(sizeof(ShiftMaskPromise))) ShiftMaskPromise(base, shift, mask); } CombinedPromise* combinedPromise(Context* c, Promise* low, Promise* high) { return new (c->zone->allocate(sizeof(CombinedPromise))) CombinedPromise(low, high); } class ConstantSite: public Site { public: ConstantSite(Promise* value): value(value) { } virtual unsigned toString(Context*, char* buffer, unsigned bufferSize) { if (value->resolved()) { return vm::snprintf (buffer, bufferSize, "constant %"LLD, value->value()); } else { return vm::snprintf(buffer, bufferSize, "constant unresolved"); } } virtual unsigned copyCost(Context*, Site* s) { return (s == this ? 
0 : 3); } virtual bool match(Context*, const SiteMask& mask) { return mask.typeMask & (1 << ConstantOperand); } virtual bool loneMatch(Context*, const SiteMask&) { return true; } virtual bool matchNext(Context* c, Site* s, unsigned) { return s->type(c) == ConstantOperand; } virtual OperandType type(Context*) { return ConstantOperand; } virtual void asAssemblerOperand(Context* c, Site* high, Assembler::Operand* result) { Promise* v = value; if (high != this) { v = combinedPromise(c, value, static_cast(high)->value); } new (result) Assembler::Constant(v); } virtual Site* copy(Context* c) { return constantSite(c, value); } virtual Site* copyLow(Context* c) { return constantSite(c, shiftMaskPromise(c, value, 0, 0xFFFFFFFF)); } virtual Site* copyHigh(Context* c) { return constantSite(c, shiftMaskPromise(c, value, 32, 0xFFFFFFFF)); } virtual Site* makeNext(Context* c, unsigned) { abort(c); } Promise* value; }; ConstantSite* constantSite(Context* c, Promise* value) { return new (c->zone->allocate(sizeof(ConstantSite))) ConstantSite(value); } ResolvedPromise* resolved(Context* c, int64_t value) { return new (c->zone->allocate(sizeof(ResolvedPromise))) ResolvedPromise(value); } ConstantSite* constantSite(Context* c, int64_t value) { return constantSite(c, resolved(c, value)); } AddressSite* addressSite(Context* c, Promise* address); class AddressSite: public Site { public: AddressSite(Promise* address): address(address) { } virtual unsigned toString(Context*, char* buffer, unsigned bufferSize) { if (address->resolved()) { return vm::snprintf (buffer, bufferSize, "address %"LLD, address->value()); } else { return vm::snprintf(buffer, bufferSize, "address unresolved"); } } virtual unsigned copyCost(Context*, Site* s) { return (s == this ? 
0 : 2); } virtual bool match(Context*, const SiteMask& mask) { return mask.typeMask & (1 << AddressOperand); } virtual bool loneMatch(Context*, const SiteMask&) { return false; } virtual bool matchNext(Context* c, Site*, unsigned) { abort(c); } virtual OperandType type(Context*) { return AddressOperand; } virtual void asAssemblerOperand(Context* c UNUSED, Site* high UNUSED, Assembler::Operand* result) { assert(c, high == this); new (result) Assembler::Address(address); } virtual Site* copy(Context* c) { return addressSite(c, address); } virtual Site* copyLow(Context* c) { abort(c); } virtual Site* copyHigh(Context* c) { abort(c); } virtual Site* makeNext(Context* c, unsigned) { abort(c); } Promise* address; }; AddressSite* addressSite(Context* c, Promise* address) { return new (c->zone->allocate(sizeof(AddressSite))) AddressSite(address); } RegisterSite* freeRegisterSite(Context* c, uint32_t mask); class RegisterSite: public Site { public: RegisterSite(uint32_t mask, int number): mask(mask), number(number) { } virtual unsigned toString(Context*, char* buffer, unsigned bufferSize) { if (number != NoRegister) { return vm::snprintf(buffer, bufferSize, "%p register %d", this, number); } else { return vm::snprintf(buffer, bufferSize, "%p register unacquired", this); } } virtual unsigned copyCost(Context* c, Site* s) { assert(c, number != NoRegister); if (s and (this == s or (s->type(c) == RegisterOperand and (static_cast(s)->mask & (1 << number))))) { return 0; } else { return 1; } } virtual bool match(Context* c UNUSED, const SiteMask& mask) { assert(c, number != NoRegister); if ((mask.typeMask & (1 << RegisterOperand))) { return ((static_cast(1) << number) & mask.registerMask); } else { return false; } } virtual bool loneMatch(Context* c UNUSED, const SiteMask& mask) { assert(c, number != NoRegister); if ((mask.typeMask & (1 << RegisterOperand))) { return ((static_cast(1) << number) == mask.registerMask); } else { return false; } } virtual bool matchNext(Context* c, 
Site* s, unsigned) { return s->type(c) == RegisterOperand and s->registerSize(c) == BytesPerWord; } virtual void acquire(Context* c, Value* v) { Target target; if (number != NoRegister) { target = Target(number, RegisterOperand, 0); } else { target = pickRegisterTarget(c, v, mask); expect(c, target.cost < Target::Impossible); } RegisterResource* resource = c->registerResources + target.index; local::acquire(c, resource, v, this); number = target.index; } virtual void release(Context* c, Value* v) { assert(c, number != NoRegister); local::release(c, c->registerResources + number, v, this); } virtual void freeze(Context* c, Value* v) { assert(c, number != NoRegister); c->registerResources[number].freeze(c, v); } virtual void thaw(Context* c, Value* v) { assert(c, number != NoRegister); c->registerResources[number].thaw(c, v); } virtual bool frozen(Context* c UNUSED) { assert(c, number != NoRegister); return c->registerResources[number].freezeCount != 0; } virtual OperandType type(Context*) { return RegisterOperand; } virtual void asAssemblerOperand(Context* c UNUSED, Site* high, Assembler::Operand* result) { assert(c, number != NoRegister); int highNumber; if (high != this) { highNumber = static_cast(high)->number; assert(c, highNumber != NoRegister); } else { highNumber = NoRegister; } new (result) Assembler::Register(number, highNumber); } virtual Site* copy(Context* c) { uint32_t mask; if (number != NoRegister) { mask = 1 << number; } else { mask = this->mask; } return freeRegisterSite(c, mask); } virtual Site* copyLow(Context* c) { abort(c); } virtual Site* copyHigh(Context* c) { abort(c); } virtual Site* makeNext(Context* c, unsigned) { return freeRegisterSite(c, c->arch->generalRegisterMask()); } virtual unsigned registerSize(Context* c) { assert(c, number != NoRegister); if ((1 << number) & c->arch->floatRegisterMask()) { return c->arch->floatRegisterSize(); } else { return BytesPerWord; } } virtual unsigned registerMask(Context* c) { assert(c, number != 
NoRegister); return 1 << number; } uint32_t mask; int number; }; RegisterSite* registerSite(Context* c, int number) { assert(c, number >= 0); assert(c, (1 << number) & (c->arch->generalRegisterMask() | c->arch->floatRegisterMask())); return new (c->zone->allocate(sizeof(RegisterSite))) RegisterSite(1 << number, number); } RegisterSite* freeRegisterSite(Context* c, uint32_t mask) { return new (c->zone->allocate(sizeof(RegisterSite))) RegisterSite(mask, NoRegister); } MemorySite* memorySite(Context* c, int base, int offset = 0, int index = NoRegister, unsigned scale = 1); class MemorySite: public Site { public: MemorySite(int base, int offset, int index, unsigned scale): acquired(false), base(base), offset(offset), index(index), scale(scale) { } virtual unsigned toString(Context*, char* buffer, unsigned bufferSize) { if (acquired) { return vm::snprintf(buffer, bufferSize, "memory %d 0x%x %d %d", base, offset, index, scale); } else { return vm::snprintf(buffer, bufferSize, "memory unacquired"); } } virtual unsigned copyCost(Context* c, Site* s) { assert(c, acquired); if (s and (this == s or (s->type(c) == MemoryOperand and static_cast(s)->base == base and static_cast(s)->offset == offset and static_cast(s)->index == index and static_cast(s)->scale == scale))) { return 0; } else { return 4; } } virtual bool match(Context* c, const SiteMask& mask) { assert(c, acquired); if (mask.typeMask & (1 << MemoryOperand)) { if (base == c->arch->stack()) { assert(c, index == NoRegister); return mask.frameIndex == AnyFrameIndex or (mask.frameIndex != NoFrameIndex and static_cast(frameIndexToOffset(c, mask.frameIndex)) == offset); } else { return true; } } else { return false; } } virtual bool loneMatch(Context* c, const SiteMask& mask) { assert(c, acquired); if (mask.typeMask & (1 << MemoryOperand)) { if (base == c->arch->stack()) { assert(c, index == NoRegister); if (mask.frameIndex == AnyFrameIndex) { return false; } else { return true; } } } return false; } virtual bool 
matchNext(Context* c, Site* s, unsigned index) { if (s->type(c) == MemoryOperand) { MemorySite* ms = static_cast(s); return ms->base == this->base and ((index == 1 and ms->offset == static_cast (this->offset + BytesPerWord)) or (index == 0 and this->offset == static_cast (ms->offset + BytesPerWord))) and ms->index == this->index and ms->scale == this->scale; } else { return false; } } virtual void acquire(Context* c, Value* v) { increment(c, c->registerResources + base); if (index != NoRegister) { increment(c, c->registerResources + index); } if (base == c->arch->stack()) { assert(c, index == NoRegister); local::acquire (c, c->frameResources + offsetToFrameIndex(c, offset), v, this); } acquired = true; } virtual void release(Context* c, Value* v) { if (base == c->arch->stack()) { assert(c, index == NoRegister); local::release (c, c->frameResources + offsetToFrameIndex(c, offset), v, this); } decrement(c, c->registerResources + base); if (index != NoRegister) { decrement(c, c->registerResources + index); } acquired = false; } virtual void freeze(Context* c, Value* v) { if (base == c->arch->stack()) { c->frameResources[offsetToFrameIndex(c, offset)].freeze(c, v); } } virtual void thaw(Context* c, Value* v) { if (base == c->arch->stack()) { c->frameResources[offsetToFrameIndex(c, offset)].thaw(c, v); } } virtual bool frozen(Context* c) { return base == c->arch->stack() and c->frameResources[offsetToFrameIndex(c, offset)].freezeCount != 0; } virtual OperandType type(Context*) { return MemoryOperand; } virtual void asAssemblerOperand(Context* c UNUSED, Site* high UNUSED, Assembler::Operand* result) { assert(c, high == this or (static_cast(high)->base == base and static_cast(high)->offset == static_cast(offset + BytesPerWord) and static_cast(high)->index == index and static_cast(high)->scale == scale)); assert(c, acquired); new (result) Assembler::Memory(base, offset, index, scale); } virtual Site* copy(Context* c) { return memorySite(c, base, offset, index, scale); } 
Site* copyHalf(Context* c, bool add) {
    // Returns a new site for one word of a two-word value: the word at
    // offset + BytesPerWord when add is true, else a plain copy.
    if (add) {
      return memorySite(c, base, offset + BytesPerWord, index, scale);
    } else {
      return copy(c);
    }
  }

  // Which half sits at the higher address depends on endianness.
  virtual Site* copyLow(Context* c) {
    return copyHalf(c, c->arch->bigEndian());
  }

  virtual Site* copyHigh(Context* c) {
    return copyHalf(c, not c->arch->bigEndian());
  }

  // Creates the neighbouring word: one word above for index == 1,
  // one word below otherwise.
  virtual Site* makeNext(Context* c, unsigned index) {
    return memorySite
      (c, base, offset + (index == 1 ? BytesPerWord : -BytesPerWord),
       this->index, scale);
  }

  bool acquired;
  int base;
  int offset;
  int index;
  unsigned scale;
};

// Allocates a new (unacquired) MemorySite from the context's zone.
MemorySite*
memorySite(Context* c, int base, int offset, int index, unsigned scale)
{
  return new (c->zone->allocate(sizeof(MemorySite)))
    MemorySite(base, offset, index, scale);
}

// Creates a stack-relative memory site for the given frame index.
MemorySite*
frameSite(Context* c, int frameIndex)
{
  assert(c, frameIndex >= 0);
  return memorySite
    (c, c->arch->stack(), frameIndexToOffset(c, frameIndex), NoRegister, 0);
}

void
move(Context* c, Value* value, Site* src, Site* dst);

// Writes a ", "-separated description of each site in the list into
// buffer, NUL-terminates it, and returns the number of characters
// written (excluding the terminator).
unsigned
sitesToString(Context* c, Site* sites, char* buffer, unsigned size)
{
  unsigned total = 0;
  for (Site* s = sites; s; s = s->next) {
    total += s->toString(c, buffer + total, size - total);

    if (s->next) {
      assert(c, size > total + 2);
      memcpy(buffer + total, ", ", 2);
      total += 2;
    }
  }

  assert(c, size > total);
  buffer[total] = 0;

  return total;
}

// Describes the sites of v and of every value in its buddy ring,
// separating the values with "; ".
unsigned
sitesToString(Context* c, Value* v, char* buffer, unsigned size)
{
  unsigned total = 0;
  Value* p = v;
  do {
    if (total) {
      assert(c, size > total + 2);
      memcpy(buffer + total, "; ", 2);
      total += 2;
    }

    if (p->sites) {
      total += vm::snprintf(buffer + total, size - total, "%p has ", p);
      total += sitesToString(c, p->sites, buffer + total, size - total);
    } else {
      total += vm::snprintf(buffer + total, size - total, "%p has nothing", p);
    }

    p = p->buddy;
  } while (p != v);

  return total;
}

// Picks a target for the read via pickTarget and materializes it as a
// frame site or a register site; expects that a target exists.
Site*
pickTargetSite(Context* c, Read* read, bool intersectRead = false,
               unsigned registerReserveCount = 0)
{
  Target target(pickTarget(c, read, intersectRead, registerReserveCount));
  expect(c, target.cost <
Target::Impossible);

  if (target.type == MemoryOperand) {
    return frameSite(c, target.index);
  } else {
    return registerSite(c, target.index);
  }
}

// Takes resource r away from the value currently holding it.  Unless
// the thief is a buddy of that value, or the value has more than one
// site, the value is first moved to a newly picked target site.
void
steal(Context* c, Resource* r, Value* thief)
{
  if (DebugResources) {
    char resourceBuffer[256]; r->toString(c, resourceBuffer, 256);
    char siteBuffer[1024]; sitesToString(c, r->value, siteBuffer, 1024);
    fprintf(stderr, "%p steal %s from %p (%s)\n",
            thief, resourceBuffer, r->value, siteBuffer);
  }

  if (not ((thief and buddies(thief, r->value))
           or hasMoreThanOneSite(c, r->value)))
  {
    // freeze the site so it is not itself chosen or clobbered while
    // the value is being moved out of it
    r->site->freeze(c, r->value);

    move(c, r->value, r->site, pickTargetSite
         (c, live(r->value), false, StealRegisterReserveCount));

    r->site->thaw(c, r->value);
  }

  removeSite(c, r->value, r->site);
}

// Records that `value` now occupies `resource` through `site`,
// stealing the resource from its current holder if there is one.
// Reserved resources are left untouched.
void
acquire(Context* c, Resource* resource, Value* value, Site* site)
{
  assert(c, value);
  assert(c, site);

  if (not resource->reserved) {
    if (DebugResources) {
      char buffer[256]; resource->toString(c, buffer, 256);
      fprintf(stderr, "%p acquire %s\n", value, buffer);
    }

    if (resource->value) {
      assert(c, findSite(c, resource->value, resource->site));
      assert(c, not findSite(c, value, resource->site));

      steal(c, resource, value);
    }

    resource->value = value;
    resource->site = site;
  }
}

// Clears the value and site recorded on a non-reserved resource; the
// value and site arguments are only used for assertions.
void
release(Context* c, Resource* resource, Value* value UNUSED, Site* site UNUSED)
{
  if (not resource->reserved) {
    if (DebugResources) {
      char buffer[256]; resource->toString(c, buffer, 256);
      fprintf(stderr, "%p release %s\n", resource->value, buffer);
    }

    assert(c, resource->value);
    assert(c, resource->site);

    assert(c, buddies(resource->value, value));
    assert(c, site == resource->site);

    resource->value = 0;
    resource->site = 0;
  }
}

// A read which constrains its value with a single SiteMask.
class SingleRead: public Read {
 public:
  SingleRead(const SiteMask& mask, Value* successor):
    next_(0), mask(mask), high(0), successor_(successor)
  { }

  virtual bool intersect(SiteMask* mask, unsigned) {
    *mask = local::intersect(*mask, this->mask);

    return true;
  }

  // If a high-word value is attached, narrows this read's mask to
  // the operand type of that value's source site.
  virtual void maybeIntersectWithHighSource(Context* c) {
    if (high) {
      Site* s = high->source;
      this->mask
= local::intersect (SiteMask(1 << s->type(c), ~0, AnyFrameIndex), this->mask); } } virtual Value* successor() { return successor_; } virtual bool valid() { return true; } virtual void append(Context* c UNUSED, Read* r) { assert(c, next_ == 0); next_ = r; } virtual Read* next(Context*) { return next_; } Read* next_; SiteMask mask; Value* high; Value* successor_; }; SingleRead* read(Context* c, const SiteMask& mask, Value* successor = 0) { assert(c, (mask.typeMask != 1 << MemoryOperand) or mask.frameIndex >= 0); return new (c->zone->allocate(sizeof(SingleRead))) SingleRead(mask, successor); } SiteMask generalRegisterMask(Context* c) { return SiteMask (1 << RegisterOperand, c->arch->generalRegisterMask(), NoFrameIndex); } SiteMask generalRegisterOrConstantMask(Context* c) { return SiteMask ((1 << RegisterOperand) | (1 << ConstantOperand), c->arch->generalRegisterMask(), NoFrameIndex); } SiteMask fixedRegisterMask(int number) { return SiteMask(1 << RegisterOperand, 1 << number, NoFrameIndex); } class MultiRead: public Read { public: MultiRead(): reads(0), lastRead(0), firstTarget(0), lastTarget(0), visited(false) { } virtual bool intersect(SiteMask* mask, unsigned depth) { if (depth > 0) { // short-circuit recursion to avoid poor performance in // deeply-nested branches return reads != 0; } bool result = false; if (not visited) { visited = true; for (Cell** cell = &reads; *cell;) { Read* r = static_cast((*cell)->value); bool valid = r->intersect(mask, depth + 1); if (valid) { result = true; cell = &((*cell)->next); } else { *cell = (*cell)->next; } } visited = false; } return result; } virtual Value* successor() { return 0; } virtual bool valid() { bool result = false; if (not visited) { visited = true; for (Cell** cell = &reads; *cell;) { Read* r = static_cast((*cell)->value); if (r->valid()) { result = true; cell = &((*cell)->next); } else { *cell = (*cell)->next; } } visited = false; } return result; } virtual void append(Context* c, Read* r) { Cell* cell = cons(c, 
r, 0); if (lastRead == 0) { reads = cell; } else { lastRead->next = cell; } lastRead = cell; // fprintf(stderr, "append %p to %p for %p\n", r, lastTarget, this); lastTarget->value = r; } virtual Read* next(Context* c) { abort(c); } void allocateTarget(Context* c) { Cell* cell = cons(c, 0, 0); // fprintf(stderr, "allocate target for %p: %p\n", this, cell); if (lastTarget) { lastTarget->next = cell; } else { firstTarget = cell; } lastTarget = cell; } Read* nextTarget() { // fprintf(stderr, "next target for %p: %p\n", this, firstTarget); Read* r = static_cast(firstTarget->value); firstTarget = firstTarget->next; return r; } Cell* reads; Cell* lastRead; Cell* firstTarget; Cell* lastTarget; bool visited; }; MultiRead* multiRead(Context* c) { return new (c->zone->allocate(sizeof(MultiRead))) MultiRead; } class StubRead: public Read { public: StubRead(): next_(0), read(0), visited(false), valid_(true) { } virtual bool intersect(SiteMask* mask, unsigned depth) { if (not visited) { visited = true; if (read) { bool valid = read->intersect(mask, depth); if (not valid) { read = 0; } } visited = false; } return valid_; } virtual Value* successor() { return 0; } virtual bool valid() { return valid_; } virtual void append(Context* c UNUSED, Read* r) { assert(c, next_ == 0); next_ = r; } virtual Read* next(Context*) { return next_; } Read* next_; Read* read; bool visited; bool valid_; }; StubRead* stubRead(Context* c) { return new (c->zone->allocate(sizeof(StubRead))) StubRead; } Site* pickOrMoveSite(Context* c, Value* v, Site* s, unsigned index) { for (SiteIterator it(c, v, true, false); it.hasMore();) { Site* candidate = it.next(); if (s->matchNext(c, candidate, index)) { return candidate; } } Site* n = s->makeNext(c, index); Site* src = 0; unsigned copyCost = 0xFFFFFFFF; for (SiteIterator it(c, v, true, false); it.hasMore();) { Site* candidate = it.next(); unsigned cost = candidate->copyCost(c, n); if (cost < copyCost) { src = candidate; copyCost = cost; } } move(c, v, src, n); 
return n; } Site* pickOrMoveSite(Context* c, Value* v, Site* s, Site** low, Site** high) { if (v->index == 0) { *low = s; *high = pickOrMoveSite(c, v->next, s, 1); return *high; } else { *low = pickOrMoveSite(c, v->next, s, 0); *high = s; return *low; } } Site* growSite(Context* c, Value* v, Site* s, unsigned index) { Site* n = s->makeNext(c, index); addSite(c, v, n); return n; } Site* growSite(Context* c, Value* v, Site* s, Site** low, Site** high) { if (v->index == 0) { *low = s; *high = growSite(c, v->next, s, 1); return *high; } else { *low = growSite(c, v->next, s, 0); *high = s; return *low; } } bool acceptMatch(Context* c, Site* s, Read*, const SiteMask& mask) { return s->match(c, mask); } bool isHome(Value* v, int frameIndex) { Value* p = v; do { if (p->home == frameIndex) { return true; } p = p->buddy; } while (p != v); return false; } bool acceptForResolve(Context* c, Site* s, Read* read, const SiteMask& mask) { if (acceptMatch(c, s, read, mask) and (not s->frozen(c))) { if (s->type(c) == RegisterOperand) { return c->availableGeneralRegisterCount > ResolveRegisterReserveCount; } else { assert(c, s->match(c, SiteMask(1 << MemoryOperand, 0, AnyFrameIndex))); return isHome(read->value, offsetToFrameIndex (c, static_cast(s)->offset)); } } else { return false; } } Site* pickSourceSite(Context* c, Read* read, Site* target = 0, unsigned* cost = 0, uint8_t typeMask = ~0, bool intersectRead = true, bool includeBuddies = true, bool (*accept)(Context*, Site*, Read*, const SiteMask&) = acceptMatch) { SiteMask mask(typeMask, ~0, AnyFrameIndex); if (intersectRead) { read->intersect(&mask); } Site* site = 0; unsigned copyCost = 0xFFFFFFFF; for (SiteIterator it(c, read->value, includeBuddies); it.hasMore();) { Site* s = it.next(); if (accept(c, s, read, mask)) { unsigned v = s->copyCost(c, target); if (v < copyCost) { site = s; copyCost = v; } } } if (DebugMoves and site and target) { char srcb[256]; site->toString(c, srcb, 256); char dstb[256]; target->toString(c, dstb, 
256); fprintf(stderr, "pick source %s to %s for %p cost %d\n", srcb, dstb, read->value, copyCost); } if (cost) *cost = copyCost; return site; } void move(Context* c, Value* value, Site* src, Site* dst) { src->freeze(c, value); addSite(c, value, dst); src->thaw(c, value); uint8_t tmpTypeMask; uint64_t tmpRegisterMask; c->arch->planMove (1 << src->type(c), src->registerMask(c), 1 << dst->type(c), dst->registerMask(c), &tmpTypeMask, &tmpRegisterMask); SiteMask mask(tmpTypeMask, tmpRegisterMask, AnyFrameIndex); if (not src->match(c, mask)) { // we can't move directly from src to dst on this architecture, so // we need to either pick a difference source or use a temporary removeSite(c, value, dst); SingleRead read(mask, 0); read.value = value; Site* newSrc = pickSourceSite(c, &read); if (newSrc) { src = newSrc; } else { src->freeze(c, value); dst->freeze(c, value); Site* tmp = pickTargetSite(c, &read, true); move(c, value, src, tmp); dst->thaw(c, value); src->thaw(c, value); src = tmp; } addSite(c, value, dst); } if (DebugMoves) { char srcb[256]; src->toString(c, srcb, 256); char dstb[256]; dst->toString(c, dstb, 256); fprintf(stderr, "move %s to %s for %p\n", srcb, dstb, value); } src->freeze(c, value); dst->freeze(c, value); unsigned srcSize; unsigned dstSize; if (value->next == value) { srcSize = BytesPerWord; dstSize = BytesPerWord; } else { srcSize = src->registerSize(c); dstSize = dst->registerSize(c); } if (srcSize == dstSize) { apply(c, Move, srcSize, src, src, dstSize, dst, dst); } else if (srcSize > BytesPerWord) { Site* low, *high, *other = growSite(c, value, dst, &low, &high); other->freeze(c, value->next); apply(c, Move, srcSize, src, src, srcSize, low, high); other->thaw(c, value->next); } else { Site* low, *high, *other = pickOrMoveSite(c, value, src, &low, &high); other->freeze(c, value->next); apply(c, Move, dstSize, low, high, dstSize, dst, dst); other->thaw(c, value->next); } dst->thaw(c, value); src->thaw(c, value); } void asAssemblerOperand(Context* 
c, Site* low, Site* high, Assembler::Operand* result) { low->asAssemblerOperand(c, high, result); } class OperandUnion: public Assembler::Operand { // must be large enough and aligned properly to hold any operand // type (we'd use an actual union type here, except that classes // with constructors cannot be used in a union): uintptr_t padding[4]; }; void apply(Context* c, UnaryOperation op, unsigned s1Size, Site* s1Low, Site* s1High) { assert(c, s1Low->type(c) == s1High->type(c)); OperandType s1Type = s1Low->type(c); OperandUnion s1Union; asAssemblerOperand(c, s1Low, s1High, &s1Union); c->assembler->apply(op, s1Size, s1Type, &s1Union); } void apply(Context* c, BinaryOperation op, unsigned s1Size, Site* s1Low, Site* s1High, unsigned s2Size, Site* s2Low, Site* s2High) { assert(c, s1Low->type(c) == s1High->type(c)); assert(c, s2Low->type(c) == s2High->type(c)); OperandType s1Type = s1Low->type(c); OperandUnion s1Union; asAssemblerOperand(c, s1Low, s1High, &s1Union); OperandType s2Type = s2Low->type(c); OperandUnion s2Union; asAssemblerOperand(c, s2Low, s2High, &s2Union); c->assembler->apply(op, s1Size, s1Type, &s1Union, s2Size, s2Type, &s2Union); } void apply(Context* c, TernaryOperation op, unsigned s1Size, Site* s1Low, Site* s1High, unsigned s2Size, Site* s2Low, Site* s2High, unsigned s3Size, Site* s3Low, Site* s3High) { assert(c, s1Low->type(c) == s1High->type(c)); assert(c, s2Low->type(c) == s2High->type(c)); assert(c, s3Low->type(c) == s3High->type(c)); OperandType s1Type = s1Low->type(c); OperandUnion s1Union; asAssemblerOperand(c, s1Low, s1High, &s1Union); OperandType s2Type = s2Low->type(c); OperandUnion s2Union; asAssemblerOperand(c, s2Low, s2High, &s2Union); OperandType s3Type = s3Low->type(c); OperandUnion s3Union; asAssemblerOperand(c, s3Low, s3High, &s3Union); c->assembler->apply(op, s1Size, s1Type, &s1Union, s2Size, s2Type, &s2Union, s3Size, s3Type, &s3Union); } void addRead(Context* c, Event* e, Value* v, Read* r) { if (DebugReads) { fprintf(stderr, 
"add read %p to %p last %p event %p (%s)\n", r, v, v->lastRead, e, (e ? e->name() : 0)); } r->value = v; if (e) { r->event = e; r->eventNext = e->reads; e->reads = r; ++ e->readCount; } if (v->lastRead) { // if (DebugReads) { // fprintf(stderr, "append %p to %p for %p\n", r, v->lastRead, v); // } v->lastRead->append(c, r); } else { v->reads = r; } v->lastRead = r; } void addRead(Context* c, Event* e, Value* v, const SiteMask& mask, Value* successor = 0) { addRead(c, e, v, read(c, mask, successor)); } void addReads(Context* c, Event* e, Value* v, unsigned size, const SiteMask& lowMask, Value* lowSuccessor, const SiteMask& highMask, Value* highSuccessor) { SingleRead* r = read(c, lowMask, lowSuccessor); addRead(c, e, v, r); if (size > BytesPerWord) { r->high = v->next; addRead(c, e, v->next, highMask, highSuccessor); } } void addReads(Context* c, Event* e, Value* v, unsigned size, const SiteMask& lowMask, const SiteMask& highMask) { addReads(c, e, v, size, lowMask, 0, highMask, 0); } void clean(Context* c, Value* v, unsigned popIndex) { for (SiteIterator it(c, v); it.hasMore();) { Site* s = it.next(); if (not (s->match(c, SiteMask(1 << MemoryOperand, 0, AnyFrameIndex)) and offsetToFrameIndex (c, static_cast(s)->offset) >= popIndex)) { if (false and s->match(c, SiteMask(1 << MemoryOperand, 0, AnyFrameIndex))) { char buffer[256]; s->toString(c, buffer, 256); fprintf(stderr, "remove %s from %p at %d pop offset 0x%x\n", buffer, v, offsetToFrameIndex (c, static_cast(s)->offset), frameIndexToOffset(c, popIndex)); } it.remove(c); } } } void clean(Context* c, Event* e, Stack* stack, Local* locals, Read* reads, unsigned popIndex) { for (FrameIterator it(c, stack, locals); it.hasMore();) { FrameIterator::Element e = it.next(c); clean(c, e.value, popIndex); } for (Read* r = reads; r; r = r->eventNext) { popRead(c, e, r->value); } } CodePromise* codePromise(Context* c, Event* e) { return e->promises = new (c->zone->allocate(sizeof(CodePromise))) CodePromise(c, e->promises); } 
CodePromise* codePromise(Context* c, Promise* offset) { return new (c->zone->allocate(sizeof(CodePromise))) CodePromise(c, offset); } void append(Context* c, Event* e); void saveLocals(Context* c, Event* e) { for (unsigned li = 0; li < c->localFootprint; ++li) { Local* local = e->localsBefore + li; if (local->value) { if (DebugReads) { fprintf(stderr, "local save read %p at %d of %d\n", local->value, local::frameIndex(c, li), totalFrameSize(c)); } addRead(c, e, local->value, SiteMask (1 << MemoryOperand, 0, local::frameIndex(c, li))); } } } class CallEvent: public Event { public: CallEvent(Context* c, Value* address, unsigned flags, TraceHandler* traceHandler, Value* result, unsigned resultSize, Stack* argumentStack, unsigned argumentCount, unsigned stackArgumentFootprint): Event(c), address(address), traceHandler(traceHandler), result(result), returnAddressSurrogate(0), framePointerSurrogate(0), popIndex(0), stackArgumentIndex(0), flags(flags), resultSize(resultSize), stackArgumentFootprint(stackArgumentFootprint) { uint32_t registerMask = c->arch->generalRegisterMask(); if (argumentCount) { assert(c, (flags & Compiler::TailJump) == 0); assert(c, stackArgumentFootprint == 0); Stack* s = argumentStack; unsigned frameIndex = 0; unsigned index = 0; while (true) { SiteMask targetMask; if (index < c->arch->argumentRegisterCount()) { int number = c->arch->argumentRegister(index); if (DebugReads) { fprintf(stderr, "reg %d arg read %p\n", number, s->value); } targetMask = fixedRegisterMask(number); registerMask &= ~(1 << number); } else { if (DebugReads) { fprintf(stderr, "stack %d arg read %p\n", frameIndex, s->value); } targetMask = SiteMask(1 << MemoryOperand, 0, frameIndex); ++ frameIndex; } addRead(c, this, s->value, targetMask); if ((++ index) < argumentCount) { s = s->next; } else { break; } } } if (DebugReads) { fprintf(stderr, "address read %p\n", address); } { bool thunk; uint8_t typeMask; uint64_t planRegisterMask; c->arch->plan ((flags & Compiler::Aligned) ? 
AlignedCall : Call, BytesPerWord, &typeMask, &planRegisterMask, &thunk); assert(c, not thunk); addRead(c, this, address, SiteMask (typeMask, registerMask & planRegisterMask, AnyFrameIndex)); } Stack* stack = stackBefore; if (stackArgumentFootprint) { int footprint = stackArgumentFootprint; int returnAddressIndex; int framePointerIndex; int frameOffset; if (TailCalls and (flags & Compiler::TailJump)) { assert(c, argumentCount == 0); int base = frameBase(c); returnAddressIndex = base + c->arch->returnAddressOffset(); framePointerIndex = base + c->arch->framePointerOffset(); frameOffset = totalFrameSize(c) - c->arch->argumentFootprint(stackArgumentFootprint) - 1; } else { returnAddressIndex = -1; framePointerIndex = -1; frameOffset = -1; } while (footprint > 0) { if (stack->value) { int frameIndex = footprint + frameOffset; if (DebugReads) { fprintf(stderr, "stack arg read %p at %d of %d\n", stack->value, frameIndex, totalFrameSize(c)); } if (static_cast(frameIndex) == returnAddressIndex) { returnAddressSurrogate = stack->value; addRead(c, this, stack->value, generalRegisterMask(c)); } else if (static_cast(frameIndex) == framePointerIndex) { framePointerSurrogate = stack->value; addRead(c, this, stack->value, generalRegisterMask(c)); } else { addRead(c, this, stack->value, SiteMask (1 << MemoryOperand, 0, frameIndex)); } } stack = stack->next; -- footprint; } } if ((not TailCalls) or (flags & Compiler::TailJump) == 0) { stackArgumentIndex = c->localFootprint; if (stackBefore) { stackArgumentIndex += stackBefore->index + 1 - stackArgumentFootprint; } popIndex = c->alignedFrameSize + c->parameterFootprint - c->arch->frameFooterSize() - stackArgumentIndex; assert(c, static_cast(popIndex) >= 0); while (stack) { if (stack->value) { unsigned logicalIndex = local::frameIndex (c, stack->index + c->localFootprint); if (DebugReads) { fprintf(stderr, "stack save read %p at %d of %d\n", stack->value, logicalIndex, totalFrameSize(c)); } addRead(c, this, stack->value, SiteMask (1 
<< MemoryOperand, 0, logicalIndex)); } stack = stack->next; } saveLocals(c, this); } } virtual const char* name() { return "CallEvent"; } virtual void compile(Context* c) { UnaryOperation op; if (TailCalls and (flags & Compiler::TailJump)) { if (flags & Compiler::Aligned) { op = AlignedJump; } else { op = Jump; } assert(c, returnAddressSurrogate == 0 or returnAddressSurrogate->source->type(c) == RegisterOperand); assert(c, framePointerSurrogate == 0 or framePointerSurrogate->source->type(c) == RegisterOperand); int ras; if (returnAddressSurrogate) { returnAddressSurrogate->source->freeze(c, returnAddressSurrogate); ras = static_cast (returnAddressSurrogate->source)->number; } else { ras = NoRegister; } int fps; if (framePointerSurrogate) { framePointerSurrogate->source->freeze(c, framePointerSurrogate); fps = static_cast (framePointerSurrogate->source)->number; } else { fps = NoRegister; } int offset = static_cast(c->arch->argumentFootprint(stackArgumentFootprint)) - static_cast(c->arch->argumentFootprint(c->parameterFootprint)); c->assembler->popFrameForTailCall(c->alignedFrameSize, offset, ras, fps); } else if (flags & Compiler::Aligned) { op = AlignedCall; } else { op = Call; } apply(c, op, BytesPerWord, address->source, address->source); if (traceHandler) { traceHandler->handleTrace(codePromise(c, c->assembler->offset()), stackArgumentIndex); } if (TailCalls) { if (flags & Compiler::TailJump) { if (returnAddressSurrogate) { returnAddressSurrogate->source->thaw(c, returnAddressSurrogate); } if (framePointerSurrogate) { framePointerSurrogate->source->thaw(c, framePointerSurrogate); } } else { unsigned footprint = c->arch->argumentFootprint (stackArgumentFootprint); if (footprint > c->arch->stackAlignmentInWords()) { c->assembler->adjustFrame (footprint - c->arch->stackAlignmentInWords()); } } } clean(c, this, stackBefore, localsBefore, reads, popIndex); if (resultSize and live(result)) { addSite(c, result, registerSite(c, c->arch->returnLow())); if (resultSize > 
BytesPerWord and live(result->next)) { addSite(c, result->next, registerSite(c, c->arch->returnHigh())); } } } virtual bool allExits() { return (flags & Compiler::TailJump) != 0; } Value* address; TraceHandler* traceHandler; Value* result; Value* returnAddressSurrogate; Value* framePointerSurrogate; unsigned popIndex; unsigned stackArgumentIndex; unsigned flags; unsigned resultSize; unsigned stackArgumentFootprint; }; void appendCall(Context* c, Value* address, unsigned flags, TraceHandler* traceHandler, Value* result, unsigned resultSize, Stack* argumentStack, unsigned argumentCount, unsigned stackArgumentFootprint) { append(c, new (c->zone->allocate(sizeof(CallEvent))) CallEvent(c, address, flags, traceHandler, result, resultSize, argumentStack, argumentCount, stackArgumentFootprint)); } bool unreachable(Event* event) { for (Link* p = event->predecessors; p; p = p->nextPredecessor) { if (not p->predecessor->allExits()) return false; } return event->predecessors != 0; } class ReturnEvent: public Event { public: ReturnEvent(Context* c, unsigned size, Value* value): Event(c), value(value) { if (value) { addReads(c, this, value, size, fixedRegisterMask(c->arch->returnLow()), fixedRegisterMask(c->arch->returnHigh())); } } virtual const char* name() { return "ReturnEvent"; } virtual void compile(Context* c) { for (Read* r = reads; r; r = r->eventNext) { popRead(c, this, r->value); } if (not unreachable(this)) { c->assembler->popFrameAndPopArgumentsAndReturn (c->arch->argumentFootprint(c->parameterFootprint)); } } Value* value; }; void appendReturn(Context* c, unsigned size, Value* value) { append(c, new (c->zone->allocate(sizeof(ReturnEvent))) ReturnEvent(c, size, value)); } void addBuddy(Value* original, Value* buddy) { buddy->buddy = original; Value* p = original; while (p->buddy != original) p = p->buddy; p->buddy = buddy; //buddy->type = original->type; if (DebugBuddies) { fprintf(stderr, "add buddy %p to", buddy); for (Value* p = buddy->buddy; p != buddy; p = 
p->buddy) { fprintf(stderr, " %p", p); } fprintf(stderr, "\n"); } } void maybeMove(Context* c, BinaryOperation type, unsigned srcSize, unsigned srcSelectSize, Value* src, unsigned dstSize, Value* dst, const SiteMask& dstMask) { Read* read = live(dst); bool isStore = read == 0; Site* target; if (dst->target) { target = dst->target; } else if (isStore) { return; } else { target = pickTargetSite(c, read); } unsigned cost = src->source->copyCost(c, target); if (srcSelectSize < dstSize) cost = 1; if (cost) { bool useTemporary = ((target->type(c) == MemoryOperand and src->source->type(c) == MemoryOperand) or (srcSelectSize < dstSize and target->type(c) != RegisterOperand)); src->source->freeze(c, src); addSite(c, dst, target); src->source->thaw(c, src); bool addOffset = srcSize != srcSelectSize and c->arch->bigEndian() and src->source->type(c) == MemoryOperand; if (addOffset) { static_cast(src->source)->offset += (srcSize - srcSelectSize); } target->freeze(c, dst); if (target->match(c, dstMask) and not useTemporary) { if (DebugMoves) { char srcb[256]; src->source->toString(c, srcb, 256); char dstb[256]; target->toString(c, dstb, 256); fprintf(stderr, "move %s to %s for %p to %p\n", srcb, dstb, src, dst); } src->source->freeze(c, src); apply(c, type, min(srcSelectSize, dstSize), src->source, src->source, dstSize, target, target); src->source->thaw(c, src); } else { // pick a temporary register which is valid as both a // destination and a source for the moves we need to perform: bool thunk; uint8_t srcTypeMask; uint64_t srcRegisterMask; c->arch->planSource(type, dstSize, &srcTypeMask, &srcRegisterMask, dstSize, &thunk); assert(c, dstMask.typeMask & srcTypeMask & (1 << RegisterOperand)); Site* tmpTarget = freeRegisterSite (c, dstMask.registerMask & srcRegisterMask); src->source->freeze(c, src); addSite(c, dst, tmpTarget); tmpTarget->freeze(c, dst); if (DebugMoves) { char srcb[256]; src->source->toString(c, srcb, 256); char dstb[256]; tmpTarget->toString(c, dstb, 256); 
fprintf(stderr, "move %s to %s for %p to %p\n", srcb, dstb, src, dst); } apply(c, type, srcSelectSize, src->source, src->source, dstSize, tmpTarget, tmpTarget); tmpTarget->thaw(c, dst); src->source->thaw(c, src); if (useTemporary or isStore) { if (DebugMoves) { char srcb[256]; tmpTarget->toString(c, srcb, 256); char dstb[256]; target->toString(c, dstb, 256); fprintf(stderr, "move %s to %s for %p to %p\n", srcb, dstb, src, dst); } tmpTarget->freeze(c, dst); apply(c, Move, dstSize, tmpTarget, tmpTarget, dstSize, target, target); tmpTarget->thaw(c, dst); if (isStore) { removeSite(c, dst, tmpTarget); } } else { removeSite(c, dst, target); } } target->thaw(c, dst); if (addOffset) { static_cast(src->source)->offset -= (srcSize - srcSelectSize); } } else { target = src->source; assert(c, src); assert(c, dst); addBuddy(src, dst); if (DebugMoves) { char dstb[256]; target->toString(c, dstb, 256); fprintf(stderr, "null move in %s for %p to %p\n", dstb, src, dst); } } if (isStore) { removeSite(c, dst, target); } } Value* value(Context* c, ValueType type, Site* site = 0, Site* target = 0) { return new (c->zone->allocate(sizeof(Value))) Value(site, target, type); } void grow(Context* c, Value* v) { assert(c, v->next == v); Value* next = value(c, v->type); v->next = next; next->next = v; next->index = 1; } void split(Context* c, Value* v) { grow(c, v); for (SiteIterator it(c, v); it.hasMore();) { Site* s = it.next(); removeSite(c, v, s); addSite(c, v, s->copyLow(c)); addSite(c, v->next, s->copyHigh(c)); } } void maybeSplit(Context* c, Value* v) { if (v->next == v) { split(c, v); } } class MoveEvent: public Event { public: MoveEvent(Context* c, BinaryOperation type, unsigned srcSize, unsigned srcSelectSize, Value* src, unsigned dstSize, Value* dst, const SiteMask& srcLowMask, const SiteMask& srcHighMask): Event(c), type(type), srcSize(srcSize), srcSelectSize(srcSelectSize), src(src), dstSize(dstSize), dst(dst) { assert(c, srcSelectSize <= srcSize); bool noop = srcSelectSize >= 
dstSize; if (dstSize > BytesPerWord) { grow(c, dst); } if (srcSelectSize > BytesPerWord) { maybeSplit(c, src); } addReads(c, this, src, srcSelectSize, srcLowMask, noop ? dst : 0, srcHighMask, noop and dstSize > BytesPerWord ? dst->next : 0); } virtual const char* name() { return "MoveEvent"; } virtual void compile(Context* c) { uint8_t dstTypeMask; uint64_t dstRegisterMask; c->arch->planDestination (type, srcSelectSize, 1 << src->source->type(c), (static_cast(src->next->source->registerMask(c)) << 32) | static_cast(src->source->registerMask(c)), dstSize, &dstTypeMask, &dstRegisterMask); SiteMask dstLowMask(dstTypeMask, dstRegisterMask, AnyFrameIndex); SiteMask dstHighMask(dstTypeMask, dstRegisterMask >> 32, AnyFrameIndex); if (srcSelectSize <= BytesPerWord and dstSize <= BytesPerWord) { maybeMove(c, type, srcSize, srcSelectSize, src, dstSize, dst, dstLowMask); } else if (srcSelectSize == dstSize) { maybeMove(c, Move, BytesPerWord, BytesPerWord, src, BytesPerWord, dst, dstLowMask); maybeMove(c, Move, BytesPerWord, BytesPerWord, src->next, BytesPerWord, dst->next, dstHighMask); } else if (srcSize > BytesPerWord) { assert(c, dstSize == BytesPerWord); maybeMove(c, Move, BytesPerWord, BytesPerWord, src, BytesPerWord, dst, dstLowMask); } else { assert(c, srcSize == BytesPerWord); assert(c, srcSelectSize == BytesPerWord); if (dst->next->target or live(dst->next)) { assert(c, dstLowMask.typeMask & (1 << RegisterOperand)); Site* low = freeRegisterSite(c, dstLowMask.registerMask); src->source->freeze(c, src); addSite(c, dst, low); low->freeze(c, dst); if (DebugMoves) { char srcb[256]; src->source->toString(c, srcb, 256); char dstb[256]; low->toString(c, dstb, 256); fprintf(stderr, "move %s to %s for %p\n", srcb, dstb, src); } apply(c, Move, BytesPerWord, src->source, src->source, BytesPerWord, low, low); low->thaw(c, dst); src->source->thaw(c, src); assert(c, dstHighMask.typeMask & (1 << RegisterOperand)); Site* high = freeRegisterSite(c, dstHighMask.registerMask); 
low->freeze(c, dst); addSite(c, dst->next, high); high->freeze(c, dst->next); if (DebugMoves) { char srcb[256]; low->toString(c, srcb, 256); char dstb[256]; high->toString(c, dstb, 256); fprintf(stderr, "extend %s to %s for %p %p\n", srcb, dstb, dst, dst->next); } apply(c, Move, BytesPerWord, low, low, dstSize, low, high); high->thaw(c, dst->next); low->thaw(c, dst); } else { maybeMove(c, Move, BytesPerWord, BytesPerWord, src, BytesPerWord, dst, dstLowMask); } } for (Read* r = reads; r; r = r->eventNext) { popRead(c, this, r->value); } } BinaryOperation type; unsigned srcSize; unsigned srcSelectSize; Value* src; unsigned dstSize; Value* dst; }; void appendMove(Context* c, BinaryOperation type, unsigned srcSize, unsigned srcSelectSize, Value* src, unsigned dstSize, Value* dst) { bool thunk; uint8_t srcTypeMask; uint64_t srcRegisterMask; c->arch->planSource (type, srcSelectSize, &srcTypeMask, &srcRegisterMask, dstSize, &thunk); assert(c, not thunk); append(c, new (c->zone->allocate(sizeof(MoveEvent))) MoveEvent (c, type, srcSize, srcSelectSize, src, dstSize, dst, SiteMask(srcTypeMask, srcRegisterMask, AnyFrameIndex), SiteMask(srcTypeMask, srcRegisterMask >> 32, AnyFrameIndex))); } ConstantSite* findConstantSite(Context* c, Value* v) { for (SiteIterator it(c, v); it.hasMore();) { Site* s = it.next(); if (s->type(c) == ConstantOperand) { return static_cast(s); } } return 0; } class CompareEvent: public Event { public: CompareEvent(Context* c, BinaryOperation type, unsigned size, Value* first, Value* second, const SiteMask& firstMask, const SiteMask& secondMask): Event(c), type(type), size(size), first(first), second(second) { assert(c, type != FloatCompare or (first->type == ValueFloat and first->type == ValueFloat)); addReads(c, this, first, size, firstMask, firstMask); addReads(c, this, second, size, secondMask, secondMask); } virtual const char* name() { return "CompareEvent"; } virtual void compile(Context* c) { ConstantSite* firstConstant = findConstantSite(c, 
first); ConstantSite* secondConstant = findConstantSite(c, second); if (firstConstant and secondConstant) { int64_t d = firstConstant->value->value() - secondConstant->value->value(); if (d < 0) { c->constantCompare = CompareLess; } else if (d > 0) { c->constantCompare = CompareGreater; } else { c->constantCompare = CompareEqual; } } else { c->constantCompare = CompareNone; apply(c, type, size, first->source, first->source, size, second->source, second->source); } for (Read* r = reads; r; r = r->eventNext) { popRead(c, this, r->value); } } BinaryOperation type; unsigned size; Value* first; Value* second; }; void appendCompare(Context* c, BinaryOperation op, unsigned size, Value* first, Value* second) { bool thunk; uint8_t firstTypeMask; uint64_t firstRegisterMask; uint8_t secondTypeMask; uint64_t secondRegisterMask; c->arch->planSource (op, size, &firstTypeMask, &firstRegisterMask, size, &thunk); assert(c, not thunk); // todo c->arch->planDestination (op, size, 0, 0, size, &secondTypeMask, &secondRegisterMask); append(c, new (c->zone->allocate(sizeof(CompareEvent))) CompareEvent (c, op, size, first, second, SiteMask(firstTypeMask, firstRegisterMask, AnyFrameIndex), SiteMask(secondTypeMask, secondRegisterMask, AnyFrameIndex))); } void preserve(Context* c, Value* v, Site* s, Read* r) { s->freeze(c, v); move(c, v, s, pickTargetSite(c, r)); s->thaw(c, v); } Site* getTarget(Context* c, Value* value, Value* result, const SiteMask& resultMask) { Site* s; Value* v; Read* r = liveNext(c, value); if (value->source->match (c, static_cast(resultMask)) and (r == 0 or value->source->loneMatch (c, static_cast(resultMask)))) { s = value->source; v = value; if (r and not hasMoreThanOneSite(c, v)) { preserve(c, v, s, r); } } else { SingleRead r(resultMask, 0); s = pickTargetSite(c, &r, true); v = result; addSite(c, result, s); } removeSite(c, v, s); s->freeze(c, v); return s; } Site* source(Value* v, Site* site) { return v ? 
v->source : site; } void freezeSource(Context* c, unsigned size, Value* v) { v->source->freeze(c, v); if (size > BytesPerWord) { v->next->source->freeze(c, v->next); } } void thawSource(Context* c, unsigned size, Value* v) { v->source->thaw(c, v); if (size > BytesPerWord) { v->next->source->thaw(c, v->next); } } class CombineEvent: public Event { public: CombineEvent(Context* c, TernaryOperation type, unsigned firstSize, Value* first, unsigned secondSize, Value* second, unsigned resultSize, Value* result, const SiteMask& firstLowMask, const SiteMask& firstHighMask, const SiteMask& secondLowMask, const SiteMask& secondHighMask): Event(c), type(type), firstSize(firstSize), first(first), secondSize(secondSize), second(second), resultSize(resultSize), result(result) { addReads(c, this, first, firstSize, firstLowMask, firstHighMask); if (resultSize > BytesPerWord) { grow(c, result); } bool condensed = c->arch->alwaysCondensed(type); addReads(c, this, second, secondSize, secondLowMask, condensed ? result : 0, secondHighMask, condensed ? 
result->next : 0); } virtual const char* name() { return "CombineEvent"; } virtual void compile(Context* c) { assert(c, first->source->type(c) == first->next->source->type(c)); assert(c, second->source->type(c) == second->next->source->type(c)); freezeSource(c, firstSize, first); uint8_t cTypeMask; uint64_t cRegisterMask; c->arch->planDestination (type, firstSize, 1 << first->source->type(c), (static_cast(first->next->source->registerMask(c)) << 32) | static_cast(first->source->registerMask(c)), secondSize, 1 << second->source->type(c), (static_cast(second->next->source->registerMask(c)) << 32) | static_cast(second->source->registerMask(c)), resultSize, &cTypeMask, &cRegisterMask); SiteMask resultLowMask(cTypeMask, cRegisterMask, AnyFrameIndex); SiteMask resultHighMask(cTypeMask, cRegisterMask >> 32, AnyFrameIndex); Site* low = getTarget(c, second, result, resultLowMask); unsigned lowSize = low->registerSize(c); Site* high = (resultSize > lowSize ? getTarget(c, second->next, result->next, resultHighMask) : low); // fprintf(stderr, "combine %p and %p into %p\n", first, second, result); apply(c, type, firstSize, first->source, source(first->next, first->source), secondSize, second->source, source(second->next, second->source), resultSize, low, high); thawSource(c, firstSize, first); for (Read* r = reads; r; r = r->eventNext) { popRead(c, this, r->value); } low->thaw(c, second); if (resultSize > lowSize) { high->thaw(c, second->next); } if (live(result)) { addSite(c, result, low); if (resultSize > lowSize and live(result->next)) { addSite(c, result->next, high); } } } TernaryOperation type; unsigned firstSize; Value* first; unsigned secondSize; Value* second; unsigned resultSize; Value* result; }; void removeBuddy(Context* c, Value* v) { if (v->buddy != v) { if (DebugBuddies) { fprintf(stderr, "remove buddy %p from", v); for (Value* p = v->buddy; p != v; p = p->buddy) { fprintf(stderr, " %p", p); } fprintf(stderr, "\n"); } assert(c, v->buddy); Value* next = v->buddy; 
v->buddy = v; Value* p = next; while (p->buddy != v) p = p->buddy; p->buddy = next; assert(c, p->buddy); if (not live(next)) { clearSites(c, next); } if (not live(v)) { clearSites(c, v); } } } Site* copy(Context* c, Site* s) { Site* start = 0; Site* end = 0; for (; s; s = s->next) { Site* n = s->copy(c); if (end) { end->next = n; } else { start = n; } end = n; } return start; } class Snapshot { public: Snapshot(Context* c, Value* value, Snapshot* next): value(value), buddy(value->buddy), sites(copy(c, value->sites)), next(next) { } Value* value; Value* buddy; Site* sites; Snapshot* next; }; Snapshot* snapshot(Context* c, Value* value, Snapshot* next) { if (DebugControl) { char buffer[256]; sitesToString(c, value->sites, buffer, 256); fprintf(stderr, "snapshot %p buddy %p sites %s\n", value, value->buddy, buffer); } return new (c->zone->allocate(sizeof(Snapshot))) Snapshot(c, value, next); } Snapshot* makeSnapshots(Context* c, Value* value, Snapshot* next) { next = snapshot(c, value, next); for (Value* p = value->buddy; p != value; p = p->buddy) { next = snapshot(c, p, next); } return next; } Stack* stack(Context* c, Value* value, Stack* next) { return new (c->zone->allocate(sizeof(Stack))) Stack(next ? 
next->index + 1 : 0, value, next); } Value* maybeBuddy(Context* c, Value* v); Value* pushWord(Context* c, Value* v) { if (v) { v = maybeBuddy(c, v); } Stack* s = stack(c, v, c->stack); if (DebugFrame) { fprintf(stderr, "push %p\n", v); } if (v) { v->home = frameIndex(c, s->index + c->localFootprint); } c->stack = s; return v; } Value* push(Context* c, unsigned footprint, Value* v, bool reverse) { assert(c, footprint); bool lowFirst = reverse xor c->arch->bigEndian(); Value* low = v; if (lowFirst) { v = pushWord(c, v); } Value* high; if (footprint > 1) { assert(c, footprint == 2); if (BytesPerWord == 4 and low->next == v) { split(c, low); } high = pushWord(c, low->next); } else if (v) { high = v->next; } else { high = 0; } if (not lowFirst) { v = pushWord(c, v); } if (v) { v->next = high; high->next = v; high->index = 1; } return v; } void popWord(Context* c) { Stack* s = c->stack; assert(c, s->value == 0 or s->value->home >= 0); if (DebugFrame) { fprintf(stderr, "pop %p\n", s->value); } c->stack = s->next; } Value* pop(Context* c, unsigned footprint) { assert(c, footprint); Stack* s = 0; bool bigEndian = c->arch->bigEndian(); if (bigEndian) { s = c->stack; } if (footprint > 1) { assert(c, footprint == 2); #ifndef NDEBUG Stack* low; Stack* high; if (bigEndian) { low = c->stack; high = low->next; } else { high = c->stack; low = high->next; } assert(c, low->value->next == high->value and ((BytesPerWord == 8) xor (low->value->next != 0))); #endif // not NDEBUG popWord(c); } if (not bigEndian) { s = c->stack; } popWord(c); return s->value; } Value* storeLocal(Context* c, unsigned footprint, Value* v, unsigned index, bool copy) { assert(c, index + footprint <= c->localFootprint); if (copy) { unsigned sizeInBytes = sizeof(Local) * c->localFootprint; Local* newLocals = static_cast(c->zone->allocate(sizeInBytes)); memcpy(newLocals, c->locals, sizeInBytes); c->locals = newLocals; } Value* high; if (footprint > 1) { assert(c, footprint == 2); unsigned highIndex; unsigned 
lowIndex; if (c->arch->bigEndian()) { highIndex = index + 1; lowIndex = index; } else { lowIndex = index + 1; highIndex = index; } if (BytesPerWord == 4) { assert(c, v->next); high = storeLocal(c, 1, v->next, highIndex, false); } else { high = 0; } index = lowIndex; } else { high = v->next; } v = maybeBuddy(c, v); v->next = high; high->index = 1; Local* local = c->locals + index; local->value = v; if (DebugFrame) { fprintf(stderr, "store local %p at %d\n", local->value, index); } local->value->home = frameIndex(c, index); return v; } Value* loadLocal(Context* c, unsigned footprint, unsigned index) { assert(c, index + footprint <= c->localFootprint); if (footprint > 1) { assert(c, footprint == 2); if (not c->arch->bigEndian()) { ++ index; } } assert(c, c->locals[index].value); assert(c, c->locals[index].value->home >= 0); if (DebugFrame) { fprintf(stderr, "load local %p at %d\n", c->locals[index].value, index); } return c->locals[index].value; } void appendCombine(Context* c, TernaryOperation type, unsigned firstSize, Value* first, unsigned secondSize, Value* second, unsigned resultSize, Value* result) { bool thunk; uint8_t firstTypeMask; uint64_t firstRegisterMask; uint8_t secondTypeMask; uint64_t secondRegisterMask; c->arch->planSource(type, firstSize, &firstTypeMask, &firstRegisterMask, secondSize, &secondTypeMask, &secondRegisterMask, resultSize, &thunk); if (thunk) { Stack* oldStack = c->stack; local::push(c, ceiling(secondSize, BytesPerWord), second, false); local::push(c, ceiling(firstSize, BytesPerWord), first, false); Stack* argumentStack = c->stack; c->stack = oldStack; appendCall (c, value (c, ValueGeneral, constantSite (c, c->client->getThunk(type, firstSize, resultSize))), 0, 0, result, resultSize, argumentStack, ceiling(secondSize, BytesPerWord) + ceiling(firstSize, BytesPerWord), 0); } else { append (c, new (c->zone->allocate(sizeof(CombineEvent))) CombineEvent (c, type, firstSize, first, secondSize, second, resultSize, result, SiteMask(firstTypeMask, 
firstRegisterMask, AnyFrameIndex), SiteMask(firstTypeMask, firstRegisterMask >> 32, AnyFrameIndex), SiteMask(secondTypeMask, secondRegisterMask, AnyFrameIndex), SiteMask(secondTypeMask, secondRegisterMask >> 32, AnyFrameIndex))); } } class TranslateEvent: public Event { public: TranslateEvent(Context* c, BinaryOperation type, unsigned valueSize, Value* value, unsigned resultSize, Value* result, const SiteMask& valueLowMask, const SiteMask& valueHighMask): Event(c), type(type), valueSize(valueSize), resultSize(resultSize), value(value), result(result) { bool condensed = c->arch->alwaysCondensed(type); if (resultSize > BytesPerWord) { grow(c, result); } addReads(c, this, value, valueSize, valueLowMask, condensed ? result : 0, valueHighMask, condensed ? result->next : 0); } virtual const char* name() { return "TranslateEvent"; } virtual void compile(Context* c) { uint8_t bTypeMask; uint64_t bRegisterMask; c->arch->planDestination (type, valueSize, 1 << value->source->type(c), (static_cast(value->next->source->registerMask(c)) << 32) | static_cast(value->source->registerMask(c)), resultSize, &bTypeMask, &bRegisterMask); SiteMask resultLowMask(bTypeMask, bRegisterMask, AnyFrameIndex); SiteMask resultHighMask(bTypeMask, bRegisterMask >> 32, AnyFrameIndex); Site* low = getTarget(c, value, result, resultLowMask); unsigned lowSize = low->registerSize(c); Site* high = (resultSize > lowSize ? 
getTarget(c, value->next, result->next, resultHighMask) : low); apply(c, type, valueSize, value->source, source(value->next, value->source), resultSize, low, high); for (Read* r = reads; r; r = r->eventNext) { popRead(c, this, r->value); } low->thaw(c, value); if (resultSize > lowSize) { high->thaw(c, value->next); } if (live(result)) { addSite(c, result, low); if (resultSize > lowSize and live(result->next)) { addSite(c, result->next, high); } } } BinaryOperation type; unsigned valueSize; unsigned resultSize; Value* value; Value* result; Read* resultRead; SiteMask resultLowMask; SiteMask resultHighMask; }; void appendTranslate(Context* c, BinaryOperation type, unsigned firstSize, Value* first, unsigned resultSize, Value* result) { bool thunk; uint8_t firstTypeMask; uint64_t firstRegisterMask; c->arch->planSource(type, firstSize, &firstTypeMask, &firstRegisterMask, resultSize, &thunk); if (thunk) { Stack* oldStack = c->stack; local::push(c, ceiling(firstSize, BytesPerWord), first, false); Stack* argumentStack = c->stack; c->stack = oldStack; appendCall (c, value (c, ValueGeneral, constantSite (c, c->client->getThunk(type, firstSize, resultSize))), 0, 0, result, resultSize, argumentStack, ceiling(firstSize, BytesPerWord), 0); } else { append(c, new (c->zone->allocate(sizeof(TranslateEvent))) TranslateEvent (c, type, firstSize, first, resultSize, result, SiteMask(firstTypeMask, firstRegisterMask, AnyFrameIndex), SiteMask(firstTypeMask, firstRegisterMask >> 32, AnyFrameIndex))); } } class BarrierEvent: public Event { public: BarrierEvent(Context* c, Operation op): Event(c), op(op) { } virtual const char* name() { return "BarrierEvent"; } virtual void compile(Context* c) { c->assembler->apply(op); } Operation op; }; void appendBarrier(Context* c, Operation op) { append(c, new (c->zone->allocate(sizeof(BarrierEvent))) BarrierEvent(c, op)); } class MemoryEvent: public Event { public: MemoryEvent(Context* c, Value* base, int displacement, Value* index, unsigned scale, 
Value* result): Event(c), base(base), displacement(displacement), index(index), scale(scale), result(result) { addRead(c, this, base, generalRegisterMask(c)); if (index) { addRead(c, this, index, generalRegisterOrConstantMask(c)); } } virtual const char* name() { return "MemoryEvent"; } virtual void compile(Context* c) { int indexRegister; int displacement = this->displacement; unsigned scale = this->scale; if (index) { ConstantSite* constant = findConstantSite(c, index); if (constant) { indexRegister = NoRegister; displacement += (constant->value->value() * scale); scale = 1; } else { assert(c, index->source->type(c) == RegisterOperand); indexRegister = static_cast(index->source)->number; } } else { indexRegister = NoRegister; } assert(c, base->source->type(c) == RegisterOperand); int baseRegister = static_cast(base->source)->number; popRead(c, this, base); if (index) { if (BytesPerWord == 8 and indexRegister != NoRegister) { apply(c, Move, 4, index->source, index->source, 8, index->source, index->source); } popRead(c, this, index); } Site* site = memorySite (c, baseRegister, displacement, indexRegister, scale); Site* low; if (result->next) { Site* high = site->copyHigh(c); low = site->copyLow(c); result->next->target = high; addSite(c, result->next, high); } else { low = site; } result->target = low; addSite(c, result, low); } Value* base; int displacement; Value* index; unsigned scale; Value* result; }; void appendMemory(Context* c, Value* base, int displacement, Value* index, unsigned scale, Value* result) { append(c, new (c->zone->allocate(sizeof(MemoryEvent))) MemoryEvent(c, base, displacement, index, scale, result)); } class BranchEvent: public Event { public: BranchEvent(Context* c, UnaryOperation type, Value* address, bool exit): Event(c), type(type), address(address), exit(exit) { bool thunk; uint8_t typeMask; uint64_t registerMask; c->arch->plan(type, BytesPerWord, &typeMask, ®isterMask, &thunk); assert(c, not thunk); addRead(c, this, address, 
SiteMask(typeMask, registerMask, AnyFrameIndex)); } virtual const char* name() { return "BranchEvent"; } virtual void compile(Context* c) { bool jump; UnaryOperation type = this->type; if (type != Jump) { switch (c->constantCompare) { case CompareLess: switch (type) { case JumpIfLess: case JumpIfLessOrEqual: case JumpIfNotEqual: jump = true; type = Jump; break; default: jump = false; } break; case CompareGreater: switch (type) { case JumpIfGreater: case JumpIfGreaterOrEqual: case JumpIfNotEqual: jump = true; type = Jump; break; default: jump = false; } break; case CompareEqual: switch (type) { case JumpIfEqual: case JumpIfLessOrEqual: case JumpIfGreaterOrEqual: jump = true; type = Jump; break; default: jump = false; } break; case CompareNone: jump = true; break; default: abort(c); } } else { jump = true; } if (jump and not unreachable(this)) { apply(c, type, BytesPerWord, address->source, address->source); } popRead(c, this, address); } virtual bool isBranch() { return true; } virtual bool allExits() { return type == Jump and (exit or unreachable(this)); } UnaryOperation type; Value* address; bool exit; }; void appendBranch(Context* c, UnaryOperation type, Value* address, bool exit = false) { append(c, new (c->zone->allocate(sizeof(BranchEvent))) BranchEvent(c, type, address, exit)); } class BoundsCheckEvent: public Event { public: BoundsCheckEvent(Context* c, Value* object, unsigned lengthOffset, Value* index, intptr_t handler): Event(c), object(object), lengthOffset(lengthOffset), index(index), handler(handler) { addRead(c, this, object, generalRegisterMask(c)); addRead(c, this, index, generalRegisterOrConstantMask(c)); } virtual const char* name() { return "BoundsCheckEvent"; } virtual void compile(Context* c) { Assembler* a = c->assembler; ConstantSite* constant = findConstantSite(c, index); CodePromise* nextPromise = codePromise (c, static_cast(0)); CodePromise* outOfBoundsPromise = 0; if (constant) { expect(c, constant->value->value() >= 0); } else { 
outOfBoundsPromise = codePromise(c, static_cast(0)); Site* zero = constantSite(c, resolved(c, 0)); apply(c, Compare, 4, zero, zero, 4, index->source, index->source); Assembler::Constant outOfBoundsConstant(outOfBoundsPromise); a->apply (JumpIfLess, BytesPerWord, ConstantOperand, &outOfBoundsConstant); } assert(c, object->source->type(c) == RegisterOperand); MemorySite length(static_cast(object->source)->number, lengthOffset, NoRegister, 1); length.acquired = true; apply(c, Compare, 4, index->source, index->source, 4, &length, &length); Assembler::Constant nextConstant(nextPromise); a->apply(JumpIfGreater, BytesPerWord, ConstantOperand, &nextConstant); if (constant == 0) { outOfBoundsPromise->offset = a->offset(); } Assembler::Constant handlerConstant(resolved(c, handler)); a->apply(Call, BytesPerWord, ConstantOperand, &handlerConstant); nextPromise->offset = a->offset(); popRead(c, this, object); popRead(c, this, index); } Value* object; unsigned lengthOffset; Value* index; intptr_t handler; }; void appendBoundsCheck(Context* c, Value* object, unsigned lengthOffset, Value* index, intptr_t handler) { append(c, new (c->zone->allocate(sizeof(BoundsCheckEvent))) BoundsCheckEvent(c, object, lengthOffset, index, handler)); } class FrameSiteEvent: public Event { public: FrameSiteEvent(Context* c, Value* value, int index): Event(c), value(value), index(index) { } virtual const char* name() { return "FrameSiteEvent"; } virtual void compile(Context* c) { if (live(value)) { addSite(c, value, frameSite(c, index)); } } Value* value; int index; }; void appendFrameSite(Context* c, Value* value, int index) { append(c, new (c->zone->allocate(sizeof(FrameSiteEvent))) FrameSiteEvent(c, value, index)); } unsigned frameFootprint(Context* c, Stack* s) { return c->localFootprint + (s ? 
(s->index + 1) : 0); } void visit(Context* c, Link* link) { // fprintf(stderr, "visit link from %d to %d fork %p junction %p\n", // link->predecessor->logicalInstruction->index, // link->successor->logicalInstruction->index, // link->forkState, // link->junctionState); ForkState* forkState = link->forkState; if (forkState) { for (unsigned i = 0; i < forkState->readCount; ++i) { ForkElement* p = forkState->elements + i; Value* v = p->value; v->reads = p->read->nextTarget(); // fprintf(stderr, "next read %p for %p from %p\n", v->reads, v, p->read); if (not live(v)) { clearSites(c, v); } } } JunctionState* junctionState = link->junctionState; if (junctionState) { for (unsigned i = 0; i < junctionState->frameFootprint; ++i) { StubReadPair* p = junctionState->reads + i; if (p->value and p->value->reads) { assert(c, p->value->reads == p->read); popRead(c, 0, p->value); } } } } class BuddyEvent: public Event { public: BuddyEvent(Context* c, Value* original, Value* buddy): Event(c), original(original), buddy(buddy) { addRead(c, this, original, SiteMask(~0, ~0, AnyFrameIndex)); } virtual const char* name() { return "BuddyEvent"; } virtual void compile(Context* c) { // fprintf(stderr, "original %p buddy %p\n", original, buddy); assert(c, hasSite(c, original)); assert(c, original); assert(c, buddy); addBuddy(original, buddy); popRead(c, this, original); } Value* original; Value* buddy; }; void appendBuddy(Context* c, Value* original, Value* buddy) { append(c, new (c->zone->allocate(sizeof(BuddyEvent))) BuddyEvent(c, original, buddy)); } class SaveLocalsEvent: public Event { public: SaveLocalsEvent(Context* c): Event(c) { saveLocals(c, this); } virtual const char* name() { return "SaveLocalsEvent"; } virtual void compile(Context* c) { for (Read* r = reads; r; r = r->eventNext) { popRead(c, this, r->value); } } }; void appendSaveLocals(Context* c) { append(c, new (c->zone->allocate(sizeof(SaveLocalsEvent))) SaveLocalsEvent(c)); } class CleanLocalsEvent: public Event { public: 
CleanLocalsEvent(Context* c): Event(c) { } virtual const char* name() { return "CleanLocalsEvent"; } virtual void compile(Context* c) { for (FrameIterator it(c, 0, c->locals); it.hasMore();) { FrameIterator::Element e = it.next(c); clean(c, e.value, 0); } } }; void appendCleanLocals(Context* c) { append(c, new (c->zone->allocate(sizeof(CleanLocalsEvent))) CleanLocalsEvent(c)); } class DummyEvent: public Event { public: DummyEvent(Context* c): Event(c) { } virtual const char* name() { return "DummyEvent"; } virtual void compile(Context*) { } }; void appendDummy(Context* c) { Stack* stack = c->stack; Local* locals = c->locals; LogicalInstruction* i = c->logicalCode[c->logicalIp]; c->stack = i->stack; c->locals = i->locals; append(c, new (c->zone->allocate(sizeof(DummyEvent))) DummyEvent(c)); c->stack = stack; c->locals = locals; } void append(Context* c, Event* e) { LogicalInstruction* i = c->logicalCode[c->logicalIp]; if (c->stack != i->stack or c->locals != i->locals) { appendDummy(c); } if (DebugAppend) { fprintf(stderr, " -- append %s at %d with %d stack before\n", e->name(), e->logicalInstruction->index, c->stack ? 
c->stack->index + 1 : 0); } if (c->lastEvent) { c->lastEvent->next = e; } else { c->firstEvent = e; } c->lastEvent = e; Event* p = c->predecessor; if (p) { if (DebugAppend) { fprintf(stderr, "%d precedes %d\n", p->logicalInstruction->index, e->logicalInstruction->index); } Link* link = local::link (c, p, e->predecessors, e, p->successors, c->forkState); e->predecessors = link; p->successors = link; } c->forkState = 0; c->predecessor = e; if (e->logicalInstruction->firstEvent == 0) { e->logicalInstruction->firstEvent = e; } e->logicalInstruction->lastEvent = e; } Site* readSource(Context* c, Read* r) { Value* v = r->value; if (DebugReads) { char buffer[1024]; sitesToString(c, v, buffer, 1024); fprintf(stderr, "read source for %p from %s\n", v, buffer); } if (not hasSite(c, v)) { if (DebugReads) { fprintf(stderr, "no sites found for %p\n", v); } return 0; } r->maybeIntersectWithHighSource(c); Site* site = pickSourceSite(c, r); if (site) { return site; } else { Site* target = pickTargetSite(c, r, true); unsigned copyCost; site = pickSourceSite(c, r, target, ©Cost, ~0, false); assert(c, copyCost); move(c, v, site, target); return target; } } void propagateJunctionSites(Context* c, Event* e, Site** sites) { for (Link* pl = e->predecessors; pl; pl = pl->nextPredecessor) { Event* p = pl->predecessor; if (p->junctionSites == 0) { p->junctionSites = sites; for (Link* sl = p->successors; sl; sl = sl->nextSuccessor) { Event* s = sl->successor; propagateJunctionSites(c, s, sites); } } } } void propagateJunctionSites(Context* c, Event* e) { for (Link* sl = e->successors; sl; sl = sl->nextSuccessor) { Event* s = sl->successor; if (s->predecessors->nextPredecessor) { unsigned size = sizeof(Site*) * frameFootprint(c, e->stackAfter); Site** junctionSites = static_cast (c->zone->allocate(size)); memset(junctionSites, 0, size); propagateJunctionSites(c, s, junctionSites); break; } } } class SiteRecord { public: SiteRecord(Site* site, Value* value): site(site), value(value) { } 
SiteRecord() { } Site* site; Value* value; }; class SiteRecordList { public: SiteRecordList(SiteRecord* records, unsigned capacity): records(records), index(0), capacity(capacity) { } SiteRecord* records; unsigned index; unsigned capacity; }; void freeze(Context* c, SiteRecordList* frozen, Site* s, Value* v) { assert(c, frozen->index < frozen->capacity); s->freeze(c, v); new (frozen->records + (frozen->index ++)) SiteRecord(s, v); } void thaw(Context* c, SiteRecordList* frozen) { while (frozen->index) { SiteRecord* sr = frozen->records + (-- frozen->index); sr->site->thaw(c, sr->value); } } Site* acquireSite(Context* c, SiteRecordList* frozen, Site* target, Value* v, Read* r, bool pickSource) { assert(c, hasSite(c, v)); unsigned copyCost; Site* source; if (pickSource) { source = pickSourceSite(c, r, target, ©Cost, ~0, false); } else { copyCost = 0; source = target; } if (copyCost) { target = target->copy(c); move(c, v, source, target); } else { target = source; } freeze(c, frozen, target, v); return target; } bool resolveOriginalSites(Context* c, Event* e, SiteRecordList* frozen, Site** sites) { bool complete = true; for (FrameIterator it(c, e->stackAfter, e->localsAfter); it.hasMore();) { FrameIterator::Element el = it.next(c); Value* v = el.value; Read* r = live(v); Site* s = sites[el.localIndex]; if (r) { if (s) { if (DebugControl) { char buffer[256]; s->toString(c, buffer, 256); fprintf(stderr, "resolve original %s for %p local %d frame %d\n", buffer, v, el.localIndex, frameIndex(c, &el)); } acquireSite(c, frozen, s, v, r, true); } else { complete = false; } } else if (s) { if (DebugControl) { char buffer[256]; s->toString(c, buffer, 256); fprintf(stderr, "freeze original %s for %p local %d frame %d\n", buffer, v, el.localIndex, frameIndex(c, &el)); } addSite(c, v, s); removeSite(c, v, s); freeze(c, frozen, s, v); } } return complete; } bool resolveSourceSites(Context* c, Event* e, SiteRecordList* frozen, Site** sites) { bool complete = true; for (FrameIterator 
it(c, e->stackAfter, e->localsAfter); it.hasMore();) { FrameIterator::Element el = it.next(c); Value* v = el.value; Read* r = live(v); if (r and sites[el.localIndex] == 0) { const uint32_t mask = (1 << RegisterOperand) | (1 << MemoryOperand); Site* s = pickSourceSite (c, r, 0, 0, mask, true, false, acceptForResolve); if (s == 0) { s = pickSourceSite(c, r, 0, 0, mask, false, false, acceptForResolve); } if (s) { if (DebugControl) { char buffer[256]; s->toString(c, buffer, 256); fprintf(stderr, "resolve source %s from %p local %d frame %d\n", buffer, v, el.localIndex, frameIndex(c, &el)); } sites[el.localIndex] = acquireSite(c, frozen, s, v, r, false)->copy(c); } else { complete = false; } } } return complete; } void resolveTargetSites(Context* c, Event* e, SiteRecordList* frozen, Site** sites) { for (FrameIterator it(c, e->stackAfter, e->localsAfter); it.hasMore();) { FrameIterator::Element el = it.next(c); Value* v = el.value; Read* r = live(v); if (r and sites[el.localIndex] == 0) { const uint32_t mask = (1 << RegisterOperand) | (1 << MemoryOperand); bool useTarget = false; Site* s = pickSourceSite(c, r, 0, 0, mask, true, true, acceptForResolve); if (s == 0) { s = pickSourceSite(c, r, 0, 0, mask, false, true, acceptForResolve); if (s == 0) { s = pickTargetSite(c, r, false, ResolveRegisterReserveCount); useTarget = true; } } if (DebugControl) { char buffer[256]; s->toString(c, buffer, 256); fprintf(stderr, "resolve target %s for %p local %d frame %d\n", buffer, el.value, el.localIndex, frameIndex(c, &el)); } Site* acquired = acquireSite(c, frozen, s, v, r, useTarget)->copy(c); sites[el.localIndex] = (useTarget ? 
s : acquired->copy(c)); } } } void resolveJunctionSites(Context* c, Event* e, SiteRecordList* frozen) { bool complete; if (e->junctionSites) { complete = resolveOriginalSites(c, e, frozen, e->junctionSites); } else { propagateJunctionSites(c, e); complete = false; } if (e->junctionSites) { if (not complete) { complete = resolveSourceSites(c, e, frozen, e->junctionSites); if (not complete) { resolveTargetSites(c, e, frozen, e->junctionSites); } } if (DebugControl) { fprintf(stderr, "resolved junction sites %p at %d\n", e->junctionSites, e->logicalInstruction->index); } } } void resolveBranchSites(Context* c, Event* e, SiteRecordList* frozen) { if (e->successors->nextSuccessor and e->junctionSites == 0) { unsigned footprint = frameFootprint(c, e->stackAfter); RUNTIME_ARRAY(Site*, branchSites, footprint); memset(RUNTIME_ARRAY_BODY(branchSites), 0, sizeof(Site*) * footprint); if (not resolveSourceSites(c, e, frozen, RUNTIME_ARRAY_BODY(branchSites))) { resolveTargetSites(c, e, frozen, RUNTIME_ARRAY_BODY(branchSites)); } } } void captureBranchSnapshots(Context* c, Event* e) { if (e->successors->nextSuccessor) { for (FrameIterator it(c, e->stackAfter, e->localsAfter); it.hasMore();) { FrameIterator::Element el = it.next(c); e->snapshots = makeSnapshots(c, el.value, e->snapshots); } for (Cell* sv = e->successors->forkState->saved; sv; sv = sv->next) { e->snapshots = makeSnapshots (c, static_cast(sv->value), e->snapshots); } if (DebugControl) { fprintf(stderr, "captured snapshots %p at %d\n", e->snapshots, e->logicalInstruction->index); } } } void populateSiteTables(Context* c, Event* e, SiteRecordList* frozen) { resolveJunctionSites(c, e, frozen); resolveBranchSites(c, e, frozen); captureBranchSnapshots(c, e); } void setSites(Context* c, Value* v, Site* s) { assert(c, live(v)); for (; s; s = s->next) { addSite(c, v, s->copy(c)); } if (DebugControl) { char buffer[256]; sitesToString(c, v->sites, buffer, 256); fprintf(stderr, "set sites %s for %p\n", buffer, v); } } void 
resetFrame(Context* c, Event* e) { for (FrameIterator it(c, e->stackBefore, e->localsBefore); it.hasMore();) { FrameIterator::Element el = it.next(c); clearSites(c, el.value); } } void setSites(Context* c, Event* e, Site** sites) { resetFrame(c, e); for (FrameIterator it(c, e->stackBefore, e->localsBefore); it.hasMore();) { FrameIterator::Element el = it.next(c); if (sites[el.localIndex]) { if (live(el.value)) { setSites(c, el.value, sites[el.localIndex]); } else if (DebugControl) { char buffer[256]; sitesToString(c, sites[el.localIndex], buffer, 256); fprintf(stderr, "skip sites %s for %p local %d frame %d\n", buffer, el.value, el.localIndex, frameIndex(c, &el)); } } else if (DebugControl) { fprintf(stderr, "no sites for %p local %d frame %d\n", el.value, el.localIndex, frameIndex(c, &el)); } } } void removeBuddies(Context* c) { for (FrameIterator it(c, c->stack, c->locals); it.hasMore();) { FrameIterator::Element el = it.next(c); removeBuddy(c, el.value); } } void restore(Context* c, Event* e, Snapshot* snapshots) { for (Snapshot* s = snapshots; s; s = s->next) { // char buffer[256]; sitesToString(c, s->sites, buffer, 256); // fprintf(stderr, "restore %p buddy %p sites %s live %p\n", // s->value, s->value->buddy, buffer, live(s->value)); assert(c, s->buddy); s->value->buddy = s->buddy; } resetFrame(c, e); for (Snapshot* s = snapshots; s; s = s->next) { if (live(s->value)) { if (live(s->value) and s->sites and s->value->sites == 0) { setSites(c, s->value, s->sites); } } } } void populateSources(Context* c, Event* e) { RUNTIME_ARRAY(SiteRecord, frozenRecords, e->readCount); SiteRecordList frozen(RUNTIME_ARRAY_BODY(frozenRecords), e->readCount); for (Read* r = e->reads; r; r = r->eventNext) { r->value->source = readSource(c, r); if (r->value->source) { if (DebugReads) { char buffer[256]; r->value->source->toString(c, buffer, 256); fprintf(stderr, "freeze source %s for %p\n", buffer, r->value); } freeze(c, &frozen, r->value->source, r->value); } } thaw(c, &frozen); } 
void setStubRead(Context* c, StubReadPair* p, Value* v) { if (v) { StubRead* r = stubRead(c); if (DebugReads) { fprintf(stderr, "add stub read %p to %p\n", r, v); } addRead(c, 0, v, r); p->value = v; p->read = r; } } void populateJunctionReads(Context* c, Link* link) { JunctionState* state = new (c->zone->allocate (sizeof(JunctionState) + (sizeof(StubReadPair) * frameFootprint(c, c->stack)))) JunctionState(frameFootprint(c, c->stack)); memset(state->reads, 0, sizeof(StubReadPair) * frameFootprint(c, c->stack)); link->junctionState = state; for (FrameIterator it(c, c->stack, c->locals); it.hasMore();) { FrameIterator::Element e = it.next(c); setStubRead(c, state->reads + e.localIndex, e.value); } } void updateJunctionReads(Context* c, JunctionState* state) { for (FrameIterator it(c, c->stack, c->locals); it.hasMore();) { FrameIterator::Element e = it.next(c); StubReadPair* p = state->reads + e.localIndex; if (p->value and p->read->read == 0) { Read* r = live(e.value); if (r) { if (DebugReads) { fprintf(stderr, "stub read %p for %p valid: %p\n", p->read, p->value, r); } p->read->read = r; } } } for (unsigned i = 0; i < frameFootprint(c, c->stack); ++i) { StubReadPair* p = state->reads + i; if (p->value and p->read->read == 0) { if (DebugReads) { fprintf(stderr, "stub read %p for %p invalid\n", p->read, p->value); } p->read->valid_ = false; } } } LogicalInstruction* next(Context* c, LogicalInstruction* i) { for (unsigned n = i->index + 1; n < c->logicalCodeLength; ++n) { i = c->logicalCode[n]; if (i) return i; } return 0; } class Block { public: Block(Event* head): head(head), nextBlock(0), nextInstruction(0), assemblerBlock(0), start(0) { } Event* head; Block* nextBlock; LogicalInstruction* nextInstruction; Assembler::Block* assemblerBlock; unsigned start; }; Block* block(Context* c, Event* head) { return new (c->zone->allocate(sizeof(Block))) Block(head); } unsigned compile(Context* c) { if (c->logicalCode[c->logicalIp]->lastEvent == 0) { appendDummy(c); } 
Assembler* a = c->assembler; Block* firstBlock = block(c, c->firstEvent); Block* block = firstBlock; a->allocateFrame(c->alignedFrameSize); for (Event* e = c->firstEvent; e; e = e->next) { if (DebugCompile) { fprintf(stderr, " -- compile %s at %d with %d preds %d succs %d stack\n", e->name(), e->logicalInstruction->index, countPredecessors(e->predecessors), countSuccessors(e->successors), e->stackBefore ? e->stackBefore->index + 1 : 0); } e->block = block; c->stack = e->stackBefore; c->locals = e->localsBefore; if (e->logicalInstruction->machineOffset == 0) { e->logicalInstruction->machineOffset = a->offset(); } if (e->predecessors) { visit(c, lastPredecessor(e->predecessors)); Event* first = e->predecessors->predecessor; if (e->predecessors->nextPredecessor) { for (Link* pl = e->predecessors; pl->nextPredecessor; pl = pl->nextPredecessor) { updateJunctionReads(c, pl->junctionState); } if (DebugControl) { fprintf(stderr, "set sites to junction sites %p at %d\n", first->junctionSites, first->logicalInstruction->index); } setSites(c, e, first->junctionSites); removeBuddies(c); } else if (first->successors->nextSuccessor) { if (DebugControl) { fprintf(stderr, "restore snapshots %p at %d\n", first->snapshots, first->logicalInstruction->index); } restore(c, e, first->snapshots); } } unsigned footprint = frameFootprint(c, e->stackAfter); RUNTIME_ARRAY(SiteRecord, frozenRecords, footprint); SiteRecordList frozen(RUNTIME_ARRAY_BODY(frozenRecords), footprint); bool branch = e->isBranch(); if (branch and e->successors) { populateSiteTables(c, e, &frozen); } populateSources(c, e); thaw(c, &frozen); e->compile(c); if ((not branch) and e->successors) { populateSiteTables(c, e, &frozen); thaw(c, &frozen); } if (e->visitLinks) { for (Cell* cell = reverseDestroy(e->visitLinks); cell; cell = cell->next) { visit(c, static_cast(cell->value)); } e->visitLinks = 0; } for (CodePromise* p = e->promises; p; p = p->next) { p->offset = a->offset(); } LogicalInstruction* nextInstruction = 
next(c, e->logicalInstruction); if (e->next == 0 or (e->next->logicalInstruction != e->logicalInstruction and (e->next->logicalInstruction != nextInstruction or e != e->logicalInstruction->lastEvent))) { Block* b = e->logicalInstruction->firstEvent->block; while (b->nextBlock) { b = b->nextBlock; } if (b != block) { b->nextBlock = block; } block->nextInstruction = nextInstruction; block->assemblerBlock = a->endBlock(e->next != 0); if (e->next) { block = local::block(c, e->next); } } } block = firstBlock; while (block->nextBlock or block->nextInstruction) { Block* next = block->nextBlock ? block->nextBlock : block->nextInstruction->firstEvent->block; next->start = block->assemblerBlock->resolve (block->start, next->assemblerBlock); block = next; } return block->assemblerBlock->resolve(block->start, 0); } unsigned count(Stack* s) { unsigned c = 0; while (s) { ++ c; s = s->next; } return c; } void restore(Context* c, ForkState* state) { for (unsigned i = 0; i < state->readCount; ++i) { ForkElement* p = state->elements + i; p->value->lastRead = p->read; p->read->allocateTarget(c); } } void addForkElement(Context* c, Value* v, ForkState* state, unsigned index) { MultiRead* r = multiRead(c); if (DebugReads) { fprintf(stderr, "add multi read %p to %p\n", r, v); } addRead(c, 0, v, r); ForkElement* p = state->elements + index; p->value = v; p->read = r; } ForkState* saveState(Context* c) { unsigned elementCount = frameFootprint(c, c->stack) + count(c->saved); ForkState* state = new (c->zone->allocate (sizeof(ForkState) + (sizeof(ForkElement) * elementCount))) ForkState(c->stack, c->locals, c->saved, c->predecessor, c->logicalIp); if (c->predecessor) { c->forkState = state; unsigned count = 0; for (FrameIterator it(c, c->stack, c->locals); it.hasMore();) { FrameIterator::Element e = it.next(c); addForkElement(c, e.value, state, count++); } for (Cell* sv = c->saved; sv; sv = sv->next) { addForkElement(c, static_cast(sv->value), state, count++); } state->readCount = count; } 
c->saved = 0; return state; } void restoreState(Context* c, ForkState* s) { if (c->logicalCode[c->logicalIp]->lastEvent == 0) { appendDummy(c); } c->stack = s->stack; c->locals = s->locals; c->predecessor = s->predecessor; c->logicalIp = s->logicalIp; if (c->predecessor) { c->forkState = s; restore(c, s); } } Value* maybeBuddy(Context* c, Value* v) { if (v->home >= 0) { Value* n = value(c, v->type); appendBuddy(c, v, n); return n; } else { return v; } } class Client: public Assembler::Client { public: Client(Context* c): c(c) { } virtual int acquireTemporary(uint32_t mask) { unsigned cost; int r = pickRegisterTarget(c, 0, mask, &cost); expect(c, cost < Target::Impossible); save(r); increment(c, c->registerResources + r); return r; } virtual void releaseTemporary(int r) { decrement(c, c->registerResources + r); } virtual void save(int r) { RegisterResource* reg = c->registerResources + r; assert(c, reg->referenceCount == 0); assert(c, reg->freezeCount == 0); assert(c, not reg->reserved); if (reg->value) { steal(c, reg, 0); } } Context* c; }; class MyCompiler: public Compiler { public: MyCompiler(System* s, Assembler* assembler, Zone* zone, Compiler::Client* compilerClient): c(s, assembler, zone, compilerClient), client(&c) { assembler->setClient(&client); } virtual State* saveState() { State* s = local::saveState(&c); restoreState(s); return s; } virtual void restoreState(State* state) { local::restoreState(&c, static_cast(state)); } virtual Subroutine* startSubroutine() { return c.subroutine = new (c.zone->allocate(sizeof(MySubroutine))) MySubroutine; } virtual void endSubroutine(Subroutine* subroutine) { appendCleanLocals(&c); static_cast(subroutine)->forkState = local::saveState(&c); } virtual void linkSubroutine(Subroutine* subroutine) { restoreState(static_cast(subroutine)->forkState); } virtual void init(unsigned logicalCodeLength, unsigned parameterFootprint, unsigned localFootprint, unsigned alignedFrameSize) { c.logicalCodeLength = logicalCodeLength; 
c.parameterFootprint = parameterFootprint; c.localFootprint = localFootprint; c.alignedFrameSize = alignedFrameSize; unsigned frameResourceCount = totalFrameSize(&c); c.frameResources = static_cast (c.zone->allocate(sizeof(FrameResource) * frameResourceCount)); for (unsigned i = 0; i < frameResourceCount; ++i) { new (c.frameResources + i) FrameResource; } unsigned base = frameBase(&c); c.frameResources[base + c.arch->returnAddressOffset()].reserved = true; c.frameResources[base + c.arch->framePointerOffset()].reserved = true; // leave room for logical instruction -1 unsigned codeSize = sizeof(LogicalInstruction*) * (logicalCodeLength + 1); c.logicalCode = static_cast (c.zone->allocate(codeSize)); memset(c.logicalCode, 0, codeSize); c.logicalCode++; c.locals = static_cast (c.zone->allocate(sizeof(Local) * localFootprint)); memset(c.locals, 0, sizeof(Local) * localFootprint); c.logicalCode[-1] = new (c.zone->allocate(sizeof(LogicalInstruction))) LogicalInstruction(-1, c.stack, c.locals); } virtual void visitLogicalIp(unsigned logicalIp) { assert(&c, logicalIp < c.logicalCodeLength); if (c.logicalCode[c.logicalIp]->lastEvent == 0) { appendDummy(&c); } Event* e = c.logicalCode[logicalIp]->firstEvent; Event* p = c.predecessor; if (p) { if (DebugAppend) { fprintf(stderr, "visit %d pred %d\n", logicalIp, p->logicalInstruction->index); } p->stackAfter = c.stack; p->localsAfter = c.locals; Link* link = local::link (&c, p, e->predecessors, e, p->successors, c.forkState); e->predecessors = link; p->successors = link; c.lastEvent->visitLinks = cons(&c, link, c.lastEvent->visitLinks); if (DebugAppend) { fprintf(stderr, "populate junction reads for %d to %d\n", p->logicalInstruction->index, logicalIp); } populateJunctionReads(&c, link); } if (c.subroutine) { c.subroutine->forkState = c.logicalCode[logicalIp]->subroutine->forkState; c.subroutine = 0; } c.forkState = 0; } virtual void startLogicalIp(unsigned logicalIp) { assert(&c, logicalIp < c.logicalCodeLength); assert(&c, 
c.logicalCode[logicalIp] == 0); if (c.logicalCode[c.logicalIp]->lastEvent == 0) { appendDummy(&c); } Event* p = c.predecessor; if (p) { p->stackAfter = c.stack; p->localsAfter = c.locals; } c.logicalCode[logicalIp] = new (c.zone->allocate(sizeof(LogicalInstruction))) LogicalInstruction(logicalIp, c.stack, c.locals); bool startSubroutine = c.subroutine != 0; if (startSubroutine) { c.logicalCode[logicalIp]->subroutine = c.subroutine; c.subroutine = 0; } c.logicalIp = logicalIp; if (startSubroutine) { // assume all local variables are initialized on entry to a // subroutine, since other calls to the subroutine may // initialize them: unsigned sizeInBytes = sizeof(Local) * c.localFootprint; Local* newLocals = static_cast(c.zone->allocate(sizeInBytes)); memcpy(newLocals, c.locals, sizeInBytes); c.locals = newLocals; for (unsigned li = 0; li < c.localFootprint; ++li) { Local* local = c.locals + li; if (local->value == 0) { initLocal(1, li, IntegerType); } } } } virtual Promise* machineIp(unsigned logicalIp) { return new (c.zone->allocate(sizeof(IpPromise))) IpPromise(&c, logicalIp); } virtual Promise* poolAppend(intptr_t value) { return poolAppendPromise(resolved(&c, value)); } virtual Promise* poolAppendPromise(Promise* value) { Promise* p = new (c.zone->allocate(sizeof(PoolPromise))) PoolPromise(&c, c.constantCount); ConstantPoolNode* constant = new (c.zone->allocate(sizeof(ConstantPoolNode))) ConstantPoolNode(value); if (c.firstConstant) { c.lastConstant->next = constant; } else { c.firstConstant = constant; } c.lastConstant = constant; ++ c.constantCount; return p; } virtual Operand* constant(int64_t value, OperandType type) { return promiseConstant(resolved(&c, value), type); } virtual Operand* promiseConstant(Promise* value, OperandType type) { return local::value (&c, valueType(&c, type), local::constantSite(&c, value)); } virtual Operand* address(Promise* address) { return value(&c, ValueGeneral, local::addressSite(&c, address)); } virtual Operand* 
memory(Operand* base, OperandType type, int displacement = 0, Operand* index = 0, unsigned scale = 1) { Value* result = value(&c, valueType(&c, type)); appendMemory(&c, static_cast(base), displacement, static_cast(index), scale, result); return result; } virtual Operand* register_(int number) { assert(&c, (1 << number) & (c.arch->generalRegisterMask() | c.arch->floatRegisterMask())); Site* s = registerSite(&c, number); ValueType type = ((1 << number) & c.arch->floatRegisterMask()) ? ValueFloat: ValueGeneral; return value(&c, type, s, s); } Promise* machineIp() { return codePromise(&c, c.logicalCode[c.logicalIp]->lastEvent); } virtual void push(unsigned footprint UNUSED) { assert(&c, footprint == 1); Value* v = value(&c, ValueFloat); Stack* s = local::stack(&c, v, c.stack); v->home = frameIndex(&c, s->index + c.localFootprint); c.stack = s; } virtual void push(unsigned footprint, Operand* value) { local::push(&c, footprint, static_cast(value), true); } virtual void save(unsigned footprint, Operand* value) { c.saved = cons(&c, static_cast(value), c.saved); if (BytesPerWord == 4 and footprint > 1) { assert(&c, footprint == 2); assert(&c, static_cast(value)->next); save(1, static_cast(value)->next); } } virtual Operand* pop(unsigned footprint) { return local::pop(&c, footprint); } virtual void pushed() { Value* v = value(&c, ValueFloat); appendFrameSite (&c, v, frameIndex (&c, (c.stack ? 
c.stack->index : 0) + c.localFootprint)); Stack* s = local::stack(&c, v, c.stack); v->home = frameIndex(&c, s->index + c.localFootprint); c.stack = s; } virtual void popped(unsigned footprint) { for (; footprint; -- footprint) { assert(&c, c.stack->value == 0 or c.stack->value->home >= 0); if (DebugFrame) { fprintf(stderr, "popped %p\n", c.stack->value); } c.stack = c.stack->next; } } virtual unsigned topOfStack() { return c.stack->index; } virtual Operand* peek(unsigned footprint, unsigned index) { Stack* s = c.stack; for (unsigned i = index; i > 0; --i) { s = s->next; } if (footprint > 1) { assert(&c, footprint == 2); bool bigEndian = c.arch->bigEndian(); #ifndef NDEBUG Stack* low; Stack* high; if (bigEndian) { low = s; high = s->next; } else { high = s; low = s->next; } assert(&c, low->value->next == high->value and ((BytesPerWord == 8) xor (low->value->next != 0))); #endif // not NDEBUG if (not bigEndian) { s = s->next; } } return s->value; } virtual Operand* call(Operand* address, unsigned flags, TraceHandler* traceHandler, unsigned resultSize, OperandType resultType, unsigned argumentCount, ...) 
{ va_list a; va_start(a, argumentCount); bool bigEndian = c.arch->bigEndian(); unsigned footprint = 0; unsigned size = BytesPerWord; RUNTIME_ARRAY(Value*, arguments, argumentCount); int index = 0; for (unsigned i = 0; i < argumentCount; ++i) { Value* o = va_arg(a, Value*); if (o) { if (bigEndian and size > BytesPerWord) { RUNTIME_ARRAY_BODY(arguments)[index++] = o->next; } RUNTIME_ARRAY_BODY(arguments)[index] = o; if ((not bigEndian) and size > BytesPerWord) { RUNTIME_ARRAY_BODY(arguments)[++index] = o->next; } size = BytesPerWord; ++ index; } else { size = 8; } ++ footprint; } va_end(a); Stack* argumentStack = c.stack; for (int i = index - 1; i >= 0; --i) { argumentStack = local::stack (&c, RUNTIME_ARRAY_BODY(arguments)[i], argumentStack); } Value* result = value(&c, valueType(&c, resultType)); appendCall(&c, static_cast(address), flags, traceHandler, result, resultSize, argumentStack, index, 0); return result; } virtual Operand* stackCall(Operand* address, unsigned flags, TraceHandler* traceHandler, unsigned resultSize, OperandType resultType, unsigned argumentFootprint) { Value* result = value(&c, valueType(&c, resultType)); appendCall(&c, static_cast(address), flags, traceHandler, result, resultSize, c.stack, 0, argumentFootprint); return result; } virtual void return_(unsigned size, Operand* value) { appendReturn(&c, size, static_cast(value)); } virtual void initLocal(unsigned footprint, unsigned index, OperandType type) { assert(&c, index + footprint <= c.localFootprint); Value* v = value(&c, valueType(&c, type)); if (footprint > 1) { assert(&c, footprint == 2); unsigned highIndex; unsigned lowIndex; if (c.arch->bigEndian()) { highIndex = index + 1; lowIndex = index; } else { lowIndex = index + 1; highIndex = index; } if (BytesPerWord == 4) { initLocal(1, highIndex, type); Value* next = c.locals[highIndex].value; v->next = next; next->next = v; next->index = 1; } index = lowIndex; } if (DebugFrame) { fprintf(stderr, "init local %p at %d (%d)\n", v, index, 
frameIndex(&c, index)); } appendFrameSite(&c, v, frameIndex(&c, index)); Local* local = c.locals + index; local->value = v; v->home = frameIndex(&c, index); } virtual void initLocalsFromLogicalIp(unsigned logicalIp) { assert(&c, logicalIp < c.logicalCodeLength); unsigned footprint = sizeof(Local) * c.localFootprint; Local* newLocals = static_cast(c.zone->allocate(footprint)); memset(newLocals, 0, footprint); c.locals = newLocals; Event* e = c.logicalCode[logicalIp]->firstEvent; for (int i = 0; i < static_cast(c.localFootprint); ++i) { Local* local = e->localsBefore + i; if (local->value) { initLocal (1, i, local->value->type == ValueGeneral ? IntegerType : FloatType); } } for (int i = 0; i < static_cast(c.localFootprint); ++i) { Local* local = e->localsBefore + i; if (local->value) { int highOffset = c.arch->bigEndian() ? 1 : -1; if (i + highOffset >= 0 and i + highOffset < static_cast(c.localFootprint) and local->value->next == local[highOffset].value) { Value* v = c.locals[i].value; Value* next = c.locals[i + highOffset].value; v->next = next; next->next = v; next->index = 1; } } } } virtual void storeLocal(unsigned footprint, Operand* src, unsigned index) { local::storeLocal(&c, footprint, static_cast(src), index, true); } virtual Operand* loadLocal(unsigned footprint, unsigned index) { return local::loadLocal(&c, footprint, index); } virtual void saveLocals() { appendSaveLocals(&c); } virtual void checkBounds(Operand* object, unsigned lengthOffset, Operand* index, intptr_t handler) { appendBoundsCheck(&c, static_cast(object), lengthOffset, static_cast(index), handler); } virtual void store(unsigned srcSize, Operand* src, unsigned dstSize, Operand* dst) { appendMove(&c, Move, srcSize, srcSize, static_cast(src), dstSize, static_cast(dst)); } virtual Operand* load(unsigned srcSize, unsigned srcSelectSize, Operand* src, unsigned dstSize) { assert(&c, dstSize >= BytesPerWord); Value* dst = value(&c, static_cast(src)->type); appendMove(&c, Move, srcSize, 
srcSelectSize, static_cast(src), dstSize, dst); return dst; } virtual Operand* loadz(unsigned srcSize, unsigned srcSelectSize, Operand* src, unsigned dstSize) { assert(&c, dstSize >= BytesPerWord); Value* dst = value(&c, static_cast(src)->type); appendMove(&c, MoveZ, srcSize, srcSelectSize, static_cast(src), dstSize, dst); return dst; } virtual Operand* lcmp(Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral and static_cast(b)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, LongCompare, 8, static_cast(a), 8, static_cast(b), 8, result); return result; } virtual void cmp(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral and static_cast(b)->type == ValueGeneral); appendCompare(&c, Compare, size, static_cast(a), static_cast(b)); } virtual void fcmp(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueFloat and static_cast(b)->type == ValueFloat); appendCompare(&c, FloatCompare, size, static_cast(a), static_cast(b)); } virtual void jl(Operand* address) { appendBranch(&c, JumpIfLess, static_cast(address)); } virtual void jg(Operand* address) { appendBranch(&c, JumpIfGreater, static_cast(address)); } virtual void jle(Operand* address) { appendBranch(&c, JumpIfLessOrEqual, static_cast(address)); } virtual void jge(Operand* address) { appendBranch(&c, JumpIfGreaterOrEqual, static_cast(address)); } virtual void je(Operand* address) { appendBranch(&c, JumpIfEqual, static_cast(address)); } virtual void jne(Operand* address) { appendBranch(&c, JumpIfNotEqual, static_cast(address)); } virtual void fjl(Operand* address) { appendBranch(&c, JumpIfFloatLess, static_cast(address)); } virtual void fjg(Operand* address) { appendBranch(&c, JumpIfFloatGreater, static_cast(address)); } virtual void fjle(Operand* address) { appendBranch(&c, JumpIfFloatLessOrEqual, static_cast(address)); } virtual void fjge(Operand* address) { appendBranch(&c, 
JumpIfFloatGreaterOrEqual, static_cast(address)); } virtual void fje(Operand* address) { appendBranch(&c, JumpIfFloatEqual, static_cast(address)); } virtual void fjne(Operand* address) { appendBranch(&c, JumpIfFloatNotEqual, static_cast(address)); } virtual void fjuo(Operand* address) { appendBranch(&c, JumpIfFloatUnordered, static_cast(address)); } virtual void jmp(Operand* address) { appendBranch(&c, Jump, static_cast(address)); } virtual void exit(Operand* address) { appendBranch(&c, Jump, static_cast(address), true); } virtual Operand* add(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral and static_cast(b)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, Add, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* sub(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral and static_cast(b)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, Subtract, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* mul(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral and static_cast(b)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, Multiply, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* div(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral and static_cast(b)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, Divide, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* rem(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral and static_cast(b)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, Remainder, size, static_cast(a), size, static_cast(b), size, result); 
return result; } virtual Operand* fadd(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueFloat and static_cast(b)->type == ValueFloat); Value* result = value(&c, ValueFloat); static_cast(a)->type = static_cast(b)->type = ValueFloat; appendCombine(&c, FloatAdd, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* fsub(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueFloat and static_cast(b)->type == ValueFloat); Value* result = value(&c, ValueFloat); static_cast(a)->type = static_cast(b)->type = ValueFloat; appendCombine(&c, FloatSubtract, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* fmul(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueFloat and static_cast(b)->type == ValueFloat); Value* result = value(&c, ValueFloat); static_cast(a)->type = static_cast(b)->type = ValueFloat; appendCombine(&c, FloatMultiply, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* fdiv(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueFloat and static_cast(b)->type == ValueFloat); Value* result = value(&c, ValueFloat); appendCombine(&c, FloatDivide, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* frem(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueFloat and static_cast(b)->type == ValueFloat); Value* result = value(&c, ValueFloat); appendCombine(&c, FloatRemainder, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* shl(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, ShiftLeft, BytesPerWord, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* shr(unsigned size, Operand* a, Operand* 
b) { assert(&c, static_cast(a)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, ShiftRight, BytesPerWord, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* ushr(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine (&c, UnsignedShiftRight, BytesPerWord, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* and_(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, And, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* or_(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, Or, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* xor_(unsigned size, Operand* a, Operand* b) { assert(&c, static_cast(a)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendCombine(&c, Xor, size, static_cast(a), size, static_cast(b), size, result); return result; } virtual Operand* neg(unsigned size, Operand* a) { assert(&c, static_cast(a)->type == ValueGeneral); Value* result = value(&c, ValueGeneral); appendTranslate(&c, Negate, size, static_cast(a), size, result); return result; } virtual Operand* fneg(unsigned size, Operand* a) { assert(&c, static_cast(a)->type == ValueFloat); Value* result = value(&c, ValueFloat); appendTranslate (&c, FloatNegate, size, static_cast(a), size, result); return result; } virtual Operand* operation(BinaryOperation op, unsigned aSize, unsigned resSize, OperandType resType, Operand* a) { Value* result = value(&c, valueType(&c, resType)); appendTranslate(&c, op, aSize, static_cast(a), resSize, result); return result; } virtual Operand* operation(TernaryOperation op, unsigned 
aSize, unsigned bSize, unsigned resSize, OperandType resType, Operand* a, Operand* b) { Value* result = value(&c, valueType(&c, resType)); appendCombine (&c, op, aSize, static_cast(a), bSize, static_cast(b), resSize, result); return result; } virtual Operand* f2f(unsigned aSize, unsigned resSize, Operand* a) { assert(&c, static_cast(a)->type == ValueFloat); Value* result = value(&c, ValueFloat); appendTranslate (&c, Float2Float, aSize, static_cast(a), resSize, result); return result; } virtual Operand* f2i(unsigned aSize, unsigned resSize, Operand* a) { assert(&c, static_cast(a)->type == ValueFloat); Value* result = value(&c, ValueGeneral); appendTranslate (&c, Float2Int, aSize, static_cast(a), resSize, result); return result; } virtual Operand* i2f(unsigned aSize, unsigned resSize, Operand* a) { assert(&c, static_cast(a)->type == ValueGeneral); Value* result = value(&c, ValueFloat); appendTranslate (&c, Int2Float, aSize, static_cast(a), resSize, result); return result; } virtual void loadBarrier() { appendBarrier(&c, LoadBarrier); } virtual void storeStoreBarrier() { appendBarrier(&c, StoreStoreBarrier); } virtual void storeLoadBarrier() { appendBarrier(&c, StoreLoadBarrier); } virtual unsigned compile() { return c.machineCodeSize = local::compile(&c); } virtual unsigned poolSize() { return c.constantCount * BytesPerWord; } virtual void writeTo(uint8_t* dst) { c.machineCode = dst; c.assembler->writeTo(dst); int i = 0; for (ConstantPoolNode* n = c.firstConstant; n; n = n->next) { intptr_t* target = reinterpret_cast (dst + pad(c.machineCodeSize) + i); if (n->promise->resolved()) { *target = n->promise->value(); } else { class Listener: public Promise::Listener { public: Listener(intptr_t* target): target(target){ } virtual bool resolve(int64_t value, void** location) { *target = value; if (location) *location = target; return true; } intptr_t* target; }; new (n->promise->listen(sizeof(Listener))) Listener(target); } i += BytesPerWord; } } virtual void dispose() { // 
ignore } Context c; local::Client client; }; } // namespace local } // namespace namespace vm { Compiler* makeCompiler(System* system, Assembler* assembler, Zone* zone, Compiler::Client* client) { return new (zone->allocate(sizeof(local::MyCompiler))) local::MyCompiler(system, assembler, zone, client); } } // namespace vm