initial sketch of tail call optimization (non-virtual calls only, so far)

This commit is contained in:
Joel Dice 2009-03-31 14:15:08 -06:00
parent b871f430d0
commit 5e740170f2
7 changed files with 420 additions and 122 deletions

View File

@ -277,6 +277,8 @@ class Assembler {
virtual void updateCall(UnaryOperation op, bool assertAlignment, virtual void updateCall(UnaryOperation op, bool assertAlignment,
void* returnAddress, void* newTarget) = 0; void* returnAddress, void* newTarget) = 0;
virtual unsigned constantCallSize() = 0;
virtual uintptr_t getConstant(const void* src) = 0; virtual uintptr_t getConstant(const void* src) = 0;
virtual void setConstant(void* dst, uintptr_t constant) = 0; virtual void setConstant(void* dst, uintptr_t constant) = 0;

View File

@ -426,15 +426,18 @@ class Context;
class TraceElement: public TraceHandler { class TraceElement: public TraceHandler {
public: public:
const unsigned VirtualCall = 1 << 0;
const unsigned TailCall = 1 << 1;
TraceElement(Context* context, object target, TraceElement(Context* context, object target,
bool virtualCall, TraceElement* next): unsigned flags, TraceElement* next):
context(context), context(context),
address(0), address(0),
next(next), next(next),
target(target), target(target),
padIndex(0), padIndex(0),
padding(0), padding(0),
virtualCall(virtualCall) flags(flags)
{ } { }
virtual void handleTrace(Promise* address, unsigned padIndex, virtual void handleTrace(Promise* address, unsigned padIndex,
@ -453,10 +456,27 @@ class TraceElement: public TraceHandler {
object target; object target;
unsigned padIndex; unsigned padIndex;
unsigned padding; unsigned padding;
bool virtualCall; unsigned flags;
uintptr_t map[0]; uintptr_t map[0];
}; };
class TraceElementPromise: public Promise {
public:
TraceElementPromise(TraceElement* trace): trace(trace) { }
virtual int64_t value() {
assert(s, resolved());
return reinterpret_cast<uintptr_t>(trace->address);
}
virtual bool resolved() {
return trace->address != 0;
}
System* s;
TraceElement* trace;
};
enum Event { enum Event {
PushContextEvent, PushContextEvent,
PopContextEvent, PopContextEvent,
@ -1182,12 +1202,12 @@ class Frame {
swapped(); swapped();
} }
TraceElement* trace(object target, bool virtualCall) { TraceElement* trace(object target, unsigned flags) {
unsigned mapSize = frameMapSizeInWords(t, context->method); unsigned mapSize = frameMapSizeInWords(t, context->method);
TraceElement* e = context->traceLog = new TraceElement* e = context->traceLog = new
(context->zone.allocate(sizeof(TraceElement) + (mapSize * BytesPerWord))) (context->zone.allocate(sizeof(TraceElement) + (mapSize * BytesPerWord)))
TraceElement(context, target, virtualCall, context->traceLog); TraceElement(context, target, flags, context->traceLog);
++ context->traceLogCount; ++ context->traceLogCount;
@ -1863,8 +1883,75 @@ emptyMethod(MyThread* t, object method)
and (codeBody(t, methodCode(t, method), 0) == return_); and (codeBody(t, methodCode(t, method), 0) == return_);
} }
Compiler::Operand*
compileDirectInvoke(MyThread* t, Frame* frame, object target, bool tailCall,
bool useThunk, unsigned rSize, Promise* addressPromise)
{
if (tailCall and methodParameterFootprint(t, target)
> methodParameterFootprint(t, frame->context->method))
{
return c->stackCall
(c->constant(tailHelperThunk(t)),
0,
frame->trace(target, 0),
rSize,
methodParameterFootprint(t, target));
} else if (tailCall and (methodFlags(t, target) & ACC_NATIVE)) {
return c->stackCall
(c->constant(nativeTailThunk(t)),
Compiler::TailCall,
frame->trace(target, TraceElement::TailCall),
trace,
rSize,
methodParameterFootprint(t, target));
} else {
unsigned flags = (tailCall ? Compiler::TailCall : 0);
if (useThunk) {
if (tailCall) {
Compiler::Operand* result = c->stackCall
(c->promiseConstant
(new (frame->context->zone.allocate(sizeof(TraceElementPromise)))
TraceElementPromise(t->m->system, frame->trace(0, 0))),
flags | Compiler::Aligned,
0,
rSize,
methodParameterFootprint(t, target));
c->call(c->constant(defaultTailThunk(t)),
0,
frame->trace(target, TraceElement::TailCall),
0,
0);
return result;
} else {
return c->stackCall
(address,
flags | Compiler::Aligned,
frame->trace(target, 0),
rSize,
methodParameterFootprint(t, target));
}
} else {
Compiler::Operand* address =
(addressPromise
? c->promiseConstant(addressPromise)
: c->constant(methodAddress(t, target)));
return c->stackCall
(c->promiseConstant(p),
flags,
tailCall ? 0 : frame->trace
((methodFlags(t, target) & ACC_NATIVE) ? target, 0),
rSize,
methodParameterFootprint(t, target));
}
}
}
void void
compileDirectInvoke(MyThread* t, Frame* frame, object target) compileDirectInvoke(MyThread* t, Frame* frame, object target, bool tailCall)
{ {
Compiler* c = frame->c; Compiler* c = frame->c;
@ -1885,42 +1972,20 @@ compileDirectInvoke(MyThread* t, Frame* frame, object target)
object pointer = makePointer(t, p); object pointer = makePointer(t, p);
bc->calls = makeTriple(t, target, pointer, bc->calls); bc->calls = makeTriple(t, target, pointer, bc->calls);
object traceTarget result = compileDirectInvoke
= (methodFlags(t, target) & ACC_NATIVE) ? target : 0; (t, frame, target, tailCall, false, rSize, p);
result = c->stackCall
(c->promiseConstant(p),
0,
frame->trace(traceTarget, false),
rSize,
methodParameterFootprint(t, target));
} else { } else {
result = c->stackCall result = compileDirectInvoke
(c->constant(defaultThunk(t)), (t, frame, target, tailCall, true, rSize, 0);
Compiler::Aligned,
frame->trace(target, false),
rSize,
methodParameterFootprint(t, target));
} }
} else if (methodAddress(t, target) == defaultThunk(t) } else if (methodAddress(t, target) == defaultThunk(t)
or classNeedsInit(t, methodClass(t, target))) or classNeedsInit(t, methodClass(t, target)))
{ {
result = c->stackCall result = compileDirectInvoke
(c->constant(defaultThunk(t)), (t, frame, target, tailCall, true, rSize, 0);
Compiler::Aligned,
frame->trace(target, false),
rSize,
methodParameterFootprint(t, target));
} else { } else {
object traceTarget result = compileDirectInvoke
= (methodFlags(t, target) & ACC_NATIVE) ? target : 0; (t, frame, target, tailCall, false, rSize, 0);
result = c->stackCall
(c->constant(methodAddress(t, target)),
0,
frame->trace(traceTarget, false),
rSize,
methodParameterFootprint(t, target));
} }
} }
@ -1947,7 +2012,7 @@ handleMonitorEvent(MyThread* t, Frame* frame, intptr_t function)
c->call(c->constant(function), c->call(c->constant(function),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
0, 0,
2, c->thread(), lock); 2, c->thread(), lock);
} }
@ -2059,6 +2124,35 @@ inTryBlock(MyThread* t, object code, unsigned ip)
return false; return false;
} }
bool
needsReturnBarrier(MyThread* t, object method)
{
return (methodFlags(t, method) & ConstructorFlag)
and (classFlags(t, methodClass(t, method)) & HasFinalMemberFlag);
}
bool
isTailCall(MyThread* t, object code, unsigned ip, object caller, object callee)
{
if (((methodFlags(t, caller) & ACC_SYNCHRONIZED) == 0)
and (not inTryBlock(t, code, ip - 1))
and (not needsReturnBarrier(t, caller))
and (methodReturnCode(t, caller) == VoidField
or methodReturnCode(t, caller) == methodReturnCode(t, callee)))
{
switch (codeBody(t, code, ip)) {
case return_:
case areturn:
case ireturn:
case freturn:
case lreturn:
case dreturn:
return true;
}
}
return false;
}
void void
compile(MyThread* t, Frame* initialFrame, unsigned ip, compile(MyThread* t, Frame* initialFrame, unsigned ip,
int exceptionHandlerStart = -1); int exceptionHandlerStart = -1);
@ -2104,7 +2198,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
c->call c->call
(c->constant(getThunk(t, gcIfNecessaryThunk)), (c->constant(getThunk(t, gcIfNecessaryThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
0, 0,
1, c->thread()); 1, c->thread());
} }
@ -2204,7 +2298,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
c->call c->call
(c->constant(getThunk(t, setMaybeNullThunk)), (c->constant(getThunk(t, setMaybeNullThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
0, 0,
4, c->thread(), array, 4, c->thread(), array,
c->add(4, c->constant(ArrayBody), c->add(4, c->constant(ArrayBody),
@ -2272,7 +2366,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
(c->call (c->call
(c->constant(getThunk(t, makeBlankObjectArrayThunk)), (c->constant(getThunk(t, makeBlankObjectArrayThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
BytesPerWord, BytesPerWord,
3, c->thread(), frame->append(class_), length)); 3, c->thread(), frame->append(class_), length));
} break; } break;
@ -2314,7 +2408,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
c->call c->call
(c->constant(getThunk(t, throw_Thunk)), (c->constant(getThunk(t, throw_Thunk)),
Compiler::NoReturn, Compiler::NoReturn,
frame->trace(0, false), frame->trace(0, 0),
0, 0,
2, c->thread(), target); 2, c->thread(), target);
} return; } return;
@ -2335,7 +2429,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
c->call c->call
(c->constant(getThunk(t, checkCastThunk)), (c->constant(getThunk(t, checkCastThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
0, 0,
3, c->thread(), frame->append(class_), instance); 3, c->thread(), frame->append(class_), instance);
} break; } break;
@ -2616,7 +2710,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
c->call c->call
(c->constant(getThunk(t, tryInitClassThunk)), (c->constant(getThunk(t, tryInitClassThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
0, 0,
2, c->thread(), frame->append(fieldClass(t, field))); 2, c->thread(), frame->append(fieldClass(t, field)));
} }
@ -2643,7 +2737,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
c->call c->call
(c->constant(getThunk(t, acquireMonitorForObjectThunk)), (c->constant(getThunk(t, acquireMonitorForObjectThunk)),
0, frame->trace(0, false), 0, 2, c->thread(), fieldOperand); 0, frame->trace(0, 0), 0, 2, c->thread(), fieldOperand);
} }
switch (fieldCode(t, field)) { switch (fieldCode(t, field)) {
@ -2697,7 +2791,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
{ {
c->call c->call
(c->constant(getThunk(t, releaseMonitorForObjectThunk)), (c->constant(getThunk(t, releaseMonitorForObjectThunk)),
0, frame->trace(0, false), 0, 2, c->thread(), fieldOperand); 0, frame->trace(0, 0), 0, 2, c->thread(), fieldOperand);
} else { } else {
c->loadBarrier(); c->loadBarrier();
} }
@ -2994,12 +3088,12 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
(c->constant (c->constant
(getThunk(t, findInterfaceMethodFromInstanceThunk)), (getThunk(t, findInterfaceMethodFromInstanceThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
BytesPerWord, BytesPerWord,
3, c->thread(), frame->append(target), 3, c->thread(), frame->append(target),
c->peek(1, instance)), c->peek(1, instance)),
0, 0,
frame->trace(target, true), frame->trace(target, TraceElement::VirtualCall),
rSize, rSize,
parameterFootprint); parameterFootprint);
@ -3023,7 +3117,8 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
assert(t, (methodFlags(t, target) & ACC_STATIC) == 0); assert(t, (methodFlags(t, target) & ACC_STATIC) == 0);
compileDirectInvoke(t, frame, target); compileDirectInvoke
(t, frame, target, isTailCall(t, code, ip, context->method, target));
} break; } break;
case invokestatic: { case invokestatic: {
@ -3034,7 +3129,8 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
assert(t, methodFlags(t, target) & ACC_STATIC); assert(t, methodFlags(t, target) & ACC_STATIC);
compileDirectInvoke(t, frame, target); compileDirectInvoke
(t, frame, target, isTailCall(t, code, ip, context->method, target));
} break; } break;
case invokevirtual: { case invokevirtual: {
@ -3059,7 +3155,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
(BytesPerWord, c->constant(PointerMask), (BytesPerWord, c->constant(PointerMask),
c->memory(instance, 0, 0, 1)), offset, 0, 1), c->memory(instance, 0, 0, 1)), offset, 0, 1),
0, 0,
frame->trace(target, true), frame->trace(target, TraceElement::VirtualCall),
rSize, rSize,
parameterFootprint); parameterFootprint);
@ -3441,14 +3537,14 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
Compiler::Operand* target = frame->popObject(); Compiler::Operand* target = frame->popObject();
c->call c->call
(c->constant(getThunk(t, acquireMonitorForObjectThunk)), (c->constant(getThunk(t, acquireMonitorForObjectThunk)),
0, frame->trace(0, false), 0, 2, c->thread(), target); 0, frame->trace(0, 0), 0, 2, c->thread(), target);
} break; } break;
case monitorexit: { case monitorexit: {
Compiler::Operand* target = frame->popObject(); Compiler::Operand* target = frame->popObject();
c->call c->call
(c->constant(getThunk(t, releaseMonitorForObjectThunk)), (c->constant(getThunk(t, releaseMonitorForObjectThunk)),
0, frame->trace(0, false), 0, 2, c->thread(), target); 0, frame->trace(0, 0), 0, 2, c->thread(), target);
} break; } break;
case multianewarray: { case multianewarray: {
@ -3468,7 +3564,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
Compiler::Operand* result = c->call Compiler::Operand* result = c->call
(c->constant(getThunk(t, makeMultidimensionalArrayThunk)), (c->constant(getThunk(t, makeMultidimensionalArrayThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
BytesPerWord, BytesPerWord,
4, c->thread(), frame->append(class_), c->constant(dimensions), 4, c->thread(), frame->append(class_), c->constant(dimensions),
c->constant(offset)); c->constant(offset));
@ -3488,7 +3584,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
(c->call (c->call
(c->constant(getThunk(t, makeNewWeakReference64Thunk)), (c->constant(getThunk(t, makeNewWeakReference64Thunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
BytesPerWord, BytesPerWord,
2, c->thread(), frame->append(class_))); 2, c->thread(), frame->append(class_)));
} else { } else {
@ -3496,7 +3592,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
(c->call (c->call
(c->constant(getThunk(t, makeNew64Thunk)), (c->constant(getThunk(t, makeNew64Thunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
BytesPerWord, BytesPerWord,
2, c->thread(), frame->append(class_))); 2, c->thread(), frame->append(class_)));
} }
@ -3511,7 +3607,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
(c->call (c->call
(c->constant(getThunk(t, makeBlankArrayThunk)), (c->constant(getThunk(t, makeBlankArrayThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
BytesPerWord, BytesPerWord,
3, c->thread(), c->constant(type), length)); 3, c->thread(), c->constant(type), length));
} break; } break;
@ -3544,7 +3640,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
c->call c->call
(c->constant(getThunk(t, tryInitClassThunk)), (c->constant(getThunk(t, tryInitClassThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
0, 0,
2, c->thread(), frame->append(fieldClass(t, field))); 2, c->thread(), frame->append(fieldClass(t, field)));
} }
@ -3600,7 +3696,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
c->call c->call
(c->constant(getThunk(t, acquireMonitorForObjectThunk)), (c->constant(getThunk(t, acquireMonitorForObjectThunk)),
0, frame->trace(0, false), 0, 2, c->thread(), fieldOperand); 0, frame->trace(0, 0), 0, 2, c->thread(), fieldOperand);
} else { } else {
c->storeStoreBarrier(); c->storeStoreBarrier();
} }
@ -3635,7 +3731,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
c->call c->call
(c->constant(getThunk(t, setMaybeNullThunk)), (c->constant(getThunk(t, setMaybeNullThunk)),
0, 0,
frame->trace(0, false), frame->trace(0, 0),
0, 0,
4, c->thread(), table, c->constant(fieldOffset(t, field)), value); 4, c->thread(), table, c->constant(fieldOffset(t, field)), value);
} else { } else {
@ -3656,7 +3752,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
{ {
c->call c->call
(c->constant(getThunk(t, releaseMonitorForObjectThunk)), (c->constant(getThunk(t, releaseMonitorForObjectThunk)),
0, frame->trace(0, false), 0, 2, c->thread(), fieldOperand); 0, frame->trace(0, 0), 0, 2, c->thread(), fieldOperand);
} else { } else {
c->storeLoadBarrier(); c->storeLoadBarrier();
} }
@ -3669,10 +3765,7 @@ compile(MyThread* t, Frame* initialFrame, unsigned ip,
return; return;
case return_: case return_:
if ((methodFlags(t, context->method) & ConstructorFlag) if (needsReturnBarrier(t, context->method)) {
and (classFlags(t, methodClass(t, context->method))
& HasFinalMemberFlag))
{
c->storeStoreBarrier(); c->storeStoreBarrier();
} }
@ -3909,6 +4002,28 @@ printSet(uintptr_t m, unsigned limit)
} }
} }
void
shiftLeftZeroPadded(void* data, int dataSizeInBytes, int shiftCountInBits)
{
uint8_t* p = static_cast<uint8_t*>(data);
int shiftCountInBytes = shiftCountInBits / 8;
int shift = shiftCountInBits % 8;
int count = dataSizeInBytes - shiftCountInBytes - 1;
for (int i = 0; i < count; ++i) {
int si = i + shiftCountInBytes;
p[i] = (p[si] >> shift) | ((p[si + 1] >> shift) << (8 - shift));
}
if (count >= 0) {
p[count] = (p[count + shiftCountInBytes] >> shift);
}
for (int i = count + 1; i < dataSizeInBytes; ++i) {
p[i] = 0;
}
}
unsigned unsigned
calculateFrameMaps(MyThread* t, Context* context, uintptr_t* originalRoots, calculateFrameMaps(MyThread* t, Context* context, uintptr_t* originalRoots,
unsigned stackPadding, unsigned eventIndex) unsigned stackPadding, unsigned eventIndex)
@ -4021,8 +4136,15 @@ calculateFrameMaps(MyThread* t, Context* context, uintptr_t* originalRoots,
printSet(*roots, mapSize); printSet(*roots, mapSize);
fprintf(stderr, "\n"); fprintf(stderr, "\n");
} }
memcpy(te->map, roots, mapSize * BytesPerWord); memcpy(te->map, roots, mapSize * BytesPerWord);
if (te->flags & TraceElement::TailCall) {
shiftLeftZeroPadded
(te->map, mapSize * BytesPerWord,
usableFrameSize(t, context->method));
}
eventIndex += BytesPerWord; eventIndex += BytesPerWord;
} break; } break;
@ -4172,7 +4294,7 @@ finish(MyThread* t, Allocator* allocator, Context* context)
if (p->target) { if (p->target) {
insertCallNode insertCallNode
(t, makeCallNode (t, makeCallNode
(t, p->address->value(), p->target, p->virtualCall, 0)); (t, p->address->value(), p->target, p->flags, 0));
} }
} }
@ -4402,15 +4524,15 @@ compile(MyThread* t, Allocator* allocator, BootContext* bootContext,
object method); object method);
void* void*
compileMethod2(MyThread* t) compileMethod2(MyThread* t, uintptr_t ip)
{ {
object node = findCallNode(t, t->arch->frameIp(t->stack)); object node = findCallNode(t, ip);
PROTECT(t, node); PROTECT(t, node);
object target = callNodeTarget(t, node); object target = callNodeTarget(t, node);
PROTECT(t, target); PROTECT(t, target);
if (callNodeVirtualCall(t, node)) { if (callNodeFlags(t, node) & TraceElement::VirtualCall) {
target = resolveTarget(t, t->stack, target); target = resolveTarget(t, t->stack, target);
} }
@ -4422,15 +4544,19 @@ compileMethod2(MyThread* t)
return 0; return 0;
} else { } else {
void* address = reinterpret_cast<void*>(methodAddress(t, target)); void* address = reinterpret_cast<void*>(methodAddress(t, target));
if (callNodeVirtualCall(t, node)) { if (callNodeFlags(t, node) & TraceElement::VirtualCall) {
classVtable classVtable
(t, objectClass (t, objectClass
(t, resolveThisPointer(t, t->stack, target)), methodOffset(t, target)) (t, resolveThisPointer(t, t->stack, target)), methodOffset(t, target))
= address; = address;
} else { } else {
uintptr_t updateIp = ip;
if (callNode(t, node) & TraceElement::TailCall) {
updateIp -= t->arch->constantCallSize();
}
updateCall updateCall
(t, Call, true, reinterpret_cast<void*>(callNodeAddress(t, node)), (t, Call, true, reinterpret_cast<void*>(updateIp), address);
address);
} }
return address; return address;
} }
@ -4439,7 +4565,73 @@ compileMethod2(MyThread* t)
uint64_t uint64_t
compileMethod(MyThread* t) compileMethod(MyThread* t)
{ {
void* r = compileMethod2(t); uintptr_t ip;
if (t->tailAddress) {
ip = t->tailAddress;
t->tailAddress = 0;
} else {
ip = t->arch->frameIp(t->stack);
}
void* r = compileMethod2(t, ip);
if (UNLIKELY(t->exception)) {
unwind(t);
} else {
return reinterpret_cast<uintptr_t>(r);
}
}
void*
tailCall2(MyThread* t, uintptr_t ip)
{
object node = findCallNode(t, ip);
PROTECT(t, node);
object target = callNodeTarget(t, node);
PROTECT(t, target);
if (callNodeFlags(t, node) & TraceElement::VirtualCall) {
target = resolveTarget(t, t->stack, target);
}
if (LIKELY(t->exception == 0)) {
compile(t, codeZone(t), 0, target);
}
if (UNLIKELY(t->exception)) {
return 0;
} else {
void* base = t->base;
void* stack = t->stack;
t->arch->nextFrame(&stack, &base);
if (t->arch->matchCall(t->arch->frameIp(stack), tailHelperThunk(t))) {
void* nextBase = base;
void* nextStack = stack;
t->arch->nextFrame(&nextStack, &nextBase);
if (((reinterpret_cast<uintptr_t>(nextStack)
- reinterpret_cast<uintptr_t>(stack))
/ BytesPerWord)
- t->arch->frameFooterSize()
- t->arch->frameHeaderSize()
>= methodParameterFootprint(t, target))
{
// there's room for the parameters in the previous frame, so use it
t->base = base;
t->stack = stack;
}
}
return reinterpret_cast<void*>(methodAddress(t, target));
}
}
uint64_t
tailCall(MyThread* t)
{
void* r = tailCall2(t, t->arch->frameIp(t->stack));
if (UNLIKELY(t->exception)) { if (UNLIKELY(t->exception)) {
unwind(t); unwind(t);
@ -4632,14 +4824,24 @@ uint64_t
invokeNative(MyThread* t) invokeNative(MyThread* t)
{ {
if (t->trace->nativeMethod == 0) { if (t->trace->nativeMethod == 0) {
object node = findCallNode(t, t->arch->frameIp(t->stack)); uintptr_t ip;
if (t->tailAddress) {
ip = t->tailAddress;
t->tailAddress = 0;
} else {
ip = t->arch->frameIp(t->stack);
}
object node = findCallNode(t, ip);
object target = callNodeTarget(t, node); object target = callNodeTarget(t, node);
if (callNodeVirtualCall(t, node)) { if (callNodeFlags(t, node) & TraceElement::VirtualCall) {
target = resolveTarget(t, t->stack, target); target = resolveTarget(t, t->stack, target);
} }
t->trace->nativeMethod = target; t->trace->nativeMethod = target;
} }
assert(t, t->tailAddress == 0);
uint64_t result = 0; uint64_t result = 0;
if (LIKELY(t->exception == 0)) { if (LIKELY(t->exception == 0)) {
@ -5396,7 +5598,7 @@ class MyProcessor: public Processor {
table[index++] = callNodeAddress(t, p) table[index++] = callNodeAddress(t, p)
- reinterpret_cast<uintptr_t>(code); - reinterpret_cast<uintptr_t>(code);
table[index++] = w->map()->find(callNodeTarget(t, p)) table[index++] = w->map()->find(callNodeTarget(t, p))
| (static_cast<unsigned>(callNodeVirtualCall(t, p)) << BootShift); | (static_cast<unsigned>(callNodeFlags(t, node)) << BootShift);
} }
} }
@ -5494,7 +5696,7 @@ resizeTable(MyThread* t, object oldTable, unsigned newLength)
object newNode = makeCallNode object newNode = makeCallNode
(t, callNodeAddress(t, oldNode), (t, callNodeAddress(t, oldNode),
callNodeTarget(t, oldNode), callNodeTarget(t, oldNode),
callNodeVirtualCall(t, oldNode), callNodeFlags(t, oldNode),
arrayBody(t, newTable, index)); arrayBody(t, newTable, index));
set(t, newTable, ArrayBody + (index * BytesPerWord), newNode); set(t, newTable, ArrayBody + (index * BytesPerWord), newNode);
@ -5818,10 +6020,16 @@ compileThunks(MyThread* t, Allocator* allocator, MyProcessor* p,
}; };
Zone zone(t->m->system, t->m->heap, 1024); Zone zone(t->m->system, t->m->heap, 1024);
ThunkContext defaultContext(t, &zone); ThunkContext defaultContext(t, &zone);
unsigned defaultTailOffset;
{ Assembler* a = defaultContext.context.assembler; { Assembler* a = defaultContext.context.assembler;
a->popReturnAddress(difference(&(t->tailAddress), t));
defaultTailOffset = a->length();
a->saveFrame(difference(&(t->stack), t), difference(&(t->base), t)); a->saveFrame(difference(&(t->stack), t), difference(&(t->base), t));
Assembler::Register thread(t->arch->thread()); Assembler::Register thread(t->arch->thread());
@ -5838,10 +6046,35 @@ compileThunks(MyThread* t, Allocator* allocator, MyProcessor* p,
a->endBlock(false)->resolve(0, 0); a->endBlock(false)->resolve(0, 0);
} }
ThunkContext tailHelperContext(t, &zone);
{ Assembler* a = tailHelperContext.context.assembler;
a->saveFrame(difference(&(t->stack), t), difference(&(t->base), t));
Assembler::Register thread(t->arch->thread());
a->pushFrame(1, BytesPerWord, RegisterOperand, &thread);
Assembler::Constant proc(&(tailHelperContext.promise));
a->apply(LongCall, BytesPerWord, ConstantOperand, &proc);
a->restoreFrame(difference(&(t->stack), t), difference(&(t->base), t));
Assembler::Register result(t->arch->returnLow());
a->apply(Jump, BytesPerWord, RegisterOperand, &result);
a->endBlock(false)->resolve(0, 0);
}
ThunkContext nativeContext(t, &zone); ThunkContext nativeContext(t, &zone);
unsigned nativeTailOffset;
{ Assembler* a = nativeContext.context.assembler; { Assembler* a = nativeContext.context.assembler;
a->popReturnAddress(difference(&(t->tailAddress), t));
nativeTailOffset = a->length();
a->saveFrame(difference(&(t->stack), t), difference(&(t->base), t)); a->saveFrame(difference(&(t->stack), t), difference(&(t->base), t));
Assembler::Register thread(t->arch->thread()); Assembler::Register thread(t->arch->thread());
@ -5890,33 +6123,54 @@ compileThunks(MyThread* t, Allocator* allocator, MyProcessor* p,
(codeSingletonSizeInBytes (codeSingletonSizeInBytes
(t, defaultContext.context.assembler->length()) (t, defaultContext.context.assembler->length())
+ codeSingletonSizeInBytes + codeSingletonSizeInBytes
(t, tailHelperContext.context.assembler->length())
+ codeSingletonSizeInBytes
(t, nativeContext.context.assembler->length()) (t, nativeContext.context.assembler->length())
+ codeSingletonSizeInBytes + codeSingletonSizeInBytes
(t, aioobContext.context.assembler->length()) (t, aioobContext.context.assembler->length())
+ codeSingletonSizeInBytes + codeSingletonSizeInBytes
(t, p->thunkSize * ThunkCount))); (t, p->thunkSize * ThunkCount)));
p->defaultThunk = finish p->defaultTailThunk = finish
(t, allocator, defaultContext.context.assembler, "default"); (t, allocator, defaultContext.context.assembler, "default");
p->defaultThunk = p->defaultTailThunk + defaultTailOffset;
{ void* call; { void* call;
defaultContext.promise.listener->resolve defaultContext.promise.listener->resolve
(reinterpret_cast<intptr_t>(voidPointer(compileMethod)), &call); (reinterpret_cast<intptr_t>(voidPointer(compileMethod)), &call);
if (image) { if (image) {
image->defaultTailThunk = p->defaultTailThunk - imageBase;
image->defaultThunk = p->defaultThunk - imageBase; image->defaultThunk = p->defaultThunk - imageBase;
image->compileMethodCall = static_cast<uint8_t*>(call) - imageBase; image->compileMethodCall = static_cast<uint8_t*>(call) - imageBase;
} }
} }
p->nativeThunk = finish p->tailHelperThunk = finish
(t, allocator, defaultContext.context.assembler, "tailHelper");
{ void* call;
tailHelperContext.promise.listener->resolve
(reinterpret_cast<intptr_t>(voidPointer(tailCall)), &call);
if (image) {
image->tailHelperThunk = p->tailHelperThunk - imageBase;
image->tailHelperCall = static_cast<uint8_t*>(call) - imageBase;
}
}
p->nativeTailThunk = finish
(t, allocator, nativeContext.context.assembler, "native"); (t, allocator, nativeContext.context.assembler, "native");
p->nativeThunk = p->nativeTailThunk + nativeTailOffset;
{ void* call; { void* call;
nativeContext.promise.listener->resolve nativeContext.promise.listener->resolve
(reinterpret_cast<intptr_t>(voidPointer(invokeNative)), &call); (reinterpret_cast<intptr_t>(voidPointer(invokeNative)), &call);
if (image) { if (image) {
image->nativeTailThunk = p->nativeTailThunk - imageBase;
image->nativeThunk = p->nativeThunk - imageBase; image->nativeThunk = p->nativeThunk - imageBase;
image->invokeNativeCall = static_cast<uint8_t*>(call) - imageBase; image->invokeNativeCall = static_cast<uint8_t*>(call) - imageBase;
} }

View File

@ -2258,7 +2258,12 @@ class CallEvent: public Event {
uint32_t registerMask = ~0; uint32_t registerMask = ~0;
Stack* s = argumentStack; Stack* s = argumentStack;
unsigned index = 0; unsigned index = 0;
unsigned frameIndex = 0; unsigned frameIndex;
if (flags & (Compiler::TailJump | Compiler::TailCall)) {
frameIndex = usableFrameSize(c);
} else {
frameIndex = 0;
}
if (argumentCount) { if (argumentCount) {
while (true) { while (true) {
@ -2308,56 +2313,59 @@ class CallEvent: public Event {
(typeMask, registerMask & planRegisterMask, AnyFrameIndex))); (typeMask, registerMask & planRegisterMask, AnyFrameIndex)));
} }
int footprint = stackArgumentFootprint; if ((flags & (Compiler::TailJump | Compiler::TailCall)_ == 0) {
for (Stack* s = stackBefore; s; s = s->next) { int footprint = stackArgumentFootprint;
if (s->value) { for (Stack* s = stackBefore; s; s = s->next) {
if (footprint > 0) { if (s->value) {
if (DebugReads) { if (footprint > 0) {
fprintf(stderr, "stack arg read %p at %d of %d\n", if (DebugReads) {
s->value, frameIndex, fprintf(stderr, "stack arg read %p at %d of %d\n",
usableFrameSize(c) + c->parameterFootprint); s->value, frameIndex,
} usableFrameSize(c) + c->parameterFootprint);
}
addRead(c, this, s->value, read addRead(c, this, s->value, read
(c, SiteMask(1 << MemoryOperand, 0, frameIndex))); (c, SiteMask(1 << MemoryOperand, 0, frameIndex)));
} else { } else {
unsigned logicalIndex = ::frameIndex
(c, s->index + c->localFootprint);
if (DebugReads) {
fprintf(stderr, "stack save read %p at %d of %d\n",
s->value, logicalIndex,
usableFrameSize(c) + c->parameterFootprint);
}
addRead(c, this, s->value, read
(c, SiteMask(1 << MemoryOperand, 0, logicalIndex)));
}
}
-- footprint;
if (footprint == 0) {
unsigned logicalIndex = ::frameIndex unsigned logicalIndex = ::frameIndex
(c, s->index + c->localFootprint); (c, s->index + c->localFootprint);
if (DebugReads) { assert(c, logicalIndex >= frameIndex);
fprintf(stderr, "stack save read %p at %d of %d\n",
s->value, logicalIndex,
usableFrameSize(c) + c->parameterFootprint);
}
addRead(c, this, s->value, read padding = logicalIndex - frameIndex;
(c, SiteMask(1 << MemoryOperand, 0, logicalIndex))); padIndex = s->index + c->localFootprint;
} }
++ frameIndex;
} }
-- footprint; popIndex
= usableFrameSize(c)
+ c->parameterFootprint
- (stackBefore ? stackBefore->index + 1 - stackArgumentFootprint : 0)
- c->localFootprint;
if (footprint == 0) { assert(c, static_cast<int>(popIndex) >= 0);
unsigned logicalIndex = ::frameIndex(c, s->index + c->localFootprint);
assert(c, logicalIndex >= frameIndex); saveLocals(c, this);
padding = logicalIndex - frameIndex;
padIndex = s->index + c->localFootprint;
}
++ frameIndex;
} }
popIndex
= usableFrameSize(c)
+ c->parameterFootprint
- (stackBefore ? stackBefore->index + 1 - stackArgumentFootprint : 0)
- c->localFootprint;
assert(c, static_cast<int>(popIndex) >= 0);
saveLocals(c, this);
} }
virtual const char* name() { virtual const char* name() {
@ -2365,8 +2373,33 @@ class CallEvent: public Event {
} }
virtual void compile(Context* c) { virtual void compile(Context* c) {
apply(c, (flags & Compiler::Aligned) ? AlignedCall : Call, BytesPerWord, UnaryOperation op;
address->source, 0);
if (flags & Compiler::TailJump) {
c->assembler->popFrame();
if (flags & Compiler::Aligned) {
op = AlignedJump;
} else {
op = Jump;
}
} else if (flags & Compiler::TailCall) {
c->assembler->popFrame();
if (flags & Compiler::Aligned) {
op = AlignedCall;
} else {
op = Call;
}
} else {
if (flags & Compiler::Aligned) {
op = AlignedCall;
} else {
op = Call;
}
}
apply(c, op, BytesPerWord, address->source, 0);
if (traceHandler) { if (traceHandler) {
traceHandler->handleTrace(codePromise(c, c->assembler->offset()), traceHandler->handleTrace(codePromise(c, c->assembler->offset()),

View File

@ -27,6 +27,7 @@ class Compiler {
static const unsigned Aligned = 1 << 0; static const unsigned Aligned = 1 << 0;
static const unsigned NoReturn = 1 << 1; static const unsigned NoReturn = 1 << 1;
static const unsigned TailCall = 1 << 2;
class Operand { }; class Operand { };
class StackElement { }; class StackElement { };

View File

@ -1734,6 +1734,10 @@ class MyArchitecture: public Assembler::Architecture {
} }
} }
virtual unsigned constantCallSize() {
return 4;
}
virtual uintptr_t getConstant(const void* src) { virtual uintptr_t getConstant(const void* src) {
const int32_t* p = static_cast<const int32_t*>(src); const int32_t* p = static_cast<const int32_t*>(src);
return (p[0] << 16) | (p[1] & 0xFFFF); return (p[0] << 16) | (p[1] & 0xFFFF);

View File

@ -94,7 +94,7 @@
(type callNode (type callNode
(intptr_t address) (intptr_t address)
(object target) (object target)
(uintptr_t virtualCall) (uintptr_t flags)
(object next)) (object next))
(type array (type array

View File

@ -2088,6 +2088,10 @@ class MyArchitecture: public Assembler::Architecture {
} }
} }
virtual unsigned constantCallSize() {
return 5;
}
virtual uintptr_t getConstant(const void* src) { virtual uintptr_t getConstant(const void* src) {
uintptr_t v; uintptr_t v;
memcpy(&v, src, BytesPerWord); memcpy(&v, src, BytesPerWord);